diff --git "a/log/debug_0.log" "b/log/debug_0.log" --- "a/log/debug_0.log" +++ "b/log/debug_0.log" @@ -1,50022 +1,3 @@ -09/20/2021 14:28:12 - INFO - __main__ - Distributed environment: MULTI_GPU Backend: nccl -Num processes: 16 -Process index: 0 -Local process index: 0 -Device: cuda:0 -Use FP16 precision: True - -09/20/2021 14:28:13 - WARNING - huggingface_hub.repository - /home/leandro/codeparrot/./ is already a clone of https://huggingface.co/transformersbook/codeparrot. Make sure you pull the latest changes with `repo.git_pull()`. -09/20/2021 14:28:13 - WARNING - huggingface_hub.repository - Revision `vocal-universe-103` does not exist. Created and checked out branch `vocal-universe-103`. -09/20/2021 14:28:13 - WARNING - huggingface_hub.repository - M codeparrot_training.py -M requirements.txt - -09/20/2021 14:28:33 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-train but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/ef/69efdcdb035636e6a8cd18cfc4ef702f95730a381b5d86b36c10028b4df94090'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/b0/70b01a02ca2810cf2e74a43655979028b31de42c566bc65d8b749720d1b08fb2'), PosixPath('/home/leandro/codeparrot-train/.git/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ed/ae/edae53c081ce347a58430f0930ce4fb318a9f62e15f85aa638a86c1666f70df4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/26/0826780cd0e3d564882321e246176eac0fb695b706bc72c6022925075047a62e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/15/95/159531500b1c473455d10fda2fb82f6ea7814500799e27eaf5f2be6f124f994c'), PosixPath('/home/leandro/codeparrot-train/.git/description'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ca/00/ca00ed91ba94519faaba619e5eec6498215695acc6b3f760dc056967cefeea80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/b9/14b9124b7b2ffa27d79dc210ae77b9b970e067ad7d3dc4d3eebc08671b770c16'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/4f/7f4fb07272574ef183fd21a911f45f989a941516a11fe1d71335954a54657e07'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f0/f9/f0f92a74ef6e03d0c05ae2012d7e33242c3b091f3e01d2d8f942e68cf295f7a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/d1/b9d1c713e023c821f98968ea670a01aa7127c1c915f3d7f6368616f17369e8f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/86/ba86bfbe83793efcb2e89df75179188dee67b96ace3e7f1628c133ce11fc361e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/fc/3afc8a938123d0f8e566043d271b4c6a60e3df968b72d8939982a09527763aae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/80/61/8061f4f61c3955c90dab77a1553ac22e9d1ff604c229375be54a38e32ce6f8ca'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/79/c1/79c13ad14568c659397387f3d0e1358393fb0041ff48ce9c98ad4f28df8cde4b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/b6/44b6239e61c700810037d9d8aa2fe706d7eaeb5766e492fad95411ad184490f5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/4f/144f1231964ab251596b40abdd80f37fe7ce4ac7b2b31fc517b942cc24110341'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6a/34/6a34d6e3ac6572933b2f66c74af568a0df3b91b94622dd4b7e5d5538c04071ff'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/20/d02098784b5ee7b5d5206ee9cc52e881782d98fc90530322af1c5cb7d401f1fd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/df/4fdfd51962dfc725568d88de53b29e285d52e858e849acb543101fe556779a42'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8e/81/8e81a5187b909a82581e8030a8008ffb9517519e477797b195bbcf422ef6e20c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/53/a05359f8e5ca97304272052f806034ebdca89a94f0d052b719b8b81dd8ddd868'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0b/de/0bde10d6ad4055811339a7ed51fca332317529d6b5854a4b7ce90000e352aa33'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9a/bd9af7b8106e0a773e5a12495aa88339995c2084c2f9a243733879eb73f595d8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/79/447953386aab39785c0f6c5e44b7310d433886fb73a1e40efe67c9620639e6fa'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/93/51/935137f4370f4f5c85ba6a157825fe6102edb991a46610fa9939e2960be9653d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b1/70/b1705347d88e73a7de652d1486a3eccda92e420e65a58917c88af635baf55ac8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/43/98/439848f817f432ceefdf7e69a64b60dd99a75cc6fb26599a0ea5ac1167c3db4c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8f/8a/8f8a74c1e1fc4ee43110f74ae0cc01de863a0ceb3f2c4815cab1dc1efeb5339a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/97/af/97af2a98400865661b26c3d5c0a3b6be51603452f459136bc9ab2568667ed199'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/81/7c/817cc36de53f7c914d82e2536a5538c21330ef54662366733e45c76a3c770d06'), PosixPath('/home/leandro/codeparrot-train/.git/config'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b4/2c/b42c05288d42233fb829266917ae1145a835f3ccf8e00ea21e5927f9528fb500'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/74/d574d02117a4209d073c3d382e859fdf07d6e18ac38bed8a4d900c8c9975550c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ef/8b/ef8b57ab3924e70df4f4a37b6853205113144fa01ea6c0140bea3a21b14eafeb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5b/66/5b66654660bc52d66f5bf0e6a62e0b65a0dd2499ec316daed0432efb2c7a8d7b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/a0/02a07bbab0f2b514c1a9d5296ca8c1a843aca846fcde56fc810700ee416db1b4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/09/c2/09c237a78f8a49d7840d8e5fc58e79db7e225b9904323f46791dce8fd0585332'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/85/28/8528503b464d6cbf8041e0a1481681d0bff4bb24f9d18230fe56c3bc99dfa2ab'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/13/ae/13ae38510e10076edaa24cf051e6403a270c95febd0e2e9b9e052128d632fe36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1f/46/1f46dcfefd87339930fa912ec98a56b7b93c2f052d7f452f82c9c3d0043ffa43'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/46/df/46df1517cd973f00262b495f82b10c46ec077a33bcfc83bade078a36590c6d0a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/2e/1c2e85e92de0f8a29ed6e534983e0051fa2c79e31013c11c7cc66f3f3f1e0155'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/38/ba38a25c6b8dd335baf2c6cd925ca5b91668af93f7ecee2b120ad352f46a6565'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/23/ee/23eed9f8512ca62c4b9b4fb28a84688ee550b75ec7658209f3cd5d82a2d4aa57'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e1/7a/e17a32eafebfa6f8d8b0edf6c0463c639f06a72fadae7907c9fd026f01136b98'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/04/64/04647e38d2a928e08abccf777e680adf7cb0066862374bd847c492de44cb047f'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/98/de/98de114cefba6caad86991425c276e59a5ab4a3a1006d29f73ec5cede6233efd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/a8/bda8ae48acb883ddb225719c3584e3baa76887afb7198d76478af06e7f80572e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/18/44181da41968eab59b99558c2afd4d6f95397bc2b580622a96f2f9fb74f545b2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/58/1458ee6ad39f24b25d2db9153ba9aa25f4ff2f16c2f624361a0186904a658a54'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/01/87/0187e92041e5ef1abe3190a48330ff50c7d5fc5ed1219c3bcbb465907430d34e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/26/142694003d3fc3bc57e51dab9eaf07472e0f24a4b092d70159943ecc8c2496a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/40/fa40f7fe8b2d031a32282dce9a40462d67eecff28203c1743fcace8ef4bb37e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/41/11/4111a00cda1b0988507f8b544a9e4da7bfb0bff35c13990c6fb1c360aa6a6688'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c3/d3/c3d3e55004ff21e36332b9612e385ba07c2610b832b4a94cca2d9fda372a9fb4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/03/bb/03bb832cf6fad7e4bc885cc1d9502cf312d2951a51afbd63fb6a90f53e49d096'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0f/70/0f704aab387aa4e2f0f4dd866d5f0888b25d0d0b61ef7881c38b918f22802ec2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/be/21be1bf5e86f5da2dbd83f0bb904a3d68d9abea09bbd5adab6a6873c53ed0112'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5f/34/5f342fc03b8d9c90aa9ff917ca3ff3edce748b6f0b55f61aadc9940ca53b45d5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/98/d59884b54759159fcaf45b671dfe9ee2a7d7aea34f1cc7762a1c25499589efb9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/60/07/6007f21e5625708f4710d48386db1297bb1dbd26196ced77b305e7e35da0300d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2c/a7/2ca7213ba4af470b5f4caa0b4439992b7483c8b4d1cb977089f9b9abef1c7fba'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/15/2d15883c4954ffcaafce389f10ccbad7c93e66fae3b7ca7db0a50343180cedf4'), PosixPath('/home/leandro/codeparrot-train/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/33/27/3327f7692a61d984758a71929f4466af87f91a2db0a656321df0d331ef4def20'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7c/bf/7cbfb385a3bbebdb3eed3e154c80f0c9bf6b397aa702e5410339c2b1d74ae867'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/35/4c35db8d1672615cddac65cdf0a76ea9ca1ec9d1d8b18ce293be0df23ff694db'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/49/d8/49d89abc121b49ef8a540796b63edd68f67f679d6ad1b969d6637d852d59f79f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/de/af/deaf9432f8e1fdc2bd3b9078dc3996c536e661ebb379b81818ecfc70a360c923'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/17/a21791d67c018e486dde68b8956a16b8fa0c54af93dc3c6ec2c669da87861b02'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f9/91/f9915d283d95c3316a76922f129897823efd397287916e8f7af88ed7aaf517b0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/ac/2bac46edf98c75901284aff8296f80fea6701821000b205bd85aef8399124074'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/07/b9/07b951a7cc55afc0d48a47f0dbd9e06c7311279e4a747256b5dcfe11ba56690d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/cf/84/cf84f4c64b1173bb12e281b88ca920c4c6d130c54214b5172bccbcc045fb2d0f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/82/4c/824c9524070c36ed317c12b9b0e77f8b9460e8519ba32c6795a5a2e7232d088c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/16/25162ca0d0fa0474f367ba4720b75f0cb10c70b3f62dd90cbb6e201773c99cb3'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/f9/96f9e109fe3ebce8c82610b0af4398170d678185b18ce5bc0384d84eb421ace5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/cc/a0ccfd373c5bb31028d4b7abb80a9a328395361cc2ac4f7376f5b1f6e89d89d0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f1/a5/f1a543df8fe1562a57657011c09d45778915a202f279013041e4f08d6cb1b475'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.pack'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/32/d9/32d95bf48e9ba4ed480df0015326b0ed07647ce17e84a48a5a445db22bc5de4a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6f/bc/6fbcee1936749498486745c2dd217ee108f1a243f054dcb2591cfee772906fae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/63/6963f0671c853a7bb7ae245df7c1f07fd8db821e59e1ab83b74d07909e029111'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d7/c8/d7c88386b6a3c339c8a6d0beead12bf440477473df676886099ca289057fbace'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/2c/4f2cb5d9fe3ef94da4aa3ec743d37b83c2347d6f1d3d4696a5c667ff9968ea38'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/64/35/643576ec614d0ba328db99ae865b8f1321ec4f288164f76fd6746b3b83e34f19'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/73/a973fc07ce8ae881a878bf92c6c70583c08ea6bdb2ca2583002271f96dab9543'), PosixPath('/home/leandro/codeparrot-train/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/f9/87f9d6d6889eb78e70ba55d2f959fa4e896bd3a78d02dd347792e30ddd730bf6'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/ff/2aff254f1288353b713d8e718915f8a2eba7d65097ed5f5d0df520a7058ddf71'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/89/178953ae530dc7960c803bd22a37026f4190b822b95145240537840bfc5a1ad1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/83/9c83dabc6a7c8a9629093125ff70fc60f594b0b95cb56f2f12d2bd91352367c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2e/b3/2eb3b4ea8f84ef14a84b43002a148d99df05f68c1cfc0c0f074572bda0e0e1ee'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f3/5e/f35ec6ce622145756740be75b1fa969996e7e716ac0a15d9bbc4e86aed616000'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/da/17dac3999cf0cb027901ecb382180aa9560b4bb2c5b839f3afc8cadc229962bf'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/85/2b85d040d424bde044014147be3c4949a8d2b0e558c4f4c2c65aead5ece2cde9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/f5/6bf5fd370b20157e47d88709fb5c8b572f1b682a1fdb80091900bfda70a36491'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/22/c4/22c47cc7619654f7faafe250a2dd0cabae5520263e967245b8d5638215244239'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0a/03/0a03d68d6dda083d189878113e864c580b9b5572e53d3e1684b93a9996c7699d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/b9/dab942e6da72846fc60682ce21a8e8fa6bf3452a29abff69ec0750e058ab3b92'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/ce/6bce0dd945b67accdd3077504bc286a26bdb4b03fbbf34d427c21582f3374994'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/78/bb/78bbf19a9e7a29b17fa71e3d05842b9469e3187e938efd8c793ceadbdd38c709'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/4a/084a245793d30784f6ae4f8b666624293bdab2d05a5e1eeadf20b7d9db444951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/9d/379db3f5d257369fd927b7395599ec2aef5cefcb57811a57281487da9fd58c5b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/fb/87fb4ab74dad4c0f520d49769333d5d1b010fcb9e8f30c8dab16430a5a0af9d2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ee/25/ee25b95231437c8795fca58f4a4d95b2698995f29e7f264956f78670f37ea982'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/6b/2a6b5f923b286f640ad586bc295e653ec0db8e4c8487db1c25fa384e216b6ce5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/34/eb344442f4771eb011e0e520b8b1666903717e5e8c59a5462fe80aa82401940a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/10/4c10f31fa342f81c13b27e7ae0761b17729ee82f6e02824361e2cfcc4ab096c1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/94/e0/94e011d7b77e55164bb15d95c453fa1282d78e234ff378adb930d756bbd33f64'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/45/da/45da5a5e4acd37b6e288eb4045434fb6b4a8d77979ac61c8306ca9eca6d24128'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/75/9c7526f2ec341f2d2483d9db25b2b2e9fe630b21b737fa7ebbc19965c6ee46b1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/cb/55cb3e32311273135568ef3da7960400d95f63dad586ccfe56996561277b483f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4a/54/4a54ecd83d3083585ddc7beb921140b2b2e5b4fb82dec9543ac0932c6136e84b'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/e1/21e166aee17c30af55849b552e2eaa9c0641dc6cb0ac6386bd3f7797d8af2a9b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/50/83/5083522f9ebdb4c72e4e384dfd9bce8293d84dcdf0a7580cab1ce8e44f2880da'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/83/14830fec70eb2227647b241d9ff90addbc461cbdcddfe12e015028cefaba6f4e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/35/70353ba511fe03b0f820a7ef6156771de34ef20a404a1cc2c064033998de0f9f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b7/d8/b7d84fc6c01ec6eb79187a7e252a3f033bfd1f2ba297d569e1bf507af9b50fa6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/95/2e/952eaf2d8448261925753def51d58ff5af595d6469207db42abc0b17204640fb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fc/eb/fcebafda8e3681732437c98581a30faedf7802c6b90c84394d2c42b792c32507'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/df/a9dfb7586f9a1bfaaa7175a2384e101f51513b0b98ce01eeaafe5a783cdbad96'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6d/c7/6dc73c3794ad5c29870563658a7003cb2a6cfb0c1852c47037a6eda6cc3cf3a1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/8a/c08ad7d3c85ef3631747172211b65c70912bae157b55f922f1f70016bf7f64e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ff/bc/ffbc64d8a248deb916c3ef209d2a18fc5de5c56a2cfa546a633cbfec31e6ccb2'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/26/99/2699022bd98f8d49f5505ab457b15dd31156713279335d0c28db1c99edc36894'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/af/a2af1215060dc01f13d389abee1fc25ff94ed84262c54dea264810a5bcc074fc'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/07/b907e571662c19245abd148afb306b5c6e411d24a5117e0bb4c182a56afb9b97'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/f2/37f2a405d0e8c52b4a51f79b23f135bcb537eb3f61fe8a27a29ab63b74a37671'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/63/77/6377867a616a0b6e8e3e3691c5cce9cd566773ec5bbd02f5a457edac8a0f24d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/db/d4/dbd4ddc668c0c838eecd756db64c9a3c2127d8e9bbc05b3fcba00b075854b24c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/b3/1db3132794e05cd2decef99af5f56073af4b4a27c33e3a0d0b4289e61b34c9dc'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1e/89/1e890b33c7f95f900932797f1ba2b15f1f1780926f744ea04e0a969bf270df1a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/6f/1c6ff13e754a4260b097390066ecc973302f45756b4151bbfb7efbb7b1ac9963'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/6e/da6e9d2f263cf7b0254b4c0a57483ed8ac9652d6f67a63d648e9d968c576d526'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5c/d6/5cd6e14ff3ac522a3a7bac22ef6ec299833c685a9c343d347fe21152e4173856'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/39/32/39325e24ddd711eacc61305d421e004de68e6f6d0b649ca695ad53d4dc53b47f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/47/d1/47d1fedd443c4edfca241c00be8984a2157c668726cc06d92ad7e2704cb5c951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/11/70/1170a8200f43dfa3902e9d41088229febdf4d7044d9d762dd5809685e5448b11'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/0f/c00f0550d90e881145954ad24df7fdf512ffc3d63c50d2aa0c85774757d8f37d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b5/3e/b53e982e883c26c1a21db49bff0a27d8d628f4fc498715739936fa93bfb5353e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/10/4410ab4420ffe54105620e1f038b0f6b14afa88a8df9dcf63468f6a2c105d770'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1b/c7/1bc7cd472751ec9917bf55ce8b05b8ea467453335103f16c4551e94daefdbaf0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/62/03/6203a1aae8671a6a23849de3aa6aa3efec0e3fbe3275757643abfd63a9ee9af8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/63/7763fa2cb60958f8d28fc6bebc0105ed3614addd32296fe929b7262e4d62f58a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/3b/f83b75420e369ae1d55e7009effe9f7a05577a31c19a8c02ce7f0b56b5dc8a87'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/3d/6b3d8a7164286112196af65658426d2faeda5c50fc381bdebf378f0226342d4e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9b/bd9be9097633349b5ecd400375be5d511e812feadf983f3c2cbcba263a3a14ab'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e9/95/e995f5605e676fd577e4c78ee6bf43451324ddbcb04e841cf1dfce07c69dc1b6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8b/d9/8bd964dad421ed624f4bd5e4719e3e28f62d002b350d850e902688c9e9bcfd80'), PosixPath('/home/leandro/codeparrot-train/.git/index'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d6/ec/d6ecd24bfd9e0c2877dfa00417568e07d9f64a150c5518d471ff91ded60bf146'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/b0/4cb0db5e545856bfeb62f7fa15d3472b705ac8fdeb8c4a831727b730951f8902'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/6e/a76e8e4bbc39a74e4ff59e02aaf1404a8bc429f1033a216058b09f7e0ee3cd0c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/dd/02ddc3cc1a121d8e237578028f34a994a7548f0d086a1312133c3864dbff6b37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8a/ae/8aae623a251bd31627554141be2150a5ffb8ddea900ae244fd8492cc03245b36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/5a/ba5ad5064f9ef5d1429abd4c4742cf37b56589c060ff3995e5331eb69fb9c1c5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/8d/7f8dc2a2357a3d91ecc5fa5f125c73181dfbe22524d853f672010513044c80f7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/12/a7/12a785cd978d3ec0330adae618ad3103dd53f63c7c11b96a7a0d33254407aaa4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e6/f0/e6f0840fa125b6ad771b853937bd215b369bfb815ff521316cf6cb46fba66968'), PosixPath('/home/leandro/codeparrot-train/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/31/2d3127f22a64cf04b4ab8fd23512d5b7d6373429e36ffd68b3f86d0dff4e2fdb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/db/55dbc21eb4360618b60fc5eaa4ce705ea71bb1e8241237099cfe43c59ed5b2ed'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/d3/7dd37fe8445ee2641f14179d5a2aa636780822347d880a401d41c90bfd5cfd68'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/54/10/5410ae89d1cf3ea5325b7e948fd4db3d352e44bbd2a6a5c813f77be0da958c80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/04/7d049e95fe5200dc13c1451523e00fd08d37ffde2a863aa025f030f00d3d747b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/46/f84677f7389798b5c74ff00760d08732db022e99f60dc77e5bb4d900aa80dc60'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/a4/eba49c7ea511320fd7040022951873a465016ddb72d078b958a4003c396ffb52'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.idx'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/84/9684f7bb635a937d6899902ad758fd565826bfe5b8ea42c296d791dd7089b0f9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/28/29/28290f1947521e2d6c58ee18d83b864b5d95e1fad3b54ee817799991642488ec'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/b5/3ab5c68d9424b10ca45197172baa495813eae7efa9b3914ea4e4afd0201995b5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b8/ac/b8acca45caffd1db94c790f13ed8f1742b71d4f9cd3d242417e87bb150b6af20'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/13/77131f000b7ab27e1336a181a4e4188f31ed40cea3fdf98b6398b5bbddaa5c76'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/5f/1c5f7b819a67cfca7be02b743fbf0dabf7d53a1c7ddf82e70e094d92973d95c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/a5/1da55a92827ad63ee4eb1f5eabf14500459bf357c28b767756b80342024063d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/00/33/0033a83827749523a25d0ef661ef307b27edc162ce38c44e25fd033e9a187c76'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0d/07/0d07213fb514be71d57406af05dafff0edd3c7506621df761c9453ff598d89c9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b3/84/b3849196f2777c6e3fb662ae301ae63561db9aaff9bd2ac2f32ad02e9d26d399'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/84/2584f186110af7310075f15e07ddadb9c50c26cafd4c66b2e2baaab040028c3b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e3/62/e3627cc99f31126c54a8a4188ce59123e876c812bdbdc5cba35d2f76e369a385'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/ba/17ba31d8c126b19d7dc4899e46ec476e059462beaf2364bf77471b2f920ddf37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/f2/faf2e65a89fda5ec7a00a36b9fd6c4b2429f1249072b838f2a02d5d01fcaeb18'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/9a/a79a92653692037bf2fd6de92d93429455cd31dc7f96513adb40277d11be891d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e0/49/e049a0f4444d560849ab8c2d893157b975d183f839984001f101046ca74b7978'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/5b/4f5b4ba86fe51a134d866d06e472bd6c6f9d1f122cb905c65cb7c0a35bf51acd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3d/35/3d354291d12d6be3833eda95bd0db307dcd26b5b4287a3f6ca33b3b51b2e46f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/05/9b/059bc5381874a28e5a467291be6ee44e3f667609290d74e5ed009be10329bdbb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/e5/d0e599bab79fe0054313a92ab57e7a89c65c2fc45011168aa73c0fe000c4f689'), PosixPath('/home/leandro/codeparrot-train/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9d/a6/9da6dd8c62377fcfe1e95882a17aa711a8fcc38e02cf21cc1a678f22a9e50d39'), PosixPath('/home/leandro/codeparrot-train/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/commit-msg.sample')] -09/20/2021 14:28:34 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-train but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/ef/69efdcdb035636e6a8cd18cfc4ef702f95730a381b5d86b36c10028b4df94090'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/b0/70b01a02ca2810cf2e74a43655979028b31de42c566bc65d8b749720d1b08fb2'), PosixPath('/home/leandro/codeparrot-train/.git/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ed/ae/edae53c081ce347a58430f0930ce4fb318a9f62e15f85aa638a86c1666f70df4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/26/0826780cd0e3d564882321e246176eac0fb695b706bc72c6022925075047a62e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/15/95/159531500b1c473455d10fda2fb82f6ea7814500799e27eaf5f2be6f124f994c'), PosixPath('/home/leandro/codeparrot-train/.git/description'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ca/00/ca00ed91ba94519faaba619e5eec6498215695acc6b3f760dc056967cefeea80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/b9/14b9124b7b2ffa27d79dc210ae77b9b970e067ad7d3dc4d3eebc08671b770c16'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/4f/7f4fb07272574ef183fd21a911f45f989a941516a11fe1d71335954a54657e07'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f0/f9/f0f92a74ef6e03d0c05ae2012d7e33242c3b091f3e01d2d8f942e68cf295f7a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/d1/b9d1c713e023c821f98968ea670a01aa7127c1c915f3d7f6368616f17369e8f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/86/ba86bfbe83793efcb2e89df75179188dee67b96ace3e7f1628c133ce11fc361e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/fc/3afc8a938123d0f8e566043d271b4c6a60e3df968b72d8939982a09527763aae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/80/61/8061f4f61c3955c90dab77a1553ac22e9d1ff604c229375be54a38e32ce6f8ca'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/79/c1/79c13ad14568c659397387f3d0e1358393fb0041ff48ce9c98ad4f28df8cde4b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/b6/44b6239e61c700810037d9d8aa2fe706d7eaeb5766e492fad95411ad184490f5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/4f/144f1231964ab251596b40abdd80f37fe7ce4ac7b2b31fc517b942cc24110341'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6a/34/6a34d6e3ac6572933b2f66c74af568a0df3b91b94622dd4b7e5d5538c04071ff'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/20/d02098784b5ee7b5d5206ee9cc52e881782d98fc90530322af1c5cb7d401f1fd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/df/4fdfd51962dfc725568d88de53b29e285d52e858e849acb543101fe556779a42'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8e/81/8e81a5187b909a82581e8030a8008ffb9517519e477797b195bbcf422ef6e20c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/53/a05359f8e5ca97304272052f806034ebdca89a94f0d052b719b8b81dd8ddd868'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0b/de/0bde10d6ad4055811339a7ed51fca332317529d6b5854a4b7ce90000e352aa33'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9a/bd9af7b8106e0a773e5a12495aa88339995c2084c2f9a243733879eb73f595d8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/79/447953386aab39785c0f6c5e44b7310d433886fb73a1e40efe67c9620639e6fa'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/93/51/935137f4370f4f5c85ba6a157825fe6102edb991a46610fa9939e2960be9653d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b1/70/b1705347d88e73a7de652d1486a3eccda92e420e65a58917c88af635baf55ac8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/43/98/439848f817f432ceefdf7e69a64b60dd99a75cc6fb26599a0ea5ac1167c3db4c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8f/8a/8f8a74c1e1fc4ee43110f74ae0cc01de863a0ceb3f2c4815cab1dc1efeb5339a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/97/af/97af2a98400865661b26c3d5c0a3b6be51603452f459136bc9ab2568667ed199'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/81/7c/817cc36de53f7c914d82e2536a5538c21330ef54662366733e45c76a3c770d06'), PosixPath('/home/leandro/codeparrot-train/.git/config'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b4/2c/b42c05288d42233fb829266917ae1145a835f3ccf8e00ea21e5927f9528fb500'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/74/d574d02117a4209d073c3d382e859fdf07d6e18ac38bed8a4d900c8c9975550c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ef/8b/ef8b57ab3924e70df4f4a37b6853205113144fa01ea6c0140bea3a21b14eafeb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5b/66/5b66654660bc52d66f5bf0e6a62e0b65a0dd2499ec316daed0432efb2c7a8d7b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/a0/02a07bbab0f2b514c1a9d5296ca8c1a843aca846fcde56fc810700ee416db1b4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/09/c2/09c237a78f8a49d7840d8e5fc58e79db7e225b9904323f46791dce8fd0585332'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/85/28/8528503b464d6cbf8041e0a1481681d0bff4bb24f9d18230fe56c3bc99dfa2ab'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/13/ae/13ae38510e10076edaa24cf051e6403a270c95febd0e2e9b9e052128d632fe36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1f/46/1f46dcfefd87339930fa912ec98a56b7b93c2f052d7f452f82c9c3d0043ffa43'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/46/df/46df1517cd973f00262b495f82b10c46ec077a33bcfc83bade078a36590c6d0a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/2e/1c2e85e92de0f8a29ed6e534983e0051fa2c79e31013c11c7cc66f3f3f1e0155'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/38/ba38a25c6b8dd335baf2c6cd925ca5b91668af93f7ecee2b120ad352f46a6565'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/23/ee/23eed9f8512ca62c4b9b4fb28a84688ee550b75ec7658209f3cd5d82a2d4aa57'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e1/7a/e17a32eafebfa6f8d8b0edf6c0463c639f06a72fadae7907c9fd026f01136b98'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/04/64/04647e38d2a928e08abccf777e680adf7cb0066862374bd847c492de44cb047f'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/98/de/98de114cefba6caad86991425c276e59a5ab4a3a1006d29f73ec5cede6233efd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/a8/bda8ae48acb883ddb225719c3584e3baa76887afb7198d76478af06e7f80572e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/18/44181da41968eab59b99558c2afd4d6f95397bc2b580622a96f2f9fb74f545b2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/58/1458ee6ad39f24b25d2db9153ba9aa25f4ff2f16c2f624361a0186904a658a54'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/01/87/0187e92041e5ef1abe3190a48330ff50c7d5fc5ed1219c3bcbb465907430d34e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/26/142694003d3fc3bc57e51dab9eaf07472e0f24a4b092d70159943ecc8c2496a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/40/fa40f7fe8b2d031a32282dce9a40462d67eecff28203c1743fcace8ef4bb37e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/41/11/4111a00cda1b0988507f8b544a9e4da7bfb0bff35c13990c6fb1c360aa6a6688'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c3/d3/c3d3e55004ff21e36332b9612e385ba07c2610b832b4a94cca2d9fda372a9fb4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/03/bb/03bb832cf6fad7e4bc885cc1d9502cf312d2951a51afbd63fb6a90f53e49d096'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0f/70/0f704aab387aa4e2f0f4dd866d5f0888b25d0d0b61ef7881c38b918f22802ec2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/be/21be1bf5e86f5da2dbd83f0bb904a3d68d9abea09bbd5adab6a6873c53ed0112'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5f/34/5f342fc03b8d9c90aa9ff917ca3ff3edce748b6f0b55f61aadc9940ca53b45d5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/98/d59884b54759159fcaf45b671dfe9ee2a7d7aea34f1cc7762a1c25499589efb9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/60/07/6007f21e5625708f4710d48386db1297bb1dbd26196ced77b305e7e35da0300d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2c/a7/2ca7213ba4af470b5f4caa0b4439992b7483c8b4d1cb977089f9b9abef1c7fba'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/15/2d15883c4954ffcaafce389f10ccbad7c93e66fae3b7ca7db0a50343180cedf4'), PosixPath('/home/leandro/codeparrot-train/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/33/27/3327f7692a61d984758a71929f4466af87f91a2db0a656321df0d331ef4def20'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7c/bf/7cbfb385a3bbebdb3eed3e154c80f0c9bf6b397aa702e5410339c2b1d74ae867'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/35/4c35db8d1672615cddac65cdf0a76ea9ca1ec9d1d8b18ce293be0df23ff694db'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/49/d8/49d89abc121b49ef8a540796b63edd68f67f679d6ad1b969d6637d852d59f79f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/de/af/deaf9432f8e1fdc2bd3b9078dc3996c536e661ebb379b81818ecfc70a360c923'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/17/a21791d67c018e486dde68b8956a16b8fa0c54af93dc3c6ec2c669da87861b02'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f9/91/f9915d283d95c3316a76922f129897823efd397287916e8f7af88ed7aaf517b0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/ac/2bac46edf98c75901284aff8296f80fea6701821000b205bd85aef8399124074'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/07/b9/07b951a7cc55afc0d48a47f0dbd9e06c7311279e4a747256b5dcfe11ba56690d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/cf/84/cf84f4c64b1173bb12e281b88ca920c4c6d130c54214b5172bccbcc045fb2d0f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/82/4c/824c9524070c36ed317c12b9b0e77f8b9460e8519ba32c6795a5a2e7232d088c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/16/25162ca0d0fa0474f367ba4720b75f0cb10c70b3f62dd90cbb6e201773c99cb3'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/f9/96f9e109fe3ebce8c82610b0af4398170d678185b18ce5bc0384d84eb421ace5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/cc/a0ccfd373c5bb31028d4b7abb80a9a328395361cc2ac4f7376f5b1f6e89d89d0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f1/a5/f1a543df8fe1562a57657011c09d45778915a202f279013041e4f08d6cb1b475'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.pack'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/32/d9/32d95bf48e9ba4ed480df0015326b0ed07647ce17e84a48a5a445db22bc5de4a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6f/bc/6fbcee1936749498486745c2dd217ee108f1a243f054dcb2591cfee772906fae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/63/6963f0671c853a7bb7ae245df7c1f07fd8db821e59e1ab83b74d07909e029111'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d7/c8/d7c88386b6a3c339c8a6d0beead12bf440477473df676886099ca289057fbace'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/2c/4f2cb5d9fe3ef94da4aa3ec743d37b83c2347d6f1d3d4696a5c667ff9968ea38'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/64/35/643576ec614d0ba328db99ae865b8f1321ec4f288164f76fd6746b3b83e34f19'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/73/a973fc07ce8ae881a878bf92c6c70583c08ea6bdb2ca2583002271f96dab9543'), PosixPath('/home/leandro/codeparrot-train/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/f9/87f9d6d6889eb78e70ba55d2f959fa4e896bd3a78d02dd347792e30ddd730bf6'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/ff/2aff254f1288353b713d8e718915f8a2eba7d65097ed5f5d0df520a7058ddf71'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/89/178953ae530dc7960c803bd22a37026f4190b822b95145240537840bfc5a1ad1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/83/9c83dabc6a7c8a9629093125ff70fc60f594b0b95cb56f2f12d2bd91352367c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2e/b3/2eb3b4ea8f84ef14a84b43002a148d99df05f68c1cfc0c0f074572bda0e0e1ee'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f3/5e/f35ec6ce622145756740be75b1fa969996e7e716ac0a15d9bbc4e86aed616000'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/da/17dac3999cf0cb027901ecb382180aa9560b4bb2c5b839f3afc8cadc229962bf'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/85/2b85d040d424bde044014147be3c4949a8d2b0e558c4f4c2c65aead5ece2cde9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/f5/6bf5fd370b20157e47d88709fb5c8b572f1b682a1fdb80091900bfda70a36491'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/22/c4/22c47cc7619654f7faafe250a2dd0cabae5520263e967245b8d5638215244239'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0a/03/0a03d68d6dda083d189878113e864c580b9b5572e53d3e1684b93a9996c7699d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/b9/dab942e6da72846fc60682ce21a8e8fa6bf3452a29abff69ec0750e058ab3b92'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/ce/6bce0dd945b67accdd3077504bc286a26bdb4b03fbbf34d427c21582f3374994'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/78/bb/78bbf19a9e7a29b17fa71e3d05842b9469e3187e938efd8c793ceadbdd38c709'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/4a/084a245793d30784f6ae4f8b666624293bdab2d05a5e1eeadf20b7d9db444951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/9d/379db3f5d257369fd927b7395599ec2aef5cefcb57811a57281487da9fd58c5b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/fb/87fb4ab74dad4c0f520d49769333d5d1b010fcb9e8f30c8dab16430a5a0af9d2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ee/25/ee25b95231437c8795fca58f4a4d95b2698995f29e7f264956f78670f37ea982'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/6b/2a6b5f923b286f640ad586bc295e653ec0db8e4c8487db1c25fa384e216b6ce5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/34/eb344442f4771eb011e0e520b8b1666903717e5e8c59a5462fe80aa82401940a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/10/4c10f31fa342f81c13b27e7ae0761b17729ee82f6e02824361e2cfcc4ab096c1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/94/e0/94e011d7b77e55164bb15d95c453fa1282d78e234ff378adb930d756bbd33f64'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/45/da/45da5a5e4acd37b6e288eb4045434fb6b4a8d77979ac61c8306ca9eca6d24128'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/75/9c7526f2ec341f2d2483d9db25b2b2e9fe630b21b737fa7ebbc19965c6ee46b1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/cb/55cb3e32311273135568ef3da7960400d95f63dad586ccfe56996561277b483f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4a/54/4a54ecd83d3083585ddc7beb921140b2b2e5b4fb82dec9543ac0932c6136e84b'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/e1/21e166aee17c30af55849b552e2eaa9c0641dc6cb0ac6386bd3f7797d8af2a9b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/50/83/5083522f9ebdb4c72e4e384dfd9bce8293d84dcdf0a7580cab1ce8e44f2880da'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/83/14830fec70eb2227647b241d9ff90addbc461cbdcddfe12e015028cefaba6f4e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/35/70353ba511fe03b0f820a7ef6156771de34ef20a404a1cc2c064033998de0f9f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b7/d8/b7d84fc6c01ec6eb79187a7e252a3f033bfd1f2ba297d569e1bf507af9b50fa6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/95/2e/952eaf2d8448261925753def51d58ff5af595d6469207db42abc0b17204640fb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fc/eb/fcebafda8e3681732437c98581a30faedf7802c6b90c84394d2c42b792c32507'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/df/a9dfb7586f9a1bfaaa7175a2384e101f51513b0b98ce01eeaafe5a783cdbad96'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6d/c7/6dc73c3794ad5c29870563658a7003cb2a6cfb0c1852c47037a6eda6cc3cf3a1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/8a/c08ad7d3c85ef3631747172211b65c70912bae157b55f922f1f70016bf7f64e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ff/bc/ffbc64d8a248deb916c3ef209d2a18fc5de5c56a2cfa546a633cbfec31e6ccb2'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/26/99/2699022bd98f8d49f5505ab457b15dd31156713279335d0c28db1c99edc36894'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/af/a2af1215060dc01f13d389abee1fc25ff94ed84262c54dea264810a5bcc074fc'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/07/b907e571662c19245abd148afb306b5c6e411d24a5117e0bb4c182a56afb9b97'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/f2/37f2a405d0e8c52b4a51f79b23f135bcb537eb3f61fe8a27a29ab63b74a37671'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/63/77/6377867a616a0b6e8e3e3691c5cce9cd566773ec5bbd02f5a457edac8a0f24d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/db/d4/dbd4ddc668c0c838eecd756db64c9a3c2127d8e9bbc05b3fcba00b075854b24c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/b3/1db3132794e05cd2decef99af5f56073af4b4a27c33e3a0d0b4289e61b34c9dc'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1e/89/1e890b33c7f95f900932797f1ba2b15f1f1780926f744ea04e0a969bf270df1a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/6f/1c6ff13e754a4260b097390066ecc973302f45756b4151bbfb7efbb7b1ac9963'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/6e/da6e9d2f263cf7b0254b4c0a57483ed8ac9652d6f67a63d648e9d968c576d526'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5c/d6/5cd6e14ff3ac522a3a7bac22ef6ec299833c685a9c343d347fe21152e4173856'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/39/32/39325e24ddd711eacc61305d421e004de68e6f6d0b649ca695ad53d4dc53b47f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/47/d1/47d1fedd443c4edfca241c00be8984a2157c668726cc06d92ad7e2704cb5c951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/11/70/1170a8200f43dfa3902e9d41088229febdf4d7044d9d762dd5809685e5448b11'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/0f/c00f0550d90e881145954ad24df7fdf512ffc3d63c50d2aa0c85774757d8f37d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b5/3e/b53e982e883c26c1a21db49bff0a27d8d628f4fc498715739936fa93bfb5353e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/10/4410ab4420ffe54105620e1f038b0f6b14afa88a8df9dcf63468f6a2c105d770'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1b/c7/1bc7cd472751ec9917bf55ce8b05b8ea467453335103f16c4551e94daefdbaf0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/62/03/6203a1aae8671a6a23849de3aa6aa3efec0e3fbe3275757643abfd63a9ee9af8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/63/7763fa2cb60958f8d28fc6bebc0105ed3614addd32296fe929b7262e4d62f58a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/3b/f83b75420e369ae1d55e7009effe9f7a05577a31c19a8c02ce7f0b56b5dc8a87'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/3d/6b3d8a7164286112196af65658426d2faeda5c50fc381bdebf378f0226342d4e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9b/bd9be9097633349b5ecd400375be5d511e812feadf983f3c2cbcba263a3a14ab'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e9/95/e995f5605e676fd577e4c78ee6bf43451324ddbcb04e841cf1dfce07c69dc1b6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8b/d9/8bd964dad421ed624f4bd5e4719e3e28f62d002b350d850e902688c9e9bcfd80'), PosixPath('/home/leandro/codeparrot-train/.git/index'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d6/ec/d6ecd24bfd9e0c2877dfa00417568e07d9f64a150c5518d471ff91ded60bf146'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/b0/4cb0db5e545856bfeb62f7fa15d3472b705ac8fdeb8c4a831727b730951f8902'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/6e/a76e8e4bbc39a74e4ff59e02aaf1404a8bc429f1033a216058b09f7e0ee3cd0c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/dd/02ddc3cc1a121d8e237578028f34a994a7548f0d086a1312133c3864dbff6b37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8a/ae/8aae623a251bd31627554141be2150a5ffb8ddea900ae244fd8492cc03245b36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/5a/ba5ad5064f9ef5d1429abd4c4742cf37b56589c060ff3995e5331eb69fb9c1c5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/8d/7f8dc2a2357a3d91ecc5fa5f125c73181dfbe22524d853f672010513044c80f7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/12/a7/12a785cd978d3ec0330adae618ad3103dd53f63c7c11b96a7a0d33254407aaa4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e6/f0/e6f0840fa125b6ad771b853937bd215b369bfb815ff521316cf6cb46fba66968'), PosixPath('/home/leandro/codeparrot-train/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/31/2d3127f22a64cf04b4ab8fd23512d5b7d6373429e36ffd68b3f86d0dff4e2fdb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/db/55dbc21eb4360618b60fc5eaa4ce705ea71bb1e8241237099cfe43c59ed5b2ed'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/d3/7dd37fe8445ee2641f14179d5a2aa636780822347d880a401d41c90bfd5cfd68'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/54/10/5410ae89d1cf3ea5325b7e948fd4db3d352e44bbd2a6a5c813f77be0da958c80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/04/7d049e95fe5200dc13c1451523e00fd08d37ffde2a863aa025f030f00d3d747b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/46/f84677f7389798b5c74ff00760d08732db022e99f60dc77e5bb4d900aa80dc60'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/a4/eba49c7ea511320fd7040022951873a465016ddb72d078b958a4003c396ffb52'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.idx'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/84/9684f7bb635a937d6899902ad758fd565826bfe5b8ea42c296d791dd7089b0f9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/28/29/28290f1947521e2d6c58ee18d83b864b5d95e1fad3b54ee817799991642488ec'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/b5/3ab5c68d9424b10ca45197172baa495813eae7efa9b3914ea4e4afd0201995b5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b8/ac/b8acca45caffd1db94c790f13ed8f1742b71d4f9cd3d242417e87bb150b6af20'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/13/77131f000b7ab27e1336a181a4e4188f31ed40cea3fdf98b6398b5bbddaa5c76'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/5f/1c5f7b819a67cfca7be02b743fbf0dabf7d53a1c7ddf82e70e094d92973d95c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/a5/1da55a92827ad63ee4eb1f5eabf14500459bf357c28b767756b80342024063d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/00/33/0033a83827749523a25d0ef661ef307b27edc162ce38c44e25fd033e9a187c76'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0d/07/0d07213fb514be71d57406af05dafff0edd3c7506621df761c9453ff598d89c9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b3/84/b3849196f2777c6e3fb662ae301ae63561db9aaff9bd2ac2f32ad02e9d26d399'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/84/2584f186110af7310075f15e07ddadb9c50c26cafd4c66b2e2baaab040028c3b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e3/62/e3627cc99f31126c54a8a4188ce59123e876c812bdbdc5cba35d2f76e369a385'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/ba/17ba31d8c126b19d7dc4899e46ec476e059462beaf2364bf77471b2f920ddf37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/f2/faf2e65a89fda5ec7a00a36b9fd6c4b2429f1249072b838f2a02d5d01fcaeb18'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/9a/a79a92653692037bf2fd6de92d93429455cd31dc7f96513adb40277d11be891d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e0/49/e049a0f4444d560849ab8c2d893157b975d183f839984001f101046ca74b7978'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/5b/4f5b4ba86fe51a134d866d06e472bd6c6f9d1f122cb905c65cb7c0a35bf51acd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3d/35/3d354291d12d6be3833eda95bd0db307dcd26b5b4287a3f6ca33b3b51b2e46f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/05/9b/059bc5381874a28e5a467291be6ee44e3f667609290d74e5ed009be10329bdbb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/e5/d0e599bab79fe0054313a92ab57e7a89c65c2fc45011168aa73c0fe000c4f689'), PosixPath('/home/leandro/codeparrot-train/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9d/a6/9da6dd8c62377fcfe1e95882a17aa711a8fcc38e02cf21cc1a678f22a9e50d39'), PosixPath('/home/leandro/codeparrot-train/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/commit-msg.sample')] -09/20/2021 14:28:34 - WARNING - datasets.builder - Using custom data configuration codeparrot-train-272006ad98f3f880 -09/20/2021 14:28:34 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-valid but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-valid/.git/lfs/objects/43/23/432375a8140ca79af9fa62e3145815c0f7965af8026ed1847ce6e75a11f413fd'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/config'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/f3/fa800d7629eabb8ba09a504140b5a203d1341a'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/0b/0462e46b355e305d77ff3b85f3a01776e188ea'), PosixPath('/home/leandro/codeparrot-valid/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-valid/.git/index'), PosixPath('/home/leandro/codeparrot-valid/.git/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/5e/9d29c73e4d5b8ecb2b60628d17a791508a514f'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/c9/b135a100a1770bcdc5ae26195bd4f7bd85a764'), PosixPath('/home/leandro/codeparrot-valid/.git/description'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/07/f0db3339ad9053dc95b284c4ae14e014efff89'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/d7/b8c495dd9e6df27bfd6a47dad7e33da0850a5b'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/c6/7ccd65e0057c57364469d576a57387eaa57530'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-checkout')] -09/20/2021 14:28:34 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-valid but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-valid/.git/lfs/objects/43/23/432375a8140ca79af9fa62e3145815c0f7965af8026ed1847ce6e75a11f413fd'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/config'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/f3/fa800d7629eabb8ba09a504140b5a203d1341a'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/0b/0462e46b355e305d77ff3b85f3a01776e188ea'), PosixPath('/home/leandro/codeparrot-valid/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-valid/.git/index'), PosixPath('/home/leandro/codeparrot-valid/.git/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/5e/9d29c73e4d5b8ecb2b60628d17a791508a514f'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/c9/b135a100a1770bcdc5ae26195bd4f7bd85a764'), PosixPath('/home/leandro/codeparrot-valid/.git/description'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/07/f0db3339ad9053dc95b284c4ae14e014efff89'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/d7/b8c495dd9e6df27bfd6a47dad7e33da0850a5b'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/c6/7ccd65e0057c57364469d576a57387eaa57530'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-checkout')] -09/20/2021 14:28:34 - WARNING - datasets.builder - Using custom data configuration codeparrot-valid-faf4c4ef77c080fb -09/20/2021 14:29:08 - INFO - __main__ - Step 1: {'lr': 0.0, 'samples': 32, 'steps': 0, 'loss/train': 10.774224281311035} -09/20/2021 14:29:09 - INFO - root - Reducer buckets have been rebuilt in this iteration. -09/20/2021 14:29:09 - INFO - __main__ - Step 2: {'lr': 0.0, 'samples': 64, 'steps': 0, 'loss/train': 10.773880004882812} -09/20/2021 14:29:10 - INFO - __main__ - Step 3: {'lr': 0.0, 'samples': 96, 'steps': 0, 'loss/train': 10.767656326293945} -09/20/2021 14:29:10 - INFO - __main__ - Step 4: {'lr': 0.0, 'samples': 128, 'steps': 0, 'loss/train': 10.722071647644043} -09/20/2021 14:29:11 - INFO - __main__ - Step 5: {'lr': 0.0, 'samples': 160, 'steps': 0, 'loss/train': 10.732088088989258} -09/20/2021 14:29:12 - INFO - __main__ - Step 6: {'lr': 0.0, 'samples': 192, 'steps': 0, 'loss/train': 10.84278392791748} -09/20/2021 14:29:13 - INFO - __main__ - Step 7: {'lr': 0.0, 'samples': 224, 'steps': 0, 'loss/train': 10.884531021118164} -09/20/2021 14:29:13 - INFO - __main__ - Step 8: {'lr': 0.0, 'samples': 256, 'steps': 0, 'loss/train': 10.75090503692627} -09/20/2021 14:29:14 - INFO - __main__ - Step 9: {'lr': 0.0, 'samples': 288, 'steps': 0, 'loss/train': 10.733172416687012} -09/20/2021 14:29:15 - INFO - __main__ - Step 10: {'lr': 0.0, 'samples': 320, 'steps': 0, 'loss/train': 10.730609893798828} -09/20/2021 14:29:16 - INFO - __main__ - Step 11: {'lr': 0.0, 'samples': 352, 'steps': 0, 'loss/train': 10.706088066101074} -09/20/2021 14:29:16 - INFO - __main__ - Step 12: {'lr': 0.0, 'samples': 384, 'steps': 0, 'loss/train': 10.75394058227539} -09/20/2021 14:29:17 - INFO - __main__ - Step 13: {'lr': 0.0, 'samples': 416, 'steps': 0, 'loss/train': 10.684357643127441} -09/20/2021 14:29:18 - INFO - __main__ - Step 14: {'lr': 0.0, 'samples': 448, 'steps': 0, 'loss/train': 10.784319877624512} -09/20/2021 14:29:19 - INFO - __main__ - Step 15: {'lr': 0.0, 'samples': 480, 'steps': 0, 'loss/train': 10.79415225982666} -09/20/2021 14:29:19 - INFO - __main__ - Step 16: {'lr': 0.0, 'samples': 512, 'steps': 0, 'loss/train': 10.708978652954102} -09/20/2021 14:29:23 - INFO - __main__ - Step 17: {'lr': 2.6666666666666667e-07, 'samples': 544, 'steps': 1, 'loss/train': 10.737349510192871} -09/20/2021 14:29:23 - INFO - __main__ - Step 18: {'lr': 2.6666666666666667e-07, 'samples': 576, 'steps': 1, 'loss/train': 10.779191970825195} -09/20/2021 14:29:24 - INFO - __main__ - Step 19: {'lr': 2.6666666666666667e-07, 'samples': 608, 'steps': 1, 'loss/train': 10.796072959899902} -09/20/2021 14:29:25 - INFO - __main__ - Step 20: {'lr': 2.6666666666666667e-07, 'samples': 640, 'steps': 1, 'loss/train': 10.821568489074707} -09/20/2021 14:29:26 - INFO - __main__ - Step 21: {'lr': 2.6666666666666667e-07, 'samples': 672, 'steps': 1, 'loss/train': 10.740201950073242} -09/20/2021 14:29:26 - INFO - __main__ - Step 22: {'lr': 2.6666666666666667e-07, 'samples': 704, 'steps': 1, 'loss/train': 10.696013450622559} -09/20/2021 14:29:27 - INFO - __main__ - Step 23: {'lr': 2.6666666666666667e-07, 'samples': 736, 'steps': 1, 'loss/train': 10.770585060119629} -09/20/2021 14:29:28 - INFO - __main__ - Step 24: {'lr': 2.6666666666666667e-07, 'samples': 768, 'steps': 1, 'loss/train': 10.790505409240723} -09/20/2021 14:29:29 - INFO - __main__ - Step 25: {'lr': 2.6666666666666667e-07, 'samples': 800, 'steps': 1, 'loss/train': 10.688878059387207} -09/20/2021 14:29:29 - INFO - __main__ - Step 26: {'lr': 2.6666666666666667e-07, 'samples': 832, 'steps': 1, 'loss/train': 10.761898040771484} -09/20/2021 14:29:30 - INFO - __main__ - Step 27: {'lr': 2.6666666666666667e-07, 'samples': 864, 'steps': 1, 'loss/train': 10.70787525177002} -09/20/2021 14:29:31 - INFO - __main__ - Step 28: {'lr': 2.6666666666666667e-07, 'samples': 896, 'steps': 1, 'loss/train': 10.706584930419922} -09/20/2021 14:29:32 - INFO - __main__ - Step 29: {'lr': 2.6666666666666667e-07, 'samples': 928, 'steps': 1, 'loss/train': 10.73019790649414} -09/20/2021 14:29:32 - INFO - __main__ - Step 30: {'lr': 2.6666666666666667e-07, 'samples': 960, 'steps': 1, 'loss/train': 10.784171104431152} -09/20/2021 14:29:34 - INFO - __main__ - Step 31: {'lr': 2.6666666666666667e-07, 'samples': 992, 'steps': 1, 'loss/train': 10.767316818237305} -09/20/2021 14:29:34 - INFO - __main__ - Step 32: {'lr': 2.6666666666666667e-07, 'samples': 1024, 'steps': 1, 'loss/train': 10.746819496154785} -09/20/2021 14:29:35 - INFO - __main__ - Step 33: {'lr': 5.333333333333333e-07, 'samples': 1056, 'steps': 2, 'loss/train': 10.554855346679688} -09/20/2021 14:29:36 - INFO - __main__ - Step 34: {'lr': 5.333333333333333e-07, 'samples': 1088, 'steps': 2, 'loss/train': 10.542468070983887} -09/20/2021 14:29:37 - INFO - __main__ - Step 35: {'lr': 5.333333333333333e-07, 'samples': 1120, 'steps': 2, 'loss/train': 10.611211776733398} -09/20/2021 14:29:38 - INFO - __main__ - Step 36: {'lr': 5.333333333333333e-07, 'samples': 1152, 'steps': 2, 'loss/train': 10.654096603393555} -09/20/2021 14:29:38 - INFO - __main__ - Step 37: {'lr': 5.333333333333333e-07, 'samples': 1184, 'steps': 2, 'loss/train': 10.674487113952637} -09/20/2021 14:29:39 - INFO - __main__ - Step 38: {'lr': 5.333333333333333e-07, 'samples': 1216, 'steps': 2, 'loss/train': 10.66421890258789} -09/20/2021 14:29:40 - INFO - __main__ - Step 39: {'lr': 5.333333333333333e-07, 'samples': 1248, 'steps': 2, 'loss/train': 10.655780792236328} -09/20/2021 14:29:41 - INFO - __main__ - Step 40: {'lr': 5.333333333333333e-07, 'samples': 1280, 'steps': 2, 'loss/train': 10.635687828063965} -09/20/2021 14:29:41 - INFO - __main__ - Step 41: {'lr': 5.333333333333333e-07, 'samples': 1312, 'steps': 2, 'loss/train': 10.692303657531738} -09/20/2021 14:29:42 - INFO - __main__ - Step 42: {'lr': 5.333333333333333e-07, 'samples': 1344, 'steps': 2, 'loss/train': 10.68622875213623} -09/20/2021 14:29:43 - INFO - __main__ - Step 43: {'lr': 5.333333333333333e-07, 'samples': 1376, 'steps': 2, 'loss/train': 10.666109085083008} -09/20/2021 14:29:44 - INFO - __main__ - Step 44: {'lr': 5.333333333333333e-07, 'samples': 1408, 'steps': 2, 'loss/train': 10.588134765625} -09/20/2021 14:29:44 - INFO - __main__ - Step 45: {'lr': 5.333333333333333e-07, 'samples': 1440, 'steps': 2, 'loss/train': 10.62142562866211} -09/20/2021 14:29:45 - INFO - __main__ - Step 46: {'lr': 5.333333333333333e-07, 'samples': 1472, 'steps': 2, 'loss/train': 10.657995223999023} -09/20/2021 14:29:46 - INFO - __main__ - Step 47: {'lr': 5.333333333333333e-07, 'samples': 1504, 'steps': 2, 'loss/train': 10.694281578063965} -09/20/2021 14:29:47 - INFO - __main__ - Step 48: {'lr': 5.333333333333333e-07, 'samples': 1536, 'steps': 2, 'loss/train': 10.558058738708496} -09/20/2021 14:29:47 - INFO - __main__ - Step 49: {'lr': 8.000000000000001e-07, 'samples': 1568, 'steps': 3, 'loss/train': 10.35663890838623} -09/20/2021 14:29:48 - INFO - __main__ - Step 50: {'lr': 8.000000000000001e-07, 'samples': 1600, 'steps': 3, 'loss/train': 10.246391296386719} -09/20/2021 14:29:49 - INFO - __main__ - Step 51: {'lr': 8.000000000000001e-07, 'samples': 1632, 'steps': 3, 'loss/train': 10.446417808532715} -09/20/2021 14:29:50 - INFO - __main__ - Step 52: {'lr': 8.000000000000001e-07, 'samples': 1664, 'steps': 3, 'loss/train': 10.491007804870605} -09/20/2021 14:29:50 - INFO - __main__ - Step 53: {'lr': 8.000000000000001e-07, 'samples': 1696, 'steps': 3, 'loss/train': 10.480436325073242} -09/20/2021 14:29:51 - INFO - __main__ - Step 54: {'lr': 8.000000000000001e-07, 'samples': 1728, 'steps': 3, 'loss/train': 10.535933494567871} -09/20/2021 14:29:52 - INFO - __main__ - Step 55: {'lr': 8.000000000000001e-07, 'samples': 1760, 'steps': 3, 'loss/train': 10.369260787963867} -09/20/2021 14:29:53 - INFO - __main__ - Step 56: {'lr': 8.000000000000001e-07, 'samples': 1792, 'steps': 3, 'loss/train': 10.359262466430664} -09/20/2021 14:29:53 - INFO - __main__ - Step 57: {'lr': 8.000000000000001e-07, 'samples': 1824, 'steps': 3, 'loss/train': 10.416579246520996} -09/20/2021 14:29:54 - INFO - __main__ - Step 58: {'lr': 8.000000000000001e-07, 'samples': 1856, 'steps': 3, 'loss/train': 10.384167671203613} -09/20/2021 14:29:55 - INFO - __main__ - Step 59: {'lr': 8.000000000000001e-07, 'samples': 1888, 'steps': 3, 'loss/train': 10.269042015075684} -09/20/2021 14:29:56 - INFO - __main__ - Step 60: {'lr': 8.000000000000001e-07, 'samples': 1920, 'steps': 3, 'loss/train': 10.261059761047363} -09/20/2021 14:29:57 - INFO - __main__ - Step 61: {'lr': 8.000000000000001e-07, 'samples': 1952, 'steps': 3, 'loss/train': 10.493464469909668} -09/20/2021 14:29:58 - INFO - __main__ - Step 62: {'lr': 8.000000000000001e-07, 'samples': 1984, 'steps': 3, 'loss/train': 10.554738998413086} -09/20/2021 14:29:59 - INFO - __main__ - Step 63: {'lr': 8.000000000000001e-07, 'samples': 2016, 'steps': 3, 'loss/train': 10.338383674621582} -09/20/2021 14:29:59 - INFO - __main__ - Step 64: {'lr': 8.000000000000001e-07, 'samples': 2048, 'steps': 3, 'loss/train': 10.318178176879883} -09/20/2021 14:30:00 - INFO - __main__ - Step 65: {'lr': 1.0666666666666667e-06, 'samples': 2080, 'steps': 4, 'loss/train': 10.486148834228516} -09/20/2021 14:30:01 - INFO - __main__ - Step 66: {'lr': 1.0666666666666667e-06, 'samples': 2112, 'steps': 4, 'loss/train': 9.866499900817871} -09/20/2021 14:30:02 - INFO - __main__ - Step 67: {'lr': 1.0666666666666667e-06, 'samples': 2144, 'steps': 4, 'loss/train': 10.016646385192871} -09/20/2021 14:30:02 - INFO - __main__ - Step 68: {'lr': 1.0666666666666667e-06, 'samples': 2176, 'steps': 4, 'loss/train': 10.115442276000977} -09/20/2021 14:30:03 - INFO - __main__ - Step 69: {'lr': 1.0666666666666667e-06, 'samples': 2208, 'steps': 4, 'loss/train': 10.429139137268066} -09/20/2021 14:30:04 - INFO - __main__ - Step 70: {'lr': 1.0666666666666667e-06, 'samples': 2240, 'steps': 4, 'loss/train': 10.14297103881836} -09/20/2021 14:30:05 - INFO - __main__ - Step 71: {'lr': 1.0666666666666667e-06, 'samples': 2272, 'steps': 4, 'loss/train': 10.298738479614258} -09/20/2021 14:30:05 - INFO - __main__ - Step 72: {'lr': 1.0666666666666667e-06, 'samples': 2304, 'steps': 4, 'loss/train': 9.949441909790039} -09/20/2021 14:30:06 - INFO - __main__ - Step 73: {'lr': 1.0666666666666667e-06, 'samples': 2336, 'steps': 4, 'loss/train': 10.0211181640625} -09/20/2021 14:30:07 - INFO - __main__ - Step 74: {'lr': 1.0666666666666667e-06, 'samples': 2368, 'steps': 4, 'loss/train': 10.10930061340332} -09/20/2021 14:30:08 - INFO - __main__ - Step 75: {'lr': 1.0666666666666667e-06, 'samples': 2400, 'steps': 4, 'loss/train': 9.967339515686035} -09/20/2021 14:30:08 - INFO - __main__ - Step 76: {'lr': 1.0666666666666667e-06, 'samples': 2432, 'steps': 4, 'loss/train': 10.142324447631836} -09/20/2021 14:30:09 - INFO - __main__ - Step 77: {'lr': 1.0666666666666667e-06, 'samples': 2464, 'steps': 4, 'loss/train': 10.118136405944824} -09/20/2021 14:30:10 - INFO - __main__ - Step 78: {'lr': 1.0666666666666667e-06, 'samples': 2496, 'steps': 4, 'loss/train': 10.269981384277344} -09/20/2021 14:30:11 - INFO - __main__ - Step 79: {'lr': 1.0666666666666667e-06, 'samples': 2528, 'steps': 4, 'loss/train': 10.001642227172852} -09/20/2021 14:30:11 - INFO - __main__ - Step 80: {'lr': 1.0666666666666667e-06, 'samples': 2560, 'steps': 4, 'loss/train': 10.20645809173584} -09/20/2021 14:30:12 - INFO - __main__ - Step 81: {'lr': 1.3333333333333334e-06, 'samples': 2592, 'steps': 5, 'loss/train': 9.521819114685059} -09/20/2021 14:30:13 - INFO - __main__ - Step 82: {'lr': 1.3333333333333334e-06, 'samples': 2624, 'steps': 5, 'loss/train': 9.153255462646484} -09/20/2021 14:30:14 - INFO - __main__ - Step 83: {'lr': 1.3333333333333334e-06, 'samples': 2656, 'steps': 5, 'loss/train': 9.59922981262207} -09/20/2021 14:30:15 - INFO - __main__ - Step 84: {'lr': 1.3333333333333334e-06, 'samples': 2688, 'steps': 5, 'loss/train': 9.901582717895508} -09/20/2021 14:30:15 - INFO - __main__ - Step 85: {'lr': 1.3333333333333334e-06, 'samples': 2720, 'steps': 5, 'loss/train': 9.615211486816406} -09/20/2021 14:30:16 - INFO - __main__ - Step 86: {'lr': 1.3333333333333334e-06, 'samples': 2752, 'steps': 5, 'loss/train': 9.898027420043945} -09/20/2021 14:30:17 - INFO - __main__ - Step 87: {'lr': 1.3333333333333334e-06, 'samples': 2784, 'steps': 5, 'loss/train': 9.768525123596191} -09/20/2021 14:30:18 - INFO - __main__ - Step 88: {'lr': 1.3333333333333334e-06, 'samples': 2816, 'steps': 5, 'loss/train': 9.708690643310547} -09/20/2021 14:30:18 - INFO - __main__ - Step 89: {'lr': 1.3333333333333334e-06, 'samples': 2848, 'steps': 5, 'loss/train': 9.709917068481445} -09/20/2021 14:30:19 - INFO - __main__ - Step 90: {'lr': 1.3333333333333334e-06, 'samples': 2880, 'steps': 5, 'loss/train': 9.90368366241455} -09/20/2021 14:30:20 - INFO - __main__ - Step 91: {'lr': 1.3333333333333334e-06, 'samples': 2912, 'steps': 5, 'loss/train': 9.923727035522461} -09/20/2021 14:30:21 - INFO - __main__ - Step 92: {'lr': 1.3333333333333334e-06, 'samples': 2944, 'steps': 5, 'loss/train': 9.70739459991455} -09/20/2021 14:30:22 - INFO - __main__ - Step 93: {'lr': 1.3333333333333334e-06, 'samples': 2976, 'steps': 5, 'loss/train': 10.378307342529297} -09/20/2021 14:30:23 - INFO - __main__ - Step 94: {'lr': 1.3333333333333334e-06, 'samples': 3008, 'steps': 5, 'loss/train': 9.757561683654785} -09/20/2021 14:30:23 - INFO - __main__ - Step 95: {'lr': 1.3333333333333334e-06, 'samples': 3040, 'steps': 5, 'loss/train': 9.830108642578125} -09/20/2021 14:30:24 - INFO - __main__ - Step 96: {'lr': 1.3333333333333334e-06, 'samples': 3072, 'steps': 5, 'loss/train': 9.712736129760742} -09/20/2021 14:30:25 - INFO - __main__ - Step 97: {'lr': 1.6000000000000001e-06, 'samples': 3104, 'steps': 6, 'loss/train': 8.879112243652344} -09/20/2021 14:30:26 - INFO - __main__ - Step 98: {'lr': 1.6000000000000001e-06, 'samples': 3136, 'steps': 6, 'loss/train': 9.553325653076172} -09/20/2021 14:30:27 - INFO - __main__ - Step 99: {'lr': 1.6000000000000001e-06, 'samples': 3168, 'steps': 6, 'loss/train': 9.50730037689209} -09/20/2021 14:30:27 - INFO - __main__ - Step 100: {'lr': 1.6000000000000001e-06, 'samples': 3200, 'steps': 6, 'loss/train': 8.97494888305664} -09/20/2021 14:30:28 - INFO - __main__ - Step 101: {'lr': 1.6000000000000001e-06, 'samples': 3232, 'steps': 6, 'loss/train': 9.469138145446777} -09/20/2021 14:30:29 - INFO - __main__ - Step 102: {'lr': 1.6000000000000001e-06, 'samples': 3264, 'steps': 6, 'loss/train': 9.426682472229004} -09/20/2021 14:30:30 - INFO - __main__ - Step 103: {'lr': 1.6000000000000001e-06, 'samples': 3296, 'steps': 6, 'loss/train': 9.113446235656738} -09/20/2021 14:30:30 - INFO - __main__ - Step 104: {'lr': 1.6000000000000001e-06, 'samples': 3328, 'steps': 6, 'loss/train': 10.258001327514648} -09/20/2021 14:30:31 - INFO - __main__ - Step 105: {'lr': 1.6000000000000001e-06, 'samples': 3360, 'steps': 6, 'loss/train': 9.601887702941895} -09/20/2021 14:30:32 - INFO - __main__ - Step 106: {'lr': 1.6000000000000001e-06, 'samples': 3392, 'steps': 6, 'loss/train': 9.146980285644531} -09/20/2021 14:30:33 - INFO - __main__ - Step 107: {'lr': 1.6000000000000001e-06, 'samples': 3424, 'steps': 6, 'loss/train': 9.780786514282227} -09/20/2021 14:30:33 - INFO - __main__ - Step 108: {'lr': 1.6000000000000001e-06, 'samples': 3456, 'steps': 6, 'loss/train': 8.951713562011719} -09/20/2021 14:30:34 - INFO - __main__ - Step 109: {'lr': 1.6000000000000001e-06, 'samples': 3488, 'steps': 6, 'loss/train': 9.512404441833496} -09/20/2021 14:30:35 - INFO - __main__ - Step 110: {'lr': 1.6000000000000001e-06, 'samples': 3520, 'steps': 6, 'loss/train': 8.844427108764648} -09/20/2021 14:30:36 - INFO - __main__ - Step 111: {'lr': 1.6000000000000001e-06, 'samples': 3552, 'steps': 6, 'loss/train': 9.457303047180176} -09/20/2021 14:30:36 - INFO - __main__ - Step 112: {'lr': 1.6000000000000001e-06, 'samples': 3584, 'steps': 6, 'loss/train': 9.350332260131836} -09/20/2021 14:30:37 - INFO - __main__ - Step 113: {'lr': 1.8666666666666669e-06, 'samples': 3616, 'steps': 7, 'loss/train': 9.144501686096191} -09/20/2021 14:30:38 - INFO - __main__ - Step 114: {'lr': 1.8666666666666669e-06, 'samples': 3648, 'steps': 7, 'loss/train': 9.371633529663086} -09/20/2021 14:30:39 - INFO - __main__ - Step 115: {'lr': 1.8666666666666669e-06, 'samples': 3680, 'steps': 7, 'loss/train': 9.51986026763916} -09/20/2021 14:30:39 - INFO - __main__ - Step 116: {'lr': 1.8666666666666669e-06, 'samples': 3712, 'steps': 7, 'loss/train': 9.185944557189941} -09/20/2021 14:30:40 - INFO - __main__ - Step 117: {'lr': 1.8666666666666669e-06, 'samples': 3744, 'steps': 7, 'loss/train': 8.289783477783203} -09/20/2021 14:30:41 - INFO - __main__ - Step 118: {'lr': 1.8666666666666669e-06, 'samples': 3776, 'steps': 7, 'loss/train': 9.40110969543457} -09/20/2021 14:30:42 - INFO - __main__ - Step 119: {'lr': 1.8666666666666669e-06, 'samples': 3808, 'steps': 7, 'loss/train': 9.296404838562012} -09/20/2021 14:30:42 - INFO - __main__ - Step 120: {'lr': 1.8666666666666669e-06, 'samples': 3840, 'steps': 7, 'loss/train': 8.81103801727295} -09/20/2021 14:30:43 - INFO - __main__ - Step 121: {'lr': 1.8666666666666669e-06, 'samples': 3872, 'steps': 7, 'loss/train': 9.305680274963379} -09/20/2021 14:30:45 - INFO - __main__ - Step 122: {'lr': 1.8666666666666669e-06, 'samples': 3904, 'steps': 7, 'loss/train': 9.745590209960938} -09/20/2021 14:30:45 - INFO - __main__ - Step 123: {'lr': 1.8666666666666669e-06, 'samples': 3936, 'steps': 7, 'loss/train': 8.986610412597656} -09/20/2021 14:30:46 - INFO - __main__ - Step 124: {'lr': 1.8666666666666669e-06, 'samples': 3968, 'steps': 7, 'loss/train': 9.559576034545898} -09/20/2021 14:30:47 - INFO - __main__ - Step 125: {'lr': 1.8666666666666669e-06, 'samples': 4000, 'steps': 7, 'loss/train': 8.84313678741455} -09/20/2021 14:30:48 - INFO - __main__ - Step 126: {'lr': 1.8666666666666669e-06, 'samples': 4032, 'steps': 7, 'loss/train': 8.488707542419434} -09/20/2021 14:30:48 - INFO - __main__ - Step 127: {'lr': 1.8666666666666669e-06, 'samples': 4064, 'steps': 7, 'loss/train': 8.918740272521973} -09/20/2021 14:30:49 - INFO - __main__ - Step 128: {'lr': 1.8666666666666669e-06, 'samples': 4096, 'steps': 7, 'loss/train': 9.390033721923828} -09/20/2021 14:30:50 - INFO - __main__ - Step 129: {'lr': 2.1333333333333334e-06, 'samples': 4128, 'steps': 8, 'loss/train': 9.056205749511719} -09/20/2021 14:30:51 - INFO - __main__ - Step 130: {'lr': 2.1333333333333334e-06, 'samples': 4160, 'steps': 8, 'loss/train': 8.463839530944824} -09/20/2021 14:30:51 - INFO - __main__ - Step 131: {'lr': 2.1333333333333334e-06, 'samples': 4192, 'steps': 8, 'loss/train': 9.151128768920898} -09/20/2021 14:30:52 - INFO - __main__ - Step 132: {'lr': 2.1333333333333334e-06, 'samples': 4224, 'steps': 8, 'loss/train': 9.170570373535156} -09/20/2021 14:30:53 - INFO - __main__ - Step 133: {'lr': 2.1333333333333334e-06, 'samples': 4256, 'steps': 8, 'loss/train': 9.082758903503418} -09/20/2021 14:30:54 - INFO - __main__ - Step 134: {'lr': 2.1333333333333334e-06, 'samples': 4288, 'steps': 8, 'loss/train': 8.952345848083496} -09/20/2021 14:30:54 - INFO - __main__ - Step 135: {'lr': 2.1333333333333334e-06, 'samples': 4320, 'steps': 8, 'loss/train': 8.790618896484375} -09/20/2021 14:30:55 - INFO - __main__ - Step 136: {'lr': 2.1333333333333334e-06, 'samples': 4352, 'steps': 8, 'loss/train': 9.163252830505371} -09/20/2021 14:30:56 - INFO - __main__ - Step 137: {'lr': 2.1333333333333334e-06, 'samples': 4384, 'steps': 8, 'loss/train': 9.101499557495117} -09/20/2021 14:30:57 - INFO - __main__ - Step 138: {'lr': 2.1333333333333334e-06, 'samples': 4416, 'steps': 8, 'loss/train': 8.824095726013184} -09/20/2021 14:30:57 - INFO - __main__ - Step 139: {'lr': 2.1333333333333334e-06, 'samples': 4448, 'steps': 8, 'loss/train': 9.142293930053711} -09/20/2021 14:30:58 - INFO - __main__ - Step 140: {'lr': 2.1333333333333334e-06, 'samples': 4480, 'steps': 8, 'loss/train': 10.116113662719727} -09/20/2021 14:30:59 - INFO - __main__ - Step 141: {'lr': 2.1333333333333334e-06, 'samples': 4512, 'steps': 8, 'loss/train': 9.215624809265137} -09/20/2021 14:31:00 - INFO - __main__ - Step 142: {'lr': 2.1333333333333334e-06, 'samples': 4544, 'steps': 8, 'loss/train': 9.612702369689941} -09/20/2021 14:31:00 - INFO - __main__ - Step 143: {'lr': 2.1333333333333334e-06, 'samples': 4576, 'steps': 8, 'loss/train': 9.087225914001465} -09/20/2021 14:31:01 - INFO - __main__ - Step 144: {'lr': 2.1333333333333334e-06, 'samples': 4608, 'steps': 8, 'loss/train': 8.500539779663086} -09/20/2021 14:31:02 - INFO - __main__ - Step 145: {'lr': 2.4000000000000003e-06, 'samples': 4640, 'steps': 9, 'loss/train': 8.898508071899414} -09/20/2021 14:31:03 - INFO - __main__ - Step 146: {'lr': 2.4000000000000003e-06, 'samples': 4672, 'steps': 9, 'loss/train': 9.15835952758789} -09/20/2021 14:31:04 - INFO - __main__ - Step 147: {'lr': 2.4000000000000003e-06, 'samples': 4704, 'steps': 9, 'loss/train': 9.495782852172852} -09/20/2021 14:31:04 - INFO - __main__ - Step 148: {'lr': 2.4000000000000003e-06, 'samples': 4736, 'steps': 9, 'loss/train': 8.723994255065918} -09/20/2021 14:31:05 - INFO - __main__ - Step 149: {'lr': 2.4000000000000003e-06, 'samples': 4768, 'steps': 9, 'loss/train': 9.663128852844238} -09/20/2021 14:31:06 - INFO - __main__ - Step 150: {'lr': 2.4000000000000003e-06, 'samples': 4800, 'steps': 9, 'loss/train': 8.894539833068848} -09/20/2021 14:31:07 - INFO - __main__ - Step 151: {'lr': 2.4000000000000003e-06, 'samples': 4832, 'steps': 9, 'loss/train': 8.205784797668457} -09/20/2021 14:31:07 - INFO - __main__ - Step 152: {'lr': 2.4000000000000003e-06, 'samples': 4864, 'steps': 9, 'loss/train': 9.134984970092773} -09/20/2021 14:31:09 - INFO - __main__ - Step 153: {'lr': 2.4000000000000003e-06, 'samples': 4896, 'steps': 9, 'loss/train': 8.663310050964355} -09/20/2021 14:31:09 - INFO - __main__ - Step 154: {'lr': 2.4000000000000003e-06, 'samples': 4928, 'steps': 9, 'loss/train': 9.474404335021973} -09/20/2021 14:31:10 - INFO - __main__ - Step 155: {'lr': 2.4000000000000003e-06, 'samples': 4960, 'steps': 9, 'loss/train': 8.79813003540039} -09/20/2021 14:31:11 - INFO - __main__ - Step 156: {'lr': 2.4000000000000003e-06, 'samples': 4992, 'steps': 9, 'loss/train': 8.456768989562988} -09/20/2021 14:31:12 - INFO - __main__ - Step 157: {'lr': 2.4000000000000003e-06, 'samples': 5024, 'steps': 9, 'loss/train': 8.999434471130371} -09/20/2021 14:31:12 - INFO - __main__ - Step 158: {'lr': 2.4000000000000003e-06, 'samples': 5056, 'steps': 9, 'loss/train': 8.66516399383545} -09/20/2021 14:31:13 - INFO - __main__ - Step 159: {'lr': 2.4000000000000003e-06, 'samples': 5088, 'steps': 9, 'loss/train': 9.987896919250488} -09/20/2021 14:31:14 - INFO - __main__ - Step 160: {'lr': 2.4000000000000003e-06, 'samples': 5120, 'steps': 9, 'loss/train': 10.360553741455078} -09/20/2021 14:31:15 - INFO - __main__ - Step 161: {'lr': 2.666666666666667e-06, 'samples': 5152, 'steps': 10, 'loss/train': 10.1486234664917} -09/20/2021 14:31:16 - INFO - __main__ - Step 162: {'lr': 2.666666666666667e-06, 'samples': 5184, 'steps': 10, 'loss/train': 8.72321605682373} -09/20/2021 14:31:16 - INFO - __main__ - Step 163: {'lr': 2.666666666666667e-06, 'samples': 5216, 'steps': 10, 'loss/train': 8.840726852416992} -09/20/2021 14:31:17 - INFO - __main__ - Step 164: {'lr': 2.666666666666667e-06, 'samples': 5248, 'steps': 10, 'loss/train': 8.98475170135498} -09/20/2021 14:31:18 - INFO - __main__ - Step 165: {'lr': 2.666666666666667e-06, 'samples': 5280, 'steps': 10, 'loss/train': 10.165177345275879} -09/20/2021 14:31:19 - INFO - __main__ - Step 166: {'lr': 2.666666666666667e-06, 'samples': 5312, 'steps': 10, 'loss/train': 10.195971488952637} -09/20/2021 14:31:19 - INFO - __main__ - Step 167: {'lr': 2.666666666666667e-06, 'samples': 5344, 'steps': 10, 'loss/train': 9.792502403259277} -09/20/2021 14:31:20 - INFO - __main__ - Step 168: {'lr': 2.666666666666667e-06, 'samples': 5376, 'steps': 10, 'loss/train': 8.984392166137695} -09/20/2021 14:31:21 - INFO - __main__ - Step 169: {'lr': 2.666666666666667e-06, 'samples': 5408, 'steps': 10, 'loss/train': 8.13987922668457} -09/20/2021 14:31:22 - INFO - __main__ - Step 170: {'lr': 2.666666666666667e-06, 'samples': 5440, 'steps': 10, 'loss/train': 8.94565486907959} -09/20/2021 14:31:22 - INFO - __main__ - Step 171: {'lr': 2.666666666666667e-06, 'samples': 5472, 'steps': 10, 'loss/train': 9.066217422485352} -09/20/2021 14:31:23 - INFO - __main__ - Step 172: {'lr': 2.666666666666667e-06, 'samples': 5504, 'steps': 10, 'loss/train': 8.266522407531738} -09/20/2021 14:31:24 - INFO - __main__ - Step 173: {'lr': 2.666666666666667e-06, 'samples': 5536, 'steps': 10, 'loss/train': 8.597553253173828} -09/20/2021 14:31:25 - INFO - __main__ - Step 174: {'lr': 2.666666666666667e-06, 'samples': 5568, 'steps': 10, 'loss/train': 9.147146224975586} -09/20/2021 14:31:25 - INFO - __main__ - Step 175: {'lr': 2.666666666666667e-06, 'samples': 5600, 'steps': 10, 'loss/train': 8.968146324157715} -09/20/2021 14:31:26 - INFO - __main__ - Step 176: {'lr': 2.666666666666667e-06, 'samples': 5632, 'steps': 10, 'loss/train': 9.275249481201172} -09/20/2021 14:31:27 - INFO - __main__ - Step 177: {'lr': 2.9333333333333333e-06, 'samples': 5664, 'steps': 11, 'loss/train': 8.601914405822754} -09/20/2021 14:31:28 - INFO - __main__ - Step 178: {'lr': 2.9333333333333333e-06, 'samples': 5696, 'steps': 11, 'loss/train': 8.816274642944336} -09/20/2021 14:31:28 - INFO - __main__ - Step 179: {'lr': 2.9333333333333333e-06, 'samples': 5728, 'steps': 11, 'loss/train': 9.375834465026855} -09/20/2021 14:31:29 - INFO - __main__ - Step 180: {'lr': 2.9333333333333333e-06, 'samples': 5760, 'steps': 11, 'loss/train': 9.022726058959961} -09/20/2021 14:31:30 - INFO - __main__ - Step 181: {'lr': 2.9333333333333333e-06, 'samples': 5792, 'steps': 11, 'loss/train': 8.842888832092285} -09/20/2021 14:31:31 - INFO - __main__ - Step 182: {'lr': 2.9333333333333333e-06, 'samples': 5824, 'steps': 11, 'loss/train': 8.615532875061035} -09/20/2021 14:31:31 - INFO - __main__ - Step 183: {'lr': 2.9333333333333333e-06, 'samples': 5856, 'steps': 11, 'loss/train': 8.766458511352539} -09/20/2021 14:31:32 - INFO - __main__ - Step 184: {'lr': 2.9333333333333333e-06, 'samples': 5888, 'steps': 11, 'loss/train': 8.656167030334473} -09/20/2021 14:31:34 - INFO - __main__ - Step 185: {'lr': 2.9333333333333333e-06, 'samples': 5920, 'steps': 11, 'loss/train': 8.263057708740234} -09/20/2021 14:31:35 - INFO - __main__ - Step 186: {'lr': 2.9333333333333333e-06, 'samples': 5952, 'steps': 11, 'loss/train': 8.79660415649414} -09/20/2021 14:31:35 - INFO - __main__ - Step 187: {'lr': 2.9333333333333333e-06, 'samples': 5984, 'steps': 11, 'loss/train': 9.238103866577148} -09/20/2021 14:31:36 - INFO - __main__ - Step 188: {'lr': 2.9333333333333333e-06, 'samples': 6016, 'steps': 11, 'loss/train': 8.303010940551758} -09/20/2021 14:31:37 - INFO - __main__ - Step 189: {'lr': 2.9333333333333333e-06, 'samples': 6048, 'steps': 11, 'loss/train': 8.87806510925293} -09/20/2021 14:31:38 - INFO - __main__ - Step 190: {'lr': 2.9333333333333333e-06, 'samples': 6080, 'steps': 11, 'loss/train': 9.107654571533203} -09/20/2021 14:31:38 - INFO - __main__ - Step 191: {'lr': 2.9333333333333333e-06, 'samples': 6112, 'steps': 11, 'loss/train': 8.608586311340332} -09/20/2021 14:31:39 - INFO - __main__ - Step 192: {'lr': 2.9333333333333333e-06, 'samples': 6144, 'steps': 11, 'loss/train': 8.355098724365234} -09/20/2021 14:31:40 - INFO - __main__ - Step 193: {'lr': 3.2000000000000003e-06, 'samples': 6176, 'steps': 12, 'loss/train': 8.87690544128418} -09/20/2021 14:31:41 - INFO - __main__ - Step 194: {'lr': 3.2000000000000003e-06, 'samples': 6208, 'steps': 12, 'loss/train': 9.34322452545166} -09/20/2021 14:31:41 - INFO - __main__ - Step 195: {'lr': 3.2000000000000003e-06, 'samples': 6240, 'steps': 12, 'loss/train': 9.497793197631836} -09/20/2021 14:31:42 - INFO - __main__ - Step 196: {'lr': 3.2000000000000003e-06, 'samples': 6272, 'steps': 12, 'loss/train': 9.656044960021973} -09/20/2021 14:31:43 - INFO - __main__ - Step 197: {'lr': 3.2000000000000003e-06, 'samples': 6304, 'steps': 12, 'loss/train': 9.362903594970703} -09/20/2021 14:31:44 - INFO - __main__ - Step 198: {'lr': 3.2000000000000003e-06, 'samples': 6336, 'steps': 12, 'loss/train': 9.408992767333984} -09/20/2021 14:31:44 - INFO - __main__ - Step 199: {'lr': 3.2000000000000003e-06, 'samples': 6368, 'steps': 12, 'loss/train': 9.373254776000977} -09/20/2021 14:31:45 - INFO - __main__ - Step 200: {'lr': 3.2000000000000003e-06, 'samples': 6400, 'steps': 12, 'loss/train': 8.690385818481445} -09/20/2021 14:31:46 - INFO - __main__ - Step 201: {'lr': 3.2000000000000003e-06, 'samples': 6432, 'steps': 12, 'loss/train': 8.788789749145508} -09/20/2021 14:31:47 - INFO - __main__ - Step 202: {'lr': 3.2000000000000003e-06, 'samples': 6464, 'steps': 12, 'loss/train': 9.265264511108398} -09/20/2021 14:31:47 - INFO - __main__ - Step 203: {'lr': 3.2000000000000003e-06, 'samples': 6496, 'steps': 12, 'loss/train': 9.106616973876953} -09/20/2021 14:31:48 - INFO - __main__ - Step 204: {'lr': 3.2000000000000003e-06, 'samples': 6528, 'steps': 12, 'loss/train': 9.102849006652832} -09/20/2021 14:31:49 - INFO - __main__ - Step 205: {'lr': 3.2000000000000003e-06, 'samples': 6560, 'steps': 12, 'loss/train': 8.769621849060059} -09/20/2021 14:31:50 - INFO - __main__ - Step 206: {'lr': 3.2000000000000003e-06, 'samples': 6592, 'steps': 12, 'loss/train': 8.841911315917969} -09/20/2021 14:31:50 - INFO - __main__ - Step 207: {'lr': 3.2000000000000003e-06, 'samples': 6624, 'steps': 12, 'loss/train': 8.852032661437988} -09/20/2021 14:31:51 - INFO - __main__ - Step 208: {'lr': 3.2000000000000003e-06, 'samples': 6656, 'steps': 12, 'loss/train': 8.928462028503418} -09/20/2021 14:31:52 - INFO - __main__ - Step 209: {'lr': 3.466666666666667e-06, 'samples': 6688, 'steps': 13, 'loss/train': 8.366024017333984} -09/20/2021 14:31:53 - INFO - __main__ - Step 210: {'lr': 3.466666666666667e-06, 'samples': 6720, 'steps': 13, 'loss/train': 8.815940856933594} -09/20/2021 14:31:54 - INFO - __main__ - Step 211: {'lr': 3.466666666666667e-06, 'samples': 6752, 'steps': 13, 'loss/train': 9.064132690429688} -09/20/2021 14:31:54 - INFO - __main__ - Step 212: {'lr': 3.466666666666667e-06, 'samples': 6784, 'steps': 13, 'loss/train': 9.110072135925293} -09/20/2021 14:31:55 - INFO - __main__ - Step 213: {'lr': 3.466666666666667e-06, 'samples': 6816, 'steps': 13, 'loss/train': 8.382452011108398} -09/20/2021 14:31:56 - INFO - __main__ - Step 214: {'lr': 3.466666666666667e-06, 'samples': 6848, 'steps': 13, 'loss/train': 8.583623886108398} -09/20/2021 14:31:57 - INFO - __main__ - Step 215: {'lr': 3.466666666666667e-06, 'samples': 6880, 'steps': 13, 'loss/train': 8.573383331298828} -09/20/2021 14:31:58 - INFO - __main__ - Step 216: {'lr': 3.466666666666667e-06, 'samples': 6912, 'steps': 13, 'loss/train': 8.411163330078125} -09/20/2021 14:31:59 - INFO - __main__ - Step 217: {'lr': 3.466666666666667e-06, 'samples': 6944, 'steps': 13, 'loss/train': 8.663798332214355} -09/20/2021 14:32:00 - INFO - __main__ - Step 218: {'lr': 3.466666666666667e-06, 'samples': 6976, 'steps': 13, 'loss/train': 7.602853298187256} -09/20/2021 14:32:01 - INFO - __main__ - Step 219: {'lr': 3.466666666666667e-06, 'samples': 7008, 'steps': 13, 'loss/train': 8.659309387207031} -09/20/2021 14:32:01 - INFO - __main__ - Step 220: {'lr': 3.466666666666667e-06, 'samples': 7040, 'steps': 13, 'loss/train': 7.987866401672363} -09/20/2021 14:32:02 - INFO - __main__ - Step 221: {'lr': 3.466666666666667e-06, 'samples': 7072, 'steps': 13, 'loss/train': 8.941047668457031} -09/20/2021 14:32:03 - INFO - __main__ - Step 222: {'lr': 3.466666666666667e-06, 'samples': 7104, 'steps': 13, 'loss/train': 8.694915771484375} -09/20/2021 14:32:04 - INFO - __main__ - Step 223: {'lr': 3.466666666666667e-06, 'samples': 7136, 'steps': 13, 'loss/train': 8.689214706420898} -09/20/2021 14:32:04 - INFO - __main__ - Step 224: {'lr': 3.466666666666667e-06, 'samples': 7168, 'steps': 13, 'loss/train': 8.96923542022705} -09/20/2021 14:32:05 - INFO - __main__ - Step 225: {'lr': 3.7333333333333337e-06, 'samples': 7200, 'steps': 14, 'loss/train': 8.233803749084473} -09/20/2021 14:32:06 - INFO - __main__ - Step 226: {'lr': 3.7333333333333337e-06, 'samples': 7232, 'steps': 14, 'loss/train': 8.446198463439941} -09/20/2021 14:32:07 - INFO - __main__ - Step 227: {'lr': 3.7333333333333337e-06, 'samples': 7264, 'steps': 14, 'loss/train': 8.665852546691895} -09/20/2021 14:32:08 - INFO - __main__ - Step 228: {'lr': 3.7333333333333337e-06, 'samples': 7296, 'steps': 14, 'loss/train': 8.195846557617188} -09/20/2021 14:32:08 - INFO - __main__ - Step 229: {'lr': 3.7333333333333337e-06, 'samples': 7328, 'steps': 14, 'loss/train': 8.074995994567871} -09/20/2021 14:32:09 - INFO - __main__ - Step 230: {'lr': 3.7333333333333337e-06, 'samples': 7360, 'steps': 14, 'loss/train': 9.178439140319824} -09/20/2021 14:32:10 - INFO - __main__ - Step 231: {'lr': 3.7333333333333337e-06, 'samples': 7392, 'steps': 14, 'loss/train': 8.13422679901123} -09/20/2021 14:32:11 - INFO - __main__ - Step 232: {'lr': 3.7333333333333337e-06, 'samples': 7424, 'steps': 14, 'loss/train': 8.430084228515625} -09/20/2021 14:32:11 - INFO - __main__ - Step 233: {'lr': 3.7333333333333337e-06, 'samples': 7456, 'steps': 14, 'loss/train': 8.702278137207031} -09/20/2021 14:32:12 - INFO - __main__ - Step 234: {'lr': 3.7333333333333337e-06, 'samples': 7488, 'steps': 14, 'loss/train': 8.706531524658203} -09/20/2021 14:32:13 - INFO - __main__ - Step 235: {'lr': 3.7333333333333337e-06, 'samples': 7520, 'steps': 14, 'loss/train': 8.622607231140137} -09/20/2021 14:32:14 - INFO - __main__ - Step 236: {'lr': 3.7333333333333337e-06, 'samples': 7552, 'steps': 14, 'loss/train': 9.172739028930664} -09/20/2021 14:32:14 - INFO - __main__ - Step 237: {'lr': 3.7333333333333337e-06, 'samples': 7584, 'steps': 14, 'loss/train': 8.434710502624512} -09/20/2021 14:32:15 - INFO - __main__ - Step 238: {'lr': 3.7333333333333337e-06, 'samples': 7616, 'steps': 14, 'loss/train': 8.876091003417969} -09/20/2021 14:32:16 - INFO - __main__ - Step 239: {'lr': 3.7333333333333337e-06, 'samples': 7648, 'steps': 14, 'loss/train': 8.603859901428223} -09/20/2021 14:32:17 - INFO - __main__ - Step 240: {'lr': 3.7333333333333337e-06, 'samples': 7680, 'steps': 14, 'loss/train': 8.867888450622559} -09/20/2021 14:32:17 - INFO - __main__ - Step 241: {'lr': 4.000000000000001e-06, 'samples': 7712, 'steps': 15, 'loss/train': 8.376379013061523} -09/20/2021 14:32:18 - INFO - __main__ - Step 242: {'lr': 4.000000000000001e-06, 'samples': 7744, 'steps': 15, 'loss/train': 8.983189582824707} -09/20/2021 14:32:19 - INFO - __main__ - Step 243: {'lr': 4.000000000000001e-06, 'samples': 7776, 'steps': 15, 'loss/train': 8.112996101379395} -09/20/2021 14:32:20 - INFO - __main__ - Step 244: {'lr': 4.000000000000001e-06, 'samples': 7808, 'steps': 15, 'loss/train': 7.968819618225098} -09/20/2021 14:32:20 - INFO - __main__ - Step 245: {'lr': 4.000000000000001e-06, 'samples': 7840, 'steps': 15, 'loss/train': 9.07267951965332} -09/20/2021 14:32:22 - INFO - __main__ - Step 246: {'lr': 4.000000000000001e-06, 'samples': 7872, 'steps': 15, 'loss/train': 8.632586479187012} -09/20/2021 14:32:22 - INFO - __main__ - Step 247: {'lr': 4.000000000000001e-06, 'samples': 7904, 'steps': 15, 'loss/train': 8.060004234313965} -09/20/2021 14:32:23 - INFO - __main__ - Step 248: {'lr': 4.000000000000001e-06, 'samples': 7936, 'steps': 15, 'loss/train': 8.450980186462402} -09/20/2021 14:32:24 - INFO - __main__ - Step 249: {'lr': 4.000000000000001e-06, 'samples': 7968, 'steps': 15, 'loss/train': 8.683721542358398} -09/20/2021 14:32:25 - INFO - __main__ - Step 250: {'lr': 4.000000000000001e-06, 'samples': 8000, 'steps': 15, 'loss/train': 8.521979331970215} -09/20/2021 14:32:25 - INFO - __main__ - Step 251: {'lr': 4.000000000000001e-06, 'samples': 8032, 'steps': 15, 'loss/train': 8.868291854858398} -09/20/2021 14:32:26 - INFO - __main__ - Step 252: {'lr': 4.000000000000001e-06, 'samples': 8064, 'steps': 15, 'loss/train': 8.931967735290527} -09/20/2021 14:32:27 - INFO - __main__ - Step 253: {'lr': 4.000000000000001e-06, 'samples': 8096, 'steps': 15, 'loss/train': 8.304852485656738} -09/20/2021 14:32:28 - INFO - __main__ - Step 254: {'lr': 4.000000000000001e-06, 'samples': 8128, 'steps': 15, 'loss/train': 8.660804748535156} -09/20/2021 14:32:28 - INFO - __main__ - Step 255: {'lr': 4.000000000000001e-06, 'samples': 8160, 'steps': 15, 'loss/train': 8.367685317993164} -09/20/2021 14:32:29 - INFO - __main__ - Step 256: {'lr': 4.000000000000001e-06, 'samples': 8192, 'steps': 15, 'loss/train': 8.689079284667969} -09/20/2021 14:32:30 - INFO - __main__ - Step 257: {'lr': 4.266666666666667e-06, 'samples': 8224, 'steps': 16, 'loss/train': 8.291749000549316} -09/20/2021 14:32:31 - INFO - __main__ - Step 258: {'lr': 4.266666666666667e-06, 'samples': 8256, 'steps': 16, 'loss/train': 8.445318222045898} -09/20/2021 14:32:32 - INFO - __main__ - Step 259: {'lr': 4.266666666666667e-06, 'samples': 8288, 'steps': 16, 'loss/train': 7.47361946105957} -09/20/2021 14:32:32 - INFO - __main__ - Step 260: {'lr': 4.266666666666667e-06, 'samples': 8320, 'steps': 16, 'loss/train': 7.7060546875} -09/20/2021 14:32:33 - INFO - __main__ - Step 261: {'lr': 4.266666666666667e-06, 'samples': 8352, 'steps': 16, 'loss/train': 8.699097633361816} -09/20/2021 14:32:34 - INFO - __main__ - Step 262: {'lr': 4.266666666666667e-06, 'samples': 8384, 'steps': 16, 'loss/train': 8.997942924499512} -09/20/2021 14:32:35 - INFO - __main__ - Step 263: {'lr': 4.266666666666667e-06, 'samples': 8416, 'steps': 16, 'loss/train': 8.563644409179688} -09/20/2021 14:32:35 - INFO - __main__ - Step 264: {'lr': 4.266666666666667e-06, 'samples': 8448, 'steps': 16, 'loss/train': 8.52402400970459} -09/20/2021 14:32:36 - INFO - __main__ - Step 265: {'lr': 4.266666666666667e-06, 'samples': 8480, 'steps': 16, 'loss/train': 8.59157657623291} -09/20/2021 14:32:37 - INFO - __main__ - Step 266: {'lr': 4.266666666666667e-06, 'samples': 8512, 'steps': 16, 'loss/train': 9.02730941772461} -09/20/2021 14:32:38 - INFO - __main__ - Step 267: {'lr': 4.266666666666667e-06, 'samples': 8544, 'steps': 16, 'loss/train': 8.611414909362793} -09/20/2021 14:32:38 - INFO - __main__ - Step 268: {'lr': 4.266666666666667e-06, 'samples': 8576, 'steps': 16, 'loss/train': 8.606526374816895} -09/20/2021 14:32:39 - INFO - __main__ - Step 269: {'lr': 4.266666666666667e-06, 'samples': 8608, 'steps': 16, 'loss/train': 9.349578857421875} -09/20/2021 14:32:40 - INFO - __main__ - Step 270: {'lr': 4.266666666666667e-06, 'samples': 8640, 'steps': 16, 'loss/train': 8.48228931427002} -09/20/2021 14:32:41 - INFO - __main__ - Step 271: {'lr': 4.266666666666667e-06, 'samples': 8672, 'steps': 16, 'loss/train': 8.945440292358398} -09/20/2021 14:32:41 - INFO - __main__ - Step 272: {'lr': 4.266666666666667e-06, 'samples': 8704, 'steps': 16, 'loss/train': 8.172369956970215} -09/20/2021 14:32:42 - INFO - __main__ - Step 273: {'lr': 4.533333333333334e-06, 'samples': 8736, 'steps': 17, 'loss/train': 8.67249584197998} -09/20/2021 14:32:43 - INFO - __main__ - Step 274: {'lr': 4.533333333333334e-06, 'samples': 8768, 'steps': 17, 'loss/train': 8.854464530944824} -09/20/2021 14:32:44 - INFO - __main__ - Step 275: {'lr': 4.533333333333334e-06, 'samples': 8800, 'steps': 17, 'loss/train': 7.802404880523682} -09/20/2021 14:32:45 - INFO - __main__ - Step 276: {'lr': 4.533333333333334e-06, 'samples': 8832, 'steps': 17, 'loss/train': 8.723392486572266} -09/20/2021 14:32:46 - INFO - __main__ - Step 277: {'lr': 4.533333333333334e-06, 'samples': 8864, 'steps': 17, 'loss/train': 9.12875747680664} -09/20/2021 14:32:47 - INFO - __main__ - Step 278: {'lr': 4.533333333333334e-06, 'samples': 8896, 'steps': 17, 'loss/train': 8.52492904663086} -09/20/2021 14:32:47 - INFO - __main__ - Step 279: {'lr': 4.533333333333334e-06, 'samples': 8928, 'steps': 17, 'loss/train': 8.191666603088379} -09/20/2021 14:32:48 - INFO - __main__ - Step 280: {'lr': 4.533333333333334e-06, 'samples': 8960, 'steps': 17, 'loss/train': 8.180038452148438} -09/20/2021 14:32:49 - INFO - __main__ - Step 281: {'lr': 4.533333333333334e-06, 'samples': 8992, 'steps': 17, 'loss/train': 8.33659553527832} -09/20/2021 14:32:50 - INFO - __main__ - Step 282: {'lr': 4.533333333333334e-06, 'samples': 9024, 'steps': 17, 'loss/train': 8.380504608154297} -09/20/2021 14:32:50 - INFO - __main__ - Step 283: {'lr': 4.533333333333334e-06, 'samples': 9056, 'steps': 17, 'loss/train': 8.431884765625} -09/20/2021 14:32:51 - INFO - __main__ - Step 284: {'lr': 4.533333333333334e-06, 'samples': 9088, 'steps': 17, 'loss/train': 9.088956832885742} -09/20/2021 14:32:52 - INFO - __main__ - Step 285: {'lr': 4.533333333333334e-06, 'samples': 9120, 'steps': 17, 'loss/train': 8.294280052185059} -09/20/2021 14:32:53 - INFO - __main__ - Step 286: {'lr': 4.533333333333334e-06, 'samples': 9152, 'steps': 17, 'loss/train': 9.035836219787598} -09/20/2021 14:32:53 - INFO - __main__ - Step 287: {'lr': 4.533333333333334e-06, 'samples': 9184, 'steps': 17, 'loss/train': 8.32386302947998} -09/20/2021 14:32:54 - INFO - __main__ - Step 288: {'lr': 4.533333333333334e-06, 'samples': 9216, 'steps': 17, 'loss/train': 8.178072929382324} -09/20/2021 14:32:55 - INFO - __main__ - Step 289: {'lr': 4.800000000000001e-06, 'samples': 9248, 'steps': 18, 'loss/train': 8.364659309387207} -09/20/2021 14:32:56 - INFO - __main__ - Step 290: {'lr': 4.800000000000001e-06, 'samples': 9280, 'steps': 18, 'loss/train': 8.53239631652832} -09/20/2021 14:32:56 - INFO - __main__ - Step 291: {'lr': 4.800000000000001e-06, 'samples': 9312, 'steps': 18, 'loss/train': 8.941852569580078} -09/20/2021 14:32:57 - INFO - __main__ - Step 292: {'lr': 4.800000000000001e-06, 'samples': 9344, 'steps': 18, 'loss/train': 8.27403450012207} -09/20/2021 14:32:58 - INFO - __main__ - Step 293: {'lr': 4.800000000000001e-06, 'samples': 9376, 'steps': 18, 'loss/train': 8.341958045959473} -09/20/2021 14:32:59 - INFO - __main__ - Step 294: {'lr': 4.800000000000001e-06, 'samples': 9408, 'steps': 18, 'loss/train': 8.783493041992188} -09/20/2021 14:32:59 - INFO - __main__ - Step 295: {'lr': 4.800000000000001e-06, 'samples': 9440, 'steps': 18, 'loss/train': 8.28991985321045} -09/20/2021 14:33:00 - INFO - __main__ - Step 296: {'lr': 4.800000000000001e-06, 'samples': 9472, 'steps': 18, 'loss/train': 8.717666625976562} -09/20/2021 14:33:01 - INFO - __main__ - Step 297: {'lr': 4.800000000000001e-06, 'samples': 9504, 'steps': 18, 'loss/train': 8.224347114562988} -09/20/2021 14:33:02 - INFO - __main__ - Step 298: {'lr': 4.800000000000001e-06, 'samples': 9536, 'steps': 18, 'loss/train': 8.459529876708984} -09/20/2021 14:33:02 - INFO - __main__ - Step 299: {'lr': 4.800000000000001e-06, 'samples': 9568, 'steps': 18, 'loss/train': 8.414532661437988} -09/20/2021 14:33:03 - INFO - __main__ - Step 300: {'lr': 4.800000000000001e-06, 'samples': 9600, 'steps': 18, 'loss/train': 8.264294624328613} -09/20/2021 14:33:04 - INFO - __main__ - Step 301: {'lr': 4.800000000000001e-06, 'samples': 9632, 'steps': 18, 'loss/train': 8.166126251220703} -09/20/2021 14:33:05 - INFO - __main__ - Step 302: {'lr': 4.800000000000001e-06, 'samples': 9664, 'steps': 18, 'loss/train': 8.38692569732666} -09/20/2021 14:33:05 - INFO - __main__ - Step 303: {'lr': 4.800000000000001e-06, 'samples': 9696, 'steps': 18, 'loss/train': 8.629670143127441} -09/20/2021 14:33:06 - INFO - __main__ - Step 304: {'lr': 4.800000000000001e-06, 'samples': 9728, 'steps': 18, 'loss/train': 8.47204303741455} -09/20/2021 14:33:07 - INFO - __main__ - Step 305: {'lr': 5.066666666666667e-06, 'samples': 9760, 'steps': 19, 'loss/train': 8.487871170043945} -09/20/2021 14:33:08 - INFO - __main__ - Step 306: {'lr': 5.066666666666667e-06, 'samples': 9792, 'steps': 19, 'loss/train': 8.474513053894043} -09/20/2021 14:33:09 - INFO - __main__ - Step 307: {'lr': 5.066666666666667e-06, 'samples': 9824, 'steps': 19, 'loss/train': 8.702383041381836} -09/20/2021 14:33:10 - INFO - __main__ - Step 308: {'lr': 5.066666666666667e-06, 'samples': 9856, 'steps': 19, 'loss/train': 8.591322898864746} -09/20/2021 14:33:11 - INFO - __main__ - Step 309: {'lr': 5.066666666666667e-06, 'samples': 9888, 'steps': 19, 'loss/train': 7.8172454833984375} -09/20/2021 14:33:11 - INFO - __main__ - Step 310: {'lr': 5.066666666666667e-06, 'samples': 9920, 'steps': 19, 'loss/train': 8.515870094299316} -09/20/2021 14:33:12 - INFO - __main__ - Step 311: {'lr': 5.066666666666667e-06, 'samples': 9952, 'steps': 19, 'loss/train': 8.176741600036621} -09/20/2021 14:33:13 - INFO - __main__ - Step 312: {'lr': 5.066666666666667e-06, 'samples': 9984, 'steps': 19, 'loss/train': 8.62687873840332} -09/20/2021 14:33:14 - INFO - __main__ - Step 313: {'lr': 5.066666666666667e-06, 'samples': 10016, 'steps': 19, 'loss/train': 8.123113632202148} -09/20/2021 14:33:14 - INFO - __main__ - Step 314: {'lr': 5.066666666666667e-06, 'samples': 10048, 'steps': 19, 'loss/train': 9.251825332641602} -09/20/2021 14:33:15 - INFO - __main__ - Step 315: {'lr': 5.066666666666667e-06, 'samples': 10080, 'steps': 19, 'loss/train': 8.673247337341309} -09/20/2021 14:33:16 - INFO - __main__ - Step 316: {'lr': 5.066666666666667e-06, 'samples': 10112, 'steps': 19, 'loss/train': 8.73658561706543} -09/20/2021 14:33:17 - INFO - __main__ - Step 317: {'lr': 5.066666666666667e-06, 'samples': 10144, 'steps': 19, 'loss/train': 8.150056838989258} -09/20/2021 14:33:17 - INFO - __main__ - Step 318: {'lr': 5.066666666666667e-06, 'samples': 10176, 'steps': 19, 'loss/train': 8.768575668334961} -09/20/2021 14:33:18 - INFO - __main__ - Step 319: {'lr': 5.066666666666667e-06, 'samples': 10208, 'steps': 19, 'loss/train': 8.226738929748535} -09/20/2021 14:33:19 - INFO - __main__ - Step 320: {'lr': 5.066666666666667e-06, 'samples': 10240, 'steps': 19, 'loss/train': 8.476763725280762} -09/20/2021 14:33:20 - INFO - __main__ - Step 321: {'lr': 5.333333333333334e-06, 'samples': 10272, 'steps': 20, 'loss/train': 8.739855766296387} -09/20/2021 14:33:20 - INFO - __main__ - Step 322: {'lr': 5.333333333333334e-06, 'samples': 10304, 'steps': 20, 'loss/train': 8.142094612121582} -09/20/2021 14:33:21 - INFO - __main__ - Step 323: {'lr': 5.333333333333334e-06, 'samples': 10336, 'steps': 20, 'loss/train': 8.052844047546387} -09/20/2021 14:33:22 - INFO - __main__ - Step 324: {'lr': 5.333333333333334e-06, 'samples': 10368, 'steps': 20, 'loss/train': 8.558100700378418} -09/20/2021 14:33:23 - INFO - __main__ - Step 325: {'lr': 5.333333333333334e-06, 'samples': 10400, 'steps': 20, 'loss/train': 8.354575157165527} -09/20/2021 14:33:23 - INFO - __main__ - Step 326: {'lr': 5.333333333333334e-06, 'samples': 10432, 'steps': 20, 'loss/train': 8.589188575744629} -09/20/2021 14:33:24 - INFO - __main__ - Step 327: {'lr': 5.333333333333334e-06, 'samples': 10464, 'steps': 20, 'loss/train': 8.674665451049805} -09/20/2021 14:33:25 - INFO - __main__ - Step 328: {'lr': 5.333333333333334e-06, 'samples': 10496, 'steps': 20, 'loss/train': 8.909956932067871} -09/20/2021 14:33:26 - INFO - __main__ - Step 329: {'lr': 5.333333333333334e-06, 'samples': 10528, 'steps': 20, 'loss/train': 8.355966567993164} -09/20/2021 14:33:26 - INFO - __main__ - Step 330: {'lr': 5.333333333333334e-06, 'samples': 10560, 'steps': 20, 'loss/train': 8.676676750183105} -09/20/2021 14:33:27 - INFO - __main__ - Step 331: {'lr': 5.333333333333334e-06, 'samples': 10592, 'steps': 20, 'loss/train': 7.726262092590332} -09/20/2021 14:33:28 - INFO - __main__ - Step 332: {'lr': 5.333333333333334e-06, 'samples': 10624, 'steps': 20, 'loss/train': 8.478616714477539} -09/20/2021 14:33:29 - INFO - __main__ - Step 333: {'lr': 5.333333333333334e-06, 'samples': 10656, 'steps': 20, 'loss/train': 9.102471351623535} -09/20/2021 14:33:29 - INFO - __main__ - Step 334: {'lr': 5.333333333333334e-06, 'samples': 10688, 'steps': 20, 'loss/train': 8.264527320861816} -09/20/2021 14:33:30 - INFO - __main__ - Step 335: {'lr': 5.333333333333334e-06, 'samples': 10720, 'steps': 20, 'loss/train': 8.201118469238281} -09/20/2021 14:33:31 - INFO - __main__ - Step 336: {'lr': 5.333333333333334e-06, 'samples': 10752, 'steps': 20, 'loss/train': 8.85928726196289} -09/20/2021 14:33:32 - INFO - __main__ - Step 337: {'lr': 5.600000000000001e-06, 'samples': 10784, 'steps': 21, 'loss/train': 8.479593276977539} -09/20/2021 14:33:33 - INFO - __main__ - Step 338: {'lr': 5.600000000000001e-06, 'samples': 10816, 'steps': 21, 'loss/train': 9.214859008789062} -09/20/2021 14:33:34 - INFO - __main__ - Step 339: {'lr': 5.600000000000001e-06, 'samples': 10848, 'steps': 21, 'loss/train': 8.564558029174805} -09/20/2021 14:33:35 - INFO - __main__ - Step 340: {'lr': 5.600000000000001e-06, 'samples': 10880, 'steps': 21, 'loss/train': 9.13249683380127} -09/20/2021 14:33:35 - INFO - __main__ - Step 341: {'lr': 5.600000000000001e-06, 'samples': 10912, 'steps': 21, 'loss/train': 8.27839183807373} -09/20/2021 14:33:36 - INFO - __main__ - Step 342: {'lr': 5.600000000000001e-06, 'samples': 10944, 'steps': 21, 'loss/train': 8.609259605407715} -09/20/2021 14:33:37 - INFO - __main__ - Step 343: {'lr': 5.600000000000001e-06, 'samples': 10976, 'steps': 21, 'loss/train': 7.8586015701293945} -09/20/2021 14:33:38 - INFO - __main__ - Step 344: {'lr': 5.600000000000001e-06, 'samples': 11008, 'steps': 21, 'loss/train': 8.139322280883789} -09/20/2021 14:33:38 - INFO - __main__ - Step 345: {'lr': 5.600000000000001e-06, 'samples': 11040, 'steps': 21, 'loss/train': 8.515987396240234} -09/20/2021 14:33:39 - INFO - __main__ - Step 346: {'lr': 5.600000000000001e-06, 'samples': 11072, 'steps': 21, 'loss/train': 8.817667007446289} -09/20/2021 14:33:40 - INFO - __main__ - Step 347: {'lr': 5.600000000000001e-06, 'samples': 11104, 'steps': 21, 'loss/train': 8.328887939453125} -09/20/2021 14:33:41 - INFO - __main__ - Step 348: {'lr': 5.600000000000001e-06, 'samples': 11136, 'steps': 21, 'loss/train': 8.809547424316406} -09/20/2021 14:33:41 - INFO - __main__ - Step 349: {'lr': 5.600000000000001e-06, 'samples': 11168, 'steps': 21, 'loss/train': 8.047675132751465} -09/20/2021 14:33:42 - INFO - __main__ - Step 350: {'lr': 5.600000000000001e-06, 'samples': 11200, 'steps': 21, 'loss/train': 4.685243606567383} -09/20/2021 14:33:43 - INFO - __main__ - Step 351: {'lr': 5.600000000000001e-06, 'samples': 11232, 'steps': 21, 'loss/train': 8.096172332763672} -09/20/2021 14:33:44 - INFO - __main__ - Step 352: {'lr': 5.600000000000001e-06, 'samples': 11264, 'steps': 21, 'loss/train': 8.780291557312012} -09/20/2021 14:33:45 - INFO - __main__ - Step 353: {'lr': 5.866666666666667e-06, 'samples': 11296, 'steps': 22, 'loss/train': 8.625988006591797} -09/20/2021 14:33:45 - INFO - __main__ - Step 354: {'lr': 5.866666666666667e-06, 'samples': 11328, 'steps': 22, 'loss/train': 8.255498886108398} -09/20/2021 14:33:46 - INFO - __main__ - Step 355: {'lr': 5.866666666666667e-06, 'samples': 11360, 'steps': 22, 'loss/train': 8.279226303100586} -09/20/2021 14:33:47 - INFO - __main__ - Step 356: {'lr': 5.866666666666667e-06, 'samples': 11392, 'steps': 22, 'loss/train': 8.247941970825195} -09/20/2021 14:33:48 - INFO - __main__ - Step 357: {'lr': 5.866666666666667e-06, 'samples': 11424, 'steps': 22, 'loss/train': 8.120832443237305} -09/20/2021 14:33:48 - INFO - __main__ - Step 358: {'lr': 5.866666666666667e-06, 'samples': 11456, 'steps': 22, 'loss/train': 8.299846649169922} -09/20/2021 14:33:49 - INFO - __main__ - Step 359: {'lr': 5.866666666666667e-06, 'samples': 11488, 'steps': 22, 'loss/train': 8.057741165161133} -09/20/2021 14:33:50 - INFO - __main__ - Step 360: {'lr': 5.866666666666667e-06, 'samples': 11520, 'steps': 22, 'loss/train': 8.381936073303223} -09/20/2021 14:33:51 - INFO - __main__ - Step 361: {'lr': 5.866666666666667e-06, 'samples': 11552, 'steps': 22, 'loss/train': 8.423482894897461} -09/20/2021 14:33:51 - INFO - __main__ - Step 362: {'lr': 5.866666666666667e-06, 'samples': 11584, 'steps': 22, 'loss/train': 8.472229957580566} -09/20/2021 14:33:52 - INFO - __main__ - Step 363: {'lr': 5.866666666666667e-06, 'samples': 11616, 'steps': 22, 'loss/train': 8.171797752380371} -09/20/2021 14:33:53 - INFO - __main__ - Step 364: {'lr': 5.866666666666667e-06, 'samples': 11648, 'steps': 22, 'loss/train': 8.24300479888916} -09/20/2021 14:33:54 - INFO - __main__ - Step 365: {'lr': 5.866666666666667e-06, 'samples': 11680, 'steps': 22, 'loss/train': 8.768223762512207} -09/20/2021 14:33:54 - INFO - __main__ - Step 366: {'lr': 5.866666666666667e-06, 'samples': 11712, 'steps': 22, 'loss/train': 8.46615982055664} -09/20/2021 14:33:55 - INFO - __main__ - Step 367: {'lr': 5.866666666666667e-06, 'samples': 11744, 'steps': 22, 'loss/train': 8.236011505126953} -09/20/2021 14:33:56 - INFO - __main__ - Step 368: {'lr': 5.866666666666667e-06, 'samples': 11776, 'steps': 22, 'loss/train': 9.111892700195312} -09/20/2021 14:33:57 - INFO - __main__ - Step 369: {'lr': 6.133333333333334e-06, 'samples': 11808, 'steps': 23, 'loss/train': 8.470428466796875} -09/20/2021 14:33:58 - INFO - __main__ - Step 370: {'lr': 6.133333333333334e-06, 'samples': 11840, 'steps': 23, 'loss/train': 8.278343200683594} -09/20/2021 14:33:59 - INFO - __main__ - Step 371: {'lr': 6.133333333333334e-06, 'samples': 11872, 'steps': 23, 'loss/train': 8.43584156036377} -09/20/2021 14:34:00 - INFO - __main__ - Step 372: {'lr': 6.133333333333334e-06, 'samples': 11904, 'steps': 23, 'loss/train': 7.475155830383301} -09/20/2021 14:34:00 - INFO - __main__ - Step 373: {'lr': 6.133333333333334e-06, 'samples': 11936, 'steps': 23, 'loss/train': 8.12746810913086} -09/20/2021 14:34:01 - INFO - __main__ - Step 374: {'lr': 6.133333333333334e-06, 'samples': 11968, 'steps': 23, 'loss/train': 8.410913467407227} -09/20/2021 14:34:02 - INFO - __main__ - Step 375: {'lr': 6.133333333333334e-06, 'samples': 12000, 'steps': 23, 'loss/train': 7.971593379974365} -09/20/2021 14:34:03 - INFO - __main__ - Step 376: {'lr': 6.133333333333334e-06, 'samples': 12032, 'steps': 23, 'loss/train': 8.168719291687012} -09/20/2021 14:34:03 - INFO - __main__ - Step 377: {'lr': 6.133333333333334e-06, 'samples': 12064, 'steps': 23, 'loss/train': 8.627043724060059} -09/20/2021 14:34:04 - INFO - __main__ - Step 378: {'lr': 6.133333333333334e-06, 'samples': 12096, 'steps': 23, 'loss/train': 7.981350898742676} -09/20/2021 14:34:05 - INFO - __main__ - Step 379: {'lr': 6.133333333333334e-06, 'samples': 12128, 'steps': 23, 'loss/train': 8.996005058288574} -09/20/2021 14:34:06 - INFO - __main__ - Step 380: {'lr': 6.133333333333334e-06, 'samples': 12160, 'steps': 23, 'loss/train': 8.431379318237305} -09/20/2021 14:34:06 - INFO - __main__ - Step 381: {'lr': 6.133333333333334e-06, 'samples': 12192, 'steps': 23, 'loss/train': 8.818727493286133} -09/20/2021 14:34:07 - INFO - __main__ - Step 382: {'lr': 6.133333333333334e-06, 'samples': 12224, 'steps': 23, 'loss/train': 8.895380020141602} -09/20/2021 14:34:08 - INFO - __main__ - Step 383: {'lr': 6.133333333333334e-06, 'samples': 12256, 'steps': 23, 'loss/train': 8.549541473388672} -09/20/2021 14:34:09 - INFO - __main__ - Step 384: {'lr': 6.133333333333334e-06, 'samples': 12288, 'steps': 23, 'loss/train': 8.695388793945312} -09/20/2021 14:34:09 - INFO - __main__ - Step 385: {'lr': 6.4000000000000006e-06, 'samples': 12320, 'steps': 24, 'loss/train': 8.198637008666992} -09/20/2021 14:34:10 - INFO - __main__ - Step 386: {'lr': 6.4000000000000006e-06, 'samples': 12352, 'steps': 24, 'loss/train': 8.039265632629395} -09/20/2021 14:34:11 - INFO - __main__ - Step 387: {'lr': 6.4000000000000006e-06, 'samples': 12384, 'steps': 24, 'loss/train': 9.498437881469727} -09/20/2021 14:34:12 - INFO - __main__ - Step 388: {'lr': 6.4000000000000006e-06, 'samples': 12416, 'steps': 24, 'loss/train': 8.016845703125} -09/20/2021 14:34:12 - INFO - __main__ - Step 389: {'lr': 6.4000000000000006e-06, 'samples': 12448, 'steps': 24, 'loss/train': 8.611960411071777} -09/20/2021 14:34:13 - INFO - __main__ - Step 390: {'lr': 6.4000000000000006e-06, 'samples': 12480, 'steps': 24, 'loss/train': 7.852954387664795} -09/20/2021 14:34:14 - INFO - __main__ - Step 391: {'lr': 6.4000000000000006e-06, 'samples': 12512, 'steps': 24, 'loss/train': 8.23727035522461} -09/20/2021 14:34:15 - INFO - __main__ - Step 392: {'lr': 6.4000000000000006e-06, 'samples': 12544, 'steps': 24, 'loss/train': 8.428350448608398} -09/20/2021 14:34:15 - INFO - __main__ - Step 393: {'lr': 6.4000000000000006e-06, 'samples': 12576, 'steps': 24, 'loss/train': 7.881124973297119} -09/20/2021 14:34:16 - INFO - __main__ - Step 394: {'lr': 6.4000000000000006e-06, 'samples': 12608, 'steps': 24, 'loss/train': 8.210144996643066} -09/20/2021 14:34:17 - INFO - __main__ - Step 395: {'lr': 6.4000000000000006e-06, 'samples': 12640, 'steps': 24, 'loss/train': 8.723416328430176} -09/20/2021 14:34:18 - INFO - __main__ - Step 396: {'lr': 6.4000000000000006e-06, 'samples': 12672, 'steps': 24, 'loss/train': 7.735273361206055} -09/20/2021 14:34:18 - INFO - __main__ - Step 397: {'lr': 6.4000000000000006e-06, 'samples': 12704, 'steps': 24, 'loss/train': 8.016125679016113} -09/20/2021 14:34:19 - INFO - __main__ - Step 398: {'lr': 6.4000000000000006e-06, 'samples': 12736, 'steps': 24, 'loss/train': 7.692718982696533} -09/20/2021 14:34:20 - INFO - __main__ - Step 399: {'lr': 6.4000000000000006e-06, 'samples': 12768, 'steps': 24, 'loss/train': 9.064533233642578} -09/20/2021 14:34:21 - INFO - __main__ - Step 400: {'lr': 6.4000000000000006e-06, 'samples': 12800, 'steps': 24, 'loss/train': 8.269723892211914} -09/20/2021 14:34:22 - INFO - __main__ - Step 401: {'lr': 6.666666666666667e-06, 'samples': 12832, 'steps': 25, 'loss/train': 8.328325271606445} -09/20/2021 14:34:23 - INFO - __main__ - Step 402: {'lr': 6.666666666666667e-06, 'samples': 12864, 'steps': 25, 'loss/train': 8.385189056396484} -09/20/2021 14:34:24 - INFO - __main__ - Step 403: {'lr': 6.666666666666667e-06, 'samples': 12896, 'steps': 25, 'loss/train': 7.729237079620361} -09/20/2021 14:34:25 - INFO - __main__ - Step 404: {'lr': 6.666666666666667e-06, 'samples': 12928, 'steps': 25, 'loss/train': 8.172588348388672} -09/20/2021 14:34:25 - INFO - __main__ - Step 405: {'lr': 6.666666666666667e-06, 'samples': 12960, 'steps': 25, 'loss/train': 8.11401653289795} -09/20/2021 14:34:26 - INFO - __main__ - Step 406: {'lr': 6.666666666666667e-06, 'samples': 12992, 'steps': 25, 'loss/train': 8.354430198669434} -09/20/2021 14:34:27 - INFO - __main__ - Step 407: {'lr': 6.666666666666667e-06, 'samples': 13024, 'steps': 25, 'loss/train': 8.509937286376953} -09/20/2021 14:34:28 - INFO - __main__ - Step 408: {'lr': 6.666666666666667e-06, 'samples': 13056, 'steps': 25, 'loss/train': 8.434226036071777} -09/20/2021 14:34:28 - INFO - __main__ - Step 409: {'lr': 6.666666666666667e-06, 'samples': 13088, 'steps': 25, 'loss/train': 7.878507614135742} -09/20/2021 14:34:29 - INFO - __main__ - Step 410: {'lr': 6.666666666666667e-06, 'samples': 13120, 'steps': 25, 'loss/train': 8.508771896362305} -09/20/2021 14:34:30 - INFO - __main__ - Step 411: {'lr': 6.666666666666667e-06, 'samples': 13152, 'steps': 25, 'loss/train': 8.115318298339844} -09/20/2021 14:34:31 - INFO - __main__ - Step 412: {'lr': 6.666666666666667e-06, 'samples': 13184, 'steps': 25, 'loss/train': 8.135350227355957} -09/20/2021 14:34:31 - INFO - __main__ - Step 413: {'lr': 6.666666666666667e-06, 'samples': 13216, 'steps': 25, 'loss/train': 8.060239791870117} -09/20/2021 14:34:32 - INFO - __main__ - Step 414: {'lr': 6.666666666666667e-06, 'samples': 13248, 'steps': 25, 'loss/train': 8.196454048156738} -09/20/2021 14:34:33 - INFO - __main__ - Step 415: {'lr': 6.666666666666667e-06, 'samples': 13280, 'steps': 25, 'loss/train': 8.387123107910156} -09/20/2021 14:34:34 - INFO - __main__ - Step 416: {'lr': 6.666666666666667e-06, 'samples': 13312, 'steps': 25, 'loss/train': 7.7477126121521} -09/20/2021 14:34:35 - INFO - __main__ - Step 417: {'lr': 6.933333333333334e-06, 'samples': 13344, 'steps': 26, 'loss/train': 8.117823600769043} -09/20/2021 14:34:35 - INFO - __main__ - Step 418: {'lr': 6.933333333333334e-06, 'samples': 13376, 'steps': 26, 'loss/train': 8.00882339477539} -09/20/2021 14:34:36 - INFO - __main__ - Step 419: {'lr': 6.933333333333334e-06, 'samples': 13408, 'steps': 26, 'loss/train': 8.396756172180176} -09/20/2021 14:34:37 - INFO - __main__ - Step 420: {'lr': 6.933333333333334e-06, 'samples': 13440, 'steps': 26, 'loss/train': 8.665587425231934} -09/20/2021 14:34:38 - INFO - __main__ - Step 421: {'lr': 6.933333333333334e-06, 'samples': 13472, 'steps': 26, 'loss/train': 8.878520965576172} -09/20/2021 14:34:38 - INFO - __main__ - Step 422: {'lr': 6.933333333333334e-06, 'samples': 13504, 'steps': 26, 'loss/train': 8.00115966796875} -09/20/2021 14:34:39 - INFO - __main__ - Step 423: {'lr': 6.933333333333334e-06, 'samples': 13536, 'steps': 26, 'loss/train': 8.394485473632812} -09/20/2021 14:34:40 - INFO - __main__ - Step 424: {'lr': 6.933333333333334e-06, 'samples': 13568, 'steps': 26, 'loss/train': 8.606280326843262} -09/20/2021 14:34:41 - INFO - __main__ - Step 425: {'lr': 6.933333333333334e-06, 'samples': 13600, 'steps': 26, 'loss/train': 7.713921546936035} -09/20/2021 14:34:41 - INFO - __main__ - Step 426: {'lr': 6.933333333333334e-06, 'samples': 13632, 'steps': 26, 'loss/train': 7.972832202911377} -09/20/2021 14:34:42 - INFO - __main__ - Step 427: {'lr': 6.933333333333334e-06, 'samples': 13664, 'steps': 26, 'loss/train': 8.371808052062988} -09/20/2021 14:34:43 - INFO - __main__ - Step 428: {'lr': 6.933333333333334e-06, 'samples': 13696, 'steps': 26, 'loss/train': 9.563541412353516} -09/20/2021 14:34:44 - INFO - __main__ - Step 429: {'lr': 6.933333333333334e-06, 'samples': 13728, 'steps': 26, 'loss/train': 8.769476890563965} -09/20/2021 14:34:44 - INFO - __main__ - Step 430: {'lr': 6.933333333333334e-06, 'samples': 13760, 'steps': 26, 'loss/train': 8.472738265991211} -09/20/2021 14:34:45 - INFO - __main__ - Step 431: {'lr': 6.933333333333334e-06, 'samples': 13792, 'steps': 26, 'loss/train': 8.31693172454834} -09/20/2021 14:34:46 - INFO - __main__ - Step 432: {'lr': 6.933333333333334e-06, 'samples': 13824, 'steps': 26, 'loss/train': 8.549546241760254} -09/20/2021 14:34:47 - INFO - __main__ - Step 433: {'lr': 7.2e-06, 'samples': 13856, 'steps': 27, 'loss/train': 8.400809288024902} -09/20/2021 14:34:48 - INFO - __main__ - Step 434: {'lr': 7.2e-06, 'samples': 13888, 'steps': 27, 'loss/train': 8.292486190795898} -09/20/2021 14:34:49 - INFO - __main__ - Step 435: {'lr': 7.2e-06, 'samples': 13920, 'steps': 27, 'loss/train': 8.464280128479004} -09/20/2021 14:34:50 - INFO - __main__ - Step 436: {'lr': 7.2e-06, 'samples': 13952, 'steps': 27, 'loss/train': 7.918385982513428} -09/20/2021 14:34:50 - INFO - __main__ - Step 437: {'lr': 7.2e-06, 'samples': 13984, 'steps': 27, 'loss/train': 8.360090255737305} -09/20/2021 14:34:51 - INFO - __main__ - Step 438: {'lr': 7.2e-06, 'samples': 14016, 'steps': 27, 'loss/train': 7.759614944458008} -09/20/2021 14:34:52 - INFO - __main__ - Step 439: {'lr': 7.2e-06, 'samples': 14048, 'steps': 27, 'loss/train': 7.8694167137146} -09/20/2021 14:34:53 - INFO - __main__ - Step 440: {'lr': 7.2e-06, 'samples': 14080, 'steps': 27, 'loss/train': 7.899783134460449} -09/20/2021 14:34:53 - INFO - __main__ - Step 441: {'lr': 7.2e-06, 'samples': 14112, 'steps': 27, 'loss/train': 9.043051719665527} -09/20/2021 14:34:54 - INFO - __main__ - Step 442: {'lr': 7.2e-06, 'samples': 14144, 'steps': 27, 'loss/train': 8.599621772766113} -09/20/2021 14:34:55 - INFO - __main__ - Step 443: {'lr': 7.2e-06, 'samples': 14176, 'steps': 27, 'loss/train': 8.28348159790039} -09/20/2021 14:34:56 - INFO - __main__ - Step 444: {'lr': 7.2e-06, 'samples': 14208, 'steps': 27, 'loss/train': 7.950743675231934} -09/20/2021 14:34:56 - INFO - __main__ - Step 445: {'lr': 7.2e-06, 'samples': 14240, 'steps': 27, 'loss/train': 8.788931846618652} -09/20/2021 14:34:57 - INFO - __main__ - Step 446: {'lr': 7.2e-06, 'samples': 14272, 'steps': 27, 'loss/train': 7.021113395690918} -09/20/2021 14:34:58 - INFO - __main__ - Step 447: {'lr': 7.2e-06, 'samples': 14304, 'steps': 27, 'loss/train': 7.782106399536133} -09/20/2021 14:34:59 - INFO - __main__ - Step 448: {'lr': 7.2e-06, 'samples': 14336, 'steps': 27, 'loss/train': 8.295174598693848} -09/20/2021 14:34:59 - INFO - __main__ - Step 449: {'lr': 7.4666666666666675e-06, 'samples': 14368, 'steps': 28, 'loss/train': 8.030996322631836} -09/20/2021 14:35:00 - INFO - __main__ - Step 450: {'lr': 7.4666666666666675e-06, 'samples': 14400, 'steps': 28, 'loss/train': 8.738828659057617} -09/20/2021 14:35:01 - INFO - __main__ - Step 451: {'lr': 7.4666666666666675e-06, 'samples': 14432, 'steps': 28, 'loss/train': 8.022795677185059} -09/20/2021 14:35:02 - INFO - __main__ - Step 452: {'lr': 7.4666666666666675e-06, 'samples': 14464, 'steps': 28, 'loss/train': 9.244338035583496} -09/20/2021 14:35:02 - INFO - __main__ - Step 453: {'lr': 7.4666666666666675e-06, 'samples': 14496, 'steps': 28, 'loss/train': 8.203726768493652} -09/20/2021 14:35:03 - INFO - __main__ - Step 454: {'lr': 7.4666666666666675e-06, 'samples': 14528, 'steps': 28, 'loss/train': 8.976649284362793} -09/20/2021 14:35:04 - INFO - __main__ - Step 455: {'lr': 7.4666666666666675e-06, 'samples': 14560, 'steps': 28, 'loss/train': 8.62191390991211} -09/20/2021 14:35:05 - INFO - __main__ - Step 456: {'lr': 7.4666666666666675e-06, 'samples': 14592, 'steps': 28, 'loss/train': 9.046412467956543} -09/20/2021 14:35:05 - INFO - __main__ - Step 457: {'lr': 7.4666666666666675e-06, 'samples': 14624, 'steps': 28, 'loss/train': 7.672607898712158} -09/20/2021 14:35:06 - INFO - __main__ - Step 458: {'lr': 7.4666666666666675e-06, 'samples': 14656, 'steps': 28, 'loss/train': 8.199907302856445} -09/20/2021 14:35:07 - INFO - __main__ - Step 459: {'lr': 7.4666666666666675e-06, 'samples': 14688, 'steps': 28, 'loss/train': 8.235876083374023} -09/20/2021 14:35:08 - INFO - __main__ - Step 460: {'lr': 7.4666666666666675e-06, 'samples': 14720, 'steps': 28, 'loss/train': 8.451045989990234} -09/20/2021 14:35:08 - INFO - __main__ - Step 461: {'lr': 7.4666666666666675e-06, 'samples': 14752, 'steps': 28, 'loss/train': 8.916824340820312} -09/20/2021 14:35:10 - INFO - __main__ - Step 462: {'lr': 7.4666666666666675e-06, 'samples': 14784, 'steps': 28, 'loss/train': 8.333792686462402} -09/20/2021 14:35:11 - INFO - __main__ - Step 463: {'lr': 7.4666666666666675e-06, 'samples': 14816, 'steps': 28, 'loss/train': 8.420090675354004} -09/20/2021 14:35:12 - INFO - __main__ - Step 464: {'lr': 7.4666666666666675e-06, 'samples': 14848, 'steps': 28, 'loss/train': 7.639708995819092} -09/20/2021 14:35:12 - INFO - __main__ - Step 465: {'lr': 7.733333333333334e-06, 'samples': 14880, 'steps': 29, 'loss/train': 7.9451398849487305} -09/20/2021 14:35:13 - INFO - __main__ - Step 466: {'lr': 7.733333333333334e-06, 'samples': 14912, 'steps': 29, 'loss/train': 8.604597091674805} -09/20/2021 14:35:14 - INFO - __main__ - Step 467: {'lr': 7.733333333333334e-06, 'samples': 14944, 'steps': 29, 'loss/train': 8.254790306091309} -09/20/2021 14:35:15 - INFO - __main__ - Step 468: {'lr': 7.733333333333334e-06, 'samples': 14976, 'steps': 29, 'loss/train': 8.254915237426758} -09/20/2021 14:35:15 - INFO - __main__ - Step 469: {'lr': 7.733333333333334e-06, 'samples': 15008, 'steps': 29, 'loss/train': 8.341948509216309} -09/20/2021 14:35:16 - INFO - __main__ - Step 470: {'lr': 7.733333333333334e-06, 'samples': 15040, 'steps': 29, 'loss/train': 7.912728786468506} -09/20/2021 14:35:17 - INFO - __main__ - Step 471: {'lr': 7.733333333333334e-06, 'samples': 15072, 'steps': 29, 'loss/train': 8.326970100402832} -09/20/2021 14:35:18 - INFO - __main__ - Step 472: {'lr': 7.733333333333334e-06, 'samples': 15104, 'steps': 29, 'loss/train': 8.139504432678223} -09/20/2021 14:35:18 - INFO - __main__ - Step 473: {'lr': 7.733333333333334e-06, 'samples': 15136, 'steps': 29, 'loss/train': 8.804084777832031} -09/20/2021 14:35:19 - INFO - __main__ - Step 474: {'lr': 7.733333333333334e-06, 'samples': 15168, 'steps': 29, 'loss/train': 7.852630615234375} -09/20/2021 14:35:20 - INFO - __main__ - Step 475: {'lr': 7.733333333333334e-06, 'samples': 15200, 'steps': 29, 'loss/train': 8.385689735412598} -09/20/2021 14:35:21 - INFO - __main__ - Step 476: {'lr': 7.733333333333334e-06, 'samples': 15232, 'steps': 29, 'loss/train': 8.339958190917969} -09/20/2021 14:35:21 - INFO - __main__ - Step 477: {'lr': 7.733333333333334e-06, 'samples': 15264, 'steps': 29, 'loss/train': 9.15561294555664} -09/20/2021 14:35:22 - INFO - __main__ - Step 478: {'lr': 7.733333333333334e-06, 'samples': 15296, 'steps': 29, 'loss/train': 8.212031364440918} -09/20/2021 14:35:23 - INFO - __main__ - Step 479: {'lr': 7.733333333333334e-06, 'samples': 15328, 'steps': 29, 'loss/train': 8.480957984924316} -09/20/2021 14:35:24 - INFO - __main__ - Step 480: {'lr': 7.733333333333334e-06, 'samples': 15360, 'steps': 29, 'loss/train': 7.761654853820801} -09/20/2021 14:35:25 - INFO - __main__ - Step 481: {'lr': 8.000000000000001e-06, 'samples': 15392, 'steps': 30, 'loss/train': 8.667594909667969} -09/20/2021 14:35:25 - INFO - __main__ - Step 482: {'lr': 8.000000000000001e-06, 'samples': 15424, 'steps': 30, 'loss/train': 9.002825736999512} -09/20/2021 14:35:26 - INFO - __main__ - Step 483: {'lr': 8.000000000000001e-06, 'samples': 15456, 'steps': 30, 'loss/train': 8.651888847351074} -09/20/2021 14:35:27 - INFO - __main__ - Step 484: {'lr': 8.000000000000001e-06, 'samples': 15488, 'steps': 30, 'loss/train': 8.545669555664062} -09/20/2021 14:35:28 - INFO - __main__ - Step 485: {'lr': 8.000000000000001e-06, 'samples': 15520, 'steps': 30, 'loss/train': 8.601860046386719} -09/20/2021 14:35:28 - INFO - __main__ - Step 486: {'lr': 8.000000000000001e-06, 'samples': 15552, 'steps': 30, 'loss/train': 8.233880996704102} -09/20/2021 14:35:29 - INFO - __main__ - Step 487: {'lr': 8.000000000000001e-06, 'samples': 15584, 'steps': 30, 'loss/train': 8.150875091552734} -09/20/2021 14:35:30 - INFO - __main__ - Step 488: {'lr': 8.000000000000001e-06, 'samples': 15616, 'steps': 30, 'loss/train': 7.9031219482421875} -09/20/2021 14:35:31 - INFO - __main__ - Step 489: {'lr': 8.000000000000001e-06, 'samples': 15648, 'steps': 30, 'loss/train': 8.302803039550781} -09/20/2021 14:35:31 - INFO - __main__ - Step 490: {'lr': 8.000000000000001e-06, 'samples': 15680, 'steps': 30, 'loss/train': 7.920206546783447} -09/20/2021 14:35:32 - INFO - __main__ - Step 491: {'lr': 8.000000000000001e-06, 'samples': 15712, 'steps': 30, 'loss/train': 8.270291328430176} -09/20/2021 14:35:33 - INFO - __main__ - Step 492: {'lr': 8.000000000000001e-06, 'samples': 15744, 'steps': 30, 'loss/train': 9.063586235046387} -09/20/2021 14:35:34 - INFO - __main__ - Step 493: {'lr': 8.000000000000001e-06, 'samples': 15776, 'steps': 30, 'loss/train': 8.07690715789795} -09/20/2021 14:35:34 - INFO - __main__ - Step 494: {'lr': 8.000000000000001e-06, 'samples': 15808, 'steps': 30, 'loss/train': 8.41173267364502} -09/20/2021 14:35:36 - INFO - __main__ - Step 495: {'lr': 8.000000000000001e-06, 'samples': 15840, 'steps': 30, 'loss/train': 7.231734275817871} -09/20/2021 14:35:36 - INFO - __main__ - Step 496: {'lr': 8.000000000000001e-06, 'samples': 15872, 'steps': 30, 'loss/train': 8.984804153442383} -09/20/2021 14:35:37 - INFO - __main__ - Step 497: {'lr': 8.266666666666667e-06, 'samples': 15904, 'steps': 31, 'loss/train': 8.020291328430176} -09/20/2021 14:35:38 - INFO - __main__ - Step 498: {'lr': 8.266666666666667e-06, 'samples': 15936, 'steps': 31, 'loss/train': 7.670291900634766} -09/20/2021 14:35:39 - INFO - __main__ - Step 499: {'lr': 8.266666666666667e-06, 'samples': 15968, 'steps': 31, 'loss/train': 7.991480827331543} -09/20/2021 14:35:40 - INFO - __main__ - Step 500: {'lr': 8.266666666666667e-06, 'samples': 16000, 'steps': 31, 'loss/train': 8.749967575073242} -09/20/2021 14:35:40 - INFO - __main__ - Step 501: {'lr': 8.266666666666667e-06, 'samples': 16032, 'steps': 31, 'loss/train': 8.080130577087402} -09/20/2021 14:35:41 - INFO - __main__ - Step 502: {'lr': 8.266666666666667e-06, 'samples': 16064, 'steps': 31, 'loss/train': 7.747565269470215} -09/20/2021 14:35:42 - INFO - __main__ - Step 503: {'lr': 8.266666666666667e-06, 'samples': 16096, 'steps': 31, 'loss/train': 8.732550621032715} -09/20/2021 14:35:43 - INFO - __main__ - Step 504: {'lr': 8.266666666666667e-06, 'samples': 16128, 'steps': 31, 'loss/train': 7.799205303192139} -09/20/2021 14:35:43 - INFO - __main__ - Step 505: {'lr': 8.266666666666667e-06, 'samples': 16160, 'steps': 31, 'loss/train': 8.155591011047363} -09/20/2021 14:35:44 - INFO - __main__ - Step 506: {'lr': 8.266666666666667e-06, 'samples': 16192, 'steps': 31, 'loss/train': 8.588030815124512} -09/20/2021 14:35:45 - INFO - __main__ - Step 507: {'lr': 8.266666666666667e-06, 'samples': 16224, 'steps': 31, 'loss/train': 8.440332412719727} -09/20/2021 14:35:46 - INFO - __main__ - Step 508: {'lr': 8.266666666666667e-06, 'samples': 16256, 'steps': 31, 'loss/train': 8.794659614562988} -09/20/2021 14:35:46 - INFO - __main__ - Step 509: {'lr': 8.266666666666667e-06, 'samples': 16288, 'steps': 31, 'loss/train': 8.396638870239258} -09/20/2021 14:35:47 - INFO - __main__ - Step 510: {'lr': 8.266666666666667e-06, 'samples': 16320, 'steps': 31, 'loss/train': 8.408777236938477} -09/20/2021 14:35:48 - INFO - __main__ - Step 511: {'lr': 8.266666666666667e-06, 'samples': 16352, 'steps': 31, 'loss/train': 9.25987720489502} -09/20/2021 14:35:49 - INFO - __main__ - Step 512: {'lr': 8.266666666666667e-06, 'samples': 16384, 'steps': 31, 'loss/train': 8.11778450012207} -09/20/2021 14:35:49 - INFO - __main__ - Step 513: {'lr': 8.533333333333334e-06, 'samples': 16416, 'steps': 32, 'loss/train': 8.825359344482422} -09/20/2021 14:35:50 - INFO - __main__ - Step 514: {'lr': 8.533333333333334e-06, 'samples': 16448, 'steps': 32, 'loss/train': 8.835354804992676} -09/20/2021 14:35:51 - INFO - __main__ - Step 515: {'lr': 8.533333333333334e-06, 'samples': 16480, 'steps': 32, 'loss/train': 7.6844024658203125} -09/20/2021 14:35:52 - INFO - __main__ - Step 516: {'lr': 8.533333333333334e-06, 'samples': 16512, 'steps': 32, 'loss/train': 8.693580627441406} -09/20/2021 14:35:52 - INFO - __main__ - Step 517: {'lr': 8.533333333333334e-06, 'samples': 16544, 'steps': 32, 'loss/train': 8.878600120544434} -09/20/2021 14:35:53 - INFO - __main__ - Step 518: {'lr': 8.533333333333334e-06, 'samples': 16576, 'steps': 32, 'loss/train': 8.33576774597168} -09/20/2021 14:35:54 - INFO - __main__ - Step 519: {'lr': 8.533333333333334e-06, 'samples': 16608, 'steps': 32, 'loss/train': 8.393767356872559} -09/20/2021 14:35:55 - INFO - __main__ - Step 520: {'lr': 8.533333333333334e-06, 'samples': 16640, 'steps': 32, 'loss/train': 8.187295913696289} -09/20/2021 14:35:55 - INFO - __main__ - Step 521: {'lr': 8.533333333333334e-06, 'samples': 16672, 'steps': 32, 'loss/train': 8.288887977600098} -09/20/2021 14:35:56 - INFO - __main__ - Step 522: {'lr': 8.533333333333334e-06, 'samples': 16704, 'steps': 32, 'loss/train': 7.9046831130981445} -09/20/2021 14:35:57 - INFO - __main__ - Step 523: {'lr': 8.533333333333334e-06, 'samples': 16736, 'steps': 32, 'loss/train': 8.324329376220703} -09/20/2021 14:35:58 - INFO - __main__ - Step 524: {'lr': 8.533333333333334e-06, 'samples': 16768, 'steps': 32, 'loss/train': 8.056224822998047} -09/20/2021 14:35:59 - INFO - __main__ - Step 525: {'lr': 8.533333333333334e-06, 'samples': 16800, 'steps': 32, 'loss/train': 7.490893363952637} -09/20/2021 14:36:00 - INFO - __main__ - Step 526: {'lr': 8.533333333333334e-06, 'samples': 16832, 'steps': 32, 'loss/train': 8.320823669433594} -09/20/2021 14:36:01 - INFO - __main__ - Step 527: {'lr': 8.533333333333334e-06, 'samples': 16864, 'steps': 32, 'loss/train': 8.018965721130371} -09/20/2021 14:36:02 - INFO - __main__ - Step 528: {'lr': 8.533333333333334e-06, 'samples': 16896, 'steps': 32, 'loss/train': 7.911492347717285} -09/20/2021 14:36:03 - INFO - __main__ - Step 529: {'lr': 8.8e-06, 'samples': 16928, 'steps': 33, 'loss/train': 8.783736228942871} -09/20/2021 14:36:03 - INFO - __main__ - Step 530: {'lr': 8.8e-06, 'samples': 16960, 'steps': 33, 'loss/train': 9.046895027160645} -09/20/2021 14:36:04 - INFO - __main__ - Step 531: {'lr': 8.8e-06, 'samples': 16992, 'steps': 33, 'loss/train': 8.206110954284668} -09/20/2021 14:36:05 - INFO - __main__ - Step 532: {'lr': 8.8e-06, 'samples': 17024, 'steps': 33, 'loss/train': 7.160069942474365} -09/20/2021 14:36:06 - INFO - __main__ - Step 533: {'lr': 8.8e-06, 'samples': 17056, 'steps': 33, 'loss/train': 8.491114616394043} -09/20/2021 14:36:06 - INFO - __main__ - Step 534: {'lr': 8.8e-06, 'samples': 17088, 'steps': 33, 'loss/train': 9.388814926147461} -09/20/2021 14:36:07 - INFO - __main__ - Step 535: {'lr': 8.8e-06, 'samples': 17120, 'steps': 33, 'loss/train': 8.50621509552002} -09/20/2021 14:36:08 - INFO - __main__ - Step 536: {'lr': 8.8e-06, 'samples': 17152, 'steps': 33, 'loss/train': 8.300721168518066} -09/20/2021 14:36:09 - INFO - __main__ - Step 537: {'lr': 8.8e-06, 'samples': 17184, 'steps': 33, 'loss/train': 7.564702033996582} -09/20/2021 14:36:09 - INFO - __main__ - Step 538: {'lr': 8.8e-06, 'samples': 17216, 'steps': 33, 'loss/train': 8.575708389282227} -09/20/2021 14:36:10 - INFO - __main__ - Step 539: {'lr': 8.8e-06, 'samples': 17248, 'steps': 33, 'loss/train': 8.734574317932129} -09/20/2021 14:36:11 - INFO - __main__ - Step 540: {'lr': 8.8e-06, 'samples': 17280, 'steps': 33, 'loss/train': 8.04681396484375} -09/20/2021 14:36:12 - INFO - __main__ - Step 541: {'lr': 8.8e-06, 'samples': 17312, 'steps': 33, 'loss/train': 8.33742618560791} -09/20/2021 14:36:12 - INFO - __main__ - Step 542: {'lr': 8.8e-06, 'samples': 17344, 'steps': 33, 'loss/train': 7.7675909996032715} -09/20/2021 14:36:13 - INFO - __main__ - Step 543: {'lr': 8.8e-06, 'samples': 17376, 'steps': 33, 'loss/train': 9.688101768493652} -09/20/2021 14:36:14 - INFO - __main__ - Step 544: {'lr': 8.8e-06, 'samples': 17408, 'steps': 33, 'loss/train': 9.816047668457031} -09/20/2021 14:36:15 - INFO - __main__ - Step 545: {'lr': 9.066666666666667e-06, 'samples': 17440, 'steps': 34, 'loss/train': 9.425687789916992} -09/20/2021 14:36:15 - INFO - __main__ - Step 546: {'lr': 9.066666666666667e-06, 'samples': 17472, 'steps': 34, 'loss/train': 9.720455169677734} -09/20/2021 14:36:16 - INFO - __main__ - Step 547: {'lr': 9.066666666666667e-06, 'samples': 17504, 'steps': 34, 'loss/train': 9.632379531860352} -09/20/2021 14:36:17 - INFO - __main__ - Step 548: {'lr': 9.066666666666667e-06, 'samples': 17536, 'steps': 34, 'loss/train': 9.355306625366211} -09/20/2021 14:36:18 - INFO - __main__ - Step 549: {'lr': 9.066666666666667e-06, 'samples': 17568, 'steps': 34, 'loss/train': 9.736352920532227} -09/20/2021 14:36:18 - INFO - __main__ - Step 550: {'lr': 9.066666666666667e-06, 'samples': 17600, 'steps': 34, 'loss/train': 9.478496551513672} -09/20/2021 14:36:19 - INFO - __main__ - Step 551: {'lr': 9.066666666666667e-06, 'samples': 17632, 'steps': 34, 'loss/train': 9.364480018615723} -09/20/2021 14:36:20 - INFO - __main__ - Step 552: {'lr': 9.066666666666667e-06, 'samples': 17664, 'steps': 34, 'loss/train': 9.492999076843262} -09/20/2021 14:36:21 - INFO - __main__ - Step 553: {'lr': 9.066666666666667e-06, 'samples': 17696, 'steps': 34, 'loss/train': 9.483695030212402} -09/20/2021 14:36:21 - INFO - __main__ - Step 554: {'lr': 9.066666666666667e-06, 'samples': 17728, 'steps': 34, 'loss/train': 9.433053016662598} -09/20/2021 14:36:22 - INFO - __main__ - Step 555: {'lr': 9.066666666666667e-06, 'samples': 17760, 'steps': 34, 'loss/train': 9.593360900878906} -09/20/2021 14:36:23 - INFO - __main__ - Step 556: {'lr': 9.066666666666667e-06, 'samples': 17792, 'steps': 34, 'loss/train': 9.731925010681152} -09/20/2021 14:36:24 - INFO - __main__ - Step 557: {'lr': 9.066666666666667e-06, 'samples': 17824, 'steps': 34, 'loss/train': 9.55380916595459} -09/20/2021 14:36:24 - INFO - __main__ - Step 558: {'lr': 9.066666666666667e-06, 'samples': 17856, 'steps': 34, 'loss/train': 9.75314998626709} -09/20/2021 14:36:25 - INFO - __main__ - Step 559: {'lr': 9.066666666666667e-06, 'samples': 17888, 'steps': 34, 'loss/train': 9.529624938964844} -09/20/2021 14:36:26 - INFO - __main__ - Step 560: {'lr': 9.066666666666667e-06, 'samples': 17920, 'steps': 34, 'loss/train': 8.741135597229004} -09/20/2021 14:36:27 - INFO - __main__ - Step 561: {'lr': 9.333333333333334e-06, 'samples': 17952, 'steps': 35, 'loss/train': 8.412064552307129} -09/20/2021 14:36:28 - INFO - __main__ - Step 562: {'lr': 9.333333333333334e-06, 'samples': 17984, 'steps': 35, 'loss/train': 7.190771102905273} -09/20/2021 14:36:28 - INFO - __main__ - Step 563: {'lr': 9.333333333333334e-06, 'samples': 18016, 'steps': 35, 'loss/train': 8.33745002746582} -09/20/2021 14:36:29 - INFO - __main__ - Step 564: {'lr': 9.333333333333334e-06, 'samples': 18048, 'steps': 35, 'loss/train': 8.582221984863281} -09/20/2021 14:36:30 - INFO - __main__ - Step 565: {'lr': 9.333333333333334e-06, 'samples': 18080, 'steps': 35, 'loss/train': 8.222381591796875} -09/20/2021 14:36:31 - INFO - __main__ - Step 566: {'lr': 9.333333333333334e-06, 'samples': 18112, 'steps': 35, 'loss/train': 8.349543571472168} -09/20/2021 14:36:33 - INFO - __main__ - Step 567: {'lr': 9.333333333333334e-06, 'samples': 18144, 'steps': 35, 'loss/train': 7.718624114990234} -09/20/2021 14:36:33 - INFO - __main__ - Step 568: {'lr': 9.333333333333334e-06, 'samples': 18176, 'steps': 35, 'loss/train': 8.092018127441406} -09/20/2021 14:36:34 - INFO - __main__ - Step 569: {'lr': 9.333333333333334e-06, 'samples': 18208, 'steps': 35, 'loss/train': 8.079546928405762} -09/20/2021 14:36:35 - INFO - __main__ - Step 570: {'lr': 9.333333333333334e-06, 'samples': 18240, 'steps': 35, 'loss/train': 7.948099136352539} -09/20/2021 14:36:36 - INFO - __main__ - Step 571: {'lr': 9.333333333333334e-06, 'samples': 18272, 'steps': 35, 'loss/train': 8.212067604064941} -09/20/2021 14:36:36 - INFO - __main__ - Step 572: {'lr': 9.333333333333334e-06, 'samples': 18304, 'steps': 35, 'loss/train': 8.219112396240234} -09/20/2021 14:36:37 - INFO - __main__ - Step 573: {'lr': 9.333333333333334e-06, 'samples': 18336, 'steps': 35, 'loss/train': 8.142801284790039} -09/20/2021 14:36:38 - INFO - __main__ - Step 574: {'lr': 9.333333333333334e-06, 'samples': 18368, 'steps': 35, 'loss/train': 7.568868160247803} -09/20/2021 14:36:39 - INFO - __main__ - Step 575: {'lr': 9.333333333333334e-06, 'samples': 18400, 'steps': 35, 'loss/train': 8.55990219116211} -09/20/2021 14:36:39 - INFO - __main__ - Step 576: {'lr': 9.333333333333334e-06, 'samples': 18432, 'steps': 35, 'loss/train': 7.636648178100586} -09/20/2021 14:36:40 - INFO - __main__ - Step 577: {'lr': 9.600000000000001e-06, 'samples': 18464, 'steps': 36, 'loss/train': 8.44161319732666} -09/20/2021 14:36:41 - INFO - __main__ - Step 578: {'lr': 9.600000000000001e-06, 'samples': 18496, 'steps': 36, 'loss/train': 8.701559066772461} -09/20/2021 14:36:42 - INFO - __main__ - Step 579: {'lr': 9.600000000000001e-06, 'samples': 18528, 'steps': 36, 'loss/train': 8.326879501342773} -09/20/2021 14:36:42 - INFO - __main__ - Step 580: {'lr': 9.600000000000001e-06, 'samples': 18560, 'steps': 36, 'loss/train': 8.29944133758545} -09/20/2021 14:36:43 - INFO - __main__ - Step 581: {'lr': 9.600000000000001e-06, 'samples': 18592, 'steps': 36, 'loss/train': 7.866985321044922} -09/20/2021 14:36:44 - INFO - __main__ - Step 582: {'lr': 9.600000000000001e-06, 'samples': 18624, 'steps': 36, 'loss/train': 8.37120246887207} -09/20/2021 14:36:45 - INFO - __main__ - Step 583: {'lr': 9.600000000000001e-06, 'samples': 18656, 'steps': 36, 'loss/train': 8.124831199645996} -09/20/2021 14:36:45 - INFO - __main__ - Step 584: {'lr': 9.600000000000001e-06, 'samples': 18688, 'steps': 36, 'loss/train': 8.07022476196289} -09/20/2021 14:36:46 - INFO - __main__ - Step 585: {'lr': 9.600000000000001e-06, 'samples': 18720, 'steps': 36, 'loss/train': 8.087706565856934} -09/20/2021 14:36:47 - INFO - __main__ - Step 586: {'lr': 9.600000000000001e-06, 'samples': 18752, 'steps': 36, 'loss/train': 8.095897674560547} -09/20/2021 14:36:48 - INFO - __main__ - Step 587: {'lr': 9.600000000000001e-06, 'samples': 18784, 'steps': 36, 'loss/train': 7.755162715911865} -09/20/2021 14:36:48 - INFO - __main__ - Step 588: {'lr': 9.600000000000001e-06, 'samples': 18816, 'steps': 36, 'loss/train': 8.178751945495605} -09/20/2021 14:36:49 - INFO - __main__ - Step 589: {'lr': 9.600000000000001e-06, 'samples': 18848, 'steps': 36, 'loss/train': 8.528087615966797} -09/20/2021 14:36:50 - INFO - __main__ - Step 590: {'lr': 9.600000000000001e-06, 'samples': 18880, 'steps': 36, 'loss/train': 8.79305362701416} -09/20/2021 14:36:51 - INFO - __main__ - Step 591: {'lr': 9.600000000000001e-06, 'samples': 18912, 'steps': 36, 'loss/train': 9.014626502990723} -09/20/2021 14:36:51 - INFO - __main__ - Step 592: {'lr': 9.600000000000001e-06, 'samples': 18944, 'steps': 36, 'loss/train': 8.73847770690918} -09/20/2021 14:36:52 - INFO - __main__ - Step 593: {'lr': 9.866666666666667e-06, 'samples': 18976, 'steps': 37, 'loss/train': 7.951117992401123} -09/20/2021 14:36:53 - INFO - __main__ - Step 594: {'lr': 9.866666666666667e-06, 'samples': 19008, 'steps': 37, 'loss/train': 7.945525169372559} -09/20/2021 14:36:54 - INFO - __main__ - Step 595: {'lr': 9.866666666666667e-06, 'samples': 19040, 'steps': 37, 'loss/train': 8.020062446594238} -09/20/2021 14:36:55 - INFO - __main__ - Step 596: {'lr': 9.866666666666667e-06, 'samples': 19072, 'steps': 37, 'loss/train': 7.916811943054199} -09/20/2021 14:36:55 - INFO - __main__ - Step 597: {'lr': 9.866666666666667e-06, 'samples': 19104, 'steps': 37, 'loss/train': 9.150860786437988} -09/20/2021 14:36:57 - INFO - __main__ - Step 598: {'lr': 9.866666666666667e-06, 'samples': 19136, 'steps': 37, 'loss/train': 8.281364440917969} -09/20/2021 14:36:57 - INFO - __main__ - Step 599: {'lr': 9.866666666666667e-06, 'samples': 19168, 'steps': 37, 'loss/train': 7.7781782150268555} -09/20/2021 14:36:58 - INFO - __main__ - Step 600: {'lr': 9.866666666666667e-06, 'samples': 19200, 'steps': 37, 'loss/train': 8.38415241241455} -09/20/2021 14:36:59 - INFO - __main__ - Step 601: {'lr': 9.866666666666667e-06, 'samples': 19232, 'steps': 37, 'loss/train': 8.009666442871094} -09/20/2021 14:37:00 - INFO - __main__ - Step 602: {'lr': 9.866666666666667e-06, 'samples': 19264, 'steps': 37, 'loss/train': 8.265867233276367} -09/20/2021 14:37:00 - INFO - __main__ - Step 603: {'lr': 9.866666666666667e-06, 'samples': 19296, 'steps': 37, 'loss/train': 8.36002254486084} -09/20/2021 14:37:01 - INFO - __main__ - Step 604: {'lr': 9.866666666666667e-06, 'samples': 19328, 'steps': 37, 'loss/train': 8.168669700622559} -09/20/2021 14:37:02 - INFO - __main__ - Step 605: {'lr': 9.866666666666667e-06, 'samples': 19360, 'steps': 37, 'loss/train': 8.582223892211914} -09/20/2021 14:37:03 - INFO - __main__ - Step 606: {'lr': 9.866666666666667e-06, 'samples': 19392, 'steps': 37, 'loss/train': 8.509109497070312} -09/20/2021 14:37:03 - INFO - __main__ - Step 607: {'lr': 9.866666666666667e-06, 'samples': 19424, 'steps': 37, 'loss/train': 7.671741962432861} -09/20/2021 14:37:04 - INFO - __main__ - Step 608: {'lr': 9.866666666666667e-06, 'samples': 19456, 'steps': 37, 'loss/train': 7.870421409606934} -09/20/2021 14:37:05 - INFO - __main__ - Step 609: {'lr': 1.0133333333333333e-05, 'samples': 19488, 'steps': 38, 'loss/train': 8.09602165222168} -09/20/2021 14:37:06 - INFO - __main__ - Step 610: {'lr': 1.0133333333333333e-05, 'samples': 19520, 'steps': 38, 'loss/train': 8.51254653930664} -09/20/2021 14:37:06 - INFO - __main__ - Step 611: {'lr': 1.0133333333333333e-05, 'samples': 19552, 'steps': 38, 'loss/train': 8.62251091003418} -09/20/2021 14:37:07 - INFO - __main__ - Step 612: {'lr': 1.0133333333333333e-05, 'samples': 19584, 'steps': 38, 'loss/train': 8.159732818603516} -09/20/2021 14:37:08 - INFO - __main__ - Step 613: {'lr': 1.0133333333333333e-05, 'samples': 19616, 'steps': 38, 'loss/train': 8.589771270751953} -09/20/2021 14:37:09 - INFO - __main__ - Step 614: {'lr': 1.0133333333333333e-05, 'samples': 19648, 'steps': 38, 'loss/train': 8.612579345703125} -09/20/2021 14:37:09 - INFO - __main__ - Step 615: {'lr': 1.0133333333333333e-05, 'samples': 19680, 'steps': 38, 'loss/train': 8.160099029541016} -09/20/2021 14:37:10 - INFO - __main__ - Step 616: {'lr': 1.0133333333333333e-05, 'samples': 19712, 'steps': 38, 'loss/train': 8.790704727172852} -09/20/2021 14:37:11 - INFO - __main__ - Step 617: {'lr': 1.0133333333333333e-05, 'samples': 19744, 'steps': 38, 'loss/train': 7.502357482910156} -09/20/2021 14:37:12 - INFO - __main__ - Step 618: {'lr': 1.0133333333333333e-05, 'samples': 19776, 'steps': 38, 'loss/train': 7.9711432456970215} -09/20/2021 14:37:12 - INFO - __main__ - Step 619: {'lr': 1.0133333333333333e-05, 'samples': 19808, 'steps': 38, 'loss/train': 8.271267890930176} -09/20/2021 14:37:13 - INFO - __main__ - Step 620: {'lr': 1.0133333333333333e-05, 'samples': 19840, 'steps': 38, 'loss/train': 7.968970775604248} -09/20/2021 14:37:14 - INFO - __main__ - Step 621: {'lr': 1.0133333333333333e-05, 'samples': 19872, 'steps': 38, 'loss/train': 8.774761199951172} -09/20/2021 14:37:15 - INFO - __main__ - Step 622: {'lr': 1.0133333333333333e-05, 'samples': 19904, 'steps': 38, 'loss/train': 8.688358306884766} -09/20/2021 14:37:15 - INFO - __main__ - Step 623: {'lr': 1.0133333333333333e-05, 'samples': 19936, 'steps': 38, 'loss/train': 8.473465919494629} -09/20/2021 14:37:16 - INFO - __main__ - Step 624: {'lr': 1.0133333333333333e-05, 'samples': 19968, 'steps': 38, 'loss/train': 7.436355113983154} -09/20/2021 14:37:17 - INFO - __main__ - Step 625: {'lr': 1.04e-05, 'samples': 20000, 'steps': 39, 'loss/train': 7.904182434082031} -09/20/2021 14:37:18 - INFO - __main__ - Step 626: {'lr': 1.04e-05, 'samples': 20032, 'steps': 39, 'loss/train': 7.654538154602051} -09/20/2021 14:37:19 - INFO - __main__ - Step 627: {'lr': 1.04e-05, 'samples': 20064, 'steps': 39, 'loss/train': 8.440096855163574} -09/20/2021 14:37:20 - INFO - __main__ - Step 628: {'lr': 1.04e-05, 'samples': 20096, 'steps': 39, 'loss/train': 8.262388229370117} -09/20/2021 14:37:21 - INFO - __main__ - Step 629: {'lr': 1.04e-05, 'samples': 20128, 'steps': 39, 'loss/train': 7.936562538146973} -09/20/2021 14:37:21 - INFO - __main__ - Step 630: {'lr': 1.04e-05, 'samples': 20160, 'steps': 39, 'loss/train': 8.2278470993042} -09/20/2021 14:37:22 - INFO - __main__ - Step 631: {'lr': 1.04e-05, 'samples': 20192, 'steps': 39, 'loss/train': 7.647819995880127} -09/20/2021 14:37:23 - INFO - __main__ - Step 632: {'lr': 1.04e-05, 'samples': 20224, 'steps': 39, 'loss/train': 8.356863021850586} -09/20/2021 14:37:24 - INFO - __main__ - Step 633: {'lr': 1.04e-05, 'samples': 20256, 'steps': 39, 'loss/train': 7.685931205749512} -09/20/2021 14:37:24 - INFO - __main__ - Step 634: {'lr': 1.04e-05, 'samples': 20288, 'steps': 39, 'loss/train': 7.961510181427002} -09/20/2021 14:37:25 - INFO - __main__ - Step 635: {'lr': 1.04e-05, 'samples': 20320, 'steps': 39, 'loss/train': 8.423910140991211} -09/20/2021 14:37:26 - INFO - __main__ - Step 636: {'lr': 1.04e-05, 'samples': 20352, 'steps': 39, 'loss/train': 8.136650085449219} -09/20/2021 14:37:27 - INFO - __main__ - Step 637: {'lr': 1.04e-05, 'samples': 20384, 'steps': 39, 'loss/train': 9.513691902160645} -09/20/2021 14:37:27 - INFO - __main__ - Step 638: {'lr': 1.04e-05, 'samples': 20416, 'steps': 39, 'loss/train': 8.585381507873535} -09/20/2021 14:37:28 - INFO - __main__ - Step 639: {'lr': 1.04e-05, 'samples': 20448, 'steps': 39, 'loss/train': 8.060375213623047} -09/20/2021 14:37:29 - INFO - __main__ - Step 640: {'lr': 1.04e-05, 'samples': 20480, 'steps': 39, 'loss/train': 8.00006103515625} -09/20/2021 14:37:30 - INFO - __main__ - Step 641: {'lr': 1.0666666666666667e-05, 'samples': 20512, 'steps': 40, 'loss/train': 7.308459758758545} -09/20/2021 14:37:31 - INFO - __main__ - Step 642: {'lr': 1.0666666666666667e-05, 'samples': 20544, 'steps': 40, 'loss/train': 8.024554252624512} -09/20/2021 14:37:31 - INFO - __main__ - Step 643: {'lr': 1.0666666666666667e-05, 'samples': 20576, 'steps': 40, 'loss/train': 8.829021453857422} -09/20/2021 14:37:32 - INFO - __main__ - Step 644: {'lr': 1.0666666666666667e-05, 'samples': 20608, 'steps': 40, 'loss/train': 7.778556823730469} -09/20/2021 14:37:33 - INFO - __main__ - Step 645: {'lr': 1.0666666666666667e-05, 'samples': 20640, 'steps': 40, 'loss/train': 8.022852897644043} -09/20/2021 14:37:34 - INFO - __main__ - Step 646: {'lr': 1.0666666666666667e-05, 'samples': 20672, 'steps': 40, 'loss/train': 7.76801061630249} -09/20/2021 14:37:34 - INFO - __main__ - Step 647: {'lr': 1.0666666666666667e-05, 'samples': 20704, 'steps': 40, 'loss/train': 8.066608428955078} -09/20/2021 14:37:35 - INFO - __main__ - Step 648: {'lr': 1.0666666666666667e-05, 'samples': 20736, 'steps': 40, 'loss/train': 8.202385902404785} -09/20/2021 14:37:36 - INFO - __main__ - Step 649: {'lr': 1.0666666666666667e-05, 'samples': 20768, 'steps': 40, 'loss/train': 7.619396209716797} -09/20/2021 14:37:37 - INFO - __main__ - Step 650: {'lr': 1.0666666666666667e-05, 'samples': 20800, 'steps': 40, 'loss/train': 8.82582950592041} -09/20/2021 14:37:37 - INFO - __main__ - Step 651: {'lr': 1.0666666666666667e-05, 'samples': 20832, 'steps': 40, 'loss/train': 7.589515209197998} -09/20/2021 14:37:38 - INFO - __main__ - Step 652: {'lr': 1.0666666666666667e-05, 'samples': 20864, 'steps': 40, 'loss/train': 8.452483177185059} -09/20/2021 14:37:39 - INFO - __main__ - Step 653: {'lr': 1.0666666666666667e-05, 'samples': 20896, 'steps': 40, 'loss/train': 8.422913551330566} -09/20/2021 14:37:40 - INFO - __main__ - Step 654: {'lr': 1.0666666666666667e-05, 'samples': 20928, 'steps': 40, 'loss/train': 8.67952823638916} -09/20/2021 14:37:40 - INFO - __main__ - Step 655: {'lr': 1.0666666666666667e-05, 'samples': 20960, 'steps': 40, 'loss/train': 8.386114120483398} -09/20/2021 14:37:41 - INFO - __main__ - Step 656: {'lr': 1.0666666666666667e-05, 'samples': 20992, 'steps': 40, 'loss/train': 8.26198959350586} -09/20/2021 14:37:42 - INFO - __main__ - Step 657: {'lr': 1.0933333333333334e-05, 'samples': 21024, 'steps': 41, 'loss/train': 8.706418991088867} -09/20/2021 14:37:43 - INFO - __main__ - Step 658: {'lr': 1.0933333333333334e-05, 'samples': 21056, 'steps': 41, 'loss/train': 8.25497055053711} -09/20/2021 14:37:44 - INFO - __main__ - Step 659: {'lr': 1.0933333333333334e-05, 'samples': 21088, 'steps': 41, 'loss/train': 8.4746732711792} -09/20/2021 14:37:45 - INFO - __main__ - Step 660: {'lr': 1.0933333333333334e-05, 'samples': 21120, 'steps': 41, 'loss/train': 8.232172966003418} -09/20/2021 14:37:46 - INFO - __main__ - Step 661: {'lr': 1.0933333333333334e-05, 'samples': 21152, 'steps': 41, 'loss/train': 8.457083702087402} -09/20/2021 14:37:46 - INFO - __main__ - Step 662: {'lr': 1.0933333333333334e-05, 'samples': 21184, 'steps': 41, 'loss/train': 8.37494945526123} -09/20/2021 14:37:47 - INFO - __main__ - Step 663: {'lr': 1.0933333333333334e-05, 'samples': 21216, 'steps': 41, 'loss/train': 8.53903579711914} -09/20/2021 14:37:48 - INFO - __main__ - Step 664: {'lr': 1.0933333333333334e-05, 'samples': 21248, 'steps': 41, 'loss/train': 7.750667572021484} -09/20/2021 14:37:49 - INFO - __main__ - Step 665: {'lr': 1.0933333333333334e-05, 'samples': 21280, 'steps': 41, 'loss/train': 7.44536018371582} -09/20/2021 14:37:49 - INFO - __main__ - Step 666: {'lr': 1.0933333333333334e-05, 'samples': 21312, 'steps': 41, 'loss/train': 7.926060199737549} -09/20/2021 14:37:50 - INFO - __main__ - Step 667: {'lr': 1.0933333333333334e-05, 'samples': 21344, 'steps': 41, 'loss/train': 7.5139384269714355} -09/20/2021 14:37:51 - INFO - __main__ - Step 668: {'lr': 1.0933333333333334e-05, 'samples': 21376, 'steps': 41, 'loss/train': 8.306523323059082} -09/20/2021 14:37:52 - INFO - __main__ - Step 669: {'lr': 1.0933333333333334e-05, 'samples': 21408, 'steps': 41, 'loss/train': 8.263107299804688} -09/20/2021 14:37:52 - INFO - __main__ - Step 670: {'lr': 1.0933333333333334e-05, 'samples': 21440, 'steps': 41, 'loss/train': 7.740838527679443} -09/20/2021 14:37:53 - INFO - __main__ - Step 671: {'lr': 1.0933333333333334e-05, 'samples': 21472, 'steps': 41, 'loss/train': 8.224099159240723} -09/20/2021 14:37:54 - INFO - __main__ - Step 672: {'lr': 1.0933333333333334e-05, 'samples': 21504, 'steps': 41, 'loss/train': 8.64636516571045} -09/20/2021 14:37:55 - INFO - __main__ - Step 673: {'lr': 1.1200000000000001e-05, 'samples': 21536, 'steps': 42, 'loss/train': 7.763875961303711} -09/20/2021 14:37:55 - INFO - __main__ - Step 674: {'lr': 1.1200000000000001e-05, 'samples': 21568, 'steps': 42, 'loss/train': 8.552425384521484} -09/20/2021 14:37:56 - INFO - __main__ - Step 675: {'lr': 1.1200000000000001e-05, 'samples': 21600, 'steps': 42, 'loss/train': 8.715279579162598} -09/20/2021 14:37:57 - INFO - __main__ - Step 676: {'lr': 1.1200000000000001e-05, 'samples': 21632, 'steps': 42, 'loss/train': 8.853663444519043} -09/20/2021 14:37:58 - INFO - __main__ - Step 677: {'lr': 1.1200000000000001e-05, 'samples': 21664, 'steps': 42, 'loss/train': 8.752096176147461} -09/20/2021 14:37:58 - INFO - __main__ - Step 678: {'lr': 1.1200000000000001e-05, 'samples': 21696, 'steps': 42, 'loss/train': 8.208806991577148} -09/20/2021 14:37:59 - INFO - __main__ - Step 679: {'lr': 1.1200000000000001e-05, 'samples': 21728, 'steps': 42, 'loss/train': 8.30477237701416} -09/20/2021 14:38:00 - INFO - __main__ - Step 680: {'lr': 1.1200000000000001e-05, 'samples': 21760, 'steps': 42, 'loss/train': 8.172144889831543} -09/20/2021 14:38:01 - INFO - __main__ - Step 681: {'lr': 1.1200000000000001e-05, 'samples': 21792, 'steps': 42, 'loss/train': 7.4111247062683105} -09/20/2021 14:38:01 - INFO - __main__ - Step 682: {'lr': 1.1200000000000001e-05, 'samples': 21824, 'steps': 42, 'loss/train': 7.65539026260376} -09/20/2021 14:38:02 - INFO - __main__ - Step 683: {'lr': 1.1200000000000001e-05, 'samples': 21856, 'steps': 42, 'loss/train': 7.853024959564209} -09/20/2021 14:38:03 - INFO - __main__ - Step 684: {'lr': 1.1200000000000001e-05, 'samples': 21888, 'steps': 42, 'loss/train': 7.4219746589660645} -09/20/2021 14:38:04 - INFO - __main__ - Step 685: {'lr': 1.1200000000000001e-05, 'samples': 21920, 'steps': 42, 'loss/train': 8.378847122192383} -09/20/2021 14:38:04 - INFO - __main__ - Step 686: {'lr': 1.1200000000000001e-05, 'samples': 21952, 'steps': 42, 'loss/train': 7.828614234924316} -09/20/2021 14:38:05 - INFO - __main__ - Step 687: {'lr': 1.1200000000000001e-05, 'samples': 21984, 'steps': 42, 'loss/train': 7.3314104080200195} -09/20/2021 14:38:06 - INFO - __main__ - Step 688: {'lr': 1.1200000000000001e-05, 'samples': 22016, 'steps': 42, 'loss/train': 7.204861640930176} -09/20/2021 14:38:07 - INFO - __main__ - Step 689: {'lr': 1.1466666666666666e-05, 'samples': 22048, 'steps': 43, 'loss/train': 8.895034790039062} -09/20/2021 14:38:08 - INFO - __main__ - Step 690: {'lr': 1.1466666666666666e-05, 'samples': 22080, 'steps': 43, 'loss/train': 7.843775272369385} -09/20/2021 14:38:09 - INFO - __main__ - Step 691: {'lr': 1.1466666666666666e-05, 'samples': 22112, 'steps': 43, 'loss/train': 8.166061401367188} -09/20/2021 14:38:10 - INFO - __main__ - Step 692: {'lr': 1.1466666666666666e-05, 'samples': 22144, 'steps': 43, 'loss/train': 8.09485149383545} -09/20/2021 14:38:10 - INFO - __main__ - Step 693: {'lr': 1.1466666666666666e-05, 'samples': 22176, 'steps': 43, 'loss/train': 7.934488296508789} -09/20/2021 14:38:11 - INFO - __main__ - Step 694: {'lr': 1.1466666666666666e-05, 'samples': 22208, 'steps': 43, 'loss/train': 8.562483787536621} -09/20/2021 14:38:12 - INFO - __main__ - Step 695: {'lr': 1.1466666666666666e-05, 'samples': 22240, 'steps': 43, 'loss/train': 7.8697590827941895} -09/20/2021 14:38:13 - INFO - __main__ - Step 696: {'lr': 1.1466666666666666e-05, 'samples': 22272, 'steps': 43, 'loss/train': 7.242289066314697} -09/20/2021 14:38:13 - INFO - __main__ - Step 697: {'lr': 1.1466666666666666e-05, 'samples': 22304, 'steps': 43, 'loss/train': 7.033276557922363} -09/20/2021 14:38:14 - INFO - __main__ - Step 698: {'lr': 1.1466666666666666e-05, 'samples': 22336, 'steps': 43, 'loss/train': 8.194336891174316} -09/20/2021 14:38:15 - INFO - __main__ - Step 699: {'lr': 1.1466666666666666e-05, 'samples': 22368, 'steps': 43, 'loss/train': 7.9126296043396} -09/20/2021 14:38:16 - INFO - __main__ - Step 700: {'lr': 1.1466666666666666e-05, 'samples': 22400, 'steps': 43, 'loss/train': 7.53933572769165} -09/20/2021 14:38:16 - INFO - __main__ - Step 701: {'lr': 1.1466666666666666e-05, 'samples': 22432, 'steps': 43, 'loss/train': 8.280013084411621} -09/20/2021 14:38:17 - INFO - __main__ - Step 702: {'lr': 1.1466666666666666e-05, 'samples': 22464, 'steps': 43, 'loss/train': 8.451242446899414} -09/20/2021 14:38:18 - INFO - __main__ - Step 703: {'lr': 1.1466666666666666e-05, 'samples': 22496, 'steps': 43, 'loss/train': 8.355430603027344} -09/20/2021 14:38:19 - INFO - __main__ - Step 704: {'lr': 1.1466666666666666e-05, 'samples': 22528, 'steps': 43, 'loss/train': 8.32046890258789} -09/20/2021 14:38:20 - INFO - __main__ - Step 705: {'lr': 1.1733333333333333e-05, 'samples': 22560, 'steps': 44, 'loss/train': 8.096234321594238} -09/20/2021 14:38:20 - INFO - __main__ - Step 706: {'lr': 1.1733333333333333e-05, 'samples': 22592, 'steps': 44, 'loss/train': 7.6711626052856445} -09/20/2021 14:38:21 - INFO - __main__ - Step 707: {'lr': 1.1733333333333333e-05, 'samples': 22624, 'steps': 44, 'loss/train': 8.73442268371582} -09/20/2021 14:38:22 - INFO - __main__ - Step 708: {'lr': 1.1733333333333333e-05, 'samples': 22656, 'steps': 44, 'loss/train': 8.009572982788086} -09/20/2021 14:38:23 - INFO - __main__ - Step 709: {'lr': 1.1733333333333333e-05, 'samples': 22688, 'steps': 44, 'loss/train': 8.056120872497559} -09/20/2021 14:38:23 - INFO - __main__ - Step 710: {'lr': 1.1733333333333333e-05, 'samples': 22720, 'steps': 44, 'loss/train': 8.365805625915527} -09/20/2021 14:38:24 - INFO - __main__ - Step 711: {'lr': 1.1733333333333333e-05, 'samples': 22752, 'steps': 44, 'loss/train': 7.600273609161377} -09/20/2021 14:38:25 - INFO - __main__ - Step 712: {'lr': 1.1733333333333333e-05, 'samples': 22784, 'steps': 44, 'loss/train': 8.993945121765137} -09/20/2021 14:38:26 - INFO - __main__ - Step 713: {'lr': 1.1733333333333333e-05, 'samples': 22816, 'steps': 44, 'loss/train': 7.716423034667969} -09/20/2021 14:38:26 - INFO - __main__ - Step 714: {'lr': 1.1733333333333333e-05, 'samples': 22848, 'steps': 44, 'loss/train': 8.617433547973633} -09/20/2021 14:38:27 - INFO - __main__ - Step 715: {'lr': 1.1733333333333333e-05, 'samples': 22880, 'steps': 44, 'loss/train': 8.298069953918457} -09/20/2021 14:38:28 - INFO - __main__ - Step 716: {'lr': 1.1733333333333333e-05, 'samples': 22912, 'steps': 44, 'loss/train': 7.992016792297363} -09/20/2021 14:38:29 - INFO - __main__ - Step 717: {'lr': 1.1733333333333333e-05, 'samples': 22944, 'steps': 44, 'loss/train': 7.244071960449219} -09/20/2021 14:38:29 - INFO - __main__ - Step 718: {'lr': 1.1733333333333333e-05, 'samples': 22976, 'steps': 44, 'loss/train': 8.26088809967041} -09/20/2021 14:38:30 - INFO - __main__ - Step 719: {'lr': 1.1733333333333333e-05, 'samples': 23008, 'steps': 44, 'loss/train': 7.4592132568359375} -09/20/2021 14:38:31 - INFO - __main__ - Step 720: {'lr': 1.1733333333333333e-05, 'samples': 23040, 'steps': 44, 'loss/train': 7.924009323120117} -09/20/2021 14:38:32 - INFO - __main__ - Step 721: {'lr': 1.2e-05, 'samples': 23072, 'steps': 45, 'loss/train': 6.720010280609131} -09/20/2021 14:38:33 - INFO - __main__ - Step 722: {'lr': 1.2e-05, 'samples': 23104, 'steps': 45, 'loss/train': 8.626730918884277} -09/20/2021 14:38:34 - INFO - __main__ - Step 723: {'lr': 1.2e-05, 'samples': 23136, 'steps': 45, 'loss/train': 8.314199447631836} -09/20/2021 14:38:34 - INFO - __main__ - Step 724: {'lr': 1.2e-05, 'samples': 23168, 'steps': 45, 'loss/train': 8.005025863647461} -09/20/2021 14:38:35 - INFO - __main__ - Step 725: {'lr': 1.2e-05, 'samples': 23200, 'steps': 45, 'loss/train': 7.3646063804626465} -09/20/2021 14:38:36 - INFO - __main__ - Step 726: {'lr': 1.2e-05, 'samples': 23232, 'steps': 45, 'loss/train': 8.57480239868164} -09/20/2021 14:38:37 - INFO - __main__ - Step 727: {'lr': 1.2e-05, 'samples': 23264, 'steps': 45, 'loss/train': 7.457889556884766} -09/20/2021 14:38:37 - INFO - __main__ - Step 728: {'lr': 1.2e-05, 'samples': 23296, 'steps': 45, 'loss/train': 8.435787200927734} -09/20/2021 14:38:38 - INFO - __main__ - Step 729: {'lr': 1.2e-05, 'samples': 23328, 'steps': 45, 'loss/train': 7.515667915344238} -09/20/2021 14:38:39 - INFO - __main__ - Step 730: {'lr': 1.2e-05, 'samples': 23360, 'steps': 45, 'loss/train': 7.821084499359131} -09/20/2021 14:38:40 - INFO - __main__ - Step 731: {'lr': 1.2e-05, 'samples': 23392, 'steps': 45, 'loss/train': 7.958479404449463} -09/20/2021 14:38:40 - INFO - __main__ - Step 732: {'lr': 1.2e-05, 'samples': 23424, 'steps': 45, 'loss/train': 8.160594940185547} -09/20/2021 14:38:41 - INFO - __main__ - Step 733: {'lr': 1.2e-05, 'samples': 23456, 'steps': 45, 'loss/train': 7.75663423538208} -09/20/2021 14:38:42 - INFO - __main__ - Step 734: {'lr': 1.2e-05, 'samples': 23488, 'steps': 45, 'loss/train': 7.929126262664795} -09/20/2021 14:38:43 - INFO - __main__ - Step 735: {'lr': 1.2e-05, 'samples': 23520, 'steps': 45, 'loss/train': 8.036808013916016} -09/20/2021 14:38:43 - INFO - __main__ - Step 736: {'lr': 1.2e-05, 'samples': 23552, 'steps': 45, 'loss/train': 8.28764820098877} -09/20/2021 14:38:44 - INFO - __main__ - Step 737: {'lr': 1.2266666666666667e-05, 'samples': 23584, 'steps': 46, 'loss/train': 7.755274772644043} -09/20/2021 14:38:45 - INFO - __main__ - Step 738: {'lr': 1.2266666666666667e-05, 'samples': 23616, 'steps': 46, 'loss/train': 7.958768844604492} -09/20/2021 14:38:46 - INFO - __main__ - Step 739: {'lr': 1.2266666666666667e-05, 'samples': 23648, 'steps': 46, 'loss/train': 9.253718376159668} -09/20/2021 14:38:47 - INFO - __main__ - Step 740: {'lr': 1.2266666666666667e-05, 'samples': 23680, 'steps': 46, 'loss/train': 7.803175926208496} -09/20/2021 14:38:47 - INFO - __main__ - Step 741: {'lr': 1.2266666666666667e-05, 'samples': 23712, 'steps': 46, 'loss/train': 8.39889144897461} -09/20/2021 14:38:48 - INFO - __main__ - Step 742: {'lr': 1.2266666666666667e-05, 'samples': 23744, 'steps': 46, 'loss/train': 8.244004249572754} -09/20/2021 14:38:49 - INFO - __main__ - Step 743: {'lr': 1.2266666666666667e-05, 'samples': 23776, 'steps': 46, 'loss/train': 7.383885383605957} -09/20/2021 14:38:50 - INFO - __main__ - Step 744: {'lr': 1.2266666666666667e-05, 'samples': 23808, 'steps': 46, 'loss/train': 8.116004943847656} -09/20/2021 14:38:50 - INFO - __main__ - Step 745: {'lr': 1.2266666666666667e-05, 'samples': 23840, 'steps': 46, 'loss/train': 8.198166847229004} -09/20/2021 14:38:51 - INFO - __main__ - Step 746: {'lr': 1.2266666666666667e-05, 'samples': 23872, 'steps': 46, 'loss/train': 7.817671298980713} -09/20/2021 14:38:52 - INFO - __main__ - Step 747: {'lr': 1.2266666666666667e-05, 'samples': 23904, 'steps': 46, 'loss/train': 7.758698463439941} -09/20/2021 14:38:53 - INFO - __main__ - Step 748: {'lr': 1.2266666666666667e-05, 'samples': 23936, 'steps': 46, 'loss/train': 8.135115623474121} -09/20/2021 14:38:53 - INFO - __main__ - Step 749: {'lr': 1.2266666666666667e-05, 'samples': 23968, 'steps': 46, 'loss/train': 7.789400577545166} -09/20/2021 14:38:54 - INFO - __main__ - Step 750: {'lr': 1.2266666666666667e-05, 'samples': 24000, 'steps': 46, 'loss/train': 8.386804580688477} -09/20/2021 14:38:55 - INFO - __main__ - Step 751: {'lr': 1.2266666666666667e-05, 'samples': 24032, 'steps': 46, 'loss/train': 8.182560920715332} -09/20/2021 14:38:56 - INFO - __main__ - Step 752: {'lr': 1.2266666666666667e-05, 'samples': 24064, 'steps': 46, 'loss/train': 7.468614101409912} -09/20/2021 14:38:57 - INFO - __main__ - Step 753: {'lr': 1.2533333333333332e-05, 'samples': 24096, 'steps': 47, 'loss/train': 7.167172431945801} -09/20/2021 14:38:58 - INFO - __main__ - Step 754: {'lr': 1.2533333333333332e-05, 'samples': 24128, 'steps': 47, 'loss/train': 8.316615104675293} -09/20/2021 14:38:59 - INFO - __main__ - Step 755: {'lr': 1.2533333333333332e-05, 'samples': 24160, 'steps': 47, 'loss/train': 7.589546203613281} -09/20/2021 14:38:59 - INFO - __main__ - Step 756: {'lr': 1.2533333333333332e-05, 'samples': 24192, 'steps': 47, 'loss/train': 8.397175788879395} -09/20/2021 14:39:00 - INFO - __main__ - Step 757: {'lr': 1.2533333333333332e-05, 'samples': 24224, 'steps': 47, 'loss/train': 8.142778396606445} -09/20/2021 14:39:01 - INFO - __main__ - Step 758: {'lr': 1.2533333333333332e-05, 'samples': 24256, 'steps': 47, 'loss/train': 7.709090709686279} -09/20/2021 14:39:02 - INFO - __main__ - Step 759: {'lr': 1.2533333333333332e-05, 'samples': 24288, 'steps': 47, 'loss/train': 8.256985664367676} -09/20/2021 14:39:02 - INFO - __main__ - Step 760: {'lr': 1.2533333333333332e-05, 'samples': 24320, 'steps': 47, 'loss/train': 8.00131893157959} -09/20/2021 14:39:03 - INFO - __main__ - Step 761: {'lr': 1.2533333333333332e-05, 'samples': 24352, 'steps': 47, 'loss/train': 7.774507522583008} -09/20/2021 14:39:04 - INFO - __main__ - Step 762: {'lr': 1.2533333333333332e-05, 'samples': 24384, 'steps': 47, 'loss/train': 8.819207191467285} -09/20/2021 14:39:05 - INFO - __main__ - Step 763: {'lr': 1.2533333333333332e-05, 'samples': 24416, 'steps': 47, 'loss/train': 8.106202125549316} -09/20/2021 14:39:05 - INFO - __main__ - Step 764: {'lr': 1.2533333333333332e-05, 'samples': 24448, 'steps': 47, 'loss/train': 7.593352794647217} -09/20/2021 14:39:06 - INFO - __main__ - Step 765: {'lr': 1.2533333333333332e-05, 'samples': 24480, 'steps': 47, 'loss/train': 7.707650661468506} -09/20/2021 14:39:07 - INFO - __main__ - Step 766: {'lr': 1.2533333333333332e-05, 'samples': 24512, 'steps': 47, 'loss/train': 8.09741497039795} -09/20/2021 14:39:08 - INFO - __main__ - Step 767: {'lr': 1.2533333333333332e-05, 'samples': 24544, 'steps': 47, 'loss/train': 8.07087230682373} -09/20/2021 14:39:08 - INFO - __main__ - Step 768: {'lr': 1.2533333333333332e-05, 'samples': 24576, 'steps': 47, 'loss/train': 8.370221138000488} -09/20/2021 14:39:09 - INFO - __main__ - Step 769: {'lr': 1.2800000000000001e-05, 'samples': 24608, 'steps': 48, 'loss/train': 7.81860876083374} -09/20/2021 14:39:10 - INFO - __main__ - Step 770: {'lr': 1.2800000000000001e-05, 'samples': 24640, 'steps': 48, 'loss/train': 6.695842266082764} -09/20/2021 14:39:11 - INFO - __main__ - Step 771: {'lr': 1.2800000000000001e-05, 'samples': 24672, 'steps': 48, 'loss/train': 7.698928356170654} -09/20/2021 14:39:11 - INFO - __main__ - Step 772: {'lr': 1.2800000000000001e-05, 'samples': 24704, 'steps': 48, 'loss/train': 8.941821098327637} -09/20/2021 14:39:12 - INFO - __main__ - Step 773: {'lr': 1.2800000000000001e-05, 'samples': 24736, 'steps': 48, 'loss/train': 8.222102165222168} -09/20/2021 14:39:13 - INFO - __main__ - Step 774: {'lr': 1.2800000000000001e-05, 'samples': 24768, 'steps': 48, 'loss/train': 8.197006225585938} -09/20/2021 14:39:14 - INFO - __main__ - Step 775: {'lr': 1.2800000000000001e-05, 'samples': 24800, 'steps': 48, 'loss/train': 7.157008647918701} -09/20/2021 14:39:14 - INFO - __main__ - Step 776: {'lr': 1.2800000000000001e-05, 'samples': 24832, 'steps': 48, 'loss/train': 6.78796911239624} -09/20/2021 14:39:15 - INFO - __main__ - Step 777: {'lr': 1.2800000000000001e-05, 'samples': 24864, 'steps': 48, 'loss/train': 7.591231346130371} -09/20/2021 14:39:16 - INFO - __main__ - Step 778: {'lr': 1.2800000000000001e-05, 'samples': 24896, 'steps': 48, 'loss/train': 7.965935707092285} -09/20/2021 14:39:17 - INFO - __main__ - Step 779: {'lr': 1.2800000000000001e-05, 'samples': 24928, 'steps': 48, 'loss/train': 8.339872360229492} -09/20/2021 14:39:17 - INFO - __main__ - Step 780: {'lr': 1.2800000000000001e-05, 'samples': 24960, 'steps': 48, 'loss/train': 7.824363708496094} -09/20/2021 14:39:18 - INFO - __main__ - Step 781: {'lr': 1.2800000000000001e-05, 'samples': 24992, 'steps': 48, 'loss/train': 8.040072441101074} -09/20/2021 14:39:19 - INFO - __main__ - Step 782: {'lr': 1.2800000000000001e-05, 'samples': 25024, 'steps': 48, 'loss/train': 7.777928829193115} -09/20/2021 14:39:20 - INFO - __main__ - Step 783: {'lr': 1.2800000000000001e-05, 'samples': 25056, 'steps': 48, 'loss/train': 7.626590728759766} -09/20/2021 14:39:21 - INFO - __main__ - Step 784: {'lr': 1.2800000000000001e-05, 'samples': 25088, 'steps': 48, 'loss/train': 7.850025177001953} -09/20/2021 14:39:22 - INFO - __main__ - Step 785: {'lr': 1.3066666666666666e-05, 'samples': 25120, 'steps': 49, 'loss/train': 7.811474323272705} -09/20/2021 14:39:23 - INFO - __main__ - Step 786: {'lr': 1.3066666666666666e-05, 'samples': 25152, 'steps': 49, 'loss/train': 8.292600631713867} -09/20/2021 14:39:24 - INFO - __main__ - Step 787: {'lr': 1.3066666666666666e-05, 'samples': 25184, 'steps': 49, 'loss/train': 7.539063453674316} -09/20/2021 14:39:25 - INFO - __main__ - Step 788: {'lr': 1.3066666666666666e-05, 'samples': 25216, 'steps': 49, 'loss/train': 8.544281959533691} -09/20/2021 14:39:25 - INFO - __main__ - Step 789: {'lr': 1.3066666666666666e-05, 'samples': 25248, 'steps': 49, 'loss/train': 7.726984977722168} -09/20/2021 14:39:26 - INFO - __main__ - Step 790: {'lr': 1.3066666666666666e-05, 'samples': 25280, 'steps': 49, 'loss/train': 8.024653434753418} -09/20/2021 14:39:27 - INFO - __main__ - Step 791: {'lr': 1.3066666666666666e-05, 'samples': 25312, 'steps': 49, 'loss/train': 7.851199150085449} -09/20/2021 14:39:28 - INFO - __main__ - Step 792: {'lr': 1.3066666666666666e-05, 'samples': 25344, 'steps': 49, 'loss/train': 7.817882061004639} -09/20/2021 14:39:28 - INFO - __main__ - Step 793: {'lr': 1.3066666666666666e-05, 'samples': 25376, 'steps': 49, 'loss/train': 7.598984241485596} -09/20/2021 14:39:29 - INFO - __main__ - Step 794: {'lr': 1.3066666666666666e-05, 'samples': 25408, 'steps': 49, 'loss/train': 7.683237552642822} -09/20/2021 14:39:30 - INFO - __main__ - Step 795: {'lr': 1.3066666666666666e-05, 'samples': 25440, 'steps': 49, 'loss/train': 7.966630935668945} -09/20/2021 14:39:31 - INFO - __main__ - Step 796: {'lr': 1.3066666666666666e-05, 'samples': 25472, 'steps': 49, 'loss/train': 7.622010707855225} -09/20/2021 14:39:31 - INFO - __main__ - Step 797: {'lr': 1.3066666666666666e-05, 'samples': 25504, 'steps': 49, 'loss/train': 8.138557434082031} -09/20/2021 14:39:32 - INFO - __main__ - Step 798: {'lr': 1.3066666666666666e-05, 'samples': 25536, 'steps': 49, 'loss/train': 7.777377605438232} -09/20/2021 14:39:33 - INFO - __main__ - Step 799: {'lr': 1.3066666666666666e-05, 'samples': 25568, 'steps': 49, 'loss/train': 7.843005180358887} -09/20/2021 14:39:34 - INFO - __main__ - Step 800: {'lr': 1.3066666666666666e-05, 'samples': 25600, 'steps': 49, 'loss/train': 7.997946739196777} -09/20/2021 14:39:34 - INFO - __main__ - Step 801: {'lr': 1.3333333333333333e-05, 'samples': 25632, 'steps': 50, 'loss/train': 6.705613136291504} -09/20/2021 14:39:35 - INFO - __main__ - Step 802: {'lr': 1.3333333333333333e-05, 'samples': 25664, 'steps': 50, 'loss/train': 7.748145580291748} -09/20/2021 14:39:36 - INFO - __main__ - Step 803: {'lr': 1.3333333333333333e-05, 'samples': 25696, 'steps': 50, 'loss/train': 7.003438472747803} -09/20/2021 14:39:37 - INFO - __main__ - Step 804: {'lr': 1.3333333333333333e-05, 'samples': 25728, 'steps': 50, 'loss/train': 7.144864559173584} -09/20/2021 14:39:37 - INFO - __main__ - Step 805: {'lr': 1.3333333333333333e-05, 'samples': 25760, 'steps': 50, 'loss/train': 7.902780532836914} -09/20/2021 14:39:38 - INFO - __main__ - Step 806: {'lr': 1.3333333333333333e-05, 'samples': 25792, 'steps': 50, 'loss/train': 7.1761698722839355} -09/20/2021 14:39:39 - INFO - __main__ - Step 807: {'lr': 1.3333333333333333e-05, 'samples': 25824, 'steps': 50, 'loss/train': 7.663121700286865} -09/20/2021 14:39:40 - INFO - __main__ - Step 808: {'lr': 1.3333333333333333e-05, 'samples': 25856, 'steps': 50, 'loss/train': 7.563716888427734} -09/20/2021 14:39:40 - INFO - __main__ - Step 809: {'lr': 1.3333333333333333e-05, 'samples': 25888, 'steps': 50, 'loss/train': 7.705782413482666} -09/20/2021 14:39:41 - INFO - __main__ - Step 810: {'lr': 1.3333333333333333e-05, 'samples': 25920, 'steps': 50, 'loss/train': 7.583509922027588} -09/20/2021 14:39:42 - INFO - __main__ - Step 811: {'lr': 1.3333333333333333e-05, 'samples': 25952, 'steps': 50, 'loss/train': 7.606130599975586} -09/20/2021 14:39:43 - INFO - __main__ - Step 812: {'lr': 1.3333333333333333e-05, 'samples': 25984, 'steps': 50, 'loss/train': 7.970274925231934} -09/20/2021 14:39:43 - INFO - __main__ - Step 813: {'lr': 1.3333333333333333e-05, 'samples': 26016, 'steps': 50, 'loss/train': 7.776764392852783} -09/20/2021 14:39:44 - INFO - __main__ - Step 814: {'lr': 1.3333333333333333e-05, 'samples': 26048, 'steps': 50, 'loss/train': 7.275513648986816} -09/20/2021 14:39:46 - INFO - __main__ - Step 815: {'lr': 1.3333333333333333e-05, 'samples': 26080, 'steps': 50, 'loss/train': 7.104046821594238} -09/20/2021 14:39:46 - INFO - __main__ - Step 816: {'lr': 1.3333333333333333e-05, 'samples': 26112, 'steps': 50, 'loss/train': 7.447851657867432} -09/20/2021 14:39:47 - INFO - __main__ - Step 817: {'lr': 1.3600000000000002e-05, 'samples': 26144, 'steps': 51, 'loss/train': 7.486320495605469} -09/20/2021 14:39:48 - INFO - __main__ - Step 818: {'lr': 1.3600000000000002e-05, 'samples': 26176, 'steps': 51, 'loss/train': 7.45909309387207} -09/20/2021 14:39:49 - INFO - __main__ - Step 819: {'lr': 1.3600000000000002e-05, 'samples': 26208, 'steps': 51, 'loss/train': 7.801959991455078} -09/20/2021 14:39:49 - INFO - __main__ - Step 820: {'lr': 1.3600000000000002e-05, 'samples': 26240, 'steps': 51, 'loss/train': 7.366998672485352} -09/20/2021 14:39:50 - INFO - __main__ - Step 821: {'lr': 1.3600000000000002e-05, 'samples': 26272, 'steps': 51, 'loss/train': 7.582128524780273} -09/20/2021 14:39:51 - INFO - __main__ - Step 822: {'lr': 1.3600000000000002e-05, 'samples': 26304, 'steps': 51, 'loss/train': 7.255825042724609} -09/20/2021 14:39:52 - INFO - __main__ - Step 823: {'lr': 1.3600000000000002e-05, 'samples': 26336, 'steps': 51, 'loss/train': 7.798686504364014} -09/20/2021 14:39:52 - INFO - __main__ - Step 824: {'lr': 1.3600000000000002e-05, 'samples': 26368, 'steps': 51, 'loss/train': 7.860123634338379} -09/20/2021 14:39:53 - INFO - __main__ - Step 825: {'lr': 1.3600000000000002e-05, 'samples': 26400, 'steps': 51, 'loss/train': 6.85889196395874} -09/20/2021 14:39:54 - INFO - __main__ - Step 826: {'lr': 1.3600000000000002e-05, 'samples': 26432, 'steps': 51, 'loss/train': 8.182025909423828} -09/20/2021 14:39:55 - INFO - __main__ - Step 827: {'lr': 1.3600000000000002e-05, 'samples': 26464, 'steps': 51, 'loss/train': 8.348967552185059} -09/20/2021 14:39:55 - INFO - __main__ - Step 828: {'lr': 1.3600000000000002e-05, 'samples': 26496, 'steps': 51, 'loss/train': 7.553858280181885} -09/20/2021 14:39:56 - INFO - __main__ - Step 829: {'lr': 1.3600000000000002e-05, 'samples': 26528, 'steps': 51, 'loss/train': 7.84460973739624} -09/20/2021 14:39:57 - INFO - __main__ - Step 830: {'lr': 1.3600000000000002e-05, 'samples': 26560, 'steps': 51, 'loss/train': 8.45875358581543} -09/20/2021 14:39:58 - INFO - __main__ - Step 831: {'lr': 1.3600000000000002e-05, 'samples': 26592, 'steps': 51, 'loss/train': 9.015379905700684} -09/20/2021 14:39:58 - INFO - __main__ - Step 832: {'lr': 1.3600000000000002e-05, 'samples': 26624, 'steps': 51, 'loss/train': 7.321765422821045} -09/20/2021 14:39:59 - INFO - __main__ - Step 833: {'lr': 1.3866666666666667e-05, 'samples': 26656, 'steps': 52, 'loss/train': 6.801315784454346} -09/20/2021 14:40:00 - INFO - __main__ - Step 834: {'lr': 1.3866666666666667e-05, 'samples': 26688, 'steps': 52, 'loss/train': 7.143980979919434} -09/20/2021 14:40:01 - INFO - __main__ - Step 835: {'lr': 1.3866666666666667e-05, 'samples': 26720, 'steps': 52, 'loss/train': 6.903763294219971} -09/20/2021 14:40:02 - INFO - __main__ - Step 836: {'lr': 1.3866666666666667e-05, 'samples': 26752, 'steps': 52, 'loss/train': 7.402519702911377} -09/20/2021 14:40:02 - INFO - __main__ - Step 837: {'lr': 1.3866666666666667e-05, 'samples': 26784, 'steps': 52, 'loss/train': 6.700289726257324} -09/20/2021 14:40:03 - INFO - __main__ - Step 838: {'lr': 1.3866666666666667e-05, 'samples': 26816, 'steps': 52, 'loss/train': 8.015384674072266} -09/20/2021 14:40:04 - INFO - __main__ - Step 839: {'lr': 1.3866666666666667e-05, 'samples': 26848, 'steps': 52, 'loss/train': 8.097879409790039} -09/20/2021 14:40:05 - INFO - __main__ - Step 840: {'lr': 1.3866666666666667e-05, 'samples': 26880, 'steps': 52, 'loss/train': 7.398819446563721} -09/20/2021 14:40:05 - INFO - __main__ - Step 841: {'lr': 1.3866666666666667e-05, 'samples': 26912, 'steps': 52, 'loss/train': 7.815927505493164} -09/20/2021 14:40:06 - INFO - __main__ - Step 842: {'lr': 1.3866666666666667e-05, 'samples': 26944, 'steps': 52, 'loss/train': 8.026200294494629} -09/20/2021 14:40:07 - INFO - __main__ - Step 843: {'lr': 1.3866666666666667e-05, 'samples': 26976, 'steps': 52, 'loss/train': 7.74579381942749} -09/20/2021 14:40:08 - INFO - __main__ - Step 844: {'lr': 1.3866666666666667e-05, 'samples': 27008, 'steps': 52, 'loss/train': 6.99752950668335} -09/20/2021 14:40:08 - INFO - __main__ - Step 845: {'lr': 1.3866666666666667e-05, 'samples': 27040, 'steps': 52, 'loss/train': 8.27677059173584} -09/20/2021 14:40:09 - INFO - __main__ - Step 846: {'lr': 1.3866666666666667e-05, 'samples': 27072, 'steps': 52, 'loss/train': 6.538891792297363} -09/20/2021 14:40:11 - INFO - __main__ - Step 847: {'lr': 1.3866666666666667e-05, 'samples': 27104, 'steps': 52, 'loss/train': 6.936304569244385} -09/20/2021 14:40:12 - INFO - __main__ - Step 848: {'lr': 1.3866666666666667e-05, 'samples': 27136, 'steps': 52, 'loss/train': 6.88667106628418} -09/20/2021 14:40:12 - INFO - __main__ - Step 849: {'lr': 1.4133333333333334e-05, 'samples': 27168, 'steps': 53, 'loss/train': 7.459985256195068} -09/20/2021 14:40:13 - INFO - __main__ - Step 850: {'lr': 1.4133333333333334e-05, 'samples': 27200, 'steps': 53, 'loss/train': 7.593735218048096} -09/20/2021 14:40:14 - INFO - __main__ - Step 851: {'lr': 1.4133333333333334e-05, 'samples': 27232, 'steps': 53, 'loss/train': 6.980226516723633} -09/20/2021 14:40:15 - INFO - __main__ - Step 852: {'lr': 1.4133333333333334e-05, 'samples': 27264, 'steps': 53, 'loss/train': 8.123711585998535} -09/20/2021 14:40:15 - INFO - __main__ - Step 853: {'lr': 1.4133333333333334e-05, 'samples': 27296, 'steps': 53, 'loss/train': 7.967436790466309} -09/20/2021 14:40:16 - INFO - __main__ - Step 854: {'lr': 1.4133333333333334e-05, 'samples': 27328, 'steps': 53, 'loss/train': 8.346632957458496} -09/20/2021 14:40:17 - INFO - __main__ - Step 855: {'lr': 1.4133333333333334e-05, 'samples': 27360, 'steps': 53, 'loss/train': 6.68599271774292} -09/20/2021 14:40:18 - INFO - __main__ - Step 856: {'lr': 1.4133333333333334e-05, 'samples': 27392, 'steps': 53, 'loss/train': 7.7949652671813965} -09/20/2021 14:40:18 - INFO - __main__ - Step 857: {'lr': 1.4133333333333334e-05, 'samples': 27424, 'steps': 53, 'loss/train': 6.644408226013184} -09/20/2021 14:40:19 - INFO - __main__ - Step 858: {'lr': 1.4133333333333334e-05, 'samples': 27456, 'steps': 53, 'loss/train': 9.378437995910645} -09/20/2021 14:40:20 - INFO - __main__ - Step 859: {'lr': 1.4133333333333334e-05, 'samples': 27488, 'steps': 53, 'loss/train': 9.498302459716797} -09/20/2021 14:40:21 - INFO - __main__ - Step 860: {'lr': 1.4133333333333334e-05, 'samples': 27520, 'steps': 53, 'loss/train': 9.60245132446289} -09/20/2021 14:40:21 - INFO - __main__ - Step 861: {'lr': 1.4133333333333334e-05, 'samples': 27552, 'steps': 53, 'loss/train': 7.7172698974609375} -09/20/2021 14:40:22 - INFO - __main__ - Step 862: {'lr': 1.4133333333333334e-05, 'samples': 27584, 'steps': 53, 'loss/train': 7.876803398132324} -09/20/2021 14:40:23 - INFO - __main__ - Step 863: {'lr': 1.4133333333333334e-05, 'samples': 27616, 'steps': 53, 'loss/train': 8.526573181152344} -09/20/2021 14:40:24 - INFO - __main__ - Step 864: {'lr': 1.4133333333333334e-05, 'samples': 27648, 'steps': 53, 'loss/train': 8.497669219970703} -09/20/2021 14:40:25 - INFO - __main__ - Step 865: {'lr': 1.44e-05, 'samples': 27680, 'steps': 54, 'loss/train': 7.008090019226074} -09/20/2021 14:40:25 - INFO - __main__ - Step 866: {'lr': 1.44e-05, 'samples': 27712, 'steps': 54, 'loss/train': 7.258153438568115} -09/20/2021 14:40:26 - INFO - __main__ - Step 867: {'lr': 1.44e-05, 'samples': 27744, 'steps': 54, 'loss/train': 7.115903854370117} -09/20/2021 14:40:27 - INFO - __main__ - Step 868: {'lr': 1.44e-05, 'samples': 27776, 'steps': 54, 'loss/train': 8.25905704498291} -09/20/2021 14:40:28 - INFO - __main__ - Step 869: {'lr': 1.44e-05, 'samples': 27808, 'steps': 54, 'loss/train': 8.271703720092773} -09/20/2021 14:40:28 - INFO - __main__ - Step 870: {'lr': 1.44e-05, 'samples': 27840, 'steps': 54, 'loss/train': 7.702834606170654} -09/20/2021 14:40:29 - INFO - __main__ - Step 871: {'lr': 1.44e-05, 'samples': 27872, 'steps': 54, 'loss/train': 6.9401140213012695} -09/20/2021 14:40:30 - INFO - __main__ - Step 872: {'lr': 1.44e-05, 'samples': 27904, 'steps': 54, 'loss/train': 7.100647926330566} -09/20/2021 14:40:31 - INFO - __main__ - Step 873: {'lr': 1.44e-05, 'samples': 27936, 'steps': 54, 'loss/train': 7.890451908111572} -09/20/2021 14:40:31 - INFO - __main__ - Step 874: {'lr': 1.44e-05, 'samples': 27968, 'steps': 54, 'loss/train': 7.631584167480469} -09/20/2021 14:40:32 - INFO - __main__ - Step 875: {'lr': 1.44e-05, 'samples': 28000, 'steps': 54, 'loss/train': 7.837517738342285} -09/20/2021 14:40:33 - INFO - __main__ - Step 876: {'lr': 1.44e-05, 'samples': 28032, 'steps': 54, 'loss/train': 7.648595809936523} -09/20/2021 14:40:35 - INFO - __main__ - Step 877: {'lr': 1.44e-05, 'samples': 28064, 'steps': 54, 'loss/train': 8.723176002502441} -09/20/2021 14:40:36 - INFO - __main__ - Step 878: {'lr': 1.44e-05, 'samples': 28096, 'steps': 54, 'loss/train': 7.453305721282959} -09/20/2021 14:40:36 - INFO - __main__ - Step 879: {'lr': 1.44e-05, 'samples': 28128, 'steps': 54, 'loss/train': 7.9763031005859375} -09/20/2021 14:40:37 - INFO - __main__ - Step 880: {'lr': 1.44e-05, 'samples': 28160, 'steps': 54, 'loss/train': 7.057381629943848} -09/20/2021 14:40:38 - INFO - __main__ - Step 881: {'lr': 1.4666666666666668e-05, 'samples': 28192, 'steps': 55, 'loss/train': 7.354104518890381} -09/20/2021 14:40:39 - INFO - __main__ - Step 882: {'lr': 1.4666666666666668e-05, 'samples': 28224, 'steps': 55, 'loss/train': 7.059449195861816} -09/20/2021 14:40:40 - INFO - __main__ - Step 883: {'lr': 1.4666666666666668e-05, 'samples': 28256, 'steps': 55, 'loss/train': 7.4566850662231445} -09/20/2021 14:40:40 - INFO - __main__ - Step 884: {'lr': 1.4666666666666668e-05, 'samples': 28288, 'steps': 55, 'loss/train': 8.112844467163086} -09/20/2021 14:40:41 - INFO - __main__ - Step 885: {'lr': 1.4666666666666668e-05, 'samples': 28320, 'steps': 55, 'loss/train': 8.661636352539062} -09/20/2021 14:40:42 - INFO - __main__ - Step 886: {'lr': 1.4666666666666668e-05, 'samples': 28352, 'steps': 55, 'loss/train': 7.981234073638916} -09/20/2021 14:40:43 - INFO - __main__ - Step 887: {'lr': 1.4666666666666668e-05, 'samples': 28384, 'steps': 55, 'loss/train': 7.4876389503479} -09/20/2021 14:40:43 - INFO - __main__ - Step 888: {'lr': 1.4666666666666668e-05, 'samples': 28416, 'steps': 55, 'loss/train': 7.504430770874023} -09/20/2021 14:40:44 - INFO - __main__ - Step 889: {'lr': 1.4666666666666668e-05, 'samples': 28448, 'steps': 55, 'loss/train': 7.532563209533691} -09/20/2021 14:40:45 - INFO - __main__ - Step 890: {'lr': 1.4666666666666668e-05, 'samples': 28480, 'steps': 55, 'loss/train': 7.763226509094238} -09/20/2021 14:40:46 - INFO - __main__ - Step 891: {'lr': 1.4666666666666668e-05, 'samples': 28512, 'steps': 55, 'loss/train': 7.7389750480651855} -09/20/2021 14:40:46 - INFO - __main__ - Step 892: {'lr': 1.4666666666666668e-05, 'samples': 28544, 'steps': 55, 'loss/train': 7.4203009605407715} -09/20/2021 14:40:47 - INFO - __main__ - Step 893: {'lr': 1.4666666666666668e-05, 'samples': 28576, 'steps': 55, 'loss/train': 7.8625078201293945} -09/20/2021 14:40:48 - INFO - __main__ - Step 894: {'lr': 1.4666666666666668e-05, 'samples': 28608, 'steps': 55, 'loss/train': 8.605887413024902} -09/20/2021 14:40:49 - INFO - __main__ - Step 895: {'lr': 1.4666666666666668e-05, 'samples': 28640, 'steps': 55, 'loss/train': 9.857234954833984} -09/20/2021 14:40:49 - INFO - __main__ - Step 896: {'lr': 1.4666666666666668e-05, 'samples': 28672, 'steps': 55, 'loss/train': 9.881699562072754} -09/20/2021 14:40:50 - INFO - __main__ - Step 897: {'lr': 1.4933333333333335e-05, 'samples': 28704, 'steps': 56, 'loss/train': 9.644062042236328} -09/20/2021 14:40:51 - INFO - __main__ - Step 898: {'lr': 1.4933333333333335e-05, 'samples': 28736, 'steps': 56, 'loss/train': 9.719661712646484} -09/20/2021 14:40:52 - INFO - __main__ - Step 899: {'lr': 1.4933333333333335e-05, 'samples': 28768, 'steps': 56, 'loss/train': 9.670365333557129} -09/20/2021 14:40:52 - INFO - __main__ - Step 900: {'lr': 1.4933333333333335e-05, 'samples': 28800, 'steps': 56, 'loss/train': 6.908196449279785} -09/20/2021 14:40:53 - INFO - __main__ - Step 901: {'lr': 1.4933333333333335e-05, 'samples': 28832, 'steps': 56, 'loss/train': 7.738470554351807} -09/20/2021 14:40:54 - INFO - __main__ - Step 902: {'lr': 1.4933333333333335e-05, 'samples': 28864, 'steps': 56, 'loss/train': 7.6293792724609375} -09/20/2021 14:40:55 - INFO - __main__ - Step 903: {'lr': 1.4933333333333335e-05, 'samples': 28896, 'steps': 56, 'loss/train': 7.661438465118408} -09/20/2021 14:40:55 - INFO - __main__ - Step 904: {'lr': 1.4933333333333335e-05, 'samples': 28928, 'steps': 56, 'loss/train': 6.856693744659424} -09/20/2021 14:40:56 - INFO - __main__ - Step 905: {'lr': 1.4933333333333335e-05, 'samples': 28960, 'steps': 56, 'loss/train': 7.925997734069824} -09/20/2021 14:40:57 - INFO - __main__ - Step 906: {'lr': 1.4933333333333335e-05, 'samples': 28992, 'steps': 56, 'loss/train': 7.2550048828125} -09/20/2021 14:40:58 - INFO - __main__ - Step 907: {'lr': 1.4933333333333335e-05, 'samples': 29024, 'steps': 56, 'loss/train': 7.320627689361572} -09/20/2021 14:40:58 - INFO - __main__ - Step 908: {'lr': 1.4933333333333335e-05, 'samples': 29056, 'steps': 56, 'loss/train': 7.3221435546875} -09/20/2021 14:40:59 - INFO - __main__ - Step 909: {'lr': 1.4933333333333335e-05, 'samples': 29088, 'steps': 56, 'loss/train': 7.485440254211426} -09/20/2021 14:41:00 - INFO - __main__ - Step 910: {'lr': 1.4933333333333335e-05, 'samples': 29120, 'steps': 56, 'loss/train': 7.969925403594971} -09/20/2021 14:41:01 - INFO - __main__ - Step 911: {'lr': 1.4933333333333335e-05, 'samples': 29152, 'steps': 56, 'loss/train': 8.301508903503418} -09/20/2021 14:41:01 - INFO - __main__ - Step 912: {'lr': 1.4933333333333335e-05, 'samples': 29184, 'steps': 56, 'loss/train': 7.165955543518066} -09/20/2021 14:41:02 - INFO - __main__ - Step 913: {'lr': 1.52e-05, 'samples': 29216, 'steps': 57, 'loss/train': 7.908268451690674} -09/20/2021 14:41:03 - INFO - __main__ - Step 914: {'lr': 1.52e-05, 'samples': 29248, 'steps': 57, 'loss/train': 8.492167472839355} -09/20/2021 14:41:04 - INFO - __main__ - Step 915: {'lr': 1.52e-05, 'samples': 29280, 'steps': 57, 'loss/train': 7.855161666870117} -09/20/2021 14:41:05 - INFO - __main__ - Step 916: {'lr': 1.52e-05, 'samples': 29312, 'steps': 57, 'loss/train': 7.901766300201416} -09/20/2021 14:41:06 - INFO - __main__ - Step 917: {'lr': 1.52e-05, 'samples': 29344, 'steps': 57, 'loss/train': 8.381318092346191} -09/20/2021 14:41:07 - INFO - __main__ - Step 918: {'lr': 1.52e-05, 'samples': 29376, 'steps': 57, 'loss/train': 9.4214506149292} -09/20/2021 14:41:08 - INFO - __main__ - Step 919: {'lr': 1.52e-05, 'samples': 29408, 'steps': 57, 'loss/train': 8.135162353515625} -09/20/2021 14:41:08 - INFO - __main__ - Step 920: {'lr': 1.52e-05, 'samples': 29440, 'steps': 57, 'loss/train': 9.656207084655762} -09/20/2021 14:41:09 - INFO - __main__ - Step 921: {'lr': 1.52e-05, 'samples': 29472, 'steps': 57, 'loss/train': 7.46548318862915} -09/20/2021 14:41:10 - INFO - __main__ - Step 922: {'lr': 1.52e-05, 'samples': 29504, 'steps': 57, 'loss/train': 7.369948387145996} -09/20/2021 14:41:11 - INFO - __main__ - Step 923: {'lr': 1.52e-05, 'samples': 29536, 'steps': 57, 'loss/train': 6.860026836395264} -09/20/2021 14:41:11 - INFO - __main__ - Step 924: {'lr': 1.52e-05, 'samples': 29568, 'steps': 57, 'loss/train': 6.896186351776123} -09/20/2021 14:41:12 - INFO - __main__ - Step 925: {'lr': 1.52e-05, 'samples': 29600, 'steps': 57, 'loss/train': 6.962033271789551} -09/20/2021 14:41:13 - INFO - __main__ - Step 926: {'lr': 1.52e-05, 'samples': 29632, 'steps': 57, 'loss/train': 6.894598960876465} -09/20/2021 14:41:14 - INFO - __main__ - Step 927: {'lr': 1.52e-05, 'samples': 29664, 'steps': 57, 'loss/train': 7.656611919403076} -09/20/2021 14:41:14 - INFO - __main__ - Step 928: {'lr': 1.52e-05, 'samples': 29696, 'steps': 57, 'loss/train': 7.575782299041748} -09/20/2021 14:41:15 - INFO - __main__ - Step 929: {'lr': 1.546666666666667e-05, 'samples': 29728, 'steps': 58, 'loss/train': 8.021947860717773} -09/20/2021 14:41:16 - INFO - __main__ - Step 930: {'lr': 1.546666666666667e-05, 'samples': 29760, 'steps': 58, 'loss/train': 6.9510178565979} -09/20/2021 14:41:17 - INFO - __main__ - Step 931: {'lr': 1.546666666666667e-05, 'samples': 29792, 'steps': 58, 'loss/train': 7.898918628692627} -09/20/2021 14:41:17 - INFO - __main__ - Step 932: {'lr': 1.546666666666667e-05, 'samples': 29824, 'steps': 58, 'loss/train': 7.3956475257873535} -09/20/2021 14:41:18 - INFO - __main__ - Step 933: {'lr': 1.546666666666667e-05, 'samples': 29856, 'steps': 58, 'loss/train': 6.868228435516357} -09/20/2021 14:41:19 - INFO - __main__ - Step 934: {'lr': 1.546666666666667e-05, 'samples': 29888, 'steps': 58, 'loss/train': 7.367581844329834} -09/20/2021 14:41:20 - INFO - __main__ - Step 935: {'lr': 1.546666666666667e-05, 'samples': 29920, 'steps': 58, 'loss/train': 7.964627265930176} -09/20/2021 14:41:20 - INFO - __main__ - Step 936: {'lr': 1.546666666666667e-05, 'samples': 29952, 'steps': 58, 'loss/train': 7.766822814941406} -09/20/2021 14:41:21 - INFO - __main__ - Step 937: {'lr': 1.546666666666667e-05, 'samples': 29984, 'steps': 58, 'loss/train': 8.057583808898926} -09/20/2021 14:41:22 - INFO - __main__ - Step 938: {'lr': 1.546666666666667e-05, 'samples': 30016, 'steps': 58, 'loss/train': 7.176663398742676} -09/20/2021 14:41:23 - INFO - __main__ - Step 939: {'lr': 1.546666666666667e-05, 'samples': 30048, 'steps': 58, 'loss/train': 6.62006950378418} -09/20/2021 14:41:23 - INFO - __main__ - Step 940: {'lr': 1.546666666666667e-05, 'samples': 30080, 'steps': 58, 'loss/train': 7.25228214263916} -09/20/2021 14:41:24 - INFO - __main__ - Step 941: {'lr': 1.546666666666667e-05, 'samples': 30112, 'steps': 58, 'loss/train': 6.826840877532959} -09/20/2021 14:41:25 - INFO - __main__ - Step 942: {'lr': 1.546666666666667e-05, 'samples': 30144, 'steps': 58, 'loss/train': 8.120732307434082} -09/20/2021 14:41:26 - INFO - __main__ - Step 943: {'lr': 1.546666666666667e-05, 'samples': 30176, 'steps': 58, 'loss/train': 7.737004280090332} -09/20/2021 14:41:26 - INFO - __main__ - Step 944: {'lr': 1.546666666666667e-05, 'samples': 30208, 'steps': 58, 'loss/train': 7.333699703216553} -09/20/2021 14:41:27 - INFO - __main__ - Step 945: {'lr': 1.5733333333333334e-05, 'samples': 30240, 'steps': 59, 'loss/train': 7.671634674072266} -09/20/2021 14:41:28 - INFO - __main__ - Step 946: {'lr': 1.5733333333333334e-05, 'samples': 30272, 'steps': 59, 'loss/train': 6.658376693725586} -09/20/2021 14:41:29 - INFO - __main__ - Step 947: {'lr': 1.5733333333333334e-05, 'samples': 30304, 'steps': 59, 'loss/train': 10.161062240600586} -09/20/2021 14:41:30 - INFO - __main__ - Step 948: {'lr': 1.5733333333333334e-05, 'samples': 30336, 'steps': 59, 'loss/train': 7.177831649780273} -09/20/2021 14:41:31 - INFO - __main__ - Step 949: {'lr': 1.5733333333333334e-05, 'samples': 30368, 'steps': 59, 'loss/train': 8.581284523010254} -09/20/2021 14:41:32 - INFO - __main__ - Step 950: {'lr': 1.5733333333333334e-05, 'samples': 30400, 'steps': 59, 'loss/train': 7.218408107757568} -09/20/2021 14:41:32 - INFO - __main__ - Step 951: {'lr': 1.5733333333333334e-05, 'samples': 30432, 'steps': 59, 'loss/train': 7.482787609100342} -09/20/2021 14:41:33 - INFO - __main__ - Step 952: {'lr': 1.5733333333333334e-05, 'samples': 30464, 'steps': 59, 'loss/train': 7.496205806732178} -09/20/2021 14:41:34 - INFO - __main__ - Step 953: {'lr': 1.5733333333333334e-05, 'samples': 30496, 'steps': 59, 'loss/train': 7.704283714294434} -09/20/2021 14:41:35 - INFO - __main__ - Step 954: {'lr': 1.5733333333333334e-05, 'samples': 30528, 'steps': 59, 'loss/train': 7.677188873291016} -09/20/2021 14:41:35 - INFO - __main__ - Step 955: {'lr': 1.5733333333333334e-05, 'samples': 30560, 'steps': 59, 'loss/train': 7.7294816970825195} -09/20/2021 14:41:36 - INFO - __main__ - Step 956: {'lr': 1.5733333333333334e-05, 'samples': 30592, 'steps': 59, 'loss/train': 8.14849853515625} -09/20/2021 14:41:37 - INFO - __main__ - Step 957: {'lr': 1.5733333333333334e-05, 'samples': 30624, 'steps': 59, 'loss/train': 7.509145259857178} -09/20/2021 14:41:38 - INFO - __main__ - Step 958: {'lr': 1.5733333333333334e-05, 'samples': 30656, 'steps': 59, 'loss/train': 7.331686496734619} -09/20/2021 14:41:38 - INFO - __main__ - Step 959: {'lr': 1.5733333333333334e-05, 'samples': 30688, 'steps': 59, 'loss/train': 7.856742858886719} -09/20/2021 14:41:39 - INFO - __main__ - Step 960: {'lr': 1.5733333333333334e-05, 'samples': 30720, 'steps': 59, 'loss/train': 7.4157185554504395} -09/20/2021 14:41:40 - INFO - __main__ - Step 961: {'lr': 1.6000000000000003e-05, 'samples': 30752, 'steps': 60, 'loss/train': 7.337884426116943} -09/20/2021 14:41:41 - INFO - __main__ - Step 962: {'lr': 1.6000000000000003e-05, 'samples': 30784, 'steps': 60, 'loss/train': 8.402260780334473} -09/20/2021 14:41:42 - INFO - __main__ - Step 963: {'lr': 1.6000000000000003e-05, 'samples': 30816, 'steps': 60, 'loss/train': 7.441598892211914} -09/20/2021 14:41:42 - INFO - __main__ - Step 964: {'lr': 1.6000000000000003e-05, 'samples': 30848, 'steps': 60, 'loss/train': 7.283440589904785} -09/20/2021 14:41:43 - INFO - __main__ - Step 965: {'lr': 1.6000000000000003e-05, 'samples': 30880, 'steps': 60, 'loss/train': 7.739964008331299} -09/20/2021 14:41:44 - INFO - __main__ - Step 966: {'lr': 1.6000000000000003e-05, 'samples': 30912, 'steps': 60, 'loss/train': 7.368042469024658} -09/20/2021 14:41:45 - INFO - __main__ - Step 967: {'lr': 1.6000000000000003e-05, 'samples': 30944, 'steps': 60, 'loss/train': 1.5296342372894287} -09/20/2021 14:41:45 - INFO - __main__ - Step 968: {'lr': 1.6000000000000003e-05, 'samples': 30976, 'steps': 60, 'loss/train': 8.337325096130371} -09/20/2021 14:41:46 - INFO - __main__ - Step 969: {'lr': 1.6000000000000003e-05, 'samples': 31008, 'steps': 60, 'loss/train': 7.784377098083496} -09/20/2021 14:41:47 - INFO - __main__ - Step 970: {'lr': 1.6000000000000003e-05, 'samples': 31040, 'steps': 60, 'loss/train': 8.204645156860352} -09/20/2021 14:41:48 - INFO - __main__ - Step 971: {'lr': 1.6000000000000003e-05, 'samples': 31072, 'steps': 60, 'loss/train': 7.384739398956299} -09/20/2021 14:41:48 - INFO - __main__ - Step 972: {'lr': 1.6000000000000003e-05, 'samples': 31104, 'steps': 60, 'loss/train': 7.398707866668701} -09/20/2021 14:41:49 - INFO - __main__ - Step 973: {'lr': 1.6000000000000003e-05, 'samples': 31136, 'steps': 60, 'loss/train': 7.0282464027404785} -09/20/2021 14:41:50 - INFO - __main__ - Step 974: {'lr': 1.6000000000000003e-05, 'samples': 31168, 'steps': 60, 'loss/train': 6.4537434577941895} -09/20/2021 14:41:51 - INFO - __main__ - Step 975: {'lr': 1.6000000000000003e-05, 'samples': 31200, 'steps': 60, 'loss/train': 7.1599345207214355} -09/20/2021 14:41:51 - INFO - __main__ - Step 976: {'lr': 1.6000000000000003e-05, 'samples': 31232, 'steps': 60, 'loss/train': 8.796966552734375} -09/20/2021 14:41:52 - INFO - __main__ - Step 977: {'lr': 1.6266666666666665e-05, 'samples': 31264, 'steps': 61, 'loss/train': 7.4510674476623535} -09/20/2021 14:41:53 - INFO - __main__ - Step 978: {'lr': 1.6266666666666665e-05, 'samples': 31296, 'steps': 61, 'loss/train': 7.448990345001221} -09/20/2021 14:41:54 - INFO - __main__ - Step 979: {'lr': 1.6266666666666665e-05, 'samples': 31328, 'steps': 61, 'loss/train': 7.588810920715332} -09/20/2021 14:41:54 - INFO - __main__ - Step 980: {'lr': 1.6266666666666665e-05, 'samples': 31360, 'steps': 61, 'loss/train': 7.119534015655518} -09/20/2021 14:41:55 - INFO - __main__ - Step 981: {'lr': 1.6266666666666665e-05, 'samples': 31392, 'steps': 61, 'loss/train': 5.296873092651367} -09/20/2021 14:41:57 - INFO - __main__ - Step 982: {'lr': 1.6266666666666665e-05, 'samples': 31424, 'steps': 61, 'loss/train': 7.45318603515625} -09/20/2021 14:41:57 - INFO - __main__ - Step 983: {'lr': 1.6266666666666665e-05, 'samples': 31456, 'steps': 61, 'loss/train': 7.160688400268555} -09/20/2021 14:41:58 - INFO - __main__ - Step 984: {'lr': 1.6266666666666665e-05, 'samples': 31488, 'steps': 61, 'loss/train': 7.6530866622924805} -09/20/2021 14:41:59 - INFO - __main__ - Step 985: {'lr': 1.6266666666666665e-05, 'samples': 31520, 'steps': 61, 'loss/train': 8.35054874420166} -09/20/2021 14:41:59 - INFO - __main__ - Step 986: {'lr': 1.6266666666666665e-05, 'samples': 31552, 'steps': 61, 'loss/train': 6.5537824630737305} -09/20/2021 14:42:00 - INFO - __main__ - Step 987: {'lr': 1.6266666666666665e-05, 'samples': 31584, 'steps': 61, 'loss/train': 7.692201614379883} -09/20/2021 14:42:01 - INFO - __main__ - Step 988: {'lr': 1.6266666666666665e-05, 'samples': 31616, 'steps': 61, 'loss/train': 7.990808010101318} -09/20/2021 14:42:02 - INFO - __main__ - Step 989: {'lr': 1.6266666666666665e-05, 'samples': 31648, 'steps': 61, 'loss/train': 7.339212894439697} -09/20/2021 14:42:02 - INFO - __main__ - Step 990: {'lr': 1.6266666666666665e-05, 'samples': 31680, 'steps': 61, 'loss/train': 7.652698040008545} -09/20/2021 14:42:03 - INFO - __main__ - Step 991: {'lr': 1.6266666666666665e-05, 'samples': 31712, 'steps': 61, 'loss/train': 7.988891124725342} -09/20/2021 14:42:04 - INFO - __main__ - Step 992: {'lr': 1.6266666666666665e-05, 'samples': 31744, 'steps': 61, 'loss/train': 7.122201442718506} -09/20/2021 14:42:05 - INFO - __main__ - Step 993: {'lr': 1.6533333333333333e-05, 'samples': 31776, 'steps': 62, 'loss/train': 7.67077112197876} -09/20/2021 14:42:06 - INFO - __main__ - Step 994: {'lr': 1.6533333333333333e-05, 'samples': 31808, 'steps': 62, 'loss/train': 7.339214324951172} -09/20/2021 14:42:06 - INFO - __main__ - Step 995: {'lr': 1.6533333333333333e-05, 'samples': 31840, 'steps': 62, 'loss/train': 7.724555015563965} -09/20/2021 14:42:07 - INFO - __main__ - Step 996: {'lr': 1.6533333333333333e-05, 'samples': 31872, 'steps': 62, 'loss/train': 7.47060489654541} -09/20/2021 14:42:08 - INFO - __main__ - Step 997: {'lr': 1.6533333333333333e-05, 'samples': 31904, 'steps': 62, 'loss/train': 7.871269226074219} -09/20/2021 14:42:09 - INFO - __main__ - Step 998: {'lr': 1.6533333333333333e-05, 'samples': 31936, 'steps': 62, 'loss/train': 7.904464244842529} -09/20/2021 14:42:09 - INFO - __main__ - Step 999: {'lr': 1.6533333333333333e-05, 'samples': 31968, 'steps': 62, 'loss/train': 7.587808132171631} -09/20/2021 14:42:10 - INFO - __main__ - Step 1000: {'lr': 1.6533333333333333e-05, 'samples': 32000, 'steps': 62, 'loss/train': 7.713339805603027} -09/20/2021 14:42:11 - INFO - __main__ - Step 1001: {'lr': 1.6533333333333333e-05, 'samples': 32032, 'steps': 62, 'loss/train': 7.366071701049805} -09/20/2021 14:42:12 - INFO - __main__ - Step 1002: {'lr': 1.6533333333333333e-05, 'samples': 32064, 'steps': 62, 'loss/train': 7.862269401550293} -09/20/2021 14:42:12 - INFO - __main__ - Step 1003: {'lr': 1.6533333333333333e-05, 'samples': 32096, 'steps': 62, 'loss/train': 7.26649808883667} -09/20/2021 14:42:13 - INFO - __main__ - Step 1004: {'lr': 1.6533333333333333e-05, 'samples': 32128, 'steps': 62, 'loss/train': 8.080438613891602} -09/20/2021 14:42:14 - INFO - __main__ - Step 1005: {'lr': 1.6533333333333333e-05, 'samples': 32160, 'steps': 62, 'loss/train': 6.933586120605469} -09/20/2021 14:42:15 - INFO - __main__ - Step 1006: {'lr': 1.6533333333333333e-05, 'samples': 32192, 'steps': 62, 'loss/train': 6.5684051513671875} -09/20/2021 14:42:15 - INFO - __main__ - Step 1007: {'lr': 1.6533333333333333e-05, 'samples': 32224, 'steps': 62, 'loss/train': 9.859872817993164} -09/20/2021 14:42:16 - INFO - __main__ - Step 1008: {'lr': 1.6533333333333333e-05, 'samples': 32256, 'steps': 62, 'loss/train': 7.209011077880859} -09/20/2021 14:42:17 - INFO - __main__ - Step 1009: {'lr': 1.6800000000000002e-05, 'samples': 32288, 'steps': 63, 'loss/train': 7.298811435699463} -09/20/2021 14:42:18 - INFO - __main__ - Step 1010: {'lr': 1.6800000000000002e-05, 'samples': 32320, 'steps': 63, 'loss/train': 7.513772964477539} -09/20/2021 14:42:19 - INFO - __main__ - Step 1011: {'lr': 1.6800000000000002e-05, 'samples': 32352, 'steps': 63, 'loss/train': 7.228566646575928} -09/20/2021 14:42:20 - INFO - __main__ - Step 1012: {'lr': 1.6800000000000002e-05, 'samples': 32384, 'steps': 63, 'loss/train': 7.079514980316162} -09/20/2021 14:42:21 - INFO - __main__ - Step 1013: {'lr': 1.6800000000000002e-05, 'samples': 32416, 'steps': 63, 'loss/train': 7.652944564819336} -09/20/2021 14:42:21 - INFO - __main__ - Step 1014: {'lr': 1.6800000000000002e-05, 'samples': 32448, 'steps': 63, 'loss/train': 7.051092624664307} -09/20/2021 14:42:22 - INFO - __main__ - Step 1015: {'lr': 1.6800000000000002e-05, 'samples': 32480, 'steps': 63, 'loss/train': 6.899384021759033} -09/20/2021 14:42:23 - INFO - __main__ - Step 1016: {'lr': 1.6800000000000002e-05, 'samples': 32512, 'steps': 63, 'loss/train': 9.009860038757324} -09/20/2021 14:42:24 - INFO - __main__ - Step 1017: {'lr': 1.6800000000000002e-05, 'samples': 32544, 'steps': 63, 'loss/train': 8.933029174804688} -09/20/2021 14:42:24 - INFO - __main__ - Step 1018: {'lr': 1.6800000000000002e-05, 'samples': 32576, 'steps': 63, 'loss/train': 9.427841186523438} -09/20/2021 14:42:25 - INFO - __main__ - Step 1019: {'lr': 1.6800000000000002e-05, 'samples': 32608, 'steps': 63, 'loss/train': 7.143239974975586} -09/20/2021 14:42:26 - INFO - __main__ - Step 1020: {'lr': 1.6800000000000002e-05, 'samples': 32640, 'steps': 63, 'loss/train': 6.635833740234375} -09/20/2021 14:42:27 - INFO - __main__ - Step 1021: {'lr': 1.6800000000000002e-05, 'samples': 32672, 'steps': 63, 'loss/train': 7.121298313140869} -09/20/2021 14:42:27 - INFO - __main__ - Step 1022: {'lr': 1.6800000000000002e-05, 'samples': 32704, 'steps': 63, 'loss/train': 7.202362060546875} -09/20/2021 14:42:28 - INFO - __main__ - Step 1023: {'lr': 1.6800000000000002e-05, 'samples': 32736, 'steps': 63, 'loss/train': 8.120393753051758} -09/20/2021 14:42:29 - INFO - __main__ - Step 1024: {'lr': 1.6800000000000002e-05, 'samples': 32768, 'steps': 63, 'loss/train': 7.665238380432129} -09/20/2021 14:42:30 - INFO - __main__ - Step 1025: {'lr': 1.7066666666666667e-05, 'samples': 32800, 'steps': 64, 'loss/train': 7.662180423736572} -09/20/2021 14:42:31 - INFO - __main__ - Step 1026: {'lr': 1.7066666666666667e-05, 'samples': 32832, 'steps': 64, 'loss/train': 7.418685436248779} -09/20/2021 14:42:31 - INFO - __main__ - Step 1027: {'lr': 1.7066666666666667e-05, 'samples': 32864, 'steps': 64, 'loss/train': 6.577938079833984} -09/20/2021 14:42:32 - INFO - __main__ - Step 1028: {'lr': 1.7066666666666667e-05, 'samples': 32896, 'steps': 64, 'loss/train': 8.556751251220703} -09/20/2021 14:42:33 - INFO - __main__ - Step 1029: {'lr': 1.7066666666666667e-05, 'samples': 32928, 'steps': 64, 'loss/train': 7.192653179168701} -09/20/2021 14:42:34 - INFO - __main__ - Step 1030: {'lr': 1.7066666666666667e-05, 'samples': 32960, 'steps': 64, 'loss/train': 7.212543964385986} -09/20/2021 14:42:34 - INFO - __main__ - Step 1031: {'lr': 1.7066666666666667e-05, 'samples': 32992, 'steps': 64, 'loss/train': 7.574189186096191} -09/20/2021 14:42:35 - INFO - __main__ - Step 1032: {'lr': 1.7066666666666667e-05, 'samples': 33024, 'steps': 64, 'loss/train': 7.273203372955322} -09/20/2021 14:42:36 - INFO - __main__ - Step 1033: {'lr': 1.7066666666666667e-05, 'samples': 33056, 'steps': 64, 'loss/train': 7.447497367858887} -09/20/2021 14:42:37 - INFO - __main__ - Step 1034: {'lr': 1.7066666666666667e-05, 'samples': 33088, 'steps': 64, 'loss/train': 6.921879291534424} -09/20/2021 14:42:37 - INFO - __main__ - Step 1035: {'lr': 1.7066666666666667e-05, 'samples': 33120, 'steps': 64, 'loss/train': 6.999035358428955} -09/20/2021 14:42:38 - INFO - __main__ - Step 1036: {'lr': 1.7066666666666667e-05, 'samples': 33152, 'steps': 64, 'loss/train': 7.14263916015625} -09/20/2021 14:42:39 - INFO - __main__ - Step 1037: {'lr': 1.7066666666666667e-05, 'samples': 33184, 'steps': 64, 'loss/train': 7.323070526123047} -09/20/2021 14:42:40 - INFO - __main__ - Step 1038: {'lr': 1.7066666666666667e-05, 'samples': 33216, 'steps': 64, 'loss/train': 7.902733325958252} -09/20/2021 14:42:40 - INFO - __main__ - Step 1039: {'lr': 1.7066666666666667e-05, 'samples': 33248, 'steps': 64, 'loss/train': 6.776241302490234} -09/20/2021 14:42:41 - INFO - __main__ - Step 1040: {'lr': 1.7066666666666667e-05, 'samples': 33280, 'steps': 64, 'loss/train': 7.181065082550049} -09/20/2021 14:42:42 - INFO - __main__ - Step 1041: {'lr': 1.7333333333333336e-05, 'samples': 33312, 'steps': 65, 'loss/train': 6.9239726066589355} -09/20/2021 14:42:43 - INFO - __main__ - Step 1042: {'lr': 1.7333333333333336e-05, 'samples': 33344, 'steps': 65, 'loss/train': 8.270888328552246} -09/20/2021 14:42:43 - INFO - __main__ - Step 1043: {'lr': 1.7333333333333336e-05, 'samples': 33376, 'steps': 65, 'loss/train': 7.500242710113525} -09/20/2021 14:42:44 - INFO - __main__ - Step 1044: {'lr': 1.7333333333333336e-05, 'samples': 33408, 'steps': 65, 'loss/train': 6.443797588348389} -09/20/2021 14:42:46 - INFO - __main__ - Step 1045: {'lr': 1.7333333333333336e-05, 'samples': 33440, 'steps': 65, 'loss/train': 7.632541179656982} -09/20/2021 14:42:46 - INFO - __main__ - Step 1046: {'lr': 1.7333333333333336e-05, 'samples': 33472, 'steps': 65, 'loss/train': 9.510030746459961} -09/20/2021 14:42:47 - INFO - __main__ - Step 1047: {'lr': 1.7333333333333336e-05, 'samples': 33504, 'steps': 65, 'loss/train': 7.049824237823486} -09/20/2021 14:42:48 - INFO - __main__ - Step 1048: {'lr': 1.7333333333333336e-05, 'samples': 33536, 'steps': 65, 'loss/train': 6.526880264282227} -09/20/2021 14:42:49 - INFO - __main__ - Step 1049: {'lr': 1.7333333333333336e-05, 'samples': 33568, 'steps': 65, 'loss/train': 7.445962429046631} -09/20/2021 14:42:49 - INFO - __main__ - Step 1050: {'lr': 1.7333333333333336e-05, 'samples': 33600, 'steps': 65, 'loss/train': 7.321645736694336} -09/20/2021 14:42:50 - INFO - __main__ - Step 1051: {'lr': 1.7333333333333336e-05, 'samples': 33632, 'steps': 65, 'loss/train': 6.8155107498168945} -09/20/2021 14:42:51 - INFO - __main__ - Step 1052: {'lr': 1.7333333333333336e-05, 'samples': 33664, 'steps': 65, 'loss/train': 7.681716442108154} -09/20/2021 14:42:52 - INFO - __main__ - Step 1053: {'lr': 1.7333333333333336e-05, 'samples': 33696, 'steps': 65, 'loss/train': 7.895340442657471} -09/20/2021 14:42:52 - INFO - __main__ - Step 1054: {'lr': 1.7333333333333336e-05, 'samples': 33728, 'steps': 65, 'loss/train': 7.59862756729126} -09/20/2021 14:42:53 - INFO - __main__ - Step 1055: {'lr': 1.7333333333333336e-05, 'samples': 33760, 'steps': 65, 'loss/train': 7.482161521911621} -09/20/2021 14:42:54 - INFO - __main__ - Step 1056: {'lr': 1.7333333333333336e-05, 'samples': 33792, 'steps': 65, 'loss/train': 6.8573150634765625} -09/20/2021 14:42:55 - INFO - __main__ - Step 1057: {'lr': 1.76e-05, 'samples': 33824, 'steps': 66, 'loss/train': 7.005787372589111} -09/20/2021 14:42:55 - INFO - __main__ - Step 1058: {'lr': 1.76e-05, 'samples': 33856, 'steps': 66, 'loss/train': 7.561100006103516} -09/20/2021 14:42:56 - INFO - __main__ - Step 1059: {'lr': 1.76e-05, 'samples': 33888, 'steps': 66, 'loss/train': 7.802297592163086} -09/20/2021 14:42:57 - INFO - __main__ - Step 1060: {'lr': 1.76e-05, 'samples': 33920, 'steps': 66, 'loss/train': 6.895226001739502} -09/20/2021 14:42:58 - INFO - __main__ - Step 1061: {'lr': 1.76e-05, 'samples': 33952, 'steps': 66, 'loss/train': 7.520148277282715} -09/20/2021 14:42:58 - INFO - __main__ - Step 1062: {'lr': 1.76e-05, 'samples': 33984, 'steps': 66, 'loss/train': 6.389556884765625} -09/20/2021 14:42:59 - INFO - __main__ - Step 1063: {'lr': 1.76e-05, 'samples': 34016, 'steps': 66, 'loss/train': 7.920084476470947} -09/20/2021 14:43:00 - INFO - __main__ - Step 1064: {'lr': 1.76e-05, 'samples': 34048, 'steps': 66, 'loss/train': 8.69666862487793} -09/20/2021 14:43:01 - INFO - __main__ - Step 1065: {'lr': 1.76e-05, 'samples': 34080, 'steps': 66, 'loss/train': 8.612204551696777} -09/20/2021 14:43:01 - INFO - __main__ - Step 1066: {'lr': 1.76e-05, 'samples': 34112, 'steps': 66, 'loss/train': 7.111959934234619} -09/20/2021 14:43:02 - INFO - __main__ - Step 1067: {'lr': 1.76e-05, 'samples': 34144, 'steps': 66, 'loss/train': 8.073663711547852} -09/20/2021 14:43:03 - INFO - __main__ - Step 1068: {'lr': 1.76e-05, 'samples': 34176, 'steps': 66, 'loss/train': 7.131277561187744} -09/20/2021 14:43:04 - INFO - __main__ - Step 1069: {'lr': 1.76e-05, 'samples': 34208, 'steps': 66, 'loss/train': 7.809062480926514} -09/20/2021 14:43:04 - INFO - __main__ - Step 1070: {'lr': 1.76e-05, 'samples': 34240, 'steps': 66, 'loss/train': 7.054793357849121} -09/20/2021 14:43:05 - INFO - __main__ - Step 1071: {'lr': 1.76e-05, 'samples': 34272, 'steps': 66, 'loss/train': 7.489339828491211} -09/20/2021 14:43:06 - INFO - __main__ - Step 1072: {'lr': 1.76e-05, 'samples': 34304, 'steps': 66, 'loss/train': 7.412154197692871} -09/20/2021 14:43:07 - INFO - __main__ - Step 1073: {'lr': 1.7866666666666666e-05, 'samples': 34336, 'steps': 67, 'loss/train': 7.294134140014648} -09/20/2021 14:43:08 - INFO - __main__ - Step 1074: {'lr': 1.7866666666666666e-05, 'samples': 34368, 'steps': 67, 'loss/train': 7.8630051612854} -09/20/2021 14:43:08 - INFO - __main__ - Step 1075: {'lr': 1.7866666666666666e-05, 'samples': 34400, 'steps': 67, 'loss/train': 6.755832195281982} -09/20/2021 14:43:09 - INFO - __main__ - Step 1076: {'lr': 1.7866666666666666e-05, 'samples': 34432, 'steps': 67, 'loss/train': 7.579298973083496} -09/20/2021 14:43:10 - INFO - __main__ - Step 1077: {'lr': 1.7866666666666666e-05, 'samples': 34464, 'steps': 67, 'loss/train': 7.996589660644531} -09/20/2021 14:43:11 - INFO - __main__ - Step 1078: {'lr': 1.7866666666666666e-05, 'samples': 34496, 'steps': 67, 'loss/train': 7.07041597366333} -09/20/2021 14:43:12 - INFO - __main__ - Step 1079: {'lr': 1.7866666666666666e-05, 'samples': 34528, 'steps': 67, 'loss/train': 7.550715446472168} -09/20/2021 14:43:13 - INFO - __main__ - Step 1080: {'lr': 1.7866666666666666e-05, 'samples': 34560, 'steps': 67, 'loss/train': 6.659928321838379} -09/20/2021 14:43:13 - INFO - __main__ - Step 1081: {'lr': 1.7866666666666666e-05, 'samples': 34592, 'steps': 67, 'loss/train': 6.8895955085754395} -09/20/2021 14:43:14 - INFO - __main__ - Step 1082: {'lr': 1.7866666666666666e-05, 'samples': 34624, 'steps': 67, 'loss/train': 7.48750638961792} -09/20/2021 14:43:15 - INFO - __main__ - Step 1083: {'lr': 1.7866666666666666e-05, 'samples': 34656, 'steps': 67, 'loss/train': 5.184743881225586} -09/20/2021 14:43:16 - INFO - __main__ - Step 1084: {'lr': 1.7866666666666666e-05, 'samples': 34688, 'steps': 67, 'loss/train': 7.246478080749512} -09/20/2021 14:43:16 - INFO - __main__ - Step 1085: {'lr': 1.7866666666666666e-05, 'samples': 34720, 'steps': 67, 'loss/train': 7.3852620124816895} -09/20/2021 14:43:17 - INFO - __main__ - Step 1086: {'lr': 1.7866666666666666e-05, 'samples': 34752, 'steps': 67, 'loss/train': 6.473173141479492} -09/20/2021 14:43:18 - INFO - __main__ - Step 1087: {'lr': 1.7866666666666666e-05, 'samples': 34784, 'steps': 67, 'loss/train': 6.895011901855469} -09/20/2021 14:43:19 - INFO - __main__ - Step 1088: {'lr': 1.7866666666666666e-05, 'samples': 34816, 'steps': 67, 'loss/train': 8.216290473937988} -09/20/2021 14:43:20 - INFO - __main__ - Step 1089: {'lr': 1.8133333333333335e-05, 'samples': 34848, 'steps': 68, 'loss/train': 6.891305446624756} -09/20/2021 14:43:20 - INFO - __main__ - Step 1090: {'lr': 1.8133333333333335e-05, 'samples': 34880, 'steps': 68, 'loss/train': 7.224772930145264} -09/20/2021 14:43:21 - INFO - __main__ - Step 1091: {'lr': 1.8133333333333335e-05, 'samples': 34912, 'steps': 68, 'loss/train': 7.0554327964782715} -09/20/2021 14:43:22 - INFO - __main__ - Step 1092: {'lr': 1.8133333333333335e-05, 'samples': 34944, 'steps': 68, 'loss/train': 6.763323783874512} -09/20/2021 14:43:23 - INFO - __main__ - Step 1093: {'lr': 1.8133333333333335e-05, 'samples': 34976, 'steps': 68, 'loss/train': 7.959135055541992} -09/20/2021 14:43:23 - INFO - __main__ - Step 1094: {'lr': 1.8133333333333335e-05, 'samples': 35008, 'steps': 68, 'loss/train': 7.482904434204102} -09/20/2021 14:43:24 - INFO - __main__ - Step 1095: {'lr': 1.8133333333333335e-05, 'samples': 35040, 'steps': 68, 'loss/train': 6.4327545166015625} -09/20/2021 14:43:25 - INFO - __main__ - Step 1096: {'lr': 1.8133333333333335e-05, 'samples': 35072, 'steps': 68, 'loss/train': 7.46536922454834} -09/20/2021 14:43:26 - INFO - __main__ - Step 1097: {'lr': 1.8133333333333335e-05, 'samples': 35104, 'steps': 68, 'loss/train': 7.3268303871154785} -09/20/2021 14:43:26 - INFO - __main__ - Step 1098: {'lr': 1.8133333333333335e-05, 'samples': 35136, 'steps': 68, 'loss/train': 7.640202522277832} -09/20/2021 14:43:27 - INFO - __main__ - Step 1099: {'lr': 1.8133333333333335e-05, 'samples': 35168, 'steps': 68, 'loss/train': 7.847533226013184} -09/20/2021 14:43:28 - INFO - __main__ - Step 1100: {'lr': 1.8133333333333335e-05, 'samples': 35200, 'steps': 68, 'loss/train': 6.594987869262695} -09/20/2021 14:43:29 - INFO - __main__ - Step 1101: {'lr': 1.8133333333333335e-05, 'samples': 35232, 'steps': 68, 'loss/train': 7.512807846069336} -09/20/2021 14:43:29 - INFO - __main__ - Step 1102: {'lr': 1.8133333333333335e-05, 'samples': 35264, 'steps': 68, 'loss/train': 7.124242782592773} -09/20/2021 14:43:30 - INFO - __main__ - Step 1103: {'lr': 1.8133333333333335e-05, 'samples': 35296, 'steps': 68, 'loss/train': 6.80643367767334} -09/20/2021 14:43:31 - INFO - __main__ - Step 1104: {'lr': 1.8133333333333335e-05, 'samples': 35328, 'steps': 68, 'loss/train': 7.582176208496094} -09/20/2021 14:43:32 - INFO - __main__ - Step 1105: {'lr': 1.84e-05, 'samples': 35360, 'steps': 69, 'loss/train': 6.917186737060547} -09/20/2021 14:43:32 - INFO - __main__ - Step 1106: {'lr': 1.84e-05, 'samples': 35392, 'steps': 69, 'loss/train': 6.1422247886657715} -09/20/2021 14:43:33 - INFO - __main__ - Step 1107: {'lr': 1.84e-05, 'samples': 35424, 'steps': 69, 'loss/train': 6.871832370758057} -09/20/2021 14:43:35 - INFO - __main__ - Step 1108: {'lr': 1.84e-05, 'samples': 35456, 'steps': 69, 'loss/train': 6.963371753692627} -09/20/2021 14:43:35 - INFO - __main__ - Step 1109: {'lr': 1.84e-05, 'samples': 35488, 'steps': 69, 'loss/train': 7.756068706512451} -09/20/2021 14:43:36 - INFO - __main__ - Step 1110: {'lr': 1.84e-05, 'samples': 35520, 'steps': 69, 'loss/train': 6.725419044494629} -09/20/2021 14:43:37 - INFO - __main__ - Step 1111: {'lr': 1.84e-05, 'samples': 35552, 'steps': 69, 'loss/train': 7.52742338180542} -09/20/2021 14:43:38 - INFO - __main__ - Step 1112: {'lr': 1.84e-05, 'samples': 35584, 'steps': 69, 'loss/train': 7.0767669677734375} -09/20/2021 14:43:38 - INFO - __main__ - Step 1113: {'lr': 1.84e-05, 'samples': 35616, 'steps': 69, 'loss/train': 8.006622314453125} -09/20/2021 14:43:39 - INFO - __main__ - Step 1114: {'lr': 1.84e-05, 'samples': 35648, 'steps': 69, 'loss/train': 6.927874565124512} -09/20/2021 14:43:40 - INFO - __main__ - Step 1115: {'lr': 1.84e-05, 'samples': 35680, 'steps': 69, 'loss/train': 7.1843132972717285} -09/20/2021 14:43:41 - INFO - __main__ - Step 1116: {'lr': 1.84e-05, 'samples': 35712, 'steps': 69, 'loss/train': 7.877161979675293} -09/20/2021 14:43:41 - INFO - __main__ - Step 1117: {'lr': 1.84e-05, 'samples': 35744, 'steps': 69, 'loss/train': 7.683578968048096} -09/20/2021 14:43:42 - INFO - __main__ - Step 1118: {'lr': 1.84e-05, 'samples': 35776, 'steps': 69, 'loss/train': 7.344283580780029} -09/20/2021 14:43:43 - INFO - __main__ - Step 1119: {'lr': 1.84e-05, 'samples': 35808, 'steps': 69, 'loss/train': 7.0789079666137695} -09/20/2021 14:43:44 - INFO - __main__ - Step 1120: {'lr': 1.84e-05, 'samples': 35840, 'steps': 69, 'loss/train': 8.1862154006958} -09/20/2021 14:43:44 - INFO - __main__ - Step 1121: {'lr': 1.866666666666667e-05, 'samples': 35872, 'steps': 70, 'loss/train': 7.7049455642700195} -09/20/2021 14:43:45 - INFO - __main__ - Step 1122: {'lr': 1.866666666666667e-05, 'samples': 35904, 'steps': 70, 'loss/train': 7.654905796051025} -09/20/2021 14:43:46 - INFO - __main__ - Step 1123: {'lr': 1.866666666666667e-05, 'samples': 35936, 'steps': 70, 'loss/train': 9.358372688293457} -09/20/2021 14:43:47 - INFO - __main__ - Step 1124: {'lr': 1.866666666666667e-05, 'samples': 35968, 'steps': 70, 'loss/train': 6.60532808303833} -09/20/2021 14:43:47 - INFO - __main__ - Step 1125: {'lr': 1.866666666666667e-05, 'samples': 36000, 'steps': 70, 'loss/train': 7.669249057769775} -09/20/2021 14:43:48 - INFO - __main__ - Step 1126: {'lr': 1.866666666666667e-05, 'samples': 36032, 'steps': 70, 'loss/train': 6.854447364807129} -09/20/2021 14:43:49 - INFO - __main__ - Step 1127: {'lr': 1.866666666666667e-05, 'samples': 36064, 'steps': 70, 'loss/train': 7.906315803527832} -09/20/2021 14:43:50 - INFO - __main__ - Step 1128: {'lr': 1.866666666666667e-05, 'samples': 36096, 'steps': 70, 'loss/train': 8.437665939331055} -09/20/2021 14:43:50 - INFO - __main__ - Step 1129: {'lr': 1.866666666666667e-05, 'samples': 36128, 'steps': 70, 'loss/train': 8.106748580932617} -09/20/2021 14:43:51 - INFO - __main__ - Step 1130: {'lr': 1.866666666666667e-05, 'samples': 36160, 'steps': 70, 'loss/train': 7.631389617919922} -09/20/2021 14:43:52 - INFO - __main__ - Step 1131: {'lr': 1.866666666666667e-05, 'samples': 36192, 'steps': 70, 'loss/train': 7.155187606811523} -09/20/2021 14:43:53 - INFO - __main__ - Step 1132: {'lr': 1.866666666666667e-05, 'samples': 36224, 'steps': 70, 'loss/train': 7.112966537475586} -09/20/2021 14:43:53 - INFO - __main__ - Step 1133: {'lr': 1.866666666666667e-05, 'samples': 36256, 'steps': 70, 'loss/train': 7.481685161590576} -09/20/2021 14:43:54 - INFO - __main__ - Step 1134: {'lr': 1.866666666666667e-05, 'samples': 36288, 'steps': 70, 'loss/train': 7.712798595428467} -09/20/2021 14:43:55 - INFO - __main__ - Step 1135: {'lr': 1.866666666666667e-05, 'samples': 36320, 'steps': 70, 'loss/train': 6.554546356201172} -09/20/2021 14:43:56 - INFO - __main__ - Step 1136: {'lr': 1.866666666666667e-05, 'samples': 36352, 'steps': 70, 'loss/train': 7.87826681137085} -09/20/2021 14:43:57 - INFO - __main__ - Step 1137: {'lr': 1.8933333333333334e-05, 'samples': 36384, 'steps': 71, 'loss/train': 8.556035995483398} -09/20/2021 14:43:57 - INFO - __main__ - Step 1138: {'lr': 1.8933333333333334e-05, 'samples': 36416, 'steps': 71, 'loss/train': 7.709559917449951} -09/20/2021 14:43:58 - INFO - __main__ - Step 1139: {'lr': 1.8933333333333334e-05, 'samples': 36448, 'steps': 71, 'loss/train': 7.525731086730957} -09/20/2021 14:43:59 - INFO - __main__ - Step 1140: {'lr': 1.8933333333333334e-05, 'samples': 36480, 'steps': 71, 'loss/train': 7.240142822265625} -09/20/2021 14:44:00 - INFO - __main__ - Step 1141: {'lr': 1.8933333333333334e-05, 'samples': 36512, 'steps': 71, 'loss/train': 6.988956928253174} -09/20/2021 14:44:01 - INFO - __main__ - Step 1142: {'lr': 1.8933333333333334e-05, 'samples': 36544, 'steps': 71, 'loss/train': 6.963980674743652} -09/20/2021 14:44:02 - INFO - __main__ - Step 1143: {'lr': 1.8933333333333334e-05, 'samples': 36576, 'steps': 71, 'loss/train': 7.370689868927002} -09/20/2021 14:44:02 - INFO - __main__ - Step 1144: {'lr': 1.8933333333333334e-05, 'samples': 36608, 'steps': 71, 'loss/train': 7.8739848136901855} -09/20/2021 14:44:03 - INFO - __main__ - Step 1145: {'lr': 1.8933333333333334e-05, 'samples': 36640, 'steps': 71, 'loss/train': 7.323734760284424} -09/20/2021 14:44:04 - INFO - __main__ - Step 1146: {'lr': 1.8933333333333334e-05, 'samples': 36672, 'steps': 71, 'loss/train': 7.114187240600586} -09/20/2021 14:44:05 - INFO - __main__ - Step 1147: {'lr': 1.8933333333333334e-05, 'samples': 36704, 'steps': 71, 'loss/train': 7.714621543884277} -09/20/2021 14:44:05 - INFO - __main__ - Step 1148: {'lr': 1.8933333333333334e-05, 'samples': 36736, 'steps': 71, 'loss/train': 7.361697673797607} -09/20/2021 14:44:06 - INFO - __main__ - Step 1149: {'lr': 1.8933333333333334e-05, 'samples': 36768, 'steps': 71, 'loss/train': 8.078926086425781} -09/20/2021 14:44:07 - INFO - __main__ - Step 1150: {'lr': 1.8933333333333334e-05, 'samples': 36800, 'steps': 71, 'loss/train': 7.831512928009033} -09/20/2021 14:44:08 - INFO - __main__ - Step 1151: {'lr': 1.8933333333333334e-05, 'samples': 36832, 'steps': 71, 'loss/train': 7.686062335968018} -09/20/2021 14:44:08 - INFO - __main__ - Step 1152: {'lr': 1.8933333333333334e-05, 'samples': 36864, 'steps': 71, 'loss/train': 7.526142120361328} -09/20/2021 14:44:09 - INFO - __main__ - Step 1153: {'lr': 1.9200000000000003e-05, 'samples': 36896, 'steps': 72, 'loss/train': 7.073324680328369} -09/20/2021 14:44:10 - INFO - __main__ - Step 1154: {'lr': 1.9200000000000003e-05, 'samples': 36928, 'steps': 72, 'loss/train': 7.361159801483154} -09/20/2021 14:44:11 - INFO - __main__ - Step 1155: {'lr': 1.9200000000000003e-05, 'samples': 36960, 'steps': 72, 'loss/train': 6.909931182861328} -09/20/2021 14:44:12 - INFO - __main__ - Step 1156: {'lr': 1.9200000000000003e-05, 'samples': 36992, 'steps': 72, 'loss/train': 7.89625883102417} -09/20/2021 14:44:12 - INFO - __main__ - Step 1157: {'lr': 1.9200000000000003e-05, 'samples': 37024, 'steps': 72, 'loss/train': 6.722976207733154} -09/20/2021 14:44:13 - INFO - __main__ - Step 1158: {'lr': 1.9200000000000003e-05, 'samples': 37056, 'steps': 72, 'loss/train': 7.4174675941467285} -09/20/2021 14:44:14 - INFO - __main__ - Step 1159: {'lr': 1.9200000000000003e-05, 'samples': 37088, 'steps': 72, 'loss/train': 7.086045265197754} -09/20/2021 14:44:15 - INFO - __main__ - Step 1160: {'lr': 1.9200000000000003e-05, 'samples': 37120, 'steps': 72, 'loss/train': 7.216862678527832} -09/20/2021 14:44:15 - INFO - __main__ - Step 1161: {'lr': 1.9200000000000003e-05, 'samples': 37152, 'steps': 72, 'loss/train': 7.063986301422119} -09/20/2021 14:44:16 - INFO - __main__ - Step 1162: {'lr': 1.9200000000000003e-05, 'samples': 37184, 'steps': 72, 'loss/train': 6.192840099334717} -09/20/2021 14:44:17 - INFO - __main__ - Step 1163: {'lr': 1.9200000000000003e-05, 'samples': 37216, 'steps': 72, 'loss/train': 6.555092811584473} -09/20/2021 14:44:18 - INFO - __main__ - Step 1164: {'lr': 1.9200000000000003e-05, 'samples': 37248, 'steps': 72, 'loss/train': 6.839874744415283} -09/20/2021 14:44:18 - INFO - __main__ - Step 1165: {'lr': 1.9200000000000003e-05, 'samples': 37280, 'steps': 72, 'loss/train': 6.979328155517578} -09/20/2021 14:44:19 - INFO - __main__ - Step 1166: {'lr': 1.9200000000000003e-05, 'samples': 37312, 'steps': 72, 'loss/train': 7.222862243652344} -09/20/2021 14:44:20 - INFO - __main__ - Step 1167: {'lr': 1.9200000000000003e-05, 'samples': 37344, 'steps': 72, 'loss/train': 7.200576305389404} -09/20/2021 14:44:21 - INFO - __main__ - Step 1168: {'lr': 1.9200000000000003e-05, 'samples': 37376, 'steps': 72, 'loss/train': 7.665902614593506} -09/20/2021 14:44:22 - INFO - __main__ - Step 1169: {'lr': 1.9466666666666668e-05, 'samples': 37408, 'steps': 73, 'loss/train': 7.5635085105896} -09/20/2021 14:44:22 - INFO - __main__ - Step 1170: {'lr': 1.9466666666666668e-05, 'samples': 37440, 'steps': 73, 'loss/train': 6.732106685638428} -09/20/2021 14:44:23 - INFO - __main__ - Step 1171: {'lr': 1.9466666666666668e-05, 'samples': 37472, 'steps': 73, 'loss/train': 7.297885894775391} -09/20/2021 14:44:24 - INFO - __main__ - Step 1172: {'lr': 1.9466666666666668e-05, 'samples': 37504, 'steps': 73, 'loss/train': 7.17567777633667} -09/20/2021 14:44:25 - INFO - __main__ - Step 1173: {'lr': 1.9466666666666668e-05, 'samples': 37536, 'steps': 73, 'loss/train': 6.953014373779297} -09/20/2021 14:44:26 - INFO - __main__ - Step 1174: {'lr': 1.9466666666666668e-05, 'samples': 37568, 'steps': 73, 'loss/train': 6.390618801116943} -09/20/2021 14:44:27 - INFO - __main__ - Step 1175: {'lr': 1.9466666666666668e-05, 'samples': 37600, 'steps': 73, 'loss/train': 7.043236255645752} -09/20/2021 14:44:28 - INFO - __main__ - Step 1176: {'lr': 1.9466666666666668e-05, 'samples': 37632, 'steps': 73, 'loss/train': 7.8391289710998535} -09/20/2021 14:44:28 - INFO - __main__ - Step 1177: {'lr': 1.9466666666666668e-05, 'samples': 37664, 'steps': 73, 'loss/train': 6.971271991729736} -09/20/2021 14:44:29 - INFO - __main__ - Step 1178: {'lr': 1.9466666666666668e-05, 'samples': 37696, 'steps': 73, 'loss/train': 8.087117195129395} -09/20/2021 14:44:30 - INFO - __main__ - Step 1179: {'lr': 1.9466666666666668e-05, 'samples': 37728, 'steps': 73, 'loss/train': 6.912197113037109} -09/20/2021 14:44:31 - INFO - __main__ - Step 1180: {'lr': 1.9466666666666668e-05, 'samples': 37760, 'steps': 73, 'loss/train': 7.460375785827637} -09/20/2021 14:44:31 - INFO - __main__ - Step 1181: {'lr': 1.9466666666666668e-05, 'samples': 37792, 'steps': 73, 'loss/train': 7.652247905731201} -09/20/2021 14:44:32 - INFO - __main__ - Step 1182: {'lr': 1.9466666666666668e-05, 'samples': 37824, 'steps': 73, 'loss/train': 6.547821521759033} -09/20/2021 14:44:33 - INFO - __main__ - Step 1183: {'lr': 1.9466666666666668e-05, 'samples': 37856, 'steps': 73, 'loss/train': 7.049105644226074} -09/20/2021 14:44:34 - INFO - __main__ - Step 1184: {'lr': 1.9466666666666668e-05, 'samples': 37888, 'steps': 73, 'loss/train': 6.8223490715026855} -09/20/2021 14:44:35 - INFO - __main__ - Step 1185: {'lr': 1.9733333333333333e-05, 'samples': 37920, 'steps': 74, 'loss/train': 7.077586650848389} -09/20/2021 14:44:35 - INFO - __main__ - Step 1186: {'lr': 1.9733333333333333e-05, 'samples': 37952, 'steps': 74, 'loss/train': 6.939738750457764} -09/20/2021 14:44:36 - INFO - __main__ - Step 1187: {'lr': 1.9733333333333333e-05, 'samples': 37984, 'steps': 74, 'loss/train': 6.793521881103516} -09/20/2021 14:44:37 - INFO - __main__ - Step 1188: {'lr': 1.9733333333333333e-05, 'samples': 38016, 'steps': 74, 'loss/train': 6.794055938720703} -09/20/2021 14:44:38 - INFO - __main__ - Step 1189: {'lr': 1.9733333333333333e-05, 'samples': 38048, 'steps': 74, 'loss/train': 7.301736354827881} -09/20/2021 14:44:38 - INFO - __main__ - Step 1190: {'lr': 1.9733333333333333e-05, 'samples': 38080, 'steps': 74, 'loss/train': 7.447640895843506} -09/20/2021 14:44:39 - INFO - __main__ - Step 1191: {'lr': 1.9733333333333333e-05, 'samples': 38112, 'steps': 74, 'loss/train': 7.11446475982666} -09/20/2021 14:44:40 - INFO - __main__ - Step 1192: {'lr': 1.9733333333333333e-05, 'samples': 38144, 'steps': 74, 'loss/train': 7.274781703948975} -09/20/2021 14:44:41 - INFO - __main__ - Step 1193: {'lr': 1.9733333333333333e-05, 'samples': 38176, 'steps': 74, 'loss/train': 6.611105918884277} -09/20/2021 14:44:41 - INFO - __main__ - Step 1194: {'lr': 1.9733333333333333e-05, 'samples': 38208, 'steps': 74, 'loss/train': 7.013664722442627} -09/20/2021 14:44:42 - INFO - __main__ - Step 1195: {'lr': 1.9733333333333333e-05, 'samples': 38240, 'steps': 74, 'loss/train': 7.622310638427734} -09/20/2021 14:44:43 - INFO - __main__ - Step 1196: {'lr': 1.9733333333333333e-05, 'samples': 38272, 'steps': 74, 'loss/train': 7.5682220458984375} -09/20/2021 14:44:44 - INFO - __main__ - Step 1197: {'lr': 1.9733333333333333e-05, 'samples': 38304, 'steps': 74, 'loss/train': 6.492344379425049} -09/20/2021 14:44:44 - INFO - __main__ - Step 1198: {'lr': 1.9733333333333333e-05, 'samples': 38336, 'steps': 74, 'loss/train': 8.745185852050781} -09/20/2021 14:44:45 - INFO - __main__ - Step 1199: {'lr': 1.9733333333333333e-05, 'samples': 38368, 'steps': 74, 'loss/train': 6.965442180633545} -09/20/2021 14:44:46 - INFO - __main__ - Step 1200: {'lr': 1.9733333333333333e-05, 'samples': 38400, 'steps': 74, 'loss/train': 7.557473182678223} -09/20/2021 14:44:47 - INFO - __main__ - Step 1201: {'lr': 2e-05, 'samples': 38432, 'steps': 75, 'loss/train': 6.884886741638184} -09/20/2021 14:44:48 - INFO - __main__ - Step 1202: {'lr': 2e-05, 'samples': 38464, 'steps': 75, 'loss/train': 7.3290557861328125} -09/20/2021 14:44:48 - INFO - __main__ - Step 1203: {'lr': 2e-05, 'samples': 38496, 'steps': 75, 'loss/train': 6.973666191101074} -09/20/2021 14:44:49 - INFO - __main__ - Step 1204: {'lr': 2e-05, 'samples': 38528, 'steps': 75, 'loss/train': 7.755762100219727} -09/20/2021 14:44:50 - INFO - __main__ - Step 1205: {'lr': 2e-05, 'samples': 38560, 'steps': 75, 'loss/train': 6.034870624542236} -09/20/2021 14:44:51 - INFO - __main__ - Step 1206: {'lr': 2e-05, 'samples': 38592, 'steps': 75, 'loss/train': 6.097821235656738} -09/20/2021 14:44:51 - INFO - __main__ - Step 1207: {'lr': 2e-05, 'samples': 38624, 'steps': 75, 'loss/train': 6.2052001953125} -09/20/2021 14:44:52 - INFO - __main__ - Step 1208: {'lr': 2e-05, 'samples': 38656, 'steps': 75, 'loss/train': 6.756560802459717} -09/20/2021 14:44:53 - INFO - __main__ - Step 1209: {'lr': 2e-05, 'samples': 38688, 'steps': 75, 'loss/train': 6.618544101715088} -09/20/2021 14:44:54 - INFO - __main__ - Step 1210: {'lr': 2e-05, 'samples': 38720, 'steps': 75, 'loss/train': 8.164134979248047} -09/20/2021 14:44:54 - INFO - __main__ - Step 1211: {'lr': 2e-05, 'samples': 38752, 'steps': 75, 'loss/train': 7.945216178894043} -09/20/2021 14:44:56 - INFO - __main__ - Step 1212: {'lr': 2e-05, 'samples': 38784, 'steps': 75, 'loss/train': 6.4277191162109375} -09/20/2021 14:44:57 - INFO - __main__ - Step 1213: {'lr': 2e-05, 'samples': 38816, 'steps': 75, 'loss/train': 7.118281364440918} -09/20/2021 14:44:58 - INFO - __main__ - Step 1214: {'lr': 2e-05, 'samples': 38848, 'steps': 75, 'loss/train': 7.163132190704346} -09/20/2021 14:44:58 - INFO - __main__ - Step 1215: {'lr': 2e-05, 'samples': 38880, 'steps': 75, 'loss/train': 7.001889705657959} -09/20/2021 14:44:59 - INFO - __main__ - Step 1216: {'lr': 2e-05, 'samples': 38912, 'steps': 75, 'loss/train': 7.663928985595703} -09/20/2021 14:45:00 - INFO - __main__ - Step 1217: {'lr': 2.0266666666666667e-05, 'samples': 38944, 'steps': 76, 'loss/train': 7.1572465896606445} -09/20/2021 14:45:01 - INFO - __main__ - Step 1218: {'lr': 2.0266666666666667e-05, 'samples': 38976, 'steps': 76, 'loss/train': 7.133402347564697} -09/20/2021 14:45:01 - INFO - __main__ - Step 1219: {'lr': 2.0266666666666667e-05, 'samples': 39008, 'steps': 76, 'loss/train': 6.544497013092041} -09/20/2021 14:45:02 - INFO - __main__ - Step 1220: {'lr': 2.0266666666666667e-05, 'samples': 39040, 'steps': 76, 'loss/train': 6.892357349395752} -09/20/2021 14:45:03 - INFO - __main__ - Step 1221: {'lr': 2.0266666666666667e-05, 'samples': 39072, 'steps': 76, 'loss/train': 7.455821990966797} -09/20/2021 14:45:04 - INFO - __main__ - Step 1222: {'lr': 2.0266666666666667e-05, 'samples': 39104, 'steps': 76, 'loss/train': 7.535419940948486} -09/20/2021 14:45:04 - INFO - __main__ - Step 1223: {'lr': 2.0266666666666667e-05, 'samples': 39136, 'steps': 76, 'loss/train': 7.16645622253418} -09/20/2021 14:45:05 - INFO - __main__ - Step 1224: {'lr': 2.0266666666666667e-05, 'samples': 39168, 'steps': 76, 'loss/train': 6.742935657501221} -09/20/2021 14:45:06 - INFO - __main__ - Step 1225: {'lr': 2.0266666666666667e-05, 'samples': 39200, 'steps': 76, 'loss/train': 6.663435459136963} -09/20/2021 14:45:07 - INFO - __main__ - Step 1226: {'lr': 2.0266666666666667e-05, 'samples': 39232, 'steps': 76, 'loss/train': 7.460683822631836} -09/20/2021 14:45:07 - INFO - __main__ - Step 1227: {'lr': 2.0266666666666667e-05, 'samples': 39264, 'steps': 76, 'loss/train': 6.906180381774902} -09/20/2021 14:45:08 - INFO - __main__ - Step 1228: {'lr': 2.0266666666666667e-05, 'samples': 39296, 'steps': 76, 'loss/train': 7.326055526733398} -09/20/2021 14:45:09 - INFO - __main__ - Step 1229: {'lr': 2.0266666666666667e-05, 'samples': 39328, 'steps': 76, 'loss/train': 7.272572994232178} -09/20/2021 14:45:10 - INFO - __main__ - Step 1230: {'lr': 2.0266666666666667e-05, 'samples': 39360, 'steps': 76, 'loss/train': 6.792047500610352} -09/20/2021 14:45:10 - INFO - __main__ - Step 1231: {'lr': 2.0266666666666667e-05, 'samples': 39392, 'steps': 76, 'loss/train': 7.505480766296387} -09/20/2021 14:45:11 - INFO - __main__ - Step 1232: {'lr': 2.0266666666666667e-05, 'samples': 39424, 'steps': 76, 'loss/train': 6.771306991577148} -09/20/2021 14:45:12 - INFO - __main__ - Step 1233: {'lr': 2.0533333333333336e-05, 'samples': 39456, 'steps': 77, 'loss/train': 6.507347106933594} -09/20/2021 14:45:13 - INFO - __main__ - Step 1234: {'lr': 2.0533333333333336e-05, 'samples': 39488, 'steps': 77, 'loss/train': 6.737583160400391} -09/20/2021 14:45:14 - INFO - __main__ - Step 1235: {'lr': 2.0533333333333336e-05, 'samples': 39520, 'steps': 77, 'loss/train': 7.257676601409912} -09/20/2021 14:45:14 - INFO - __main__ - Step 1236: {'lr': 2.0533333333333336e-05, 'samples': 39552, 'steps': 77, 'loss/train': 6.467931270599365} -09/20/2021 14:45:15 - INFO - __main__ - Step 1237: {'lr': 2.0533333333333336e-05, 'samples': 39584, 'steps': 77, 'loss/train': 6.655056476593018} -09/20/2021 14:45:16 - INFO - __main__ - Step 1238: {'lr': 2.0533333333333336e-05, 'samples': 39616, 'steps': 77, 'loss/train': 6.851518154144287} -09/20/2021 14:45:17 - INFO - __main__ - Step 1239: {'lr': 2.0533333333333336e-05, 'samples': 39648, 'steps': 77, 'loss/train': 7.7107954025268555} -09/20/2021 14:45:17 - INFO - __main__ - Step 1240: {'lr': 2.0533333333333336e-05, 'samples': 39680, 'steps': 77, 'loss/train': 7.022248268127441} -09/20/2021 14:45:18 - INFO - __main__ - Step 1241: {'lr': 2.0533333333333336e-05, 'samples': 39712, 'steps': 77, 'loss/train': 7.238912582397461} -09/20/2021 14:45:19 - INFO - __main__ - Step 1242: {'lr': 2.0533333333333336e-05, 'samples': 39744, 'steps': 77, 'loss/train': 6.403892993927002} -09/20/2021 14:45:20 - INFO - __main__ - Step 1243: {'lr': 2.0533333333333336e-05, 'samples': 39776, 'steps': 77, 'loss/train': 6.5764546394348145} -09/20/2021 14:45:21 - INFO - __main__ - Step 1244: {'lr': 2.0533333333333336e-05, 'samples': 39808, 'steps': 77, 'loss/train': 8.998181343078613} -09/20/2021 14:45:22 - INFO - __main__ - Step 1245: {'lr': 2.0533333333333336e-05, 'samples': 39840, 'steps': 77, 'loss/train': 7.101668357849121} -09/20/2021 14:45:23 - INFO - __main__ - Step 1246: {'lr': 2.0533333333333336e-05, 'samples': 39872, 'steps': 77, 'loss/train': 6.602473258972168} -09/20/2021 14:45:23 - INFO - __main__ - Step 1247: {'lr': 2.0533333333333336e-05, 'samples': 39904, 'steps': 77, 'loss/train': 6.033279895782471} -09/20/2021 14:45:24 - INFO - __main__ - Step 1248: {'lr': 2.0533333333333336e-05, 'samples': 39936, 'steps': 77, 'loss/train': 7.939269542694092} -09/20/2021 14:45:25 - INFO - __main__ - Step 1249: {'lr': 2.08e-05, 'samples': 39968, 'steps': 78, 'loss/train': 6.074924945831299} -09/20/2021 14:45:26 - INFO - __main__ - Step 1250: {'lr': 2.08e-05, 'samples': 40000, 'steps': 78, 'loss/train': 6.077233791351318} -09/20/2021 14:45:27 - INFO - __main__ - Step 1251: {'lr': 2.08e-05, 'samples': 40032, 'steps': 78, 'loss/train': 5.543767929077148} -09/20/2021 14:45:27 - INFO - __main__ - Step 1252: {'lr': 2.08e-05, 'samples': 40064, 'steps': 78, 'loss/train': 6.107880115509033} -09/20/2021 14:45:28 - INFO - __main__ - Step 1253: {'lr': 2.08e-05, 'samples': 40096, 'steps': 78, 'loss/train': 7.0136260986328125} -09/20/2021 14:45:29 - INFO - __main__ - Step 1254: {'lr': 2.08e-05, 'samples': 40128, 'steps': 78, 'loss/train': 6.795555591583252} -09/20/2021 14:45:30 - INFO - __main__ - Step 1255: {'lr': 2.08e-05, 'samples': 40160, 'steps': 78, 'loss/train': 5.8849077224731445} -09/20/2021 14:45:30 - INFO - __main__ - Step 1256: {'lr': 2.08e-05, 'samples': 40192, 'steps': 78, 'loss/train': 6.970694065093994} -09/20/2021 14:45:31 - INFO - __main__ - Step 1257: {'lr': 2.08e-05, 'samples': 40224, 'steps': 78, 'loss/train': 6.8195481300354} -09/20/2021 14:45:32 - INFO - __main__ - Step 1258: {'lr': 2.08e-05, 'samples': 40256, 'steps': 78, 'loss/train': 9.26230239868164} -09/20/2021 14:45:33 - INFO - __main__ - Step 1259: {'lr': 2.08e-05, 'samples': 40288, 'steps': 78, 'loss/train': 6.56361198425293} -09/20/2021 14:45:33 - INFO - __main__ - Step 1260: {'lr': 2.08e-05, 'samples': 40320, 'steps': 78, 'loss/train': 6.853907585144043} -09/20/2021 14:45:34 - INFO - __main__ - Step 1261: {'lr': 2.08e-05, 'samples': 40352, 'steps': 78, 'loss/train': 7.778400897979736} -09/20/2021 14:45:35 - INFO - __main__ - Step 1262: {'lr': 2.08e-05, 'samples': 40384, 'steps': 78, 'loss/train': 7.166581153869629} -09/20/2021 14:45:36 - INFO - __main__ - Step 1263: {'lr': 2.08e-05, 'samples': 40416, 'steps': 78, 'loss/train': 7.394590854644775} -09/20/2021 14:45:36 - INFO - __main__ - Step 1264: {'lr': 2.08e-05, 'samples': 40448, 'steps': 78, 'loss/train': 7.1355156898498535} -09/20/2021 14:45:37 - INFO - __main__ - Step 1265: {'lr': 2.106666666666667e-05, 'samples': 40480, 'steps': 79, 'loss/train': 6.038400173187256} -09/20/2021 14:45:38 - INFO - __main__ - Step 1266: {'lr': 2.106666666666667e-05, 'samples': 40512, 'steps': 79, 'loss/train': 7.276357173919678} -09/20/2021 14:45:39 - INFO - __main__ - Step 1267: {'lr': 2.106666666666667e-05, 'samples': 40544, 'steps': 79, 'loss/train': 7.576699733734131} -09/20/2021 14:45:40 - INFO - __main__ - Step 1268: {'lr': 2.106666666666667e-05, 'samples': 40576, 'steps': 79, 'loss/train': 8.422048568725586} -09/20/2021 14:45:40 - INFO - __main__ - Step 1269: {'lr': 2.106666666666667e-05, 'samples': 40608, 'steps': 79, 'loss/train': 7.368470668792725} -09/20/2021 14:45:41 - INFO - __main__ - Step 1270: {'lr': 2.106666666666667e-05, 'samples': 40640, 'steps': 79, 'loss/train': 7.978740215301514} -09/20/2021 14:45:42 - INFO - __main__ - Step 1271: {'lr': 2.106666666666667e-05, 'samples': 40672, 'steps': 79, 'loss/train': 6.927475452423096} -09/20/2021 14:45:43 - INFO - __main__ - Step 1272: {'lr': 2.106666666666667e-05, 'samples': 40704, 'steps': 79, 'loss/train': 6.549900054931641} -09/20/2021 14:45:43 - INFO - __main__ - Step 1273: {'lr': 2.106666666666667e-05, 'samples': 40736, 'steps': 79, 'loss/train': 7.410633087158203} -09/20/2021 14:45:44 - INFO - __main__ - Step 1274: {'lr': 2.106666666666667e-05, 'samples': 40768, 'steps': 79, 'loss/train': 6.411174774169922} -09/20/2021 14:45:45 - INFO - __main__ - Step 1275: {'lr': 2.106666666666667e-05, 'samples': 40800, 'steps': 79, 'loss/train': 7.268575668334961} -09/20/2021 14:45:46 - INFO - __main__ - Step 1276: {'lr': 2.106666666666667e-05, 'samples': 40832, 'steps': 79, 'loss/train': 7.377386093139648} -09/20/2021 14:45:46 - INFO - __main__ - Step 1277: {'lr': 2.106666666666667e-05, 'samples': 40864, 'steps': 79, 'loss/train': 6.594907283782959} -09/20/2021 14:45:47 - INFO - __main__ - Step 1278: {'lr': 2.106666666666667e-05, 'samples': 40896, 'steps': 79, 'loss/train': 6.965612888336182} -09/20/2021 14:45:48 - INFO - __main__ - Step 1279: {'lr': 2.106666666666667e-05, 'samples': 40928, 'steps': 79, 'loss/train': 7.57487154006958} -09/20/2021 14:45:50 - INFO - __main__ - Step 1280: {'lr': 2.106666666666667e-05, 'samples': 40960, 'steps': 79, 'loss/train': 6.504504203796387} -09/20/2021 14:45:51 - INFO - __main__ - Step 1281: {'lr': 2.1333333333333335e-05, 'samples': 40992, 'steps': 80, 'loss/train': 7.228402137756348} -09/20/2021 14:45:51 - INFO - __main__ - Step 1282: {'lr': 2.1333333333333335e-05, 'samples': 41024, 'steps': 80, 'loss/train': 6.004291534423828} -09/20/2021 14:45:52 - INFO - __main__ - Step 1283: {'lr': 2.1333333333333335e-05, 'samples': 41056, 'steps': 80, 'loss/train': 6.648809909820557} -09/20/2021 14:45:53 - INFO - __main__ - Step 1284: {'lr': 2.1333333333333335e-05, 'samples': 41088, 'steps': 80, 'loss/train': 6.286359786987305} -09/20/2021 14:45:54 - INFO - __main__ - Step 1285: {'lr': 2.1333333333333335e-05, 'samples': 41120, 'steps': 80, 'loss/train': 6.917571544647217} -09/20/2021 14:45:54 - INFO - __main__ - Step 1286: {'lr': 2.1333333333333335e-05, 'samples': 41152, 'steps': 80, 'loss/train': 8.932031631469727} -09/20/2021 14:45:55 - INFO - __main__ - Step 1287: {'lr': 2.1333333333333335e-05, 'samples': 41184, 'steps': 80, 'loss/train': 6.856955528259277} -09/20/2021 14:45:56 - INFO - __main__ - Step 1288: {'lr': 2.1333333333333335e-05, 'samples': 41216, 'steps': 80, 'loss/train': 6.861624717712402} -09/20/2021 14:45:57 - INFO - __main__ - Step 1289: {'lr': 2.1333333333333335e-05, 'samples': 41248, 'steps': 80, 'loss/train': 7.45489501953125} -09/20/2021 14:45:57 - INFO - __main__ - Step 1290: {'lr': 2.1333333333333335e-05, 'samples': 41280, 'steps': 80, 'loss/train': 6.3581061363220215} -09/20/2021 14:45:58 - INFO - __main__ - Step 1291: {'lr': 2.1333333333333335e-05, 'samples': 41312, 'steps': 80, 'loss/train': 7.318788051605225} -09/20/2021 14:45:59 - INFO - __main__ - Step 1292: {'lr': 2.1333333333333335e-05, 'samples': 41344, 'steps': 80, 'loss/train': 6.866255283355713} -09/20/2021 14:46:00 - INFO - __main__ - Step 1293: {'lr': 2.1333333333333335e-05, 'samples': 41376, 'steps': 80, 'loss/train': 6.663376808166504} -09/20/2021 14:46:00 - INFO - __main__ - Step 1294: {'lr': 2.1333333333333335e-05, 'samples': 41408, 'steps': 80, 'loss/train': 7.36399507522583} -09/20/2021 14:46:01 - INFO - __main__ - Step 1295: {'lr': 2.1333333333333335e-05, 'samples': 41440, 'steps': 80, 'loss/train': 6.76483154296875} -09/20/2021 14:46:02 - INFO - __main__ - Step 1296: {'lr': 2.1333333333333335e-05, 'samples': 41472, 'steps': 80, 'loss/train': 6.9006829261779785} -09/20/2021 14:46:03 - INFO - __main__ - Step 1297: {'lr': 2.16e-05, 'samples': 41504, 'steps': 81, 'loss/train': 7.244690895080566} -09/20/2021 14:46:03 - INFO - __main__ - Step 1298: {'lr': 2.16e-05, 'samples': 41536, 'steps': 81, 'loss/train': 7.065092086791992} -09/20/2021 14:46:04 - INFO - __main__ - Step 1299: {'lr': 2.16e-05, 'samples': 41568, 'steps': 81, 'loss/train': 6.947916030883789} -09/20/2021 14:46:05 - INFO - __main__ - Step 1300: {'lr': 2.16e-05, 'samples': 41600, 'steps': 81, 'loss/train': 7.501931190490723} -09/20/2021 14:46:06 - INFO - __main__ - Step 1301: {'lr': 2.16e-05, 'samples': 41632, 'steps': 81, 'loss/train': 6.699307441711426} -09/20/2021 14:46:06 - INFO - __main__ - Step 1302: {'lr': 2.16e-05, 'samples': 41664, 'steps': 81, 'loss/train': 6.603437423706055} -09/20/2021 14:46:07 - INFO - __main__ - Step 1303: {'lr': 2.16e-05, 'samples': 41696, 'steps': 81, 'loss/train': 7.217294216156006} -09/20/2021 14:46:08 - INFO - __main__ - Step 1304: {'lr': 2.16e-05, 'samples': 41728, 'steps': 81, 'loss/train': 7.598348140716553} -09/20/2021 14:46:09 - INFO - __main__ - Step 1305: {'lr': 2.16e-05, 'samples': 41760, 'steps': 81, 'loss/train': 7.954002857208252} -09/20/2021 14:46:09 - INFO - __main__ - Step 1306: {'lr': 2.16e-05, 'samples': 41792, 'steps': 81, 'loss/train': 7.78129768371582} -09/20/2021 14:46:10 - INFO - __main__ - Step 1307: {'lr': 2.16e-05, 'samples': 41824, 'steps': 81, 'loss/train': 7.514669418334961} -09/20/2021 14:46:11 - INFO - __main__ - Step 1308: {'lr': 2.16e-05, 'samples': 41856, 'steps': 81, 'loss/train': 7.007674694061279} -09/20/2021 14:46:12 - INFO - __main__ - Step 1309: {'lr': 2.16e-05, 'samples': 41888, 'steps': 81, 'loss/train': 6.381060600280762} -09/20/2021 14:46:12 - INFO - __main__ - Step 1310: {'lr': 2.16e-05, 'samples': 41920, 'steps': 81, 'loss/train': 6.6566338539123535} -09/20/2021 14:46:13 - INFO - __main__ - Step 1311: {'lr': 2.16e-05, 'samples': 41952, 'steps': 81, 'loss/train': 6.902052402496338} -09/20/2021 14:46:14 - INFO - __main__ - Step 1312: {'lr': 2.16e-05, 'samples': 41984, 'steps': 81, 'loss/train': 6.898022651672363} -09/20/2021 14:46:15 - INFO - __main__ - Step 1313: {'lr': 2.186666666666667e-05, 'samples': 42016, 'steps': 82, 'loss/train': 6.456850528717041} -09/20/2021 14:46:16 - INFO - __main__ - Step 1314: {'lr': 2.186666666666667e-05, 'samples': 42048, 'steps': 82, 'loss/train': 6.61098051071167} -09/20/2021 14:46:16 - INFO - __main__ - Step 1315: {'lr': 2.186666666666667e-05, 'samples': 42080, 'steps': 82, 'loss/train': 7.348238468170166} -09/20/2021 14:46:17 - INFO - __main__ - Step 1316: {'lr': 2.186666666666667e-05, 'samples': 42112, 'steps': 82, 'loss/train': 6.0860185623168945} -09/20/2021 14:46:18 - INFO - __main__ - Step 1317: {'lr': 2.186666666666667e-05, 'samples': 42144, 'steps': 82, 'loss/train': 6.899518013000488} -09/20/2021 14:46:19 - INFO - __main__ - Step 1318: {'lr': 2.186666666666667e-05, 'samples': 42176, 'steps': 82, 'loss/train': 6.292327404022217} -09/20/2021 14:46:19 - INFO - __main__ - Step 1319: {'lr': 2.186666666666667e-05, 'samples': 42208, 'steps': 82, 'loss/train': 5.86102819442749} -09/20/2021 14:46:20 - INFO - __main__ - Step 1320: {'lr': 2.186666666666667e-05, 'samples': 42240, 'steps': 82, 'loss/train': 5.440418243408203} -09/20/2021 14:46:21 - INFO - __main__ - Step 1321: {'lr': 2.186666666666667e-05, 'samples': 42272, 'steps': 82, 'loss/train': 6.535080909729004} -09/20/2021 14:46:22 - INFO - __main__ - Step 1322: {'lr': 2.186666666666667e-05, 'samples': 42304, 'steps': 82, 'loss/train': 7.4993062019348145} -09/20/2021 14:46:22 - INFO - __main__ - Step 1323: {'lr': 2.186666666666667e-05, 'samples': 42336, 'steps': 82, 'loss/train': 7.344956398010254} -09/20/2021 14:46:24 - INFO - __main__ - Step 1324: {'lr': 2.186666666666667e-05, 'samples': 42368, 'steps': 82, 'loss/train': 6.559617042541504} -09/20/2021 14:46:24 - INFO - __main__ - Step 1325: {'lr': 2.186666666666667e-05, 'samples': 42400, 'steps': 82, 'loss/train': 7.102939128875732} -09/20/2021 14:46:25 - INFO - __main__ - Step 1326: {'lr': 2.186666666666667e-05, 'samples': 42432, 'steps': 82, 'loss/train': 7.471022605895996} -09/20/2021 14:46:26 - INFO - __main__ - Step 1327: {'lr': 2.186666666666667e-05, 'samples': 42464, 'steps': 82, 'loss/train': 7.146205425262451} -09/20/2021 14:46:27 - INFO - __main__ - Step 1328: {'lr': 2.186666666666667e-05, 'samples': 42496, 'steps': 82, 'loss/train': 6.37398624420166} -09/20/2021 14:46:28 - INFO - __main__ - Step 1329: {'lr': 2.2133333333333334e-05, 'samples': 42528, 'steps': 83, 'loss/train': 7.399117469787598} -09/20/2021 14:46:28 - INFO - __main__ - Step 1330: {'lr': 2.2133333333333334e-05, 'samples': 42560, 'steps': 83, 'loss/train': 6.852920055389404} -09/20/2021 14:46:29 - INFO - __main__ - Step 1331: {'lr': 2.2133333333333334e-05, 'samples': 42592, 'steps': 83, 'loss/train': 7.600358486175537} -09/20/2021 14:46:30 - INFO - __main__ - Step 1332: {'lr': 2.2133333333333334e-05, 'samples': 42624, 'steps': 83, 'loss/train': 6.589765548706055} -09/20/2021 14:46:31 - INFO - __main__ - Step 1333: {'lr': 2.2133333333333334e-05, 'samples': 42656, 'steps': 83, 'loss/train': 7.136337757110596} -09/20/2021 14:46:31 - INFO - __main__ - Step 1334: {'lr': 2.2133333333333334e-05, 'samples': 42688, 'steps': 83, 'loss/train': 7.2276458740234375} -09/20/2021 14:46:32 - INFO - __main__ - Step 1335: {'lr': 2.2133333333333334e-05, 'samples': 42720, 'steps': 83, 'loss/train': 5.996577262878418} -09/20/2021 14:46:33 - INFO - __main__ - Step 1336: {'lr': 2.2133333333333334e-05, 'samples': 42752, 'steps': 83, 'loss/train': 6.9766411781311035} -09/20/2021 14:46:34 - INFO - __main__ - Step 1337: {'lr': 2.2133333333333334e-05, 'samples': 42784, 'steps': 83, 'loss/train': 7.278964519500732} -09/20/2021 14:46:34 - INFO - __main__ - Step 1338: {'lr': 2.2133333333333334e-05, 'samples': 42816, 'steps': 83, 'loss/train': 7.345757484436035} -09/20/2021 14:46:35 - INFO - __main__ - Step 1339: {'lr': 2.2133333333333334e-05, 'samples': 42848, 'steps': 83, 'loss/train': 2.7349045276641846} -09/20/2021 14:46:36 - INFO - __main__ - Step 1340: {'lr': 2.2133333333333334e-05, 'samples': 42880, 'steps': 83, 'loss/train': 2.724766731262207} -09/20/2021 14:46:37 - INFO - __main__ - Step 1341: {'lr': 2.2133333333333334e-05, 'samples': 42912, 'steps': 83, 'loss/train': 2.7586348056793213} -09/20/2021 14:46:37 - INFO - __main__ - Step 1342: {'lr': 2.2133333333333334e-05, 'samples': 42944, 'steps': 83, 'loss/train': 2.744723081588745} -09/20/2021 14:46:38 - INFO - __main__ - Step 1343: {'lr': 2.2133333333333334e-05, 'samples': 42976, 'steps': 83, 'loss/train': 2.760462760925293} -09/20/2021 14:46:39 - INFO - __main__ - Step 1344: {'lr': 2.2133333333333334e-05, 'samples': 43008, 'steps': 83, 'loss/train': 6.594578742980957} -09/20/2021 14:46:40 - INFO - __main__ - Step 1345: {'lr': 2.2400000000000002e-05, 'samples': 43040, 'steps': 84, 'loss/train': 6.277400493621826} -09/20/2021 14:46:41 - INFO - __main__ - Step 1346: {'lr': 2.2400000000000002e-05, 'samples': 43072, 'steps': 84, 'loss/train': 6.763936519622803} -09/20/2021 14:46:41 - INFO - __main__ - Step 1347: {'lr': 2.2400000000000002e-05, 'samples': 43104, 'steps': 84, 'loss/train': 6.650808811187744} -09/20/2021 14:46:42 - INFO - __main__ - Step 1348: {'lr': 2.2400000000000002e-05, 'samples': 43136, 'steps': 84, 'loss/train': 6.801975727081299} -09/20/2021 14:46:43 - INFO - __main__ - Step 1349: {'lr': 2.2400000000000002e-05, 'samples': 43168, 'steps': 84, 'loss/train': 6.342635154724121} -09/20/2021 14:46:44 - INFO - __main__ - Step 1350: {'lr': 2.2400000000000002e-05, 'samples': 43200, 'steps': 84, 'loss/train': 7.915589809417725} -09/20/2021 14:46:44 - INFO - __main__ - Step 1351: {'lr': 2.2400000000000002e-05, 'samples': 43232, 'steps': 84, 'loss/train': 7.150181770324707} -09/20/2021 14:46:45 - INFO - __main__ - Step 1352: {'lr': 2.2400000000000002e-05, 'samples': 43264, 'steps': 84, 'loss/train': 7.155706882476807} -09/20/2021 14:46:46 - INFO - __main__ - Step 1353: {'lr': 2.2400000000000002e-05, 'samples': 43296, 'steps': 84, 'loss/train': 6.31610631942749} -09/20/2021 14:46:47 - INFO - __main__ - Step 1354: {'lr': 2.2400000000000002e-05, 'samples': 43328, 'steps': 84, 'loss/train': 6.812422752380371} -09/20/2021 14:46:47 - INFO - __main__ - Step 1355: {'lr': 2.2400000000000002e-05, 'samples': 43360, 'steps': 84, 'loss/train': 6.636787414550781} -09/20/2021 14:46:48 - INFO - __main__ - Step 1356: {'lr': 2.2400000000000002e-05, 'samples': 43392, 'steps': 84, 'loss/train': 6.598759651184082} -09/20/2021 14:46:49 - INFO - __main__ - Step 1357: {'lr': 2.2400000000000002e-05, 'samples': 43424, 'steps': 84, 'loss/train': 6.668702602386475} -09/20/2021 14:46:50 - INFO - __main__ - Step 1358: {'lr': 2.2400000000000002e-05, 'samples': 43456, 'steps': 84, 'loss/train': 6.902087688446045} -09/20/2021 14:46:50 - INFO - __main__ - Step 1359: {'lr': 2.2400000000000002e-05, 'samples': 43488, 'steps': 84, 'loss/train': 7.4140944480896} -09/20/2021 14:46:52 - INFO - __main__ - Step 1360: {'lr': 2.2400000000000002e-05, 'samples': 43520, 'steps': 84, 'loss/train': 7.6915059089660645} -09/20/2021 14:46:52 - INFO - __main__ - Step 1361: {'lr': 2.2666666666666668e-05, 'samples': 43552, 'steps': 85, 'loss/train': 6.808213710784912} -09/20/2021 14:46:53 - INFO - __main__ - Step 1362: {'lr': 2.2666666666666668e-05, 'samples': 43584, 'steps': 85, 'loss/train': 5.962756156921387} -09/20/2021 14:46:54 - INFO - __main__ - Step 1363: {'lr': 2.2666666666666668e-05, 'samples': 43616, 'steps': 85, 'loss/train': 5.942309379577637} -09/20/2021 14:46:55 - INFO - __main__ - Step 1364: {'lr': 2.2666666666666668e-05, 'samples': 43648, 'steps': 85, 'loss/train': 7.013086318969727} -09/20/2021 14:46:55 - INFO - __main__ - Step 1365: {'lr': 2.2666666666666668e-05, 'samples': 43680, 'steps': 85, 'loss/train': 6.632970333099365} -09/20/2021 14:46:56 - INFO - __main__ - Step 1366: {'lr': 2.2666666666666668e-05, 'samples': 43712, 'steps': 85, 'loss/train': 6.299832344055176} -09/20/2021 14:46:57 - INFO - __main__ - Step 1367: {'lr': 2.2666666666666668e-05, 'samples': 43744, 'steps': 85, 'loss/train': 7.043704986572266} -09/20/2021 14:46:58 - INFO - __main__ - Step 1368: {'lr': 2.2666666666666668e-05, 'samples': 43776, 'steps': 85, 'loss/train': 7.277287483215332} -09/20/2021 14:46:58 - INFO - __main__ - Step 1369: {'lr': 2.2666666666666668e-05, 'samples': 43808, 'steps': 85, 'loss/train': 6.4529619216918945} -09/20/2021 14:46:59 - INFO - __main__ - Step 1370: {'lr': 2.2666666666666668e-05, 'samples': 43840, 'steps': 85, 'loss/train': 7.101344108581543} -09/20/2021 14:47:00 - INFO - __main__ - Step 1371: {'lr': 2.2666666666666668e-05, 'samples': 43872, 'steps': 85, 'loss/train': 6.963600158691406} -09/20/2021 14:47:01 - INFO - __main__ - Step 1372: {'lr': 2.2666666666666668e-05, 'samples': 43904, 'steps': 85, 'loss/train': 6.677740097045898} -09/20/2021 14:47:01 - INFO - __main__ - Step 1373: {'lr': 2.2666666666666668e-05, 'samples': 43936, 'steps': 85, 'loss/train': 6.842301845550537} -09/20/2021 14:47:02 - INFO - __main__ - Step 1374: {'lr': 2.2666666666666668e-05, 'samples': 43968, 'steps': 85, 'loss/train': 7.03646993637085} -09/20/2021 14:47:03 - INFO - __main__ - Step 1375: {'lr': 2.2666666666666668e-05, 'samples': 44000, 'steps': 85, 'loss/train': 8.52812385559082} -09/20/2021 14:47:04 - INFO - __main__ - Step 1376: {'lr': 2.2666666666666668e-05, 'samples': 44032, 'steps': 85, 'loss/train': 7.626333713531494} -09/20/2021 14:47:05 - INFO - __main__ - Step 1377: {'lr': 2.2933333333333333e-05, 'samples': 44064, 'steps': 86, 'loss/train': 7.118978500366211} -09/20/2021 14:47:05 - INFO - __main__ - Step 1378: {'lr': 2.2933333333333333e-05, 'samples': 44096, 'steps': 86, 'loss/train': 7.335729122161865} -09/20/2021 14:47:06 - INFO - __main__ - Step 1379: {'lr': 2.2933333333333333e-05, 'samples': 44128, 'steps': 86, 'loss/train': 6.783117294311523} -09/20/2021 14:47:07 - INFO - __main__ - Step 1380: {'lr': 2.2933333333333333e-05, 'samples': 44160, 'steps': 86, 'loss/train': 6.911933898925781} -09/20/2021 14:47:08 - INFO - __main__ - Step 1381: {'lr': 2.2933333333333333e-05, 'samples': 44192, 'steps': 86, 'loss/train': 7.642375946044922} -09/20/2021 14:47:08 - INFO - __main__ - Step 1382: {'lr': 2.2933333333333333e-05, 'samples': 44224, 'steps': 86, 'loss/train': 7.1238813400268555} -09/20/2021 14:47:09 - INFO - __main__ - Step 1383: {'lr': 2.2933333333333333e-05, 'samples': 44256, 'steps': 86, 'loss/train': 8.120634078979492} -09/20/2021 14:47:10 - INFO - __main__ - Step 1384: {'lr': 2.2933333333333333e-05, 'samples': 44288, 'steps': 86, 'loss/train': 6.563902854919434} -09/20/2021 14:47:11 - INFO - __main__ - Step 1385: {'lr': 2.2933333333333333e-05, 'samples': 44320, 'steps': 86, 'loss/train': 6.8616719245910645} -09/20/2021 14:47:11 - INFO - __main__ - Step 1386: {'lr': 2.2933333333333333e-05, 'samples': 44352, 'steps': 86, 'loss/train': 7.503718376159668} -09/20/2021 14:47:12 - INFO - __main__ - Step 1387: {'lr': 2.2933333333333333e-05, 'samples': 44384, 'steps': 86, 'loss/train': 6.540370464324951} -09/20/2021 14:47:13 - INFO - __main__ - Step 1388: {'lr': 2.2933333333333333e-05, 'samples': 44416, 'steps': 86, 'loss/train': 7.036660194396973} -09/20/2021 14:47:14 - INFO - __main__ - Step 1389: {'lr': 2.2933333333333333e-05, 'samples': 44448, 'steps': 86, 'loss/train': 6.911251068115234} -09/20/2021 14:47:15 - INFO - __main__ - Step 1390: {'lr': 2.2933333333333333e-05, 'samples': 44480, 'steps': 86, 'loss/train': 7.03333044052124} -09/20/2021 14:47:16 - INFO - __main__ - Step 1391: {'lr': 2.2933333333333333e-05, 'samples': 44512, 'steps': 86, 'loss/train': 7.454707622528076} -09/20/2021 14:47:16 - INFO - __main__ - Step 1392: {'lr': 2.2933333333333333e-05, 'samples': 44544, 'steps': 86, 'loss/train': 6.3209028244018555} -09/20/2021 14:47:17 - INFO - __main__ - Step 1393: {'lr': 2.32e-05, 'samples': 44576, 'steps': 87, 'loss/train': 6.844849586486816} -09/20/2021 14:47:18 - INFO - __main__ - Step 1394: {'lr': 2.32e-05, 'samples': 44608, 'steps': 87, 'loss/train': 7.477930068969727} -09/20/2021 14:47:19 - INFO - __main__ - Step 1395: {'lr': 2.32e-05, 'samples': 44640, 'steps': 87, 'loss/train': 6.502898216247559} -09/20/2021 14:47:20 - INFO - __main__ - Step 1396: {'lr': 2.32e-05, 'samples': 44672, 'steps': 87, 'loss/train': 5.911944389343262} -09/20/2021 14:47:20 - INFO - __main__ - Step 1397: {'lr': 2.32e-05, 'samples': 44704, 'steps': 87, 'loss/train': 7.369197845458984} -09/20/2021 14:47:21 - INFO - __main__ - Step 1398: {'lr': 2.32e-05, 'samples': 44736, 'steps': 87, 'loss/train': 7.259982109069824} -09/20/2021 14:47:22 - INFO - __main__ - Step 1399: {'lr': 2.32e-05, 'samples': 44768, 'steps': 87, 'loss/train': 7.27367639541626} -09/20/2021 14:47:23 - INFO - __main__ - Step 1400: {'lr': 2.32e-05, 'samples': 44800, 'steps': 87, 'loss/train': 6.644550323486328} -09/20/2021 14:47:23 - INFO - __main__ - Step 1401: {'lr': 2.32e-05, 'samples': 44832, 'steps': 87, 'loss/train': 6.9535627365112305} -09/20/2021 14:47:24 - INFO - __main__ - Step 1402: {'lr': 2.32e-05, 'samples': 44864, 'steps': 87, 'loss/train': 8.051722526550293} -09/20/2021 14:47:25 - INFO - __main__ - Step 1403: {'lr': 2.32e-05, 'samples': 44896, 'steps': 87, 'loss/train': 7.176924705505371} -09/20/2021 14:47:26 - INFO - __main__ - Step 1404: {'lr': 2.32e-05, 'samples': 44928, 'steps': 87, 'loss/train': 6.824726581573486} -09/20/2021 14:47:26 - INFO - __main__ - Step 1405: {'lr': 2.32e-05, 'samples': 44960, 'steps': 87, 'loss/train': 6.569762706756592} -09/20/2021 14:47:27 - INFO - __main__ - Step 1406: {'lr': 2.32e-05, 'samples': 44992, 'steps': 87, 'loss/train': 7.526116847991943} -09/20/2021 14:47:28 - INFO - __main__ - Step 1407: {'lr': 2.32e-05, 'samples': 45024, 'steps': 87, 'loss/train': 6.847419738769531} -09/20/2021 14:47:29 - INFO - __main__ - Step 1408: {'lr': 2.32e-05, 'samples': 45056, 'steps': 87, 'loss/train': 6.404858112335205} -09/20/2021 14:47:30 - INFO - __main__ - Step 1409: {'lr': 2.3466666666666667e-05, 'samples': 45088, 'steps': 88, 'loss/train': 7.584743022918701} -09/20/2021 14:47:30 - INFO - __main__ - Step 1410: {'lr': 2.3466666666666667e-05, 'samples': 45120, 'steps': 88, 'loss/train': 8.540786743164062} -09/20/2021 14:47:31 - INFO - __main__ - Step 1411: {'lr': 2.3466666666666667e-05, 'samples': 45152, 'steps': 88, 'loss/train': 6.371461391448975} -09/20/2021 14:47:32 - INFO - __main__ - Step 1412: {'lr': 2.3466666666666667e-05, 'samples': 45184, 'steps': 88, 'loss/train': 7.026157379150391} -09/20/2021 14:47:33 - INFO - __main__ - Step 1413: {'lr': 2.3466666666666667e-05, 'samples': 45216, 'steps': 88, 'loss/train': 7.054463863372803} -09/20/2021 14:47:33 - INFO - __main__ - Step 1414: {'lr': 2.3466666666666667e-05, 'samples': 45248, 'steps': 88, 'loss/train': 7.362022399902344} -09/20/2021 14:47:34 - INFO - __main__ - Step 1415: {'lr': 2.3466666666666667e-05, 'samples': 45280, 'steps': 88, 'loss/train': 6.702137470245361} -09/20/2021 14:47:35 - INFO - __main__ - Step 1416: {'lr': 2.3466666666666667e-05, 'samples': 45312, 'steps': 88, 'loss/train': 6.812434196472168} -09/20/2021 14:47:36 - INFO - __main__ - Step 1417: {'lr': 2.3466666666666667e-05, 'samples': 45344, 'steps': 88, 'loss/train': 6.856886863708496} -09/20/2021 14:47:36 - INFO - __main__ - Step 1418: {'lr': 2.3466666666666667e-05, 'samples': 45376, 'steps': 88, 'loss/train': 6.737428188323975} -09/20/2021 14:47:37 - INFO - __main__ - Step 1419: {'lr': 2.3466666666666667e-05, 'samples': 45408, 'steps': 88, 'loss/train': 7.354835510253906} -09/20/2021 14:47:38 - INFO - __main__ - Step 1420: {'lr': 2.3466666666666667e-05, 'samples': 45440, 'steps': 88, 'loss/train': 6.784587860107422} -09/20/2021 14:47:39 - INFO - __main__ - Step 1421: {'lr': 2.3466666666666667e-05, 'samples': 45472, 'steps': 88, 'loss/train': 7.590674877166748} -09/20/2021 14:47:40 - INFO - __main__ - Step 1422: {'lr': 2.3466666666666667e-05, 'samples': 45504, 'steps': 88, 'loss/train': 7.4544758796691895} -09/20/2021 14:47:41 - INFO - __main__ - Step 1423: {'lr': 2.3466666666666667e-05, 'samples': 45536, 'steps': 88, 'loss/train': 6.927024841308594} -09/20/2021 14:47:41 - INFO - __main__ - Step 1424: {'lr': 2.3466666666666667e-05, 'samples': 45568, 'steps': 88, 'loss/train': 7.488018035888672} -09/20/2021 14:47:42 - INFO - __main__ - Step 1425: {'lr': 2.3733333333333335e-05, 'samples': 45600, 'steps': 89, 'loss/train': 6.5541157722473145} -09/20/2021 14:47:43 - INFO - __main__ - Step 1426: {'lr': 2.3733333333333335e-05, 'samples': 45632, 'steps': 89, 'loss/train': 7.0528950691223145} -09/20/2021 14:47:44 - INFO - __main__ - Step 1427: {'lr': 2.3733333333333335e-05, 'samples': 45664, 'steps': 89, 'loss/train': 6.543478488922119} -09/20/2021 14:47:44 - INFO - __main__ - Step 1428: {'lr': 2.3733333333333335e-05, 'samples': 45696, 'steps': 89, 'loss/train': 6.711031436920166} -09/20/2021 14:47:45 - INFO - __main__ - Step 1429: {'lr': 2.3733333333333335e-05, 'samples': 45728, 'steps': 89, 'loss/train': 7.85757303237915} -09/20/2021 14:47:46 - INFO - __main__ - Step 1430: {'lr': 2.3733333333333335e-05, 'samples': 45760, 'steps': 89, 'loss/train': 7.264464855194092} -09/20/2021 14:47:47 - INFO - __main__ - Step 1431: {'lr': 2.3733333333333335e-05, 'samples': 45792, 'steps': 89, 'loss/train': 7.949660301208496} -09/20/2021 14:47:47 - INFO - __main__ - Step 1432: {'lr': 2.3733333333333335e-05, 'samples': 45824, 'steps': 89, 'loss/train': 7.820850372314453} -09/20/2021 14:47:48 - INFO - __main__ - Step 1433: {'lr': 2.3733333333333335e-05, 'samples': 45856, 'steps': 89, 'loss/train': 7.533621311187744} -09/20/2021 14:47:49 - INFO - __main__ - Step 1434: {'lr': 2.3733333333333335e-05, 'samples': 45888, 'steps': 89, 'loss/train': 6.951545238494873} -09/20/2021 14:47:50 - INFO - __main__ - Step 1435: {'lr': 2.3733333333333335e-05, 'samples': 45920, 'steps': 89, 'loss/train': 7.220393180847168} -09/20/2021 14:47:50 - INFO - __main__ - Step 1436: {'lr': 2.3733333333333335e-05, 'samples': 45952, 'steps': 89, 'loss/train': 6.949118614196777} -09/20/2021 14:47:51 - INFO - __main__ - Step 1437: {'lr': 2.3733333333333335e-05, 'samples': 45984, 'steps': 89, 'loss/train': 6.752927780151367} -09/20/2021 14:47:52 - INFO - __main__ - Step 1438: {'lr': 2.3733333333333335e-05, 'samples': 46016, 'steps': 89, 'loss/train': 6.300153732299805} -09/20/2021 14:47:53 - INFO - __main__ - Step 1439: {'lr': 2.3733333333333335e-05, 'samples': 46048, 'steps': 89, 'loss/train': 7.4598469734191895} -09/20/2021 14:47:53 - INFO - __main__ - Step 1440: {'lr': 2.3733333333333335e-05, 'samples': 46080, 'steps': 89, 'loss/train': 7.23174524307251} -09/20/2021 14:47:54 - INFO - __main__ - Step 1441: {'lr': 2.4e-05, 'samples': 46112, 'steps': 90, 'loss/train': 6.993157386779785} -09/20/2021 14:47:55 - INFO - __main__ - Step 1442: {'lr': 2.4e-05, 'samples': 46144, 'steps': 90, 'loss/train': 7.203760623931885} -09/20/2021 14:47:56 - INFO - __main__ - Step 1443: {'lr': 2.4e-05, 'samples': 46176, 'steps': 90, 'loss/train': 6.821300506591797} -09/20/2021 14:47:57 - INFO - __main__ - Step 1444: {'lr': 2.4e-05, 'samples': 46208, 'steps': 90, 'loss/train': 7.938205718994141} -09/20/2021 14:47:57 - INFO - __main__ - Step 1445: {'lr': 2.4e-05, 'samples': 46240, 'steps': 90, 'loss/train': 7.3755059242248535} -09/20/2021 14:47:58 - INFO - __main__ - Step 1446: {'lr': 2.4e-05, 'samples': 46272, 'steps': 90, 'loss/train': 7.104341506958008} -09/20/2021 14:47:59 - INFO - __main__ - Step 1447: {'lr': 2.4e-05, 'samples': 46304, 'steps': 90, 'loss/train': 6.886888027191162} -09/20/2021 14:48:00 - INFO - __main__ - Step 1448: {'lr': 2.4e-05, 'samples': 46336, 'steps': 90, 'loss/train': 7.115821361541748} -09/20/2021 14:48:00 - INFO - __main__ - Step 1449: {'lr': 2.4e-05, 'samples': 46368, 'steps': 90, 'loss/train': 7.48318338394165} -09/20/2021 14:48:01 - INFO - __main__ - Step 1450: {'lr': 2.4e-05, 'samples': 46400, 'steps': 90, 'loss/train': 7.245957374572754} -09/20/2021 14:48:02 - INFO - __main__ - Step 1451: {'lr': 2.4e-05, 'samples': 46432, 'steps': 90, 'loss/train': 6.759549140930176} -09/20/2021 14:48:03 - INFO - __main__ - Step 1452: {'lr': 2.4e-05, 'samples': 46464, 'steps': 90, 'loss/train': 6.913377285003662} -09/20/2021 14:48:04 - INFO - __main__ - Step 1453: {'lr': 2.4e-05, 'samples': 46496, 'steps': 90, 'loss/train': 6.953636646270752} -09/20/2021 14:48:05 - INFO - __main__ - Step 1454: {'lr': 2.4e-05, 'samples': 46528, 'steps': 90, 'loss/train': 6.770787715911865} -09/20/2021 14:48:06 - INFO - __main__ - Step 1455: {'lr': 2.4e-05, 'samples': 46560, 'steps': 90, 'loss/train': 6.510721206665039} -09/20/2021 14:48:07 - INFO - __main__ - Step 1456: {'lr': 2.4e-05, 'samples': 46592, 'steps': 90, 'loss/train': 7.637651443481445} -09/20/2021 14:48:07 - INFO - __main__ - Step 1457: {'lr': 2.426666666666667e-05, 'samples': 46624, 'steps': 91, 'loss/train': 7.167266845703125} -09/20/2021 14:48:08 - INFO - __main__ - Step 1458: {'lr': 2.426666666666667e-05, 'samples': 46656, 'steps': 91, 'loss/train': 6.141096115112305} -09/20/2021 14:48:09 - INFO - __main__ - Step 1459: {'lr': 2.426666666666667e-05, 'samples': 46688, 'steps': 91, 'loss/train': 6.601771354675293} -09/20/2021 14:48:10 - INFO - __main__ - Step 1460: {'lr': 2.426666666666667e-05, 'samples': 46720, 'steps': 91, 'loss/train': 6.748319149017334} -09/20/2021 14:48:10 - INFO - __main__ - Step 1461: {'lr': 2.426666666666667e-05, 'samples': 46752, 'steps': 91, 'loss/train': 7.338825225830078} -09/20/2021 14:48:11 - INFO - __main__ - Step 1462: {'lr': 2.426666666666667e-05, 'samples': 46784, 'steps': 91, 'loss/train': 6.81221866607666} -09/20/2021 14:48:12 - INFO - __main__ - Step 1463: {'lr': 2.426666666666667e-05, 'samples': 46816, 'steps': 91, 'loss/train': 7.151991367340088} -09/20/2021 14:48:13 - INFO - __main__ - Step 1464: {'lr': 2.426666666666667e-05, 'samples': 46848, 'steps': 91, 'loss/train': 6.742116928100586} -09/20/2021 14:48:13 - INFO - __main__ - Step 1465: {'lr': 2.426666666666667e-05, 'samples': 46880, 'steps': 91, 'loss/train': 6.72812557220459} -09/20/2021 14:48:14 - INFO - __main__ - Step 1466: {'lr': 2.426666666666667e-05, 'samples': 46912, 'steps': 91, 'loss/train': 6.386335849761963} -09/20/2021 14:48:15 - INFO - __main__ - Step 1467: {'lr': 2.426666666666667e-05, 'samples': 46944, 'steps': 91, 'loss/train': 6.939550876617432} -09/20/2021 14:48:16 - INFO - __main__ - Step 1468: {'lr': 2.426666666666667e-05, 'samples': 46976, 'steps': 91, 'loss/train': 5.993419647216797} -09/20/2021 14:48:16 - INFO - __main__ - Step 1469: {'lr': 2.426666666666667e-05, 'samples': 47008, 'steps': 91, 'loss/train': 6.852316379547119} -09/20/2021 14:48:17 - INFO - __main__ - Step 1470: {'lr': 2.426666666666667e-05, 'samples': 47040, 'steps': 91, 'loss/train': 8.372739791870117} -09/20/2021 14:48:18 - INFO - __main__ - Step 1471: {'lr': 2.426666666666667e-05, 'samples': 47072, 'steps': 91, 'loss/train': 8.221210479736328} -09/20/2021 14:48:19 - INFO - __main__ - Step 1472: {'lr': 2.426666666666667e-05, 'samples': 47104, 'steps': 91, 'loss/train': 8.441248893737793} -09/20/2021 14:48:20 - INFO - __main__ - Step 1473: {'lr': 2.4533333333333334e-05, 'samples': 47136, 'steps': 92, 'loss/train': 8.363396644592285} -09/20/2021 14:48:20 - INFO - __main__ - Step 1474: {'lr': 2.4533333333333334e-05, 'samples': 47168, 'steps': 92, 'loss/train': 8.292197227478027} -09/20/2021 14:48:21 - INFO - __main__ - Step 1475: {'lr': 2.4533333333333334e-05, 'samples': 47200, 'steps': 92, 'loss/train': 8.348638534545898} -09/20/2021 14:48:22 - INFO - __main__ - Step 1476: {'lr': 2.4533333333333334e-05, 'samples': 47232, 'steps': 92, 'loss/train': 7.018089294433594} -09/20/2021 14:48:23 - INFO - __main__ - Step 1477: {'lr': 2.4533333333333334e-05, 'samples': 47264, 'steps': 92, 'loss/train': 5.8551859855651855} -09/20/2021 14:48:23 - INFO - __main__ - Step 1478: {'lr': 2.4533333333333334e-05, 'samples': 47296, 'steps': 92, 'loss/train': 7.832219123840332} -09/20/2021 14:48:24 - INFO - __main__ - Step 1479: {'lr': 2.4533333333333334e-05, 'samples': 47328, 'steps': 92, 'loss/train': 8.604214668273926} -09/20/2021 14:48:25 - INFO - __main__ - Step 1480: {'lr': 2.4533333333333334e-05, 'samples': 47360, 'steps': 92, 'loss/train': 8.518714904785156} -09/20/2021 14:48:26 - INFO - __main__ - Step 1481: {'lr': 2.4533333333333334e-05, 'samples': 47392, 'steps': 92, 'loss/train': 7.438953876495361} -09/20/2021 14:48:26 - INFO - __main__ - Step 1482: {'lr': 2.4533333333333334e-05, 'samples': 47424, 'steps': 92, 'loss/train': 6.600265979766846} -09/20/2021 14:48:27 - INFO - __main__ - Step 1483: {'lr': 2.4533333333333334e-05, 'samples': 47456, 'steps': 92, 'loss/train': 6.552595138549805} -09/20/2021 14:48:28 - INFO - __main__ - Step 1484: {'lr': 2.4533333333333334e-05, 'samples': 47488, 'steps': 92, 'loss/train': 7.032143592834473} -09/20/2021 14:48:29 - INFO - __main__ - Step 1485: {'lr': 2.4533333333333334e-05, 'samples': 47520, 'steps': 92, 'loss/train': 7.188249111175537} -09/20/2021 14:48:30 - INFO - __main__ - Step 1486: {'lr': 2.4533333333333334e-05, 'samples': 47552, 'steps': 92, 'loss/train': 7.181334972381592} -09/20/2021 14:48:31 - INFO - __main__ - Step 1487: {'lr': 2.4533333333333334e-05, 'samples': 47584, 'steps': 92, 'loss/train': 7.373607635498047} -09/20/2021 14:48:31 - INFO - __main__ - Step 1488: {'lr': 2.4533333333333334e-05, 'samples': 47616, 'steps': 92, 'loss/train': 6.817178249359131} -09/20/2021 14:48:32 - INFO - __main__ - Step 1489: {'lr': 2.48e-05, 'samples': 47648, 'steps': 93, 'loss/train': 7.146844863891602} -09/20/2021 14:48:33 - INFO - __main__ - Step 1490: {'lr': 2.48e-05, 'samples': 47680, 'steps': 93, 'loss/train': 7.098081111907959} -09/20/2021 14:48:34 - INFO - __main__ - Step 1491: {'lr': 2.48e-05, 'samples': 47712, 'steps': 93, 'loss/train': 6.9285478591918945} -09/20/2021 14:48:34 - INFO - __main__ - Step 1492: {'lr': 2.48e-05, 'samples': 47744, 'steps': 93, 'loss/train': 6.576025485992432} -09/20/2021 14:48:35 - INFO - __main__ - Step 1493: {'lr': 2.48e-05, 'samples': 47776, 'steps': 93, 'loss/train': 7.061032772064209} -09/20/2021 14:48:36 - INFO - __main__ - Step 1494: {'lr': 2.48e-05, 'samples': 47808, 'steps': 93, 'loss/train': 7.49500846862793} -09/20/2021 14:48:37 - INFO - __main__ - Step 1495: {'lr': 2.48e-05, 'samples': 47840, 'steps': 93, 'loss/train': 7.316258430480957} -09/20/2021 14:48:37 - INFO - __main__ - Step 1496: {'lr': 2.48e-05, 'samples': 47872, 'steps': 93, 'loss/train': 6.758616924285889} -09/20/2021 14:48:38 - INFO - __main__ - Step 1497: {'lr': 2.48e-05, 'samples': 47904, 'steps': 93, 'loss/train': 5.052849292755127} -09/20/2021 14:48:39 - INFO - __main__ - Step 1498: {'lr': 2.48e-05, 'samples': 47936, 'steps': 93, 'loss/train': 6.500176906585693} -09/20/2021 14:48:40 - INFO - __main__ - Step 1499: {'lr': 2.48e-05, 'samples': 47968, 'steps': 93, 'loss/train': 6.452937602996826} -09/20/2021 14:48:40 - INFO - __main__ - Step 1500: {'lr': 2.48e-05, 'samples': 48000, 'steps': 93, 'loss/train': 6.290328502655029} -09/20/2021 14:48:41 - INFO - __main__ - Step 1501: {'lr': 2.48e-05, 'samples': 48032, 'steps': 93, 'loss/train': 7.493202209472656} -09/20/2021 14:48:42 - INFO - __main__ - Step 1502: {'lr': 2.48e-05, 'samples': 48064, 'steps': 93, 'loss/train': 7.8693037033081055} -09/20/2021 14:48:43 - INFO - __main__ - Step 1503: {'lr': 2.48e-05, 'samples': 48096, 'steps': 93, 'loss/train': 6.392000675201416} -09/20/2021 14:48:43 - INFO - __main__ - Step 1504: {'lr': 2.48e-05, 'samples': 48128, 'steps': 93, 'loss/train': 6.990300178527832} -09/20/2021 14:48:44 - INFO - __main__ - Step 1505: {'lr': 2.5066666666666665e-05, 'samples': 48160, 'steps': 94, 'loss/train': 7.167797088623047} -09/20/2021 14:48:45 - INFO - __main__ - Step 1506: {'lr': 2.5066666666666665e-05, 'samples': 48192, 'steps': 94, 'loss/train': 5.30214262008667} -09/20/2021 14:48:46 - INFO - __main__ - Step 1507: {'lr': 2.5066666666666665e-05, 'samples': 48224, 'steps': 94, 'loss/train': 7.540078163146973} -09/20/2021 14:48:47 - INFO - __main__ - Step 1508: {'lr': 2.5066666666666665e-05, 'samples': 48256, 'steps': 94, 'loss/train': 6.679651260375977} -09/20/2021 14:48:47 - INFO - __main__ - Step 1509: {'lr': 2.5066666666666665e-05, 'samples': 48288, 'steps': 94, 'loss/train': 6.330169677734375} -09/20/2021 14:48:48 - INFO - __main__ - Step 1510: {'lr': 2.5066666666666665e-05, 'samples': 48320, 'steps': 94, 'loss/train': 7.244390964508057} -09/20/2021 14:48:49 - INFO - __main__ - Step 1511: {'lr': 2.5066666666666665e-05, 'samples': 48352, 'steps': 94, 'loss/train': 5.392919063568115} -09/20/2021 14:48:50 - INFO - __main__ - Step 1512: {'lr': 2.5066666666666665e-05, 'samples': 48384, 'steps': 94, 'loss/train': 7.171425819396973} -09/20/2021 14:48:50 - INFO - __main__ - Step 1513: {'lr': 2.5066666666666665e-05, 'samples': 48416, 'steps': 94, 'loss/train': 7.288106441497803} -09/20/2021 14:48:51 - INFO - __main__ - Step 1514: {'lr': 2.5066666666666665e-05, 'samples': 48448, 'steps': 94, 'loss/train': 6.59630012512207} -09/20/2021 14:48:52 - INFO - __main__ - Step 1515: {'lr': 2.5066666666666665e-05, 'samples': 48480, 'steps': 94, 'loss/train': 6.981513023376465} -09/20/2021 14:48:53 - INFO - __main__ - Step 1516: {'lr': 2.5066666666666665e-05, 'samples': 48512, 'steps': 94, 'loss/train': 6.597629547119141} -09/20/2021 14:48:54 - INFO - __main__ - Step 1517: {'lr': 2.5066666666666665e-05, 'samples': 48544, 'steps': 94, 'loss/train': 7.655509948730469} -09/20/2021 14:48:55 - INFO - __main__ - Step 1518: {'lr': 2.5066666666666665e-05, 'samples': 48576, 'steps': 94, 'loss/train': 6.515892028808594} -09/20/2021 14:48:55 - INFO - __main__ - Step 1519: {'lr': 2.5066666666666665e-05, 'samples': 48608, 'steps': 94, 'loss/train': 7.455440998077393} -09/20/2021 14:48:56 - INFO - __main__ - Step 1520: {'lr': 2.5066666666666665e-05, 'samples': 48640, 'steps': 94, 'loss/train': 7.360893726348877} -09/20/2021 14:48:57 - INFO - __main__ - Step 1521: {'lr': 2.5333333333333337e-05, 'samples': 48672, 'steps': 95, 'loss/train': 7.059614658355713} -09/20/2021 14:48:58 - INFO - __main__ - Step 1522: {'lr': 2.5333333333333337e-05, 'samples': 48704, 'steps': 95, 'loss/train': 7.533706188201904} -09/20/2021 14:48:59 - INFO - __main__ - Step 1523: {'lr': 2.5333333333333337e-05, 'samples': 48736, 'steps': 95, 'loss/train': 6.92440938949585} -09/20/2021 14:48:59 - INFO - __main__ - Step 1524: {'lr': 2.5333333333333337e-05, 'samples': 48768, 'steps': 95, 'loss/train': 6.711199760437012} -09/20/2021 14:49:00 - INFO - __main__ - Step 1525: {'lr': 2.5333333333333337e-05, 'samples': 48800, 'steps': 95, 'loss/train': 7.405246734619141} -09/20/2021 14:49:01 - INFO - __main__ - Step 1526: {'lr': 2.5333333333333337e-05, 'samples': 48832, 'steps': 95, 'loss/train': 6.883022785186768} -09/20/2021 14:49:02 - INFO - __main__ - Step 1527: {'lr': 2.5333333333333337e-05, 'samples': 48864, 'steps': 95, 'loss/train': 6.746815204620361} -09/20/2021 14:49:02 - INFO - __main__ - Step 1528: {'lr': 2.5333333333333337e-05, 'samples': 48896, 'steps': 95, 'loss/train': 7.168659687042236} -09/20/2021 14:49:03 - INFO - __main__ - Step 1529: {'lr': 2.5333333333333337e-05, 'samples': 48928, 'steps': 95, 'loss/train': 7.281334400177002} -09/20/2021 14:49:04 - INFO - __main__ - Step 1530: {'lr': 2.5333333333333337e-05, 'samples': 48960, 'steps': 95, 'loss/train': 6.875681400299072} -09/20/2021 14:49:05 - INFO - __main__ - Step 1531: {'lr': 2.5333333333333337e-05, 'samples': 48992, 'steps': 95, 'loss/train': 6.417508125305176} -09/20/2021 14:49:05 - INFO - __main__ - Step 1532: {'lr': 2.5333333333333337e-05, 'samples': 49024, 'steps': 95, 'loss/train': 7.8816022872924805} -09/20/2021 14:49:06 - INFO - __main__ - Step 1533: {'lr': 2.5333333333333337e-05, 'samples': 49056, 'steps': 95, 'loss/train': 5.779340744018555} -09/20/2021 14:49:07 - INFO - __main__ - Step 1534: {'lr': 2.5333333333333337e-05, 'samples': 49088, 'steps': 95, 'loss/train': 7.697337627410889} -09/20/2021 14:49:08 - INFO - __main__ - Step 1535: {'lr': 2.5333333333333337e-05, 'samples': 49120, 'steps': 95, 'loss/train': 6.832186222076416} -09/20/2021 14:49:08 - INFO - __main__ - Step 1536: {'lr': 2.5333333333333337e-05, 'samples': 49152, 'steps': 95, 'loss/train': 6.965168476104736} -09/20/2021 14:49:09 - INFO - __main__ - Step 1537: {'lr': 2.5600000000000002e-05, 'samples': 49184, 'steps': 96, 'loss/train': 7.183069705963135} -09/20/2021 14:49:10 - INFO - __main__ - Step 1538: {'lr': 2.5600000000000002e-05, 'samples': 49216, 'steps': 96, 'loss/train': 7.554845333099365} -09/20/2021 14:49:11 - INFO - __main__ - Step 1539: {'lr': 2.5600000000000002e-05, 'samples': 49248, 'steps': 96, 'loss/train': 7.284695148468018} -09/20/2021 14:49:11 - INFO - __main__ - Step 1540: {'lr': 2.5600000000000002e-05, 'samples': 49280, 'steps': 96, 'loss/train': 7.142947196960449} -09/20/2021 14:49:12 - INFO - __main__ - Step 1541: {'lr': 2.5600000000000002e-05, 'samples': 49312, 'steps': 96, 'loss/train': 6.46863317489624} -09/20/2021 14:49:13 - INFO - __main__ - Step 1542: {'lr': 2.5600000000000002e-05, 'samples': 49344, 'steps': 96, 'loss/train': 7.5153021812438965} -09/20/2021 14:49:14 - INFO - __main__ - Step 1543: {'lr': 2.5600000000000002e-05, 'samples': 49376, 'steps': 96, 'loss/train': 7.349370956420898} -09/20/2021 14:49:14 - INFO - __main__ - Step 1544: {'lr': 2.5600000000000002e-05, 'samples': 49408, 'steps': 96, 'loss/train': 7.035388946533203} -09/20/2021 14:49:16 - INFO - __main__ - Step 1545: {'lr': 2.5600000000000002e-05, 'samples': 49440, 'steps': 96, 'loss/train': 7.193082809448242} -09/20/2021 14:49:17 - INFO - __main__ - Step 1546: {'lr': 2.5600000000000002e-05, 'samples': 49472, 'steps': 96, 'loss/train': 6.463040828704834} -09/20/2021 14:49:18 - INFO - __main__ - Step 1547: {'lr': 2.5600000000000002e-05, 'samples': 49504, 'steps': 96, 'loss/train': 6.618950843811035} -09/20/2021 14:49:18 - INFO - __main__ - Step 1548: {'lr': 2.5600000000000002e-05, 'samples': 49536, 'steps': 96, 'loss/train': 7.661174774169922} -09/20/2021 14:49:19 - INFO - __main__ - Step 1549: {'lr': 2.5600000000000002e-05, 'samples': 49568, 'steps': 96, 'loss/train': 6.755197048187256} -09/20/2021 14:49:20 - INFO - __main__ - Step 1550: {'lr': 2.5600000000000002e-05, 'samples': 49600, 'steps': 96, 'loss/train': 6.818697452545166} -09/20/2021 14:49:21 - INFO - __main__ - Step 1551: {'lr': 2.5600000000000002e-05, 'samples': 49632, 'steps': 96, 'loss/train': 6.781591892242432} -09/20/2021 14:49:21 - INFO - __main__ - Step 1552: {'lr': 2.5600000000000002e-05, 'samples': 49664, 'steps': 96, 'loss/train': 6.014730930328369} -09/20/2021 14:49:22 - INFO - __main__ - Step 1553: {'lr': 2.5866666666666667e-05, 'samples': 49696, 'steps': 97, 'loss/train': 5.978657245635986} -09/20/2021 14:49:23 - INFO - __main__ - Step 1554: {'lr': 2.5866666666666667e-05, 'samples': 49728, 'steps': 97, 'loss/train': 6.531246662139893} -09/20/2021 14:49:24 - INFO - __main__ - Step 1555: {'lr': 2.5866666666666667e-05, 'samples': 49760, 'steps': 97, 'loss/train': 7.368689060211182} -09/20/2021 14:49:24 - INFO - __main__ - Step 1556: {'lr': 2.5866666666666667e-05, 'samples': 49792, 'steps': 97, 'loss/train': 6.2098870277404785} -09/20/2021 14:49:25 - INFO - __main__ - Step 1557: {'lr': 2.5866666666666667e-05, 'samples': 49824, 'steps': 97, 'loss/train': 5.639039993286133} -09/20/2021 14:49:26 - INFO - __main__ - Step 1558: {'lr': 2.5866666666666667e-05, 'samples': 49856, 'steps': 97, 'loss/train': 6.306752681732178} -09/20/2021 14:49:27 - INFO - __main__ - Step 1559: {'lr': 2.5866666666666667e-05, 'samples': 49888, 'steps': 97, 'loss/train': 6.368741035461426} -09/20/2021 14:49:27 - INFO - __main__ - Step 1560: {'lr': 2.5866666666666667e-05, 'samples': 49920, 'steps': 97, 'loss/train': 6.6494035720825195} -09/20/2021 14:49:28 - INFO - __main__ - Step 1561: {'lr': 2.5866666666666667e-05, 'samples': 49952, 'steps': 97, 'loss/train': 6.343544006347656} -09/20/2021 14:49:29 - INFO - __main__ - Step 1562: {'lr': 2.5866666666666667e-05, 'samples': 49984, 'steps': 97, 'loss/train': 6.463551998138428} -09/20/2021 14:49:30 - INFO - __main__ - Step 1563: {'lr': 2.5866666666666667e-05, 'samples': 50016, 'steps': 97, 'loss/train': 6.403754234313965} -09/20/2021 14:49:30 - INFO - __main__ - Step 1564: {'lr': 2.5866666666666667e-05, 'samples': 50048, 'steps': 97, 'loss/train': 6.922320365905762} -09/20/2021 14:49:31 - INFO - __main__ - Step 1565: {'lr': 2.5866666666666667e-05, 'samples': 50080, 'steps': 97, 'loss/train': 7.108663082122803} -09/20/2021 14:49:32 - INFO - __main__ - Step 1566: {'lr': 2.5866666666666667e-05, 'samples': 50112, 'steps': 97, 'loss/train': 6.783005237579346} -09/20/2021 14:49:33 - INFO - __main__ - Step 1567: {'lr': 2.5866666666666667e-05, 'samples': 50144, 'steps': 97, 'loss/train': 7.21034574508667} -09/20/2021 14:49:33 - INFO - __main__ - Step 1568: {'lr': 2.5866666666666667e-05, 'samples': 50176, 'steps': 97, 'loss/train': 7.063425540924072} -09/20/2021 14:49:34 - INFO - __main__ - Step 1569: {'lr': 2.6133333333333333e-05, 'samples': 50208, 'steps': 98, 'loss/train': 7.416402339935303} -09/20/2021 14:49:35 - INFO - __main__ - Step 1570: {'lr': 2.6133333333333333e-05, 'samples': 50240, 'steps': 98, 'loss/train': 6.458004474639893} -09/20/2021 14:49:36 - INFO - __main__ - Step 1571: {'lr': 2.6133333333333333e-05, 'samples': 50272, 'steps': 98, 'loss/train': 6.572519302368164} -09/20/2021 14:49:37 - INFO - __main__ - Step 1572: {'lr': 2.6133333333333333e-05, 'samples': 50304, 'steps': 98, 'loss/train': 7.31736946105957} -09/20/2021 14:49:37 - INFO - __main__ - Step 1573: {'lr': 2.6133333333333333e-05, 'samples': 50336, 'steps': 98, 'loss/train': 6.803414821624756} -09/20/2021 14:49:38 - INFO - __main__ - Step 1574: {'lr': 2.6133333333333333e-05, 'samples': 50368, 'steps': 98, 'loss/train': 6.896745204925537} -09/20/2021 14:49:39 - INFO - __main__ - Step 1575: {'lr': 2.6133333333333333e-05, 'samples': 50400, 'steps': 98, 'loss/train': 6.348362445831299} -09/20/2021 14:49:41 - INFO - __main__ - Step 1576: {'lr': 2.6133333333333333e-05, 'samples': 50432, 'steps': 98, 'loss/train': 7.024401664733887} -09/20/2021 14:49:41 - INFO - __main__ - Step 1577: {'lr': 2.6133333333333333e-05, 'samples': 50464, 'steps': 98, 'loss/train': 7.477882385253906} -09/20/2021 14:49:42 - INFO - __main__ - Step 1578: {'lr': 2.6133333333333333e-05, 'samples': 50496, 'steps': 98, 'loss/train': 8.07170581817627} -09/20/2021 14:49:43 - INFO - __main__ - Step 1579: {'lr': 2.6133333333333333e-05, 'samples': 50528, 'steps': 98, 'loss/train': 6.374888896942139} -09/20/2021 14:49:44 - INFO - __main__ - Step 1580: {'lr': 2.6133333333333333e-05, 'samples': 50560, 'steps': 98, 'loss/train': 6.725752830505371} -09/20/2021 14:49:44 - INFO - __main__ - Step 1581: {'lr': 2.6133333333333333e-05, 'samples': 50592, 'steps': 98, 'loss/train': 7.198315143585205} -09/20/2021 14:49:45 - INFO - __main__ - Step 1582: {'lr': 2.6133333333333333e-05, 'samples': 50624, 'steps': 98, 'loss/train': 6.646998882293701} -09/20/2021 14:49:46 - INFO - __main__ - Step 1583: {'lr': 2.6133333333333333e-05, 'samples': 50656, 'steps': 98, 'loss/train': 7.599323749542236} -09/20/2021 14:49:47 - INFO - __main__ - Step 1584: {'lr': 2.6133333333333333e-05, 'samples': 50688, 'steps': 98, 'loss/train': 6.270210266113281} -09/20/2021 14:49:48 - INFO - __main__ - Step 1585: {'lr': 2.64e-05, 'samples': 50720, 'steps': 99, 'loss/train': 7.650453567504883} -09/20/2021 14:49:48 - INFO - __main__ - Step 1586: {'lr': 2.64e-05, 'samples': 50752, 'steps': 99, 'loss/train': 6.982351779937744} -09/20/2021 14:49:49 - INFO - __main__ - Step 1587: {'lr': 2.64e-05, 'samples': 50784, 'steps': 99, 'loss/train': 6.560462474822998} -09/20/2021 14:49:50 - INFO - __main__ - Step 1588: {'lr': 2.64e-05, 'samples': 50816, 'steps': 99, 'loss/train': 7.012301921844482} -09/20/2021 14:49:51 - INFO - __main__ - Step 1589: {'lr': 2.64e-05, 'samples': 50848, 'steps': 99, 'loss/train': 5.96284294128418} -09/20/2021 14:49:51 - INFO - __main__ - Step 1590: {'lr': 2.64e-05, 'samples': 50880, 'steps': 99, 'loss/train': 6.854204177856445} -09/20/2021 14:49:52 - INFO - __main__ - Step 1591: {'lr': 2.64e-05, 'samples': 50912, 'steps': 99, 'loss/train': 7.292349338531494} -09/20/2021 14:49:53 - INFO - __main__ - Step 1592: {'lr': 2.64e-05, 'samples': 50944, 'steps': 99, 'loss/train': 6.762490272521973} -09/20/2021 14:49:54 - INFO - __main__ - Step 1593: {'lr': 2.64e-05, 'samples': 50976, 'steps': 99, 'loss/train': 6.466850757598877} -09/20/2021 14:49:54 - INFO - __main__ - Step 1594: {'lr': 2.64e-05, 'samples': 51008, 'steps': 99, 'loss/train': 7.333856105804443} -09/20/2021 14:49:55 - INFO - __main__ - Step 1595: {'lr': 2.64e-05, 'samples': 51040, 'steps': 99, 'loss/train': 6.90199613571167} -09/20/2021 14:49:56 - INFO - __main__ - Step 1596: {'lr': 2.64e-05, 'samples': 51072, 'steps': 99, 'loss/train': 5.800666332244873} -09/20/2021 14:49:57 - INFO - __main__ - Step 1597: {'lr': 2.64e-05, 'samples': 51104, 'steps': 99, 'loss/train': 6.823329448699951} -09/20/2021 14:49:57 - INFO - __main__ - Step 1598: {'lr': 2.64e-05, 'samples': 51136, 'steps': 99, 'loss/train': 6.857178211212158} -09/20/2021 14:49:58 - INFO - __main__ - Step 1599: {'lr': 2.64e-05, 'samples': 51168, 'steps': 99, 'loss/train': 7.036200046539307} -09/20/2021 14:49:59 - INFO - __main__ - Step 1600: {'lr': 2.64e-05, 'samples': 51200, 'steps': 99, 'loss/train': 6.250958442687988} -09/20/2021 14:50:00 - INFO - __main__ - Step 1601: {'lr': 2.6666666666666667e-05, 'samples': 51232, 'steps': 100, 'loss/train': 6.749054908752441} -09/20/2021 14:50:00 - INFO - __main__ - Step 1602: {'lr': 2.6666666666666667e-05, 'samples': 51264, 'steps': 100, 'loss/train': 6.5865960121154785} -09/20/2021 14:50:01 - INFO - __main__ - Step 1603: {'lr': 2.6666666666666667e-05, 'samples': 51296, 'steps': 100, 'loss/train': 6.857900619506836} -09/20/2021 14:50:02 - INFO - __main__ - Step 1604: {'lr': 2.6666666666666667e-05, 'samples': 51328, 'steps': 100, 'loss/train': 6.325868129730225} -09/20/2021 14:50:03 - INFO - __main__ - Step 1605: {'lr': 2.6666666666666667e-05, 'samples': 51360, 'steps': 100, 'loss/train': 6.559368133544922} -09/20/2021 14:50:04 - INFO - __main__ - Step 1606: {'lr': 2.6666666666666667e-05, 'samples': 51392, 'steps': 100, 'loss/train': 6.909264087677002} -09/20/2021 14:50:05 - INFO - __main__ - Step 1607: {'lr': 2.6666666666666667e-05, 'samples': 51424, 'steps': 100, 'loss/train': 7.3712639808654785} -09/20/2021 14:50:06 - INFO - __main__ - Step 1608: {'lr': 2.6666666666666667e-05, 'samples': 51456, 'steps': 100, 'loss/train': 6.704596042633057} -09/20/2021 14:50:07 - INFO - __main__ - Step 1609: {'lr': 2.6666666666666667e-05, 'samples': 51488, 'steps': 100, 'loss/train': 6.477755069732666} -09/20/2021 14:50:07 - INFO - __main__ - Step 1610: {'lr': 2.6666666666666667e-05, 'samples': 51520, 'steps': 100, 'loss/train': 6.859336853027344} -09/20/2021 14:50:08 - INFO - __main__ - Step 1611: {'lr': 2.6666666666666667e-05, 'samples': 51552, 'steps': 100, 'loss/train': 6.841298580169678} -09/20/2021 14:50:09 - INFO - __main__ - Step 1612: {'lr': 2.6666666666666667e-05, 'samples': 51584, 'steps': 100, 'loss/train': 8.306269645690918} -09/20/2021 14:50:10 - INFO - __main__ - Step 1613: {'lr': 2.6666666666666667e-05, 'samples': 51616, 'steps': 100, 'loss/train': 7.118026256561279} -09/20/2021 14:50:10 - INFO - __main__ - Step 1614: {'lr': 2.6666666666666667e-05, 'samples': 51648, 'steps': 100, 'loss/train': 6.549184322357178} -09/20/2021 14:50:11 - INFO - __main__ - Step 1615: {'lr': 2.6666666666666667e-05, 'samples': 51680, 'steps': 100, 'loss/train': 7.182253360748291} -09/20/2021 14:50:12 - INFO - __main__ - Step 1616: {'lr': 2.6666666666666667e-05, 'samples': 51712, 'steps': 100, 'loss/train': 7.039628028869629} -09/20/2021 14:50:13 - INFO - __main__ - Step 1617: {'lr': 2.6933333333333332e-05, 'samples': 51744, 'steps': 101, 'loss/train': 6.606952667236328} -09/20/2021 14:50:13 - INFO - __main__ - Step 1618: {'lr': 2.6933333333333332e-05, 'samples': 51776, 'steps': 101, 'loss/train': 9.535364151000977} -09/20/2021 14:50:14 - INFO - __main__ - Step 1619: {'lr': 2.6933333333333332e-05, 'samples': 51808, 'steps': 101, 'loss/train': 9.327640533447266} -09/20/2021 14:50:15 - INFO - __main__ - Step 1620: {'lr': 2.6933333333333332e-05, 'samples': 51840, 'steps': 101, 'loss/train': 8.523271560668945} -09/20/2021 14:50:16 - INFO - __main__ - Step 1621: {'lr': 2.6933333333333332e-05, 'samples': 51872, 'steps': 101, 'loss/train': 8.419593811035156} -09/20/2021 14:50:16 - INFO - __main__ - Step 1622: {'lr': 2.6933333333333332e-05, 'samples': 51904, 'steps': 101, 'loss/train': 8.700348854064941} -09/20/2021 14:50:17 - INFO - __main__ - Step 1623: {'lr': 2.6933333333333332e-05, 'samples': 51936, 'steps': 101, 'loss/train': 8.060775756835938} -09/20/2021 14:50:18 - INFO - __main__ - Step 1624: {'lr': 2.6933333333333332e-05, 'samples': 51968, 'steps': 101, 'loss/train': 9.206254005432129} -09/20/2021 14:50:19 - INFO - __main__ - Step 1625: {'lr': 2.6933333333333332e-05, 'samples': 52000, 'steps': 101, 'loss/train': 9.160350799560547} -09/20/2021 14:50:19 - INFO - __main__ - Step 1626: {'lr': 2.6933333333333332e-05, 'samples': 52032, 'steps': 101, 'loss/train': 8.68520736694336} -09/20/2021 14:50:20 - INFO - __main__ - Step 1627: {'lr': 2.6933333333333332e-05, 'samples': 52064, 'steps': 101, 'loss/train': 6.1594977378845215} -09/20/2021 14:50:21 - INFO - __main__ - Step 1628: {'lr': 2.6933333333333332e-05, 'samples': 52096, 'steps': 101, 'loss/train': 6.366283416748047} -09/20/2021 14:50:22 - INFO - __main__ - Step 1629: {'lr': 2.6933333333333332e-05, 'samples': 52128, 'steps': 101, 'loss/train': 6.396833896636963} -09/20/2021 14:50:22 - INFO - __main__ - Step 1630: {'lr': 2.6933333333333332e-05, 'samples': 52160, 'steps': 101, 'loss/train': 6.487987041473389} -09/20/2021 14:50:23 - INFO - __main__ - Step 1631: {'lr': 2.6933333333333332e-05, 'samples': 52192, 'steps': 101, 'loss/train': 6.522025108337402} -09/20/2021 14:50:24 - INFO - __main__ - Step 1632: {'lr': 2.6933333333333332e-05, 'samples': 52224, 'steps': 101, 'loss/train': 6.414955139160156} -09/20/2021 14:50:25 - INFO - __main__ - Step 1633: {'lr': 2.7200000000000004e-05, 'samples': 52256, 'steps': 102, 'loss/train': 6.770336627960205} -09/20/2021 14:50:26 - INFO - __main__ - Step 1634: {'lr': 2.7200000000000004e-05, 'samples': 52288, 'steps': 102, 'loss/train': 7.030030727386475} -09/20/2021 14:50:26 - INFO - __main__ - Step 1635: {'lr': 2.7200000000000004e-05, 'samples': 52320, 'steps': 102, 'loss/train': 7.1625590324401855} -09/20/2021 14:50:27 - INFO - __main__ - Step 1636: {'lr': 2.7200000000000004e-05, 'samples': 52352, 'steps': 102, 'loss/train': 6.084545135498047} -09/20/2021 14:50:28 - INFO - __main__ - Step 1637: {'lr': 2.7200000000000004e-05, 'samples': 52384, 'steps': 102, 'loss/train': 6.116086483001709} -09/20/2021 14:50:29 - INFO - __main__ - Step 1638: {'lr': 2.7200000000000004e-05, 'samples': 52416, 'steps': 102, 'loss/train': 6.2919135093688965} -09/20/2021 14:50:29 - INFO - __main__ - Step 1639: {'lr': 2.7200000000000004e-05, 'samples': 52448, 'steps': 102, 'loss/train': 6.67976713180542} -09/20/2021 14:50:30 - INFO - __main__ - Step 1640: {'lr': 2.7200000000000004e-05, 'samples': 52480, 'steps': 102, 'loss/train': 7.304195880889893} -09/20/2021 14:50:31 - INFO - __main__ - Step 1641: {'lr': 2.7200000000000004e-05, 'samples': 52512, 'steps': 102, 'loss/train': 6.830650806427002} -09/20/2021 14:50:32 - INFO - __main__ - Step 1642: {'lr': 2.7200000000000004e-05, 'samples': 52544, 'steps': 102, 'loss/train': 7.375284671783447} -09/20/2021 14:50:32 - INFO - __main__ - Step 1643: {'lr': 2.7200000000000004e-05, 'samples': 52576, 'steps': 102, 'loss/train': 6.967977046966553} -09/20/2021 14:50:33 - INFO - __main__ - Step 1644: {'lr': 2.7200000000000004e-05, 'samples': 52608, 'steps': 102, 'loss/train': 6.720880508422852} -09/20/2021 14:50:34 - INFO - __main__ - Step 1645: {'lr': 2.7200000000000004e-05, 'samples': 52640, 'steps': 102, 'loss/train': 7.295853614807129} -09/20/2021 14:50:35 - INFO - __main__ - Step 1646: {'lr': 2.7200000000000004e-05, 'samples': 52672, 'steps': 102, 'loss/train': 7.141063213348389} -09/20/2021 14:50:36 - INFO - __main__ - Step 1647: {'lr': 2.7200000000000004e-05, 'samples': 52704, 'steps': 102, 'loss/train': 6.9008708000183105} -09/20/2021 14:50:37 - INFO - __main__ - Step 1648: {'lr': 2.7200000000000004e-05, 'samples': 52736, 'steps': 102, 'loss/train': 7.456801414489746} -09/20/2021 14:50:38 - INFO - __main__ - Step 1649: {'lr': 2.746666666666667e-05, 'samples': 52768, 'steps': 103, 'loss/train': 6.961514949798584} -09/20/2021 14:50:38 - INFO - __main__ - Step 1650: {'lr': 2.746666666666667e-05, 'samples': 52800, 'steps': 103, 'loss/train': 6.9067606925964355} -09/20/2021 14:50:39 - INFO - __main__ - Step 1651: {'lr': 2.746666666666667e-05, 'samples': 52832, 'steps': 103, 'loss/train': 7.127151012420654} -09/20/2021 14:50:40 - INFO - __main__ - Step 1652: {'lr': 2.746666666666667e-05, 'samples': 52864, 'steps': 103, 'loss/train': 7.040297508239746} -09/20/2021 14:50:41 - INFO - __main__ - Step 1653: {'lr': 2.746666666666667e-05, 'samples': 52896, 'steps': 103, 'loss/train': 6.77119255065918} -09/20/2021 14:50:41 - INFO - __main__ - Step 1654: {'lr': 2.746666666666667e-05, 'samples': 52928, 'steps': 103, 'loss/train': 7.480414390563965} -09/20/2021 14:50:42 - INFO - __main__ - Step 1655: {'lr': 2.746666666666667e-05, 'samples': 52960, 'steps': 103, 'loss/train': 6.330386638641357} -09/20/2021 14:50:43 - INFO - __main__ - Step 1656: {'lr': 2.746666666666667e-05, 'samples': 52992, 'steps': 103, 'loss/train': 6.226858615875244} -09/20/2021 14:50:44 - INFO - __main__ - Step 1657: {'lr': 2.746666666666667e-05, 'samples': 53024, 'steps': 103, 'loss/train': 6.326478481292725} -09/20/2021 14:50:44 - INFO - __main__ - Step 1658: {'lr': 2.746666666666667e-05, 'samples': 53056, 'steps': 103, 'loss/train': 6.140662670135498} -09/20/2021 14:50:45 - INFO - __main__ - Step 1659: {'lr': 2.746666666666667e-05, 'samples': 53088, 'steps': 103, 'loss/train': 6.947600364685059} -09/20/2021 14:50:46 - INFO - __main__ - Step 1660: {'lr': 2.746666666666667e-05, 'samples': 53120, 'steps': 103, 'loss/train': 6.246621608734131} -09/20/2021 14:50:47 - INFO - __main__ - Step 1661: {'lr': 2.746666666666667e-05, 'samples': 53152, 'steps': 103, 'loss/train': 7.386404991149902} -09/20/2021 14:50:47 - INFO - __main__ - Step 1662: {'lr': 2.746666666666667e-05, 'samples': 53184, 'steps': 103, 'loss/train': 6.211913108825684} -09/20/2021 14:50:48 - INFO - __main__ - Step 1663: {'lr': 2.746666666666667e-05, 'samples': 53216, 'steps': 103, 'loss/train': 6.1278767585754395} -09/20/2021 14:50:49 - INFO - __main__ - Step 1664: {'lr': 2.746666666666667e-05, 'samples': 53248, 'steps': 103, 'loss/train': 6.591806411743164} -09/20/2021 14:50:50 - INFO - __main__ - Step 1665: {'lr': 2.7733333333333334e-05, 'samples': 53280, 'steps': 104, 'loss/train': 6.447636127471924} -09/20/2021 14:50:50 - INFO - __main__ - Step 1666: {'lr': 2.7733333333333334e-05, 'samples': 53312, 'steps': 104, 'loss/train': 7.3612775802612305} -09/20/2021 14:50:51 - INFO - __main__ - Step 1667: {'lr': 2.7733333333333334e-05, 'samples': 53344, 'steps': 104, 'loss/train': 5.67581844329834} -09/20/2021 14:50:52 - INFO - __main__ - Step 1668: {'lr': 2.7733333333333334e-05, 'samples': 53376, 'steps': 104, 'loss/train': 6.805301189422607} -09/20/2021 14:50:53 - INFO - __main__ - Step 1669: {'lr': 2.7733333333333334e-05, 'samples': 53408, 'steps': 104, 'loss/train': 6.221124649047852} -09/20/2021 14:50:53 - INFO - __main__ - Step 1670: {'lr': 2.7733333333333334e-05, 'samples': 53440, 'steps': 104, 'loss/train': 7.994207382202148} -09/20/2021 14:50:54 - INFO - __main__ - Step 1671: {'lr': 2.7733333333333334e-05, 'samples': 53472, 'steps': 104, 'loss/train': 8.388983726501465} -09/20/2021 14:50:55 - INFO - __main__ - Step 1672: {'lr': 2.7733333333333334e-05, 'samples': 53504, 'steps': 104, 'loss/train': 6.086758613586426} -09/20/2021 14:50:56 - INFO - __main__ - Step 1673: {'lr': 2.7733333333333334e-05, 'samples': 53536, 'steps': 104, 'loss/train': 6.671716213226318} -09/20/2021 14:50:56 - INFO - __main__ - Step 1674: {'lr': 2.7733333333333334e-05, 'samples': 53568, 'steps': 104, 'loss/train': 7.215109348297119} -09/20/2021 14:50:57 - INFO - __main__ - Step 1675: {'lr': 2.7733333333333334e-05, 'samples': 53600, 'steps': 104, 'loss/train': 6.3639960289001465} -09/20/2021 14:50:58 - INFO - __main__ - Step 1676: {'lr': 2.7733333333333334e-05, 'samples': 53632, 'steps': 104, 'loss/train': 6.837604999542236} -09/20/2021 14:50:59 - INFO - __main__ - Step 1677: {'lr': 2.7733333333333334e-05, 'samples': 53664, 'steps': 104, 'loss/train': 6.2848076820373535} -09/20/2021 14:51:00 - INFO - __main__ - Step 1678: {'lr': 2.7733333333333334e-05, 'samples': 53696, 'steps': 104, 'loss/train': 7.490596771240234} -09/20/2021 14:51:01 - INFO - __main__ - Step 1679: {'lr': 2.7733333333333334e-05, 'samples': 53728, 'steps': 104, 'loss/train': 6.443604469299316} -09/20/2021 14:51:01 - INFO - __main__ - Step 1680: {'lr': 2.7733333333333334e-05, 'samples': 53760, 'steps': 104, 'loss/train': 6.812562942504883} -09/20/2021 14:51:02 - INFO - __main__ - Step 1681: {'lr': 2.8000000000000003e-05, 'samples': 53792, 'steps': 105, 'loss/train': 6.465167045593262} -09/20/2021 14:51:03 - INFO - __main__ - Step 1682: {'lr': 2.8000000000000003e-05, 'samples': 53824, 'steps': 105, 'loss/train': 6.5762248039245605} -09/20/2021 14:51:04 - INFO - __main__ - Step 1683: {'lr': 2.8000000000000003e-05, 'samples': 53856, 'steps': 105, 'loss/train': 6.978451251983643} -09/20/2021 14:51:05 - INFO - __main__ - Step 1684: {'lr': 2.8000000000000003e-05, 'samples': 53888, 'steps': 105, 'loss/train': 6.2717509269714355} -09/20/2021 14:51:05 - INFO - __main__ - Step 1685: {'lr': 2.8000000000000003e-05, 'samples': 53920, 'steps': 105, 'loss/train': 7.292435169219971} -09/20/2021 14:51:06 - INFO - __main__ - Step 1686: {'lr': 2.8000000000000003e-05, 'samples': 53952, 'steps': 105, 'loss/train': 7.623319625854492} -09/20/2021 14:51:07 - INFO - __main__ - Step 1687: {'lr': 2.8000000000000003e-05, 'samples': 53984, 'steps': 105, 'loss/train': 7.3900580406188965} -09/20/2021 14:51:08 - INFO - __main__ - Step 1688: {'lr': 2.8000000000000003e-05, 'samples': 54016, 'steps': 105, 'loss/train': 6.409609317779541} -09/20/2021 14:51:08 - INFO - __main__ - Step 1689: {'lr': 2.8000000000000003e-05, 'samples': 54048, 'steps': 105, 'loss/train': 6.588659286499023} -09/20/2021 14:51:09 - INFO - __main__ - Step 1690: {'lr': 2.8000000000000003e-05, 'samples': 54080, 'steps': 105, 'loss/train': 7.260263919830322} -09/20/2021 14:51:10 - INFO - __main__ - Step 1691: {'lr': 2.8000000000000003e-05, 'samples': 54112, 'steps': 105, 'loss/train': 6.906129360198975} -09/20/2021 14:51:11 - INFO - __main__ - Step 1692: {'lr': 2.8000000000000003e-05, 'samples': 54144, 'steps': 105, 'loss/train': 6.321217060089111} -09/20/2021 14:51:11 - INFO - __main__ - Step 1693: {'lr': 2.8000000000000003e-05, 'samples': 54176, 'steps': 105, 'loss/train': 6.5388898849487305} -09/20/2021 14:51:12 - INFO - __main__ - Step 1694: {'lr': 2.8000000000000003e-05, 'samples': 54208, 'steps': 105, 'loss/train': 6.4841814041137695} -09/20/2021 14:51:13 - INFO - __main__ - Step 1695: {'lr': 2.8000000000000003e-05, 'samples': 54240, 'steps': 105, 'loss/train': 7.2622575759887695} -09/20/2021 14:51:14 - INFO - __main__ - Step 1696: {'lr': 2.8000000000000003e-05, 'samples': 54272, 'steps': 105, 'loss/train': 7.661412239074707} -09/20/2021 14:51:15 - INFO - __main__ - Step 1697: {'lr': 2.8266666666666668e-05, 'samples': 54304, 'steps': 106, 'loss/train': 6.8595967292785645} -09/20/2021 14:51:15 - INFO - __main__ - Step 1698: {'lr': 2.8266666666666668e-05, 'samples': 54336, 'steps': 106, 'loss/train': 6.6594929695129395} -09/20/2021 14:51:16 - INFO - __main__ - Step 1699: {'lr': 2.8266666666666668e-05, 'samples': 54368, 'steps': 106, 'loss/train': 6.677968502044678} -09/20/2021 14:51:17 - INFO - __main__ - Step 1700: {'lr': 2.8266666666666668e-05, 'samples': 54400, 'steps': 106, 'loss/train': 6.45175313949585} -09/20/2021 14:51:18 - INFO - __main__ - Step 1701: {'lr': 2.8266666666666668e-05, 'samples': 54432, 'steps': 106, 'loss/train': 6.708085060119629} -09/20/2021 14:51:18 - INFO - __main__ - Step 1702: {'lr': 2.8266666666666668e-05, 'samples': 54464, 'steps': 106, 'loss/train': 6.395713806152344} -09/20/2021 14:51:19 - INFO - __main__ - Step 1703: {'lr': 2.8266666666666668e-05, 'samples': 54496, 'steps': 106, 'loss/train': 6.724338531494141} -09/20/2021 14:51:20 - INFO - __main__ - Step 1704: {'lr': 2.8266666666666668e-05, 'samples': 54528, 'steps': 106, 'loss/train': 6.9152512550354} -09/20/2021 14:51:21 - INFO - __main__ - Step 1705: {'lr': 2.8266666666666668e-05, 'samples': 54560, 'steps': 106, 'loss/train': 6.855285167694092} -09/20/2021 14:51:21 - INFO - __main__ - Step 1706: {'lr': 2.8266666666666668e-05, 'samples': 54592, 'steps': 106, 'loss/train': 6.626635551452637} -09/20/2021 14:51:23 - INFO - __main__ - Step 1707: {'lr': 2.8266666666666668e-05, 'samples': 54624, 'steps': 106, 'loss/train': 7.077476978302002} -09/20/2021 14:51:23 - INFO - __main__ - Step 1708: {'lr': 2.8266666666666668e-05, 'samples': 54656, 'steps': 106, 'loss/train': 6.673079013824463} -09/20/2021 14:51:24 - INFO - __main__ - Step 1709: {'lr': 2.8266666666666668e-05, 'samples': 54688, 'steps': 106, 'loss/train': 6.253171443939209} -09/20/2021 14:51:25 - INFO - __main__ - Step 1710: {'lr': 2.8266666666666668e-05, 'samples': 54720, 'steps': 106, 'loss/train': 5.442764759063721} -09/20/2021 14:51:26 - INFO - __main__ - Step 1711: {'lr': 2.8266666666666668e-05, 'samples': 54752, 'steps': 106, 'loss/train': 7.054103851318359} -09/20/2021 14:51:26 - INFO - __main__ - Step 1712: {'lr': 2.8266666666666668e-05, 'samples': 54784, 'steps': 106, 'loss/train': 5.176662445068359} -09/20/2021 14:51:27 - INFO - __main__ - Step 1713: {'lr': 2.8533333333333333e-05, 'samples': 54816, 'steps': 107, 'loss/train': 5.618610858917236} -09/20/2021 14:51:28 - INFO - __main__ - Step 1714: {'lr': 2.8533333333333333e-05, 'samples': 54848, 'steps': 107, 'loss/train': 6.642454147338867} -09/20/2021 14:51:29 - INFO - __main__ - Step 1715: {'lr': 2.8533333333333333e-05, 'samples': 54880, 'steps': 107, 'loss/train': 6.433320999145508} -09/20/2021 14:51:30 - INFO - __main__ - Step 1716: {'lr': 2.8533333333333333e-05, 'samples': 54912, 'steps': 107, 'loss/train': 6.80247163772583} -09/20/2021 14:51:30 - INFO - __main__ - Step 1717: {'lr': 2.8533333333333333e-05, 'samples': 54944, 'steps': 107, 'loss/train': 6.786035537719727} -09/20/2021 14:51:31 - INFO - __main__ - Step 1718: {'lr': 2.8533333333333333e-05, 'samples': 54976, 'steps': 107, 'loss/train': 7.851870059967041} -09/20/2021 14:51:32 - INFO - __main__ - Step 1719: {'lr': 2.8533333333333333e-05, 'samples': 55008, 'steps': 107, 'loss/train': 7.134980201721191} -09/20/2021 14:51:33 - INFO - __main__ - Step 1720: {'lr': 2.8533333333333333e-05, 'samples': 55040, 'steps': 107, 'loss/train': 6.749288558959961} -09/20/2021 14:51:33 - INFO - __main__ - Step 1721: {'lr': 2.8533333333333333e-05, 'samples': 55072, 'steps': 107, 'loss/train': 7.062508583068848} -09/20/2021 14:51:34 - INFO - __main__ - Step 1722: {'lr': 2.8533333333333333e-05, 'samples': 55104, 'steps': 107, 'loss/train': 6.926645278930664} -09/20/2021 14:51:35 - INFO - __main__ - Step 1723: {'lr': 2.8533333333333333e-05, 'samples': 55136, 'steps': 107, 'loss/train': 6.690032482147217} -09/20/2021 14:51:36 - INFO - __main__ - Step 1724: {'lr': 2.8533333333333333e-05, 'samples': 55168, 'steps': 107, 'loss/train': 6.857491970062256} -09/20/2021 14:51:36 - INFO - __main__ - Step 1725: {'lr': 2.8533333333333333e-05, 'samples': 55200, 'steps': 107, 'loss/train': 6.7049946784973145} -09/20/2021 14:51:37 - INFO - __main__ - Step 1726: {'lr': 2.8533333333333333e-05, 'samples': 55232, 'steps': 107, 'loss/train': 5.933664321899414} -09/20/2021 14:51:38 - INFO - __main__ - Step 1727: {'lr': 2.8533333333333333e-05, 'samples': 55264, 'steps': 107, 'loss/train': 6.253852367401123} -09/20/2021 14:51:39 - INFO - __main__ - Step 1728: {'lr': 2.8533333333333333e-05, 'samples': 55296, 'steps': 107, 'loss/train': 7.4641571044921875} -09/20/2021 14:51:39 - INFO - __main__ - Step 1729: {'lr': 2.88e-05, 'samples': 55328, 'steps': 108, 'loss/train': 6.569970607757568} -09/20/2021 14:51:40 - INFO - __main__ - Step 1730: {'lr': 2.88e-05, 'samples': 55360, 'steps': 108, 'loss/train': 5.929459095001221} -09/20/2021 14:51:41 - INFO - __main__ - Step 1731: {'lr': 2.88e-05, 'samples': 55392, 'steps': 108, 'loss/train': 6.661436557769775} -09/20/2021 14:51:42 - INFO - __main__ - Step 1732: {'lr': 2.88e-05, 'samples': 55424, 'steps': 108, 'loss/train': 6.161383152008057} -09/20/2021 14:51:42 - INFO - __main__ - Step 1733: {'lr': 2.88e-05, 'samples': 55456, 'steps': 108, 'loss/train': 6.469416618347168} -09/20/2021 14:51:43 - INFO - __main__ - Step 1734: {'lr': 2.88e-05, 'samples': 55488, 'steps': 108, 'loss/train': 6.087306976318359} -09/20/2021 14:51:44 - INFO - __main__ - Step 1735: {'lr': 2.88e-05, 'samples': 55520, 'steps': 108, 'loss/train': 7.139195442199707} -09/20/2021 14:51:45 - INFO - __main__ - Step 1736: {'lr': 2.88e-05, 'samples': 55552, 'steps': 108, 'loss/train': 7.484576225280762} -09/20/2021 14:51:45 - INFO - __main__ - Step 1737: {'lr': 2.88e-05, 'samples': 55584, 'steps': 108, 'loss/train': 6.352415561676025} -09/20/2021 14:51:47 - INFO - __main__ - Step 1738: {'lr': 2.88e-05, 'samples': 55616, 'steps': 108, 'loss/train': 6.869617938995361} -09/20/2021 14:51:47 - INFO - __main__ - Step 1739: {'lr': 2.88e-05, 'samples': 55648, 'steps': 108, 'loss/train': 6.439413547515869} -09/20/2021 14:51:48 - INFO - __main__ - Step 1740: {'lr': 2.88e-05, 'samples': 55680, 'steps': 108, 'loss/train': 6.445118427276611} -09/20/2021 14:51:49 - INFO - __main__ - Step 1741: {'lr': 2.88e-05, 'samples': 55712, 'steps': 108, 'loss/train': 6.4367756843566895} -09/20/2021 14:51:50 - INFO - __main__ - Step 1742: {'lr': 2.88e-05, 'samples': 55744, 'steps': 108, 'loss/train': 5.826131343841553} -09/20/2021 14:51:50 - INFO - __main__ - Step 1743: {'lr': 2.88e-05, 'samples': 55776, 'steps': 108, 'loss/train': 6.391880512237549} -09/20/2021 14:51:51 - INFO - __main__ - Step 1744: {'lr': 2.88e-05, 'samples': 55808, 'steps': 108, 'loss/train': 6.668693542480469} -09/20/2021 14:51:52 - INFO - __main__ - Step 1745: {'lr': 2.906666666666667e-05, 'samples': 55840, 'steps': 109, 'loss/train': 6.487035274505615} -09/20/2021 14:51:53 - INFO - __main__ - Step 1746: {'lr': 2.906666666666667e-05, 'samples': 55872, 'steps': 109, 'loss/train': 7.701898097991943} -09/20/2021 14:51:54 - INFO - __main__ - Step 1747: {'lr': 2.906666666666667e-05, 'samples': 55904, 'steps': 109, 'loss/train': 7.236573219299316} -09/20/2021 14:51:54 - INFO - __main__ - Step 1748: {'lr': 2.906666666666667e-05, 'samples': 55936, 'steps': 109, 'loss/train': 6.93174934387207} -09/20/2021 14:51:55 - INFO - __main__ - Step 1749: {'lr': 2.906666666666667e-05, 'samples': 55968, 'steps': 109, 'loss/train': 6.749809741973877} -09/20/2021 14:51:56 - INFO - __main__ - Step 1750: {'lr': 2.906666666666667e-05, 'samples': 56000, 'steps': 109, 'loss/train': 7.2296857833862305} -09/20/2021 14:51:57 - INFO - __main__ - Step 1751: {'lr': 2.906666666666667e-05, 'samples': 56032, 'steps': 109, 'loss/train': 6.590333461761475} -09/20/2021 14:51:57 - INFO - __main__ - Step 1752: {'lr': 2.906666666666667e-05, 'samples': 56064, 'steps': 109, 'loss/train': 6.680716514587402} -09/20/2021 14:51:58 - INFO - __main__ - Step 1753: {'lr': 2.906666666666667e-05, 'samples': 56096, 'steps': 109, 'loss/train': 7.583479404449463} -09/20/2021 14:51:59 - INFO - __main__ - Step 1754: {'lr': 2.906666666666667e-05, 'samples': 56128, 'steps': 109, 'loss/train': 6.049078941345215} -09/20/2021 14:52:00 - INFO - __main__ - Step 1755: {'lr': 2.906666666666667e-05, 'samples': 56160, 'steps': 109, 'loss/train': 6.263136863708496} -09/20/2021 14:52:00 - INFO - __main__ - Step 1756: {'lr': 2.906666666666667e-05, 'samples': 56192, 'steps': 109, 'loss/train': 6.686461448669434} -09/20/2021 14:52:01 - INFO - __main__ - Step 1757: {'lr': 2.906666666666667e-05, 'samples': 56224, 'steps': 109, 'loss/train': 7.231515407562256} -09/20/2021 14:52:02 - INFO - __main__ - Step 1758: {'lr': 2.906666666666667e-05, 'samples': 56256, 'steps': 109, 'loss/train': 6.181962966918945} -09/20/2021 14:52:03 - INFO - __main__ - Step 1759: {'lr': 2.906666666666667e-05, 'samples': 56288, 'steps': 109, 'loss/train': 6.241127967834473} -09/20/2021 14:52:03 - INFO - __main__ - Step 1760: {'lr': 2.906666666666667e-05, 'samples': 56320, 'steps': 109, 'loss/train': 5.913502216339111} -09/20/2021 14:52:04 - INFO - __main__ - Step 1761: {'lr': 2.9333333333333336e-05, 'samples': 56352, 'steps': 110, 'loss/train': 6.436279773712158} -09/20/2021 14:52:05 - INFO - __main__ - Step 1762: {'lr': 2.9333333333333336e-05, 'samples': 56384, 'steps': 110, 'loss/train': 6.7641425132751465} -09/20/2021 14:52:06 - INFO - __main__ - Step 1763: {'lr': 2.9333333333333336e-05, 'samples': 56416, 'steps': 110, 'loss/train': 5.847098350524902} -09/20/2021 14:52:07 - INFO - __main__ - Step 1764: {'lr': 2.9333333333333336e-05, 'samples': 56448, 'steps': 110, 'loss/train': 6.828033924102783} -09/20/2021 14:52:07 - INFO - __main__ - Step 1765: {'lr': 2.9333333333333336e-05, 'samples': 56480, 'steps': 110, 'loss/train': 6.529211521148682} -09/20/2021 14:52:08 - INFO - __main__ - Step 1766: {'lr': 2.9333333333333336e-05, 'samples': 56512, 'steps': 110, 'loss/train': 6.52423095703125} -09/20/2021 14:52:09 - INFO - __main__ - Step 1767: {'lr': 2.9333333333333336e-05, 'samples': 56544, 'steps': 110, 'loss/train': 1.072803020477295} -09/20/2021 14:52:10 - INFO - __main__ - Step 1768: {'lr': 2.9333333333333336e-05, 'samples': 56576, 'steps': 110, 'loss/train': 6.622687339782715} -09/20/2021 14:52:11 - INFO - __main__ - Step 1769: {'lr': 2.9333333333333336e-05, 'samples': 56608, 'steps': 110, 'loss/train': 6.399142742156982} -09/20/2021 14:52:12 - INFO - __main__ - Step 1770: {'lr': 2.9333333333333336e-05, 'samples': 56640, 'steps': 110, 'loss/train': 5.786398410797119} -09/20/2021 14:52:12 - INFO - __main__ - Step 1771: {'lr': 2.9333333333333336e-05, 'samples': 56672, 'steps': 110, 'loss/train': 6.790797710418701} -09/20/2021 14:52:13 - INFO - __main__ - Step 1772: {'lr': 2.9333333333333336e-05, 'samples': 56704, 'steps': 110, 'loss/train': 6.458227157592773} -09/20/2021 14:52:14 - INFO - __main__ - Step 1773: {'lr': 2.9333333333333336e-05, 'samples': 56736, 'steps': 110, 'loss/train': 6.9048380851745605} -09/20/2021 14:52:15 - INFO - __main__ - Step 1774: {'lr': 2.9333333333333336e-05, 'samples': 56768, 'steps': 110, 'loss/train': 6.5764336585998535} -09/20/2021 14:52:15 - INFO - __main__ - Step 1775: {'lr': 2.9333333333333336e-05, 'samples': 56800, 'steps': 110, 'loss/train': 6.150598526000977} -09/20/2021 14:52:16 - INFO - __main__ - Step 1776: {'lr': 2.9333333333333336e-05, 'samples': 56832, 'steps': 110, 'loss/train': 6.567956447601318} -09/20/2021 14:52:17 - INFO - __main__ - Step 1777: {'lr': 2.96e-05, 'samples': 56864, 'steps': 111, 'loss/train': 7.220701217651367} -09/20/2021 14:52:18 - INFO - __main__ - Step 1778: {'lr': 2.96e-05, 'samples': 56896, 'steps': 111, 'loss/train': 6.541903018951416} -09/20/2021 14:52:18 - INFO - __main__ - Step 1779: {'lr': 2.96e-05, 'samples': 56928, 'steps': 111, 'loss/train': 6.907362937927246} -09/20/2021 14:52:19 - INFO - __main__ - Step 1780: {'lr': 2.96e-05, 'samples': 56960, 'steps': 111, 'loss/train': 8.02796459197998} -09/20/2021 14:52:20 - INFO - __main__ - Step 1781: {'lr': 2.96e-05, 'samples': 56992, 'steps': 111, 'loss/train': 6.584692001342773} -09/20/2021 14:52:21 - INFO - __main__ - Step 1782: {'lr': 2.96e-05, 'samples': 57024, 'steps': 111, 'loss/train': 6.902879238128662} -09/20/2021 14:52:21 - INFO - __main__ - Step 1783: {'lr': 2.96e-05, 'samples': 57056, 'steps': 111, 'loss/train': 7.166553020477295} -09/20/2021 14:52:22 - INFO - __main__ - Step 1784: {'lr': 2.96e-05, 'samples': 57088, 'steps': 111, 'loss/train': 5.788247108459473} -09/20/2021 14:52:23 - INFO - __main__ - Step 1785: {'lr': 2.96e-05, 'samples': 57120, 'steps': 111, 'loss/train': 6.606266021728516} -09/20/2021 14:52:24 - INFO - __main__ - Step 1786: {'lr': 2.96e-05, 'samples': 57152, 'steps': 111, 'loss/train': 6.333360195159912} -09/20/2021 14:52:24 - INFO - __main__ - Step 1787: {'lr': 2.96e-05, 'samples': 57184, 'steps': 111, 'loss/train': 5.779031276702881} -09/20/2021 14:52:25 - INFO - __main__ - Step 1788: {'lr': 2.96e-05, 'samples': 57216, 'steps': 111, 'loss/train': 6.401401519775391} -09/20/2021 14:52:26 - INFO - __main__ - Step 1789: {'lr': 2.96e-05, 'samples': 57248, 'steps': 111, 'loss/train': 6.250683784484863} -09/20/2021 14:52:27 - INFO - __main__ - Step 1790: {'lr': 2.96e-05, 'samples': 57280, 'steps': 111, 'loss/train': 6.7163405418396} -09/20/2021 14:52:27 - INFO - __main__ - Step 1791: {'lr': 2.96e-05, 'samples': 57312, 'steps': 111, 'loss/train': 6.953531265258789} -09/20/2021 14:52:28 - INFO - __main__ - Step 1792: {'lr': 2.96e-05, 'samples': 57344, 'steps': 111, 'loss/train': 6.009348392486572} -09/20/2021 14:52:29 - INFO - __main__ - Step 1793: {'lr': 2.986666666666667e-05, 'samples': 57376, 'steps': 112, 'loss/train': 6.357996463775635} -09/20/2021 14:52:30 - INFO - __main__ - Step 1794: {'lr': 2.986666666666667e-05, 'samples': 57408, 'steps': 112, 'loss/train': 6.954112529754639} -09/20/2021 14:52:31 - INFO - __main__ - Step 1795: {'lr': 2.986666666666667e-05, 'samples': 57440, 'steps': 112, 'loss/train': 6.905211925506592} -09/20/2021 14:52:31 - INFO - __main__ - Step 1796: {'lr': 2.986666666666667e-05, 'samples': 57472, 'steps': 112, 'loss/train': 6.722829818725586} -09/20/2021 14:52:32 - INFO - __main__ - Step 1797: {'lr': 2.986666666666667e-05, 'samples': 57504, 'steps': 112, 'loss/train': 6.600681304931641} -09/20/2021 14:52:33 - INFO - __main__ - Step 1798: {'lr': 2.986666666666667e-05, 'samples': 57536, 'steps': 112, 'loss/train': 6.762768268585205} -09/20/2021 14:52:34 - INFO - __main__ - Step 1799: {'lr': 2.986666666666667e-05, 'samples': 57568, 'steps': 112, 'loss/train': 6.9171576499938965} -09/20/2021 14:52:34 - INFO - __main__ - Step 1800: {'lr': 2.986666666666667e-05, 'samples': 57600, 'steps': 112, 'loss/train': 5.893004894256592} -09/20/2021 14:52:36 - INFO - __main__ - Step 1801: {'lr': 2.986666666666667e-05, 'samples': 57632, 'steps': 112, 'loss/train': 5.974733352661133} -09/20/2021 14:52:37 - INFO - __main__ - Step 1802: {'lr': 2.986666666666667e-05, 'samples': 57664, 'steps': 112, 'loss/train': 6.888535499572754} -09/20/2021 14:52:37 - INFO - __main__ - Step 1803: {'lr': 2.986666666666667e-05, 'samples': 57696, 'steps': 112, 'loss/train': 6.126288890838623} -09/20/2021 14:52:38 - INFO - __main__ - Step 1804: {'lr': 2.986666666666667e-05, 'samples': 57728, 'steps': 112, 'loss/train': 7.079688549041748} -09/20/2021 14:52:39 - INFO - __main__ - Step 1805: {'lr': 2.986666666666667e-05, 'samples': 57760, 'steps': 112, 'loss/train': 7.800229072570801} -09/20/2021 14:52:40 - INFO - __main__ - Step 1806: {'lr': 2.986666666666667e-05, 'samples': 57792, 'steps': 112, 'loss/train': 5.711235046386719} -09/20/2021 14:52:40 - INFO - __main__ - Step 1807: {'lr': 2.986666666666667e-05, 'samples': 57824, 'steps': 112, 'loss/train': 6.2763872146606445} -09/20/2021 14:52:41 - INFO - __main__ - Step 1808: {'lr': 2.986666666666667e-05, 'samples': 57856, 'steps': 112, 'loss/train': 6.543046951293945} -09/20/2021 14:52:42 - INFO - __main__ - Step 1809: {'lr': 3.0133333333333335e-05, 'samples': 57888, 'steps': 113, 'loss/train': 7.599948883056641} -09/20/2021 14:52:43 - INFO - __main__ - Step 1810: {'lr': 3.0133333333333335e-05, 'samples': 57920, 'steps': 113, 'loss/train': 6.327716827392578} -09/20/2021 14:52:43 - INFO - __main__ - Step 1811: {'lr': 3.0133333333333335e-05, 'samples': 57952, 'steps': 113, 'loss/train': 6.643850803375244} -09/20/2021 14:52:44 - INFO - __main__ - Step 1812: {'lr': 3.0133333333333335e-05, 'samples': 57984, 'steps': 113, 'loss/train': 6.443918228149414} -09/20/2021 14:52:45 - INFO - __main__ - Step 1813: {'lr': 3.0133333333333335e-05, 'samples': 58016, 'steps': 113, 'loss/train': 5.987512588500977} -09/20/2021 14:52:46 - INFO - __main__ - Step 1814: {'lr': 3.0133333333333335e-05, 'samples': 58048, 'steps': 113, 'loss/train': 6.151648998260498} -09/20/2021 14:52:46 - INFO - __main__ - Step 1815: {'lr': 3.0133333333333335e-05, 'samples': 58080, 'steps': 113, 'loss/train': 6.059235095977783} -09/20/2021 14:52:47 - INFO - __main__ - Step 1816: {'lr': 3.0133333333333335e-05, 'samples': 58112, 'steps': 113, 'loss/train': 6.060678958892822} -09/20/2021 14:52:48 - INFO - __main__ - Step 1817: {'lr': 3.0133333333333335e-05, 'samples': 58144, 'steps': 113, 'loss/train': 6.656537055969238} -09/20/2021 14:52:49 - INFO - __main__ - Step 1818: {'lr': 3.0133333333333335e-05, 'samples': 58176, 'steps': 113, 'loss/train': 5.651735305786133} -09/20/2021 14:52:49 - INFO - __main__ - Step 1819: {'lr': 3.0133333333333335e-05, 'samples': 58208, 'steps': 113, 'loss/train': 6.857237339019775} -09/20/2021 14:52:50 - INFO - __main__ - Step 1820: {'lr': 3.0133333333333335e-05, 'samples': 58240, 'steps': 113, 'loss/train': 5.8977131843566895} -09/20/2021 14:52:51 - INFO - __main__ - Step 1821: {'lr': 3.0133333333333335e-05, 'samples': 58272, 'steps': 113, 'loss/train': 6.166044235229492} -09/20/2021 14:52:52 - INFO - __main__ - Step 1822: {'lr': 3.0133333333333335e-05, 'samples': 58304, 'steps': 113, 'loss/train': 5.933762550354004} -09/20/2021 14:52:52 - INFO - __main__ - Step 1823: {'lr': 3.0133333333333335e-05, 'samples': 58336, 'steps': 113, 'loss/train': 6.954166412353516} -09/20/2021 14:52:53 - INFO - __main__ - Step 1824: {'lr': 3.0133333333333335e-05, 'samples': 58368, 'steps': 113, 'loss/train': 6.97127103805542} -09/20/2021 14:52:54 - INFO - __main__ - Step 1825: {'lr': 3.04e-05, 'samples': 58400, 'steps': 114, 'loss/train': 5.797971725463867} -09/20/2021 14:52:55 - INFO - __main__ - Step 1826: {'lr': 3.04e-05, 'samples': 58432, 'steps': 114, 'loss/train': 6.754187107086182} -09/20/2021 14:52:56 - INFO - __main__ - Step 1827: {'lr': 3.04e-05, 'samples': 58464, 'steps': 114, 'loss/train': 6.779458999633789} -09/20/2021 14:52:56 - INFO - __main__ - Step 1828: {'lr': 3.04e-05, 'samples': 58496, 'steps': 114, 'loss/train': 5.803163051605225} -09/20/2021 14:52:57 - INFO - __main__ - Step 1829: {'lr': 3.04e-05, 'samples': 58528, 'steps': 114, 'loss/train': 8.86689567565918} -09/20/2021 14:52:58 - INFO - __main__ - Step 1830: {'lr': 3.04e-05, 'samples': 58560, 'steps': 114, 'loss/train': 8.878554344177246} -09/20/2021 14:52:59 - INFO - __main__ - Step 1831: {'lr': 3.04e-05, 'samples': 58592, 'steps': 114, 'loss/train': 8.871567726135254} -09/20/2021 14:52:59 - INFO - __main__ - Step 1832: {'lr': 3.04e-05, 'samples': 58624, 'steps': 114, 'loss/train': 8.787714958190918} -09/20/2021 14:53:00 - INFO - __main__ - Step 1833: {'lr': 3.04e-05, 'samples': 58656, 'steps': 114, 'loss/train': 8.835437774658203} -09/20/2021 14:53:01 - INFO - __main__ - Step 1834: {'lr': 3.04e-05, 'samples': 58688, 'steps': 114, 'loss/train': 6.283212184906006} -09/20/2021 14:53:02 - INFO - __main__ - Step 1835: {'lr': 3.04e-05, 'samples': 58720, 'steps': 114, 'loss/train': 7.196908473968506} -09/20/2021 14:53:03 - INFO - __main__ - Step 1836: {'lr': 3.04e-05, 'samples': 58752, 'steps': 114, 'loss/train': 8.198741912841797} -09/20/2021 14:53:04 - INFO - __main__ - Step 1837: {'lr': 3.04e-05, 'samples': 58784, 'steps': 114, 'loss/train': 6.410491466522217} -09/20/2021 14:53:04 - INFO - __main__ - Step 1838: {'lr': 3.04e-05, 'samples': 58816, 'steps': 114, 'loss/train': 6.921299934387207} -09/20/2021 14:53:05 - INFO - __main__ - Step 1839: {'lr': 3.04e-05, 'samples': 58848, 'steps': 114, 'loss/train': 7.012816429138184} -09/20/2021 14:53:06 - INFO - __main__ - Step 1840: {'lr': 3.04e-05, 'samples': 58880, 'steps': 114, 'loss/train': 8.124260902404785} -09/20/2021 14:53:07 - INFO - __main__ - Step 1841: {'lr': 3.066666666666667e-05, 'samples': 58912, 'steps': 115, 'loss/train': 7.014801025390625} -09/20/2021 14:53:08 - INFO - __main__ - Step 1842: {'lr': 3.066666666666667e-05, 'samples': 58944, 'steps': 115, 'loss/train': 7.452143669128418} -09/20/2021 14:53:08 - INFO - __main__ - Step 1843: {'lr': 3.066666666666667e-05, 'samples': 58976, 'steps': 115, 'loss/train': 5.51560115814209} -09/20/2021 14:53:09 - INFO - __main__ - Step 1844: {'lr': 3.066666666666667e-05, 'samples': 59008, 'steps': 115, 'loss/train': 6.523744106292725} -09/20/2021 14:53:10 - INFO - __main__ - Step 1845: {'lr': 3.066666666666667e-05, 'samples': 59040, 'steps': 115, 'loss/train': 6.389472007751465} -09/20/2021 14:53:11 - INFO - __main__ - Step 1846: {'lr': 3.066666666666667e-05, 'samples': 59072, 'steps': 115, 'loss/train': 6.264469623565674} -09/20/2021 14:53:11 - INFO - __main__ - Step 1847: {'lr': 3.066666666666667e-05, 'samples': 59104, 'steps': 115, 'loss/train': 5.701825141906738} -09/20/2021 14:53:12 - INFO - __main__ - Step 1848: {'lr': 3.066666666666667e-05, 'samples': 59136, 'steps': 115, 'loss/train': 6.966446876525879} -09/20/2021 14:53:13 - INFO - __main__ - Step 1849: {'lr': 3.066666666666667e-05, 'samples': 59168, 'steps': 115, 'loss/train': 6.167634963989258} -09/20/2021 14:53:14 - INFO - __main__ - Step 1850: {'lr': 3.066666666666667e-05, 'samples': 59200, 'steps': 115, 'loss/train': 6.132457733154297} -09/20/2021 14:53:14 - INFO - __main__ - Step 1851: {'lr': 3.066666666666667e-05, 'samples': 59232, 'steps': 115, 'loss/train': 6.737553119659424} -09/20/2021 14:53:15 - INFO - __main__ - Step 1852: {'lr': 3.066666666666667e-05, 'samples': 59264, 'steps': 115, 'loss/train': 6.575310707092285} -09/20/2021 14:53:16 - INFO - __main__ - Step 1853: {'lr': 3.066666666666667e-05, 'samples': 59296, 'steps': 115, 'loss/train': 6.917254447937012} -09/20/2021 14:53:17 - INFO - __main__ - Step 1854: {'lr': 3.066666666666667e-05, 'samples': 59328, 'steps': 115, 'loss/train': 6.6251373291015625} -09/20/2021 14:53:17 - INFO - __main__ - Step 1855: {'lr': 3.066666666666667e-05, 'samples': 59360, 'steps': 115, 'loss/train': 6.628207683563232} -09/20/2021 14:53:18 - INFO - __main__ - Step 1856: {'lr': 3.066666666666667e-05, 'samples': 59392, 'steps': 115, 'loss/train': 6.55890417098999} -09/20/2021 14:53:19 - INFO - __main__ - Step 1857: {'lr': 3.093333333333334e-05, 'samples': 59424, 'steps': 116, 'loss/train': 6.573915958404541} -09/20/2021 14:53:20 - INFO - __main__ - Step 1858: {'lr': 3.093333333333334e-05, 'samples': 59456, 'steps': 116, 'loss/train': 7.11773157119751} -09/20/2021 14:53:20 - INFO - __main__ - Step 1859: {'lr': 3.093333333333334e-05, 'samples': 59488, 'steps': 116, 'loss/train': 6.2089128494262695} -09/20/2021 14:53:21 - INFO - __main__ - Step 1860: {'lr': 3.093333333333334e-05, 'samples': 59520, 'steps': 116, 'loss/train': 6.758141994476318} -09/20/2021 14:53:22 - INFO - __main__ - Step 1861: {'lr': 3.093333333333334e-05, 'samples': 59552, 'steps': 116, 'loss/train': 6.617177963256836} -09/20/2021 14:53:23 - INFO - __main__ - Step 1862: {'lr': 3.093333333333334e-05, 'samples': 59584, 'steps': 116, 'loss/train': 6.65860652923584} -09/20/2021 14:53:23 - INFO - __main__ - Step 1863: {'lr': 3.093333333333334e-05, 'samples': 59616, 'steps': 116, 'loss/train': 6.181654930114746} -09/20/2021 14:53:24 - INFO - __main__ - Step 1864: {'lr': 3.093333333333334e-05, 'samples': 59648, 'steps': 116, 'loss/train': 6.561133861541748} -09/20/2021 14:53:25 - INFO - __main__ - Step 1865: {'lr': 3.093333333333334e-05, 'samples': 59680, 'steps': 116, 'loss/train': 6.2186737060546875} -09/20/2021 14:53:26 - INFO - __main__ - Step 1866: {'lr': 3.093333333333334e-05, 'samples': 59712, 'steps': 116, 'loss/train': 6.29074239730835} -09/20/2021 14:53:27 - INFO - __main__ - Step 1867: {'lr': 3.093333333333334e-05, 'samples': 59744, 'steps': 116, 'loss/train': 5.518889904022217} -09/20/2021 14:53:28 - INFO - __main__ - Step 1868: {'lr': 3.093333333333334e-05, 'samples': 59776, 'steps': 116, 'loss/train': 6.821427345275879} -09/20/2021 14:53:29 - INFO - __main__ - Step 1869: {'lr': 3.093333333333334e-05, 'samples': 59808, 'steps': 116, 'loss/train': 7.070533752441406} -09/20/2021 14:53:29 - INFO - __main__ - Step 1870: {'lr': 3.093333333333334e-05, 'samples': 59840, 'steps': 116, 'loss/train': 6.852370262145996} -09/20/2021 14:53:30 - INFO - __main__ - Step 1871: {'lr': 3.093333333333334e-05, 'samples': 59872, 'steps': 116, 'loss/train': 5.8043060302734375} -09/20/2021 14:53:31 - INFO - __main__ - Step 1872: {'lr': 3.093333333333334e-05, 'samples': 59904, 'steps': 116, 'loss/train': 6.220953464508057} -09/20/2021 14:53:32 - INFO - __main__ - Step 1873: {'lr': 3.12e-05, 'samples': 59936, 'steps': 117, 'loss/train': 7.050163745880127} -09/20/2021 14:53:32 - INFO - __main__ - Step 1874: {'lr': 3.12e-05, 'samples': 59968, 'steps': 117, 'loss/train': 6.440095901489258} -09/20/2021 14:53:33 - INFO - __main__ - Step 1875: {'lr': 3.12e-05, 'samples': 60000, 'steps': 117, 'loss/train': 6.8150634765625} -09/20/2021 14:53:34 - INFO - __main__ - Step 1876: {'lr': 3.12e-05, 'samples': 60032, 'steps': 117, 'loss/train': 6.933142185211182} -09/20/2021 14:53:35 - INFO - __main__ - Step 1877: {'lr': 3.12e-05, 'samples': 60064, 'steps': 117, 'loss/train': 6.142337799072266} -09/20/2021 14:53:35 - INFO - __main__ - Step 1878: {'lr': 3.12e-05, 'samples': 60096, 'steps': 117, 'loss/train': 6.306290149688721} -09/20/2021 14:53:36 - INFO - __main__ - Step 1879: {'lr': 3.12e-05, 'samples': 60128, 'steps': 117, 'loss/train': 7.087667942047119} -09/20/2021 14:53:37 - INFO - __main__ - Step 1880: {'lr': 3.12e-05, 'samples': 60160, 'steps': 117, 'loss/train': 6.483727931976318} -09/20/2021 14:53:38 - INFO - __main__ - Step 1881: {'lr': 3.12e-05, 'samples': 60192, 'steps': 117, 'loss/train': 5.076791763305664} -09/20/2021 14:53:38 - INFO - __main__ - Step 1882: {'lr': 3.12e-05, 'samples': 60224, 'steps': 117, 'loss/train': 7.014932155609131} -09/20/2021 14:53:39 - INFO - __main__ - Step 1883: {'lr': 3.12e-05, 'samples': 60256, 'steps': 117, 'loss/train': 7.127142906188965} -09/20/2021 14:53:40 - INFO - __main__ - Step 1884: {'lr': 3.12e-05, 'samples': 60288, 'steps': 117, 'loss/train': 7.118346214294434} -09/20/2021 14:53:41 - INFO - __main__ - Step 1885: {'lr': 3.12e-05, 'samples': 60320, 'steps': 117, 'loss/train': 5.9547119140625} -09/20/2021 14:53:41 - INFO - __main__ - Step 1886: {'lr': 3.12e-05, 'samples': 60352, 'steps': 117, 'loss/train': 5.370534896850586} -09/20/2021 14:53:42 - INFO - __main__ - Step 1887: {'lr': 3.12e-05, 'samples': 60384, 'steps': 117, 'loss/train': 5.661940097808838} -09/20/2021 14:53:43 - INFO - __main__ - Step 1888: {'lr': 3.12e-05, 'samples': 60416, 'steps': 117, 'loss/train': 6.305938243865967} -09/20/2021 14:53:44 - INFO - __main__ - Step 1889: {'lr': 3.146666666666667e-05, 'samples': 60448, 'steps': 118, 'loss/train': 6.627176761627197} -09/20/2021 14:53:45 - INFO - __main__ - Step 1890: {'lr': 3.146666666666667e-05, 'samples': 60480, 'steps': 118, 'loss/train': 5.418166160583496} -09/20/2021 14:53:45 - INFO - __main__ - Step 1891: {'lr': 3.146666666666667e-05, 'samples': 60512, 'steps': 118, 'loss/train': 6.245001792907715} -09/20/2021 14:53:46 - INFO - __main__ - Step 1892: {'lr': 3.146666666666667e-05, 'samples': 60544, 'steps': 118, 'loss/train': 7.25372838973999} -09/20/2021 14:53:47 - INFO - __main__ - Step 1893: {'lr': 3.146666666666667e-05, 'samples': 60576, 'steps': 118, 'loss/train': 6.7761454582214355} -09/20/2021 14:53:48 - INFO - __main__ - Step 1894: {'lr': 3.146666666666667e-05, 'samples': 60608, 'steps': 118, 'loss/train': 6.611319541931152} -09/20/2021 14:53:48 - INFO - __main__ - Step 1895: {'lr': 3.146666666666667e-05, 'samples': 60640, 'steps': 118, 'loss/train': 7.28957986831665} -09/20/2021 14:53:49 - INFO - __main__ - Step 1896: {'lr': 3.146666666666667e-05, 'samples': 60672, 'steps': 118, 'loss/train': 6.2176361083984375} -09/20/2021 14:53:50 - INFO - __main__ - Step 1897: {'lr': 3.146666666666667e-05, 'samples': 60704, 'steps': 118, 'loss/train': 5.167111396789551} -09/20/2021 14:53:52 - INFO - __main__ - Step 1898: {'lr': 3.146666666666667e-05, 'samples': 60736, 'steps': 118, 'loss/train': 6.674505233764648} -09/20/2021 14:53:52 - INFO - __main__ - Step 1899: {'lr': 3.146666666666667e-05, 'samples': 60768, 'steps': 118, 'loss/train': 6.479441165924072} -09/20/2021 14:53:53 - INFO - __main__ - Step 1900: {'lr': 3.146666666666667e-05, 'samples': 60800, 'steps': 118, 'loss/train': 6.552905082702637} -09/20/2021 14:53:54 - INFO - __main__ - Step 1901: {'lr': 3.146666666666667e-05, 'samples': 60832, 'steps': 118, 'loss/train': 7.613687038421631} -09/20/2021 14:53:55 - INFO - __main__ - Step 1902: {'lr': 3.146666666666667e-05, 'samples': 60864, 'steps': 118, 'loss/train': 7.496888160705566} -09/20/2021 14:53:55 - INFO - __main__ - Step 1903: {'lr': 3.146666666666667e-05, 'samples': 60896, 'steps': 118, 'loss/train': 6.640780448913574} -09/20/2021 14:53:56 - INFO - __main__ - Step 1904: {'lr': 3.146666666666667e-05, 'samples': 60928, 'steps': 118, 'loss/train': 6.691221237182617} -09/20/2021 14:53:57 - INFO - __main__ - Step 1905: {'lr': 3.173333333333334e-05, 'samples': 60960, 'steps': 119, 'loss/train': 6.357285976409912} -09/20/2021 14:53:58 - INFO - __main__ - Step 1906: {'lr': 3.173333333333334e-05, 'samples': 60992, 'steps': 119, 'loss/train': 5.749533176422119} -09/20/2021 14:53:59 - INFO - __main__ - Step 1907: {'lr': 3.173333333333334e-05, 'samples': 61024, 'steps': 119, 'loss/train': 6.260130405426025} -09/20/2021 14:53:59 - INFO - __main__ - Step 1908: {'lr': 3.173333333333334e-05, 'samples': 61056, 'steps': 119, 'loss/train': 6.113763332366943} -09/20/2021 14:54:00 - INFO - __main__ - Step 1909: {'lr': 3.173333333333334e-05, 'samples': 61088, 'steps': 119, 'loss/train': 5.928813457489014} -09/20/2021 14:54:01 - INFO - __main__ - Step 1910: {'lr': 3.173333333333334e-05, 'samples': 61120, 'steps': 119, 'loss/train': 6.324496746063232} -09/20/2021 14:54:02 - INFO - __main__ - Step 1911: {'lr': 3.173333333333334e-05, 'samples': 61152, 'steps': 119, 'loss/train': 6.9030327796936035} -09/20/2021 14:54:02 - INFO - __main__ - Step 1912: {'lr': 3.173333333333334e-05, 'samples': 61184, 'steps': 119, 'loss/train': 6.2621073722839355} -09/20/2021 14:54:03 - INFO - __main__ - Step 1913: {'lr': 3.173333333333334e-05, 'samples': 61216, 'steps': 119, 'loss/train': 6.907510280609131} -09/20/2021 14:54:04 - INFO - __main__ - Step 1914: {'lr': 3.173333333333334e-05, 'samples': 61248, 'steps': 119, 'loss/train': 6.919442176818848} -09/20/2021 14:54:05 - INFO - __main__ - Step 1915: {'lr': 3.173333333333334e-05, 'samples': 61280, 'steps': 119, 'loss/train': 6.066860198974609} -09/20/2021 14:54:05 - INFO - __main__ - Step 1916: {'lr': 3.173333333333334e-05, 'samples': 61312, 'steps': 119, 'loss/train': 6.19516658782959} -09/20/2021 14:54:06 - INFO - __main__ - Step 1917: {'lr': 3.173333333333334e-05, 'samples': 61344, 'steps': 119, 'loss/train': 6.030703544616699} -09/20/2021 14:54:07 - INFO - __main__ - Step 1918: {'lr': 3.173333333333334e-05, 'samples': 61376, 'steps': 119, 'loss/train': 6.0235700607299805} -09/20/2021 14:54:08 - INFO - __main__ - Step 1919: {'lr': 3.173333333333334e-05, 'samples': 61408, 'steps': 119, 'loss/train': 6.253647327423096} -09/20/2021 14:54:08 - INFO - __main__ - Step 1920: {'lr': 3.173333333333334e-05, 'samples': 61440, 'steps': 119, 'loss/train': 6.668237209320068} -09/20/2021 14:54:09 - INFO - __main__ - Step 1921: {'lr': 3.2000000000000005e-05, 'samples': 61472, 'steps': 120, 'loss/train': 6.7220282554626465} -09/20/2021 14:54:10 - INFO - __main__ - Step 1922: {'lr': 3.2000000000000005e-05, 'samples': 61504, 'steps': 120, 'loss/train': 7.225880146026611} -09/20/2021 14:54:11 - INFO - __main__ - Step 1923: {'lr': 3.2000000000000005e-05, 'samples': 61536, 'steps': 120, 'loss/train': 5.877377033233643} -09/20/2021 14:54:12 - INFO - __main__ - Step 1924: {'lr': 3.2000000000000005e-05, 'samples': 61568, 'steps': 120, 'loss/train': 6.101190090179443} -09/20/2021 14:54:12 - INFO - __main__ - Step 1925: {'lr': 3.2000000000000005e-05, 'samples': 61600, 'steps': 120, 'loss/train': 6.772882461547852} -09/20/2021 14:54:13 - INFO - __main__ - Step 1926: {'lr': 3.2000000000000005e-05, 'samples': 61632, 'steps': 120, 'loss/train': 7.03941535949707} -09/20/2021 14:54:14 - INFO - __main__ - Step 1927: {'lr': 3.2000000000000005e-05, 'samples': 61664, 'steps': 120, 'loss/train': 5.686518669128418} -09/20/2021 14:54:15 - INFO - __main__ - Step 1928: {'lr': 3.2000000000000005e-05, 'samples': 61696, 'steps': 120, 'loss/train': 6.172118186950684} -09/20/2021 14:54:16 - INFO - __main__ - Step 1929: {'lr': 3.2000000000000005e-05, 'samples': 61728, 'steps': 120, 'loss/train': 6.176890850067139} -09/20/2021 14:54:17 - INFO - __main__ - Step 1930: {'lr': 3.2000000000000005e-05, 'samples': 61760, 'steps': 120, 'loss/train': 6.951632022857666} -09/20/2021 14:54:18 - INFO - __main__ - Step 1931: {'lr': 3.2000000000000005e-05, 'samples': 61792, 'steps': 120, 'loss/train': 7.476418972015381} -09/20/2021 14:54:18 - INFO - __main__ - Step 1932: {'lr': 3.2000000000000005e-05, 'samples': 61824, 'steps': 120, 'loss/train': 6.6551408767700195} -09/20/2021 14:54:19 - INFO - __main__ - Step 1933: {'lr': 3.2000000000000005e-05, 'samples': 61856, 'steps': 120, 'loss/train': 7.063642501831055} -09/20/2021 14:54:20 - INFO - __main__ - Step 1934: {'lr': 3.2000000000000005e-05, 'samples': 61888, 'steps': 120, 'loss/train': 6.309464931488037} -09/20/2021 14:54:21 - INFO - __main__ - Step 1935: {'lr': 3.2000000000000005e-05, 'samples': 61920, 'steps': 120, 'loss/train': 6.443771839141846} -09/20/2021 14:54:21 - INFO - __main__ - Step 1936: {'lr': 3.2000000000000005e-05, 'samples': 61952, 'steps': 120, 'loss/train': 7.567537784576416} -09/20/2021 14:54:22 - INFO - __main__ - Step 1937: {'lr': 3.226666666666667e-05, 'samples': 61984, 'steps': 121, 'loss/train': 6.373986721038818} -09/20/2021 14:54:23 - INFO - __main__ - Step 1938: {'lr': 3.226666666666667e-05, 'samples': 62016, 'steps': 121, 'loss/train': 5.809113025665283} -09/20/2021 14:54:24 - INFO - __main__ - Step 1939: {'lr': 3.226666666666667e-05, 'samples': 62048, 'steps': 121, 'loss/train': 6.998230457305908} -09/20/2021 14:54:24 - INFO - __main__ - Step 1940: {'lr': 3.226666666666667e-05, 'samples': 62080, 'steps': 121, 'loss/train': 6.567509651184082} -09/20/2021 14:54:25 - INFO - __main__ - Step 1941: {'lr': 3.226666666666667e-05, 'samples': 62112, 'steps': 121, 'loss/train': 6.121049404144287} -09/20/2021 14:54:26 - INFO - __main__ - Step 1942: {'lr': 3.226666666666667e-05, 'samples': 62144, 'steps': 121, 'loss/train': 6.006470203399658} -09/20/2021 14:54:27 - INFO - __main__ - Step 1943: {'lr': 3.226666666666667e-05, 'samples': 62176, 'steps': 121, 'loss/train': 6.868433475494385} -09/20/2021 14:54:27 - INFO - __main__ - Step 1944: {'lr': 3.226666666666667e-05, 'samples': 62208, 'steps': 121, 'loss/train': 6.2845587730407715} -09/20/2021 14:54:28 - INFO - __main__ - Step 1945: {'lr': 3.226666666666667e-05, 'samples': 62240, 'steps': 121, 'loss/train': 5.991539478302002} -09/20/2021 14:54:29 - INFO - __main__ - Step 1946: {'lr': 3.226666666666667e-05, 'samples': 62272, 'steps': 121, 'loss/train': 6.73064661026001} -09/20/2021 14:54:30 - INFO - __main__ - Step 1947: {'lr': 3.226666666666667e-05, 'samples': 62304, 'steps': 121, 'loss/train': 5.678685665130615} -09/20/2021 14:54:30 - INFO - __main__ - Step 1948: {'lr': 3.226666666666667e-05, 'samples': 62336, 'steps': 121, 'loss/train': 6.379401206970215} -09/20/2021 14:54:31 - INFO - __main__ - Step 1949: {'lr': 3.226666666666667e-05, 'samples': 62368, 'steps': 121, 'loss/train': 6.164097785949707} -09/20/2021 14:54:32 - INFO - __main__ - Step 1950: {'lr': 3.226666666666667e-05, 'samples': 62400, 'steps': 121, 'loss/train': 6.33875846862793} -09/20/2021 14:54:33 - INFO - __main__ - Step 1951: {'lr': 3.226666666666667e-05, 'samples': 62432, 'steps': 121, 'loss/train': 6.789287567138672} -09/20/2021 14:54:33 - INFO - __main__ - Step 1952: {'lr': 3.226666666666667e-05, 'samples': 62464, 'steps': 121, 'loss/train': 6.376349449157715} -09/20/2021 14:54:34 - INFO - __main__ - Step 1953: {'lr': 3.253333333333333e-05, 'samples': 62496, 'steps': 122, 'loss/train': 6.907968997955322} -09/20/2021 14:54:35 - INFO - __main__ - Step 1954: {'lr': 3.253333333333333e-05, 'samples': 62528, 'steps': 122, 'loss/train': 6.073740482330322} -09/20/2021 14:54:36 - INFO - __main__ - Step 1955: {'lr': 3.253333333333333e-05, 'samples': 62560, 'steps': 122, 'loss/train': 6.592769622802734} -09/20/2021 14:54:37 - INFO - __main__ - Step 1956: {'lr': 3.253333333333333e-05, 'samples': 62592, 'steps': 122, 'loss/train': 6.370107173919678} -09/20/2021 14:54:37 - INFO - __main__ - Step 1957: {'lr': 3.253333333333333e-05, 'samples': 62624, 'steps': 122, 'loss/train': 6.757734775543213} -09/20/2021 14:54:38 - INFO - __main__ - Step 1958: {'lr': 3.253333333333333e-05, 'samples': 62656, 'steps': 122, 'loss/train': 6.560579776763916} -09/20/2021 14:54:39 - INFO - __main__ - Step 1959: {'lr': 3.253333333333333e-05, 'samples': 62688, 'steps': 122, 'loss/train': 5.919027328491211} -09/20/2021 14:54:40 - INFO - __main__ - Step 1960: {'lr': 3.253333333333333e-05, 'samples': 62720, 'steps': 122, 'loss/train': 5.652429103851318} -09/20/2021 14:54:40 - INFO - __main__ - Step 1961: {'lr': 3.253333333333333e-05, 'samples': 62752, 'steps': 122, 'loss/train': 5.35901403427124} -09/20/2021 14:54:42 - INFO - __main__ - Step 1962: {'lr': 3.253333333333333e-05, 'samples': 62784, 'steps': 122, 'loss/train': 5.628092288970947} -09/20/2021 14:54:43 - INFO - __main__ - Step 1963: {'lr': 3.253333333333333e-05, 'samples': 62816, 'steps': 122, 'loss/train': 6.9239420890808105} -09/20/2021 14:54:44 - INFO - __main__ - Step 1964: {'lr': 3.253333333333333e-05, 'samples': 62848, 'steps': 122, 'loss/train': 6.485635280609131} -09/20/2021 14:54:44 - INFO - __main__ - Step 1965: {'lr': 3.253333333333333e-05, 'samples': 62880, 'steps': 122, 'loss/train': 7.250100135803223} -09/20/2021 14:54:45 - INFO - __main__ - Step 1966: {'lr': 3.253333333333333e-05, 'samples': 62912, 'steps': 122, 'loss/train': 6.306426048278809} -09/20/2021 14:54:46 - INFO - __main__ - Step 1967: {'lr': 3.253333333333333e-05, 'samples': 62944, 'steps': 122, 'loss/train': 5.821731090545654} -09/20/2021 14:54:47 - INFO - __main__ - Step 1968: {'lr': 3.253333333333333e-05, 'samples': 62976, 'steps': 122, 'loss/train': 5.892029285430908} -09/20/2021 14:54:47 - INFO - __main__ - Step 1969: {'lr': 3.2800000000000004e-05, 'samples': 63008, 'steps': 123, 'loss/train': 7.311915397644043} -09/20/2021 14:54:48 - INFO - __main__ - Step 1970: {'lr': 3.2800000000000004e-05, 'samples': 63040, 'steps': 123, 'loss/train': 6.095775604248047} -09/20/2021 14:54:49 - INFO - __main__ - Step 1971: {'lr': 3.2800000000000004e-05, 'samples': 63072, 'steps': 123, 'loss/train': 6.64158821105957} -09/20/2021 14:54:50 - INFO - __main__ - Step 1972: {'lr': 3.2800000000000004e-05, 'samples': 63104, 'steps': 123, 'loss/train': 7.547395706176758} -09/20/2021 14:54:50 - INFO - __main__ - Step 1973: {'lr': 3.2800000000000004e-05, 'samples': 63136, 'steps': 123, 'loss/train': 5.962305545806885} -09/20/2021 14:54:51 - INFO - __main__ - Step 1974: {'lr': 3.2800000000000004e-05, 'samples': 63168, 'steps': 123, 'loss/train': 6.34151029586792} -09/20/2021 14:54:52 - INFO - __main__ - Step 1975: {'lr': 3.2800000000000004e-05, 'samples': 63200, 'steps': 123, 'loss/train': 6.862957954406738} -09/20/2021 14:54:53 - INFO - __main__ - Step 1976: {'lr': 3.2800000000000004e-05, 'samples': 63232, 'steps': 123, 'loss/train': 5.606734275817871} -09/20/2021 14:54:53 - INFO - __main__ - Step 1977: {'lr': 3.2800000000000004e-05, 'samples': 63264, 'steps': 123, 'loss/train': 6.583481311798096} -09/20/2021 14:54:54 - INFO - __main__ - Step 1978: {'lr': 3.2800000000000004e-05, 'samples': 63296, 'steps': 123, 'loss/train': 5.8029093742370605} -09/20/2021 14:54:55 - INFO - __main__ - Step 1979: {'lr': 3.2800000000000004e-05, 'samples': 63328, 'steps': 123, 'loss/train': 6.4618682861328125} -09/20/2021 14:54:56 - INFO - __main__ - Step 1980: {'lr': 3.2800000000000004e-05, 'samples': 63360, 'steps': 123, 'loss/train': 7.396381855010986} -09/20/2021 14:54:56 - INFO - __main__ - Step 1981: {'lr': 3.2800000000000004e-05, 'samples': 63392, 'steps': 123, 'loss/train': 8.172107696533203} -09/20/2021 14:54:57 - INFO - __main__ - Step 1982: {'lr': 3.2800000000000004e-05, 'samples': 63424, 'steps': 123, 'loss/train': 7.319507122039795} -09/20/2021 14:54:58 - INFO - __main__ - Step 1983: {'lr': 3.2800000000000004e-05, 'samples': 63456, 'steps': 123, 'loss/train': 6.671170711517334} -09/20/2021 14:54:59 - INFO - __main__ - Step 1984: {'lr': 3.2800000000000004e-05, 'samples': 63488, 'steps': 123, 'loss/train': 5.778025150299072} -09/20/2021 14:55:00 - INFO - __main__ - Step 1985: {'lr': 3.3066666666666666e-05, 'samples': 63520, 'steps': 124, 'loss/train': 4.405661106109619} -09/20/2021 14:55:00 - INFO - __main__ - Step 1986: {'lr': 3.3066666666666666e-05, 'samples': 63552, 'steps': 124, 'loss/train': 4.566370010375977} -09/20/2021 14:55:01 - INFO - __main__ - Step 1987: {'lr': 3.3066666666666666e-05, 'samples': 63584, 'steps': 124, 'loss/train': 5.178475379943848} -09/20/2021 14:55:02 - INFO - __main__ - Step 1988: {'lr': 3.3066666666666666e-05, 'samples': 63616, 'steps': 124, 'loss/train': 4.997365951538086} -09/20/2021 14:55:03 - INFO - __main__ - Step 1989: {'lr': 3.3066666666666666e-05, 'samples': 63648, 'steps': 124, 'loss/train': 6.4608354568481445} -09/20/2021 14:55:03 - INFO - __main__ - Step 1990: {'lr': 3.3066666666666666e-05, 'samples': 63680, 'steps': 124, 'loss/train': 6.393615245819092} -09/20/2021 14:55:04 - INFO - __main__ - Step 1991: {'lr': 3.3066666666666666e-05, 'samples': 63712, 'steps': 124, 'loss/train': 6.537259101867676} -09/20/2021 14:55:05 - INFO - __main__ - Step 1992: {'lr': 3.3066666666666666e-05, 'samples': 63744, 'steps': 124, 'loss/train': 6.081437110900879} -09/20/2021 14:55:06 - INFO - __main__ - Step 1993: {'lr': 3.3066666666666666e-05, 'samples': 63776, 'steps': 124, 'loss/train': 6.910190582275391} -09/20/2021 14:55:06 - INFO - __main__ - Step 1994: {'lr': 3.3066666666666666e-05, 'samples': 63808, 'steps': 124, 'loss/train': 6.5122151374816895} -09/20/2021 14:55:07 - INFO - __main__ - Step 1995: {'lr': 3.3066666666666666e-05, 'samples': 63840, 'steps': 124, 'loss/train': 5.915347099304199} -09/20/2021 14:55:08 - INFO - __main__ - Step 1996: {'lr': 3.3066666666666666e-05, 'samples': 63872, 'steps': 124, 'loss/train': 7.024527549743652} -09/20/2021 14:55:09 - INFO - __main__ - Step 1997: {'lr': 3.3066666666666666e-05, 'samples': 63904, 'steps': 124, 'loss/train': 5.830668926239014} -09/20/2021 14:55:09 - INFO - __main__ - Step 1998: {'lr': 3.3066666666666666e-05, 'samples': 63936, 'steps': 124, 'loss/train': 7.073484897613525} -09/20/2021 14:55:11 - INFO - __main__ - Step 1999: {'lr': 3.3066666666666666e-05, 'samples': 63968, 'steps': 124, 'loss/train': 5.81990385055542} -09/20/2021 14:55:11 - INFO - __main__ - Step 2000: {'lr': 3.3066666666666666e-05, 'samples': 64000, 'steps': 124, 'loss/train': 6.440719127655029} -09/20/2021 14:55:12 - INFO - __main__ - Step 2001: {'lr': 3.3333333333333335e-05, 'samples': 64032, 'steps': 125, 'loss/train': 6.64794921875} -09/20/2021 14:55:13 - INFO - __main__ - Step 2002: {'lr': 3.3333333333333335e-05, 'samples': 64064, 'steps': 125, 'loss/train': 6.54712438583374} -09/20/2021 14:55:14 - INFO - __main__ - Step 2003: {'lr': 3.3333333333333335e-05, 'samples': 64096, 'steps': 125, 'loss/train': 6.3478803634643555} -09/20/2021 14:55:15 - INFO - __main__ - Step 2004: {'lr': 3.3333333333333335e-05, 'samples': 64128, 'steps': 125, 'loss/train': 7.367883682250977} -09/20/2021 14:55:15 - INFO - __main__ - Step 2005: {'lr': 3.3333333333333335e-05, 'samples': 64160, 'steps': 125, 'loss/train': 6.258336067199707} -09/20/2021 14:55:16 - INFO - __main__ - Step 2006: {'lr': 3.3333333333333335e-05, 'samples': 64192, 'steps': 125, 'loss/train': 6.45767879486084} -09/20/2021 14:55:17 - INFO - __main__ - Step 2007: {'lr': 3.3333333333333335e-05, 'samples': 64224, 'steps': 125, 'loss/train': 6.390842437744141} -09/20/2021 14:55:18 - INFO - __main__ - Step 2008: {'lr': 3.3333333333333335e-05, 'samples': 64256, 'steps': 125, 'loss/train': 6.109151840209961} -09/20/2021 14:55:18 - INFO - __main__ - Step 2009: {'lr': 3.3333333333333335e-05, 'samples': 64288, 'steps': 125, 'loss/train': 7.151824474334717} -09/20/2021 14:55:19 - INFO - __main__ - Step 2010: {'lr': 3.3333333333333335e-05, 'samples': 64320, 'steps': 125, 'loss/train': 6.7014546394348145} -09/20/2021 14:55:20 - INFO - __main__ - Step 2011: {'lr': 3.3333333333333335e-05, 'samples': 64352, 'steps': 125, 'loss/train': 6.1796674728393555} -09/20/2021 14:55:21 - INFO - __main__ - Step 2012: {'lr': 3.3333333333333335e-05, 'samples': 64384, 'steps': 125, 'loss/train': 7.809508323669434} -09/20/2021 14:55:21 - INFO - __main__ - Step 2013: {'lr': 3.3333333333333335e-05, 'samples': 64416, 'steps': 125, 'loss/train': 7.699117183685303} -09/20/2021 14:55:22 - INFO - __main__ - Step 2014: {'lr': 3.3333333333333335e-05, 'samples': 64448, 'steps': 125, 'loss/train': 5.629843235015869} -09/20/2021 14:55:23 - INFO - __main__ - Step 2015: {'lr': 3.3333333333333335e-05, 'samples': 64480, 'steps': 125, 'loss/train': 6.366392612457275} -09/20/2021 14:55:24 - INFO - __main__ - Step 2016: {'lr': 3.3333333333333335e-05, 'samples': 64512, 'steps': 125, 'loss/train': 5.659280776977539} -09/20/2021 14:55:24 - INFO - __main__ - Step 2017: {'lr': 3.3600000000000004e-05, 'samples': 64544, 'steps': 126, 'loss/train': 6.28075647354126} -09/20/2021 14:55:25 - INFO - __main__ - Step 2018: {'lr': 3.3600000000000004e-05, 'samples': 64576, 'steps': 126, 'loss/train': 6.326210021972656} -09/20/2021 14:55:26 - INFO - __main__ - Step 2019: {'lr': 3.3600000000000004e-05, 'samples': 64608, 'steps': 126, 'loss/train': 6.4523820877075195} -09/20/2021 14:55:27 - INFO - __main__ - Step 2020: {'lr': 3.3600000000000004e-05, 'samples': 64640, 'steps': 126, 'loss/train': 5.884279727935791} -09/20/2021 14:55:27 - INFO - __main__ - Step 2021: {'lr': 3.3600000000000004e-05, 'samples': 64672, 'steps': 126, 'loss/train': 6.232954025268555} -09/20/2021 14:55:28 - INFO - __main__ - Step 2022: {'lr': 3.3600000000000004e-05, 'samples': 64704, 'steps': 126, 'loss/train': 5.908555507659912} -09/20/2021 14:55:29 - INFO - __main__ - Step 2023: {'lr': 3.3600000000000004e-05, 'samples': 64736, 'steps': 126, 'loss/train': 6.097986698150635} -09/20/2021 14:55:30 - INFO - __main__ - Step 2024: {'lr': 3.3600000000000004e-05, 'samples': 64768, 'steps': 126, 'loss/train': 4.3818254470825195} -09/20/2021 14:55:30 - INFO - __main__ - Step 2025: {'lr': 3.3600000000000004e-05, 'samples': 64800, 'steps': 126, 'loss/train': 6.401528358459473} -09/20/2021 14:55:31 - INFO - __main__ - Step 2026: {'lr': 3.3600000000000004e-05, 'samples': 64832, 'steps': 126, 'loss/train': 6.639707088470459} -09/20/2021 14:55:32 - INFO - __main__ - Step 2027: {'lr': 3.3600000000000004e-05, 'samples': 64864, 'steps': 126, 'loss/train': 6.289498329162598} -09/20/2021 14:55:33 - INFO - __main__ - Step 2028: {'lr': 3.3600000000000004e-05, 'samples': 64896, 'steps': 126, 'loss/train': 6.45504093170166} -09/20/2021 14:55:34 - INFO - __main__ - Step 2029: {'lr': 3.3600000000000004e-05, 'samples': 64928, 'steps': 126, 'loss/train': 6.6306233406066895} -09/20/2021 14:55:35 - INFO - __main__ - Step 2030: {'lr': 3.3600000000000004e-05, 'samples': 64960, 'steps': 126, 'loss/train': 6.729381084442139} -09/20/2021 14:55:35 - INFO - __main__ - Step 2031: {'lr': 3.3600000000000004e-05, 'samples': 64992, 'steps': 126, 'loss/train': 6.067564487457275} -09/20/2021 14:55:36 - INFO - __main__ - Step 2032: {'lr': 3.3600000000000004e-05, 'samples': 65024, 'steps': 126, 'loss/train': 6.047272682189941} -09/20/2021 14:55:37 - INFO - __main__ - Step 2033: {'lr': 3.3866666666666665e-05, 'samples': 65056, 'steps': 127, 'loss/train': 5.915857315063477} -09/20/2021 14:55:38 - INFO - __main__ - Step 2034: {'lr': 3.3866666666666665e-05, 'samples': 65088, 'steps': 127, 'loss/train': 5.964664936065674} -09/20/2021 14:55:39 - INFO - __main__ - Step 2035: {'lr': 3.3866666666666665e-05, 'samples': 65120, 'steps': 127, 'loss/train': 6.899428367614746} -09/20/2021 14:55:39 - INFO - __main__ - Step 2036: {'lr': 3.3866666666666665e-05, 'samples': 65152, 'steps': 127, 'loss/train': 6.394204616546631} -09/20/2021 14:55:40 - INFO - __main__ - Step 2037: {'lr': 3.3866666666666665e-05, 'samples': 65184, 'steps': 127, 'loss/train': 7.054864406585693} -09/20/2021 14:55:41 - INFO - __main__ - Step 2038: {'lr': 3.3866666666666665e-05, 'samples': 65216, 'steps': 127, 'loss/train': 6.473769187927246} -09/20/2021 14:55:42 - INFO - __main__ - Step 2039: {'lr': 3.3866666666666665e-05, 'samples': 65248, 'steps': 127, 'loss/train': 6.066195011138916} -09/20/2021 14:55:42 - INFO - __main__ - Step 2040: {'lr': 3.3866666666666665e-05, 'samples': 65280, 'steps': 127, 'loss/train': 6.5058770179748535} -09/20/2021 14:55:43 - INFO - __main__ - Step 2041: {'lr': 3.3866666666666665e-05, 'samples': 65312, 'steps': 127, 'loss/train': 5.389967441558838} -09/20/2021 14:55:44 - INFO - __main__ - Step 2042: {'lr': 3.3866666666666665e-05, 'samples': 65344, 'steps': 127, 'loss/train': 6.509215831756592} -09/20/2021 14:55:45 - INFO - __main__ - Step 2043: {'lr': 3.3866666666666665e-05, 'samples': 65376, 'steps': 127, 'loss/train': 6.527456283569336} -09/20/2021 14:55:45 - INFO - __main__ - Step 2044: {'lr': 3.3866666666666665e-05, 'samples': 65408, 'steps': 127, 'loss/train': 6.726210117340088} -09/20/2021 14:55:46 - INFO - __main__ - Step 2045: {'lr': 3.3866666666666665e-05, 'samples': 65440, 'steps': 127, 'loss/train': 6.482949733734131} -09/20/2021 14:55:47 - INFO - __main__ - Step 2046: {'lr': 3.3866666666666665e-05, 'samples': 65472, 'steps': 127, 'loss/train': 6.088095664978027} -09/20/2021 14:55:48 - INFO - __main__ - Step 2047: {'lr': 3.3866666666666665e-05, 'samples': 65504, 'steps': 127, 'loss/train': 6.5499067306518555} -09/20/2021 14:55:48 - INFO - __main__ - Step 2048: {'lr': 3.3866666666666665e-05, 'samples': 65536, 'steps': 127, 'loss/train': 6.690189838409424} -09/20/2021 14:55:49 - INFO - __main__ - Step 2049: {'lr': 3.4133333333333334e-05, 'samples': 65568, 'steps': 128, 'loss/train': 6.124640941619873} -09/20/2021 14:55:50 - INFO - __main__ - Step 2050: {'lr': 3.4133333333333334e-05, 'samples': 65600, 'steps': 128, 'loss/train': 6.396017551422119} -09/20/2021 14:55:51 - INFO - __main__ - Step 2051: {'lr': 3.4133333333333334e-05, 'samples': 65632, 'steps': 128, 'loss/train': 6.586300373077393} -09/20/2021 14:55:51 - INFO - __main__ - Step 2052: {'lr': 3.4133333333333334e-05, 'samples': 65664, 'steps': 128, 'loss/train': 5.475715160369873} -09/20/2021 14:55:52 - INFO - __main__ - Step 2053: {'lr': 3.4133333333333334e-05, 'samples': 65696, 'steps': 128, 'loss/train': 5.398143291473389} -09/20/2021 14:55:53 - INFO - __main__ - Step 2054: {'lr': 3.4133333333333334e-05, 'samples': 65728, 'steps': 128, 'loss/train': 6.514486789703369} -09/20/2021 14:55:54 - INFO - __main__ - Step 2055: {'lr': 3.4133333333333334e-05, 'samples': 65760, 'steps': 128, 'loss/train': 5.439901828765869} -09/20/2021 14:55:54 - INFO - __main__ - Step 2056: {'lr': 3.4133333333333334e-05, 'samples': 65792, 'steps': 128, 'loss/train': 6.273301124572754} -09/20/2021 14:55:55 - INFO - __main__ - Step 2057: {'lr': 3.4133333333333334e-05, 'samples': 65824, 'steps': 128, 'loss/train': 6.217965126037598} -09/20/2021 14:55:56 - INFO - __main__ - Step 2058: {'lr': 3.4133333333333334e-05, 'samples': 65856, 'steps': 128, 'loss/train': 6.105907917022705} -09/20/2021 14:55:57 - INFO - __main__ - Step 2059: {'lr': 3.4133333333333334e-05, 'samples': 65888, 'steps': 128, 'loss/train': 6.138664722442627} -09/20/2021 14:55:58 - INFO - __main__ - Step 2060: {'lr': 3.4133333333333334e-05, 'samples': 65920, 'steps': 128, 'loss/train': 6.56662654876709} -09/20/2021 14:55:59 - INFO - __main__ - Step 2061: {'lr': 3.4133333333333334e-05, 'samples': 65952, 'steps': 128, 'loss/train': 5.557608127593994} -09/20/2021 14:56:00 - INFO - __main__ - Step 2062: {'lr': 3.4133333333333334e-05, 'samples': 65984, 'steps': 128, 'loss/train': 6.015231609344482} -09/20/2021 14:56:01 - INFO - __main__ - Step 2063: {'lr': 3.4133333333333334e-05, 'samples': 66016, 'steps': 128, 'loss/train': 5.549841403961182} -09/20/2021 14:56:01 - INFO - __main__ - Step 2064: {'lr': 3.4133333333333334e-05, 'samples': 66048, 'steps': 128, 'loss/train': 6.349067211151123} -09/20/2021 14:56:02 - INFO - __main__ - Step 2065: {'lr': 3.4399999999999996e-05, 'samples': 66080, 'steps': 129, 'loss/train': 6.0792555809021} -09/20/2021 14:56:03 - INFO - __main__ - Step 2066: {'lr': 3.4399999999999996e-05, 'samples': 66112, 'steps': 129, 'loss/train': 6.679035663604736} -09/20/2021 14:56:04 - INFO - __main__ - Step 2067: {'lr': 3.4399999999999996e-05, 'samples': 66144, 'steps': 129, 'loss/train': 6.098395824432373} -09/20/2021 14:56:04 - INFO - __main__ - Step 2068: {'lr': 3.4399999999999996e-05, 'samples': 66176, 'steps': 129, 'loss/train': 6.435916900634766} -09/20/2021 14:56:05 - INFO - __main__ - Step 2069: {'lr': 3.4399999999999996e-05, 'samples': 66208, 'steps': 129, 'loss/train': 6.311293125152588} -09/20/2021 14:56:06 - INFO - __main__ - Step 2070: {'lr': 3.4399999999999996e-05, 'samples': 66240, 'steps': 129, 'loss/train': 6.287459373474121} -09/20/2021 14:56:07 - INFO - __main__ - Step 2071: {'lr': 3.4399999999999996e-05, 'samples': 66272, 'steps': 129, 'loss/train': 5.564125061035156} -09/20/2021 14:56:07 - INFO - __main__ - Step 2072: {'lr': 3.4399999999999996e-05, 'samples': 66304, 'steps': 129, 'loss/train': 7.779865741729736} -09/20/2021 14:56:08 - INFO - __main__ - Step 2073: {'lr': 3.4399999999999996e-05, 'samples': 66336, 'steps': 129, 'loss/train': 7.211065292358398} -09/20/2021 14:56:09 - INFO - __main__ - Step 2074: {'lr': 3.4399999999999996e-05, 'samples': 66368, 'steps': 129, 'loss/train': 5.333184242248535} -09/20/2021 14:56:10 - INFO - __main__ - Step 2075: {'lr': 3.4399999999999996e-05, 'samples': 66400, 'steps': 129, 'loss/train': 6.190690517425537} -09/20/2021 14:56:10 - INFO - __main__ - Step 2076: {'lr': 3.4399999999999996e-05, 'samples': 66432, 'steps': 129, 'loss/train': 6.0703349113464355} -09/20/2021 14:56:11 - INFO - __main__ - Step 2077: {'lr': 3.4399999999999996e-05, 'samples': 66464, 'steps': 129, 'loss/train': 5.776200771331787} -09/20/2021 14:56:12 - INFO - __main__ - Step 2078: {'lr': 3.4399999999999996e-05, 'samples': 66496, 'steps': 129, 'loss/train': 6.488077163696289} -09/20/2021 14:56:13 - INFO - __main__ - Step 2079: {'lr': 3.4399999999999996e-05, 'samples': 66528, 'steps': 129, 'loss/train': 6.223832130432129} -09/20/2021 14:56:13 - INFO - __main__ - Step 2080: {'lr': 3.4399999999999996e-05, 'samples': 66560, 'steps': 129, 'loss/train': 5.871718406677246} -09/20/2021 14:56:14 - INFO - __main__ - Step 2081: {'lr': 3.466666666666667e-05, 'samples': 66592, 'steps': 130, 'loss/train': 6.274418354034424} -09/20/2021 14:56:15 - INFO - __main__ - Step 2082: {'lr': 3.466666666666667e-05, 'samples': 66624, 'steps': 130, 'loss/train': 5.651094913482666} -09/20/2021 14:56:16 - INFO - __main__ - Step 2083: {'lr': 3.466666666666667e-05, 'samples': 66656, 'steps': 130, 'loss/train': 6.3765411376953125} -09/20/2021 14:56:17 - INFO - __main__ - Step 2084: {'lr': 3.466666666666667e-05, 'samples': 66688, 'steps': 130, 'loss/train': 6.804633617401123} -09/20/2021 14:56:17 - INFO - __main__ - Step 2085: {'lr': 3.466666666666667e-05, 'samples': 66720, 'steps': 130, 'loss/train': 6.330347061157227} -09/20/2021 14:56:18 - INFO - __main__ - Step 2086: {'lr': 3.466666666666667e-05, 'samples': 66752, 'steps': 130, 'loss/train': 6.304810047149658} -09/20/2021 14:56:19 - INFO - __main__ - Step 2087: {'lr': 3.466666666666667e-05, 'samples': 66784, 'steps': 130, 'loss/train': 6.19861364364624} -09/20/2021 14:56:20 - INFO - __main__ - Step 2088: {'lr': 3.466666666666667e-05, 'samples': 66816, 'steps': 130, 'loss/train': 7.008781433105469} -09/20/2021 14:56:20 - INFO - __main__ - Step 2089: {'lr': 3.466666666666667e-05, 'samples': 66848, 'steps': 130, 'loss/train': 6.697539806365967} -09/20/2021 14:56:21 - INFO - __main__ - Step 2090: {'lr': 3.466666666666667e-05, 'samples': 66880, 'steps': 130, 'loss/train': 5.907107830047607} -09/20/2021 14:56:22 - INFO - __main__ - Step 2091: {'lr': 3.466666666666667e-05, 'samples': 66912, 'steps': 130, 'loss/train': 6.764490127563477} -09/20/2021 14:56:23 - INFO - __main__ - Step 2092: {'lr': 3.466666666666667e-05, 'samples': 66944, 'steps': 130, 'loss/train': 6.234456539154053} -09/20/2021 14:56:24 - INFO - __main__ - Step 2093: {'lr': 3.466666666666667e-05, 'samples': 66976, 'steps': 130, 'loss/train': 6.330366134643555} -09/20/2021 14:56:25 - INFO - __main__ - Step 2094: {'lr': 3.466666666666667e-05, 'samples': 67008, 'steps': 130, 'loss/train': 6.079643249511719} -09/20/2021 14:56:25 - INFO - __main__ - Step 2095: {'lr': 3.466666666666667e-05, 'samples': 67040, 'steps': 130, 'loss/train': 6.518743515014648} -09/20/2021 14:56:26 - INFO - __main__ - Step 2096: {'lr': 3.466666666666667e-05, 'samples': 67072, 'steps': 130, 'loss/train': 5.648323059082031} -09/20/2021 14:56:27 - INFO - __main__ - Step 2097: {'lr': 3.493333333333333e-05, 'samples': 67104, 'steps': 131, 'loss/train': 5.978809356689453} -09/20/2021 14:56:28 - INFO - __main__ - Step 2098: {'lr': 3.493333333333333e-05, 'samples': 67136, 'steps': 131, 'loss/train': 6.317226886749268} -09/20/2021 14:56:29 - INFO - __main__ - Step 2099: {'lr': 3.493333333333333e-05, 'samples': 67168, 'steps': 131, 'loss/train': 6.009545803070068} -09/20/2021 14:56:29 - INFO - __main__ - Step 2100: {'lr': 3.493333333333333e-05, 'samples': 67200, 'steps': 131, 'loss/train': 6.624419689178467} -09/20/2021 14:56:30 - INFO - __main__ - Step 2101: {'lr': 3.493333333333333e-05, 'samples': 67232, 'steps': 131, 'loss/train': 6.0318098068237305} -09/20/2021 14:56:31 - INFO - __main__ - Step 2102: {'lr': 3.493333333333333e-05, 'samples': 67264, 'steps': 131, 'loss/train': 6.821030139923096} -09/20/2021 14:56:32 - INFO - __main__ - Step 2103: {'lr': 3.493333333333333e-05, 'samples': 67296, 'steps': 131, 'loss/train': 6.12054443359375} -09/20/2021 14:56:32 - INFO - __main__ - Step 2104: {'lr': 3.493333333333333e-05, 'samples': 67328, 'steps': 131, 'loss/train': 6.306761741638184} -09/20/2021 14:56:33 - INFO - __main__ - Step 2105: {'lr': 3.493333333333333e-05, 'samples': 67360, 'steps': 131, 'loss/train': 7.64954137802124} -09/20/2021 14:56:34 - INFO - __main__ - Step 2106: {'lr': 3.493333333333333e-05, 'samples': 67392, 'steps': 131, 'loss/train': 6.508398056030273} -09/20/2021 14:56:35 - INFO - __main__ - Step 2107: {'lr': 3.493333333333333e-05, 'samples': 67424, 'steps': 131, 'loss/train': 6.161520481109619} -09/20/2021 14:56:35 - INFO - __main__ - Step 2108: {'lr': 3.493333333333333e-05, 'samples': 67456, 'steps': 131, 'loss/train': 6.688178062438965} -09/20/2021 14:56:36 - INFO - __main__ - Step 2109: {'lr': 3.493333333333333e-05, 'samples': 67488, 'steps': 131, 'loss/train': 6.052700042724609} -09/20/2021 14:56:37 - INFO - __main__ - Step 2110: {'lr': 3.493333333333333e-05, 'samples': 67520, 'steps': 131, 'loss/train': 8.421052932739258} -09/20/2021 14:56:38 - INFO - __main__ - Step 2111: {'lr': 3.493333333333333e-05, 'samples': 67552, 'steps': 131, 'loss/train': 6.238178253173828} -09/20/2021 14:56:38 - INFO - __main__ - Step 2112: {'lr': 3.493333333333333e-05, 'samples': 67584, 'steps': 131, 'loss/train': 6.491817951202393} -09/20/2021 14:56:39 - INFO - __main__ - Step 2113: {'lr': 3.52e-05, 'samples': 67616, 'steps': 132, 'loss/train': 6.676476955413818} -09/20/2021 14:56:40 - INFO - __main__ - Step 2114: {'lr': 3.52e-05, 'samples': 67648, 'steps': 132, 'loss/train': 6.376041412353516} -09/20/2021 14:56:41 - INFO - __main__ - Step 2115: {'lr': 3.52e-05, 'samples': 67680, 'steps': 132, 'loss/train': 6.180012226104736} -09/20/2021 14:56:41 - INFO - __main__ - Step 2116: {'lr': 3.52e-05, 'samples': 67712, 'steps': 132, 'loss/train': 5.822330474853516} -09/20/2021 14:56:42 - INFO - __main__ - Step 2117: {'lr': 3.52e-05, 'samples': 67744, 'steps': 132, 'loss/train': 6.680905818939209} -09/20/2021 14:56:43 - INFO - __main__ - Step 2118: {'lr': 3.52e-05, 'samples': 67776, 'steps': 132, 'loss/train': 6.527279376983643} -09/20/2021 14:56:44 - INFO - __main__ - Step 2119: {'lr': 3.52e-05, 'samples': 67808, 'steps': 132, 'loss/train': 6.245534420013428} -09/20/2021 14:56:44 - INFO - __main__ - Step 2120: {'lr': 3.52e-05, 'samples': 67840, 'steps': 132, 'loss/train': 6.40393590927124} -09/20/2021 14:56:46 - INFO - __main__ - Step 2121: {'lr': 3.52e-05, 'samples': 67872, 'steps': 132, 'loss/train': 6.735391616821289} -09/20/2021 14:56:47 - INFO - __main__ - Step 2122: {'lr': 3.52e-05, 'samples': 67904, 'steps': 132, 'loss/train': 6.591883659362793} -09/20/2021 14:56:48 - INFO - __main__ - Step 2123: {'lr': 3.52e-05, 'samples': 67936, 'steps': 132, 'loss/train': 7.933499813079834} -09/20/2021 14:56:48 - INFO - __main__ - Step 2124: {'lr': 3.52e-05, 'samples': 67968, 'steps': 132, 'loss/train': 7.453869819641113} -09/20/2021 14:56:49 - INFO - __main__ - Step 2125: {'lr': 3.52e-05, 'samples': 68000, 'steps': 132, 'loss/train': 6.265101432800293} -09/20/2021 14:56:50 - INFO - __main__ - Step 2126: {'lr': 3.52e-05, 'samples': 68032, 'steps': 132, 'loss/train': 6.843482494354248} -09/20/2021 14:56:51 - INFO - __main__ - Step 2127: {'lr': 3.52e-05, 'samples': 68064, 'steps': 132, 'loss/train': 6.281400203704834} -09/20/2021 14:56:51 - INFO - __main__ - Step 2128: {'lr': 3.52e-05, 'samples': 68096, 'steps': 132, 'loss/train': 6.475666046142578} -09/20/2021 14:56:52 - INFO - __main__ - Step 2129: {'lr': 3.546666666666667e-05, 'samples': 68128, 'steps': 133, 'loss/train': 5.650063991546631} -09/20/2021 14:56:53 - INFO - __main__ - Step 2130: {'lr': 3.546666666666667e-05, 'samples': 68160, 'steps': 133, 'loss/train': 6.447701454162598} -09/20/2021 14:56:54 - INFO - __main__ - Step 2131: {'lr': 3.546666666666667e-05, 'samples': 68192, 'steps': 133, 'loss/train': 6.252908706665039} -09/20/2021 14:56:54 - INFO - __main__ - Step 2132: {'lr': 3.546666666666667e-05, 'samples': 68224, 'steps': 133, 'loss/train': 6.469733238220215} -09/20/2021 14:56:55 - INFO - __main__ - Step 2133: {'lr': 3.546666666666667e-05, 'samples': 68256, 'steps': 133, 'loss/train': 6.016105651855469} -09/20/2021 14:56:56 - INFO - __main__ - Step 2134: {'lr': 3.546666666666667e-05, 'samples': 68288, 'steps': 133, 'loss/train': 5.299323558807373} -09/20/2021 14:56:57 - INFO - __main__ - Step 2135: {'lr': 3.546666666666667e-05, 'samples': 68320, 'steps': 133, 'loss/train': 6.812859535217285} -09/20/2021 14:56:57 - INFO - __main__ - Step 2136: {'lr': 3.546666666666667e-05, 'samples': 68352, 'steps': 133, 'loss/train': 6.318286895751953} -09/20/2021 14:56:58 - INFO - __main__ - Step 2137: {'lr': 3.546666666666667e-05, 'samples': 68384, 'steps': 133, 'loss/train': 6.388840675354004} -09/20/2021 14:56:59 - INFO - __main__ - Step 2138: {'lr': 3.546666666666667e-05, 'samples': 68416, 'steps': 133, 'loss/train': 5.480230331420898} -09/20/2021 14:57:00 - INFO - __main__ - Step 2139: {'lr': 3.546666666666667e-05, 'samples': 68448, 'steps': 133, 'loss/train': 5.662300109863281} -09/20/2021 14:57:00 - INFO - __main__ - Step 2140: {'lr': 3.546666666666667e-05, 'samples': 68480, 'steps': 133, 'loss/train': 5.918728351593018} -09/20/2021 14:57:01 - INFO - __main__ - Step 2141: {'lr': 3.546666666666667e-05, 'samples': 68512, 'steps': 133, 'loss/train': 5.36566162109375} -09/20/2021 14:57:02 - INFO - __main__ - Step 2142: {'lr': 3.546666666666667e-05, 'samples': 68544, 'steps': 133, 'loss/train': 5.476046085357666} -09/20/2021 14:57:03 - INFO - __main__ - Step 2143: {'lr': 3.546666666666667e-05, 'samples': 68576, 'steps': 133, 'loss/train': 5.206275463104248} -09/20/2021 14:57:03 - INFO - __main__ - Step 2144: {'lr': 3.546666666666667e-05, 'samples': 68608, 'steps': 133, 'loss/train': 5.767072677612305} -09/20/2021 14:57:04 - INFO - __main__ - Step 2145: {'lr': 3.573333333333333e-05, 'samples': 68640, 'steps': 134, 'loss/train': 6.745692729949951} -09/20/2021 14:57:05 - INFO - __main__ - Step 2146: {'lr': 3.573333333333333e-05, 'samples': 68672, 'steps': 134, 'loss/train': 4.517496109008789} -09/20/2021 14:57:06 - INFO - __main__ - Step 2147: {'lr': 3.573333333333333e-05, 'samples': 68704, 'steps': 134, 'loss/train': 5.334805965423584} -09/20/2021 14:57:07 - INFO - __main__ - Step 2148: {'lr': 3.573333333333333e-05, 'samples': 68736, 'steps': 134, 'loss/train': 5.019484519958496} -09/20/2021 14:57:07 - INFO - __main__ - Step 2149: {'lr': 3.573333333333333e-05, 'samples': 68768, 'steps': 134, 'loss/train': 5.3477463722229} -09/20/2021 14:57:08 - INFO - __main__ - Step 2150: {'lr': 3.573333333333333e-05, 'samples': 68800, 'steps': 134, 'loss/train': 4.767318248748779} -09/20/2021 14:57:09 - INFO - __main__ - Step 2151: {'lr': 3.573333333333333e-05, 'samples': 68832, 'steps': 134, 'loss/train': 6.243524074554443} -09/20/2021 14:57:10 - INFO - __main__ - Step 2152: {'lr': 3.573333333333333e-05, 'samples': 68864, 'steps': 134, 'loss/train': 6.013646125793457} -09/20/2021 14:57:11 - INFO - __main__ - Step 2153: {'lr': 3.573333333333333e-05, 'samples': 68896, 'steps': 134, 'loss/train': 6.826420307159424} -09/20/2021 14:57:12 - INFO - __main__ - Step 2154: {'lr': 3.573333333333333e-05, 'samples': 68928, 'steps': 134, 'loss/train': 7.46842098236084} -09/20/2021 14:57:12 - INFO - __main__ - Step 2155: {'lr': 3.573333333333333e-05, 'samples': 68960, 'steps': 134, 'loss/train': 6.0570549964904785} -09/20/2021 14:57:13 - INFO - __main__ - Step 2156: {'lr': 3.573333333333333e-05, 'samples': 68992, 'steps': 134, 'loss/train': 7.418774604797363} -09/20/2021 14:57:14 - INFO - __main__ - Step 2157: {'lr': 3.573333333333333e-05, 'samples': 69024, 'steps': 134, 'loss/train': 5.7054595947265625} -09/20/2021 14:57:15 - INFO - __main__ - Step 2158: {'lr': 3.573333333333333e-05, 'samples': 69056, 'steps': 134, 'loss/train': 7.454160690307617} -09/20/2021 14:57:15 - INFO - __main__ - Step 2159: {'lr': 3.573333333333333e-05, 'samples': 69088, 'steps': 134, 'loss/train': 6.409165859222412} -09/20/2021 14:57:16 - INFO - __main__ - Step 2160: {'lr': 3.573333333333333e-05, 'samples': 69120, 'steps': 134, 'loss/train': 8.130443572998047} -09/20/2021 14:57:17 - INFO - __main__ - Step 2161: {'lr': 3.6e-05, 'samples': 69152, 'steps': 135, 'loss/train': 5.374846458435059} -09/20/2021 14:57:18 - INFO - __main__ - Step 2162: {'lr': 3.6e-05, 'samples': 69184, 'steps': 135, 'loss/train': 6.514156818389893} -09/20/2021 14:57:19 - INFO - __main__ - Step 2163: {'lr': 3.6e-05, 'samples': 69216, 'steps': 135, 'loss/train': 5.231129169464111} -09/20/2021 14:57:19 - INFO - __main__ - Step 2164: {'lr': 3.6e-05, 'samples': 69248, 'steps': 135, 'loss/train': 6.273473262786865} -09/20/2021 14:57:20 - INFO - __main__ - Step 2165: {'lr': 3.6e-05, 'samples': 69280, 'steps': 135, 'loss/train': 6.219895362854004} -09/20/2021 14:57:21 - INFO - __main__ - Step 2166: {'lr': 3.6e-05, 'samples': 69312, 'steps': 135, 'loss/train': 5.992303848266602} -09/20/2021 14:57:22 - INFO - __main__ - Step 2167: {'lr': 3.6e-05, 'samples': 69344, 'steps': 135, 'loss/train': 5.9493184089660645} -09/20/2021 14:57:22 - INFO - __main__ - Step 2168: {'lr': 3.6e-05, 'samples': 69376, 'steps': 135, 'loss/train': 8.004152297973633} -09/20/2021 14:57:23 - INFO - __main__ - Step 2169: {'lr': 3.6e-05, 'samples': 69408, 'steps': 135, 'loss/train': 5.574527263641357} -09/20/2021 14:57:24 - INFO - __main__ - Step 2170: {'lr': 3.6e-05, 'samples': 69440, 'steps': 135, 'loss/train': 6.748113632202148} -09/20/2021 14:57:25 - INFO - __main__ - Step 2171: {'lr': 3.6e-05, 'samples': 69472, 'steps': 135, 'loss/train': 6.604585647583008} -09/20/2021 14:57:25 - INFO - __main__ - Step 2172: {'lr': 3.6e-05, 'samples': 69504, 'steps': 135, 'loss/train': 6.781185626983643} -09/20/2021 14:57:26 - INFO - __main__ - Step 2173: {'lr': 3.6e-05, 'samples': 69536, 'steps': 135, 'loss/train': 7.016073703765869} -09/20/2021 14:57:27 - INFO - __main__ - Step 2174: {'lr': 3.6e-05, 'samples': 69568, 'steps': 135, 'loss/train': 6.1478166580200195} -09/20/2021 14:57:28 - INFO - __main__ - Step 2175: {'lr': 3.6e-05, 'samples': 69600, 'steps': 135, 'loss/train': 7.510829925537109} -09/20/2021 14:57:28 - INFO - __main__ - Step 2176: {'lr': 3.6e-05, 'samples': 69632, 'steps': 135, 'loss/train': 5.944479465484619} -09/20/2021 14:57:29 - INFO - __main__ - Step 2177: {'lr': 3.626666666666667e-05, 'samples': 69664, 'steps': 136, 'loss/train': 6.989692211151123} -09/20/2021 14:57:30 - INFO - __main__ - Step 2178: {'lr': 3.626666666666667e-05, 'samples': 69696, 'steps': 136, 'loss/train': 5.310296058654785} -09/20/2021 14:57:31 - INFO - __main__ - Step 2179: {'lr': 3.626666666666667e-05, 'samples': 69728, 'steps': 136, 'loss/train': 4.774595737457275} -09/20/2021 14:57:31 - INFO - __main__ - Step 2180: {'lr': 3.626666666666667e-05, 'samples': 69760, 'steps': 136, 'loss/train': 5.011234760284424} -09/20/2021 14:57:32 - INFO - __main__ - Step 2181: {'lr': 3.626666666666667e-05, 'samples': 69792, 'steps': 136, 'loss/train': 5.839911460876465} -09/20/2021 14:57:33 - INFO - __main__ - Step 2182: {'lr': 3.626666666666667e-05, 'samples': 69824, 'steps': 136, 'loss/train': 6.49127721786499} -09/20/2021 14:57:34 - INFO - __main__ - Step 2183: {'lr': 3.626666666666667e-05, 'samples': 69856, 'steps': 136, 'loss/train': 5.348516941070557} -09/20/2021 14:57:35 - INFO - __main__ - Step 2184: {'lr': 3.626666666666667e-05, 'samples': 69888, 'steps': 136, 'loss/train': 5.906205177307129} -09/20/2021 14:57:36 - INFO - __main__ - Step 2185: {'lr': 3.626666666666667e-05, 'samples': 69920, 'steps': 136, 'loss/train': 6.446519374847412} -09/20/2021 14:57:37 - INFO - __main__ - Step 2186: {'lr': 3.626666666666667e-05, 'samples': 69952, 'steps': 136, 'loss/train': 5.620018482208252} -09/20/2021 14:57:37 - INFO - __main__ - Step 2187: {'lr': 3.626666666666667e-05, 'samples': 69984, 'steps': 136, 'loss/train': 6.506559371948242} -09/20/2021 14:57:38 - INFO - __main__ - Step 2188: {'lr': 3.626666666666667e-05, 'samples': 70016, 'steps': 136, 'loss/train': 6.212006092071533} -09/20/2021 14:57:39 - INFO - __main__ - Step 2189: {'lr': 3.626666666666667e-05, 'samples': 70048, 'steps': 136, 'loss/train': 6.486134052276611} -09/20/2021 14:57:40 - INFO - __main__ - Step 2190: {'lr': 3.626666666666667e-05, 'samples': 70080, 'steps': 136, 'loss/train': 6.15611457824707} -09/20/2021 14:57:40 - INFO - __main__ - Step 2191: {'lr': 3.626666666666667e-05, 'samples': 70112, 'steps': 136, 'loss/train': 6.863663196563721} -09/20/2021 14:57:41 - INFO - __main__ - Step 2192: {'lr': 3.626666666666667e-05, 'samples': 70144, 'steps': 136, 'loss/train': 6.679437160491943} -09/20/2021 14:57:42 - INFO - __main__ - Step 2193: {'lr': 3.653333333333334e-05, 'samples': 70176, 'steps': 137, 'loss/train': 5.006667137145996} -09/20/2021 14:57:43 - INFO - __main__ - Step 2194: {'lr': 3.653333333333334e-05, 'samples': 70208, 'steps': 137, 'loss/train': 6.5013251304626465} -09/20/2021 14:57:44 - INFO - __main__ - Step 2195: {'lr': 3.653333333333334e-05, 'samples': 70240, 'steps': 137, 'loss/train': 6.123168468475342} -09/20/2021 14:57:44 - INFO - __main__ - Step 2196: {'lr': 3.653333333333334e-05, 'samples': 70272, 'steps': 137, 'loss/train': 6.687150001525879} -09/20/2021 14:57:45 - INFO - __main__ - Step 2197: {'lr': 3.653333333333334e-05, 'samples': 70304, 'steps': 137, 'loss/train': 6.642352104187012} -09/20/2021 14:57:46 - INFO - __main__ - Step 2198: {'lr': 3.653333333333334e-05, 'samples': 70336, 'steps': 137, 'loss/train': 6.787682056427002} -09/20/2021 14:57:47 - INFO - __main__ - Step 2199: {'lr': 3.653333333333334e-05, 'samples': 70368, 'steps': 137, 'loss/train': 5.7800421714782715} -09/20/2021 14:57:47 - INFO - __main__ - Step 2200: {'lr': 3.653333333333334e-05, 'samples': 70400, 'steps': 137, 'loss/train': 6.375832557678223} -09/20/2021 14:57:48 - INFO - __main__ - Step 2201: {'lr': 3.653333333333334e-05, 'samples': 70432, 'steps': 137, 'loss/train': 6.5953264236450195} -09/20/2021 14:57:49 - INFO - __main__ - Step 2202: {'lr': 3.653333333333334e-05, 'samples': 70464, 'steps': 137, 'loss/train': 6.4138264656066895} -09/20/2021 14:57:50 - INFO - __main__ - Step 2203: {'lr': 3.653333333333334e-05, 'samples': 70496, 'steps': 137, 'loss/train': 5.739989757537842} -09/20/2021 14:57:50 - INFO - __main__ - Step 2204: {'lr': 3.653333333333334e-05, 'samples': 70528, 'steps': 137, 'loss/train': 6.185153007507324} -09/20/2021 14:57:51 - INFO - __main__ - Step 2205: {'lr': 3.653333333333334e-05, 'samples': 70560, 'steps': 137, 'loss/train': 6.79274845123291} -09/20/2021 14:57:52 - INFO - __main__ - Step 2206: {'lr': 3.653333333333334e-05, 'samples': 70592, 'steps': 137, 'loss/train': 6.721734046936035} -09/20/2021 14:57:53 - INFO - __main__ - Step 2207: {'lr': 3.653333333333334e-05, 'samples': 70624, 'steps': 137, 'loss/train': 6.383624076843262} -09/20/2021 14:57:53 - INFO - __main__ - Step 2208: {'lr': 3.653333333333334e-05, 'samples': 70656, 'steps': 137, 'loss/train': 6.53190279006958} -09/20/2021 14:57:54 - INFO - __main__ - Step 2209: {'lr': 3.68e-05, 'samples': 70688, 'steps': 138, 'loss/train': 8.160554885864258} -09/20/2021 14:57:55 - INFO - __main__ - Step 2210: {'lr': 3.68e-05, 'samples': 70720, 'steps': 138, 'loss/train': 6.780449390411377} -09/20/2021 14:57:56 - INFO - __main__ - Step 2211: {'lr': 3.68e-05, 'samples': 70752, 'steps': 138, 'loss/train': 5.746101379394531} -09/20/2021 14:57:56 - INFO - __main__ - Step 2212: {'lr': 3.68e-05, 'samples': 70784, 'steps': 138, 'loss/train': 6.318554401397705} -09/20/2021 14:57:57 - INFO - __main__ - Step 2213: {'lr': 3.68e-05, 'samples': 70816, 'steps': 138, 'loss/train': 6.8067708015441895} -09/20/2021 14:57:58 - INFO - __main__ - Step 2214: {'lr': 3.68e-05, 'samples': 70848, 'steps': 138, 'loss/train': 6.283014297485352} -09/20/2021 14:57:59 - INFO - __main__ - Step 2215: {'lr': 3.68e-05, 'samples': 70880, 'steps': 138, 'loss/train': 6.45927095413208} -09/20/2021 14:58:01 - INFO - __main__ - Step 2216: {'lr': 3.68e-05, 'samples': 70912, 'steps': 138, 'loss/train': 6.265902996063232} -09/20/2021 14:58:02 - INFO - __main__ - Step 2217: {'lr': 3.68e-05, 'samples': 70944, 'steps': 138, 'loss/train': 5.367911338806152} -09/20/2021 14:58:02 - INFO - __main__ - Step 2218: {'lr': 3.68e-05, 'samples': 70976, 'steps': 138, 'loss/train': 6.58816385269165} -09/20/2021 14:58:03 - INFO - __main__ - Step 2219: {'lr': 3.68e-05, 'samples': 71008, 'steps': 138, 'loss/train': 6.983344554901123} -09/20/2021 14:58:04 - INFO - __main__ - Step 2220: {'lr': 3.68e-05, 'samples': 71040, 'steps': 138, 'loss/train': 6.085146903991699} -09/20/2021 14:58:05 - INFO - __main__ - Step 2221: {'lr': 3.68e-05, 'samples': 71072, 'steps': 138, 'loss/train': 5.640705585479736} -09/20/2021 14:58:05 - INFO - __main__ - Step 2222: {'lr': 3.68e-05, 'samples': 71104, 'steps': 138, 'loss/train': 6.489269733428955} -09/20/2021 14:58:06 - INFO - __main__ - Step 2223: {'lr': 3.68e-05, 'samples': 71136, 'steps': 138, 'loss/train': 5.848585605621338} -09/20/2021 14:58:07 - INFO - __main__ - Step 2224: {'lr': 3.68e-05, 'samples': 71168, 'steps': 138, 'loss/train': 7.808628082275391} -09/20/2021 14:58:08 - INFO - __main__ - Step 2225: {'lr': 3.706666666666667e-05, 'samples': 71200, 'steps': 139, 'loss/train': 6.030270099639893} -09/20/2021 14:58:09 - INFO - __main__ - Step 2226: {'lr': 3.706666666666667e-05, 'samples': 71232, 'steps': 139, 'loss/train': 6.110476970672607} -09/20/2021 14:58:09 - INFO - __main__ - Step 2227: {'lr': 3.706666666666667e-05, 'samples': 71264, 'steps': 139, 'loss/train': 6.037475109100342} -09/20/2021 14:58:10 - INFO - __main__ - Step 2228: {'lr': 3.706666666666667e-05, 'samples': 71296, 'steps': 139, 'loss/train': 5.998317718505859} -09/20/2021 14:58:11 - INFO - __main__ - Step 2229: {'lr': 3.706666666666667e-05, 'samples': 71328, 'steps': 139, 'loss/train': 6.013703346252441} -09/20/2021 14:58:12 - INFO - __main__ - Step 2230: {'lr': 3.706666666666667e-05, 'samples': 71360, 'steps': 139, 'loss/train': 6.175745964050293} -09/20/2021 14:58:12 - INFO - __main__ - Step 2231: {'lr': 3.706666666666667e-05, 'samples': 71392, 'steps': 139, 'loss/train': 6.142911911010742} -09/20/2021 14:58:13 - INFO - __main__ - Step 2232: {'lr': 3.706666666666667e-05, 'samples': 71424, 'steps': 139, 'loss/train': 6.176095485687256} -09/20/2021 14:58:14 - INFO - __main__ - Step 2233: {'lr': 3.706666666666667e-05, 'samples': 71456, 'steps': 139, 'loss/train': 6.491353988647461} -09/20/2021 14:58:15 - INFO - __main__ - Step 2234: {'lr': 3.706666666666667e-05, 'samples': 71488, 'steps': 139, 'loss/train': 6.441026210784912} -09/20/2021 14:58:15 - INFO - __main__ - Step 2235: {'lr': 3.706666666666667e-05, 'samples': 71520, 'steps': 139, 'loss/train': 6.4460768699646} -09/20/2021 14:58:16 - INFO - __main__ - Step 2236: {'lr': 3.706666666666667e-05, 'samples': 71552, 'steps': 139, 'loss/train': 6.508646488189697} -09/20/2021 14:58:17 - INFO - __main__ - Step 2237: {'lr': 3.706666666666667e-05, 'samples': 71584, 'steps': 139, 'loss/train': 6.806925296783447} -09/20/2021 14:58:18 - INFO - __main__ - Step 2238: {'lr': 3.706666666666667e-05, 'samples': 71616, 'steps': 139, 'loss/train': 6.058590412139893} -09/20/2021 14:58:18 - INFO - __main__ - Step 2239: {'lr': 3.706666666666667e-05, 'samples': 71648, 'steps': 139, 'loss/train': 6.781269550323486} -09/20/2021 14:58:19 - INFO - __main__ - Step 2240: {'lr': 3.706666666666667e-05, 'samples': 71680, 'steps': 139, 'loss/train': 5.895963191986084} -09/20/2021 14:58:20 - INFO - __main__ - Step 2241: {'lr': 3.733333333333334e-05, 'samples': 71712, 'steps': 140, 'loss/train': 6.016989707946777} -09/20/2021 14:58:21 - INFO - __main__ - Step 2242: {'lr': 3.733333333333334e-05, 'samples': 71744, 'steps': 140, 'loss/train': 5.751189231872559} -09/20/2021 14:58:21 - INFO - __main__ - Step 2243: {'lr': 3.733333333333334e-05, 'samples': 71776, 'steps': 140, 'loss/train': 5.934811592102051} -09/20/2021 14:58:22 - INFO - __main__ - Step 2244: {'lr': 3.733333333333334e-05, 'samples': 71808, 'steps': 140, 'loss/train': 5.863578796386719} -09/20/2021 14:58:23 - INFO - __main__ - Step 2245: {'lr': 3.733333333333334e-05, 'samples': 71840, 'steps': 140, 'loss/train': 5.23285436630249} -09/20/2021 14:58:24 - INFO - __main__ - Step 2246: {'lr': 3.733333333333334e-05, 'samples': 71872, 'steps': 140, 'loss/train': 5.896046161651611} -09/20/2021 14:58:24 - INFO - __main__ - Step 2247: {'lr': 3.733333333333334e-05, 'samples': 71904, 'steps': 140, 'loss/train': 6.542251110076904} -09/20/2021 14:58:25 - INFO - __main__ - Step 2248: {'lr': 3.733333333333334e-05, 'samples': 71936, 'steps': 140, 'loss/train': 6.101861476898193} -09/20/2021 14:58:26 - INFO - __main__ - Step 2249: {'lr': 3.733333333333334e-05, 'samples': 71968, 'steps': 140, 'loss/train': 6.06851863861084} -09/20/2021 14:58:27 - INFO - __main__ - Step 2250: {'lr': 3.733333333333334e-05, 'samples': 72000, 'steps': 140, 'loss/train': 6.749871253967285} -09/20/2021 14:58:27 - INFO - __main__ - Step 2251: {'lr': 3.733333333333334e-05, 'samples': 72032, 'steps': 140, 'loss/train': 5.918732643127441} -09/20/2021 14:58:29 - INFO - __main__ - Step 2252: {'lr': 3.733333333333334e-05, 'samples': 72064, 'steps': 140, 'loss/train': 5.653304100036621} -09/20/2021 14:58:30 - INFO - __main__ - Step 2253: {'lr': 3.733333333333334e-05, 'samples': 72096, 'steps': 140, 'loss/train': 4.8899712562561035} -09/20/2021 14:58:30 - INFO - __main__ - Step 2254: {'lr': 3.733333333333334e-05, 'samples': 72128, 'steps': 140, 'loss/train': 6.214449882507324} -09/20/2021 14:58:31 - INFO - __main__ - Step 2255: {'lr': 3.733333333333334e-05, 'samples': 72160, 'steps': 140, 'loss/train': 6.020140647888184} -09/20/2021 14:58:32 - INFO - __main__ - Step 2256: {'lr': 3.733333333333334e-05, 'samples': 72192, 'steps': 140, 'loss/train': 6.1280317306518555} -09/20/2021 14:58:33 - INFO - __main__ - Step 2257: {'lr': 3.76e-05, 'samples': 72224, 'steps': 141, 'loss/train': 4.8492512702941895} -09/20/2021 14:58:34 - INFO - __main__ - Step 2258: {'lr': 3.76e-05, 'samples': 72256, 'steps': 141, 'loss/train': 5.685758113861084} -09/20/2021 14:58:34 - INFO - __main__ - Step 2259: {'lr': 3.76e-05, 'samples': 72288, 'steps': 141, 'loss/train': 5.939899921417236} -09/20/2021 14:58:35 - INFO - __main__ - Step 2260: {'lr': 3.76e-05, 'samples': 72320, 'steps': 141, 'loss/train': 6.245780944824219} -09/20/2021 14:58:36 - INFO - __main__ - Step 2261: {'lr': 3.76e-05, 'samples': 72352, 'steps': 141, 'loss/train': 6.765624046325684} -09/20/2021 14:58:37 - INFO - __main__ - Step 2262: {'lr': 3.76e-05, 'samples': 72384, 'steps': 141, 'loss/train': 5.836331844329834} -09/20/2021 14:58:37 - INFO - __main__ - Step 2263: {'lr': 3.76e-05, 'samples': 72416, 'steps': 141, 'loss/train': 5.959226131439209} -09/20/2021 14:58:38 - INFO - __main__ - Step 2264: {'lr': 3.76e-05, 'samples': 72448, 'steps': 141, 'loss/train': 7.482056140899658} -09/20/2021 14:58:39 - INFO - __main__ - Step 2265: {'lr': 3.76e-05, 'samples': 72480, 'steps': 141, 'loss/train': 6.200267791748047} -09/20/2021 14:58:40 - INFO - __main__ - Step 2266: {'lr': 3.76e-05, 'samples': 72512, 'steps': 141, 'loss/train': 6.0638041496276855} -09/20/2021 14:58:40 - INFO - __main__ - Step 2267: {'lr': 3.76e-05, 'samples': 72544, 'steps': 141, 'loss/train': 7.005498886108398} -09/20/2021 14:58:41 - INFO - __main__ - Step 2268: {'lr': 3.76e-05, 'samples': 72576, 'steps': 141, 'loss/train': 6.064748764038086} -09/20/2021 14:58:42 - INFO - __main__ - Step 2269: {'lr': 3.76e-05, 'samples': 72608, 'steps': 141, 'loss/train': 7.264112949371338} -09/20/2021 14:58:43 - INFO - __main__ - Step 2270: {'lr': 3.76e-05, 'samples': 72640, 'steps': 141, 'loss/train': 6.1293044090271} -09/20/2021 14:58:43 - INFO - __main__ - Step 2271: {'lr': 3.76e-05, 'samples': 72672, 'steps': 141, 'loss/train': 5.592441558837891} -09/20/2021 14:58:44 - INFO - __main__ - Step 2272: {'lr': 3.76e-05, 'samples': 72704, 'steps': 141, 'loss/train': 6.494841575622559} -09/20/2021 14:58:45 - INFO - __main__ - Step 2273: {'lr': 3.786666666666667e-05, 'samples': 72736, 'steps': 142, 'loss/train': 6.4694905281066895} -09/20/2021 14:58:46 - INFO - __main__ - Step 2274: {'lr': 3.786666666666667e-05, 'samples': 72768, 'steps': 142, 'loss/train': 5.371041297912598} -09/20/2021 14:58:46 - INFO - __main__ - Step 2275: {'lr': 3.786666666666667e-05, 'samples': 72800, 'steps': 142, 'loss/train': 6.3549323081970215} -09/20/2021 14:58:47 - INFO - __main__ - Step 2276: {'lr': 3.786666666666667e-05, 'samples': 72832, 'steps': 142, 'loss/train': 6.276108264923096} -09/20/2021 14:58:48 - INFO - __main__ - Step 2277: {'lr': 3.786666666666667e-05, 'samples': 72864, 'steps': 142, 'loss/train': 6.481751918792725} -09/20/2021 14:58:49 - INFO - __main__ - Step 2278: {'lr': 3.786666666666667e-05, 'samples': 72896, 'steps': 142, 'loss/train': 7.379664897918701} -09/20/2021 14:58:49 - INFO - __main__ - Step 2279: {'lr': 3.786666666666667e-05, 'samples': 72928, 'steps': 142, 'loss/train': 3.9519834518432617} -09/20/2021 14:58:50 - INFO - __main__ - Step 2280: {'lr': 3.786666666666667e-05, 'samples': 72960, 'steps': 142, 'loss/train': 6.060527324676514} -09/20/2021 14:58:51 - INFO - __main__ - Step 2281: {'lr': 3.786666666666667e-05, 'samples': 72992, 'steps': 142, 'loss/train': 6.2674150466918945} -09/20/2021 14:58:52 - INFO - __main__ - Step 2282: {'lr': 3.786666666666667e-05, 'samples': 73024, 'steps': 142, 'loss/train': 5.9174604415893555} -09/20/2021 14:58:53 - INFO - __main__ - Step 2283: {'lr': 3.786666666666667e-05, 'samples': 73056, 'steps': 142, 'loss/train': 5.747354984283447} -09/20/2021 14:58:54 - INFO - __main__ - Step 2284: {'lr': 3.786666666666667e-05, 'samples': 73088, 'steps': 142, 'loss/train': 5.6152873039245605} -09/20/2021 14:58:55 - INFO - __main__ - Step 2285: {'lr': 3.786666666666667e-05, 'samples': 73120, 'steps': 142, 'loss/train': 7.144567966461182} -09/20/2021 14:58:55 - INFO - __main__ - Step 2286: {'lr': 3.786666666666667e-05, 'samples': 73152, 'steps': 142, 'loss/train': 4.432087421417236} -09/20/2021 14:58:56 - INFO - __main__ - Step 2287: {'lr': 3.786666666666667e-05, 'samples': 73184, 'steps': 142, 'loss/train': 6.4796648025512695} -09/20/2021 14:58:57 - INFO - __main__ - Step 2288: {'lr': 3.786666666666667e-05, 'samples': 73216, 'steps': 142, 'loss/train': 5.872170925140381} -09/20/2021 14:58:58 - INFO - __main__ - Step 2289: {'lr': 3.8133333333333336e-05, 'samples': 73248, 'steps': 143, 'loss/train': 6.367855548858643} -09/20/2021 14:58:58 - INFO - __main__ - Step 2290: {'lr': 3.8133333333333336e-05, 'samples': 73280, 'steps': 143, 'loss/train': 6.4076104164123535} -09/20/2021 14:58:59 - INFO - __main__ - Step 2291: {'lr': 3.8133333333333336e-05, 'samples': 73312, 'steps': 143, 'loss/train': 5.561469554901123} -09/20/2021 14:59:00 - INFO - __main__ - Step 2292: {'lr': 3.8133333333333336e-05, 'samples': 73344, 'steps': 143, 'loss/train': 6.165071964263916} -09/20/2021 14:59:01 - INFO - __main__ - Step 2293: {'lr': 3.8133333333333336e-05, 'samples': 73376, 'steps': 143, 'loss/train': 5.960091590881348} -09/20/2021 14:59:01 - INFO - __main__ - Step 2294: {'lr': 3.8133333333333336e-05, 'samples': 73408, 'steps': 143, 'loss/train': 6.422591686248779} -09/20/2021 14:59:02 - INFO - __main__ - Step 2295: {'lr': 3.8133333333333336e-05, 'samples': 73440, 'steps': 143, 'loss/train': 5.080967426300049} -09/20/2021 14:59:03 - INFO - __main__ - Step 2296: {'lr': 3.8133333333333336e-05, 'samples': 73472, 'steps': 143, 'loss/train': 6.713353633880615} -09/20/2021 14:59:04 - INFO - __main__ - Step 2297: {'lr': 3.8133333333333336e-05, 'samples': 73504, 'steps': 143, 'loss/train': 4.197596073150635} -09/20/2021 14:59:04 - INFO - __main__ - Step 2298: {'lr': 3.8133333333333336e-05, 'samples': 73536, 'steps': 143, 'loss/train': 4.316659450531006} -09/20/2021 14:59:05 - INFO - __main__ - Step 2299: {'lr': 3.8133333333333336e-05, 'samples': 73568, 'steps': 143, 'loss/train': 4.309038162231445} -09/20/2021 14:59:06 - INFO - __main__ - Step 2300: {'lr': 3.8133333333333336e-05, 'samples': 73600, 'steps': 143, 'loss/train': 4.811618328094482} -09/20/2021 14:59:07 - INFO - __main__ - Step 2301: {'lr': 3.8133333333333336e-05, 'samples': 73632, 'steps': 143, 'loss/train': 4.756943702697754} -09/20/2021 14:59:07 - INFO - __main__ - Step 2302: {'lr': 3.8133333333333336e-05, 'samples': 73664, 'steps': 143, 'loss/train': 4.6295881271362305} -09/20/2021 14:59:08 - INFO - __main__ - Step 2303: {'lr': 3.8133333333333336e-05, 'samples': 73696, 'steps': 143, 'loss/train': 5.544652462005615} -09/20/2021 14:59:09 - INFO - __main__ - Step 2304: {'lr': 3.8133333333333336e-05, 'samples': 73728, 'steps': 143, 'loss/train': 4.642934799194336} -09/20/2021 14:59:10 - INFO - __main__ - Step 2305: {'lr': 3.8400000000000005e-05, 'samples': 73760, 'steps': 144, 'loss/train': 4.549211025238037} -09/20/2021 14:59:11 - INFO - __main__ - Step 2306: {'lr': 3.8400000000000005e-05, 'samples': 73792, 'steps': 144, 'loss/train': 6.275665283203125} -09/20/2021 14:59:11 - INFO - __main__ - Step 2307: {'lr': 3.8400000000000005e-05, 'samples': 73824, 'steps': 144, 'loss/train': 5.8601837158203125} -09/20/2021 14:59:12 - INFO - __main__ - Step 2308: {'lr': 3.8400000000000005e-05, 'samples': 73856, 'steps': 144, 'loss/train': 6.309483051300049} -09/20/2021 14:59:13 - INFO - __main__ - Step 2309: {'lr': 3.8400000000000005e-05, 'samples': 73888, 'steps': 144, 'loss/train': 5.405704975128174} -09/20/2021 14:59:14 - INFO - __main__ - Step 2310: {'lr': 3.8400000000000005e-05, 'samples': 73920, 'steps': 144, 'loss/train': 6.119488716125488} -09/20/2021 14:59:14 - INFO - __main__ - Step 2311: {'lr': 3.8400000000000005e-05, 'samples': 73952, 'steps': 144, 'loss/train': 6.170097827911377} -09/20/2021 14:59:15 - INFO - __main__ - Step 2312: {'lr': 3.8400000000000005e-05, 'samples': 73984, 'steps': 144, 'loss/train': 6.181628227233887} -09/20/2021 14:59:16 - INFO - __main__ - Step 2313: {'lr': 3.8400000000000005e-05, 'samples': 74016, 'steps': 144, 'loss/train': 7.345510005950928} -09/20/2021 14:59:17 - INFO - __main__ - Step 2314: {'lr': 3.8400000000000005e-05, 'samples': 74048, 'steps': 144, 'loss/train': 7.277095317840576} -09/20/2021 14:59:17 - INFO - __main__ - Step 2315: {'lr': 3.8400000000000005e-05, 'samples': 74080, 'steps': 144, 'loss/train': 6.2057881355285645} -09/20/2021 14:59:19 - INFO - __main__ - Step 2316: {'lr': 3.8400000000000005e-05, 'samples': 74112, 'steps': 144, 'loss/train': 6.6139302253723145} -09/20/2021 14:59:20 - INFO - __main__ - Step 2317: {'lr': 3.8400000000000005e-05, 'samples': 74144, 'steps': 144, 'loss/train': 5.889211177825928} -09/20/2021 14:59:20 - INFO - __main__ - Step 2318: {'lr': 3.8400000000000005e-05, 'samples': 74176, 'steps': 144, 'loss/train': 7.376870155334473} -09/20/2021 14:59:21 - INFO - __main__ - Step 2319: {'lr': 3.8400000000000005e-05, 'samples': 74208, 'steps': 144, 'loss/train': 6.453205585479736} -09/20/2021 14:59:22 - INFO - __main__ - Step 2320: {'lr': 3.8400000000000005e-05, 'samples': 74240, 'steps': 144, 'loss/train': 6.1376190185546875} -09/20/2021 14:59:23 - INFO - __main__ - Step 2321: {'lr': 3.866666666666667e-05, 'samples': 74272, 'steps': 145, 'loss/train': 6.170451641082764} -09/20/2021 14:59:24 - INFO - __main__ - Step 2322: {'lr': 3.866666666666667e-05, 'samples': 74304, 'steps': 145, 'loss/train': 6.312864780426025} -09/20/2021 14:59:24 - INFO - __main__ - Step 2323: {'lr': 3.866666666666667e-05, 'samples': 74336, 'steps': 145, 'loss/train': 6.97926664352417} -09/20/2021 14:59:25 - INFO - __main__ - Step 2324: {'lr': 3.866666666666667e-05, 'samples': 74368, 'steps': 145, 'loss/train': 7.221479415893555} -09/20/2021 14:59:26 - INFO - __main__ - Step 2325: {'lr': 3.866666666666667e-05, 'samples': 74400, 'steps': 145, 'loss/train': 7.13090705871582} -09/20/2021 14:59:27 - INFO - __main__ - Step 2326: {'lr': 3.866666666666667e-05, 'samples': 74432, 'steps': 145, 'loss/train': 7.4053568840026855} -09/20/2021 14:59:27 - INFO - __main__ - Step 2327: {'lr': 3.866666666666667e-05, 'samples': 74464, 'steps': 145, 'loss/train': 6.30894660949707} -09/20/2021 14:59:28 - INFO - __main__ - Step 2328: {'lr': 3.866666666666667e-05, 'samples': 74496, 'steps': 145, 'loss/train': 7.189276695251465} -09/20/2021 14:59:29 - INFO - __main__ - Step 2329: {'lr': 3.866666666666667e-05, 'samples': 74528, 'steps': 145, 'loss/train': 7.461504936218262} -09/20/2021 14:59:30 - INFO - __main__ - Step 2330: {'lr': 3.866666666666667e-05, 'samples': 74560, 'steps': 145, 'loss/train': 7.252240180969238} -09/20/2021 14:59:30 - INFO - __main__ - Step 2331: {'lr': 3.866666666666667e-05, 'samples': 74592, 'steps': 145, 'loss/train': 7.220885276794434} -09/20/2021 14:59:31 - INFO - __main__ - Step 2332: {'lr': 3.866666666666667e-05, 'samples': 74624, 'steps': 145, 'loss/train': 6.5380754470825195} -09/20/2021 14:59:32 - INFO - __main__ - Step 2333: {'lr': 3.866666666666667e-05, 'samples': 74656, 'steps': 145, 'loss/train': 7.0203857421875} -09/20/2021 14:59:33 - INFO - __main__ - Step 2334: {'lr': 3.866666666666667e-05, 'samples': 74688, 'steps': 145, 'loss/train': 6.202538967132568} -09/20/2021 14:59:33 - INFO - __main__ - Step 2335: {'lr': 3.866666666666667e-05, 'samples': 74720, 'steps': 145, 'loss/train': 6.090586185455322} -09/20/2021 14:59:34 - INFO - __main__ - Step 2336: {'lr': 3.866666666666667e-05, 'samples': 74752, 'steps': 145, 'loss/train': 8.864198684692383} -09/20/2021 14:59:35 - INFO - __main__ - Step 2337: {'lr': 3.8933333333333336e-05, 'samples': 74784, 'steps': 146, 'loss/train': 6.380397796630859} -09/20/2021 14:59:36 - INFO - __main__ - Step 2338: {'lr': 3.8933333333333336e-05, 'samples': 74816, 'steps': 146, 'loss/train': 6.112030029296875} -09/20/2021 14:59:36 - INFO - __main__ - Step 2339: {'lr': 3.8933333333333336e-05, 'samples': 74848, 'steps': 146, 'loss/train': 6.103203296661377} -09/20/2021 14:59:37 - INFO - __main__ - Step 2340: {'lr': 3.8933333333333336e-05, 'samples': 74880, 'steps': 146, 'loss/train': 6.518324375152588} -09/20/2021 14:59:38 - INFO - __main__ - Step 2341: {'lr': 3.8933333333333336e-05, 'samples': 74912, 'steps': 146, 'loss/train': 5.946488380432129} -09/20/2021 14:59:39 - INFO - __main__ - Step 2342: {'lr': 3.8933333333333336e-05, 'samples': 74944, 'steps': 146, 'loss/train': 6.4062066078186035} -09/20/2021 14:59:39 - INFO - __main__ - Step 2343: {'lr': 3.8933333333333336e-05, 'samples': 74976, 'steps': 146, 'loss/train': 4.901589393615723} -09/20/2021 14:59:40 - INFO - __main__ - Step 2344: {'lr': 3.8933333333333336e-05, 'samples': 75008, 'steps': 146, 'loss/train': 5.25922155380249} -09/20/2021 14:59:41 - INFO - __main__ - Step 2345: {'lr': 3.8933333333333336e-05, 'samples': 75040, 'steps': 146, 'loss/train': 6.469894886016846} -09/20/2021 14:59:42 - INFO - __main__ - Step 2346: {'lr': 3.8933333333333336e-05, 'samples': 75072, 'steps': 146, 'loss/train': 6.014387607574463} -09/20/2021 14:59:42 - INFO - __main__ - Step 2347: {'lr': 3.8933333333333336e-05, 'samples': 75104, 'steps': 146, 'loss/train': 10.494729042053223} -09/20/2021 14:59:43 - INFO - __main__ - Step 2348: {'lr': 3.8933333333333336e-05, 'samples': 75136, 'steps': 146, 'loss/train': 5.588451862335205} -09/20/2021 14:59:44 - INFO - __main__ - Step 2349: {'lr': 3.8933333333333336e-05, 'samples': 75168, 'steps': 146, 'loss/train': 6.582430362701416} -09/20/2021 14:59:45 - INFO - __main__ - Step 2350: {'lr': 3.8933333333333336e-05, 'samples': 75200, 'steps': 146, 'loss/train': 5.381967544555664} -09/20/2021 14:59:45 - INFO - __main__ - Step 2351: {'lr': 3.8933333333333336e-05, 'samples': 75232, 'steps': 146, 'loss/train': 5.214654922485352} -09/20/2021 14:59:46 - INFO - __main__ - Step 2352: {'lr': 3.8933333333333336e-05, 'samples': 75264, 'steps': 146, 'loss/train': 6.394961357116699} -09/20/2021 14:59:48 - INFO - __main__ - Step 2353: {'lr': 3.9200000000000004e-05, 'samples': 75296, 'steps': 147, 'loss/train': 5.836625099182129} -09/20/2021 14:59:48 - INFO - __main__ - Step 2354: {'lr': 3.9200000000000004e-05, 'samples': 75328, 'steps': 147, 'loss/train': 6.433752536773682} -09/20/2021 14:59:49 - INFO - __main__ - Step 2355: {'lr': 3.9200000000000004e-05, 'samples': 75360, 'steps': 147, 'loss/train': 6.370136260986328} -09/20/2021 14:59:50 - INFO - __main__ - Step 2356: {'lr': 3.9200000000000004e-05, 'samples': 75392, 'steps': 147, 'loss/train': 6.908847332000732} -09/20/2021 14:59:51 - INFO - __main__ - Step 2357: {'lr': 3.9200000000000004e-05, 'samples': 75424, 'steps': 147, 'loss/train': 5.739133834838867} -09/20/2021 14:59:51 - INFO - __main__ - Step 2358: {'lr': 3.9200000000000004e-05, 'samples': 75456, 'steps': 147, 'loss/train': 6.987489700317383} -09/20/2021 14:59:52 - INFO - __main__ - Step 2359: {'lr': 3.9200000000000004e-05, 'samples': 75488, 'steps': 147, 'loss/train': 5.685873508453369} -09/20/2021 14:59:53 - INFO - __main__ - Step 2360: {'lr': 3.9200000000000004e-05, 'samples': 75520, 'steps': 147, 'loss/train': 3.8028321266174316} -09/20/2021 14:59:54 - INFO - __main__ - Step 2361: {'lr': 3.9200000000000004e-05, 'samples': 75552, 'steps': 147, 'loss/train': 6.2599029541015625} -09/20/2021 14:59:54 - INFO - __main__ - Step 2362: {'lr': 3.9200000000000004e-05, 'samples': 75584, 'steps': 147, 'loss/train': 6.978109836578369} -09/20/2021 14:59:55 - INFO - __main__ - Step 2363: {'lr': 3.9200000000000004e-05, 'samples': 75616, 'steps': 147, 'loss/train': 6.147963047027588} -09/20/2021 14:59:56 - INFO - __main__ - Step 2364: {'lr': 3.9200000000000004e-05, 'samples': 75648, 'steps': 147, 'loss/train': 5.630116939544678} -09/20/2021 14:59:57 - INFO - __main__ - Step 2365: {'lr': 3.9200000000000004e-05, 'samples': 75680, 'steps': 147, 'loss/train': 6.101633548736572} -09/20/2021 14:59:57 - INFO - __main__ - Step 2366: {'lr': 3.9200000000000004e-05, 'samples': 75712, 'steps': 147, 'loss/train': 6.2492241859436035} -09/20/2021 14:59:58 - INFO - __main__ - Step 2367: {'lr': 3.9200000000000004e-05, 'samples': 75744, 'steps': 147, 'loss/train': 6.21793794631958} -09/20/2021 14:59:59 - INFO - __main__ - Step 2368: {'lr': 3.9200000000000004e-05, 'samples': 75776, 'steps': 147, 'loss/train': 6.4107208251953125} -09/20/2021 15:00:00 - INFO - __main__ - Step 2369: {'lr': 3.9466666666666666e-05, 'samples': 75808, 'steps': 148, 'loss/train': 6.0345683097839355} -09/20/2021 15:00:01 - INFO - __main__ - Step 2370: {'lr': 3.9466666666666666e-05, 'samples': 75840, 'steps': 148, 'loss/train': 5.293837547302246} -09/20/2021 15:00:01 - INFO - __main__ - Step 2371: {'lr': 3.9466666666666666e-05, 'samples': 75872, 'steps': 148, 'loss/train': 5.710004806518555} -09/20/2021 15:00:02 - INFO - __main__ - Step 2372: {'lr': 3.9466666666666666e-05, 'samples': 75904, 'steps': 148, 'loss/train': 5.644325256347656} -09/20/2021 15:00:03 - INFO - __main__ - Step 2373: {'lr': 3.9466666666666666e-05, 'samples': 75936, 'steps': 148, 'loss/train': 6.193685531616211} -09/20/2021 15:00:04 - INFO - __main__ - Step 2374: {'lr': 3.9466666666666666e-05, 'samples': 75968, 'steps': 148, 'loss/train': 5.323239326477051} -09/20/2021 15:00:04 - INFO - __main__ - Step 2375: {'lr': 3.9466666666666666e-05, 'samples': 76000, 'steps': 148, 'loss/train': 6.246066093444824} -09/20/2021 15:00:05 - INFO - __main__ - Step 2376: {'lr': 3.9466666666666666e-05, 'samples': 76032, 'steps': 148, 'loss/train': 6.346191883087158} -09/20/2021 15:00:06 - INFO - __main__ - Step 2377: {'lr': 3.9466666666666666e-05, 'samples': 76064, 'steps': 148, 'loss/train': 5.429062366485596} -09/20/2021 15:00:07 - INFO - __main__ - Step 2378: {'lr': 3.9466666666666666e-05, 'samples': 76096, 'steps': 148, 'loss/train': 6.238955020904541} -09/20/2021 15:00:07 - INFO - __main__ - Step 2379: {'lr': 3.9466666666666666e-05, 'samples': 76128, 'steps': 148, 'loss/train': 5.318933486938477} -09/20/2021 15:00:08 - INFO - __main__ - Step 2380: {'lr': 3.9466666666666666e-05, 'samples': 76160, 'steps': 148, 'loss/train': 5.8634538650512695} -09/20/2021 15:00:09 - INFO - __main__ - Step 2381: {'lr': 3.9466666666666666e-05, 'samples': 76192, 'steps': 148, 'loss/train': 6.534151077270508} -09/20/2021 15:00:10 - INFO - __main__ - Step 2382: {'lr': 3.9466666666666666e-05, 'samples': 76224, 'steps': 148, 'loss/train': 5.3882856369018555} -09/20/2021 15:00:11 - INFO - __main__ - Step 2383: {'lr': 3.9466666666666666e-05, 'samples': 76256, 'steps': 148, 'loss/train': 6.61303186416626} -09/20/2021 15:00:12 - INFO - __main__ - Step 2384: {'lr': 3.9466666666666666e-05, 'samples': 76288, 'steps': 148, 'loss/train': 6.443053245544434} -09/20/2021 15:00:13 - INFO - __main__ - Step 2385: {'lr': 3.9733333333333335e-05, 'samples': 76320, 'steps': 149, 'loss/train': 7.1140899658203125} -09/20/2021 15:00:13 - INFO - __main__ - Step 2386: {'lr': 3.9733333333333335e-05, 'samples': 76352, 'steps': 149, 'loss/train': 7.989988327026367} -09/20/2021 15:00:14 - INFO - __main__ - Step 2387: {'lr': 3.9733333333333335e-05, 'samples': 76384, 'steps': 149, 'loss/train': 5.8625383377075195} -09/20/2021 15:00:15 - INFO - __main__ - Step 2388: {'lr': 3.9733333333333335e-05, 'samples': 76416, 'steps': 149, 'loss/train': 5.824028015136719} -09/20/2021 15:00:16 - INFO - __main__ - Step 2389: {'lr': 3.9733333333333335e-05, 'samples': 76448, 'steps': 149, 'loss/train': 6.3651628494262695} -09/20/2021 15:00:16 - INFO - __main__ - Step 2390: {'lr': 3.9733333333333335e-05, 'samples': 76480, 'steps': 149, 'loss/train': 5.203049182891846} -09/20/2021 15:00:17 - INFO - __main__ - Step 2391: {'lr': 3.9733333333333335e-05, 'samples': 76512, 'steps': 149, 'loss/train': 6.014912128448486} -09/20/2021 15:00:18 - INFO - __main__ - Step 2392: {'lr': 3.9733333333333335e-05, 'samples': 76544, 'steps': 149, 'loss/train': 6.159536838531494} -09/20/2021 15:00:19 - INFO - __main__ - Step 2393: {'lr': 3.9733333333333335e-05, 'samples': 76576, 'steps': 149, 'loss/train': 5.921067237854004} -09/20/2021 15:00:19 - INFO - __main__ - Step 2394: {'lr': 3.9733333333333335e-05, 'samples': 76608, 'steps': 149, 'loss/train': 5.8216657638549805} -09/20/2021 15:00:20 - INFO - __main__ - Step 2395: {'lr': 3.9733333333333335e-05, 'samples': 76640, 'steps': 149, 'loss/train': 6.579406261444092} -09/20/2021 15:00:21 - INFO - __main__ - Step 2396: {'lr': 3.9733333333333335e-05, 'samples': 76672, 'steps': 149, 'loss/train': 5.991772174835205} -09/20/2021 15:00:22 - INFO - __main__ - Step 2397: {'lr': 3.9733333333333335e-05, 'samples': 76704, 'steps': 149, 'loss/train': 5.8262810707092285} -09/20/2021 15:00:22 - INFO - __main__ - Step 2398: {'lr': 3.9733333333333335e-05, 'samples': 76736, 'steps': 149, 'loss/train': 5.794602394104004} -09/20/2021 15:00:23 - INFO - __main__ - Step 2399: {'lr': 3.9733333333333335e-05, 'samples': 76768, 'steps': 149, 'loss/train': 6.122905731201172} -09/20/2021 15:00:24 - INFO - __main__ - Step 2400: {'lr': 3.9733333333333335e-05, 'samples': 76800, 'steps': 149, 'loss/train': 5.921288013458252} -09/20/2021 15:00:25 - INFO - __main__ - Step 2401: {'lr': 4e-05, 'samples': 76832, 'steps': 150, 'loss/train': 5.039218902587891} -09/20/2021 15:00:26 - INFO - __main__ - Step 2402: {'lr': 4e-05, 'samples': 76864, 'steps': 150, 'loss/train': 5.408051490783691} -09/20/2021 15:00:26 - INFO - __main__ - Step 2403: {'lr': 4e-05, 'samples': 76896, 'steps': 150, 'loss/train': 5.699455738067627} -09/20/2021 15:00:27 - INFO - __main__ - Step 2404: {'lr': 4e-05, 'samples': 76928, 'steps': 150, 'loss/train': 6.602104663848877} -09/20/2021 15:00:28 - INFO - __main__ - Step 2405: {'lr': 4e-05, 'samples': 76960, 'steps': 150, 'loss/train': 5.136485576629639} -09/20/2021 15:00:29 - INFO - __main__ - Step 2406: {'lr': 4e-05, 'samples': 76992, 'steps': 150, 'loss/train': 5.105165481567383} -09/20/2021 15:00:29 - INFO - __main__ - Step 2407: {'lr': 4e-05, 'samples': 77024, 'steps': 150, 'loss/train': 5.055327892303467} -09/20/2021 15:00:30 - INFO - __main__ - Step 2408: {'lr': 4e-05, 'samples': 77056, 'steps': 150, 'loss/train': 5.091908931732178} -09/20/2021 15:00:31 - INFO - __main__ - Step 2409: {'lr': 4e-05, 'samples': 77088, 'steps': 150, 'loss/train': 5.0867919921875} -09/20/2021 15:00:32 - INFO - __main__ - Step 2410: {'lr': 4e-05, 'samples': 77120, 'steps': 150, 'loss/train': 5.932521820068359} -09/20/2021 15:00:32 - INFO - __main__ - Step 2411: {'lr': 4e-05, 'samples': 77152, 'steps': 150, 'loss/train': 6.9238715171813965} -09/20/2021 15:00:33 - INFO - __main__ - Step 2412: {'lr': 4e-05, 'samples': 77184, 'steps': 150, 'loss/train': 6.158914566040039} -09/20/2021 15:00:34 - INFO - __main__ - Step 2413: {'lr': 4e-05, 'samples': 77216, 'steps': 150, 'loss/train': 6.4466471672058105} -09/20/2021 15:00:35 - INFO - __main__ - Step 2414: {'lr': 4e-05, 'samples': 77248, 'steps': 150, 'loss/train': 7.361713409423828} -09/20/2021 15:00:35 - INFO - __main__ - Step 2415: {'lr': 4e-05, 'samples': 77280, 'steps': 150, 'loss/train': 4.450642108917236} -09/20/2021 15:00:36 - INFO - __main__ - Step 2416: {'lr': 4e-05, 'samples': 77312, 'steps': 150, 'loss/train': 5.7275543212890625} -09/20/2021 15:00:37 - INFO - __main__ - Step 2417: {'lr': 4.026666666666667e-05, 'samples': 77344, 'steps': 151, 'loss/train': 6.479875564575195} -09/20/2021 15:00:39 - INFO - __main__ - Step 2418: {'lr': 4.026666666666667e-05, 'samples': 77376, 'steps': 151, 'loss/train': 5.849270820617676} -09/20/2021 15:00:40 - INFO - __main__ - Step 2419: {'lr': 4.026666666666667e-05, 'samples': 77408, 'steps': 151, 'loss/train': 5.906253814697266} -09/20/2021 15:00:41 - INFO - __main__ - Step 2420: {'lr': 4.026666666666667e-05, 'samples': 77440, 'steps': 151, 'loss/train': 6.089856147766113} -09/20/2021 15:00:41 - INFO - __main__ - Step 2421: {'lr': 4.026666666666667e-05, 'samples': 77472, 'steps': 151, 'loss/train': 7.122966289520264} -09/20/2021 15:00:42 - INFO - __main__ - Step 2422: {'lr': 4.026666666666667e-05, 'samples': 77504, 'steps': 151, 'loss/train': 7.363900184631348} -09/20/2021 15:00:43 - INFO - __main__ - Step 2423: {'lr': 4.026666666666667e-05, 'samples': 77536, 'steps': 151, 'loss/train': 6.167317867279053} -09/20/2021 15:00:44 - INFO - __main__ - Step 2424: {'lr': 4.026666666666667e-05, 'samples': 77568, 'steps': 151, 'loss/train': 6.639521598815918} -09/20/2021 15:00:44 - INFO - __main__ - Step 2425: {'lr': 4.026666666666667e-05, 'samples': 77600, 'steps': 151, 'loss/train': 6.128981590270996} -09/20/2021 15:00:45 - INFO - __main__ - Step 2426: {'lr': 4.026666666666667e-05, 'samples': 77632, 'steps': 151, 'loss/train': 5.979608535766602} -09/20/2021 15:00:46 - INFO - __main__ - Step 2427: {'lr': 4.026666666666667e-05, 'samples': 77664, 'steps': 151, 'loss/train': 6.653136253356934} -09/20/2021 15:00:47 - INFO - __main__ - Step 2428: {'lr': 4.026666666666667e-05, 'samples': 77696, 'steps': 151, 'loss/train': 6.027210235595703} -09/20/2021 15:00:47 - INFO - __main__ - Step 2429: {'lr': 4.026666666666667e-05, 'samples': 77728, 'steps': 151, 'loss/train': 6.8543829917907715} -09/20/2021 15:00:48 - INFO - __main__ - Step 2430: {'lr': 4.026666666666667e-05, 'samples': 77760, 'steps': 151, 'loss/train': 6.435595989227295} -09/20/2021 15:00:49 - INFO - __main__ - Step 2431: {'lr': 4.026666666666667e-05, 'samples': 77792, 'steps': 151, 'loss/train': 5.943674564361572} -09/20/2021 15:00:50 - INFO - __main__ - Step 2432: {'lr': 4.026666666666667e-05, 'samples': 77824, 'steps': 151, 'loss/train': 7.10731315612793} -09/20/2021 15:00:51 - INFO - __main__ - Step 2433: {'lr': 4.0533333333333334e-05, 'samples': 77856, 'steps': 152, 'loss/train': 6.265143871307373} -09/20/2021 15:00:51 - INFO - __main__ - Step 2434: {'lr': 4.0533333333333334e-05, 'samples': 77888, 'steps': 152, 'loss/train': 5.455266952514648} -09/20/2021 15:00:52 - INFO - __main__ - Step 2435: {'lr': 4.0533333333333334e-05, 'samples': 77920, 'steps': 152, 'loss/train': 6.012631416320801} -09/20/2021 15:00:53 - INFO - __main__ - Step 2436: {'lr': 4.0533333333333334e-05, 'samples': 77952, 'steps': 152, 'loss/train': 6.772637844085693} -09/20/2021 15:00:54 - INFO - __main__ - Step 2437: {'lr': 4.0533333333333334e-05, 'samples': 77984, 'steps': 152, 'loss/train': 6.524227142333984} -09/20/2021 15:00:54 - INFO - __main__ - Step 2438: {'lr': 4.0533333333333334e-05, 'samples': 78016, 'steps': 152, 'loss/train': 6.129908561706543} -09/20/2021 15:00:55 - INFO - __main__ - Step 2439: {'lr': 4.0533333333333334e-05, 'samples': 78048, 'steps': 152, 'loss/train': 6.745294094085693} -09/20/2021 15:00:56 - INFO - __main__ - Step 2440: {'lr': 4.0533333333333334e-05, 'samples': 78080, 'steps': 152, 'loss/train': 5.982281684875488} -09/20/2021 15:00:57 - INFO - __main__ - Step 2441: {'lr': 4.0533333333333334e-05, 'samples': 78112, 'steps': 152, 'loss/train': 6.73214864730835} -09/20/2021 15:00:57 - INFO - __main__ - Step 2442: {'lr': 4.0533333333333334e-05, 'samples': 78144, 'steps': 152, 'loss/train': 6.607121467590332} -09/20/2021 15:00:58 - INFO - __main__ - Step 2443: {'lr': 4.0533333333333334e-05, 'samples': 78176, 'steps': 152, 'loss/train': 5.8456830978393555} -09/20/2021 15:00:59 - INFO - __main__ - Step 2444: {'lr': 4.0533333333333334e-05, 'samples': 78208, 'steps': 152, 'loss/train': 6.063998222351074} -09/20/2021 15:01:00 - INFO - __main__ - Step 2445: {'lr': 4.0533333333333334e-05, 'samples': 78240, 'steps': 152, 'loss/train': 6.201157569885254} -09/20/2021 15:01:00 - INFO - __main__ - Step 2446: {'lr': 4.0533333333333334e-05, 'samples': 78272, 'steps': 152, 'loss/train': 8.327589988708496} -09/20/2021 15:01:01 - INFO - __main__ - Step 2447: {'lr': 4.0533333333333334e-05, 'samples': 78304, 'steps': 152, 'loss/train': 7.046227931976318} -09/20/2021 15:01:02 - INFO - __main__ - Step 2448: {'lr': 4.0533333333333334e-05, 'samples': 78336, 'steps': 152, 'loss/train': 6.864868640899658} -09/20/2021 15:01:03 - INFO - __main__ - Step 2449: {'lr': 4.08e-05, 'samples': 78368, 'steps': 153, 'loss/train': 6.108758926391602} -09/20/2021 15:01:03 - INFO - __main__ - Step 2450: {'lr': 4.08e-05, 'samples': 78400, 'steps': 153, 'loss/train': 5.771704196929932} -09/20/2021 15:01:04 - INFO - __main__ - Step 2451: {'lr': 4.08e-05, 'samples': 78432, 'steps': 153, 'loss/train': 7.43412446975708} -09/20/2021 15:01:05 - INFO - __main__ - Step 2452: {'lr': 4.08e-05, 'samples': 78464, 'steps': 153, 'loss/train': 7.867547512054443} -09/20/2021 15:01:06 - INFO - __main__ - Step 2453: {'lr': 4.08e-05, 'samples': 78496, 'steps': 153, 'loss/train': 6.9889302253723145} -09/20/2021 15:01:06 - INFO - __main__ - Step 2454: {'lr': 4.08e-05, 'samples': 78528, 'steps': 153, 'loss/train': 7.449956893920898} -09/20/2021 15:01:07 - INFO - __main__ - Step 2455: {'lr': 4.08e-05, 'samples': 78560, 'steps': 153, 'loss/train': 7.189932346343994} -09/20/2021 15:01:08 - INFO - __main__ - Step 2456: {'lr': 4.08e-05, 'samples': 78592, 'steps': 153, 'loss/train': 7.712790012359619} -09/20/2021 15:01:09 - INFO - __main__ - Step 2457: {'lr': 4.08e-05, 'samples': 78624, 'steps': 153, 'loss/train': 7.940590858459473} -09/20/2021 15:01:10 - INFO - __main__ - Step 2458: {'lr': 4.08e-05, 'samples': 78656, 'steps': 153, 'loss/train': 7.39838171005249} -09/20/2021 15:01:11 - INFO - __main__ - Step 2459: {'lr': 4.08e-05, 'samples': 78688, 'steps': 153, 'loss/train': 6.4366230964660645} -09/20/2021 15:01:11 - INFO - __main__ - Step 2460: {'lr': 4.08e-05, 'samples': 78720, 'steps': 153, 'loss/train': 5.71842098236084} -09/20/2021 15:01:12 - INFO - __main__ - Step 2461: {'lr': 4.08e-05, 'samples': 78752, 'steps': 153, 'loss/train': 6.403326034545898} -09/20/2021 15:01:13 - INFO - __main__ - Step 2462: {'lr': 4.08e-05, 'samples': 78784, 'steps': 153, 'loss/train': 6.393619537353516} -09/20/2021 15:01:14 - INFO - __main__ - Step 2463: {'lr': 4.08e-05, 'samples': 78816, 'steps': 153, 'loss/train': 6.412029266357422} -09/20/2021 15:01:14 - INFO - __main__ - Step 2464: {'lr': 4.08e-05, 'samples': 78848, 'steps': 153, 'loss/train': 6.683584213256836} -09/20/2021 15:01:15 - INFO - __main__ - Step 2465: {'lr': 4.106666666666667e-05, 'samples': 78880, 'steps': 154, 'loss/train': 6.266972541809082} -09/20/2021 15:01:16 - INFO - __main__ - Step 2466: {'lr': 4.106666666666667e-05, 'samples': 78912, 'steps': 154, 'loss/train': 5.710607528686523} -09/20/2021 15:01:17 - INFO - __main__ - Step 2467: {'lr': 4.106666666666667e-05, 'samples': 78944, 'steps': 154, 'loss/train': 6.391040802001953} -09/20/2021 15:01:18 - INFO - __main__ - Step 2468: {'lr': 4.106666666666667e-05, 'samples': 78976, 'steps': 154, 'loss/train': 5.61561393737793} -09/20/2021 15:01:18 - INFO - __main__ - Step 2469: {'lr': 4.106666666666667e-05, 'samples': 79008, 'steps': 154, 'loss/train': 6.11440896987915} -09/20/2021 15:01:19 - INFO - __main__ - Step 2470: {'lr': 4.106666666666667e-05, 'samples': 79040, 'steps': 154, 'loss/train': 6.873351097106934} -09/20/2021 15:01:20 - INFO - __main__ - Step 2471: {'lr': 4.106666666666667e-05, 'samples': 79072, 'steps': 154, 'loss/train': 6.764773845672607} -09/20/2021 15:01:21 - INFO - __main__ - Step 2472: {'lr': 4.106666666666667e-05, 'samples': 79104, 'steps': 154, 'loss/train': 6.200422763824463} -09/20/2021 15:01:21 - INFO - __main__ - Step 2473: {'lr': 4.106666666666667e-05, 'samples': 79136, 'steps': 154, 'loss/train': 6.330258369445801} -09/20/2021 15:01:22 - INFO - __main__ - Step 2474: {'lr': 4.106666666666667e-05, 'samples': 79168, 'steps': 154, 'loss/train': 6.423024654388428} -09/20/2021 15:01:23 - INFO - __main__ - Step 2475: {'lr': 4.106666666666667e-05, 'samples': 79200, 'steps': 154, 'loss/train': 1.6903332471847534} -09/20/2021 15:01:24 - INFO - __main__ - Step 2476: {'lr': 4.106666666666667e-05, 'samples': 79232, 'steps': 154, 'loss/train': 6.302234172821045} -09/20/2021 15:01:24 - INFO - __main__ - Step 2477: {'lr': 4.106666666666667e-05, 'samples': 79264, 'steps': 154, 'loss/train': 5.80399751663208} -09/20/2021 15:01:25 - INFO - __main__ - Step 2478: {'lr': 4.106666666666667e-05, 'samples': 79296, 'steps': 154, 'loss/train': 6.555335998535156} -09/20/2021 15:01:26 - INFO - __main__ - Step 2479: {'lr': 4.106666666666667e-05, 'samples': 79328, 'steps': 154, 'loss/train': 5.797046184539795} -09/20/2021 15:01:27 - INFO - __main__ - Step 2480: {'lr': 4.106666666666667e-05, 'samples': 79360, 'steps': 154, 'loss/train': 6.393826007843018} -09/20/2021 15:01:27 - INFO - __main__ - Step 2481: {'lr': 4.133333333333333e-05, 'samples': 79392, 'steps': 155, 'loss/train': 5.607860088348389} -09/20/2021 15:01:28 - INFO - __main__ - Step 2482: {'lr': 4.133333333333333e-05, 'samples': 79424, 'steps': 155, 'loss/train': 6.131834983825684} -09/20/2021 15:01:29 - INFO - __main__ - Step 2483: {'lr': 4.133333333333333e-05, 'samples': 79456, 'steps': 155, 'loss/train': 5.750481605529785} -09/20/2021 15:01:30 - INFO - __main__ - Step 2484: {'lr': 4.133333333333333e-05, 'samples': 79488, 'steps': 155, 'loss/train': 6.896501541137695} -09/20/2021 15:01:30 - INFO - __main__ - Step 2485: {'lr': 4.133333333333333e-05, 'samples': 79520, 'steps': 155, 'loss/train': 5.548871994018555} -09/20/2021 15:01:31 - INFO - __main__ - Step 2486: {'lr': 4.133333333333333e-05, 'samples': 79552, 'steps': 155, 'loss/train': 6.670544624328613} -09/20/2021 15:01:32 - INFO - __main__ - Step 2487: {'lr': 4.133333333333333e-05, 'samples': 79584, 'steps': 155, 'loss/train': 6.386887550354004} -09/20/2021 15:01:33 - INFO - __main__ - Step 2488: {'lr': 4.133333333333333e-05, 'samples': 79616, 'steps': 155, 'loss/train': 5.73793363571167} -09/20/2021 15:01:34 - INFO - __main__ - Step 2489: {'lr': 4.133333333333333e-05, 'samples': 79648, 'steps': 155, 'loss/train': 5.4828362464904785} -09/20/2021 15:01:35 - INFO - __main__ - Step 2490: {'lr': 4.133333333333333e-05, 'samples': 79680, 'steps': 155, 'loss/train': 6.385136127471924} -09/20/2021 15:01:36 - INFO - __main__ - Step 2491: {'lr': 4.133333333333333e-05, 'samples': 79712, 'steps': 155, 'loss/train': 5.932218074798584} -09/20/2021 15:01:36 - INFO - __main__ - Step 2492: {'lr': 4.133333333333333e-05, 'samples': 79744, 'steps': 155, 'loss/train': 5.9479780197143555} -09/20/2021 15:01:37 - INFO - __main__ - Step 2493: {'lr': 4.133333333333333e-05, 'samples': 79776, 'steps': 155, 'loss/train': 6.079336643218994} -09/20/2021 15:01:38 - INFO - __main__ - Step 2494: {'lr': 4.133333333333333e-05, 'samples': 79808, 'steps': 155, 'loss/train': 6.497676849365234} -09/20/2021 15:01:39 - INFO - __main__ - Step 2495: {'lr': 4.133333333333333e-05, 'samples': 79840, 'steps': 155, 'loss/train': 5.813429832458496} -09/20/2021 15:01:39 - INFO - __main__ - Step 2496: {'lr': 4.133333333333333e-05, 'samples': 79872, 'steps': 155, 'loss/train': 6.022780418395996} -09/20/2021 15:01:40 - INFO - __main__ - Step 2497: {'lr': 4.16e-05, 'samples': 79904, 'steps': 156, 'loss/train': 5.938256740570068} -09/20/2021 15:01:41 - INFO - __main__ - Step 2498: {'lr': 4.16e-05, 'samples': 79936, 'steps': 156, 'loss/train': 5.800051212310791} -09/20/2021 15:01:42 - INFO - __main__ - Step 2499: {'lr': 4.16e-05, 'samples': 79968, 'steps': 156, 'loss/train': 6.263347148895264} -09/20/2021 15:01:42 - INFO - __main__ - Step 2500: {'lr': 4.16e-05, 'samples': 80000, 'steps': 156, 'loss/train': 6.104167461395264} -09/20/2021 15:01:43 - INFO - __main__ - Step 2501: {'lr': 4.16e-05, 'samples': 80032, 'steps': 156, 'loss/train': 5.73416805267334} -09/20/2021 15:01:44 - INFO - __main__ - Step 2502: {'lr': 4.16e-05, 'samples': 80064, 'steps': 156, 'loss/train': 6.124878883361816} -09/20/2021 15:01:45 - INFO - __main__ - Step 2503: {'lr': 4.16e-05, 'samples': 80096, 'steps': 156, 'loss/train': 6.382125377655029} -09/20/2021 15:01:45 - INFO - __main__ - Step 2504: {'lr': 4.16e-05, 'samples': 80128, 'steps': 156, 'loss/train': 5.155949115753174} -09/20/2021 15:01:46 - INFO - __main__ - Step 2505: {'lr': 4.16e-05, 'samples': 80160, 'steps': 156, 'loss/train': 5.841557502746582} -09/20/2021 15:01:47 - INFO - __main__ - Step 2506: {'lr': 4.16e-05, 'samples': 80192, 'steps': 156, 'loss/train': 6.192776203155518} -09/20/2021 15:01:48 - INFO - __main__ - Step 2507: {'lr': 4.16e-05, 'samples': 80224, 'steps': 156, 'loss/train': 5.999773979187012} -09/20/2021 15:01:48 - INFO - __main__ - Step 2508: {'lr': 4.16e-05, 'samples': 80256, 'steps': 156, 'loss/train': 6.2453227043151855} -09/20/2021 15:01:49 - INFO - __main__ - Step 2509: {'lr': 4.16e-05, 'samples': 80288, 'steps': 156, 'loss/train': 7.7046799659729} -09/20/2021 15:01:50 - INFO - __main__ - Step 2510: {'lr': 4.16e-05, 'samples': 80320, 'steps': 156, 'loss/train': 6.253943920135498} -09/20/2021 15:01:51 - INFO - __main__ - Step 2511: {'lr': 4.16e-05, 'samples': 80352, 'steps': 156, 'loss/train': 6.013951778411865} -09/20/2021 15:01:51 - INFO - __main__ - Step 2512: {'lr': 4.16e-05, 'samples': 80384, 'steps': 156, 'loss/train': 6.277663707733154} -09/20/2021 15:01:52 - INFO - __main__ - Step 2513: {'lr': 4.186666666666667e-05, 'samples': 80416, 'steps': 157, 'loss/train': 6.420281410217285} -09/20/2021 15:01:53 - INFO - __main__ - Step 2514: {'lr': 4.186666666666667e-05, 'samples': 80448, 'steps': 157, 'loss/train': 6.207426071166992} -09/20/2021 15:01:54 - INFO - __main__ - Step 2515: {'lr': 4.186666666666667e-05, 'samples': 80480, 'steps': 157, 'loss/train': 6.669621467590332} -09/20/2021 15:01:55 - INFO - __main__ - Step 2516: {'lr': 4.186666666666667e-05, 'samples': 80512, 'steps': 157, 'loss/train': 6.797295093536377} -09/20/2021 15:01:55 - INFO - __main__ - Step 2517: {'lr': 4.186666666666667e-05, 'samples': 80544, 'steps': 157, 'loss/train': 5.939659118652344} -09/20/2021 15:01:56 - INFO - __main__ - Step 2518: {'lr': 4.186666666666667e-05, 'samples': 80576, 'steps': 157, 'loss/train': 6.226371765136719} -09/20/2021 15:01:57 - INFO - __main__ - Step 2519: {'lr': 4.186666666666667e-05, 'samples': 80608, 'steps': 157, 'loss/train': 6.942317962646484} -09/20/2021 15:01:58 - INFO - __main__ - Step 2520: {'lr': 4.186666666666667e-05, 'samples': 80640, 'steps': 157, 'loss/train': 6.247735500335693} -09/20/2021 15:01:59 - INFO - __main__ - Step 2521: {'lr': 4.186666666666667e-05, 'samples': 80672, 'steps': 157, 'loss/train': 5.582824230194092} -09/20/2021 15:02:00 - INFO - __main__ - Step 2522: {'lr': 4.186666666666667e-05, 'samples': 80704, 'steps': 157, 'loss/train': 5.410653114318848} -09/20/2021 15:02:00 - INFO - __main__ - Step 2523: {'lr': 4.186666666666667e-05, 'samples': 80736, 'steps': 157, 'loss/train': 6.127928256988525} -09/20/2021 15:02:01 - INFO - __main__ - Step 2524: {'lr': 4.186666666666667e-05, 'samples': 80768, 'steps': 157, 'loss/train': 6.245342254638672} -09/20/2021 15:02:02 - INFO - __main__ - Step 2525: {'lr': 4.186666666666667e-05, 'samples': 80800, 'steps': 157, 'loss/train': 5.931537628173828} -09/20/2021 15:02:03 - INFO - __main__ - Step 2526: {'lr': 4.186666666666667e-05, 'samples': 80832, 'steps': 157, 'loss/train': 6.07809591293335} -09/20/2021 15:02:03 - INFO - __main__ - Step 2527: {'lr': 4.186666666666667e-05, 'samples': 80864, 'steps': 157, 'loss/train': 6.120916366577148} -09/20/2021 15:02:04 - INFO - __main__ - Step 2528: {'lr': 4.186666666666667e-05, 'samples': 80896, 'steps': 157, 'loss/train': 5.095183849334717} -09/20/2021 15:02:05 - INFO - __main__ - Step 2529: {'lr': 4.213333333333334e-05, 'samples': 80928, 'steps': 158, 'loss/train': 6.062344551086426} -09/20/2021 15:02:06 - INFO - __main__ - Step 2530: {'lr': 4.213333333333334e-05, 'samples': 80960, 'steps': 158, 'loss/train': 6.565893650054932} -09/20/2021 15:02:06 - INFO - __main__ - Step 2531: {'lr': 4.213333333333334e-05, 'samples': 80992, 'steps': 158, 'loss/train': 6.6047163009643555} -09/20/2021 15:02:07 - INFO - __main__ - Step 2532: {'lr': 4.213333333333334e-05, 'samples': 81024, 'steps': 158, 'loss/train': 5.864922046661377} -09/20/2021 15:02:08 - INFO - __main__ - Step 2533: {'lr': 4.213333333333334e-05, 'samples': 81056, 'steps': 158, 'loss/train': 5.964928150177002} -09/20/2021 15:02:09 - INFO - __main__ - Step 2534: {'lr': 4.213333333333334e-05, 'samples': 81088, 'steps': 158, 'loss/train': 6.063560485839844} -09/20/2021 15:02:09 - INFO - __main__ - Step 2535: {'lr': 4.213333333333334e-05, 'samples': 81120, 'steps': 158, 'loss/train': 6.041872024536133} -09/20/2021 15:02:10 - INFO - __main__ - Step 2536: {'lr': 4.213333333333334e-05, 'samples': 81152, 'steps': 158, 'loss/train': 5.480569362640381} -09/20/2021 15:02:11 - INFO - __main__ - Step 2537: {'lr': 4.213333333333334e-05, 'samples': 81184, 'steps': 158, 'loss/train': 5.757949352264404} -09/20/2021 15:02:12 - INFO - __main__ - Step 2538: {'lr': 4.213333333333334e-05, 'samples': 81216, 'steps': 158, 'loss/train': 6.600811004638672} -09/20/2021 15:02:12 - INFO - __main__ - Step 2539: {'lr': 4.213333333333334e-05, 'samples': 81248, 'steps': 158, 'loss/train': 6.776731014251709} -09/20/2021 15:02:13 - INFO - __main__ - Step 2540: {'lr': 4.213333333333334e-05, 'samples': 81280, 'steps': 158, 'loss/train': 6.588965892791748} -09/20/2021 15:02:14 - INFO - __main__ - Step 2541: {'lr': 4.213333333333334e-05, 'samples': 81312, 'steps': 158, 'loss/train': 4.926036834716797} -09/20/2021 15:02:15 - INFO - __main__ - Step 2542: {'lr': 4.213333333333334e-05, 'samples': 81344, 'steps': 158, 'loss/train': 7.53963041305542} -09/20/2021 15:02:15 - INFO - __main__ - Step 2543: {'lr': 4.213333333333334e-05, 'samples': 81376, 'steps': 158, 'loss/train': 7.525889873504639} -09/20/2021 15:02:16 - INFO - __main__ - Step 2544: {'lr': 4.213333333333334e-05, 'samples': 81408, 'steps': 158, 'loss/train': 7.177288055419922} -09/20/2021 15:02:17 - INFO - __main__ - Step 2545: {'lr': 4.24e-05, 'samples': 81440, 'steps': 159, 'loss/train': 4.383800029754639} -09/20/2021 15:02:18 - INFO - __main__ - Step 2546: {'lr': 4.24e-05, 'samples': 81472, 'steps': 159, 'loss/train': 6.478893280029297} -09/20/2021 15:02:19 - INFO - __main__ - Step 2547: {'lr': 4.24e-05, 'samples': 81504, 'steps': 159, 'loss/train': 5.639415264129639} -09/20/2021 15:02:19 - INFO - __main__ - Step 2548: {'lr': 4.24e-05, 'samples': 81536, 'steps': 159, 'loss/train': 6.68930721282959} -09/20/2021 15:02:20 - INFO - __main__ - Step 2549: {'lr': 4.24e-05, 'samples': 81568, 'steps': 159, 'loss/train': 6.616140365600586} -09/20/2021 15:02:21 - INFO - __main__ - Step 2550: {'lr': 4.24e-05, 'samples': 81600, 'steps': 159, 'loss/train': 6.88444185256958} -09/20/2021 15:02:22 - INFO - __main__ - Step 2551: {'lr': 4.24e-05, 'samples': 81632, 'steps': 159, 'loss/train': 5.4573140144348145} -09/20/2021 15:02:23 - INFO - __main__ - Step 2552: {'lr': 4.24e-05, 'samples': 81664, 'steps': 159, 'loss/train': 6.8632001876831055} -09/20/2021 15:02:24 - INFO - __main__ - Step 2553: {'lr': 4.24e-05, 'samples': 81696, 'steps': 159, 'loss/train': 5.829990863800049} -09/20/2021 15:02:24 - INFO - __main__ - Step 2554: {'lr': 4.24e-05, 'samples': 81728, 'steps': 159, 'loss/train': 6.802834987640381} -09/20/2021 15:02:25 - INFO - __main__ - Step 2555: {'lr': 4.24e-05, 'samples': 81760, 'steps': 159, 'loss/train': 4.879003524780273} -09/20/2021 15:02:26 - INFO - __main__ - Step 2556: {'lr': 4.24e-05, 'samples': 81792, 'steps': 159, 'loss/train': 6.007147789001465} -09/20/2021 15:02:27 - INFO - __main__ - Step 2557: {'lr': 4.24e-05, 'samples': 81824, 'steps': 159, 'loss/train': 6.11210823059082} -09/20/2021 15:02:27 - INFO - __main__ - Step 2558: {'lr': 4.24e-05, 'samples': 81856, 'steps': 159, 'loss/train': 6.8124470710754395} -09/20/2021 15:02:28 - INFO - __main__ - Step 2559: {'lr': 4.24e-05, 'samples': 81888, 'steps': 159, 'loss/train': 6.472072124481201} -09/20/2021 15:02:29 - INFO - __main__ - Step 2560: {'lr': 4.24e-05, 'samples': 81920, 'steps': 159, 'loss/train': 5.929097652435303} -09/20/2021 15:02:30 - INFO - __main__ - Step 2561: {'lr': 4.266666666666667e-05, 'samples': 81952, 'steps': 160, 'loss/train': 6.36329984664917} -09/20/2021 15:02:31 - INFO - __main__ - Step 2562: {'lr': 4.266666666666667e-05, 'samples': 81984, 'steps': 160, 'loss/train': 6.170423984527588} -09/20/2021 15:02:31 - INFO - __main__ - Step 2563: {'lr': 4.266666666666667e-05, 'samples': 82016, 'steps': 160, 'loss/train': 6.134052276611328} -09/20/2021 15:02:32 - INFO - __main__ - Step 2564: {'lr': 4.266666666666667e-05, 'samples': 82048, 'steps': 160, 'loss/train': 5.862811088562012} -09/20/2021 15:02:33 - INFO - __main__ - Step 2565: {'lr': 4.266666666666667e-05, 'samples': 82080, 'steps': 160, 'loss/train': 6.679874420166016} -09/20/2021 15:02:34 - INFO - __main__ - Step 2566: {'lr': 4.266666666666667e-05, 'samples': 82112, 'steps': 160, 'loss/train': 6.376524925231934} -09/20/2021 15:02:34 - INFO - __main__ - Step 2567: {'lr': 4.266666666666667e-05, 'samples': 82144, 'steps': 160, 'loss/train': 6.351700782775879} -09/20/2021 15:02:35 - INFO - __main__ - Step 2568: {'lr': 4.266666666666667e-05, 'samples': 82176, 'steps': 160, 'loss/train': 5.995226860046387} -09/20/2021 15:02:36 - INFO - __main__ - Step 2569: {'lr': 4.266666666666667e-05, 'samples': 82208, 'steps': 160, 'loss/train': 5.327423095703125} -09/20/2021 15:02:37 - INFO - __main__ - Step 2570: {'lr': 4.266666666666667e-05, 'samples': 82240, 'steps': 160, 'loss/train': 6.1184306144714355} -09/20/2021 15:02:37 - INFO - __main__ - Step 2571: {'lr': 4.266666666666667e-05, 'samples': 82272, 'steps': 160, 'loss/train': 6.57465934753418} -09/20/2021 15:02:38 - INFO - __main__ - Step 2572: {'lr': 4.266666666666667e-05, 'samples': 82304, 'steps': 160, 'loss/train': 6.861964225769043} -09/20/2021 15:02:39 - INFO - __main__ - Step 2573: {'lr': 4.266666666666667e-05, 'samples': 82336, 'steps': 160, 'loss/train': 5.751716613769531} -09/20/2021 15:02:40 - INFO - __main__ - Step 2574: {'lr': 4.266666666666667e-05, 'samples': 82368, 'steps': 160, 'loss/train': 6.166990756988525} -09/20/2021 15:02:40 - INFO - __main__ - Step 2575: {'lr': 4.266666666666667e-05, 'samples': 82400, 'steps': 160, 'loss/train': 6.8498311042785645} -09/20/2021 15:02:41 - INFO - __main__ - Step 2576: {'lr': 4.266666666666667e-05, 'samples': 82432, 'steps': 160, 'loss/train': 5.307199954986572} -09/20/2021 15:02:42 - INFO - __main__ - Step 2577: {'lr': 4.293333333333334e-05, 'samples': 82464, 'steps': 161, 'loss/train': 5.736014366149902} -09/20/2021 15:02:43 - INFO - __main__ - Step 2578: {'lr': 4.293333333333334e-05, 'samples': 82496, 'steps': 161, 'loss/train': 6.610804080963135} -09/20/2021 15:02:43 - INFO - __main__ - Step 2579: {'lr': 4.293333333333334e-05, 'samples': 82528, 'steps': 161, 'loss/train': 5.265331268310547} -09/20/2021 15:02:44 - INFO - __main__ - Step 2580: {'lr': 4.293333333333334e-05, 'samples': 82560, 'steps': 161, 'loss/train': 6.463908672332764} -09/20/2021 15:02:46 - INFO - __main__ - Step 2581: {'lr': 4.293333333333334e-05, 'samples': 82592, 'steps': 161, 'loss/train': 6.219603538513184} -09/20/2021 15:02:47 - INFO - __main__ - Step 2582: {'lr': 4.293333333333334e-05, 'samples': 82624, 'steps': 161, 'loss/train': 5.588942050933838} -09/20/2021 15:02:48 - INFO - __main__ - Step 2583: {'lr': 4.293333333333334e-05, 'samples': 82656, 'steps': 161, 'loss/train': 6.42734956741333} -09/20/2021 15:02:48 - INFO - __main__ - Step 2584: {'lr': 4.293333333333334e-05, 'samples': 82688, 'steps': 161, 'loss/train': 5.6403422355651855} -09/20/2021 15:02:49 - INFO - __main__ - Step 2585: {'lr': 4.293333333333334e-05, 'samples': 82720, 'steps': 161, 'loss/train': 6.402869701385498} -09/20/2021 15:02:50 - INFO - __main__ - Step 2586: {'lr': 4.293333333333334e-05, 'samples': 82752, 'steps': 161, 'loss/train': 6.092564582824707} -09/20/2021 15:02:51 - INFO - __main__ - Step 2587: {'lr': 4.293333333333334e-05, 'samples': 82784, 'steps': 161, 'loss/train': 6.1983962059021} -09/20/2021 15:02:51 - INFO - __main__ - Step 2588: {'lr': 4.293333333333334e-05, 'samples': 82816, 'steps': 161, 'loss/train': 6.40958309173584} -09/20/2021 15:02:52 - INFO - __main__ - Step 2589: {'lr': 4.293333333333334e-05, 'samples': 82848, 'steps': 161, 'loss/train': 6.221890449523926} -09/20/2021 15:02:53 - INFO - __main__ - Step 2590: {'lr': 4.293333333333334e-05, 'samples': 82880, 'steps': 161, 'loss/train': 5.756240367889404} -09/20/2021 15:02:54 - INFO - __main__ - Step 2591: {'lr': 4.293333333333334e-05, 'samples': 82912, 'steps': 161, 'loss/train': 7.5603508949279785} -09/20/2021 15:02:54 - INFO - __main__ - Step 2592: {'lr': 4.293333333333334e-05, 'samples': 82944, 'steps': 161, 'loss/train': 6.139090538024902} -09/20/2021 15:02:55 - INFO - __main__ - Step 2593: {'lr': 4.32e-05, 'samples': 82976, 'steps': 162, 'loss/train': 5.211459636688232} -09/20/2021 15:02:56 - INFO - __main__ - Step 2594: {'lr': 4.32e-05, 'samples': 83008, 'steps': 162, 'loss/train': 6.191188335418701} -09/20/2021 15:02:57 - INFO - __main__ - Step 2595: {'lr': 4.32e-05, 'samples': 83040, 'steps': 162, 'loss/train': 5.785233497619629} -09/20/2021 15:02:57 - INFO - __main__ - Step 2596: {'lr': 4.32e-05, 'samples': 83072, 'steps': 162, 'loss/train': 5.784493923187256} -09/20/2021 15:02:58 - INFO - __main__ - Step 2597: {'lr': 4.32e-05, 'samples': 83104, 'steps': 162, 'loss/train': 5.662668704986572} -09/20/2021 15:02:59 - INFO - __main__ - Step 2598: {'lr': 4.32e-05, 'samples': 83136, 'steps': 162, 'loss/train': 6.282014846801758} -09/20/2021 15:03:00 - INFO - __main__ - Step 2599: {'lr': 4.32e-05, 'samples': 83168, 'steps': 162, 'loss/train': 4.356054782867432} -09/20/2021 15:03:00 - INFO - __main__ - Step 2600: {'lr': 4.32e-05, 'samples': 83200, 'steps': 162, 'loss/train': 5.992147445678711} -09/20/2021 15:03:01 - INFO - __main__ - Step 2601: {'lr': 4.32e-05, 'samples': 83232, 'steps': 162, 'loss/train': 6.151191711425781} -09/20/2021 15:03:02 - INFO - __main__ - Step 2602: {'lr': 4.32e-05, 'samples': 83264, 'steps': 162, 'loss/train': 5.20988655090332} -09/20/2021 15:03:03 - INFO - __main__ - Step 2603: {'lr': 4.32e-05, 'samples': 83296, 'steps': 162, 'loss/train': 6.317473888397217} -09/20/2021 15:03:03 - INFO - __main__ - Step 2604: {'lr': 4.32e-05, 'samples': 83328, 'steps': 162, 'loss/train': 6.824505805969238} -09/20/2021 15:03:04 - INFO - __main__ - Step 2605: {'lr': 4.32e-05, 'samples': 83360, 'steps': 162, 'loss/train': 6.426881790161133} -09/20/2021 15:03:05 - INFO - __main__ - Step 2606: {'lr': 4.32e-05, 'samples': 83392, 'steps': 162, 'loss/train': 6.028285026550293} -09/20/2021 15:03:06 - INFO - __main__ - Step 2607: {'lr': 4.32e-05, 'samples': 83424, 'steps': 162, 'loss/train': 5.794271469116211} -09/20/2021 15:03:06 - INFO - __main__ - Step 2608: {'lr': 4.32e-05, 'samples': 83456, 'steps': 162, 'loss/train': 5.322343826293945} -09/20/2021 15:03:07 - INFO - __main__ - Step 2609: {'lr': 4.346666666666667e-05, 'samples': 83488, 'steps': 163, 'loss/train': 6.003962516784668} -09/20/2021 15:03:08 - INFO - __main__ - Step 2610: {'lr': 4.346666666666667e-05, 'samples': 83520, 'steps': 163, 'loss/train': 5.863370895385742} -09/20/2021 15:03:09 - INFO - __main__ - Step 2611: {'lr': 4.346666666666667e-05, 'samples': 83552, 'steps': 163, 'loss/train': 5.21474552154541} -09/20/2021 15:03:10 - INFO - __main__ - Step 2612: {'lr': 4.346666666666667e-05, 'samples': 83584, 'steps': 163, 'loss/train': 5.956271648406982} -09/20/2021 15:03:11 - INFO - __main__ - Step 2613: {'lr': 4.346666666666667e-05, 'samples': 83616, 'steps': 163, 'loss/train': 5.711556434631348} -09/20/2021 15:03:12 - INFO - __main__ - Step 2614: {'lr': 4.346666666666667e-05, 'samples': 83648, 'steps': 163, 'loss/train': 6.851556777954102} -09/20/2021 15:03:13 - INFO - __main__ - Step 2615: {'lr': 4.346666666666667e-05, 'samples': 83680, 'steps': 163, 'loss/train': 5.865117073059082} -09/20/2021 15:03:13 - INFO - __main__ - Step 2616: {'lr': 4.346666666666667e-05, 'samples': 83712, 'steps': 163, 'loss/train': 5.739682197570801} -09/20/2021 15:03:14 - INFO - __main__ - Step 2617: {'lr': 4.346666666666667e-05, 'samples': 83744, 'steps': 163, 'loss/train': 6.557872772216797} -09/20/2021 15:03:15 - INFO - __main__ - Step 2618: {'lr': 4.346666666666667e-05, 'samples': 83776, 'steps': 163, 'loss/train': 5.930615425109863} -09/20/2021 15:03:16 - INFO - __main__ - Step 2619: {'lr': 4.346666666666667e-05, 'samples': 83808, 'steps': 163, 'loss/train': 5.3031697273254395} -09/20/2021 15:03:16 - INFO - __main__ - Step 2620: {'lr': 4.346666666666667e-05, 'samples': 83840, 'steps': 163, 'loss/train': 5.7120795249938965} -09/20/2021 15:03:17 - INFO - __main__ - Step 2621: {'lr': 4.346666666666667e-05, 'samples': 83872, 'steps': 163, 'loss/train': 6.072360992431641} -09/20/2021 15:03:18 - INFO - __main__ - Step 2622: {'lr': 4.346666666666667e-05, 'samples': 83904, 'steps': 163, 'loss/train': 5.050556182861328} -09/20/2021 15:03:19 - INFO - __main__ - Step 2623: {'lr': 4.346666666666667e-05, 'samples': 83936, 'steps': 163, 'loss/train': 6.025839805603027} -09/20/2021 15:03:19 - INFO - __main__ - Step 2624: {'lr': 4.346666666666667e-05, 'samples': 83968, 'steps': 163, 'loss/train': 5.532792091369629} -09/20/2021 15:03:20 - INFO - __main__ - Step 2625: {'lr': 4.373333333333334e-05, 'samples': 84000, 'steps': 164, 'loss/train': 5.782102108001709} -09/20/2021 15:03:21 - INFO - __main__ - Step 2626: {'lr': 4.373333333333334e-05, 'samples': 84032, 'steps': 164, 'loss/train': 5.874716758728027} -09/20/2021 15:03:22 - INFO - __main__ - Step 2627: {'lr': 4.373333333333334e-05, 'samples': 84064, 'steps': 164, 'loss/train': 5.945744037628174} -09/20/2021 15:03:23 - INFO - __main__ - Step 2628: {'lr': 4.373333333333334e-05, 'samples': 84096, 'steps': 164, 'loss/train': 5.808272838592529} -09/20/2021 15:03:23 - INFO - __main__ - Step 2629: {'lr': 4.373333333333334e-05, 'samples': 84128, 'steps': 164, 'loss/train': 5.73525857925415} -09/20/2021 15:03:24 - INFO - __main__ - Step 2630: {'lr': 4.373333333333334e-05, 'samples': 84160, 'steps': 164, 'loss/train': 5.694440841674805} -09/20/2021 15:03:25 - INFO - __main__ - Step 2631: {'lr': 4.373333333333334e-05, 'samples': 84192, 'steps': 164, 'loss/train': 5.86282205581665} -09/20/2021 15:03:26 - INFO - __main__ - Step 2632: {'lr': 4.373333333333334e-05, 'samples': 84224, 'steps': 164, 'loss/train': 6.113814353942871} -09/20/2021 15:03:26 - INFO - __main__ - Step 2633: {'lr': 4.373333333333334e-05, 'samples': 84256, 'steps': 164, 'loss/train': 4.959403038024902} -09/20/2021 15:03:27 - INFO - __main__ - Step 2634: {'lr': 4.373333333333334e-05, 'samples': 84288, 'steps': 164, 'loss/train': 5.970380783081055} -09/20/2021 15:03:28 - INFO - __main__ - Step 2635: {'lr': 4.373333333333334e-05, 'samples': 84320, 'steps': 164, 'loss/train': 5.962685585021973} -09/20/2021 15:03:28 - INFO - __main__ - Step 2636: {'lr': 4.373333333333334e-05, 'samples': 84352, 'steps': 164, 'loss/train': 5.310928821563721} -09/20/2021 15:03:29 - INFO - __main__ - Step 2637: {'lr': 4.373333333333334e-05, 'samples': 84384, 'steps': 164, 'loss/train': 5.289916038513184} -09/20/2021 15:03:30 - INFO - __main__ - Step 2638: {'lr': 4.373333333333334e-05, 'samples': 84416, 'steps': 164, 'loss/train': 6.261023044586182} -09/20/2021 15:03:31 - INFO - __main__ - Step 2639: {'lr': 4.373333333333334e-05, 'samples': 84448, 'steps': 164, 'loss/train': 6.683660507202148} -09/20/2021 15:03:32 - INFO - __main__ - Step 2640: {'lr': 4.373333333333334e-05, 'samples': 84480, 'steps': 164, 'loss/train': 5.8831024169921875} -09/20/2021 15:03:32 - INFO - __main__ - Step 2641: {'lr': 4.4000000000000006e-05, 'samples': 84512, 'steps': 165, 'loss/train': 7.355615615844727} -09/20/2021 15:03:34 - INFO - __main__ - Step 2642: {'lr': 4.4000000000000006e-05, 'samples': 84544, 'steps': 165, 'loss/train': 5.526116847991943} -09/20/2021 15:03:34 - INFO - __main__ - Step 2643: {'lr': 4.4000000000000006e-05, 'samples': 84576, 'steps': 165, 'loss/train': 6.3997979164123535} -09/20/2021 15:03:35 - INFO - __main__ - Step 2644: {'lr': 4.4000000000000006e-05, 'samples': 84608, 'steps': 165, 'loss/train': 7.886075019836426} -09/20/2021 15:03:36 - INFO - __main__ - Step 2645: {'lr': 4.4000000000000006e-05, 'samples': 84640, 'steps': 165, 'loss/train': 5.7764177322387695} -09/20/2021 15:03:37 - INFO - __main__ - Step 2646: {'lr': 4.4000000000000006e-05, 'samples': 84672, 'steps': 165, 'loss/train': 5.779234886169434} -09/20/2021 15:03:37 - INFO - __main__ - Step 2647: {'lr': 4.4000000000000006e-05, 'samples': 84704, 'steps': 165, 'loss/train': 6.05281925201416} -09/20/2021 15:03:38 - INFO - __main__ - Step 2648: {'lr': 4.4000000000000006e-05, 'samples': 84736, 'steps': 165, 'loss/train': 4.8599324226379395} -09/20/2021 15:03:39 - INFO - __main__ - Step 2649: {'lr': 4.4000000000000006e-05, 'samples': 84768, 'steps': 165, 'loss/train': 6.438215255737305} -09/20/2021 15:03:40 - INFO - __main__ - Step 2650: {'lr': 4.4000000000000006e-05, 'samples': 84800, 'steps': 165, 'loss/train': 5.3492207527160645} -09/20/2021 15:03:40 - INFO - __main__ - Step 2651: {'lr': 4.4000000000000006e-05, 'samples': 84832, 'steps': 165, 'loss/train': 5.081808567047119} -09/20/2021 15:03:41 - INFO - __main__ - Step 2652: {'lr': 4.4000000000000006e-05, 'samples': 84864, 'steps': 165, 'loss/train': 6.213245391845703} -09/20/2021 15:03:42 - INFO - __main__ - Step 2653: {'lr': 4.4000000000000006e-05, 'samples': 84896, 'steps': 165, 'loss/train': 6.563084125518799} -09/20/2021 15:03:43 - INFO - __main__ - Step 2654: {'lr': 4.4000000000000006e-05, 'samples': 84928, 'steps': 165, 'loss/train': 6.756069660186768} -09/20/2021 15:03:43 - INFO - __main__ - Step 2655: {'lr': 4.4000000000000006e-05, 'samples': 84960, 'steps': 165, 'loss/train': 5.835290431976318} -09/20/2021 15:03:44 - INFO - __main__ - Step 2656: {'lr': 4.4000000000000006e-05, 'samples': 84992, 'steps': 165, 'loss/train': 6.03394079208374} -09/20/2021 15:03:45 - INFO - __main__ - Step 2657: {'lr': 4.426666666666667e-05, 'samples': 85024, 'steps': 166, 'loss/train': 6.610917091369629} -09/20/2021 15:03:46 - INFO - __main__ - Step 2658: {'lr': 4.426666666666667e-05, 'samples': 85056, 'steps': 166, 'loss/train': 5.711658477783203} -09/20/2021 15:03:47 - INFO - __main__ - Step 2659: {'lr': 4.426666666666667e-05, 'samples': 85088, 'steps': 166, 'loss/train': 5.710326194763184} -09/20/2021 15:03:47 - INFO - __main__ - Step 2660: {'lr': 4.426666666666667e-05, 'samples': 85120, 'steps': 166, 'loss/train': 8.940583229064941} -09/20/2021 15:03:48 - INFO - __main__ - Step 2661: {'lr': 4.426666666666667e-05, 'samples': 85152, 'steps': 166, 'loss/train': 6.043191909790039} -09/20/2021 15:03:49 - INFO - __main__ - Step 2662: {'lr': 4.426666666666667e-05, 'samples': 85184, 'steps': 166, 'loss/train': 6.104350566864014} -09/20/2021 15:03:50 - INFO - __main__ - Step 2663: {'lr': 4.426666666666667e-05, 'samples': 85216, 'steps': 166, 'loss/train': 5.734332084655762} -09/20/2021 15:03:50 - INFO - __main__ - Step 2664: {'lr': 4.426666666666667e-05, 'samples': 85248, 'steps': 166, 'loss/train': 5.903233528137207} -09/20/2021 15:03:51 - INFO - __main__ - Step 2665: {'lr': 4.426666666666667e-05, 'samples': 85280, 'steps': 166, 'loss/train': 4.195363998413086} -09/20/2021 15:03:52 - INFO - __main__ - Step 2666: {'lr': 4.426666666666667e-05, 'samples': 85312, 'steps': 166, 'loss/train': 6.077828884124756} -09/20/2021 15:03:53 - INFO - __main__ - Step 2667: {'lr': 4.426666666666667e-05, 'samples': 85344, 'steps': 166, 'loss/train': 6.400421619415283} -09/20/2021 15:03:53 - INFO - __main__ - Step 2668: {'lr': 4.426666666666667e-05, 'samples': 85376, 'steps': 166, 'loss/train': 6.0994462966918945} -09/20/2021 15:03:54 - INFO - __main__ - Step 2669: {'lr': 4.426666666666667e-05, 'samples': 85408, 'steps': 166, 'loss/train': 5.883744239807129} -09/20/2021 15:03:55 - INFO - __main__ - Step 2670: {'lr': 4.426666666666667e-05, 'samples': 85440, 'steps': 166, 'loss/train': 5.416818141937256} -09/20/2021 15:03:56 - INFO - __main__ - Step 2671: {'lr': 4.426666666666667e-05, 'samples': 85472, 'steps': 166, 'loss/train': 4.696366310119629} -09/20/2021 15:03:56 - INFO - __main__ - Step 2672: {'lr': 4.426666666666667e-05, 'samples': 85504, 'steps': 166, 'loss/train': 6.03773307800293} -09/20/2021 15:03:58 - INFO - __main__ - Step 2673: {'lr': 4.4533333333333336e-05, 'samples': 85536, 'steps': 167, 'loss/train': 6.193160057067871} -09/20/2021 15:03:59 - INFO - __main__ - Step 2674: {'lr': 4.4533333333333336e-05, 'samples': 85568, 'steps': 167, 'loss/train': 6.103191375732422} -09/20/2021 15:03:59 - INFO - __main__ - Step 2675: {'lr': 4.4533333333333336e-05, 'samples': 85600, 'steps': 167, 'loss/train': 5.554469108581543} -09/20/2021 15:04:00 - INFO - __main__ - Step 2676: {'lr': 4.4533333333333336e-05, 'samples': 85632, 'steps': 167, 'loss/train': 5.467002868652344} -09/20/2021 15:04:01 - INFO - __main__ - Step 2677: {'lr': 4.4533333333333336e-05, 'samples': 85664, 'steps': 167, 'loss/train': 5.721968173980713} -09/20/2021 15:04:02 - INFO - __main__ - Step 2678: {'lr': 4.4533333333333336e-05, 'samples': 85696, 'steps': 167, 'loss/train': 6.192720890045166} -09/20/2021 15:04:02 - INFO - __main__ - Step 2679: {'lr': 4.4533333333333336e-05, 'samples': 85728, 'steps': 167, 'loss/train': 5.9405598640441895} -09/20/2021 15:04:03 - INFO - __main__ - Step 2680: {'lr': 4.4533333333333336e-05, 'samples': 85760, 'steps': 167, 'loss/train': 6.226830005645752} -09/20/2021 15:04:04 - INFO - __main__ - Step 2681: {'lr': 4.4533333333333336e-05, 'samples': 85792, 'steps': 167, 'loss/train': 5.422060966491699} -09/20/2021 15:04:05 - INFO - __main__ - Step 2682: {'lr': 4.4533333333333336e-05, 'samples': 85824, 'steps': 167, 'loss/train': 6.130623817443848} -09/20/2021 15:04:05 - INFO - __main__ - Step 2683: {'lr': 4.4533333333333336e-05, 'samples': 85856, 'steps': 167, 'loss/train': 5.728705406188965} -09/20/2021 15:04:06 - INFO - __main__ - Step 2684: {'lr': 4.4533333333333336e-05, 'samples': 85888, 'steps': 167, 'loss/train': 5.965126037597656} -09/20/2021 15:04:07 - INFO - __main__ - Step 2685: {'lr': 4.4533333333333336e-05, 'samples': 85920, 'steps': 167, 'loss/train': 5.787815570831299} -09/20/2021 15:04:08 - INFO - __main__ - Step 2686: {'lr': 4.4533333333333336e-05, 'samples': 85952, 'steps': 167, 'loss/train': 5.5031514167785645} -09/20/2021 15:04:08 - INFO - __main__ - Step 2687: {'lr': 4.4533333333333336e-05, 'samples': 85984, 'steps': 167, 'loss/train': 6.501001358032227} -09/20/2021 15:04:09 - INFO - __main__ - Step 2688: {'lr': 4.4533333333333336e-05, 'samples': 86016, 'steps': 167, 'loss/train': 6.456551551818848} -09/20/2021 15:04:10 - INFO - __main__ - Step 2689: {'lr': 4.4800000000000005e-05, 'samples': 86048, 'steps': 168, 'loss/train': 4.430202960968018} -09/20/2021 15:04:11 - INFO - __main__ - Step 2690: {'lr': 4.4800000000000005e-05, 'samples': 86080, 'steps': 168, 'loss/train': 5.466331481933594} -09/20/2021 15:04:12 - INFO - __main__ - Step 2691: {'lr': 4.4800000000000005e-05, 'samples': 86112, 'steps': 168, 'loss/train': 4.6244683265686035} -09/20/2021 15:04:12 - INFO - __main__ - Step 2692: {'lr': 4.4800000000000005e-05, 'samples': 86144, 'steps': 168, 'loss/train': 5.520321846008301} -09/20/2021 15:04:13 - INFO - __main__ - Step 2693: {'lr': 4.4800000000000005e-05, 'samples': 86176, 'steps': 168, 'loss/train': 5.295507907867432} -09/20/2021 15:04:14 - INFO - __main__ - Step 2694: {'lr': 4.4800000000000005e-05, 'samples': 86208, 'steps': 168, 'loss/train': 5.870983600616455} -09/20/2021 15:04:15 - INFO - __main__ - Step 2695: {'lr': 4.4800000000000005e-05, 'samples': 86240, 'steps': 168, 'loss/train': 3.6184685230255127} -09/20/2021 15:04:15 - INFO - __main__ - Step 2696: {'lr': 4.4800000000000005e-05, 'samples': 86272, 'steps': 168, 'loss/train': 5.496644020080566} -09/20/2021 15:04:16 - INFO - __main__ - Step 2697: {'lr': 4.4800000000000005e-05, 'samples': 86304, 'steps': 168, 'loss/train': 6.143137454986572} -09/20/2021 15:04:17 - INFO - __main__ - Step 2698: {'lr': 4.4800000000000005e-05, 'samples': 86336, 'steps': 168, 'loss/train': 6.548900127410889} -09/20/2021 15:04:18 - INFO - __main__ - Step 2699: {'lr': 4.4800000000000005e-05, 'samples': 86368, 'steps': 168, 'loss/train': 5.866508483886719} -09/20/2021 15:04:18 - INFO - __main__ - Step 2700: {'lr': 4.4800000000000005e-05, 'samples': 86400, 'steps': 168, 'loss/train': 5.911900997161865} -09/20/2021 15:04:19 - INFO - __main__ - Step 2701: {'lr': 4.4800000000000005e-05, 'samples': 86432, 'steps': 168, 'loss/train': 6.242246627807617} -09/20/2021 15:04:20 - INFO - __main__ - Step 2702: {'lr': 4.4800000000000005e-05, 'samples': 86464, 'steps': 168, 'loss/train': 6.73186731338501} -09/20/2021 15:04:21 - INFO - __main__ - Step 2703: {'lr': 4.4800000000000005e-05, 'samples': 86496, 'steps': 168, 'loss/train': 5.415243148803711} -09/20/2021 15:04:22 - INFO - __main__ - Step 2704: {'lr': 4.4800000000000005e-05, 'samples': 86528, 'steps': 168, 'loss/train': 6.017303943634033} -09/20/2021 15:04:23 - INFO - __main__ - Step 2705: {'lr': 4.5066666666666667e-05, 'samples': 86560, 'steps': 169, 'loss/train': 6.82559061050415} -09/20/2021 15:04:24 - INFO - __main__ - Step 2706: {'lr': 4.5066666666666667e-05, 'samples': 86592, 'steps': 169, 'loss/train': 6.061911106109619} -09/20/2021 15:04:24 - INFO - __main__ - Step 2707: {'lr': 4.5066666666666667e-05, 'samples': 86624, 'steps': 169, 'loss/train': 5.500299453735352} -09/20/2021 15:04:25 - INFO - __main__ - Step 2708: {'lr': 4.5066666666666667e-05, 'samples': 86656, 'steps': 169, 'loss/train': 5.929204940795898} -09/20/2021 15:04:26 - INFO - __main__ - Step 2709: {'lr': 4.5066666666666667e-05, 'samples': 86688, 'steps': 169, 'loss/train': 5.9855427742004395} -09/20/2021 15:04:27 - INFO - __main__ - Step 2710: {'lr': 4.5066666666666667e-05, 'samples': 86720, 'steps': 169, 'loss/train': 5.834914684295654} -09/20/2021 15:04:27 - INFO - __main__ - Step 2711: {'lr': 4.5066666666666667e-05, 'samples': 86752, 'steps': 169, 'loss/train': 5.955563068389893} -09/20/2021 15:04:28 - INFO - __main__ - Step 2712: {'lr': 4.5066666666666667e-05, 'samples': 86784, 'steps': 169, 'loss/train': 5.668453693389893} -09/20/2021 15:04:29 - INFO - __main__ - Step 2713: {'lr': 4.5066666666666667e-05, 'samples': 86816, 'steps': 169, 'loss/train': 5.949316024780273} -09/20/2021 15:04:30 - INFO - __main__ - Step 2714: {'lr': 4.5066666666666667e-05, 'samples': 86848, 'steps': 169, 'loss/train': 5.911174774169922} -09/20/2021 15:04:30 - INFO - __main__ - Step 2715: {'lr': 4.5066666666666667e-05, 'samples': 86880, 'steps': 169, 'loss/train': 7.367857933044434} -09/20/2021 15:04:31 - INFO - __main__ - Step 2716: {'lr': 4.5066666666666667e-05, 'samples': 86912, 'steps': 169, 'loss/train': 6.342865943908691} -09/20/2021 15:04:32 - INFO - __main__ - Step 2717: {'lr': 4.5066666666666667e-05, 'samples': 86944, 'steps': 169, 'loss/train': 6.344953536987305} -09/20/2021 15:04:33 - INFO - __main__ - Step 2718: {'lr': 4.5066666666666667e-05, 'samples': 86976, 'steps': 169, 'loss/train': 5.862834930419922} -09/20/2021 15:04:33 - INFO - __main__ - Step 2719: {'lr': 4.5066666666666667e-05, 'samples': 87008, 'steps': 169, 'loss/train': 5.5154571533203125} -09/20/2021 15:04:34 - INFO - __main__ - Step 2720: {'lr': 4.5066666666666667e-05, 'samples': 87040, 'steps': 169, 'loss/train': 7.541612148284912} -09/20/2021 15:04:35 - INFO - __main__ - Step 2721: {'lr': 4.5333333333333335e-05, 'samples': 87072, 'steps': 170, 'loss/train': 6.202362060546875} -09/20/2021 15:04:36 - INFO - __main__ - Step 2722: {'lr': 4.5333333333333335e-05, 'samples': 87104, 'steps': 170, 'loss/train': 5.73436164855957} -09/20/2021 15:04:36 - INFO - __main__ - Step 2723: {'lr': 4.5333333333333335e-05, 'samples': 87136, 'steps': 170, 'loss/train': 5.267917156219482} -09/20/2021 15:04:37 - INFO - __main__ - Step 2724: {'lr': 4.5333333333333335e-05, 'samples': 87168, 'steps': 170, 'loss/train': 5.609590530395508} -09/20/2021 15:04:38 - INFO - __main__ - Step 2725: {'lr': 4.5333333333333335e-05, 'samples': 87200, 'steps': 170, 'loss/train': 6.140828609466553} -09/20/2021 15:04:39 - INFO - __main__ - Step 2726: {'lr': 4.5333333333333335e-05, 'samples': 87232, 'steps': 170, 'loss/train': 6.452967166900635} -09/20/2021 15:04:39 - INFO - __main__ - Step 2727: {'lr': 4.5333333333333335e-05, 'samples': 87264, 'steps': 170, 'loss/train': 5.426800727844238} -09/20/2021 15:04:40 - INFO - __main__ - Step 2728: {'lr': 4.5333333333333335e-05, 'samples': 87296, 'steps': 170, 'loss/train': 6.553935527801514} -09/20/2021 15:04:41 - INFO - __main__ - Step 2729: {'lr': 4.5333333333333335e-05, 'samples': 87328, 'steps': 170, 'loss/train': 6.058254718780518} -09/20/2021 15:04:42 - INFO - __main__ - Step 2730: {'lr': 4.5333333333333335e-05, 'samples': 87360, 'steps': 170, 'loss/train': 5.862202167510986} -09/20/2021 15:04:42 - INFO - __main__ - Step 2731: {'lr': 4.5333333333333335e-05, 'samples': 87392, 'steps': 170, 'loss/train': 5.450389862060547} -09/20/2021 15:04:43 - INFO - __main__ - Step 2732: {'lr': 4.5333333333333335e-05, 'samples': 87424, 'steps': 170, 'loss/train': 6.296876907348633} -09/20/2021 15:04:44 - INFO - __main__ - Step 2733: {'lr': 4.5333333333333335e-05, 'samples': 87456, 'steps': 170, 'loss/train': 4.876692771911621} -09/20/2021 15:04:45 - INFO - __main__ - Step 2734: {'lr': 4.5333333333333335e-05, 'samples': 87488, 'steps': 170, 'loss/train': 1.1899096965789795} -09/20/2021 15:04:46 - INFO - __main__ - Step 2735: {'lr': 4.5333333333333335e-05, 'samples': 87520, 'steps': 170, 'loss/train': 7.236367225646973} -09/20/2021 15:04:47 - INFO - __main__ - Step 2736: {'lr': 4.5333333333333335e-05, 'samples': 87552, 'steps': 170, 'loss/train': 5.459300994873047} -09/20/2021 15:04:48 - INFO - __main__ - Step 2737: {'lr': 4.5600000000000004e-05, 'samples': 87584, 'steps': 171, 'loss/train': 7.0817389488220215} -09/20/2021 15:04:48 - INFO - __main__ - Step 2738: {'lr': 4.5600000000000004e-05, 'samples': 87616, 'steps': 171, 'loss/train': 6.165060520172119} -09/20/2021 15:04:49 - INFO - __main__ - Step 2739: {'lr': 4.5600000000000004e-05, 'samples': 87648, 'steps': 171, 'loss/train': 7.03971529006958} -09/20/2021 15:04:50 - INFO - __main__ - Step 2740: {'lr': 4.5600000000000004e-05, 'samples': 87680, 'steps': 171, 'loss/train': 6.3894758224487305} -09/20/2021 15:04:51 - INFO - __main__ - Step 2741: {'lr': 4.5600000000000004e-05, 'samples': 87712, 'steps': 171, 'loss/train': 5.467348575592041} -09/20/2021 15:04:51 - INFO - __main__ - Step 2742: {'lr': 4.5600000000000004e-05, 'samples': 87744, 'steps': 171, 'loss/train': 6.591375827789307} -09/20/2021 15:04:52 - INFO - __main__ - Step 2743: {'lr': 4.5600000000000004e-05, 'samples': 87776, 'steps': 171, 'loss/train': 6.320373058319092} -09/20/2021 15:04:53 - INFO - __main__ - Step 2744: {'lr': 4.5600000000000004e-05, 'samples': 87808, 'steps': 171, 'loss/train': 5.469454765319824} -09/20/2021 15:04:54 - INFO - __main__ - Step 2745: {'lr': 4.5600000000000004e-05, 'samples': 87840, 'steps': 171, 'loss/train': 6.259981632232666} -09/20/2021 15:04:54 - INFO - __main__ - Step 2746: {'lr': 4.5600000000000004e-05, 'samples': 87872, 'steps': 171, 'loss/train': 5.458749294281006} -09/20/2021 15:04:55 - INFO - __main__ - Step 2747: {'lr': 4.5600000000000004e-05, 'samples': 87904, 'steps': 171, 'loss/train': 5.3827900886535645} -09/20/2021 15:04:56 - INFO - __main__ - Step 2748: {'lr': 4.5600000000000004e-05, 'samples': 87936, 'steps': 171, 'loss/train': 5.498313903808594} -09/20/2021 15:04:57 - INFO - __main__ - Step 2749: {'lr': 4.5600000000000004e-05, 'samples': 87968, 'steps': 171, 'loss/train': 5.1130194664001465} -09/20/2021 15:04:57 - INFO - __main__ - Step 2750: {'lr': 4.5600000000000004e-05, 'samples': 88000, 'steps': 171, 'loss/train': 5.4325714111328125} -09/20/2021 15:04:58 - INFO - __main__ - Step 2751: {'lr': 4.5600000000000004e-05, 'samples': 88032, 'steps': 171, 'loss/train': 5.764361381530762} -09/20/2021 15:04:59 - INFO - __main__ - Step 2752: {'lr': 4.5600000000000004e-05, 'samples': 88064, 'steps': 171, 'loss/train': 6.178882598876953} -09/20/2021 15:05:00 - INFO - __main__ - Step 2753: {'lr': 4.5866666666666666e-05, 'samples': 88096, 'steps': 172, 'loss/train': 3.375703811645508} -09/20/2021 15:05:00 - INFO - __main__ - Step 2754: {'lr': 4.5866666666666666e-05, 'samples': 88128, 'steps': 172, 'loss/train': 6.550299167633057} -09/20/2021 15:05:01 - INFO - __main__ - Step 2755: {'lr': 4.5866666666666666e-05, 'samples': 88160, 'steps': 172, 'loss/train': 5.400622367858887} -09/20/2021 15:05:02 - INFO - __main__ - Step 2756: {'lr': 4.5866666666666666e-05, 'samples': 88192, 'steps': 172, 'loss/train': 5.50462007522583} -09/20/2021 15:05:03 - INFO - __main__ - Step 2757: {'lr': 4.5866666666666666e-05, 'samples': 88224, 'steps': 172, 'loss/train': 5.233240127563477} -09/20/2021 15:05:03 - INFO - __main__ - Step 2758: {'lr': 4.5866666666666666e-05, 'samples': 88256, 'steps': 172, 'loss/train': 6.684303283691406} -09/20/2021 15:05:04 - INFO - __main__ - Step 2759: {'lr': 4.5866666666666666e-05, 'samples': 88288, 'steps': 172, 'loss/train': 5.662454605102539} -09/20/2021 15:05:05 - INFO - __main__ - Step 2760: {'lr': 4.5866666666666666e-05, 'samples': 88320, 'steps': 172, 'loss/train': 6.418270111083984} -09/20/2021 15:05:06 - INFO - __main__ - Step 2761: {'lr': 4.5866666666666666e-05, 'samples': 88352, 'steps': 172, 'loss/train': 6.1330389976501465} -09/20/2021 15:05:06 - INFO - __main__ - Step 2762: {'lr': 4.5866666666666666e-05, 'samples': 88384, 'steps': 172, 'loss/train': 5.698133945465088} -09/20/2021 15:05:07 - INFO - __main__ - Step 2763: {'lr': 4.5866666666666666e-05, 'samples': 88416, 'steps': 172, 'loss/train': 5.95339822769165} -09/20/2021 15:05:09 - INFO - __main__ - Step 2764: {'lr': 4.5866666666666666e-05, 'samples': 88448, 'steps': 172, 'loss/train': 6.499260425567627} -09/20/2021 15:05:09 - INFO - __main__ - Step 2765: {'lr': 4.5866666666666666e-05, 'samples': 88480, 'steps': 172, 'loss/train': 5.961517333984375} -09/20/2021 15:05:10 - INFO - __main__ - Step 2766: {'lr': 4.5866666666666666e-05, 'samples': 88512, 'steps': 172, 'loss/train': 5.659806251525879} -09/20/2021 15:05:11 - INFO - __main__ - Step 2767: {'lr': 4.5866666666666666e-05, 'samples': 88544, 'steps': 172, 'loss/train': 5.614408493041992} -09/20/2021 15:05:12 - INFO - __main__ - Step 2768: {'lr': 4.5866666666666666e-05, 'samples': 88576, 'steps': 172, 'loss/train': 5.809414863586426} -09/20/2021 15:05:12 - INFO - __main__ - Step 2769: {'lr': 4.6133333333333334e-05, 'samples': 88608, 'steps': 173, 'loss/train': 5.604325294494629} -09/20/2021 15:05:13 - INFO - __main__ - Step 2770: {'lr': 4.6133333333333334e-05, 'samples': 88640, 'steps': 173, 'loss/train': 6.115484714508057} -09/20/2021 15:05:14 - INFO - __main__ - Step 2771: {'lr': 4.6133333333333334e-05, 'samples': 88672, 'steps': 173, 'loss/train': 6.4027581214904785} -09/20/2021 15:05:15 - INFO - __main__ - Step 2772: {'lr': 4.6133333333333334e-05, 'samples': 88704, 'steps': 173, 'loss/train': 6.212957382202148} -09/20/2021 15:05:15 - INFO - __main__ - Step 2773: {'lr': 4.6133333333333334e-05, 'samples': 88736, 'steps': 173, 'loss/train': 5.117983818054199} -09/20/2021 15:05:16 - INFO - __main__ - Step 2774: {'lr': 4.6133333333333334e-05, 'samples': 88768, 'steps': 173, 'loss/train': 5.695807456970215} -09/20/2021 15:05:17 - INFO - __main__ - Step 2775: {'lr': 4.6133333333333334e-05, 'samples': 88800, 'steps': 173, 'loss/train': 6.236452102661133} -09/20/2021 15:05:18 - INFO - __main__ - Step 2776: {'lr': 4.6133333333333334e-05, 'samples': 88832, 'steps': 173, 'loss/train': 5.9874467849731445} -09/20/2021 15:05:18 - INFO - __main__ - Step 2777: {'lr': 4.6133333333333334e-05, 'samples': 88864, 'steps': 173, 'loss/train': 6.334357738494873} -09/20/2021 15:05:19 - INFO - __main__ - Step 2778: {'lr': 4.6133333333333334e-05, 'samples': 88896, 'steps': 173, 'loss/train': 5.870070934295654} -09/20/2021 15:05:20 - INFO - __main__ - Step 2779: {'lr': 4.6133333333333334e-05, 'samples': 88928, 'steps': 173, 'loss/train': 6.748870372772217} -09/20/2021 15:05:21 - INFO - __main__ - Step 2780: {'lr': 4.6133333333333334e-05, 'samples': 88960, 'steps': 173, 'loss/train': 5.661139011383057} -09/20/2021 15:05:21 - INFO - __main__ - Step 2781: {'lr': 4.6133333333333334e-05, 'samples': 88992, 'steps': 173, 'loss/train': 4.9138407707214355} -09/20/2021 15:05:22 - INFO - __main__ - Step 2782: {'lr': 4.6133333333333334e-05, 'samples': 89024, 'steps': 173, 'loss/train': 5.991639137268066} -09/20/2021 15:05:23 - INFO - __main__ - Step 2783: {'lr': 4.6133333333333334e-05, 'samples': 89056, 'steps': 173, 'loss/train': 5.018368244171143} -09/20/2021 15:05:24 - INFO - __main__ - Step 2784: {'lr': 4.6133333333333334e-05, 'samples': 89088, 'steps': 173, 'loss/train': 6.3607048988342285} -09/20/2021 15:05:25 - INFO - __main__ - Step 2785: {'lr': 4.64e-05, 'samples': 89120, 'steps': 174, 'loss/train': 6.0565972328186035} -09/20/2021 15:05:25 - INFO - __main__ - Step 2786: {'lr': 4.64e-05, 'samples': 89152, 'steps': 174, 'loss/train': 6.166740894317627} -09/20/2021 15:05:26 - INFO - __main__ - Step 2787: {'lr': 4.64e-05, 'samples': 89184, 'steps': 174, 'loss/train': 6.758132457733154} -09/20/2021 15:05:27 - INFO - __main__ - Step 2788: {'lr': 4.64e-05, 'samples': 89216, 'steps': 174, 'loss/train': 5.171188831329346} -09/20/2021 15:05:28 - INFO - __main__ - Step 2789: {'lr': 4.64e-05, 'samples': 89248, 'steps': 174, 'loss/train': 6.129892826080322} -09/20/2021 15:05:28 - INFO - __main__ - Step 2790: {'lr': 4.64e-05, 'samples': 89280, 'steps': 174, 'loss/train': 5.32188081741333} -09/20/2021 15:05:29 - INFO - __main__ - Step 2791: {'lr': 4.64e-05, 'samples': 89312, 'steps': 174, 'loss/train': 5.153021812438965} -09/20/2021 15:05:30 - INFO - __main__ - Step 2792: {'lr': 4.64e-05, 'samples': 89344, 'steps': 174, 'loss/train': 6.348729133605957} -09/20/2021 15:05:31 - INFO - __main__ - Step 2793: {'lr': 4.64e-05, 'samples': 89376, 'steps': 174, 'loss/train': 5.835715293884277} -09/20/2021 15:05:32 - INFO - __main__ - Step 2794: {'lr': 4.64e-05, 'samples': 89408, 'steps': 174, 'loss/train': 5.88422966003418} -09/20/2021 15:05:33 - INFO - __main__ - Step 2795: {'lr': 4.64e-05, 'samples': 89440, 'steps': 174, 'loss/train': 5.407137870788574} -09/20/2021 15:05:34 - INFO - __main__ - Step 2796: {'lr': 4.64e-05, 'samples': 89472, 'steps': 174, 'loss/train': 6.610720157623291} -09/20/2021 15:05:34 - INFO - __main__ - Step 2797: {'lr': 4.64e-05, 'samples': 89504, 'steps': 174, 'loss/train': 4.720858573913574} -09/20/2021 15:05:35 - INFO - __main__ - Step 2798: {'lr': 4.64e-05, 'samples': 89536, 'steps': 174, 'loss/train': 6.1742730140686035} -09/20/2021 15:05:36 - INFO - __main__ - Step 2799: {'lr': 4.64e-05, 'samples': 89568, 'steps': 174, 'loss/train': 5.748600959777832} -09/20/2021 15:05:37 - INFO - __main__ - Step 2800: {'lr': 4.64e-05, 'samples': 89600, 'steps': 174, 'loss/train': 6.053680896759033} -09/20/2021 15:05:37 - INFO - __main__ - Step 2801: {'lr': 4.666666666666667e-05, 'samples': 89632, 'steps': 175, 'loss/train': 5.442779541015625} -09/20/2021 15:05:38 - INFO - __main__ - Step 2802: {'lr': 4.666666666666667e-05, 'samples': 89664, 'steps': 175, 'loss/train': 5.875706672668457} -09/20/2021 15:05:39 - INFO - __main__ - Step 2803: {'lr': 4.666666666666667e-05, 'samples': 89696, 'steps': 175, 'loss/train': 6.806637763977051} -09/20/2021 15:05:40 - INFO - __main__ - Step 2804: {'lr': 4.666666666666667e-05, 'samples': 89728, 'steps': 175, 'loss/train': 7.402374744415283} -09/20/2021 15:05:40 - INFO - __main__ - Step 2805: {'lr': 4.666666666666667e-05, 'samples': 89760, 'steps': 175, 'loss/train': 6.696723937988281} -09/20/2021 15:05:41 - INFO - __main__ - Step 2806: {'lr': 4.666666666666667e-05, 'samples': 89792, 'steps': 175, 'loss/train': 5.348050117492676} -09/20/2021 15:05:42 - INFO - __main__ - Step 2807: {'lr': 4.666666666666667e-05, 'samples': 89824, 'steps': 175, 'loss/train': 6.9976677894592285} -09/20/2021 15:05:43 - INFO - __main__ - Step 2808: {'lr': 4.666666666666667e-05, 'samples': 89856, 'steps': 175, 'loss/train': 7.0963263511657715} -09/20/2021 15:05:43 - INFO - __main__ - Step 2809: {'lr': 4.666666666666667e-05, 'samples': 89888, 'steps': 175, 'loss/train': 6.779289722442627} -09/20/2021 15:05:44 - INFO - __main__ - Step 2810: {'lr': 4.666666666666667e-05, 'samples': 89920, 'steps': 175, 'loss/train': 6.44900369644165} -09/20/2021 15:05:45 - INFO - __main__ - Step 2811: {'lr': 4.666666666666667e-05, 'samples': 89952, 'steps': 175, 'loss/train': 6.802170276641846} -09/20/2021 15:05:46 - INFO - __main__ - Step 2812: {'lr': 4.666666666666667e-05, 'samples': 89984, 'steps': 175, 'loss/train': 5.99936580657959} -09/20/2021 15:05:46 - INFO - __main__ - Step 2813: {'lr': 4.666666666666667e-05, 'samples': 90016, 'steps': 175, 'loss/train': 5.99515962600708} -09/20/2021 15:05:47 - INFO - __main__ - Step 2814: {'lr': 4.666666666666667e-05, 'samples': 90048, 'steps': 175, 'loss/train': 5.814268589019775} -09/20/2021 15:05:48 - INFO - __main__ - Step 2815: {'lr': 4.666666666666667e-05, 'samples': 90080, 'steps': 175, 'loss/train': 5.707694053649902} -09/20/2021 15:05:49 - INFO - __main__ - Step 2816: {'lr': 4.666666666666667e-05, 'samples': 90112, 'steps': 175, 'loss/train': 6.127281665802002} -09/20/2021 15:05:50 - INFO - __main__ - Step 2817: {'lr': 4.6933333333333333e-05, 'samples': 90144, 'steps': 176, 'loss/train': 5.968621253967285} -09/20/2021 15:05:50 - INFO - __main__ - Step 2818: {'lr': 4.6933333333333333e-05, 'samples': 90176, 'steps': 176, 'loss/train': 6.3730058670043945} -09/20/2021 15:05:51 - INFO - __main__ - Step 2819: {'lr': 4.6933333333333333e-05, 'samples': 90208, 'steps': 176, 'loss/train': 5.892547607421875} -09/20/2021 15:05:52 - INFO - __main__ - Step 2820: {'lr': 4.6933333333333333e-05, 'samples': 90240, 'steps': 176, 'loss/train': 5.579571723937988} -09/20/2021 15:05:53 - INFO - __main__ - Step 2821: {'lr': 4.6933333333333333e-05, 'samples': 90272, 'steps': 176, 'loss/train': 5.663902282714844} -09/20/2021 15:05:53 - INFO - __main__ - Step 2822: {'lr': 4.6933333333333333e-05, 'samples': 90304, 'steps': 176, 'loss/train': 7.024765968322754} -09/20/2021 15:05:54 - INFO - __main__ - Step 2823: {'lr': 4.6933333333333333e-05, 'samples': 90336, 'steps': 176, 'loss/train': 5.851842403411865} -09/20/2021 15:05:55 - INFO - __main__ - Step 2824: {'lr': 4.6933333333333333e-05, 'samples': 90368, 'steps': 176, 'loss/train': 7.17542839050293} -09/20/2021 15:05:56 - INFO - __main__ - Step 2825: {'lr': 4.6933333333333333e-05, 'samples': 90400, 'steps': 176, 'loss/train': 7.851382732391357} -09/20/2021 15:05:57 - INFO - __main__ - Step 2826: {'lr': 4.6933333333333333e-05, 'samples': 90432, 'steps': 176, 'loss/train': 5.174217700958252} -09/20/2021 15:05:58 - INFO - __main__ - Step 2827: {'lr': 4.6933333333333333e-05, 'samples': 90464, 'steps': 176, 'loss/train': 5.019989967346191} -09/20/2021 15:05:59 - INFO - __main__ - Step 2828: {'lr': 4.6933333333333333e-05, 'samples': 90496, 'steps': 176, 'loss/train': 4.252453327178955} -09/20/2021 15:05:59 - INFO - __main__ - Step 2829: {'lr': 4.6933333333333333e-05, 'samples': 90528, 'steps': 176, 'loss/train': 4.237749099731445} -09/20/2021 15:06:00 - INFO - __main__ - Step 2830: {'lr': 4.6933333333333333e-05, 'samples': 90560, 'steps': 176, 'loss/train': 5.231051445007324} -09/20/2021 15:06:01 - INFO - __main__ - Step 2831: {'lr': 4.6933333333333333e-05, 'samples': 90592, 'steps': 176, 'loss/train': 6.032166481018066} -09/20/2021 15:06:02 - INFO - __main__ - Step 2832: {'lr': 4.6933333333333333e-05, 'samples': 90624, 'steps': 176, 'loss/train': 5.787530899047852} -09/20/2021 15:06:02 - INFO - __main__ - Step 2833: {'lr': 4.72e-05, 'samples': 90656, 'steps': 177, 'loss/train': 5.127337455749512} -09/20/2021 15:06:03 - INFO - __main__ - Step 2834: {'lr': 4.72e-05, 'samples': 90688, 'steps': 177, 'loss/train': 6.584522247314453} -09/20/2021 15:06:04 - INFO - __main__ - Step 2835: {'lr': 4.72e-05, 'samples': 90720, 'steps': 177, 'loss/train': 5.728933811187744} -09/20/2021 15:06:05 - INFO - __main__ - Step 2836: {'lr': 4.72e-05, 'samples': 90752, 'steps': 177, 'loss/train': 4.7812299728393555} -09/20/2021 15:06:05 - INFO - __main__ - Step 2837: {'lr': 4.72e-05, 'samples': 90784, 'steps': 177, 'loss/train': 6.5281081199646} -09/20/2021 15:06:06 - INFO - __main__ - Step 2838: {'lr': 4.72e-05, 'samples': 90816, 'steps': 177, 'loss/train': 6.403400421142578} -09/20/2021 15:06:07 - INFO - __main__ - Step 2839: {'lr': 4.72e-05, 'samples': 90848, 'steps': 177, 'loss/train': 5.5522780418396} -09/20/2021 15:06:08 - INFO - __main__ - Step 2840: {'lr': 4.72e-05, 'samples': 90880, 'steps': 177, 'loss/train': 5.476378440856934} -09/20/2021 15:06:08 - INFO - __main__ - Step 2841: {'lr': 4.72e-05, 'samples': 90912, 'steps': 177, 'loss/train': 6.4725141525268555} -09/20/2021 15:06:09 - INFO - __main__ - Step 2842: {'lr': 4.72e-05, 'samples': 90944, 'steps': 177, 'loss/train': 6.763460159301758} -09/20/2021 15:06:10 - INFO - __main__ - Step 2843: {'lr': 4.72e-05, 'samples': 90976, 'steps': 177, 'loss/train': 6.849384307861328} -09/20/2021 15:06:11 - INFO - __main__ - Step 2844: {'lr': 4.72e-05, 'samples': 91008, 'steps': 177, 'loss/train': 6.946477890014648} -09/20/2021 15:06:11 - INFO - __main__ - Step 2845: {'lr': 4.72e-05, 'samples': 91040, 'steps': 177, 'loss/train': 6.431899070739746} -09/20/2021 15:06:12 - INFO - __main__ - Step 2846: {'lr': 4.72e-05, 'samples': 91072, 'steps': 177, 'loss/train': 6.31098747253418} -09/20/2021 15:06:13 - INFO - __main__ - Step 2847: {'lr': 4.72e-05, 'samples': 91104, 'steps': 177, 'loss/train': 5.219291687011719} -09/20/2021 15:06:14 - INFO - __main__ - Step 2848: {'lr': 4.72e-05, 'samples': 91136, 'steps': 177, 'loss/train': 5.875304698944092} -09/20/2021 15:06:15 - INFO - __main__ - Step 2849: {'lr': 4.746666666666667e-05, 'samples': 91168, 'steps': 178, 'loss/train': 6.270319938659668} -09/20/2021 15:06:15 - INFO - __main__ - Step 2850: {'lr': 4.746666666666667e-05, 'samples': 91200, 'steps': 178, 'loss/train': 5.953029155731201} -09/20/2021 15:06:16 - INFO - __main__ - Step 2851: {'lr': 4.746666666666667e-05, 'samples': 91232, 'steps': 178, 'loss/train': 6.173214435577393} -09/20/2021 15:06:17 - INFO - __main__ - Step 2852: {'lr': 4.746666666666667e-05, 'samples': 91264, 'steps': 178, 'loss/train': 6.970661163330078} -09/20/2021 15:06:18 - INFO - __main__ - Step 2853: {'lr': 4.746666666666667e-05, 'samples': 91296, 'steps': 178, 'loss/train': 5.699576377868652} -09/20/2021 15:06:18 - INFO - __main__ - Step 2854: {'lr': 4.746666666666667e-05, 'samples': 91328, 'steps': 178, 'loss/train': 6.246718883514404} -09/20/2021 15:06:19 - INFO - __main__ - Step 2855: {'lr': 4.746666666666667e-05, 'samples': 91360, 'steps': 178, 'loss/train': 5.601895809173584} -09/20/2021 15:06:21 - INFO - __main__ - Step 2856: {'lr': 4.746666666666667e-05, 'samples': 91392, 'steps': 178, 'loss/train': 5.251691818237305} -09/20/2021 15:06:21 - INFO - __main__ - Step 2857: {'lr': 4.746666666666667e-05, 'samples': 91424, 'steps': 178, 'loss/train': 5.773843288421631} -09/20/2021 15:06:22 - INFO - __main__ - Step 2858: {'lr': 4.746666666666667e-05, 'samples': 91456, 'steps': 178, 'loss/train': 6.0099921226501465} -09/20/2021 15:06:23 - INFO - __main__ - Step 2859: {'lr': 4.746666666666667e-05, 'samples': 91488, 'steps': 178, 'loss/train': 5.340570449829102} -09/20/2021 15:06:24 - INFO - __main__ - Step 2860: {'lr': 4.746666666666667e-05, 'samples': 91520, 'steps': 178, 'loss/train': 5.3582587242126465} -09/20/2021 15:06:24 - INFO - __main__ - Step 2861: {'lr': 4.746666666666667e-05, 'samples': 91552, 'steps': 178, 'loss/train': 5.508859157562256} -09/20/2021 15:06:25 - INFO - __main__ - Step 2862: {'lr': 4.746666666666667e-05, 'samples': 91584, 'steps': 178, 'loss/train': 5.974771499633789} -09/20/2021 15:06:26 - INFO - __main__ - Step 2863: {'lr': 4.746666666666667e-05, 'samples': 91616, 'steps': 178, 'loss/train': 10.301634788513184} -09/20/2021 15:06:27 - INFO - __main__ - Step 2864: {'lr': 4.746666666666667e-05, 'samples': 91648, 'steps': 178, 'loss/train': 10.332151412963867} -09/20/2021 15:06:28 - INFO - __main__ - Step 2865: {'lr': 4.773333333333333e-05, 'samples': 91680, 'steps': 179, 'loss/train': 9.6670503616333} -09/20/2021 15:06:28 - INFO - __main__ - Step 2866: {'lr': 4.773333333333333e-05, 'samples': 91712, 'steps': 179, 'loss/train': 9.630072593688965} -09/20/2021 15:06:29 - INFO - __main__ - Step 2867: {'lr': 4.773333333333333e-05, 'samples': 91744, 'steps': 179, 'loss/train': 9.677740097045898} -09/20/2021 15:06:30 - INFO - __main__ - Step 2868: {'lr': 4.773333333333333e-05, 'samples': 91776, 'steps': 179, 'loss/train': 10.081344604492188} -09/20/2021 15:06:31 - INFO - __main__ - Step 2869: {'lr': 4.773333333333333e-05, 'samples': 91808, 'steps': 179, 'loss/train': 9.796602249145508} -09/20/2021 15:06:31 - INFO - __main__ - Step 2870: {'lr': 4.773333333333333e-05, 'samples': 91840, 'steps': 179, 'loss/train': 5.268296241760254} -09/20/2021 15:06:32 - INFO - __main__ - Step 2871: {'lr': 4.773333333333333e-05, 'samples': 91872, 'steps': 179, 'loss/train': 7.306575775146484} -09/20/2021 15:06:33 - INFO - __main__ - Step 2872: {'lr': 4.773333333333333e-05, 'samples': 91904, 'steps': 179, 'loss/train': 5.68529748916626} -09/20/2021 15:06:34 - INFO - __main__ - Step 2873: {'lr': 4.773333333333333e-05, 'samples': 91936, 'steps': 179, 'loss/train': 6.068352699279785} -09/20/2021 15:06:34 - INFO - __main__ - Step 2874: {'lr': 4.773333333333333e-05, 'samples': 91968, 'steps': 179, 'loss/train': 5.159449100494385} -09/20/2021 15:06:35 - INFO - __main__ - Step 2875: {'lr': 4.773333333333333e-05, 'samples': 92000, 'steps': 179, 'loss/train': 7.11942720413208} -09/20/2021 15:06:36 - INFO - __main__ - Step 2876: {'lr': 4.773333333333333e-05, 'samples': 92032, 'steps': 179, 'loss/train': 7.023151397705078} -09/20/2021 15:06:37 - INFO - __main__ - Step 2877: {'lr': 4.773333333333333e-05, 'samples': 92064, 'steps': 179, 'loss/train': 5.944748401641846} -09/20/2021 15:06:37 - INFO - __main__ - Step 2878: {'lr': 4.773333333333333e-05, 'samples': 92096, 'steps': 179, 'loss/train': 5.661788463592529} -09/20/2021 15:06:38 - INFO - __main__ - Step 2879: {'lr': 4.773333333333333e-05, 'samples': 92128, 'steps': 179, 'loss/train': 6.040464878082275} -09/20/2021 15:06:39 - INFO - __main__ - Step 2880: {'lr': 4.773333333333333e-05, 'samples': 92160, 'steps': 179, 'loss/train': 5.8114824295043945} -09/20/2021 15:06:40 - INFO - __main__ - Step 2881: {'lr': 4.8e-05, 'samples': 92192, 'steps': 180, 'loss/train': 6.123759746551514} -09/20/2021 15:06:40 - INFO - __main__ - Step 2882: {'lr': 4.8e-05, 'samples': 92224, 'steps': 180, 'loss/train': 6.088200569152832} -09/20/2021 15:06:41 - INFO - __main__ - Step 2883: {'lr': 4.8e-05, 'samples': 92256, 'steps': 180, 'loss/train': 6.740952014923096} -09/20/2021 15:06:42 - INFO - __main__ - Step 2884: {'lr': 4.8e-05, 'samples': 92288, 'steps': 180, 'loss/train': 6.698484420776367} -09/20/2021 15:06:43 - INFO - __main__ - Step 2885: {'lr': 4.8e-05, 'samples': 92320, 'steps': 180, 'loss/train': 6.37304162979126} -09/20/2021 15:06:43 - INFO - __main__ - Step 2886: {'lr': 4.8e-05, 'samples': 92352, 'steps': 180, 'loss/train': 6.577147483825684} -09/20/2021 15:06:44 - INFO - __main__ - Step 2887: {'lr': 4.8e-05, 'samples': 92384, 'steps': 180, 'loss/train': 5.110363006591797} -09/20/2021 15:06:45 - INFO - __main__ - Step 2888: {'lr': 4.8e-05, 'samples': 92416, 'steps': 180, 'loss/train': 4.41012716293335} -09/20/2021 15:06:46 - INFO - __main__ - Step 2889: {'lr': 4.8e-05, 'samples': 92448, 'steps': 180, 'loss/train': 4.608786106109619} -09/20/2021 15:06:46 - INFO - __main__ - Step 2890: {'lr': 4.8e-05, 'samples': 92480, 'steps': 180, 'loss/train': 4.8500237464904785} -09/20/2021 15:06:47 - INFO - __main__ - Step 2891: {'lr': 4.8e-05, 'samples': 92512, 'steps': 180, 'loss/train': 4.8277082443237305} -09/20/2021 15:06:49 - INFO - __main__ - Step 2892: {'lr': 4.8e-05, 'samples': 92544, 'steps': 180, 'loss/train': 4.403400421142578} -09/20/2021 15:06:50 - INFO - __main__ - Step 2893: {'lr': 4.8e-05, 'samples': 92576, 'steps': 180, 'loss/train': 6.159444332122803} -09/20/2021 15:06:51 - INFO - __main__ - Step 2894: {'lr': 4.8e-05, 'samples': 92608, 'steps': 180, 'loss/train': 8.393726348876953} -09/20/2021 15:06:52 - INFO - __main__ - Step 2895: {'lr': 4.8e-05, 'samples': 92640, 'steps': 180, 'loss/train': 6.903430938720703} -09/20/2021 15:06:52 - INFO - __main__ - Step 2896: {'lr': 4.8e-05, 'samples': 92672, 'steps': 180, 'loss/train': 6.15749454498291} -09/20/2021 15:06:53 - INFO - __main__ - Step 2897: {'lr': 4.826666666666667e-05, 'samples': 92704, 'steps': 181, 'loss/train': 6.579908847808838} -09/20/2021 15:06:54 - INFO - __main__ - Step 2898: {'lr': 4.826666666666667e-05, 'samples': 92736, 'steps': 181, 'loss/train': 6.691740036010742} -09/20/2021 15:06:55 - INFO - __main__ - Step 2899: {'lr': 4.826666666666667e-05, 'samples': 92768, 'steps': 181, 'loss/train': 6.74843168258667} -09/20/2021 15:06:55 - INFO - __main__ - Step 2900: {'lr': 4.826666666666667e-05, 'samples': 92800, 'steps': 181, 'loss/train': 5.684828758239746} -09/20/2021 15:06:56 - INFO - __main__ - Step 2901: {'lr': 4.826666666666667e-05, 'samples': 92832, 'steps': 181, 'loss/train': 6.480532169342041} -09/20/2021 15:06:57 - INFO - __main__ - Step 2902: {'lr': 4.826666666666667e-05, 'samples': 92864, 'steps': 181, 'loss/train': 6.068843364715576} -09/20/2021 15:06:58 - INFO - __main__ - Step 2903: {'lr': 4.826666666666667e-05, 'samples': 92896, 'steps': 181, 'loss/train': 5.344466209411621} -09/20/2021 15:06:58 - INFO - __main__ - Step 2904: {'lr': 4.826666666666667e-05, 'samples': 92928, 'steps': 181, 'loss/train': 5.413015842437744} -09/20/2021 15:06:59 - INFO - __main__ - Step 2905: {'lr': 4.826666666666667e-05, 'samples': 92960, 'steps': 181, 'loss/train': 5.737546443939209} -09/20/2021 15:07:00 - INFO - __main__ - Step 2906: {'lr': 4.826666666666667e-05, 'samples': 92992, 'steps': 181, 'loss/train': 5.641221523284912} -09/20/2021 15:07:01 - INFO - __main__ - Step 2907: {'lr': 4.826666666666667e-05, 'samples': 93024, 'steps': 181, 'loss/train': 5.693188667297363} -09/20/2021 15:07:01 - INFO - __main__ - Step 2908: {'lr': 4.826666666666667e-05, 'samples': 93056, 'steps': 181, 'loss/train': 6.906539440155029} -09/20/2021 15:07:02 - INFO - __main__ - Step 2909: {'lr': 4.826666666666667e-05, 'samples': 93088, 'steps': 181, 'loss/train': 5.636757850646973} -09/20/2021 15:07:03 - INFO - __main__ - Step 2910: {'lr': 4.826666666666667e-05, 'samples': 93120, 'steps': 181, 'loss/train': 6.613471031188965} -09/20/2021 15:07:04 - INFO - __main__ - Step 2911: {'lr': 4.826666666666667e-05, 'samples': 93152, 'steps': 181, 'loss/train': 6.782854080200195} -09/20/2021 15:07:04 - INFO - __main__ - Step 2912: {'lr': 4.826666666666667e-05, 'samples': 93184, 'steps': 181, 'loss/train': 5.725091934204102} -09/20/2021 15:07:05 - INFO - __main__ - Step 2913: {'lr': 4.853333333333334e-05, 'samples': 93216, 'steps': 182, 'loss/train': 6.029468536376953} -09/20/2021 15:07:06 - INFO - __main__ - Step 2914: {'lr': 4.853333333333334e-05, 'samples': 93248, 'steps': 182, 'loss/train': 6.010964393615723} -09/20/2021 15:07:07 - INFO - __main__ - Step 2915: {'lr': 4.853333333333334e-05, 'samples': 93280, 'steps': 182, 'loss/train': 5.2040486335754395} -09/20/2021 15:07:08 - INFO - __main__ - Step 2916: {'lr': 4.853333333333334e-05, 'samples': 93312, 'steps': 182, 'loss/train': 5.866878986358643} -09/20/2021 15:07:08 - INFO - __main__ - Step 2917: {'lr': 4.853333333333334e-05, 'samples': 93344, 'steps': 182, 'loss/train': 6.006232738494873} -09/20/2021 15:07:09 - INFO - __main__ - Step 2918: {'lr': 4.853333333333334e-05, 'samples': 93376, 'steps': 182, 'loss/train': 6.66288948059082} -09/20/2021 15:07:10 - INFO - __main__ - Step 2919: {'lr': 4.853333333333334e-05, 'samples': 93408, 'steps': 182, 'loss/train': 5.929534435272217} -09/20/2021 15:07:11 - INFO - __main__ - Step 2920: {'lr': 4.853333333333334e-05, 'samples': 93440, 'steps': 182, 'loss/train': 5.132516860961914} -09/20/2021 15:07:11 - INFO - __main__ - Step 2921: {'lr': 4.853333333333334e-05, 'samples': 93472, 'steps': 182, 'loss/train': 6.555658340454102} -09/20/2021 15:07:12 - INFO - __main__ - Step 2922: {'lr': 4.853333333333334e-05, 'samples': 93504, 'steps': 182, 'loss/train': 6.106895923614502} -09/20/2021 15:07:13 - INFO - __main__ - Step 2923: {'lr': 4.853333333333334e-05, 'samples': 93536, 'steps': 182, 'loss/train': 6.420740604400635} -09/20/2021 15:07:14 - INFO - __main__ - Step 2924: {'lr': 4.853333333333334e-05, 'samples': 93568, 'steps': 182, 'loss/train': 5.733519077301025} -09/20/2021 15:07:14 - INFO - __main__ - Step 2925: {'lr': 4.853333333333334e-05, 'samples': 93600, 'steps': 182, 'loss/train': 5.8557915687561035} -09/20/2021 15:07:15 - INFO - __main__ - Step 2926: {'lr': 4.853333333333334e-05, 'samples': 93632, 'steps': 182, 'loss/train': 4.937131881713867} -09/20/2021 15:07:16 - INFO - __main__ - Step 2927: {'lr': 4.853333333333334e-05, 'samples': 93664, 'steps': 182, 'loss/train': 5.962679386138916} -09/20/2021 15:07:17 - INFO - __main__ - Step 2928: {'lr': 4.853333333333334e-05, 'samples': 93696, 'steps': 182, 'loss/train': 5.422728061676025} -09/20/2021 15:07:18 - INFO - __main__ - Step 2929: {'lr': 4.88e-05, 'samples': 93728, 'steps': 183, 'loss/train': 5.671014308929443} -09/20/2021 15:07:19 - INFO - __main__ - Step 2930: {'lr': 4.88e-05, 'samples': 93760, 'steps': 183, 'loss/train': 6.768764019012451} -09/20/2021 15:07:19 - INFO - __main__ - Step 2931: {'lr': 4.88e-05, 'samples': 93792, 'steps': 183, 'loss/train': 6.0278778076171875} -09/20/2021 15:07:20 - INFO - __main__ - Step 2932: {'lr': 4.88e-05, 'samples': 93824, 'steps': 183, 'loss/train': 3.8197803497314453} -09/20/2021 15:07:21 - INFO - __main__ - Step 2933: {'lr': 4.88e-05, 'samples': 93856, 'steps': 183, 'loss/train': 5.425760746002197} -09/20/2021 15:07:22 - INFO - __main__ - Step 2934: {'lr': 4.88e-05, 'samples': 93888, 'steps': 183, 'loss/train': 5.7167067527771} -09/20/2021 15:07:22 - INFO - __main__ - Step 2935: {'lr': 4.88e-05, 'samples': 93920, 'steps': 183, 'loss/train': 6.441887378692627} -09/20/2021 15:07:23 - INFO - __main__ - Step 2936: {'lr': 4.88e-05, 'samples': 93952, 'steps': 183, 'loss/train': 6.447636127471924} -09/20/2021 15:07:24 - INFO - __main__ - Step 2937: {'lr': 4.88e-05, 'samples': 93984, 'steps': 183, 'loss/train': 6.567512512207031} -09/20/2021 15:07:25 - INFO - __main__ - Step 2938: {'lr': 4.88e-05, 'samples': 94016, 'steps': 183, 'loss/train': 6.136054515838623} -09/20/2021 15:07:25 - INFO - __main__ - Step 2939: {'lr': 4.88e-05, 'samples': 94048, 'steps': 183, 'loss/train': 5.595654487609863} -09/20/2021 15:07:26 - INFO - __main__ - Step 2940: {'lr': 4.88e-05, 'samples': 94080, 'steps': 183, 'loss/train': 5.450980186462402} -09/20/2021 15:07:27 - INFO - __main__ - Step 2941: {'lr': 4.88e-05, 'samples': 94112, 'steps': 183, 'loss/train': 5.940357208251953} -09/20/2021 15:07:28 - INFO - __main__ - Step 2942: {'lr': 4.88e-05, 'samples': 94144, 'steps': 183, 'loss/train': 6.670854091644287} -09/20/2021 15:07:28 - INFO - __main__ - Step 2943: {'lr': 4.88e-05, 'samples': 94176, 'steps': 183, 'loss/train': 5.894989967346191} -09/20/2021 15:07:29 - INFO - __main__ - Step 2944: {'lr': 4.88e-05, 'samples': 94208, 'steps': 183, 'loss/train': 6.227982044219971} -09/20/2021 15:07:30 - INFO - __main__ - Step 2945: {'lr': 4.906666666666667e-05, 'samples': 94240, 'steps': 184, 'loss/train': 6.115265846252441} -09/20/2021 15:07:31 - INFO - __main__ - Step 2946: {'lr': 4.906666666666667e-05, 'samples': 94272, 'steps': 184, 'loss/train': 6.011228561401367} -09/20/2021 15:07:32 - INFO - __main__ - Step 2947: {'lr': 4.906666666666667e-05, 'samples': 94304, 'steps': 184, 'loss/train': 6.136854648590088} -09/20/2021 15:07:32 - INFO - __main__ - Step 2948: {'lr': 4.906666666666667e-05, 'samples': 94336, 'steps': 184, 'loss/train': 6.601929187774658} -09/20/2021 15:07:33 - INFO - __main__ - Step 2949: {'lr': 4.906666666666667e-05, 'samples': 94368, 'steps': 184, 'loss/train': 5.837001323699951} -09/20/2021 15:07:34 - INFO - __main__ - Step 2950: {'lr': 4.906666666666667e-05, 'samples': 94400, 'steps': 184, 'loss/train': 5.376768589019775} -09/20/2021 15:07:35 - INFO - __main__ - Step 2951: {'lr': 4.906666666666667e-05, 'samples': 94432, 'steps': 184, 'loss/train': 5.347487449645996} -09/20/2021 15:07:35 - INFO - __main__ - Step 2952: {'lr': 4.906666666666667e-05, 'samples': 94464, 'steps': 184, 'loss/train': 5.691023826599121} -09/20/2021 15:07:36 - INFO - __main__ - Step 2953: {'lr': 4.906666666666667e-05, 'samples': 94496, 'steps': 184, 'loss/train': 5.4140753746032715} -09/20/2021 15:07:37 - INFO - __main__ - Step 2954: {'lr': 4.906666666666667e-05, 'samples': 94528, 'steps': 184, 'loss/train': 1.366663932800293} -09/20/2021 15:07:38 - INFO - __main__ - Step 2955: {'lr': 4.906666666666667e-05, 'samples': 94560, 'steps': 184, 'loss/train': 6.196070671081543} -09/20/2021 15:07:38 - INFO - __main__ - Step 2956: {'lr': 4.906666666666667e-05, 'samples': 94592, 'steps': 184, 'loss/train': 6.301774978637695} -09/20/2021 15:07:39 - INFO - __main__ - Step 2957: {'lr': 4.906666666666667e-05, 'samples': 94624, 'steps': 184, 'loss/train': 6.469149112701416} -09/20/2021 15:07:40 - INFO - __main__ - Step 2958: {'lr': 4.906666666666667e-05, 'samples': 94656, 'steps': 184, 'loss/train': 5.636573314666748} -09/20/2021 15:07:41 - INFO - __main__ - Step 2959: {'lr': 4.906666666666667e-05, 'samples': 94688, 'steps': 184, 'loss/train': 6.160274982452393} -09/20/2021 15:07:42 - INFO - __main__ - Step 2960: {'lr': 4.906666666666667e-05, 'samples': 94720, 'steps': 184, 'loss/train': 5.9087395668029785} -09/20/2021 15:07:43 - INFO - __main__ - Step 2961: {'lr': 4.933333333333334e-05, 'samples': 94752, 'steps': 185, 'loss/train': 6.2983832359313965} -09/20/2021 15:07:44 - INFO - __main__ - Step 2962: {'lr': 4.933333333333334e-05, 'samples': 94784, 'steps': 185, 'loss/train': 6.132440090179443} -09/20/2021 15:07:44 - INFO - __main__ - Step 2963: {'lr': 4.933333333333334e-05, 'samples': 94816, 'steps': 185, 'loss/train': 6.2157206535339355} -09/20/2021 15:07:45 - INFO - __main__ - Step 2964: {'lr': 4.933333333333334e-05, 'samples': 94848, 'steps': 185, 'loss/train': 5.455899715423584} -09/20/2021 15:07:46 - INFO - __main__ - Step 2965: {'lr': 4.933333333333334e-05, 'samples': 94880, 'steps': 185, 'loss/train': 6.399825096130371} -09/20/2021 15:07:47 - INFO - __main__ - Step 2966: {'lr': 4.933333333333334e-05, 'samples': 94912, 'steps': 185, 'loss/train': 7.771252155303955} -09/20/2021 15:07:47 - INFO - __main__ - Step 2967: {'lr': 4.933333333333334e-05, 'samples': 94944, 'steps': 185, 'loss/train': 6.54949426651001} -09/20/2021 15:07:48 - INFO - __main__ - Step 2968: {'lr': 4.933333333333334e-05, 'samples': 94976, 'steps': 185, 'loss/train': 5.228808879852295} -09/20/2021 15:07:49 - INFO - __main__ - Step 2969: {'lr': 4.933333333333334e-05, 'samples': 95008, 'steps': 185, 'loss/train': 5.9146409034729} -09/20/2021 15:07:50 - INFO - __main__ - Step 2970: {'lr': 4.933333333333334e-05, 'samples': 95040, 'steps': 185, 'loss/train': 5.826418876647949} -09/20/2021 15:07:50 - INFO - __main__ - Step 2971: {'lr': 4.933333333333334e-05, 'samples': 95072, 'steps': 185, 'loss/train': 6.609462738037109} -09/20/2021 15:07:51 - INFO - __main__ - Step 2972: {'lr': 4.933333333333334e-05, 'samples': 95104, 'steps': 185, 'loss/train': 5.700295925140381} -09/20/2021 15:07:52 - INFO - __main__ - Step 2973: {'lr': 4.933333333333334e-05, 'samples': 95136, 'steps': 185, 'loss/train': 6.200838088989258} -09/20/2021 15:07:53 - INFO - __main__ - Step 2974: {'lr': 4.933333333333334e-05, 'samples': 95168, 'steps': 185, 'loss/train': 5.753887176513672} -09/20/2021 15:07:53 - INFO - __main__ - Step 2975: {'lr': 4.933333333333334e-05, 'samples': 95200, 'steps': 185, 'loss/train': 5.628616809844971} -09/20/2021 15:07:54 - INFO - __main__ - Step 2976: {'lr': 4.933333333333334e-05, 'samples': 95232, 'steps': 185, 'loss/train': 4.883317470550537} -09/20/2021 15:07:55 - INFO - __main__ - Step 2977: {'lr': 4.96e-05, 'samples': 95264, 'steps': 186, 'loss/train': 5.276725769042969} -09/20/2021 15:07:56 - INFO - __main__ - Step 2978: {'lr': 4.96e-05, 'samples': 95296, 'steps': 186, 'loss/train': 6.75452184677124} -09/20/2021 15:07:56 - INFO - __main__ - Step 2979: {'lr': 4.96e-05, 'samples': 95328, 'steps': 186, 'loss/train': 7.133015155792236} -09/20/2021 15:07:57 - INFO - __main__ - Step 2980: {'lr': 4.96e-05, 'samples': 95360, 'steps': 186, 'loss/train': 5.857351303100586} -09/20/2021 15:07:58 - INFO - __main__ - Step 2981: {'lr': 4.96e-05, 'samples': 95392, 'steps': 186, 'loss/train': 5.6871724128723145} -09/20/2021 15:07:59 - INFO - __main__ - Step 2982: {'lr': 4.96e-05, 'samples': 95424, 'steps': 186, 'loss/train': 5.3465986251831055} -09/20/2021 15:07:59 - INFO - __main__ - Step 2983: {'lr': 4.96e-05, 'samples': 95456, 'steps': 186, 'loss/train': 5.047416687011719} -09/20/2021 15:08:00 - INFO - __main__ - Step 2984: {'lr': 4.96e-05, 'samples': 95488, 'steps': 186, 'loss/train': 5.862918376922607} -09/20/2021 15:08:01 - INFO - __main__ - Step 2985: {'lr': 4.96e-05, 'samples': 95520, 'steps': 186, 'loss/train': 5.356547832489014} -09/20/2021 15:08:02 - INFO - __main__ - Step 2986: {'lr': 4.96e-05, 'samples': 95552, 'steps': 186, 'loss/train': 5.789919853210449} -09/20/2021 15:08:02 - INFO - __main__ - Step 2987: {'lr': 4.96e-05, 'samples': 95584, 'steps': 186, 'loss/train': 5.048076629638672} -09/20/2021 15:08:03 - INFO - __main__ - Step 2988: {'lr': 4.96e-05, 'samples': 95616, 'steps': 186, 'loss/train': 6.255715370178223} -09/20/2021 15:08:05 - INFO - __main__ - Step 2989: {'lr': 4.96e-05, 'samples': 95648, 'steps': 186, 'loss/train': 5.733706951141357} -09/20/2021 15:08:05 - INFO - __main__ - Step 2990: {'lr': 4.96e-05, 'samples': 95680, 'steps': 186, 'loss/train': 4.7234296798706055} -09/20/2021 15:08:06 - INFO - __main__ - Step 2991: {'lr': 4.96e-05, 'samples': 95712, 'steps': 186, 'loss/train': 6.377892017364502} -09/20/2021 15:08:07 - INFO - __main__ - Step 2992: {'lr': 4.96e-05, 'samples': 95744, 'steps': 186, 'loss/train': 5.903626441955566} -09/20/2021 15:08:08 - INFO - __main__ - Step 2993: {'lr': 4.986666666666667e-05, 'samples': 95776, 'steps': 187, 'loss/train': 5.674102783203125} -09/20/2021 15:08:09 - INFO - __main__ - Step 2994: {'lr': 4.986666666666667e-05, 'samples': 95808, 'steps': 187, 'loss/train': 6.974520683288574} -09/20/2021 15:08:09 - INFO - __main__ - Step 2995: {'lr': 4.986666666666667e-05, 'samples': 95840, 'steps': 187, 'loss/train': 6.215253829956055} -09/20/2021 15:08:10 - INFO - __main__ - Step 2996: {'lr': 4.986666666666667e-05, 'samples': 95872, 'steps': 187, 'loss/train': 6.119963645935059} -09/20/2021 15:08:11 - INFO - __main__ - Step 2997: {'lr': 4.986666666666667e-05, 'samples': 95904, 'steps': 187, 'loss/train': 5.671295642852783} -09/20/2021 15:08:12 - INFO - __main__ - Step 2998: {'lr': 4.986666666666667e-05, 'samples': 95936, 'steps': 187, 'loss/train': 5.461169719696045} -09/20/2021 15:08:12 - INFO - __main__ - Step 2999: {'lr': 4.986666666666667e-05, 'samples': 95968, 'steps': 187, 'loss/train': 6.139457702636719} -09/20/2021 15:08:13 - INFO - __main__ - Step 3000: {'lr': 4.986666666666667e-05, 'samples': 96000, 'steps': 187, 'loss/train': 6.208123207092285} -09/20/2021 15:08:14 - INFO - __main__ - Step 3001: {'lr': 4.986666666666667e-05, 'samples': 96032, 'steps': 187, 'loss/train': 6.490942001342773} -09/20/2021 15:08:15 - INFO - __main__ - Step 3002: {'lr': 4.986666666666667e-05, 'samples': 96064, 'steps': 187, 'loss/train': 6.022582530975342} -09/20/2021 15:08:15 - INFO - __main__ - Step 3003: {'lr': 4.986666666666667e-05, 'samples': 96096, 'steps': 187, 'loss/train': 6.911489486694336} -09/20/2021 15:08:16 - INFO - __main__ - Step 3004: {'lr': 4.986666666666667e-05, 'samples': 96128, 'steps': 187, 'loss/train': 6.867422580718994} -09/20/2021 15:08:17 - INFO - __main__ - Step 3005: {'lr': 4.986666666666667e-05, 'samples': 96160, 'steps': 187, 'loss/train': 6.177224636077881} -09/20/2021 15:08:18 - INFO - __main__ - Step 3006: {'lr': 4.986666666666667e-05, 'samples': 96192, 'steps': 187, 'loss/train': 7.539350986480713} -09/20/2021 15:08:18 - INFO - __main__ - Step 3007: {'lr': 4.986666666666667e-05, 'samples': 96224, 'steps': 187, 'loss/train': 6.813504219055176} -09/20/2021 15:08:19 - INFO - __main__ - Step 3008: {'lr': 4.986666666666667e-05, 'samples': 96256, 'steps': 187, 'loss/train': 7.498203277587891} -09/20/2021 15:08:20 - INFO - __main__ - Step 3009: {'lr': 5.013333333333333e-05, 'samples': 96288, 'steps': 188, 'loss/train': 3.9592883586883545} -09/20/2021 15:08:21 - INFO - __main__ - Step 3010: {'lr': 5.013333333333333e-05, 'samples': 96320, 'steps': 188, 'loss/train': 5.580134391784668} -09/20/2021 15:08:21 - INFO - __main__ - Step 3011: {'lr': 5.013333333333333e-05, 'samples': 96352, 'steps': 188, 'loss/train': 6.2395124435424805} -09/20/2021 15:08:22 - INFO - __main__ - Step 3012: {'lr': 5.013333333333333e-05, 'samples': 96384, 'steps': 188, 'loss/train': 5.718607425689697} -09/20/2021 15:08:23 - INFO - __main__ - Step 3013: {'lr': 5.013333333333333e-05, 'samples': 96416, 'steps': 188, 'loss/train': 5.648902416229248} -09/20/2021 15:08:24 - INFO - __main__ - Step 3014: {'lr': 5.013333333333333e-05, 'samples': 96448, 'steps': 188, 'loss/train': 6.551687717437744} -09/20/2021 15:08:24 - INFO - __main__ - Step 3015: {'lr': 5.013333333333333e-05, 'samples': 96480, 'steps': 188, 'loss/train': 5.754380702972412} -09/20/2021 15:08:25 - INFO - __main__ - Step 3016: {'lr': 5.013333333333333e-05, 'samples': 96512, 'steps': 188, 'loss/train': 4.667171478271484} -09/20/2021 15:08:26 - INFO - __main__ - Step 3017: {'lr': 5.013333333333333e-05, 'samples': 96544, 'steps': 188, 'loss/train': 5.661316871643066} -09/20/2021 15:08:27 - INFO - __main__ - Step 3018: {'lr': 5.013333333333333e-05, 'samples': 96576, 'steps': 188, 'loss/train': 7.11868953704834} -09/20/2021 15:08:27 - INFO - __main__ - Step 3019: {'lr': 5.013333333333333e-05, 'samples': 96608, 'steps': 188, 'loss/train': 6.939640045166016} -09/20/2021 15:08:28 - INFO - __main__ - Step 3020: {'lr': 5.013333333333333e-05, 'samples': 96640, 'steps': 188, 'loss/train': 6.32624626159668} -09/20/2021 15:08:29 - INFO - __main__ - Step 3021: {'lr': 5.013333333333333e-05, 'samples': 96672, 'steps': 188, 'loss/train': 6.846172332763672} -09/20/2021 15:08:30 - INFO - __main__ - Step 3022: {'lr': 5.013333333333333e-05, 'samples': 96704, 'steps': 188, 'loss/train': 6.2842841148376465} -09/20/2021 15:08:31 - INFO - __main__ - Step 3023: {'lr': 5.013333333333333e-05, 'samples': 96736, 'steps': 188, 'loss/train': 5.836642742156982} -09/20/2021 15:08:32 - INFO - __main__ - Step 3024: {'lr': 5.013333333333333e-05, 'samples': 96768, 'steps': 188, 'loss/train': 6.606442928314209} -09/20/2021 15:08:33 - INFO - __main__ - Step 3025: {'lr': 5.0400000000000005e-05, 'samples': 96800, 'steps': 189, 'loss/train': 5.706470012664795} -09/20/2021 15:08:33 - INFO - __main__ - Step 3026: {'lr': 5.0400000000000005e-05, 'samples': 96832, 'steps': 189, 'loss/train': 5.760131359100342} -09/20/2021 15:08:34 - INFO - __main__ - Step 3027: {'lr': 5.0400000000000005e-05, 'samples': 96864, 'steps': 189, 'loss/train': 5.651432991027832} -09/20/2021 15:08:35 - INFO - __main__ - Step 3028: {'lr': 5.0400000000000005e-05, 'samples': 96896, 'steps': 189, 'loss/train': 6.303522109985352} -09/20/2021 15:08:36 - INFO - __main__ - Step 3029: {'lr': 5.0400000000000005e-05, 'samples': 96928, 'steps': 189, 'loss/train': 5.703310489654541} -09/20/2021 15:08:36 - INFO - __main__ - Step 3030: {'lr': 5.0400000000000005e-05, 'samples': 96960, 'steps': 189, 'loss/train': 6.107039451599121} -09/20/2021 15:08:37 - INFO - __main__ - Step 3031: {'lr': 5.0400000000000005e-05, 'samples': 96992, 'steps': 189, 'loss/train': 5.708629131317139} -09/20/2021 15:08:38 - INFO - __main__ - Step 3032: {'lr': 5.0400000000000005e-05, 'samples': 97024, 'steps': 189, 'loss/train': 6.1776123046875} -09/20/2021 15:08:39 - INFO - __main__ - Step 3033: {'lr': 5.0400000000000005e-05, 'samples': 97056, 'steps': 189, 'loss/train': 5.4718217849731445} -09/20/2021 15:08:39 - INFO - __main__ - Step 3034: {'lr': 5.0400000000000005e-05, 'samples': 97088, 'steps': 189, 'loss/train': 6.356401443481445} -09/20/2021 15:08:40 - INFO - __main__ - Step 3035: {'lr': 5.0400000000000005e-05, 'samples': 97120, 'steps': 189, 'loss/train': 5.831132411956787} -09/20/2021 15:08:41 - INFO - __main__ - Step 3036: {'lr': 5.0400000000000005e-05, 'samples': 97152, 'steps': 189, 'loss/train': 5.751835346221924} -09/20/2021 15:08:42 - INFO - __main__ - Step 3037: {'lr': 5.0400000000000005e-05, 'samples': 97184, 'steps': 189, 'loss/train': 6.05264949798584} -09/20/2021 15:08:42 - INFO - __main__ - Step 3038: {'lr': 5.0400000000000005e-05, 'samples': 97216, 'steps': 189, 'loss/train': 5.2485880851745605} -09/20/2021 15:08:43 - INFO - __main__ - Step 3039: {'lr': 5.0400000000000005e-05, 'samples': 97248, 'steps': 189, 'loss/train': 5.621045112609863} -09/20/2021 15:08:44 - INFO - __main__ - Step 3040: {'lr': 5.0400000000000005e-05, 'samples': 97280, 'steps': 189, 'loss/train': 6.015568733215332} -09/20/2021 15:08:45 - INFO - __main__ - Step 3041: {'lr': 5.0666666666666674e-05, 'samples': 97312, 'steps': 190, 'loss/train': 7.365818500518799} -09/20/2021 15:08:46 - INFO - __main__ - Step 3042: {'lr': 5.0666666666666674e-05, 'samples': 97344, 'steps': 190, 'loss/train': 4.856250286102295} -09/20/2021 15:08:46 - INFO - __main__ - Step 3043: {'lr': 5.0666666666666674e-05, 'samples': 97376, 'steps': 190, 'loss/train': 5.693509101867676} -09/20/2021 15:08:47 - INFO - __main__ - Step 3044: {'lr': 5.0666666666666674e-05, 'samples': 97408, 'steps': 190, 'loss/train': 5.7013092041015625} -09/20/2021 15:08:48 - INFO - __main__ - Step 3045: {'lr': 5.0666666666666674e-05, 'samples': 97440, 'steps': 190, 'loss/train': 7.067870616912842} -09/20/2021 15:08:49 - INFO - __main__ - Step 3046: {'lr': 5.0666666666666674e-05, 'samples': 97472, 'steps': 190, 'loss/train': 6.270987033843994} -09/20/2021 15:08:49 - INFO - __main__ - Step 3047: {'lr': 5.0666666666666674e-05, 'samples': 97504, 'steps': 190, 'loss/train': 5.431723594665527} -09/20/2021 15:08:50 - INFO - __main__ - Step 3048: {'lr': 5.0666666666666674e-05, 'samples': 97536, 'steps': 190, 'loss/train': 4.522390842437744} -09/20/2021 15:08:51 - INFO - __main__ - Step 3049: {'lr': 5.0666666666666674e-05, 'samples': 97568, 'steps': 190, 'loss/train': 4.508565902709961} -09/20/2021 15:08:52 - INFO - __main__ - Step 3050: {'lr': 5.0666666666666674e-05, 'samples': 97600, 'steps': 190, 'loss/train': 5.909707069396973} -09/20/2021 15:08:52 - INFO - __main__ - Step 3051: {'lr': 5.0666666666666674e-05, 'samples': 97632, 'steps': 190, 'loss/train': 5.9157395362854} -09/20/2021 15:08:54 - INFO - __main__ - Step 3052: {'lr': 5.0666666666666674e-05, 'samples': 97664, 'steps': 190, 'loss/train': 5.517138957977295} -09/20/2021 15:08:54 - INFO - __main__ - Step 3053: {'lr': 5.0666666666666674e-05, 'samples': 97696, 'steps': 190, 'loss/train': 6.60287618637085} -09/20/2021 15:08:55 - INFO - __main__ - Step 3054: {'lr': 5.0666666666666674e-05, 'samples': 97728, 'steps': 190, 'loss/train': 5.476126670837402} -09/20/2021 15:08:56 - INFO - __main__ - Step 3055: {'lr': 5.0666666666666674e-05, 'samples': 97760, 'steps': 190, 'loss/train': 6.163523197174072} -09/20/2021 15:08:57 - INFO - __main__ - Step 3056: {'lr': 5.0666666666666674e-05, 'samples': 97792, 'steps': 190, 'loss/train': 5.322733402252197} -09/20/2021 15:08:58 - INFO - __main__ - Step 3057: {'lr': 5.0933333333333336e-05, 'samples': 97824, 'steps': 191, 'loss/train': 3.4952149391174316} -09/20/2021 15:08:58 - INFO - __main__ - Step 3058: {'lr': 5.0933333333333336e-05, 'samples': 97856, 'steps': 191, 'loss/train': 5.6020283699035645} -09/20/2021 15:08:59 - INFO - __main__ - Step 3059: {'lr': 5.0933333333333336e-05, 'samples': 97888, 'steps': 191, 'loss/train': 5.685643196105957} -09/20/2021 15:09:00 - INFO - __main__ - Step 3060: {'lr': 5.0933333333333336e-05, 'samples': 97920, 'steps': 191, 'loss/train': 7.102001190185547} -09/20/2021 15:09:01 - INFO - __main__ - Step 3061: {'lr': 5.0933333333333336e-05, 'samples': 97952, 'steps': 191, 'loss/train': 5.671895980834961} -09/20/2021 15:09:01 - INFO - __main__ - Step 3062: {'lr': 5.0933333333333336e-05, 'samples': 97984, 'steps': 191, 'loss/train': 6.969152450561523} -09/20/2021 15:09:02 - INFO - __main__ - Step 3063: {'lr': 5.0933333333333336e-05, 'samples': 98016, 'steps': 191, 'loss/train': 4.92141580581665} -09/20/2021 15:09:03 - INFO - __main__ - Step 3064: {'lr': 5.0933333333333336e-05, 'samples': 98048, 'steps': 191, 'loss/train': 5.770232677459717} -09/20/2021 15:09:04 - INFO - __main__ - Step 3065: {'lr': 5.0933333333333336e-05, 'samples': 98080, 'steps': 191, 'loss/train': 5.667346000671387} -09/20/2021 15:09:04 - INFO - __main__ - Step 3066: {'lr': 5.0933333333333336e-05, 'samples': 98112, 'steps': 191, 'loss/train': 5.642574310302734} -09/20/2021 15:09:05 - INFO - __main__ - Step 3067: {'lr': 5.0933333333333336e-05, 'samples': 98144, 'steps': 191, 'loss/train': 5.55702543258667} -09/20/2021 15:09:06 - INFO - __main__ - Step 3068: {'lr': 5.0933333333333336e-05, 'samples': 98176, 'steps': 191, 'loss/train': 6.419243812561035} -09/20/2021 15:09:07 - INFO - __main__ - Step 3069: {'lr': 5.0933333333333336e-05, 'samples': 98208, 'steps': 191, 'loss/train': 8.190020561218262} -09/20/2021 15:09:07 - INFO - __main__ - Step 3070: {'lr': 5.0933333333333336e-05, 'samples': 98240, 'steps': 191, 'loss/train': 8.314566612243652} -09/20/2021 15:09:08 - INFO - __main__ - Step 3071: {'lr': 5.0933333333333336e-05, 'samples': 98272, 'steps': 191, 'loss/train': 8.639009475708008} -09/20/2021 15:09:09 - INFO - __main__ - Step 3072: {'lr': 5.0933333333333336e-05, 'samples': 98304, 'steps': 191, 'loss/train': 6.2455363273620605} -09/20/2021 15:09:10 - INFO - __main__ - Step 3073: {'lr': 5.1200000000000004e-05, 'samples': 98336, 'steps': 192, 'loss/train': 6.286764621734619} -09/20/2021 15:09:10 - INFO - __main__ - Step 3074: {'lr': 5.1200000000000004e-05, 'samples': 98368, 'steps': 192, 'loss/train': 5.60247278213501} -09/20/2021 15:09:11 - INFO - __main__ - Step 3075: {'lr': 5.1200000000000004e-05, 'samples': 98400, 'steps': 192, 'loss/train': 3.67559552192688} -09/20/2021 15:09:12 - INFO - __main__ - Step 3076: {'lr': 5.1200000000000004e-05, 'samples': 98432, 'steps': 192, 'loss/train': 5.7183098793029785} -09/20/2021 15:09:13 - INFO - __main__ - Step 3077: {'lr': 5.1200000000000004e-05, 'samples': 98464, 'steps': 192, 'loss/train': 5.806381702423096} -09/20/2021 15:09:13 - INFO - __main__ - Step 3078: {'lr': 5.1200000000000004e-05, 'samples': 98496, 'steps': 192, 'loss/train': 5.685588359832764} -09/20/2021 15:09:14 - INFO - __main__ - Step 3079: {'lr': 5.1200000000000004e-05, 'samples': 98528, 'steps': 192, 'loss/train': 5.7264251708984375} -09/20/2021 15:09:15 - INFO - __main__ - Step 3080: {'lr': 5.1200000000000004e-05, 'samples': 98560, 'steps': 192, 'loss/train': 6.068676948547363} -09/20/2021 15:09:16 - INFO - __main__ - Step 3081: {'lr': 5.1200000000000004e-05, 'samples': 98592, 'steps': 192, 'loss/train': 7.0218071937561035} -09/20/2021 15:09:16 - INFO - __main__ - Step 3082: {'lr': 5.1200000000000004e-05, 'samples': 98624, 'steps': 192, 'loss/train': 5.460942268371582} -09/20/2021 15:09:17 - INFO - __main__ - Step 3083: {'lr': 5.1200000000000004e-05, 'samples': 98656, 'steps': 192, 'loss/train': 6.2562642097473145} -09/20/2021 15:09:18 - INFO - __main__ - Step 3084: {'lr': 5.1200000000000004e-05, 'samples': 98688, 'steps': 192, 'loss/train': 5.150286674499512} -09/20/2021 15:09:19 - INFO - __main__ - Step 3085: {'lr': 5.1200000000000004e-05, 'samples': 98720, 'steps': 192, 'loss/train': 5.560622692108154} -09/20/2021 15:09:20 - INFO - __main__ - Step 3086: {'lr': 5.1200000000000004e-05, 'samples': 98752, 'steps': 192, 'loss/train': 5.186324119567871} -09/20/2021 15:09:21 - INFO - __main__ - Step 3087: {'lr': 5.1200000000000004e-05, 'samples': 98784, 'steps': 192, 'loss/train': 6.001952648162842} -09/20/2021 15:09:22 - INFO - __main__ - Step 3088: {'lr': 5.1200000000000004e-05, 'samples': 98816, 'steps': 192, 'loss/train': 6.33391809463501} -09/20/2021 15:09:22 - INFO - __main__ - Step 3089: {'lr': 5.146666666666667e-05, 'samples': 98848, 'steps': 193, 'loss/train': 6.49352502822876} -09/20/2021 15:09:23 - INFO - __main__ - Step 3090: {'lr': 5.146666666666667e-05, 'samples': 98880, 'steps': 193, 'loss/train': 5.434447765350342} -09/20/2021 15:09:24 - INFO - __main__ - Step 3091: {'lr': 5.146666666666667e-05, 'samples': 98912, 'steps': 193, 'loss/train': 6.094029426574707} -09/20/2021 15:09:25 - INFO - __main__ - Step 3092: {'lr': 5.146666666666667e-05, 'samples': 98944, 'steps': 193, 'loss/train': 6.185773849487305} -09/20/2021 15:09:25 - INFO - __main__ - Step 3093: {'lr': 5.146666666666667e-05, 'samples': 98976, 'steps': 193, 'loss/train': 6.249237537384033} -09/20/2021 15:09:26 - INFO - __main__ - Step 3094: {'lr': 5.146666666666667e-05, 'samples': 99008, 'steps': 193, 'loss/train': 5.8756842613220215} -09/20/2021 15:09:27 - INFO - __main__ - Step 3095: {'lr': 5.146666666666667e-05, 'samples': 99040, 'steps': 193, 'loss/train': 5.891757965087891} -09/20/2021 15:09:28 - INFO - __main__ - Step 3096: {'lr': 5.146666666666667e-05, 'samples': 99072, 'steps': 193, 'loss/train': 5.972500801086426} -09/20/2021 15:09:28 - INFO - __main__ - Step 3097: {'lr': 5.146666666666667e-05, 'samples': 99104, 'steps': 193, 'loss/train': 6.215282440185547} -09/20/2021 15:09:29 - INFO - __main__ - Step 3098: {'lr': 5.146666666666667e-05, 'samples': 99136, 'steps': 193, 'loss/train': 5.0387864112854} -09/20/2021 15:09:30 - INFO - __main__ - Step 3099: {'lr': 5.146666666666667e-05, 'samples': 99168, 'steps': 193, 'loss/train': 7.021320819854736} -09/20/2021 15:09:31 - INFO - __main__ - Step 3100: {'lr': 5.146666666666667e-05, 'samples': 99200, 'steps': 193, 'loss/train': 5.74606466293335} -09/20/2021 15:09:31 - INFO - __main__ - Step 3101: {'lr': 5.146666666666667e-05, 'samples': 99232, 'steps': 193, 'loss/train': 6.248360633850098} -09/20/2021 15:09:32 - INFO - __main__ - Step 3102: {'lr': 5.146666666666667e-05, 'samples': 99264, 'steps': 193, 'loss/train': 6.299119472503662} -09/20/2021 15:09:33 - INFO - __main__ - Step 3103: {'lr': 5.146666666666667e-05, 'samples': 99296, 'steps': 193, 'loss/train': 5.680226802825928} -09/20/2021 15:09:34 - INFO - __main__ - Step 3104: {'lr': 5.146666666666667e-05, 'samples': 99328, 'steps': 193, 'loss/train': 5.9390082359313965} -09/20/2021 15:09:35 - INFO - __main__ - Step 3105: {'lr': 5.1733333333333335e-05, 'samples': 99360, 'steps': 194, 'loss/train': 5.3521199226379395} -09/20/2021 15:09:35 - INFO - __main__ - Step 3106: {'lr': 5.1733333333333335e-05, 'samples': 99392, 'steps': 194, 'loss/train': 5.5911173820495605} -09/20/2021 15:09:36 - INFO - __main__ - Step 3107: {'lr': 5.1733333333333335e-05, 'samples': 99424, 'steps': 194, 'loss/train': 6.046151638031006} -09/20/2021 15:09:37 - INFO - __main__ - Step 3108: {'lr': 5.1733333333333335e-05, 'samples': 99456, 'steps': 194, 'loss/train': 6.732293128967285} -09/20/2021 15:09:38 - INFO - __main__ - Step 3109: {'lr': 5.1733333333333335e-05, 'samples': 99488, 'steps': 194, 'loss/train': 6.214412212371826} -09/20/2021 15:09:38 - INFO - __main__ - Step 3110: {'lr': 5.1733333333333335e-05, 'samples': 99520, 'steps': 194, 'loss/train': 7.214353084564209} -09/20/2021 15:09:39 - INFO - __main__ - Step 3111: {'lr': 5.1733333333333335e-05, 'samples': 99552, 'steps': 194, 'loss/train': 5.711883068084717} -09/20/2021 15:09:40 - INFO - __main__ - Step 3112: {'lr': 5.1733333333333335e-05, 'samples': 99584, 'steps': 194, 'loss/train': 5.994289875030518} -09/20/2021 15:09:41 - INFO - __main__ - Step 3113: {'lr': 5.1733333333333335e-05, 'samples': 99616, 'steps': 194, 'loss/train': 5.9098429679870605} -09/20/2021 15:09:41 - INFO - __main__ - Step 3114: {'lr': 5.1733333333333335e-05, 'samples': 99648, 'steps': 194, 'loss/train': 5.335230350494385} -09/20/2021 15:09:43 - INFO - __main__ - Step 3115: {'lr': 5.1733333333333335e-05, 'samples': 99680, 'steps': 194, 'loss/train': 6.069617748260498} -09/20/2021 15:09:43 - INFO - __main__ - Step 3116: {'lr': 5.1733333333333335e-05, 'samples': 99712, 'steps': 194, 'loss/train': 7.487666130065918} -09/20/2021 15:09:44 - INFO - __main__ - Step 3117: {'lr': 5.1733333333333335e-05, 'samples': 99744, 'steps': 194, 'loss/train': 5.232104778289795} -09/20/2021 15:09:45 - INFO - __main__ - Step 3118: {'lr': 5.1733333333333335e-05, 'samples': 99776, 'steps': 194, 'loss/train': 6.810012340545654} -09/20/2021 15:09:46 - INFO - __main__ - Step 3119: {'lr': 5.1733333333333335e-05, 'samples': 99808, 'steps': 194, 'loss/train': 7.639316558837891} -09/20/2021 15:09:46 - INFO - __main__ - Step 3120: {'lr': 5.1733333333333335e-05, 'samples': 99840, 'steps': 194, 'loss/train': 7.6270952224731445} -09/20/2021 15:09:47 - INFO - __main__ - Step 3121: {'lr': 5.2000000000000004e-05, 'samples': 99872, 'steps': 195, 'loss/train': 7.196738243103027} -09/20/2021 15:09:48 - INFO - __main__ - Step 3122: {'lr': 5.2000000000000004e-05, 'samples': 99904, 'steps': 195, 'loss/train': 7.2279510498046875} -09/20/2021 15:09:49 - INFO - __main__ - Step 3123: {'lr': 5.2000000000000004e-05, 'samples': 99936, 'steps': 195, 'loss/train': 5.727688789367676} -09/20/2021 15:09:50 - INFO - __main__ - Step 3124: {'lr': 5.2000000000000004e-05, 'samples': 99968, 'steps': 195, 'loss/train': 5.223618507385254} -09/20/2021 15:09:50 - INFO - __main__ - Step 3125: {'lr': 5.2000000000000004e-05, 'samples': 100000, 'steps': 195, 'loss/train': 5.862478256225586} -09/20/2021 15:09:51 - INFO - __main__ - Step 3126: {'lr': 5.2000000000000004e-05, 'samples': 100032, 'steps': 195, 'loss/train': 5.82754373550415} -09/20/2021 15:09:52 - INFO - __main__ - Step 3127: {'lr': 5.2000000000000004e-05, 'samples': 100064, 'steps': 195, 'loss/train': 6.173554420471191} -09/20/2021 15:09:53 - INFO - __main__ - Step 3128: {'lr': 5.2000000000000004e-05, 'samples': 100096, 'steps': 195, 'loss/train': 6.167606353759766} -09/20/2021 15:09:53 - INFO - __main__ - Step 3129: {'lr': 5.2000000000000004e-05, 'samples': 100128, 'steps': 195, 'loss/train': 6.558963298797607} -09/20/2021 15:09:54 - INFO - __main__ - Step 3130: {'lr': 5.2000000000000004e-05, 'samples': 100160, 'steps': 195, 'loss/train': 5.990572452545166} -09/20/2021 15:09:55 - INFO - __main__ - Step 3131: {'lr': 5.2000000000000004e-05, 'samples': 100192, 'steps': 195, 'loss/train': 6.294030666351318} -09/20/2021 15:09:56 - INFO - __main__ - Step 3132: {'lr': 5.2000000000000004e-05, 'samples': 100224, 'steps': 195, 'loss/train': 5.735404968261719} -09/20/2021 15:09:56 - INFO - __main__ - Step 3133: {'lr': 5.2000000000000004e-05, 'samples': 100256, 'steps': 195, 'loss/train': 5.535519599914551} -09/20/2021 15:09:57 - INFO - __main__ - Step 3134: {'lr': 5.2000000000000004e-05, 'samples': 100288, 'steps': 195, 'loss/train': 6.425562858581543} -09/20/2021 15:09:58 - INFO - __main__ - Step 3135: {'lr': 5.2000000000000004e-05, 'samples': 100320, 'steps': 195, 'loss/train': 6.055722236633301} -09/20/2021 15:09:59 - INFO - __main__ - Step 3136: {'lr': 5.2000000000000004e-05, 'samples': 100352, 'steps': 195, 'loss/train': 6.232863903045654} -09/20/2021 15:10:00 - INFO - __main__ - Step 3137: {'lr': 5.2266666666666665e-05, 'samples': 100384, 'steps': 196, 'loss/train': 5.104255676269531} -09/20/2021 15:10:00 - INFO - __main__ - Step 3138: {'lr': 5.2266666666666665e-05, 'samples': 100416, 'steps': 196, 'loss/train': 5.118544578552246} -09/20/2021 15:10:01 - INFO - __main__ - Step 3139: {'lr': 5.2266666666666665e-05, 'samples': 100448, 'steps': 196, 'loss/train': 5.922077178955078} -09/20/2021 15:10:02 - INFO - __main__ - Step 3140: {'lr': 5.2266666666666665e-05, 'samples': 100480, 'steps': 196, 'loss/train': 5.758835792541504} -09/20/2021 15:10:03 - INFO - __main__ - Step 3141: {'lr': 5.2266666666666665e-05, 'samples': 100512, 'steps': 196, 'loss/train': 6.578885555267334} -09/20/2021 15:10:03 - INFO - __main__ - Step 3142: {'lr': 5.2266666666666665e-05, 'samples': 100544, 'steps': 196, 'loss/train': 6.533924579620361} -09/20/2021 15:10:04 - INFO - __main__ - Step 3143: {'lr': 5.2266666666666665e-05, 'samples': 100576, 'steps': 196, 'loss/train': 5.356889247894287} -09/20/2021 15:10:05 - INFO - __main__ - Step 3144: {'lr': 5.2266666666666665e-05, 'samples': 100608, 'steps': 196, 'loss/train': 5.217057704925537} -09/20/2021 15:10:06 - INFO - __main__ - Step 3145: {'lr': 5.2266666666666665e-05, 'samples': 100640, 'steps': 196, 'loss/train': 6.1527323722839355} -09/20/2021 15:10:06 - INFO - __main__ - Step 3146: {'lr': 5.2266666666666665e-05, 'samples': 100672, 'steps': 196, 'loss/train': 6.443562984466553} -09/20/2021 15:10:07 - INFO - __main__ - Step 3147: {'lr': 5.2266666666666665e-05, 'samples': 100704, 'steps': 196, 'loss/train': 6.673051357269287} -09/20/2021 15:10:09 - INFO - __main__ - Step 3148: {'lr': 5.2266666666666665e-05, 'samples': 100736, 'steps': 196, 'loss/train': 5.946042537689209} -09/20/2021 15:10:09 - INFO - __main__ - Step 3149: {'lr': 5.2266666666666665e-05, 'samples': 100768, 'steps': 196, 'loss/train': 5.2609686851501465} -09/20/2021 15:10:10 - INFO - __main__ - Step 3150: {'lr': 5.2266666666666665e-05, 'samples': 100800, 'steps': 196, 'loss/train': 6.524703502655029} -09/20/2021 15:10:11 - INFO - __main__ - Step 3151: {'lr': 5.2266666666666665e-05, 'samples': 100832, 'steps': 196, 'loss/train': 6.5992608070373535} -09/20/2021 15:10:12 - INFO - __main__ - Step 3152: {'lr': 5.2266666666666665e-05, 'samples': 100864, 'steps': 196, 'loss/train': 5.719122409820557} -09/20/2021 15:10:12 - INFO - __main__ - Step 3153: {'lr': 5.2533333333333334e-05, 'samples': 100896, 'steps': 197, 'loss/train': 5.967243194580078} -09/20/2021 15:10:13 - INFO - __main__ - Step 3154: {'lr': 5.2533333333333334e-05, 'samples': 100928, 'steps': 197, 'loss/train': 5.9199676513671875} -09/20/2021 15:10:14 - INFO - __main__ - Step 3155: {'lr': 5.2533333333333334e-05, 'samples': 100960, 'steps': 197, 'loss/train': 6.114523887634277} -09/20/2021 15:10:15 - INFO - __main__ - Step 3156: {'lr': 5.2533333333333334e-05, 'samples': 100992, 'steps': 197, 'loss/train': 5.729577541351318} -09/20/2021 15:10:15 - INFO - __main__ - Step 3157: {'lr': 5.2533333333333334e-05, 'samples': 101024, 'steps': 197, 'loss/train': 5.939037322998047} -09/20/2021 15:10:16 - INFO - __main__ - Step 3158: {'lr': 5.2533333333333334e-05, 'samples': 101056, 'steps': 197, 'loss/train': 5.4659833908081055} -09/20/2021 15:10:17 - INFO - __main__ - Step 3159: {'lr': 5.2533333333333334e-05, 'samples': 101088, 'steps': 197, 'loss/train': 5.675246715545654} -09/20/2021 15:10:18 - INFO - __main__ - Step 3160: {'lr': 5.2533333333333334e-05, 'samples': 101120, 'steps': 197, 'loss/train': 6.2067060470581055} -09/20/2021 15:10:18 - INFO - __main__ - Step 3161: {'lr': 5.2533333333333334e-05, 'samples': 101152, 'steps': 197, 'loss/train': 6.128935813903809} -09/20/2021 15:10:19 - INFO - __main__ - Step 3162: {'lr': 5.2533333333333334e-05, 'samples': 101184, 'steps': 197, 'loss/train': 5.699390888214111} -09/20/2021 15:10:20 - INFO - __main__ - Step 3163: {'lr': 5.2533333333333334e-05, 'samples': 101216, 'steps': 197, 'loss/train': 6.264615058898926} -09/20/2021 15:10:21 - INFO - __main__ - Step 3164: {'lr': 5.2533333333333334e-05, 'samples': 101248, 'steps': 197, 'loss/train': 6.075412273406982} -09/20/2021 15:10:21 - INFO - __main__ - Step 3165: {'lr': 5.2533333333333334e-05, 'samples': 101280, 'steps': 197, 'loss/train': 6.4854021072387695} -09/20/2021 15:10:22 - INFO - __main__ - Step 3166: {'lr': 5.2533333333333334e-05, 'samples': 101312, 'steps': 197, 'loss/train': 6.175037860870361} -09/20/2021 15:10:23 - INFO - __main__ - Step 3167: {'lr': 5.2533333333333334e-05, 'samples': 101344, 'steps': 197, 'loss/train': 6.1355509757995605} -09/20/2021 15:10:24 - INFO - __main__ - Step 3168: {'lr': 5.2533333333333334e-05, 'samples': 101376, 'steps': 197, 'loss/train': 5.223048210144043} -09/20/2021 15:10:25 - INFO - __main__ - Step 3169: {'lr': 5.28e-05, 'samples': 101408, 'steps': 198, 'loss/train': 6.128709316253662} -09/20/2021 15:10:25 - INFO - __main__ - Step 3170: {'lr': 5.28e-05, 'samples': 101440, 'steps': 198, 'loss/train': 5.749942779541016} -09/20/2021 15:10:26 - INFO - __main__ - Step 3171: {'lr': 5.28e-05, 'samples': 101472, 'steps': 198, 'loss/train': 5.864528179168701} -09/20/2021 15:10:27 - INFO - __main__ - Step 3172: {'lr': 5.28e-05, 'samples': 101504, 'steps': 198, 'loss/train': 5.749206066131592} -09/20/2021 15:10:28 - INFO - __main__ - Step 3173: {'lr': 5.28e-05, 'samples': 101536, 'steps': 198, 'loss/train': 6.343986988067627} -09/20/2021 15:10:28 - INFO - __main__ - Step 3174: {'lr': 5.28e-05, 'samples': 101568, 'steps': 198, 'loss/train': 5.662599563598633} -09/20/2021 15:10:29 - INFO - __main__ - Step 3175: {'lr': 5.28e-05, 'samples': 101600, 'steps': 198, 'loss/train': 4.3784613609313965} -09/20/2021 15:10:30 - INFO - __main__ - Step 3176: {'lr': 5.28e-05, 'samples': 101632, 'steps': 198, 'loss/train': 4.197738170623779} -09/20/2021 15:10:31 - INFO - __main__ - Step 3177: {'lr': 5.28e-05, 'samples': 101664, 'steps': 198, 'loss/train': 4.180964946746826} -09/20/2021 15:10:31 - INFO - __main__ - Step 3178: {'lr': 5.28e-05, 'samples': 101696, 'steps': 198, 'loss/train': 4.190148830413818} -09/20/2021 15:10:32 - INFO - __main__ - Step 3179: {'lr': 5.28e-05, 'samples': 101728, 'steps': 198, 'loss/train': 4.428207874298096} -09/20/2021 15:10:33 - INFO - __main__ - Step 3180: {'lr': 5.28e-05, 'samples': 101760, 'steps': 198, 'loss/train': 6.148026943206787} -09/20/2021 15:10:34 - INFO - __main__ - Step 3181: {'lr': 5.28e-05, 'samples': 101792, 'steps': 198, 'loss/train': 5.88201379776001} -09/20/2021 15:10:35 - INFO - __main__ - Step 3182: {'lr': 5.28e-05, 'samples': 101824, 'steps': 198, 'loss/train': 5.560147762298584} -09/20/2021 15:10:36 - INFO - __main__ - Step 3183: {'lr': 5.28e-05, 'samples': 101856, 'steps': 198, 'loss/train': 5.962932586669922} -09/20/2021 15:10:36 - INFO - __main__ - Step 3184: {'lr': 5.28e-05, 'samples': 101888, 'steps': 198, 'loss/train': 5.285445690155029} -09/20/2021 15:10:37 - INFO - __main__ - Step 3185: {'lr': 5.3066666666666665e-05, 'samples': 101920, 'steps': 199, 'loss/train': 6.055176734924316} -09/20/2021 15:10:38 - INFO - __main__ - Step 3186: {'lr': 5.3066666666666665e-05, 'samples': 101952, 'steps': 199, 'loss/train': 5.899539947509766} -09/20/2021 15:10:39 - INFO - __main__ - Step 3187: {'lr': 5.3066666666666665e-05, 'samples': 101984, 'steps': 199, 'loss/train': 6.71774959564209} -09/20/2021 15:10:39 - INFO - __main__ - Step 3188: {'lr': 5.3066666666666665e-05, 'samples': 102016, 'steps': 199, 'loss/train': 5.606783390045166} -09/20/2021 15:10:40 - INFO - __main__ - Step 3189: {'lr': 5.3066666666666665e-05, 'samples': 102048, 'steps': 199, 'loss/train': 5.067574977874756} -09/20/2021 15:10:41 - INFO - __main__ - Step 3190: {'lr': 5.3066666666666665e-05, 'samples': 102080, 'steps': 199, 'loss/train': 5.852926254272461} -09/20/2021 15:10:42 - INFO - __main__ - Step 3191: {'lr': 5.3066666666666665e-05, 'samples': 102112, 'steps': 199, 'loss/train': 6.036534786224365} -09/20/2021 15:10:42 - INFO - __main__ - Step 3192: {'lr': 5.3066666666666665e-05, 'samples': 102144, 'steps': 199, 'loss/train': 5.980940341949463} -09/20/2021 15:10:43 - INFO - __main__ - Step 3193: {'lr': 5.3066666666666665e-05, 'samples': 102176, 'steps': 199, 'loss/train': 6.537544250488281} -09/20/2021 15:10:44 - INFO - __main__ - Step 3194: {'lr': 5.3066666666666665e-05, 'samples': 102208, 'steps': 199, 'loss/train': 5.673810005187988} -09/20/2021 15:10:45 - INFO - __main__ - Step 3195: {'lr': 5.3066666666666665e-05, 'samples': 102240, 'steps': 199, 'loss/train': 5.187787055969238} -09/20/2021 15:10:45 - INFO - __main__ - Step 3196: {'lr': 5.3066666666666665e-05, 'samples': 102272, 'steps': 199, 'loss/train': 6.600401878356934} -09/20/2021 15:10:46 - INFO - __main__ - Step 3197: {'lr': 5.3066666666666665e-05, 'samples': 102304, 'steps': 199, 'loss/train': 5.564239025115967} -09/20/2021 15:10:47 - INFO - __main__ - Step 3198: {'lr': 5.3066666666666665e-05, 'samples': 102336, 'steps': 199, 'loss/train': 6.029198169708252} -09/20/2021 15:10:48 - INFO - __main__ - Step 3199: {'lr': 5.3066666666666665e-05, 'samples': 102368, 'steps': 199, 'loss/train': 5.934338569641113} -09/20/2021 15:10:48 - INFO - __main__ - Step 3200: {'lr': 5.3066666666666665e-05, 'samples': 102400, 'steps': 199, 'loss/train': 6.504249095916748} -09/20/2021 15:10:49 - INFO - __main__ - Step 3201: {'lr': 5.333333333333333e-05, 'samples': 102432, 'steps': 200, 'loss/train': 7.364745140075684} -09/20/2021 15:10:50 - INFO - __main__ - Step 3202: {'lr': 5.333333333333333e-05, 'samples': 102464, 'steps': 200, 'loss/train': 5.859498500823975} -09/20/2021 15:10:51 - INFO - __main__ - Step 3203: {'lr': 5.333333333333333e-05, 'samples': 102496, 'steps': 200, 'loss/train': 6.6390461921691895} -09/20/2021 15:10:52 - INFO - __main__ - Step 3204: {'lr': 5.333333333333333e-05, 'samples': 102528, 'steps': 200, 'loss/train': 6.381119728088379} -09/20/2021 15:10:52 - INFO - __main__ - Step 3205: {'lr': 5.333333333333333e-05, 'samples': 102560, 'steps': 200, 'loss/train': 5.745388031005859} -09/20/2021 15:10:53 - INFO - __main__ - Step 3206: {'lr': 5.333333333333333e-05, 'samples': 102592, 'steps': 200, 'loss/train': 6.543476581573486} -09/20/2021 15:10:54 - INFO - __main__ - Step 3207: {'lr': 5.333333333333333e-05, 'samples': 102624, 'steps': 200, 'loss/train': 5.063370227813721} -09/20/2021 15:10:55 - INFO - __main__ - Step 3208: {'lr': 5.333333333333333e-05, 'samples': 102656, 'steps': 200, 'loss/train': 6.354869365692139} -09/20/2021 15:10:55 - INFO - __main__ - Step 3209: {'lr': 5.333333333333333e-05, 'samples': 102688, 'steps': 200, 'loss/train': 6.368072986602783} -09/20/2021 15:10:56 - INFO - __main__ - Step 3210: {'lr': 5.333333333333333e-05, 'samples': 102720, 'steps': 200, 'loss/train': 5.450056076049805} -09/20/2021 15:10:58 - INFO - __main__ - Step 3211: {'lr': 5.333333333333333e-05, 'samples': 102752, 'steps': 200, 'loss/train': 5.598771095275879} -09/20/2021 15:10:59 - INFO - __main__ - Step 3212: {'lr': 5.333333333333333e-05, 'samples': 102784, 'steps': 200, 'loss/train': 5.187529563903809} -09/20/2021 15:10:59 - INFO - __main__ - Step 3213: {'lr': 5.333333333333333e-05, 'samples': 102816, 'steps': 200, 'loss/train': 5.345273494720459} -09/20/2021 15:11:00 - INFO - __main__ - Step 3214: {'lr': 5.333333333333333e-05, 'samples': 102848, 'steps': 200, 'loss/train': 5.599050045013428} -09/20/2021 15:11:01 - INFO - __main__ - Step 3215: {'lr': 5.333333333333333e-05, 'samples': 102880, 'steps': 200, 'loss/train': 5.163571357727051} -09/20/2021 15:11:02 - INFO - __main__ - Step 3216: {'lr': 5.333333333333333e-05, 'samples': 102912, 'steps': 200, 'loss/train': 5.2088141441345215} -09/20/2021 15:11:03 - INFO - __main__ - Step 3217: {'lr': 5.360000000000001e-05, 'samples': 102944, 'steps': 201, 'loss/train': 5.470898628234863} -09/20/2021 15:11:03 - INFO - __main__ - Step 3218: {'lr': 5.360000000000001e-05, 'samples': 102976, 'steps': 201, 'loss/train': 6.246304988861084} -09/20/2021 15:11:04 - INFO - __main__ - Step 3219: {'lr': 5.360000000000001e-05, 'samples': 103008, 'steps': 201, 'loss/train': 6.369602680206299} -09/20/2021 15:11:05 - INFO - __main__ - Step 3220: {'lr': 5.360000000000001e-05, 'samples': 103040, 'steps': 201, 'loss/train': 5.597744941711426} -09/20/2021 15:11:06 - INFO - __main__ - Step 3221: {'lr': 5.360000000000001e-05, 'samples': 103072, 'steps': 201, 'loss/train': 5.838569164276123} -09/20/2021 15:11:06 - INFO - __main__ - Step 3222: {'lr': 5.360000000000001e-05, 'samples': 103104, 'steps': 201, 'loss/train': 6.467062473297119} -09/20/2021 15:11:07 - INFO - __main__ - Step 3223: {'lr': 5.360000000000001e-05, 'samples': 103136, 'steps': 201, 'loss/train': 5.471625328063965} -09/20/2021 15:11:08 - INFO - __main__ - Step 3224: {'lr': 5.360000000000001e-05, 'samples': 103168, 'steps': 201, 'loss/train': 5.922796249389648} -09/20/2021 15:11:09 - INFO - __main__ - Step 3225: {'lr': 5.360000000000001e-05, 'samples': 103200, 'steps': 201, 'loss/train': 5.712939739227295} -09/20/2021 15:11:09 - INFO - __main__ - Step 3226: {'lr': 5.360000000000001e-05, 'samples': 103232, 'steps': 201, 'loss/train': 5.848893642425537} -09/20/2021 15:11:10 - INFO - __main__ - Step 3227: {'lr': 5.360000000000001e-05, 'samples': 103264, 'steps': 201, 'loss/train': 5.861618995666504} -09/20/2021 15:11:11 - INFO - __main__ - Step 3228: {'lr': 5.360000000000001e-05, 'samples': 103296, 'steps': 201, 'loss/train': 7.033451557159424} -09/20/2021 15:11:12 - INFO - __main__ - Step 3229: {'lr': 5.360000000000001e-05, 'samples': 103328, 'steps': 201, 'loss/train': 6.360104084014893} -09/20/2021 15:11:12 - INFO - __main__ - Step 3230: {'lr': 5.360000000000001e-05, 'samples': 103360, 'steps': 201, 'loss/train': 6.934819221496582} -09/20/2021 15:11:13 - INFO - __main__ - Step 3231: {'lr': 5.360000000000001e-05, 'samples': 103392, 'steps': 201, 'loss/train': 7.272984027862549} -09/20/2021 15:11:14 - INFO - __main__ - Step 3232: {'lr': 5.360000000000001e-05, 'samples': 103424, 'steps': 201, 'loss/train': 5.874741077423096} -09/20/2021 15:11:15 - INFO - __main__ - Step 3233: {'lr': 5.3866666666666664e-05, 'samples': 103456, 'steps': 202, 'loss/train': 5.867066860198975} -09/20/2021 15:11:15 - INFO - __main__ - Step 3234: {'lr': 5.3866666666666664e-05, 'samples': 103488, 'steps': 202, 'loss/train': 5.898739337921143} -09/20/2021 15:11:16 - INFO - __main__ - Step 3235: {'lr': 5.3866666666666664e-05, 'samples': 103520, 'steps': 202, 'loss/train': 5.297445774078369} -09/20/2021 15:11:17 - INFO - __main__ - Step 3236: {'lr': 5.3866666666666664e-05, 'samples': 103552, 'steps': 202, 'loss/train': 5.149487495422363} -09/20/2021 15:11:18 - INFO - __main__ - Step 3237: {'lr': 5.3866666666666664e-05, 'samples': 103584, 'steps': 202, 'loss/train': 6.469545841217041} -09/20/2021 15:11:18 - INFO - __main__ - Step 3238: {'lr': 5.3866666666666664e-05, 'samples': 103616, 'steps': 202, 'loss/train': 5.816241264343262} -09/20/2021 15:11:19 - INFO - __main__ - Step 3239: {'lr': 5.3866666666666664e-05, 'samples': 103648, 'steps': 202, 'loss/train': 5.666479587554932} -09/20/2021 15:11:20 - INFO - __main__ - Step 3240: {'lr': 5.3866666666666664e-05, 'samples': 103680, 'steps': 202, 'loss/train': 5.554166316986084} -09/20/2021 15:11:21 - INFO - __main__ - Step 3241: {'lr': 5.3866666666666664e-05, 'samples': 103712, 'steps': 202, 'loss/train': 5.286786079406738} -09/20/2021 15:11:22 - INFO - __main__ - Step 3242: {'lr': 5.3866666666666664e-05, 'samples': 103744, 'steps': 202, 'loss/train': 5.536684036254883} -09/20/2021 15:11:23 - INFO - __main__ - Step 3243: {'lr': 5.3866666666666664e-05, 'samples': 103776, 'steps': 202, 'loss/train': 6.172159671783447} -09/20/2021 15:11:23 - INFO - __main__ - Step 3244: {'lr': 5.3866666666666664e-05, 'samples': 103808, 'steps': 202, 'loss/train': 6.351017475128174} -09/20/2021 15:11:24 - INFO - __main__ - Step 3245: {'lr': 5.3866666666666664e-05, 'samples': 103840, 'steps': 202, 'loss/train': 5.936014652252197} -09/20/2021 15:11:25 - INFO - __main__ - Step 3246: {'lr': 5.3866666666666664e-05, 'samples': 103872, 'steps': 202, 'loss/train': 5.684876918792725} -09/20/2021 15:11:26 - INFO - __main__ - Step 3247: {'lr': 5.3866666666666664e-05, 'samples': 103904, 'steps': 202, 'loss/train': 5.856678009033203} -09/20/2021 15:11:26 - INFO - __main__ - Step 3248: {'lr': 5.3866666666666664e-05, 'samples': 103936, 'steps': 202, 'loss/train': 6.34390926361084} -09/20/2021 15:11:27 - INFO - __main__ - Step 3249: {'lr': 5.413333333333334e-05, 'samples': 103968, 'steps': 203, 'loss/train': 6.126351833343506} -09/20/2021 15:11:28 - INFO - __main__ - Step 3250: {'lr': 5.413333333333334e-05, 'samples': 104000, 'steps': 203, 'loss/train': 5.616748332977295} -09/20/2021 15:11:29 - INFO - __main__ - Step 3251: {'lr': 5.413333333333334e-05, 'samples': 104032, 'steps': 203, 'loss/train': 6.170934677124023} -09/20/2021 15:11:30 - INFO - __main__ - Step 3252: {'lr': 5.413333333333334e-05, 'samples': 104064, 'steps': 203, 'loss/train': 6.81226110458374} -09/20/2021 15:11:30 - INFO - __main__ - Step 3253: {'lr': 5.413333333333334e-05, 'samples': 104096, 'steps': 203, 'loss/train': 5.6181535720825195} -09/20/2021 15:11:31 - INFO - __main__ - Step 3254: {'lr': 5.413333333333334e-05, 'samples': 104128, 'steps': 203, 'loss/train': 5.970429420471191} -09/20/2021 15:11:32 - INFO - __main__ - Step 3255: {'lr': 5.413333333333334e-05, 'samples': 104160, 'steps': 203, 'loss/train': 5.920804500579834} -09/20/2021 15:11:33 - INFO - __main__ - Step 3256: {'lr': 5.413333333333334e-05, 'samples': 104192, 'steps': 203, 'loss/train': 5.723638534545898} -09/20/2021 15:11:33 - INFO - __main__ - Step 3257: {'lr': 5.413333333333334e-05, 'samples': 104224, 'steps': 203, 'loss/train': 6.534539699554443} -09/20/2021 15:11:34 - INFO - __main__ - Step 3258: {'lr': 5.413333333333334e-05, 'samples': 104256, 'steps': 203, 'loss/train': 5.71569299697876} -09/20/2021 15:11:35 - INFO - __main__ - Step 3259: {'lr': 5.413333333333334e-05, 'samples': 104288, 'steps': 203, 'loss/train': 5.47739839553833} -09/20/2021 15:11:36 - INFO - __main__ - Step 3260: {'lr': 5.413333333333334e-05, 'samples': 104320, 'steps': 203, 'loss/train': 5.578474521636963} -09/20/2021 15:11:36 - INFO - __main__ - Step 3261: {'lr': 5.413333333333334e-05, 'samples': 104352, 'steps': 203, 'loss/train': 5.764491558074951} -09/20/2021 15:11:37 - INFO - __main__ - Step 3262: {'lr': 5.413333333333334e-05, 'samples': 104384, 'steps': 203, 'loss/train': 5.60609769821167} -09/20/2021 15:11:38 - INFO - __main__ - Step 3263: {'lr': 5.413333333333334e-05, 'samples': 104416, 'steps': 203, 'loss/train': 5.57835054397583} -09/20/2021 15:11:39 - INFO - __main__ - Step 3264: {'lr': 5.413333333333334e-05, 'samples': 104448, 'steps': 203, 'loss/train': 4.747824668884277} -09/20/2021 15:11:40 - INFO - __main__ - Step 3265: {'lr': 5.440000000000001e-05, 'samples': 104480, 'steps': 204, 'loss/train': 5.850223064422607} -09/20/2021 15:11:40 - INFO - __main__ - Step 3266: {'lr': 5.440000000000001e-05, 'samples': 104512, 'steps': 204, 'loss/train': 6.166018486022949} -09/20/2021 15:11:41 - INFO - __main__ - Step 3267: {'lr': 5.440000000000001e-05, 'samples': 104544, 'steps': 204, 'loss/train': 6.4256720542907715} -09/20/2021 15:11:42 - INFO - __main__ - Step 3268: {'lr': 5.440000000000001e-05, 'samples': 104576, 'steps': 204, 'loss/train': 5.679245948791504} -09/20/2021 15:11:43 - INFO - __main__ - Step 3269: {'lr': 5.440000000000001e-05, 'samples': 104608, 'steps': 204, 'loss/train': 5.661729335784912} -09/20/2021 15:11:43 - INFO - __main__ - Step 3270: {'lr': 5.440000000000001e-05, 'samples': 104640, 'steps': 204, 'loss/train': 5.75294303894043} -09/20/2021 15:11:44 - INFO - __main__ - Step 3271: {'lr': 5.440000000000001e-05, 'samples': 104672, 'steps': 204, 'loss/train': 5.676864147186279} -09/20/2021 15:11:45 - INFO - __main__ - Step 3272: {'lr': 5.440000000000001e-05, 'samples': 104704, 'steps': 204, 'loss/train': 6.109148979187012} -09/20/2021 15:11:46 - INFO - __main__ - Step 3273: {'lr': 5.440000000000001e-05, 'samples': 104736, 'steps': 204, 'loss/train': 6.497394561767578} -09/20/2021 15:11:47 - INFO - __main__ - Step 3274: {'lr': 5.440000000000001e-05, 'samples': 104768, 'steps': 204, 'loss/train': 3.9443414211273193} -09/20/2021 15:11:48 - INFO - __main__ - Step 3275: {'lr': 5.440000000000001e-05, 'samples': 104800, 'steps': 204, 'loss/train': 3.8898141384124756} -09/20/2021 15:11:49 - INFO - __main__ - Step 3276: {'lr': 5.440000000000001e-05, 'samples': 104832, 'steps': 204, 'loss/train': 4.612909317016602} -09/20/2021 15:11:49 - INFO - __main__ - Step 3277: {'lr': 5.440000000000001e-05, 'samples': 104864, 'steps': 204, 'loss/train': 6.010329723358154} -09/20/2021 15:11:50 - INFO - __main__ - Step 3278: {'lr': 5.440000000000001e-05, 'samples': 104896, 'steps': 204, 'loss/train': 6.298149108886719} -09/20/2021 15:11:51 - INFO - __main__ - Step 3279: {'lr': 5.440000000000001e-05, 'samples': 104928, 'steps': 204, 'loss/train': 5.700962066650391} -09/20/2021 15:11:52 - INFO - __main__ - Step 3280: {'lr': 5.440000000000001e-05, 'samples': 104960, 'steps': 204, 'loss/train': 4.094084739685059} -09/20/2021 15:11:53 - INFO - __main__ - Step 3281: {'lr': 5.466666666666666e-05, 'samples': 104992, 'steps': 205, 'loss/train': 4.042451858520508} -09/20/2021 15:11:53 - INFO - __main__ - Step 3282: {'lr': 5.466666666666666e-05, 'samples': 105024, 'steps': 205, 'loss/train': 4.469601154327393} -09/20/2021 15:11:54 - INFO - __main__ - Step 3283: {'lr': 5.466666666666666e-05, 'samples': 105056, 'steps': 205, 'loss/train': 3.537456750869751} -09/20/2021 15:11:55 - INFO - __main__ - Step 3284: {'lr': 5.466666666666666e-05, 'samples': 105088, 'steps': 205, 'loss/train': 3.78621244430542} -09/20/2021 15:11:56 - INFO - __main__ - Step 3285: {'lr': 5.466666666666666e-05, 'samples': 105120, 'steps': 205, 'loss/train': 5.323331832885742} -09/20/2021 15:11:56 - INFO - __main__ - Step 3286: {'lr': 5.466666666666666e-05, 'samples': 105152, 'steps': 205, 'loss/train': 6.956617832183838} -09/20/2021 15:11:57 - INFO - __main__ - Step 3287: {'lr': 5.466666666666666e-05, 'samples': 105184, 'steps': 205, 'loss/train': 4.821713924407959} -09/20/2021 15:11:58 - INFO - __main__ - Step 3288: {'lr': 5.466666666666666e-05, 'samples': 105216, 'steps': 205, 'loss/train': 5.957865238189697} -09/20/2021 15:11:59 - INFO - __main__ - Step 3289: {'lr': 5.466666666666666e-05, 'samples': 105248, 'steps': 205, 'loss/train': 5.081448554992676} -09/20/2021 15:11:59 - INFO - __main__ - Step 3290: {'lr': 5.466666666666666e-05, 'samples': 105280, 'steps': 205, 'loss/train': 5.227928161621094} -09/20/2021 15:12:00 - INFO - __main__ - Step 3291: {'lr': 5.466666666666666e-05, 'samples': 105312, 'steps': 205, 'loss/train': 4.633972644805908} -09/20/2021 15:12:01 - INFO - __main__ - Step 3292: {'lr': 5.466666666666666e-05, 'samples': 105344, 'steps': 205, 'loss/train': 4.512956619262695} -09/20/2021 15:12:02 - INFO - __main__ - Step 3293: {'lr': 5.466666666666666e-05, 'samples': 105376, 'steps': 205, 'loss/train': 6.301919460296631} -09/20/2021 15:12:02 - INFO - __main__ - Step 3294: {'lr': 5.466666666666666e-05, 'samples': 105408, 'steps': 205, 'loss/train': 6.433948040008545} -09/20/2021 15:12:03 - INFO - __main__ - Step 3295: {'lr': 5.466666666666666e-05, 'samples': 105440, 'steps': 205, 'loss/train': 4.6213836669921875} -09/20/2021 15:12:04 - INFO - __main__ - Step 3296: {'lr': 5.466666666666666e-05, 'samples': 105472, 'steps': 205, 'loss/train': 5.907901287078857} -09/20/2021 15:12:05 - INFO - __main__ - Step 3297: {'lr': 5.493333333333334e-05, 'samples': 105504, 'steps': 206, 'loss/train': 6.050973892211914} -09/20/2021 15:12:05 - INFO - __main__ - Step 3298: {'lr': 5.493333333333334e-05, 'samples': 105536, 'steps': 206, 'loss/train': 5.165439605712891} -09/20/2021 15:12:06 - INFO - __main__ - Step 3299: {'lr': 5.493333333333334e-05, 'samples': 105568, 'steps': 206, 'loss/train': 5.935155868530273} -09/20/2021 15:12:07 - INFO - __main__ - Step 3300: {'lr': 5.493333333333334e-05, 'samples': 105600, 'steps': 206, 'loss/train': 5.1518778800964355} -09/20/2021 15:12:08 - INFO - __main__ - Step 3301: {'lr': 5.493333333333334e-05, 'samples': 105632, 'steps': 206, 'loss/train': 6.0207743644714355} -09/20/2021 15:12:08 - INFO - __main__ - Step 3302: {'lr': 5.493333333333334e-05, 'samples': 105664, 'steps': 206, 'loss/train': 6.3249430656433105} -09/20/2021 15:12:09 - INFO - __main__ - Step 3303: {'lr': 5.493333333333334e-05, 'samples': 105696, 'steps': 206, 'loss/train': 5.602453231811523} -09/20/2021 15:12:10 - INFO - __main__ - Step 3304: {'lr': 5.493333333333334e-05, 'samples': 105728, 'steps': 206, 'loss/train': 5.272799015045166} -09/20/2021 15:12:11 - INFO - __main__ - Step 3305: {'lr': 5.493333333333334e-05, 'samples': 105760, 'steps': 206, 'loss/train': 6.082634449005127} -09/20/2021 15:12:11 - INFO - __main__ - Step 3306: {'lr': 5.493333333333334e-05, 'samples': 105792, 'steps': 206, 'loss/train': 4.942625999450684} -09/20/2021 15:12:12 - INFO - __main__ - Step 3307: {'lr': 5.493333333333334e-05, 'samples': 105824, 'steps': 206, 'loss/train': 4.866952896118164} -09/20/2021 15:12:13 - INFO - __main__ - Step 3308: {'lr': 5.493333333333334e-05, 'samples': 105856, 'steps': 206, 'loss/train': 6.9695563316345215} -09/20/2021 15:12:14 - INFO - __main__ - Step 3309: {'lr': 5.493333333333334e-05, 'samples': 105888, 'steps': 206, 'loss/train': 5.144078254699707} -09/20/2021 15:12:15 - INFO - __main__ - Step 3310: {'lr': 5.493333333333334e-05, 'samples': 105920, 'steps': 206, 'loss/train': 4.230056285858154} -09/20/2021 15:12:16 - INFO - __main__ - Step 3311: {'lr': 5.493333333333334e-05, 'samples': 105952, 'steps': 206, 'loss/train': 5.638094425201416} -09/20/2021 15:12:16 - INFO - __main__ - Step 3312: {'lr': 5.493333333333334e-05, 'samples': 105984, 'steps': 206, 'loss/train': 6.076585292816162} -09/20/2021 15:12:17 - INFO - __main__ - Step 3313: {'lr': 5.520000000000001e-05, 'samples': 106016, 'steps': 207, 'loss/train': 5.422543048858643} -09/20/2021 15:12:18 - INFO - __main__ - Step 3314: {'lr': 5.520000000000001e-05, 'samples': 106048, 'steps': 207, 'loss/train': 5.659474849700928} -09/20/2021 15:12:19 - INFO - __main__ - Step 3315: {'lr': 5.520000000000001e-05, 'samples': 106080, 'steps': 207, 'loss/train': 5.876163482666016} -09/20/2021 15:12:20 - INFO - __main__ - Step 3316: {'lr': 5.520000000000001e-05, 'samples': 106112, 'steps': 207, 'loss/train': 5.313589572906494} -09/20/2021 15:12:20 - INFO - __main__ - Step 3317: {'lr': 5.520000000000001e-05, 'samples': 106144, 'steps': 207, 'loss/train': 5.304947853088379} -09/20/2021 15:12:21 - INFO - __main__ - Step 3318: {'lr': 5.520000000000001e-05, 'samples': 106176, 'steps': 207, 'loss/train': 6.376590251922607} -09/20/2021 15:12:22 - INFO - __main__ - Step 3319: {'lr': 5.520000000000001e-05, 'samples': 106208, 'steps': 207, 'loss/train': 5.7564826011657715} -09/20/2021 15:12:23 - INFO - __main__ - Step 3320: {'lr': 5.520000000000001e-05, 'samples': 106240, 'steps': 207, 'loss/train': 5.970577239990234} -09/20/2021 15:12:23 - INFO - __main__ - Step 3321: {'lr': 5.520000000000001e-05, 'samples': 106272, 'steps': 207, 'loss/train': 5.415234565734863} -09/20/2021 15:12:24 - INFO - __main__ - Step 3322: {'lr': 5.520000000000001e-05, 'samples': 106304, 'steps': 207, 'loss/train': 5.61488151550293} -09/20/2021 15:12:25 - INFO - __main__ - Step 3323: {'lr': 5.520000000000001e-05, 'samples': 106336, 'steps': 207, 'loss/train': 6.580893516540527} -09/20/2021 15:12:26 - INFO - __main__ - Step 3324: {'lr': 5.520000000000001e-05, 'samples': 106368, 'steps': 207, 'loss/train': 4.991863250732422} -09/20/2021 15:12:26 - INFO - __main__ - Step 3325: {'lr': 5.520000000000001e-05, 'samples': 106400, 'steps': 207, 'loss/train': 5.149253845214844} -09/20/2021 15:12:27 - INFO - __main__ - Step 3326: {'lr': 5.520000000000001e-05, 'samples': 106432, 'steps': 207, 'loss/train': 6.34046745300293} -09/20/2021 15:12:28 - INFO - __main__ - Step 3327: {'lr': 5.520000000000001e-05, 'samples': 106464, 'steps': 207, 'loss/train': 6.436407566070557} -09/20/2021 15:12:29 - INFO - __main__ - Step 3328: {'lr': 5.520000000000001e-05, 'samples': 106496, 'steps': 207, 'loss/train': 5.83427095413208} -09/20/2021 15:12:29 - INFO - __main__ - Step 3329: {'lr': 5.546666666666667e-05, 'samples': 106528, 'steps': 208, 'loss/train': 5.941085338592529} -09/20/2021 15:12:30 - INFO - __main__ - Step 3330: {'lr': 5.546666666666667e-05, 'samples': 106560, 'steps': 208, 'loss/train': 5.111279487609863} -09/20/2021 15:12:31 - INFO - __main__ - Step 3331: {'lr': 5.546666666666667e-05, 'samples': 106592, 'steps': 208, 'loss/train': 4.950228214263916} -09/20/2021 15:12:32 - INFO - __main__ - Step 3332: {'lr': 5.546666666666667e-05, 'samples': 106624, 'steps': 208, 'loss/train': 5.750357627868652} -09/20/2021 15:12:32 - INFO - __main__ - Step 3333: {'lr': 5.546666666666667e-05, 'samples': 106656, 'steps': 208, 'loss/train': 6.306267261505127} -09/20/2021 15:12:33 - INFO - __main__ - Step 3334: {'lr': 5.546666666666667e-05, 'samples': 106688, 'steps': 208, 'loss/train': 6.046755790710449} -09/20/2021 15:12:34 - INFO - __main__ - Step 3335: {'lr': 5.546666666666667e-05, 'samples': 106720, 'steps': 208, 'loss/train': 5.0890703201293945} -09/20/2021 15:12:35 - INFO - __main__ - Step 3336: {'lr': 5.546666666666667e-05, 'samples': 106752, 'steps': 208, 'loss/train': 5.842859268188477} -09/20/2021 15:12:35 - INFO - __main__ - Step 3337: {'lr': 5.546666666666667e-05, 'samples': 106784, 'steps': 208, 'loss/train': 4.929736137390137} -09/20/2021 15:12:36 - INFO - __main__ - Step 3338: {'lr': 5.546666666666667e-05, 'samples': 106816, 'steps': 208, 'loss/train': 5.388038158416748} -09/20/2021 15:12:38 - INFO - __main__ - Step 3339: {'lr': 5.546666666666667e-05, 'samples': 106848, 'steps': 208, 'loss/train': 5.962072849273682} -09/20/2021 15:12:38 - INFO - __main__ - Step 3340: {'lr': 5.546666666666667e-05, 'samples': 106880, 'steps': 208, 'loss/train': 5.674485683441162} -09/20/2021 15:12:39 - INFO - __main__ - Step 3341: {'lr': 5.546666666666667e-05, 'samples': 106912, 'steps': 208, 'loss/train': 5.949653625488281} -09/20/2021 15:12:40 - INFO - __main__ - Step 3342: {'lr': 5.546666666666667e-05, 'samples': 106944, 'steps': 208, 'loss/train': 5.73410701751709} -09/20/2021 15:12:41 - INFO - __main__ - Step 3343: {'lr': 5.546666666666667e-05, 'samples': 106976, 'steps': 208, 'loss/train': 5.866941928863525} -09/20/2021 15:12:41 - INFO - __main__ - Step 3344: {'lr': 5.546666666666667e-05, 'samples': 107008, 'steps': 208, 'loss/train': 5.236491680145264} -09/20/2021 15:12:42 - INFO - __main__ - Step 3345: {'lr': 5.573333333333334e-05, 'samples': 107040, 'steps': 209, 'loss/train': 5.902146339416504} -09/20/2021 15:12:43 - INFO - __main__ - Step 3346: {'lr': 5.573333333333334e-05, 'samples': 107072, 'steps': 209, 'loss/train': 5.859011650085449} -09/20/2021 15:12:44 - INFO - __main__ - Step 3347: {'lr': 5.573333333333334e-05, 'samples': 107104, 'steps': 209, 'loss/train': 4.926307201385498} -09/20/2021 15:12:45 - INFO - __main__ - Step 3348: {'lr': 5.573333333333334e-05, 'samples': 107136, 'steps': 209, 'loss/train': 7.188333034515381} -09/20/2021 15:12:45 - INFO - __main__ - Step 3349: {'lr': 5.573333333333334e-05, 'samples': 107168, 'steps': 209, 'loss/train': 6.186385631561279} -09/20/2021 15:12:46 - INFO - __main__ - Step 3350: {'lr': 5.573333333333334e-05, 'samples': 107200, 'steps': 209, 'loss/train': 5.5409674644470215} -09/20/2021 15:12:47 - INFO - __main__ - Step 3351: {'lr': 5.573333333333334e-05, 'samples': 107232, 'steps': 209, 'loss/train': 5.498532772064209} -09/20/2021 15:12:48 - INFO - __main__ - Step 3352: {'lr': 5.573333333333334e-05, 'samples': 107264, 'steps': 209, 'loss/train': 7.594634532928467} -09/20/2021 15:12:48 - INFO - __main__ - Step 3353: {'lr': 5.573333333333334e-05, 'samples': 107296, 'steps': 209, 'loss/train': 6.048120021820068} -09/20/2021 15:12:49 - INFO - __main__ - Step 3354: {'lr': 5.573333333333334e-05, 'samples': 107328, 'steps': 209, 'loss/train': 5.465426921844482} -09/20/2021 15:12:50 - INFO - __main__ - Step 3355: {'lr': 5.573333333333334e-05, 'samples': 107360, 'steps': 209, 'loss/train': 5.0487961769104} -09/20/2021 15:12:51 - INFO - __main__ - Step 3356: {'lr': 5.573333333333334e-05, 'samples': 107392, 'steps': 209, 'loss/train': 5.8885979652404785} -09/20/2021 15:12:51 - INFO - __main__ - Step 3357: {'lr': 5.573333333333334e-05, 'samples': 107424, 'steps': 209, 'loss/train': 5.475398540496826} -09/20/2021 15:12:52 - INFO - __main__ - Step 3358: {'lr': 5.573333333333334e-05, 'samples': 107456, 'steps': 209, 'loss/train': 5.639043807983398} -09/20/2021 15:12:53 - INFO - __main__ - Step 3359: {'lr': 5.573333333333334e-05, 'samples': 107488, 'steps': 209, 'loss/train': 6.098813056945801} -09/20/2021 15:12:54 - INFO - __main__ - Step 3360: {'lr': 5.573333333333334e-05, 'samples': 107520, 'steps': 209, 'loss/train': 6.041276454925537} -09/20/2021 15:12:54 - INFO - __main__ - Step 3361: {'lr': 5.6000000000000006e-05, 'samples': 107552, 'steps': 210, 'loss/train': 5.715883731842041} -09/20/2021 15:12:55 - INFO - __main__ - Step 3362: {'lr': 5.6000000000000006e-05, 'samples': 107584, 'steps': 210, 'loss/train': 6.6241960525512695} -09/20/2021 15:12:56 - INFO - __main__ - Step 3363: {'lr': 5.6000000000000006e-05, 'samples': 107616, 'steps': 210, 'loss/train': 6.426231861114502} -09/20/2021 15:12:57 - INFO - __main__ - Step 3364: {'lr': 5.6000000000000006e-05, 'samples': 107648, 'steps': 210, 'loss/train': 6.142449378967285} -09/20/2021 15:12:57 - INFO - __main__ - Step 3365: {'lr': 5.6000000000000006e-05, 'samples': 107680, 'steps': 210, 'loss/train': 6.707741737365723} -09/20/2021 15:12:58 - INFO - __main__ - Step 3366: {'lr': 5.6000000000000006e-05, 'samples': 107712, 'steps': 210, 'loss/train': 8.724963188171387} -09/20/2021 15:12:59 - INFO - __main__ - Step 3367: {'lr': 5.6000000000000006e-05, 'samples': 107744, 'steps': 210, 'loss/train': 5.858310699462891} -09/20/2021 15:13:00 - INFO - __main__ - Step 3368: {'lr': 5.6000000000000006e-05, 'samples': 107776, 'steps': 210, 'loss/train': 7.277842044830322} -09/20/2021 15:13:00 - INFO - __main__ - Step 3369: {'lr': 5.6000000000000006e-05, 'samples': 107808, 'steps': 210, 'loss/train': 4.990050315856934} -09/20/2021 15:13:02 - INFO - __main__ - Step 3370: {'lr': 5.6000000000000006e-05, 'samples': 107840, 'steps': 210, 'loss/train': 5.709041118621826} -09/20/2021 15:13:02 - INFO - __main__ - Step 3371: {'lr': 5.6000000000000006e-05, 'samples': 107872, 'steps': 210, 'loss/train': 5.7729878425598145} -09/20/2021 15:13:03 - INFO - __main__ - Step 3372: {'lr': 5.6000000000000006e-05, 'samples': 107904, 'steps': 210, 'loss/train': 5.782525539398193} -09/20/2021 15:13:04 - INFO - __main__ - Step 3373: {'lr': 5.6000000000000006e-05, 'samples': 107936, 'steps': 210, 'loss/train': 6.161109447479248} -09/20/2021 15:13:05 - INFO - __main__ - Step 3374: {'lr': 5.6000000000000006e-05, 'samples': 107968, 'steps': 210, 'loss/train': 5.878137588500977} -09/20/2021 15:13:05 - INFO - __main__ - Step 3375: {'lr': 5.6000000000000006e-05, 'samples': 108000, 'steps': 210, 'loss/train': 5.468287467956543} -09/20/2021 15:13:06 - INFO - __main__ - Step 3376: {'lr': 5.6000000000000006e-05, 'samples': 108032, 'steps': 210, 'loss/train': 5.57853364944458} -09/20/2021 15:13:07 - INFO - __main__ - Step 3377: {'lr': 5.626666666666667e-05, 'samples': 108064, 'steps': 211, 'loss/train': 5.939549446105957} -09/20/2021 15:13:08 - INFO - __main__ - Step 3378: {'lr': 5.626666666666667e-05, 'samples': 108096, 'steps': 211, 'loss/train': 5.839690685272217} -09/20/2021 15:13:09 - INFO - __main__ - Step 3379: {'lr': 5.626666666666667e-05, 'samples': 108128, 'steps': 211, 'loss/train': 5.879246234893799} -09/20/2021 15:13:09 - INFO - __main__ - Step 3380: {'lr': 5.626666666666667e-05, 'samples': 108160, 'steps': 211, 'loss/train': 7.559290409088135} -09/20/2021 15:13:10 - INFO - __main__ - Step 3381: {'lr': 5.626666666666667e-05, 'samples': 108192, 'steps': 211, 'loss/train': 5.392391204833984} -09/20/2021 15:13:11 - INFO - __main__ - Step 3382: {'lr': 5.626666666666667e-05, 'samples': 108224, 'steps': 211, 'loss/train': 6.221250057220459} -09/20/2021 15:13:12 - INFO - __main__ - Step 3383: {'lr': 5.626666666666667e-05, 'samples': 108256, 'steps': 211, 'loss/train': 5.849564552307129} -09/20/2021 15:13:12 - INFO - __main__ - Step 3384: {'lr': 5.626666666666667e-05, 'samples': 108288, 'steps': 211, 'loss/train': 5.373847007751465} -09/20/2021 15:13:13 - INFO - __main__ - Step 3385: {'lr': 5.626666666666667e-05, 'samples': 108320, 'steps': 211, 'loss/train': 6.238867282867432} -09/20/2021 15:13:14 - INFO - __main__ - Step 3386: {'lr': 5.626666666666667e-05, 'samples': 108352, 'steps': 211, 'loss/train': 6.29409646987915} -09/20/2021 15:13:15 - INFO - __main__ - Step 3387: {'lr': 5.626666666666667e-05, 'samples': 108384, 'steps': 211, 'loss/train': 6.87113094329834} -09/20/2021 15:13:15 - INFO - __main__ - Step 3388: {'lr': 5.626666666666667e-05, 'samples': 108416, 'steps': 211, 'loss/train': 6.027515411376953} -09/20/2021 15:13:16 - INFO - __main__ - Step 3389: {'lr': 5.626666666666667e-05, 'samples': 108448, 'steps': 211, 'loss/train': 6.088496208190918} -09/20/2021 15:13:17 - INFO - __main__ - Step 3390: {'lr': 5.626666666666667e-05, 'samples': 108480, 'steps': 211, 'loss/train': 5.837799072265625} -09/20/2021 15:13:18 - INFO - __main__ - Step 3391: {'lr': 5.626666666666667e-05, 'samples': 108512, 'steps': 211, 'loss/train': 5.338809967041016} -09/20/2021 15:13:18 - INFO - __main__ - Step 3392: {'lr': 5.626666666666667e-05, 'samples': 108544, 'steps': 211, 'loss/train': 5.953395843505859} -09/20/2021 15:13:19 - INFO - __main__ - Step 3393: {'lr': 5.6533333333333336e-05, 'samples': 108576, 'steps': 212, 'loss/train': 6.118219375610352} -09/20/2021 15:13:20 - INFO - __main__ - Step 3394: {'lr': 5.6533333333333336e-05, 'samples': 108608, 'steps': 212, 'loss/train': 5.416900634765625} -09/20/2021 15:13:21 - INFO - __main__ - Step 3395: {'lr': 5.6533333333333336e-05, 'samples': 108640, 'steps': 212, 'loss/train': 4.9389119148254395} -09/20/2021 15:13:21 - INFO - __main__ - Step 3396: {'lr': 5.6533333333333336e-05, 'samples': 108672, 'steps': 212, 'loss/train': 6.040527820587158} -09/20/2021 15:13:22 - INFO - __main__ - Step 3397: {'lr': 5.6533333333333336e-05, 'samples': 108704, 'steps': 212, 'loss/train': 5.79476261138916} -09/20/2021 15:13:23 - INFO - __main__ - Step 3398: {'lr': 5.6533333333333336e-05, 'samples': 108736, 'steps': 212, 'loss/train': 5.263989448547363} -09/20/2021 15:13:24 - INFO - __main__ - Step 3399: {'lr': 5.6533333333333336e-05, 'samples': 108768, 'steps': 212, 'loss/train': 5.920090675354004} -09/20/2021 15:13:25 - INFO - __main__ - Step 3400: {'lr': 5.6533333333333336e-05, 'samples': 108800, 'steps': 212, 'loss/train': 5.5892791748046875} -09/20/2021 15:13:26 - INFO - __main__ - Step 3401: {'lr': 5.6533333333333336e-05, 'samples': 108832, 'steps': 212, 'loss/train': 5.774768352508545} -09/20/2021 15:13:27 - INFO - __main__ - Step 3402: {'lr': 5.6533333333333336e-05, 'samples': 108864, 'steps': 212, 'loss/train': 5.591148853302002} -09/20/2021 15:13:27 - INFO - __main__ - Step 3403: {'lr': 5.6533333333333336e-05, 'samples': 108896, 'steps': 212, 'loss/train': 6.104406356811523} -09/20/2021 15:13:28 - INFO - __main__ - Step 3404: {'lr': 5.6533333333333336e-05, 'samples': 108928, 'steps': 212, 'loss/train': 5.5027618408203125} -09/20/2021 15:13:29 - INFO - __main__ - Step 3405: {'lr': 5.6533333333333336e-05, 'samples': 108960, 'steps': 212, 'loss/train': 7.047525882720947} -09/20/2021 15:13:30 - INFO - __main__ - Step 3406: {'lr': 5.6533333333333336e-05, 'samples': 108992, 'steps': 212, 'loss/train': 5.829832553863525} -09/20/2021 15:13:30 - INFO - __main__ - Step 3407: {'lr': 5.6533333333333336e-05, 'samples': 109024, 'steps': 212, 'loss/train': 5.402120113372803} -09/20/2021 15:13:31 - INFO - __main__ - Step 3408: {'lr': 5.6533333333333336e-05, 'samples': 109056, 'steps': 212, 'loss/train': 6.502711296081543} -09/20/2021 15:13:32 - INFO - __main__ - Step 3409: {'lr': 5.68e-05, 'samples': 109088, 'steps': 213, 'loss/train': 6.087539196014404} -09/20/2021 15:13:33 - INFO - __main__ - Step 3410: {'lr': 5.68e-05, 'samples': 109120, 'steps': 213, 'loss/train': 5.353795051574707} -09/20/2021 15:13:33 - INFO - __main__ - Step 3411: {'lr': 5.68e-05, 'samples': 109152, 'steps': 213, 'loss/train': 5.996677875518799} -09/20/2021 15:13:34 - INFO - __main__ - Step 3412: {'lr': 5.68e-05, 'samples': 109184, 'steps': 213, 'loss/train': 5.720418453216553} -09/20/2021 15:13:35 - INFO - __main__ - Step 3413: {'lr': 5.68e-05, 'samples': 109216, 'steps': 213, 'loss/train': 4.866767883300781} -09/20/2021 15:13:36 - INFO - __main__ - Step 3414: {'lr': 5.68e-05, 'samples': 109248, 'steps': 213, 'loss/train': 5.93094539642334} -09/20/2021 15:13:36 - INFO - __main__ - Step 3415: {'lr': 5.68e-05, 'samples': 109280, 'steps': 213, 'loss/train': 5.929579734802246} -09/20/2021 15:13:37 - INFO - __main__ - Step 3416: {'lr': 5.68e-05, 'samples': 109312, 'steps': 213, 'loss/train': 5.473577499389648} -09/20/2021 15:13:38 - INFO - __main__ - Step 3417: {'lr': 5.68e-05, 'samples': 109344, 'steps': 213, 'loss/train': 6.536037445068359} -09/20/2021 15:13:39 - INFO - __main__ - Step 3418: {'lr': 5.68e-05, 'samples': 109376, 'steps': 213, 'loss/train': 5.630011558532715} -09/20/2021 15:13:39 - INFO - __main__ - Step 3419: {'lr': 5.68e-05, 'samples': 109408, 'steps': 213, 'loss/train': 5.8319292068481445} -09/20/2021 15:13:40 - INFO - __main__ - Step 3420: {'lr': 5.68e-05, 'samples': 109440, 'steps': 213, 'loss/train': 5.552813529968262} -09/20/2021 15:13:41 - INFO - __main__ - Step 3421: {'lr': 5.68e-05, 'samples': 109472, 'steps': 213, 'loss/train': 6.6199445724487305} -09/20/2021 15:13:42 - INFO - __main__ - Step 3422: {'lr': 5.68e-05, 'samples': 109504, 'steps': 213, 'loss/train': 5.642897605895996} -09/20/2021 15:13:42 - INFO - __main__ - Step 3423: {'lr': 5.68e-05, 'samples': 109536, 'steps': 213, 'loss/train': 4.875718116760254} -09/20/2021 15:13:43 - INFO - __main__ - Step 3424: {'lr': 5.68e-05, 'samples': 109568, 'steps': 213, 'loss/train': 5.394330978393555} -09/20/2021 15:13:44 - INFO - __main__ - Step 3425: {'lr': 5.706666666666667e-05, 'samples': 109600, 'steps': 214, 'loss/train': 5.549553394317627} -09/20/2021 15:13:45 - INFO - __main__ - Step 3426: {'lr': 5.706666666666667e-05, 'samples': 109632, 'steps': 214, 'loss/train': 6.64230489730835} -09/20/2021 15:13:46 - INFO - __main__ - Step 3427: {'lr': 5.706666666666667e-05, 'samples': 109664, 'steps': 214, 'loss/train': 6.195418357849121} -09/20/2021 15:13:46 - INFO - __main__ - Step 3428: {'lr': 5.706666666666667e-05, 'samples': 109696, 'steps': 214, 'loss/train': 7.192736625671387} -09/20/2021 15:13:47 - INFO - __main__ - Step 3429: {'lr': 5.706666666666667e-05, 'samples': 109728, 'steps': 214, 'loss/train': 5.9404191970825195} -09/20/2021 15:13:48 - INFO - __main__ - Step 3430: {'lr': 5.706666666666667e-05, 'samples': 109760, 'steps': 214, 'loss/train': 7.282442092895508} -09/20/2021 15:13:49 - INFO - __main__ - Step 3431: {'lr': 5.706666666666667e-05, 'samples': 109792, 'steps': 214, 'loss/train': 7.298046588897705} -09/20/2021 15:13:50 - INFO - __main__ - Step 3432: {'lr': 5.706666666666667e-05, 'samples': 109824, 'steps': 214, 'loss/train': 5.317721843719482} -09/20/2021 15:13:51 - INFO - __main__ - Step 3433: {'lr': 5.706666666666667e-05, 'samples': 109856, 'steps': 214, 'loss/train': 5.505086898803711} -09/20/2021 15:13:51 - INFO - __main__ - Step 3434: {'lr': 5.706666666666667e-05, 'samples': 109888, 'steps': 214, 'loss/train': 5.35696268081665} -09/20/2021 15:13:52 - INFO - __main__ - Step 3435: {'lr': 5.706666666666667e-05, 'samples': 109920, 'steps': 214, 'loss/train': 5.963290691375732} -09/20/2021 15:13:53 - INFO - __main__ - Step 3436: {'lr': 5.706666666666667e-05, 'samples': 109952, 'steps': 214, 'loss/train': 7.419007778167725} -09/20/2021 15:13:54 - INFO - __main__ - Step 3437: {'lr': 5.706666666666667e-05, 'samples': 109984, 'steps': 214, 'loss/train': 4.876739025115967} -09/20/2021 15:13:54 - INFO - __main__ - Step 3438: {'lr': 5.706666666666667e-05, 'samples': 110016, 'steps': 214, 'loss/train': 6.875759124755859} -09/20/2021 15:13:55 - INFO - __main__ - Step 3439: {'lr': 5.706666666666667e-05, 'samples': 110048, 'steps': 214, 'loss/train': 5.893091201782227} -09/20/2021 15:13:56 - INFO - __main__ - Step 3440: {'lr': 5.706666666666667e-05, 'samples': 110080, 'steps': 214, 'loss/train': 5.464139938354492} -09/20/2021 15:13:57 - INFO - __main__ - Step 3441: {'lr': 5.7333333333333336e-05, 'samples': 110112, 'steps': 215, 'loss/train': 5.092898845672607} -09/20/2021 15:13:58 - INFO - __main__ - Step 3442: {'lr': 5.7333333333333336e-05, 'samples': 110144, 'steps': 215, 'loss/train': 5.7648444175720215} -09/20/2021 15:13:58 - INFO - __main__ - Step 3443: {'lr': 5.7333333333333336e-05, 'samples': 110176, 'steps': 215, 'loss/train': 5.546387195587158} -09/20/2021 15:13:59 - INFO - __main__ - Step 3444: {'lr': 5.7333333333333336e-05, 'samples': 110208, 'steps': 215, 'loss/train': 5.677882671356201} -09/20/2021 15:14:00 - INFO - __main__ - Step 3445: {'lr': 5.7333333333333336e-05, 'samples': 110240, 'steps': 215, 'loss/train': 5.702584266662598} -09/20/2021 15:14:01 - INFO - __main__ - Step 3446: {'lr': 5.7333333333333336e-05, 'samples': 110272, 'steps': 215, 'loss/train': 5.569883346557617} -09/20/2021 15:14:01 - INFO - __main__ - Step 3447: {'lr': 5.7333333333333336e-05, 'samples': 110304, 'steps': 215, 'loss/train': 6.481102466583252} -09/20/2021 15:14:02 - INFO - __main__ - Step 3448: {'lr': 5.7333333333333336e-05, 'samples': 110336, 'steps': 215, 'loss/train': 5.5379791259765625} -09/20/2021 15:14:03 - INFO - __main__ - Step 3449: {'lr': 5.7333333333333336e-05, 'samples': 110368, 'steps': 215, 'loss/train': 5.583001136779785} -09/20/2021 15:14:04 - INFO - __main__ - Step 3450: {'lr': 5.7333333333333336e-05, 'samples': 110400, 'steps': 215, 'loss/train': 5.73982048034668} -09/20/2021 15:14:04 - INFO - __main__ - Step 3451: {'lr': 5.7333333333333336e-05, 'samples': 110432, 'steps': 215, 'loss/train': 5.702364921569824} -09/20/2021 15:14:05 - INFO - __main__ - Step 3452: {'lr': 5.7333333333333336e-05, 'samples': 110464, 'steps': 215, 'loss/train': 6.3763041496276855} -09/20/2021 15:14:06 - INFO - __main__ - Step 3453: {'lr': 5.7333333333333336e-05, 'samples': 110496, 'steps': 215, 'loss/train': 5.517265319824219} -09/20/2021 15:14:07 - INFO - __main__ - Step 3454: {'lr': 5.7333333333333336e-05, 'samples': 110528, 'steps': 215, 'loss/train': 5.7904276847839355} -09/20/2021 15:14:07 - INFO - __main__ - Step 3455: {'lr': 5.7333333333333336e-05, 'samples': 110560, 'steps': 215, 'loss/train': 5.881722450256348} -09/20/2021 15:14:08 - INFO - __main__ - Step 3456: {'lr': 5.7333333333333336e-05, 'samples': 110592, 'steps': 215, 'loss/train': 5.687761306762695} -09/20/2021 15:14:09 - INFO - __main__ - Step 3457: {'lr': 5.76e-05, 'samples': 110624, 'steps': 216, 'loss/train': 5.654074668884277} -09/20/2021 15:14:10 - INFO - __main__ - Step 3458: {'lr': 5.76e-05, 'samples': 110656, 'steps': 216, 'loss/train': 5.418470859527588} -09/20/2021 15:14:10 - INFO - __main__ - Step 3459: {'lr': 5.76e-05, 'samples': 110688, 'steps': 216, 'loss/train': 6.091576099395752} -09/20/2021 15:14:11 - INFO - __main__ - Step 3460: {'lr': 5.76e-05, 'samples': 110720, 'steps': 216, 'loss/train': 5.722798824310303} -09/20/2021 15:14:12 - INFO - __main__ - Step 3461: {'lr': 5.76e-05, 'samples': 110752, 'steps': 216, 'loss/train': 6.099167346954346} -09/20/2021 15:14:13 - INFO - __main__ - Step 3462: {'lr': 5.76e-05, 'samples': 110784, 'steps': 216, 'loss/train': 4.938934326171875} -09/20/2021 15:14:14 - INFO - __main__ - Step 3463: {'lr': 5.76e-05, 'samples': 110816, 'steps': 216, 'loss/train': 5.933901786804199} -09/20/2021 15:14:15 - INFO - __main__ - Step 3464: {'lr': 5.76e-05, 'samples': 110848, 'steps': 216, 'loss/train': 5.487724304199219} -09/20/2021 15:14:16 - INFO - __main__ - Step 3465: {'lr': 5.76e-05, 'samples': 110880, 'steps': 216, 'loss/train': 5.832444667816162} -09/20/2021 15:14:16 - INFO - __main__ - Step 3466: {'lr': 5.76e-05, 'samples': 110912, 'steps': 216, 'loss/train': 6.520080089569092} -09/20/2021 15:14:17 - INFO - __main__ - Step 3467: {'lr': 5.76e-05, 'samples': 110944, 'steps': 216, 'loss/train': 6.762547969818115} -09/20/2021 15:14:18 - INFO - __main__ - Step 3468: {'lr': 5.76e-05, 'samples': 110976, 'steps': 216, 'loss/train': 5.820230007171631} -09/20/2021 15:14:19 - INFO - __main__ - Step 3469: {'lr': 5.76e-05, 'samples': 111008, 'steps': 216, 'loss/train': 5.693449974060059} -09/20/2021 15:14:19 - INFO - __main__ - Step 3470: {'lr': 5.76e-05, 'samples': 111040, 'steps': 216, 'loss/train': 5.789962291717529} -09/20/2021 15:14:20 - INFO - __main__ - Step 3471: {'lr': 5.76e-05, 'samples': 111072, 'steps': 216, 'loss/train': 5.641305923461914} -09/20/2021 15:14:21 - INFO - __main__ - Step 3472: {'lr': 5.76e-05, 'samples': 111104, 'steps': 216, 'loss/train': 6.172465801239014} -09/20/2021 15:14:22 - INFO - __main__ - Step 3473: {'lr': 5.7866666666666666e-05, 'samples': 111136, 'steps': 217, 'loss/train': 6.311516761779785} -09/20/2021 15:14:22 - INFO - __main__ - Step 3474: {'lr': 5.7866666666666666e-05, 'samples': 111168, 'steps': 217, 'loss/train': 5.4807868003845215} -09/20/2021 15:14:23 - INFO - __main__ - Step 3475: {'lr': 5.7866666666666666e-05, 'samples': 111200, 'steps': 217, 'loss/train': 6.792464256286621} -09/20/2021 15:14:24 - INFO - __main__ - Step 3476: {'lr': 5.7866666666666666e-05, 'samples': 111232, 'steps': 217, 'loss/train': 5.4247870445251465} -09/20/2021 15:14:25 - INFO - __main__ - Step 3477: {'lr': 5.7866666666666666e-05, 'samples': 111264, 'steps': 217, 'loss/train': 6.510135650634766} -09/20/2021 15:14:25 - INFO - __main__ - Step 3478: {'lr': 5.7866666666666666e-05, 'samples': 111296, 'steps': 217, 'loss/train': 4.88031530380249} -09/20/2021 15:14:26 - INFO - __main__ - Step 3479: {'lr': 5.7866666666666666e-05, 'samples': 111328, 'steps': 217, 'loss/train': 5.999759674072266} -09/20/2021 15:14:27 - INFO - __main__ - Step 3480: {'lr': 5.7866666666666666e-05, 'samples': 111360, 'steps': 217, 'loss/train': 6.438917636871338} -09/20/2021 15:14:28 - INFO - __main__ - Step 3481: {'lr': 5.7866666666666666e-05, 'samples': 111392, 'steps': 217, 'loss/train': 5.586921215057373} -09/20/2021 15:14:28 - INFO - __main__ - Step 3482: {'lr': 5.7866666666666666e-05, 'samples': 111424, 'steps': 217, 'loss/train': 6.14276123046875} -09/20/2021 15:14:29 - INFO - __main__ - Step 3483: {'lr': 5.7866666666666666e-05, 'samples': 111456, 'steps': 217, 'loss/train': 6.719966888427734} -09/20/2021 15:14:30 - INFO - __main__ - Step 3484: {'lr': 5.7866666666666666e-05, 'samples': 111488, 'steps': 217, 'loss/train': 5.474096775054932} -09/20/2021 15:14:31 - INFO - __main__ - Step 3485: {'lr': 5.7866666666666666e-05, 'samples': 111520, 'steps': 217, 'loss/train': 5.228114128112793} -09/20/2021 15:14:31 - INFO - __main__ - Step 3486: {'lr': 5.7866666666666666e-05, 'samples': 111552, 'steps': 217, 'loss/train': 5.53922176361084} -09/20/2021 15:14:32 - INFO - __main__ - Step 3487: {'lr': 5.7866666666666666e-05, 'samples': 111584, 'steps': 217, 'loss/train': 6.17775821685791} -09/20/2021 15:14:33 - INFO - __main__ - Step 3488: {'lr': 5.7866666666666666e-05, 'samples': 111616, 'steps': 217, 'loss/train': 5.607181072235107} -09/20/2021 15:14:34 - INFO - __main__ - Step 3489: {'lr': 5.813333333333334e-05, 'samples': 111648, 'steps': 218, 'loss/train': 5.977768898010254} -09/20/2021 15:14:35 - INFO - __main__ - Step 3490: {'lr': 5.813333333333334e-05, 'samples': 111680, 'steps': 218, 'loss/train': 5.8252692222595215} -09/20/2021 15:14:35 - INFO - __main__ - Step 3491: {'lr': 5.813333333333334e-05, 'samples': 111712, 'steps': 218, 'loss/train': 6.501298904418945} -09/20/2021 15:14:36 - INFO - __main__ - Step 3492: {'lr': 5.813333333333334e-05, 'samples': 111744, 'steps': 218, 'loss/train': 4.930428504943848} -09/20/2021 15:14:37 - INFO - __main__ - Step 3493: {'lr': 5.813333333333334e-05, 'samples': 111776, 'steps': 218, 'loss/train': 6.501364231109619} -09/20/2021 15:14:38 - INFO - __main__ - Step 3494: {'lr': 5.813333333333334e-05, 'samples': 111808, 'steps': 218, 'loss/train': 6.3654632568359375} -09/20/2021 15:14:39 - INFO - __main__ - Step 3495: {'lr': 5.813333333333334e-05, 'samples': 111840, 'steps': 218, 'loss/train': 6.071518898010254} -09/20/2021 15:14:40 - INFO - __main__ - Step 3496: {'lr': 5.813333333333334e-05, 'samples': 111872, 'steps': 218, 'loss/train': 5.71311092376709} -09/20/2021 15:14:40 - INFO - __main__ - Step 3497: {'lr': 5.813333333333334e-05, 'samples': 111904, 'steps': 218, 'loss/train': 6.134367942810059} -09/20/2021 15:14:41 - INFO - __main__ - Step 3498: {'lr': 5.813333333333334e-05, 'samples': 111936, 'steps': 218, 'loss/train': 5.055002212524414} -09/20/2021 15:14:42 - INFO - __main__ - Step 3499: {'lr': 5.813333333333334e-05, 'samples': 111968, 'steps': 218, 'loss/train': 5.776863098144531} -09/20/2021 15:14:43 - INFO - __main__ - Step 3500: {'lr': 5.813333333333334e-05, 'samples': 112000, 'steps': 218, 'loss/train': 5.663311958312988} -09/20/2021 15:14:43 - INFO - __main__ - Step 3501: {'lr': 5.813333333333334e-05, 'samples': 112032, 'steps': 218, 'loss/train': 5.58604621887207} -09/20/2021 15:14:44 - INFO - __main__ - Step 3502: {'lr': 5.813333333333334e-05, 'samples': 112064, 'steps': 218, 'loss/train': 6.296107769012451} -09/20/2021 15:14:45 - INFO - __main__ - Step 3503: {'lr': 5.813333333333334e-05, 'samples': 112096, 'steps': 218, 'loss/train': 6.00358772277832} -09/20/2021 15:14:46 - INFO - __main__ - Step 3504: {'lr': 5.813333333333334e-05, 'samples': 112128, 'steps': 218, 'loss/train': 5.660144329071045} -09/20/2021 15:14:47 - INFO - __main__ - Step 3505: {'lr': 5.8399999999999997e-05, 'samples': 112160, 'steps': 219, 'loss/train': 5.621368408203125} -09/20/2021 15:14:47 - INFO - __main__ - Step 3506: {'lr': 5.8399999999999997e-05, 'samples': 112192, 'steps': 219, 'loss/train': 6.12385368347168} -09/20/2021 15:14:48 - INFO - __main__ - Step 3507: {'lr': 5.8399999999999997e-05, 'samples': 112224, 'steps': 219, 'loss/train': 5.882819652557373} -09/20/2021 15:14:49 - INFO - __main__ - Step 3508: {'lr': 5.8399999999999997e-05, 'samples': 112256, 'steps': 219, 'loss/train': 6.041082382202148} -09/20/2021 15:14:50 - INFO - __main__ - Step 3509: {'lr': 5.8399999999999997e-05, 'samples': 112288, 'steps': 219, 'loss/train': 5.683553695678711} -09/20/2021 15:14:50 - INFO - __main__ - Step 3510: {'lr': 5.8399999999999997e-05, 'samples': 112320, 'steps': 219, 'loss/train': 4.674715042114258} -09/20/2021 15:14:51 - INFO - __main__ - Step 3511: {'lr': 5.8399999999999997e-05, 'samples': 112352, 'steps': 219, 'loss/train': 4.302555084228516} -09/20/2021 15:14:52 - INFO - __main__ - Step 3512: {'lr': 5.8399999999999997e-05, 'samples': 112384, 'steps': 219, 'loss/train': 5.81662130355835} -09/20/2021 15:14:53 - INFO - __main__ - Step 3513: {'lr': 5.8399999999999997e-05, 'samples': 112416, 'steps': 219, 'loss/train': 6.107090473175049} -09/20/2021 15:14:53 - INFO - __main__ - Step 3514: {'lr': 5.8399999999999997e-05, 'samples': 112448, 'steps': 219, 'loss/train': 6.088041305541992} -09/20/2021 15:14:54 - INFO - __main__ - Step 3515: {'lr': 5.8399999999999997e-05, 'samples': 112480, 'steps': 219, 'loss/train': 3.69635272026062} -09/20/2021 15:14:55 - INFO - __main__ - Step 3516: {'lr': 5.8399999999999997e-05, 'samples': 112512, 'steps': 219, 'loss/train': 5.282824993133545} -09/20/2021 15:14:56 - INFO - __main__ - Step 3517: {'lr': 5.8399999999999997e-05, 'samples': 112544, 'steps': 219, 'loss/train': 5.5322184562683105} -09/20/2021 15:14:56 - INFO - __main__ - Step 3518: {'lr': 5.8399999999999997e-05, 'samples': 112576, 'steps': 219, 'loss/train': 5.44492769241333} -09/20/2021 15:14:57 - INFO - __main__ - Step 3519: {'lr': 5.8399999999999997e-05, 'samples': 112608, 'steps': 219, 'loss/train': 4.188705921173096} -09/20/2021 15:14:58 - INFO - __main__ - Step 3520: {'lr': 5.8399999999999997e-05, 'samples': 112640, 'steps': 219, 'loss/train': 5.828688144683838} -09/20/2021 15:14:59 - INFO - __main__ - Step 3521: {'lr': 5.866666666666667e-05, 'samples': 112672, 'steps': 220, 'loss/train': 3.666743040084839} -09/20/2021 15:14:59 - INFO - __main__ - Step 3522: {'lr': 5.866666666666667e-05, 'samples': 112704, 'steps': 220, 'loss/train': 5.79398250579834} -09/20/2021 15:15:00 - INFO - __main__ - Step 3523: {'lr': 5.866666666666667e-05, 'samples': 112736, 'steps': 220, 'loss/train': 5.419137954711914} -09/20/2021 15:15:01 - INFO - __main__ - Step 3524: {'lr': 5.866666666666667e-05, 'samples': 112768, 'steps': 220, 'loss/train': 8.945194244384766} -09/20/2021 15:15:02 - INFO - __main__ - Step 3525: {'lr': 5.866666666666667e-05, 'samples': 112800, 'steps': 220, 'loss/train': 6.351607799530029} -09/20/2021 15:15:03 - INFO - __main__ - Step 3526: {'lr': 5.866666666666667e-05, 'samples': 112832, 'steps': 220, 'loss/train': 6.227593898773193} -09/20/2021 15:15:04 - INFO - __main__ - Step 3527: {'lr': 5.866666666666667e-05, 'samples': 112864, 'steps': 220, 'loss/train': 5.221078395843506} -09/20/2021 15:15:04 - INFO - __main__ - Step 3528: {'lr': 5.866666666666667e-05, 'samples': 112896, 'steps': 220, 'loss/train': 5.765185356140137} -09/20/2021 15:15:05 - INFO - __main__ - Step 3529: {'lr': 5.866666666666667e-05, 'samples': 112928, 'steps': 220, 'loss/train': 6.194811820983887} -09/20/2021 15:15:06 - INFO - __main__ - Step 3530: {'lr': 5.866666666666667e-05, 'samples': 112960, 'steps': 220, 'loss/train': 5.345686912536621} -09/20/2021 15:15:07 - INFO - __main__ - Step 3531: {'lr': 5.866666666666667e-05, 'samples': 112992, 'steps': 220, 'loss/train': 5.94242000579834} -09/20/2021 15:15:07 - INFO - __main__ - Step 3532: {'lr': 5.866666666666667e-05, 'samples': 113024, 'steps': 220, 'loss/train': 5.261044025421143} -09/20/2021 15:15:08 - INFO - __main__ - Step 3533: {'lr': 5.866666666666667e-05, 'samples': 113056, 'steps': 220, 'loss/train': 5.662413597106934} -09/20/2021 15:15:09 - INFO - __main__ - Step 3534: {'lr': 5.866666666666667e-05, 'samples': 113088, 'steps': 220, 'loss/train': 5.57628059387207} -09/20/2021 15:15:10 - INFO - __main__ - Step 3535: {'lr': 5.866666666666667e-05, 'samples': 113120, 'steps': 220, 'loss/train': 5.839224815368652} -09/20/2021 15:15:10 - INFO - __main__ - Step 3536: {'lr': 5.866666666666667e-05, 'samples': 113152, 'steps': 220, 'loss/train': 5.898126125335693} -09/20/2021 15:15:11 - INFO - __main__ - Step 3537: {'lr': 5.893333333333334e-05, 'samples': 113184, 'steps': 221, 'loss/train': 5.597121715545654} -09/20/2021 15:15:12 - INFO - __main__ - Step 3538: {'lr': 5.893333333333334e-05, 'samples': 113216, 'steps': 221, 'loss/train': 4.663077354431152} -09/20/2021 15:15:13 - INFO - __main__ - Step 3539: {'lr': 5.893333333333334e-05, 'samples': 113248, 'steps': 221, 'loss/train': 5.9990129470825195} -09/20/2021 15:15:14 - INFO - __main__ - Step 3540: {'lr': 5.893333333333334e-05, 'samples': 113280, 'steps': 221, 'loss/train': 5.5653276443481445} -09/20/2021 15:15:14 - INFO - __main__ - Step 3541: {'lr': 5.893333333333334e-05, 'samples': 113312, 'steps': 221, 'loss/train': 5.38848352432251} -09/20/2021 15:15:15 - INFO - __main__ - Step 3542: {'lr': 5.893333333333334e-05, 'samples': 113344, 'steps': 221, 'loss/train': 6.276246547698975} -09/20/2021 15:15:16 - INFO - __main__ - Step 3543: {'lr': 5.893333333333334e-05, 'samples': 113376, 'steps': 221, 'loss/train': 4.961794376373291} -09/20/2021 15:15:17 - INFO - __main__ - Step 3544: {'lr': 5.893333333333334e-05, 'samples': 113408, 'steps': 221, 'loss/train': 5.957047939300537} -09/20/2021 15:15:17 - INFO - __main__ - Step 3545: {'lr': 5.893333333333334e-05, 'samples': 113440, 'steps': 221, 'loss/train': 6.313279628753662} -09/20/2021 15:15:18 - INFO - __main__ - Step 3546: {'lr': 5.893333333333334e-05, 'samples': 113472, 'steps': 221, 'loss/train': 5.510916233062744} -09/20/2021 15:15:19 - INFO - __main__ - Step 3547: {'lr': 5.893333333333334e-05, 'samples': 113504, 'steps': 221, 'loss/train': 5.593291759490967} -09/20/2021 15:15:20 - INFO - __main__ - Step 3548: {'lr': 5.893333333333334e-05, 'samples': 113536, 'steps': 221, 'loss/train': 5.08629035949707} -09/20/2021 15:15:20 - INFO - __main__ - Step 3549: {'lr': 5.893333333333334e-05, 'samples': 113568, 'steps': 221, 'loss/train': 4.662815570831299} -09/20/2021 15:15:21 - INFO - __main__ - Step 3550: {'lr': 5.893333333333334e-05, 'samples': 113600, 'steps': 221, 'loss/train': 5.699073314666748} -09/20/2021 15:15:22 - INFO - __main__ - Step 3551: {'lr': 5.893333333333334e-05, 'samples': 113632, 'steps': 221, 'loss/train': 6.702118873596191} -09/20/2021 15:15:23 - INFO - __main__ - Step 3552: {'lr': 5.893333333333334e-05, 'samples': 113664, 'steps': 221, 'loss/train': 6.38386344909668} -09/20/2021 15:15:24 - INFO - __main__ - Step 3553: {'lr': 5.92e-05, 'samples': 113696, 'steps': 222, 'loss/train': 5.870210647583008} -09/20/2021 15:15:24 - INFO - __main__ - Step 3554: {'lr': 5.92e-05, 'samples': 113728, 'steps': 222, 'loss/train': 5.612343788146973} -09/20/2021 15:15:25 - INFO - __main__ - Step 3555: {'lr': 5.92e-05, 'samples': 113760, 'steps': 222, 'loss/train': 6.811529159545898} -09/20/2021 15:15:27 - INFO - __main__ - Step 3556: {'lr': 5.92e-05, 'samples': 113792, 'steps': 222, 'loss/train': 5.517138957977295} -09/20/2021 15:15:28 - INFO - __main__ - Step 3557: {'lr': 5.92e-05, 'samples': 113824, 'steps': 222, 'loss/train': 4.955230236053467} -09/20/2021 15:15:28 - INFO - __main__ - Step 3558: {'lr': 5.92e-05, 'samples': 113856, 'steps': 222, 'loss/train': 6.24470853805542} -09/20/2021 15:15:29 - INFO - __main__ - Step 3559: {'lr': 5.92e-05, 'samples': 113888, 'steps': 222, 'loss/train': 5.318664073944092} -09/20/2021 15:15:30 - INFO - __main__ - Step 3560: {'lr': 5.92e-05, 'samples': 113920, 'steps': 222, 'loss/train': 5.529002666473389} -09/20/2021 15:15:31 - INFO - __main__ - Step 3561: {'lr': 5.92e-05, 'samples': 113952, 'steps': 222, 'loss/train': 5.622723579406738} -09/20/2021 15:15:31 - INFO - __main__ - Step 3562: {'lr': 5.92e-05, 'samples': 113984, 'steps': 222, 'loss/train': 5.827330589294434} -09/20/2021 15:15:32 - INFO - __main__ - Step 3563: {'lr': 5.92e-05, 'samples': 114016, 'steps': 222, 'loss/train': 5.748408794403076} -09/20/2021 15:15:33 - INFO - __main__ - Step 3564: {'lr': 5.92e-05, 'samples': 114048, 'steps': 222, 'loss/train': 5.856979846954346} -09/20/2021 15:15:34 - INFO - __main__ - Step 3565: {'lr': 5.92e-05, 'samples': 114080, 'steps': 222, 'loss/train': 3.592526912689209} -09/20/2021 15:15:34 - INFO - __main__ - Step 3566: {'lr': 5.92e-05, 'samples': 114112, 'steps': 222, 'loss/train': 5.7588677406311035} -09/20/2021 15:15:35 - INFO - __main__ - Step 3567: {'lr': 5.92e-05, 'samples': 114144, 'steps': 222, 'loss/train': 4.913257598876953} -09/20/2021 15:15:36 - INFO - __main__ - Step 3568: {'lr': 5.92e-05, 'samples': 114176, 'steps': 222, 'loss/train': 5.269636154174805} -09/20/2021 15:15:37 - INFO - __main__ - Step 3569: {'lr': 5.946666666666667e-05, 'samples': 114208, 'steps': 223, 'loss/train': 5.81718111038208} -09/20/2021 15:15:38 - INFO - __main__ - Step 3570: {'lr': 5.946666666666667e-05, 'samples': 114240, 'steps': 223, 'loss/train': 5.405052661895752} -09/20/2021 15:15:38 - INFO - __main__ - Step 3571: {'lr': 5.946666666666667e-05, 'samples': 114272, 'steps': 223, 'loss/train': 5.487229824066162} -09/20/2021 15:15:39 - INFO - __main__ - Step 3572: {'lr': 5.946666666666667e-05, 'samples': 114304, 'steps': 223, 'loss/train': 5.651031017303467} -09/20/2021 15:15:40 - INFO - __main__ - Step 3573: {'lr': 5.946666666666667e-05, 'samples': 114336, 'steps': 223, 'loss/train': 5.100864887237549} -09/20/2021 15:15:41 - INFO - __main__ - Step 3574: {'lr': 5.946666666666667e-05, 'samples': 114368, 'steps': 223, 'loss/train': 3.8717379570007324} -09/20/2021 15:15:41 - INFO - __main__ - Step 3575: {'lr': 5.946666666666667e-05, 'samples': 114400, 'steps': 223, 'loss/train': 3.6144773960113525} -09/20/2021 15:15:42 - INFO - __main__ - Step 3576: {'lr': 5.946666666666667e-05, 'samples': 114432, 'steps': 223, 'loss/train': 4.149318218231201} -09/20/2021 15:15:43 - INFO - __main__ - Step 3577: {'lr': 5.946666666666667e-05, 'samples': 114464, 'steps': 223, 'loss/train': 6.339078903198242} -09/20/2021 15:15:44 - INFO - __main__ - Step 3578: {'lr': 5.946666666666667e-05, 'samples': 114496, 'steps': 223, 'loss/train': 5.672388553619385} -09/20/2021 15:15:44 - INFO - __main__ - Step 3579: {'lr': 5.946666666666667e-05, 'samples': 114528, 'steps': 223, 'loss/train': 5.522083759307861} -09/20/2021 15:15:45 - INFO - __main__ - Step 3580: {'lr': 5.946666666666667e-05, 'samples': 114560, 'steps': 223, 'loss/train': 5.541284561157227} -09/20/2021 15:15:46 - INFO - __main__ - Step 3581: {'lr': 5.946666666666667e-05, 'samples': 114592, 'steps': 223, 'loss/train': 5.906991004943848} -09/20/2021 15:15:47 - INFO - __main__ - Step 3582: {'lr': 5.946666666666667e-05, 'samples': 114624, 'steps': 223, 'loss/train': 5.58195161819458} -09/20/2021 15:15:47 - INFO - __main__ - Step 3583: {'lr': 5.946666666666667e-05, 'samples': 114656, 'steps': 223, 'loss/train': 4.432800769805908} -09/20/2021 15:15:48 - INFO - __main__ - Step 3584: {'lr': 5.946666666666667e-05, 'samples': 114688, 'steps': 223, 'loss/train': 5.430471420288086} -09/20/2021 15:15:49 - INFO - __main__ - Step 3585: {'lr': 5.973333333333334e-05, 'samples': 114720, 'steps': 224, 'loss/train': 3.869401693344116} -09/20/2021 15:15:50 - INFO - __main__ - Step 3586: {'lr': 5.973333333333334e-05, 'samples': 114752, 'steps': 224, 'loss/train': 4.295925617218018} -09/20/2021 15:15:51 - INFO - __main__ - Step 3587: {'lr': 5.973333333333334e-05, 'samples': 114784, 'steps': 224, 'loss/train': 3.272006034851074} -09/20/2021 15:15:52 - INFO - __main__ - Step 3588: {'lr': 5.973333333333334e-05, 'samples': 114816, 'steps': 224, 'loss/train': 3.248133420944214} -09/20/2021 15:15:53 - INFO - __main__ - Step 3589: {'lr': 5.973333333333334e-05, 'samples': 114848, 'steps': 224, 'loss/train': 6.027968883514404} -09/20/2021 15:15:53 - INFO - __main__ - Step 3590: {'lr': 5.973333333333334e-05, 'samples': 114880, 'steps': 224, 'loss/train': 5.359322547912598} -09/20/2021 15:15:54 - INFO - __main__ - Step 3591: {'lr': 5.973333333333334e-05, 'samples': 114912, 'steps': 224, 'loss/train': 5.671648025512695} -09/20/2021 15:15:55 - INFO - __main__ - Step 3592: {'lr': 5.973333333333334e-05, 'samples': 114944, 'steps': 224, 'loss/train': 5.77127742767334} -09/20/2021 15:15:56 - INFO - __main__ - Step 3593: {'lr': 5.973333333333334e-05, 'samples': 114976, 'steps': 224, 'loss/train': 5.036993503570557} -09/20/2021 15:15:56 - INFO - __main__ - Step 3594: {'lr': 5.973333333333334e-05, 'samples': 115008, 'steps': 224, 'loss/train': 5.484053134918213} -09/20/2021 15:15:57 - INFO - __main__ - Step 3595: {'lr': 5.973333333333334e-05, 'samples': 115040, 'steps': 224, 'loss/train': 6.110162258148193} -09/20/2021 15:15:58 - INFO - __main__ - Step 3596: {'lr': 5.973333333333334e-05, 'samples': 115072, 'steps': 224, 'loss/train': 6.170070171356201} -09/20/2021 15:15:59 - INFO - __main__ - Step 3597: {'lr': 5.973333333333334e-05, 'samples': 115104, 'steps': 224, 'loss/train': 7.323403835296631} -09/20/2021 15:15:59 - INFO - __main__ - Step 3598: {'lr': 5.973333333333334e-05, 'samples': 115136, 'steps': 224, 'loss/train': 5.146838665008545} -09/20/2021 15:16:00 - INFO - __main__ - Step 3599: {'lr': 5.973333333333334e-05, 'samples': 115168, 'steps': 224, 'loss/train': 5.211742877960205} -09/20/2021 15:16:01 - INFO - __main__ - Step 3600: {'lr': 5.973333333333334e-05, 'samples': 115200, 'steps': 224, 'loss/train': 5.6989288330078125} -09/20/2021 15:16:02 - INFO - __main__ - Step 3601: {'lr': 6e-05, 'samples': 115232, 'steps': 225, 'loss/train': 5.810235023498535} -09/20/2021 15:16:02 - INFO - __main__ - Step 3602: {'lr': 6e-05, 'samples': 115264, 'steps': 225, 'loss/train': 6.323145389556885} -09/20/2021 15:16:03 - INFO - __main__ - Step 3603: {'lr': 6e-05, 'samples': 115296, 'steps': 225, 'loss/train': 5.421960830688477} -09/20/2021 15:16:04 - INFO - __main__ - Step 3604: {'lr': 6e-05, 'samples': 115328, 'steps': 225, 'loss/train': 5.7603960037231445} -09/20/2021 15:16:05 - INFO - __main__ - Step 3605: {'lr': 6e-05, 'samples': 115360, 'steps': 225, 'loss/train': 5.537116527557373} -09/20/2021 15:16:05 - INFO - __main__ - Step 3606: {'lr': 6e-05, 'samples': 115392, 'steps': 225, 'loss/train': 5.421171188354492} -09/20/2021 15:16:06 - INFO - __main__ - Step 3607: {'lr': 6e-05, 'samples': 115424, 'steps': 225, 'loss/train': 4.788185119628906} -09/20/2021 15:16:07 - INFO - __main__ - Step 3608: {'lr': 6e-05, 'samples': 115456, 'steps': 225, 'loss/train': 5.727273464202881} -09/20/2021 15:16:08 - INFO - __main__ - Step 3609: {'lr': 6e-05, 'samples': 115488, 'steps': 225, 'loss/train': 6.015009880065918} -09/20/2021 15:16:08 - INFO - __main__ - Step 3610: {'lr': 6e-05, 'samples': 115520, 'steps': 225, 'loss/train': 4.025050163269043} -09/20/2021 15:16:09 - INFO - __main__ - Step 3611: {'lr': 6e-05, 'samples': 115552, 'steps': 225, 'loss/train': 5.957204341888428} -09/20/2021 15:16:10 - INFO - __main__ - Step 3612: {'lr': 6e-05, 'samples': 115584, 'steps': 225, 'loss/train': 5.561399936676025} -09/20/2021 15:16:11 - INFO - __main__ - Step 3613: {'lr': 6e-05, 'samples': 115616, 'steps': 225, 'loss/train': 5.935126781463623} -09/20/2021 15:16:11 - INFO - __main__ - Step 3614: {'lr': 6e-05, 'samples': 115648, 'steps': 225, 'loss/train': 7.177533149719238} -09/20/2021 15:16:12 - INFO - __main__ - Step 3615: {'lr': 6e-05, 'samples': 115680, 'steps': 225, 'loss/train': 6.370319843292236} -09/20/2021 15:16:13 - INFO - __main__ - Step 3616: {'lr': 6e-05, 'samples': 115712, 'steps': 225, 'loss/train': 5.667575836181641} -09/20/2021 15:16:14 - INFO - __main__ - Step 3617: {'lr': 6.026666666666667e-05, 'samples': 115744, 'steps': 226, 'loss/train': 5.21154260635376} -09/20/2021 15:16:15 - INFO - __main__ - Step 3618: {'lr': 6.026666666666667e-05, 'samples': 115776, 'steps': 226, 'loss/train': 5.962111473083496} -09/20/2021 15:16:16 - INFO - __main__ - Step 3619: {'lr': 6.026666666666667e-05, 'samples': 115808, 'steps': 226, 'loss/train': 5.917334079742432} -09/20/2021 15:16:17 - INFO - __main__ - Step 3620: {'lr': 6.026666666666667e-05, 'samples': 115840, 'steps': 226, 'loss/train': 5.735583305358887} -09/20/2021 15:16:17 - INFO - __main__ - Step 3621: {'lr': 6.026666666666667e-05, 'samples': 115872, 'steps': 226, 'loss/train': 5.736191749572754} -09/20/2021 15:16:18 - INFO - __main__ - Step 3622: {'lr': 6.026666666666667e-05, 'samples': 115904, 'steps': 226, 'loss/train': 5.294795036315918} -09/20/2021 15:16:19 - INFO - __main__ - Step 3623: {'lr': 6.026666666666667e-05, 'samples': 115936, 'steps': 226, 'loss/train': 5.953428268432617} -09/20/2021 15:16:20 - INFO - __main__ - Step 3624: {'lr': 6.026666666666667e-05, 'samples': 115968, 'steps': 226, 'loss/train': 5.954840660095215} -09/20/2021 15:16:20 - INFO - __main__ - Step 3625: {'lr': 6.026666666666667e-05, 'samples': 116000, 'steps': 226, 'loss/train': 5.802914619445801} -09/20/2021 15:16:21 - INFO - __main__ - Step 3626: {'lr': 6.026666666666667e-05, 'samples': 116032, 'steps': 226, 'loss/train': 6.366607666015625} -09/20/2021 15:16:22 - INFO - __main__ - Step 3627: {'lr': 6.026666666666667e-05, 'samples': 116064, 'steps': 226, 'loss/train': 5.780169486999512} -09/20/2021 15:16:23 - INFO - __main__ - Step 3628: {'lr': 6.026666666666667e-05, 'samples': 116096, 'steps': 226, 'loss/train': 5.917928695678711} -09/20/2021 15:16:23 - INFO - __main__ - Step 3629: {'lr': 6.026666666666667e-05, 'samples': 116128, 'steps': 226, 'loss/train': 5.221551895141602} -09/20/2021 15:16:24 - INFO - __main__ - Step 3630: {'lr': 6.026666666666667e-05, 'samples': 116160, 'steps': 226, 'loss/train': 5.87816047668457} -09/20/2021 15:16:25 - INFO - __main__ - Step 3631: {'lr': 6.026666666666667e-05, 'samples': 116192, 'steps': 226, 'loss/train': 5.742859363555908} -09/20/2021 15:16:26 - INFO - __main__ - Step 3632: {'lr': 6.026666666666667e-05, 'samples': 116224, 'steps': 226, 'loss/train': 5.357707500457764} -09/20/2021 15:16:27 - INFO - __main__ - Step 3633: {'lr': 6.053333333333333e-05, 'samples': 116256, 'steps': 227, 'loss/train': 5.551604747772217} -09/20/2021 15:16:27 - INFO - __main__ - Step 3634: {'lr': 6.053333333333333e-05, 'samples': 116288, 'steps': 227, 'loss/train': 6.640946865081787} -09/20/2021 15:16:28 - INFO - __main__ - Step 3635: {'lr': 6.053333333333333e-05, 'samples': 116320, 'steps': 227, 'loss/train': 5.909051895141602} -09/20/2021 15:16:29 - INFO - __main__ - Step 3636: {'lr': 6.053333333333333e-05, 'samples': 116352, 'steps': 227, 'loss/train': 5.07712459564209} -09/20/2021 15:16:30 - INFO - __main__ - Step 3637: {'lr': 6.053333333333333e-05, 'samples': 116384, 'steps': 227, 'loss/train': 5.748754978179932} -09/20/2021 15:16:30 - INFO - __main__ - Step 3638: {'lr': 6.053333333333333e-05, 'samples': 116416, 'steps': 227, 'loss/train': 4.193017959594727} -09/20/2021 15:16:31 - INFO - __main__ - Step 3639: {'lr': 6.053333333333333e-05, 'samples': 116448, 'steps': 227, 'loss/train': 5.97644567489624} -09/20/2021 15:16:32 - INFO - __main__ - Step 3640: {'lr': 6.053333333333333e-05, 'samples': 116480, 'steps': 227, 'loss/train': 4.980973720550537} -09/20/2021 15:16:33 - INFO - __main__ - Step 3641: {'lr': 6.053333333333333e-05, 'samples': 116512, 'steps': 227, 'loss/train': 5.151247978210449} -09/20/2021 15:16:33 - INFO - __main__ - Step 3642: {'lr': 6.053333333333333e-05, 'samples': 116544, 'steps': 227, 'loss/train': 5.4576497077941895} -09/20/2021 15:16:34 - INFO - __main__ - Step 3643: {'lr': 6.053333333333333e-05, 'samples': 116576, 'steps': 227, 'loss/train': 6.938976764678955} -09/20/2021 15:16:35 - INFO - __main__ - Step 3644: {'lr': 6.053333333333333e-05, 'samples': 116608, 'steps': 227, 'loss/train': 5.179114818572998} -09/20/2021 15:16:36 - INFO - __main__ - Step 3645: {'lr': 6.053333333333333e-05, 'samples': 116640, 'steps': 227, 'loss/train': 5.1858086585998535} -09/20/2021 15:16:36 - INFO - __main__ - Step 3646: {'lr': 6.053333333333333e-05, 'samples': 116672, 'steps': 227, 'loss/train': 5.196259498596191} -09/20/2021 15:16:37 - INFO - __main__ - Step 3647: {'lr': 6.053333333333333e-05, 'samples': 116704, 'steps': 227, 'loss/train': 6.477843284606934} -09/20/2021 15:16:38 - INFO - __main__ - Step 3648: {'lr': 6.053333333333333e-05, 'samples': 116736, 'steps': 227, 'loss/train': 5.741018295288086} -09/20/2021 15:16:39 - INFO - __main__ - Step 3649: {'lr': 6.08e-05, 'samples': 116768, 'steps': 228, 'loss/train': 5.2736687660217285} -09/20/2021 15:16:39 - INFO - __main__ - Step 3650: {'lr': 6.08e-05, 'samples': 116800, 'steps': 228, 'loss/train': 5.558673858642578} -09/20/2021 15:16:41 - INFO - __main__ - Step 3651: {'lr': 6.08e-05, 'samples': 116832, 'steps': 228, 'loss/train': 5.4949259757995605} -09/20/2021 15:16:41 - INFO - __main__ - Step 3652: {'lr': 6.08e-05, 'samples': 116864, 'steps': 228, 'loss/train': 5.93024206161499} -09/20/2021 15:16:42 - INFO - __main__ - Step 3653: {'lr': 6.08e-05, 'samples': 116896, 'steps': 228, 'loss/train': 5.422210693359375} -09/20/2021 15:16:43 - INFO - __main__ - Step 3654: {'lr': 6.08e-05, 'samples': 116928, 'steps': 228, 'loss/train': 5.740616321563721} -09/20/2021 15:16:44 - INFO - __main__ - Step 3655: {'lr': 6.08e-05, 'samples': 116960, 'steps': 228, 'loss/train': 5.125904560089111} -09/20/2021 15:16:44 - INFO - __main__ - Step 3656: {'lr': 6.08e-05, 'samples': 116992, 'steps': 228, 'loss/train': 5.8491291999816895} -09/20/2021 15:16:45 - INFO - __main__ - Step 3657: {'lr': 6.08e-05, 'samples': 117024, 'steps': 228, 'loss/train': 5.573641777038574} -09/20/2021 15:16:46 - INFO - __main__ - Step 3658: {'lr': 6.08e-05, 'samples': 117056, 'steps': 228, 'loss/train': 5.234427452087402} -09/20/2021 15:16:47 - INFO - __main__ - Step 3659: {'lr': 6.08e-05, 'samples': 117088, 'steps': 228, 'loss/train': 4.455129146575928} -09/20/2021 15:16:47 - INFO - __main__ - Step 3660: {'lr': 6.08e-05, 'samples': 117120, 'steps': 228, 'loss/train': 6.54387903213501} -09/20/2021 15:16:48 - INFO - __main__ - Step 3661: {'lr': 6.08e-05, 'samples': 117152, 'steps': 228, 'loss/train': 5.912605285644531} -09/20/2021 15:16:49 - INFO - __main__ - Step 3662: {'lr': 6.08e-05, 'samples': 117184, 'steps': 228, 'loss/train': 4.575259685516357} -09/20/2021 15:16:50 - INFO - __main__ - Step 3663: {'lr': 6.08e-05, 'samples': 117216, 'steps': 228, 'loss/train': 5.77974271774292} -09/20/2021 15:16:50 - INFO - __main__ - Step 3664: {'lr': 6.08e-05, 'samples': 117248, 'steps': 228, 'loss/train': 5.817755699157715} -09/20/2021 15:16:51 - INFO - __main__ - Step 3665: {'lr': 6.106666666666667e-05, 'samples': 117280, 'steps': 229, 'loss/train': 5.878486156463623} -09/20/2021 15:16:52 - INFO - __main__ - Step 3666: {'lr': 6.106666666666667e-05, 'samples': 117312, 'steps': 229, 'loss/train': 4.118947982788086} -09/20/2021 15:16:53 - INFO - __main__ - Step 3667: {'lr': 6.106666666666667e-05, 'samples': 117344, 'steps': 229, 'loss/train': 5.7952961921691895} -09/20/2021 15:16:54 - INFO - __main__ - Step 3668: {'lr': 6.106666666666667e-05, 'samples': 117376, 'steps': 229, 'loss/train': 5.384823799133301} -09/20/2021 15:16:54 - INFO - __main__ - Step 3669: {'lr': 6.106666666666667e-05, 'samples': 117408, 'steps': 229, 'loss/train': 4.909682273864746} -09/20/2021 15:16:55 - INFO - __main__ - Step 3670: {'lr': 6.106666666666667e-05, 'samples': 117440, 'steps': 229, 'loss/train': 5.7879228591918945} -09/20/2021 15:16:56 - INFO - __main__ - Step 3671: {'lr': 6.106666666666667e-05, 'samples': 117472, 'steps': 229, 'loss/train': 5.9438934326171875} -09/20/2021 15:16:57 - INFO - __main__ - Step 3672: {'lr': 6.106666666666667e-05, 'samples': 117504, 'steps': 229, 'loss/train': 5.695220947265625} -09/20/2021 15:16:57 - INFO - __main__ - Step 3673: {'lr': 6.106666666666667e-05, 'samples': 117536, 'steps': 229, 'loss/train': 5.602137088775635} -09/20/2021 15:16:58 - INFO - __main__ - Step 3674: {'lr': 6.106666666666667e-05, 'samples': 117568, 'steps': 229, 'loss/train': 5.4321513175964355} -09/20/2021 15:16:59 - INFO - __main__ - Step 3675: {'lr': 6.106666666666667e-05, 'samples': 117600, 'steps': 229, 'loss/train': 5.664882659912109} -09/20/2021 15:17:00 - INFO - __main__ - Step 3676: {'lr': 6.106666666666667e-05, 'samples': 117632, 'steps': 229, 'loss/train': 5.766697883605957} -09/20/2021 15:17:00 - INFO - __main__ - Step 3677: {'lr': 6.106666666666667e-05, 'samples': 117664, 'steps': 229, 'loss/train': 5.9540629386901855} -09/20/2021 15:17:01 - INFO - __main__ - Step 3678: {'lr': 6.106666666666667e-05, 'samples': 117696, 'steps': 229, 'loss/train': 5.607203483581543} -09/20/2021 15:17:02 - INFO - __main__ - Step 3679: {'lr': 6.106666666666667e-05, 'samples': 117728, 'steps': 229, 'loss/train': 5.443039894104004} -09/20/2021 15:17:03 - INFO - __main__ - Step 3680: {'lr': 6.106666666666667e-05, 'samples': 117760, 'steps': 229, 'loss/train': 6.141624927520752} -09/20/2021 15:17:03 - INFO - __main__ - Step 3681: {'lr': 6.133333333333334e-05, 'samples': 117792, 'steps': 230, 'loss/train': 5.774490833282471} -09/20/2021 15:17:05 - INFO - __main__ - Step 3682: {'lr': 6.133333333333334e-05, 'samples': 117824, 'steps': 230, 'loss/train': 5.837663173675537} -09/20/2021 15:17:05 - INFO - __main__ - Step 3683: {'lr': 6.133333333333334e-05, 'samples': 117856, 'steps': 230, 'loss/train': 5.670105934143066} -09/20/2021 15:17:06 - INFO - __main__ - Step 3684: {'lr': 6.133333333333334e-05, 'samples': 117888, 'steps': 230, 'loss/train': 6.77301549911499} -09/20/2021 15:17:07 - INFO - __main__ - Step 3685: {'lr': 6.133333333333334e-05, 'samples': 117920, 'steps': 230, 'loss/train': 5.490170955657959} -09/20/2021 15:17:08 - INFO - __main__ - Step 3686: {'lr': 6.133333333333334e-05, 'samples': 117952, 'steps': 230, 'loss/train': 5.758613109588623} -09/20/2021 15:17:08 - INFO - __main__ - Step 3687: {'lr': 6.133333333333334e-05, 'samples': 117984, 'steps': 230, 'loss/train': 5.158083915710449} -09/20/2021 15:17:09 - INFO - __main__ - Step 3688: {'lr': 6.133333333333334e-05, 'samples': 118016, 'steps': 230, 'loss/train': 6.284224033355713} -09/20/2021 15:17:10 - INFO - __main__ - Step 3689: {'lr': 6.133333333333334e-05, 'samples': 118048, 'steps': 230, 'loss/train': 5.748170375823975} -09/20/2021 15:17:11 - INFO - __main__ - Step 3690: {'lr': 6.133333333333334e-05, 'samples': 118080, 'steps': 230, 'loss/train': 6.0458879470825195} -09/20/2021 15:17:11 - INFO - __main__ - Step 3691: {'lr': 6.133333333333334e-05, 'samples': 118112, 'steps': 230, 'loss/train': 5.4348297119140625} -09/20/2021 15:17:12 - INFO - __main__ - Step 3692: {'lr': 6.133333333333334e-05, 'samples': 118144, 'steps': 230, 'loss/train': 6.337057113647461} -09/20/2021 15:17:13 - INFO - __main__ - Step 3693: {'lr': 6.133333333333334e-05, 'samples': 118176, 'steps': 230, 'loss/train': 5.5498948097229} -09/20/2021 15:17:14 - INFO - __main__ - Step 3694: {'lr': 6.133333333333334e-05, 'samples': 118208, 'steps': 230, 'loss/train': 5.766611099243164} -09/20/2021 15:17:14 - INFO - __main__ - Step 3695: {'lr': 6.133333333333334e-05, 'samples': 118240, 'steps': 230, 'loss/train': 5.178515911102295} -09/20/2021 15:17:15 - INFO - __main__ - Step 3696: {'lr': 6.133333333333334e-05, 'samples': 118272, 'steps': 230, 'loss/train': 4.674350261688232} -09/20/2021 15:17:16 - INFO - __main__ - Step 3697: {'lr': 6.16e-05, 'samples': 118304, 'steps': 231, 'loss/train': 5.722556114196777} -09/20/2021 15:17:17 - INFO - __main__ - Step 3698: {'lr': 6.16e-05, 'samples': 118336, 'steps': 231, 'loss/train': 6.079049110412598} -09/20/2021 15:17:18 - INFO - __main__ - Step 3699: {'lr': 6.16e-05, 'samples': 118368, 'steps': 231, 'loss/train': 6.163975715637207} -09/20/2021 15:17:18 - INFO - __main__ - Step 3700: {'lr': 6.16e-05, 'samples': 118400, 'steps': 231, 'loss/train': 6.245505332946777} -09/20/2021 15:17:19 - INFO - __main__ - Step 3701: {'lr': 6.16e-05, 'samples': 118432, 'steps': 231, 'loss/train': 6.908943176269531} -09/20/2021 15:17:20 - INFO - __main__ - Step 3702: {'lr': 6.16e-05, 'samples': 118464, 'steps': 231, 'loss/train': 5.385489463806152} -09/20/2021 15:17:21 - INFO - __main__ - Step 3703: {'lr': 6.16e-05, 'samples': 118496, 'steps': 231, 'loss/train': 5.495174884796143} -09/20/2021 15:17:21 - INFO - __main__ - Step 3704: {'lr': 6.16e-05, 'samples': 118528, 'steps': 231, 'loss/train': 5.906505584716797} -09/20/2021 15:17:22 - INFO - __main__ - Step 3705: {'lr': 6.16e-05, 'samples': 118560, 'steps': 231, 'loss/train': 6.17833948135376} -09/20/2021 15:17:23 - INFO - __main__ - Step 3706: {'lr': 6.16e-05, 'samples': 118592, 'steps': 231, 'loss/train': 5.4364333152771} -09/20/2021 15:17:24 - INFO - __main__ - Step 3707: {'lr': 6.16e-05, 'samples': 118624, 'steps': 231, 'loss/train': 5.821580410003662} -09/20/2021 15:17:24 - INFO - __main__ - Step 3708: {'lr': 6.16e-05, 'samples': 118656, 'steps': 231, 'loss/train': 6.350300312042236} -09/20/2021 15:17:25 - INFO - __main__ - Step 3709: {'lr': 6.16e-05, 'samples': 118688, 'steps': 231, 'loss/train': 6.358614444732666} -09/20/2021 15:17:26 - INFO - __main__ - Step 3710: {'lr': 6.16e-05, 'samples': 118720, 'steps': 231, 'loss/train': 6.0988993644714355} -09/20/2021 15:17:27 - INFO - __main__ - Step 3711: {'lr': 6.16e-05, 'samples': 118752, 'steps': 231, 'loss/train': 6.147984027862549} -09/20/2021 15:17:28 - INFO - __main__ - Step 3712: {'lr': 6.16e-05, 'samples': 118784, 'steps': 231, 'loss/train': 4.621575832366943} -09/20/2021 15:17:29 - INFO - __main__ - Step 3713: {'lr': 6.186666666666668e-05, 'samples': 118816, 'steps': 232, 'loss/train': 6.777341842651367} -09/20/2021 15:17:30 - INFO - __main__ - Step 3714: {'lr': 6.186666666666668e-05, 'samples': 118848, 'steps': 232, 'loss/train': 5.883638858795166} -09/20/2021 15:17:30 - INFO - __main__ - Step 3715: {'lr': 6.186666666666668e-05, 'samples': 118880, 'steps': 232, 'loss/train': 5.678956985473633} -09/20/2021 15:17:31 - INFO - __main__ - Step 3716: {'lr': 6.186666666666668e-05, 'samples': 118912, 'steps': 232, 'loss/train': 5.100409984588623} -09/20/2021 15:17:32 - INFO - __main__ - Step 3717: {'lr': 6.186666666666668e-05, 'samples': 118944, 'steps': 232, 'loss/train': 5.937255382537842} -09/20/2021 15:17:33 - INFO - __main__ - Step 3718: {'lr': 6.186666666666668e-05, 'samples': 118976, 'steps': 232, 'loss/train': 5.558115482330322} -09/20/2021 15:17:33 - INFO - __main__ - Step 3719: {'lr': 6.186666666666668e-05, 'samples': 119008, 'steps': 232, 'loss/train': 6.194077968597412} -09/20/2021 15:17:34 - INFO - __main__ - Step 3720: {'lr': 6.186666666666668e-05, 'samples': 119040, 'steps': 232, 'loss/train': 5.032587051391602} -09/20/2021 15:17:35 - INFO - __main__ - Step 3721: {'lr': 6.186666666666668e-05, 'samples': 119072, 'steps': 232, 'loss/train': 5.801778793334961} -09/20/2021 15:17:36 - INFO - __main__ - Step 3722: {'lr': 6.186666666666668e-05, 'samples': 119104, 'steps': 232, 'loss/train': 5.854519844055176} -09/20/2021 15:17:36 - INFO - __main__ - Step 3723: {'lr': 6.186666666666668e-05, 'samples': 119136, 'steps': 232, 'loss/train': 5.892938137054443} -09/20/2021 15:17:37 - INFO - __main__ - Step 3724: {'lr': 6.186666666666668e-05, 'samples': 119168, 'steps': 232, 'loss/train': 5.566176414489746} -09/20/2021 15:17:38 - INFO - __main__ - Step 3725: {'lr': 6.186666666666668e-05, 'samples': 119200, 'steps': 232, 'loss/train': 5.899580001831055} -09/20/2021 15:17:39 - INFO - __main__ - Step 3726: {'lr': 6.186666666666668e-05, 'samples': 119232, 'steps': 232, 'loss/train': 5.48056697845459} -09/20/2021 15:17:39 - INFO - __main__ - Step 3727: {'lr': 6.186666666666668e-05, 'samples': 119264, 'steps': 232, 'loss/train': 5.951858997344971} -09/20/2021 15:17:40 - INFO - __main__ - Step 3728: {'lr': 6.186666666666668e-05, 'samples': 119296, 'steps': 232, 'loss/train': 5.278842449188232} -09/20/2021 15:17:41 - INFO - __main__ - Step 3729: {'lr': 6.213333333333333e-05, 'samples': 119328, 'steps': 233, 'loss/train': 6.269542217254639} -09/20/2021 15:17:42 - INFO - __main__ - Step 3730: {'lr': 6.213333333333333e-05, 'samples': 119360, 'steps': 233, 'loss/train': 5.646985054016113} -09/20/2021 15:17:43 - INFO - __main__ - Step 3731: {'lr': 6.213333333333333e-05, 'samples': 119392, 'steps': 233, 'loss/train': 5.676627159118652} -09/20/2021 15:17:43 - INFO - __main__ - Step 3732: {'lr': 6.213333333333333e-05, 'samples': 119424, 'steps': 233, 'loss/train': 5.630072593688965} -09/20/2021 15:17:44 - INFO - __main__ - Step 3733: {'lr': 6.213333333333333e-05, 'samples': 119456, 'steps': 233, 'loss/train': 6.420199871063232} -09/20/2021 15:17:45 - INFO - __main__ - Step 3734: {'lr': 6.213333333333333e-05, 'samples': 119488, 'steps': 233, 'loss/train': 7.0390119552612305} -09/20/2021 15:17:46 - INFO - __main__ - Step 3735: {'lr': 6.213333333333333e-05, 'samples': 119520, 'steps': 233, 'loss/train': 6.105480670928955} -09/20/2021 15:17:46 - INFO - __main__ - Step 3736: {'lr': 6.213333333333333e-05, 'samples': 119552, 'steps': 233, 'loss/train': 4.98555326461792} -09/20/2021 15:17:47 - INFO - __main__ - Step 3737: {'lr': 6.213333333333333e-05, 'samples': 119584, 'steps': 233, 'loss/train': 2.9297187328338623} -09/20/2021 15:17:48 - INFO - __main__ - Step 3738: {'lr': 6.213333333333333e-05, 'samples': 119616, 'steps': 233, 'loss/train': 5.3452839851379395} -09/20/2021 15:17:49 - INFO - __main__ - Step 3739: {'lr': 6.213333333333333e-05, 'samples': 119648, 'steps': 233, 'loss/train': 5.993170738220215} -09/20/2021 15:17:49 - INFO - __main__ - Step 3740: {'lr': 6.213333333333333e-05, 'samples': 119680, 'steps': 233, 'loss/train': 3.837390184402466} -09/20/2021 15:17:50 - INFO - __main__ - Step 3741: {'lr': 6.213333333333333e-05, 'samples': 119712, 'steps': 233, 'loss/train': 4.630731105804443} -09/20/2021 15:17:51 - INFO - __main__ - Step 3742: {'lr': 6.213333333333333e-05, 'samples': 119744, 'steps': 233, 'loss/train': 4.785085678100586} -09/20/2021 15:17:52 - INFO - __main__ - Step 3743: {'lr': 6.213333333333333e-05, 'samples': 119776, 'steps': 233, 'loss/train': 5.9247870445251465} -09/20/2021 15:17:53 - INFO - __main__ - Step 3744: {'lr': 6.213333333333333e-05, 'samples': 119808, 'steps': 233, 'loss/train': 5.193817615509033} -09/20/2021 15:17:54 - INFO - __main__ - Step 3745: {'lr': 6.24e-05, 'samples': 119840, 'steps': 234, 'loss/train': 4.870463848114014} -09/20/2021 15:17:55 - INFO - __main__ - Step 3746: {'lr': 6.24e-05, 'samples': 119872, 'steps': 234, 'loss/train': 5.069127559661865} -09/20/2021 15:17:56 - INFO - __main__ - Step 3747: {'lr': 6.24e-05, 'samples': 119904, 'steps': 234, 'loss/train': 5.5202460289001465} -09/20/2021 15:17:56 - INFO - __main__ - Step 3748: {'lr': 6.24e-05, 'samples': 119936, 'steps': 234, 'loss/train': 6.132241725921631} -09/20/2021 15:17:57 - INFO - __main__ - Step 3749: {'lr': 6.24e-05, 'samples': 119968, 'steps': 234, 'loss/train': 5.746934413909912} -09/20/2021 15:17:58 - INFO - __main__ - Step 3750: {'lr': 6.24e-05, 'samples': 120000, 'steps': 234, 'loss/train': 5.3583149909973145} -09/20/2021 15:17:59 - INFO - __main__ - Step 3751: {'lr': 6.24e-05, 'samples': 120032, 'steps': 234, 'loss/train': 5.182952404022217} -09/20/2021 15:17:59 - INFO - __main__ - Step 3752: {'lr': 6.24e-05, 'samples': 120064, 'steps': 234, 'loss/train': 5.050523281097412} -09/20/2021 15:18:00 - INFO - __main__ - Step 3753: {'lr': 6.24e-05, 'samples': 120096, 'steps': 234, 'loss/train': 5.483836650848389} -09/20/2021 15:18:01 - INFO - __main__ - Step 3754: {'lr': 6.24e-05, 'samples': 120128, 'steps': 234, 'loss/train': 6.331022262573242} -09/20/2021 15:18:02 - INFO - __main__ - Step 3755: {'lr': 6.24e-05, 'samples': 120160, 'steps': 234, 'loss/train': 4.746170997619629} -09/20/2021 15:18:02 - INFO - __main__ - Step 3756: {'lr': 6.24e-05, 'samples': 120192, 'steps': 234, 'loss/train': 3.955632209777832} -09/20/2021 15:18:03 - INFO - __main__ - Step 3757: {'lr': 6.24e-05, 'samples': 120224, 'steps': 234, 'loss/train': 3.172990560531616} -09/20/2021 15:18:04 - INFO - __main__ - Step 3758: {'lr': 6.24e-05, 'samples': 120256, 'steps': 234, 'loss/train': 4.220169544219971} -09/20/2021 15:18:05 - INFO - __main__ - Step 3759: {'lr': 6.24e-05, 'samples': 120288, 'steps': 234, 'loss/train': 5.18764591217041} -09/20/2021 15:18:05 - INFO - __main__ - Step 3760: {'lr': 6.24e-05, 'samples': 120320, 'steps': 234, 'loss/train': 5.467648983001709} -09/20/2021 15:18:06 - INFO - __main__ - Step 3761: {'lr': 6.266666666666667e-05, 'samples': 120352, 'steps': 235, 'loss/train': 5.73032283782959} -09/20/2021 15:18:07 - INFO - __main__ - Step 3762: {'lr': 6.266666666666667e-05, 'samples': 120384, 'steps': 235, 'loss/train': 5.2533769607543945} -09/20/2021 15:18:08 - INFO - __main__ - Step 3763: {'lr': 6.266666666666667e-05, 'samples': 120416, 'steps': 235, 'loss/train': 5.416926383972168} -09/20/2021 15:18:08 - INFO - __main__ - Step 3764: {'lr': 6.266666666666667e-05, 'samples': 120448, 'steps': 235, 'loss/train': 5.624542713165283} -09/20/2021 15:18:09 - INFO - __main__ - Step 3765: {'lr': 6.266666666666667e-05, 'samples': 120480, 'steps': 235, 'loss/train': 5.152019500732422} -09/20/2021 15:18:10 - INFO - __main__ - Step 3766: {'lr': 6.266666666666667e-05, 'samples': 120512, 'steps': 235, 'loss/train': 5.695651531219482} -09/20/2021 15:18:11 - INFO - __main__ - Step 3767: {'lr': 6.266666666666667e-05, 'samples': 120544, 'steps': 235, 'loss/train': 5.607049465179443} -09/20/2021 15:18:11 - INFO - __main__ - Step 3768: {'lr': 6.266666666666667e-05, 'samples': 120576, 'steps': 235, 'loss/train': 6.278257846832275} -09/20/2021 15:18:12 - INFO - __main__ - Step 3769: {'lr': 6.266666666666667e-05, 'samples': 120608, 'steps': 235, 'loss/train': 7.556760311126709} -09/20/2021 15:18:13 - INFO - __main__ - Step 3770: {'lr': 6.266666666666667e-05, 'samples': 120640, 'steps': 235, 'loss/train': 7.645198345184326} -09/20/2021 15:18:14 - INFO - __main__ - Step 3771: {'lr': 6.266666666666667e-05, 'samples': 120672, 'steps': 235, 'loss/train': 7.580348491668701} -09/20/2021 15:18:14 - INFO - __main__ - Step 3772: {'lr': 6.266666666666667e-05, 'samples': 120704, 'steps': 235, 'loss/train': 7.572882652282715} -09/20/2021 15:18:15 - INFO - __main__ - Step 3773: {'lr': 6.266666666666667e-05, 'samples': 120736, 'steps': 235, 'loss/train': 7.645169734954834} -09/20/2021 15:18:16 - INFO - __main__ - Step 3774: {'lr': 6.266666666666667e-05, 'samples': 120768, 'steps': 235, 'loss/train': 5.567675590515137} -09/20/2021 15:18:17 - INFO - __main__ - Step 3775: {'lr': 6.266666666666667e-05, 'samples': 120800, 'steps': 235, 'loss/train': 5.157048225402832} -09/20/2021 15:18:17 - INFO - __main__ - Step 3776: {'lr': 6.266666666666667e-05, 'samples': 120832, 'steps': 235, 'loss/train': 5.803066730499268} -09/20/2021 15:18:19 - INFO - __main__ - Step 3777: {'lr': 6.293333333333334e-05, 'samples': 120864, 'steps': 236, 'loss/train': 5.80116605758667} -09/20/2021 15:18:20 - INFO - __main__ - Step 3778: {'lr': 6.293333333333334e-05, 'samples': 120896, 'steps': 236, 'loss/train': 5.684926986694336} -09/20/2021 15:18:20 - INFO - __main__ - Step 3779: {'lr': 6.293333333333334e-05, 'samples': 120928, 'steps': 236, 'loss/train': 5.112777233123779} -09/20/2021 15:18:21 - INFO - __main__ - Step 3780: {'lr': 6.293333333333334e-05, 'samples': 120960, 'steps': 236, 'loss/train': 7.7456135749816895} -09/20/2021 15:18:22 - INFO - __main__ - Step 3781: {'lr': 6.293333333333334e-05, 'samples': 120992, 'steps': 236, 'loss/train': 5.8783650398254395} -09/20/2021 15:18:23 - INFO - __main__ - Step 3782: {'lr': 6.293333333333334e-05, 'samples': 121024, 'steps': 236, 'loss/train': 6.007120609283447} -09/20/2021 15:18:23 - INFO - __main__ - Step 3783: {'lr': 6.293333333333334e-05, 'samples': 121056, 'steps': 236, 'loss/train': 6.141436576843262} -09/20/2021 15:18:24 - INFO - __main__ - Step 3784: {'lr': 6.293333333333334e-05, 'samples': 121088, 'steps': 236, 'loss/train': 5.285059928894043} -09/20/2021 15:18:25 - INFO - __main__ - Step 3785: {'lr': 6.293333333333334e-05, 'samples': 121120, 'steps': 236, 'loss/train': 5.8758745193481445} -09/20/2021 15:18:26 - INFO - __main__ - Step 3786: {'lr': 6.293333333333334e-05, 'samples': 121152, 'steps': 236, 'loss/train': 5.556518077850342} -09/20/2021 15:18:26 - INFO - __main__ - Step 3787: {'lr': 6.293333333333334e-05, 'samples': 121184, 'steps': 236, 'loss/train': 5.193629264831543} -09/20/2021 15:18:27 - INFO - __main__ - Step 3788: {'lr': 6.293333333333334e-05, 'samples': 121216, 'steps': 236, 'loss/train': 6.237914562225342} -09/20/2021 15:18:28 - INFO - __main__ - Step 3789: {'lr': 6.293333333333334e-05, 'samples': 121248, 'steps': 236, 'loss/train': 6.654810905456543} -09/20/2021 15:18:29 - INFO - __main__ - Step 3790: {'lr': 6.293333333333334e-05, 'samples': 121280, 'steps': 236, 'loss/train': 5.760837554931641} -09/20/2021 15:18:29 - INFO - __main__ - Step 3791: {'lr': 6.293333333333334e-05, 'samples': 121312, 'steps': 236, 'loss/train': 5.489837169647217} -09/20/2021 15:18:30 - INFO - __main__ - Step 3792: {'lr': 6.293333333333334e-05, 'samples': 121344, 'steps': 236, 'loss/train': 5.797726631164551} -09/20/2021 15:18:31 - INFO - __main__ - Step 3793: {'lr': 6.32e-05, 'samples': 121376, 'steps': 237, 'loss/train': 1.543304443359375} -09/20/2021 15:18:32 - INFO - __main__ - Step 3794: {'lr': 6.32e-05, 'samples': 121408, 'steps': 237, 'loss/train': 6.1679253578186035} -09/20/2021 15:18:33 - INFO - __main__ - Step 3795: {'lr': 6.32e-05, 'samples': 121440, 'steps': 237, 'loss/train': 5.881311893463135} -09/20/2021 15:18:33 - INFO - __main__ - Step 3796: {'lr': 6.32e-05, 'samples': 121472, 'steps': 237, 'loss/train': 3.0394370555877686} -09/20/2021 15:18:34 - INFO - __main__ - Step 3797: {'lr': 6.32e-05, 'samples': 121504, 'steps': 237, 'loss/train': 5.65924072265625} -09/20/2021 15:18:35 - INFO - __main__ - Step 3798: {'lr': 6.32e-05, 'samples': 121536, 'steps': 237, 'loss/train': 5.570468902587891} -09/20/2021 15:18:36 - INFO - __main__ - Step 3799: {'lr': 6.32e-05, 'samples': 121568, 'steps': 237, 'loss/train': 5.4883270263671875} -09/20/2021 15:18:36 - INFO - __main__ - Step 3800: {'lr': 6.32e-05, 'samples': 121600, 'steps': 237, 'loss/train': 5.454019546508789} -09/20/2021 15:18:37 - INFO - __main__ - Step 3801: {'lr': 6.32e-05, 'samples': 121632, 'steps': 237, 'loss/train': 5.302845478057861} -09/20/2021 15:18:38 - INFO - __main__ - Step 3802: {'lr': 6.32e-05, 'samples': 121664, 'steps': 237, 'loss/train': 5.219648838043213} -09/20/2021 15:18:39 - INFO - __main__ - Step 3803: {'lr': 6.32e-05, 'samples': 121696, 'steps': 237, 'loss/train': 5.180100917816162} -09/20/2021 15:18:39 - INFO - __main__ - Step 3804: {'lr': 6.32e-05, 'samples': 121728, 'steps': 237, 'loss/train': 5.866270065307617} -09/20/2021 15:18:40 - INFO - __main__ - Step 3805: {'lr': 6.32e-05, 'samples': 121760, 'steps': 237, 'loss/train': 5.874119758605957} -09/20/2021 15:18:41 - INFO - __main__ - Step 3806: {'lr': 6.32e-05, 'samples': 121792, 'steps': 237, 'loss/train': 5.564833641052246} -09/20/2021 15:18:42 - INFO - __main__ - Step 3807: {'lr': 6.32e-05, 'samples': 121824, 'steps': 237, 'loss/train': 3.6852519512176514} -09/20/2021 15:18:42 - INFO - __main__ - Step 3808: {'lr': 6.32e-05, 'samples': 121856, 'steps': 237, 'loss/train': 2.9855151176452637} -09/20/2021 15:18:44 - INFO - __main__ - Step 3809: {'lr': 6.346666666666667e-05, 'samples': 121888, 'steps': 238, 'loss/train': 4.5504350662231445} -09/20/2021 15:18:45 - INFO - __main__ - Step 3810: {'lr': 6.346666666666667e-05, 'samples': 121920, 'steps': 238, 'loss/train': 6.572904109954834} -09/20/2021 15:18:45 - INFO - __main__ - Step 3811: {'lr': 6.346666666666667e-05, 'samples': 121952, 'steps': 238, 'loss/train': 6.796319484710693} -09/20/2021 15:18:46 - INFO - __main__ - Step 3812: {'lr': 6.346666666666667e-05, 'samples': 121984, 'steps': 238, 'loss/train': 6.080317974090576} -09/20/2021 15:18:47 - INFO - __main__ - Step 3813: {'lr': 6.346666666666667e-05, 'samples': 122016, 'steps': 238, 'loss/train': 5.998452663421631} -09/20/2021 15:18:48 - INFO - __main__ - Step 3814: {'lr': 6.346666666666667e-05, 'samples': 122048, 'steps': 238, 'loss/train': 7.14946174621582} -09/20/2021 15:18:48 - INFO - __main__ - Step 3815: {'lr': 6.346666666666667e-05, 'samples': 122080, 'steps': 238, 'loss/train': 5.986937522888184} -09/20/2021 15:18:49 - INFO - __main__ - Step 3816: {'lr': 6.346666666666667e-05, 'samples': 122112, 'steps': 238, 'loss/train': 6.209962844848633} -09/20/2021 15:18:50 - INFO - __main__ - Step 3817: {'lr': 6.346666666666667e-05, 'samples': 122144, 'steps': 238, 'loss/train': 4.840332984924316} -09/20/2021 15:18:51 - INFO - __main__ - Step 3818: {'lr': 6.346666666666667e-05, 'samples': 122176, 'steps': 238, 'loss/train': 3.980691432952881} -09/20/2021 15:18:51 - INFO - __main__ - Step 3819: {'lr': 6.346666666666667e-05, 'samples': 122208, 'steps': 238, 'loss/train': 5.386669158935547} -09/20/2021 15:18:52 - INFO - __main__ - Step 3820: {'lr': 6.346666666666667e-05, 'samples': 122240, 'steps': 238, 'loss/train': 4.0555100440979} -09/20/2021 15:18:53 - INFO - __main__ - Step 3821: {'lr': 6.346666666666667e-05, 'samples': 122272, 'steps': 238, 'loss/train': 3.017967939376831} -09/20/2021 15:18:54 - INFO - __main__ - Step 3822: {'lr': 6.346666666666667e-05, 'samples': 122304, 'steps': 238, 'loss/train': 5.256331443786621} -09/20/2021 15:18:54 - INFO - __main__ - Step 3823: {'lr': 6.346666666666667e-05, 'samples': 122336, 'steps': 238, 'loss/train': 5.027674674987793} -09/20/2021 15:18:55 - INFO - __main__ - Step 3824: {'lr': 6.346666666666667e-05, 'samples': 122368, 'steps': 238, 'loss/train': 5.484823226928711} -09/20/2021 15:18:56 - INFO - __main__ - Step 3825: {'lr': 6.373333333333333e-05, 'samples': 122400, 'steps': 239, 'loss/train': 5.149718284606934} -09/20/2021 15:18:57 - INFO - __main__ - Step 3826: {'lr': 6.373333333333333e-05, 'samples': 122432, 'steps': 239, 'loss/train': 5.467172145843506} -09/20/2021 15:18:58 - INFO - __main__ - Step 3827: {'lr': 6.373333333333333e-05, 'samples': 122464, 'steps': 239, 'loss/train': 5.889028072357178} -09/20/2021 15:18:58 - INFO - __main__ - Step 3828: {'lr': 6.373333333333333e-05, 'samples': 122496, 'steps': 239, 'loss/train': 5.935150146484375} -09/20/2021 15:18:59 - INFO - __main__ - Step 3829: {'lr': 6.373333333333333e-05, 'samples': 122528, 'steps': 239, 'loss/train': 5.586497783660889} -09/20/2021 15:19:00 - INFO - __main__ - Step 3830: {'lr': 6.373333333333333e-05, 'samples': 122560, 'steps': 239, 'loss/train': 6.372483253479004} -09/20/2021 15:19:01 - INFO - __main__ - Step 3831: {'lr': 6.373333333333333e-05, 'samples': 122592, 'steps': 239, 'loss/train': 5.24879264831543} -09/20/2021 15:19:01 - INFO - __main__ - Step 3832: {'lr': 6.373333333333333e-05, 'samples': 122624, 'steps': 239, 'loss/train': 6.242884159088135} -09/20/2021 15:19:02 - INFO - __main__ - Step 3833: {'lr': 6.373333333333333e-05, 'samples': 122656, 'steps': 239, 'loss/train': 5.573155403137207} -09/20/2021 15:19:03 - INFO - __main__ - Step 3834: {'lr': 6.373333333333333e-05, 'samples': 122688, 'steps': 239, 'loss/train': 5.985745906829834} -09/20/2021 15:19:04 - INFO - __main__ - Step 3835: {'lr': 6.373333333333333e-05, 'samples': 122720, 'steps': 239, 'loss/train': 6.133049488067627} -09/20/2021 15:19:04 - INFO - __main__ - Step 3836: {'lr': 6.373333333333333e-05, 'samples': 122752, 'steps': 239, 'loss/train': 6.208991527557373} -09/20/2021 15:19:05 - INFO - __main__ - Step 3837: {'lr': 6.373333333333333e-05, 'samples': 122784, 'steps': 239, 'loss/train': 6.4832916259765625} -09/20/2021 15:19:06 - INFO - __main__ - Step 3838: {'lr': 6.373333333333333e-05, 'samples': 122816, 'steps': 239, 'loss/train': 5.770963191986084} -09/20/2021 15:19:07 - INFO - __main__ - Step 3839: {'lr': 6.373333333333333e-05, 'samples': 122848, 'steps': 239, 'loss/train': 5.530559062957764} -09/20/2021 15:19:08 - INFO - __main__ - Step 3840: {'lr': 6.373333333333333e-05, 'samples': 122880, 'steps': 239, 'loss/train': 6.07515287399292} -09/20/2021 15:19:09 - INFO - __main__ - Step 3841: {'lr': 6.400000000000001e-05, 'samples': 122912, 'steps': 240, 'loss/train': 5.3113908767700195} -09/20/2021 15:19:10 - INFO - __main__ - Step 3842: {'lr': 6.400000000000001e-05, 'samples': 122944, 'steps': 240, 'loss/train': 6.007519721984863} -09/20/2021 15:19:10 - INFO - __main__ - Step 3843: {'lr': 6.400000000000001e-05, 'samples': 122976, 'steps': 240, 'loss/train': 5.404677867889404} -09/20/2021 15:19:11 - INFO - __main__ - Step 3844: {'lr': 6.400000000000001e-05, 'samples': 123008, 'steps': 240, 'loss/train': 6.176792621612549} -09/20/2021 15:19:12 - INFO - __main__ - Step 3845: {'lr': 6.400000000000001e-05, 'samples': 123040, 'steps': 240, 'loss/train': 6.389839172363281} -09/20/2021 15:19:13 - INFO - __main__ - Step 3846: {'lr': 6.400000000000001e-05, 'samples': 123072, 'steps': 240, 'loss/train': 5.515730381011963} -09/20/2021 15:19:13 - INFO - __main__ - Step 3847: {'lr': 6.400000000000001e-05, 'samples': 123104, 'steps': 240, 'loss/train': 6.023606300354004} -09/20/2021 15:19:14 - INFO - __main__ - Step 3848: {'lr': 6.400000000000001e-05, 'samples': 123136, 'steps': 240, 'loss/train': 6.614278316497803} -09/20/2021 15:19:15 - INFO - __main__ - Step 3849: {'lr': 6.400000000000001e-05, 'samples': 123168, 'steps': 240, 'loss/train': 3.0076041221618652} -09/20/2021 15:19:16 - INFO - __main__ - Step 3850: {'lr': 6.400000000000001e-05, 'samples': 123200, 'steps': 240, 'loss/train': 2.6946418285369873} -09/20/2021 15:19:16 - INFO - __main__ - Step 3851: {'lr': 6.400000000000001e-05, 'samples': 123232, 'steps': 240, 'loss/train': 5.6664934158325195} -09/20/2021 15:19:17 - INFO - __main__ - Step 3852: {'lr': 6.400000000000001e-05, 'samples': 123264, 'steps': 240, 'loss/train': 6.421703815460205} -09/20/2021 15:19:18 - INFO - __main__ - Step 3853: {'lr': 6.400000000000001e-05, 'samples': 123296, 'steps': 240, 'loss/train': 5.693647861480713} -09/20/2021 15:19:19 - INFO - __main__ - Step 3854: {'lr': 6.400000000000001e-05, 'samples': 123328, 'steps': 240, 'loss/train': 6.8177289962768555} -09/20/2021 15:19:19 - INFO - __main__ - Step 3855: {'lr': 6.400000000000001e-05, 'samples': 123360, 'steps': 240, 'loss/train': 5.323268413543701} -09/20/2021 15:19:20 - INFO - __main__ - Step 3856: {'lr': 6.400000000000001e-05, 'samples': 123392, 'steps': 240, 'loss/train': 5.406132698059082} -09/20/2021 15:19:21 - INFO - __main__ - Step 3857: {'lr': 6.426666666666668e-05, 'samples': 123424, 'steps': 241, 'loss/train': 4.150576591491699} -09/20/2021 15:19:22 - INFO - __main__ - Step 3858: {'lr': 6.426666666666668e-05, 'samples': 123456, 'steps': 241, 'loss/train': 5.405360221862793} -09/20/2021 15:19:22 - INFO - __main__ - Step 3859: {'lr': 6.426666666666668e-05, 'samples': 123488, 'steps': 241, 'loss/train': 6.62393856048584} -09/20/2021 15:19:23 - INFO - __main__ - Step 3860: {'lr': 6.426666666666668e-05, 'samples': 123520, 'steps': 241, 'loss/train': 5.575405120849609} -09/20/2021 15:19:24 - INFO - __main__ - Step 3861: {'lr': 6.426666666666668e-05, 'samples': 123552, 'steps': 241, 'loss/train': 5.520208835601807} -09/20/2021 15:19:25 - INFO - __main__ - Step 3862: {'lr': 6.426666666666668e-05, 'samples': 123584, 'steps': 241, 'loss/train': 5.588081359863281} -09/20/2021 15:19:25 - INFO - __main__ - Step 3863: {'lr': 6.426666666666668e-05, 'samples': 123616, 'steps': 241, 'loss/train': 5.345492362976074} -09/20/2021 15:19:26 - INFO - __main__ - Step 3864: {'lr': 6.426666666666668e-05, 'samples': 123648, 'steps': 241, 'loss/train': 5.130277633666992} -09/20/2021 15:19:27 - INFO - __main__ - Step 3865: {'lr': 6.426666666666668e-05, 'samples': 123680, 'steps': 241, 'loss/train': 5.466216087341309} -09/20/2021 15:19:28 - INFO - __main__ - Step 3866: {'lr': 6.426666666666668e-05, 'samples': 123712, 'steps': 241, 'loss/train': 5.444468021392822} -09/20/2021 15:19:28 - INFO - __main__ - Step 3867: {'lr': 6.426666666666668e-05, 'samples': 123744, 'steps': 241, 'loss/train': 6.18338680267334} -09/20/2021 15:19:29 - INFO - __main__ - Step 3868: {'lr': 6.426666666666668e-05, 'samples': 123776, 'steps': 241, 'loss/train': 5.351159572601318} -09/20/2021 15:19:30 - INFO - __main__ - Step 3869: {'lr': 6.426666666666668e-05, 'samples': 123808, 'steps': 241, 'loss/train': 6.295376777648926} -09/20/2021 15:19:31 - INFO - __main__ - Step 3870: {'lr': 6.426666666666668e-05, 'samples': 123840, 'steps': 241, 'loss/train': 7.46649694442749} -09/20/2021 15:19:32 - INFO - __main__ - Step 3871: {'lr': 6.426666666666668e-05, 'samples': 123872, 'steps': 241, 'loss/train': 7.236949443817139} -09/20/2021 15:19:33 - INFO - __main__ - Step 3872: {'lr': 6.426666666666668e-05, 'samples': 123904, 'steps': 241, 'loss/train': 4.69148063659668} -09/20/2021 15:19:34 - INFO - __main__ - Step 3873: {'lr': 6.453333333333333e-05, 'samples': 123936, 'steps': 242, 'loss/train': 5.406404495239258} -09/20/2021 15:19:35 - INFO - __main__ - Step 3874: {'lr': 6.453333333333333e-05, 'samples': 123968, 'steps': 242, 'loss/train': 6.0559258460998535} -09/20/2021 15:19:36 - INFO - __main__ - Step 3875: {'lr': 6.453333333333333e-05, 'samples': 124000, 'steps': 242, 'loss/train': 5.757380962371826} -09/20/2021 15:19:36 - INFO - __main__ - Step 3876: {'lr': 6.453333333333333e-05, 'samples': 124032, 'steps': 242, 'loss/train': 4.92398738861084} -09/20/2021 15:19:37 - INFO - __main__ - Step 3877: {'lr': 6.453333333333333e-05, 'samples': 124064, 'steps': 242, 'loss/train': 6.331212997436523} -09/20/2021 15:19:38 - INFO - __main__ - Step 3878: {'lr': 6.453333333333333e-05, 'samples': 124096, 'steps': 242, 'loss/train': 5.655849456787109} -09/20/2021 15:19:39 - INFO - __main__ - Step 3879: {'lr': 6.453333333333333e-05, 'samples': 124128, 'steps': 242, 'loss/train': 5.833495140075684} -09/20/2021 15:19:39 - INFO - __main__ - Step 3880: {'lr': 6.453333333333333e-05, 'samples': 124160, 'steps': 242, 'loss/train': 5.921886444091797} -09/20/2021 15:19:40 - INFO - __main__ - Step 3881: {'lr': 6.453333333333333e-05, 'samples': 124192, 'steps': 242, 'loss/train': 5.545573711395264} -09/20/2021 15:19:41 - INFO - __main__ - Step 3882: {'lr': 6.453333333333333e-05, 'samples': 124224, 'steps': 242, 'loss/train': 5.415772438049316} -09/20/2021 15:19:42 - INFO - __main__ - Step 3883: {'lr': 6.453333333333333e-05, 'samples': 124256, 'steps': 242, 'loss/train': 5.701204299926758} -09/20/2021 15:19:42 - INFO - __main__ - Step 3884: {'lr': 6.453333333333333e-05, 'samples': 124288, 'steps': 242, 'loss/train': 6.389959812164307} -09/20/2021 15:19:43 - INFO - __main__ - Step 3885: {'lr': 6.453333333333333e-05, 'samples': 124320, 'steps': 242, 'loss/train': 5.04066276550293} -09/20/2021 15:19:44 - INFO - __main__ - Step 3886: {'lr': 6.453333333333333e-05, 'samples': 124352, 'steps': 242, 'loss/train': 5.736823081970215} -09/20/2021 15:19:45 - INFO - __main__ - Step 3887: {'lr': 6.453333333333333e-05, 'samples': 124384, 'steps': 242, 'loss/train': 7.750133514404297} -09/20/2021 15:19:45 - INFO - __main__ - Step 3888: {'lr': 6.453333333333333e-05, 'samples': 124416, 'steps': 242, 'loss/train': 5.595031261444092} -09/20/2021 15:19:46 - INFO - __main__ - Step 3889: {'lr': 6.48e-05, 'samples': 124448, 'steps': 243, 'loss/train': 5.883978843688965} -09/20/2021 15:19:47 - INFO - __main__ - Step 3890: {'lr': 6.48e-05, 'samples': 124480, 'steps': 243, 'loss/train': 5.716435432434082} -09/20/2021 15:19:48 - INFO - __main__ - Step 3891: {'lr': 6.48e-05, 'samples': 124512, 'steps': 243, 'loss/train': 6.372438430786133} -09/20/2021 15:19:48 - INFO - __main__ - Step 3892: {'lr': 6.48e-05, 'samples': 124544, 'steps': 243, 'loss/train': 5.006877422332764} -09/20/2021 15:19:49 - INFO - __main__ - Step 3893: {'lr': 6.48e-05, 'samples': 124576, 'steps': 243, 'loss/train': 5.47763729095459} -09/20/2021 15:19:50 - INFO - __main__ - Step 3894: {'lr': 6.48e-05, 'samples': 124608, 'steps': 243, 'loss/train': 6.369289398193359} -09/20/2021 15:19:51 - INFO - __main__ - Step 3895: {'lr': 6.48e-05, 'samples': 124640, 'steps': 243, 'loss/train': 5.056110858917236} -09/20/2021 15:19:51 - INFO - __main__ - Step 3896: {'lr': 6.48e-05, 'samples': 124672, 'steps': 243, 'loss/train': 5.351711273193359} -09/20/2021 15:19:52 - INFO - __main__ - Step 3897: {'lr': 6.48e-05, 'samples': 124704, 'steps': 243, 'loss/train': 5.322361946105957} -09/20/2021 15:19:53 - INFO - __main__ - Step 3898: {'lr': 6.48e-05, 'samples': 124736, 'steps': 243, 'loss/train': 5.93291711807251} -09/20/2021 15:19:54 - INFO - __main__ - Step 3899: {'lr': 6.48e-05, 'samples': 124768, 'steps': 243, 'loss/train': 6.194584846496582} -09/20/2021 15:19:54 - INFO - __main__ - Step 3900: {'lr': 6.48e-05, 'samples': 124800, 'steps': 243, 'loss/train': 4.933460235595703} -09/20/2021 15:19:55 - INFO - __main__ - Step 3901: {'lr': 6.48e-05, 'samples': 124832, 'steps': 243, 'loss/train': 5.672712326049805} -09/20/2021 15:19:57 - INFO - __main__ - Step 3902: {'lr': 6.48e-05, 'samples': 124864, 'steps': 243, 'loss/train': 4.834049224853516} -09/20/2021 15:19:58 - INFO - __main__ - Step 3903: {'lr': 6.48e-05, 'samples': 124896, 'steps': 243, 'loss/train': 5.69187068939209} -09/20/2021 15:19:58 - INFO - __main__ - Step 3904: {'lr': 6.48e-05, 'samples': 124928, 'steps': 243, 'loss/train': 5.415924072265625} -09/20/2021 15:19:59 - INFO - __main__ - Step 3905: {'lr': 6.506666666666666e-05, 'samples': 124960, 'steps': 244, 'loss/train': 5.240459442138672} -09/20/2021 15:20:00 - INFO - __main__ - Step 3906: {'lr': 6.506666666666666e-05, 'samples': 124992, 'steps': 244, 'loss/train': 5.103694438934326} -09/20/2021 15:20:01 - INFO - __main__ - Step 3907: {'lr': 6.506666666666666e-05, 'samples': 125024, 'steps': 244, 'loss/train': 5.364474773406982} -09/20/2021 15:20:02 - INFO - __main__ - Step 3908: {'lr': 6.506666666666666e-05, 'samples': 125056, 'steps': 244, 'loss/train': 5.239205360412598} -09/20/2021 15:20:02 - INFO - __main__ - Step 3909: {'lr': 6.506666666666666e-05, 'samples': 125088, 'steps': 244, 'loss/train': 5.058754920959473} -09/20/2021 15:20:03 - INFO - __main__ - Step 3910: {'lr': 6.506666666666666e-05, 'samples': 125120, 'steps': 244, 'loss/train': 5.205142021179199} -09/20/2021 15:20:04 - INFO - __main__ - Step 3911: {'lr': 6.506666666666666e-05, 'samples': 125152, 'steps': 244, 'loss/train': 5.488426685333252} -09/20/2021 15:20:05 - INFO - __main__ - Step 3912: {'lr': 6.506666666666666e-05, 'samples': 125184, 'steps': 244, 'loss/train': 5.9357500076293945} -09/20/2021 15:20:05 - INFO - __main__ - Step 3913: {'lr': 6.506666666666666e-05, 'samples': 125216, 'steps': 244, 'loss/train': 5.800868034362793} -09/20/2021 15:20:06 - INFO - __main__ - Step 3914: {'lr': 6.506666666666666e-05, 'samples': 125248, 'steps': 244, 'loss/train': 5.532899856567383} -09/20/2021 15:20:07 - INFO - __main__ - Step 3915: {'lr': 6.506666666666666e-05, 'samples': 125280, 'steps': 244, 'loss/train': 5.795613765716553} -09/20/2021 15:20:08 - INFO - __main__ - Step 3916: {'lr': 6.506666666666666e-05, 'samples': 125312, 'steps': 244, 'loss/train': 5.301483631134033} -09/20/2021 15:20:08 - INFO - __main__ - Step 3917: {'lr': 6.506666666666666e-05, 'samples': 125344, 'steps': 244, 'loss/train': 4.7513203620910645} -09/20/2021 15:20:09 - INFO - __main__ - Step 3918: {'lr': 6.506666666666666e-05, 'samples': 125376, 'steps': 244, 'loss/train': 6.1378583908081055} -09/20/2021 15:20:10 - INFO - __main__ - Step 3919: {'lr': 6.506666666666666e-05, 'samples': 125408, 'steps': 244, 'loss/train': 7.193597793579102} -09/20/2021 15:20:11 - INFO - __main__ - Step 3920: {'lr': 6.506666666666666e-05, 'samples': 125440, 'steps': 244, 'loss/train': 6.15313720703125} -09/20/2021 15:20:12 - INFO - __main__ - Step 3921: {'lr': 6.533333333333334e-05, 'samples': 125472, 'steps': 245, 'loss/train': 5.6343889236450195} -09/20/2021 15:20:12 - INFO - __main__ - Step 3922: {'lr': 6.533333333333334e-05, 'samples': 125504, 'steps': 245, 'loss/train': 5.666740894317627} -09/20/2021 15:20:13 - INFO - __main__ - Step 3923: {'lr': 6.533333333333334e-05, 'samples': 125536, 'steps': 245, 'loss/train': 5.705801010131836} -09/20/2021 15:20:14 - INFO - __main__ - Step 3924: {'lr': 6.533333333333334e-05, 'samples': 125568, 'steps': 245, 'loss/train': 5.542792797088623} -09/20/2021 15:20:15 - INFO - __main__ - Step 3925: {'lr': 6.533333333333334e-05, 'samples': 125600, 'steps': 245, 'loss/train': 5.509735107421875} -09/20/2021 15:20:15 - INFO - __main__ - Step 3926: {'lr': 6.533333333333334e-05, 'samples': 125632, 'steps': 245, 'loss/train': 5.62032413482666} -09/20/2021 15:20:16 - INFO - __main__ - Step 3927: {'lr': 6.533333333333334e-05, 'samples': 125664, 'steps': 245, 'loss/train': 0.8878492712974548} -09/20/2021 15:20:17 - INFO - __main__ - Step 3928: {'lr': 6.533333333333334e-05, 'samples': 125696, 'steps': 245, 'loss/train': 5.59294319152832} -09/20/2021 15:20:18 - INFO - __main__ - Step 3929: {'lr': 6.533333333333334e-05, 'samples': 125728, 'steps': 245, 'loss/train': 5.799490451812744} -09/20/2021 15:20:18 - INFO - __main__ - Step 3930: {'lr': 6.533333333333334e-05, 'samples': 125760, 'steps': 245, 'loss/train': 6.049159526824951} -09/20/2021 15:20:19 - INFO - __main__ - Step 3931: {'lr': 6.533333333333334e-05, 'samples': 125792, 'steps': 245, 'loss/train': 5.510241985321045} -09/20/2021 15:20:20 - INFO - __main__ - Step 3932: {'lr': 6.533333333333334e-05, 'samples': 125824, 'steps': 245, 'loss/train': 3.876382350921631} -09/20/2021 15:20:21 - INFO - __main__ - Step 3933: {'lr': 6.533333333333334e-05, 'samples': 125856, 'steps': 245, 'loss/train': 4.581949710845947} -09/20/2021 15:20:21 - INFO - __main__ - Step 3934: {'lr': 6.533333333333334e-05, 'samples': 125888, 'steps': 245, 'loss/train': 3.9767582416534424} -09/20/2021 15:20:22 - INFO - __main__ - Step 3935: {'lr': 6.533333333333334e-05, 'samples': 125920, 'steps': 245, 'loss/train': 4.132674217224121} -09/20/2021 15:20:23 - INFO - __main__ - Step 3936: {'lr': 6.533333333333334e-05, 'samples': 125952, 'steps': 245, 'loss/train': 4.57648229598999} -09/20/2021 15:20:24 - INFO - __main__ - Step 3937: {'lr': 6.560000000000001e-05, 'samples': 125984, 'steps': 246, 'loss/train': 6.173035144805908} -09/20/2021 15:20:25 - INFO - __main__ - Step 3938: {'lr': 6.560000000000001e-05, 'samples': 126016, 'steps': 246, 'loss/train': 3.4986982345581055} -09/20/2021 15:20:26 - INFO - __main__ - Step 3939: {'lr': 6.560000000000001e-05, 'samples': 126048, 'steps': 246, 'loss/train': 5.18153190612793} -09/20/2021 15:20:27 - INFO - __main__ - Step 3940: {'lr': 6.560000000000001e-05, 'samples': 126080, 'steps': 246, 'loss/train': 5.605130672454834} -09/20/2021 15:20:27 - INFO - __main__ - Step 3941: {'lr': 6.560000000000001e-05, 'samples': 126112, 'steps': 246, 'loss/train': 6.154917240142822} -09/20/2021 15:20:28 - INFO - __main__ - Step 3942: {'lr': 6.560000000000001e-05, 'samples': 126144, 'steps': 246, 'loss/train': 5.009115695953369} -09/20/2021 15:20:29 - INFO - __main__ - Step 3943: {'lr': 6.560000000000001e-05, 'samples': 126176, 'steps': 246, 'loss/train': 6.45194149017334} -09/20/2021 15:20:30 - INFO - __main__ - Step 3944: {'lr': 6.560000000000001e-05, 'samples': 126208, 'steps': 246, 'loss/train': 5.409929275512695} -09/20/2021 15:20:30 - INFO - __main__ - Step 3945: {'lr': 6.560000000000001e-05, 'samples': 126240, 'steps': 246, 'loss/train': 6.964240550994873} -09/20/2021 15:20:31 - INFO - __main__ - Step 3946: {'lr': 6.560000000000001e-05, 'samples': 126272, 'steps': 246, 'loss/train': 6.207835674285889} -09/20/2021 15:20:32 - INFO - __main__ - Step 3947: {'lr': 6.560000000000001e-05, 'samples': 126304, 'steps': 246, 'loss/train': 5.423651695251465} -09/20/2021 15:20:33 - INFO - __main__ - Step 3948: {'lr': 6.560000000000001e-05, 'samples': 126336, 'steps': 246, 'loss/train': 5.3500285148620605} -09/20/2021 15:20:33 - INFO - __main__ - Step 3949: {'lr': 6.560000000000001e-05, 'samples': 126368, 'steps': 246, 'loss/train': 4.736054420471191} -09/20/2021 15:20:34 - INFO - __main__ - Step 3950: {'lr': 6.560000000000001e-05, 'samples': 126400, 'steps': 246, 'loss/train': 5.851919651031494} -09/20/2021 15:20:35 - INFO - __main__ - Step 3951: {'lr': 6.560000000000001e-05, 'samples': 126432, 'steps': 246, 'loss/train': 5.802483081817627} -09/20/2021 15:20:36 - INFO - __main__ - Step 3952: {'lr': 6.560000000000001e-05, 'samples': 126464, 'steps': 246, 'loss/train': 5.539889335632324} -09/20/2021 15:20:36 - INFO - __main__ - Step 3953: {'lr': 6.586666666666666e-05, 'samples': 126496, 'steps': 247, 'loss/train': 6.404880046844482} -09/20/2021 15:20:37 - INFO - __main__ - Step 3954: {'lr': 6.586666666666666e-05, 'samples': 126528, 'steps': 247, 'loss/train': 6.2978196144104} -09/20/2021 15:20:38 - INFO - __main__ - Step 3955: {'lr': 6.586666666666666e-05, 'samples': 126560, 'steps': 247, 'loss/train': 5.436906814575195} -09/20/2021 15:20:39 - INFO - __main__ - Step 3956: {'lr': 6.586666666666666e-05, 'samples': 126592, 'steps': 247, 'loss/train': 6.0330400466918945} -09/20/2021 15:20:39 - INFO - __main__ - Step 3957: {'lr': 6.586666666666666e-05, 'samples': 126624, 'steps': 247, 'loss/train': 5.4937872886657715} -09/20/2021 15:20:40 - INFO - __main__ - Step 3958: {'lr': 6.586666666666666e-05, 'samples': 126656, 'steps': 247, 'loss/train': 5.568051338195801} -09/20/2021 15:20:41 - INFO - __main__ - Step 3959: {'lr': 6.586666666666666e-05, 'samples': 126688, 'steps': 247, 'loss/train': 6.2291669845581055} -09/20/2021 15:20:42 - INFO - __main__ - Step 3960: {'lr': 6.586666666666666e-05, 'samples': 126720, 'steps': 247, 'loss/train': 5.4485602378845215} -09/20/2021 15:20:42 - INFO - __main__ - Step 3961: {'lr': 6.586666666666666e-05, 'samples': 126752, 'steps': 247, 'loss/train': 5.213764190673828} -09/20/2021 15:20:43 - INFO - __main__ - Step 3962: {'lr': 6.586666666666666e-05, 'samples': 126784, 'steps': 247, 'loss/train': 6.672460079193115} -09/20/2021 15:20:44 - INFO - __main__ - Step 3963: {'lr': 6.586666666666666e-05, 'samples': 126816, 'steps': 247, 'loss/train': 5.809399127960205} -09/20/2021 15:20:45 - INFO - __main__ - Step 3964: {'lr': 6.586666666666666e-05, 'samples': 126848, 'steps': 247, 'loss/train': 5.580756187438965} -09/20/2021 15:20:45 - INFO - __main__ - Step 3965: {'lr': 6.586666666666666e-05, 'samples': 126880, 'steps': 247, 'loss/train': 5.596133708953857} -09/20/2021 15:20:46 - INFO - __main__ - Step 3966: {'lr': 6.586666666666666e-05, 'samples': 126912, 'steps': 247, 'loss/train': 5.912768840789795} -09/20/2021 15:20:47 - INFO - __main__ - Step 3967: {'lr': 6.586666666666666e-05, 'samples': 126944, 'steps': 247, 'loss/train': 5.623694896697998} -09/20/2021 15:20:48 - INFO - __main__ - Step 3968: {'lr': 6.586666666666666e-05, 'samples': 126976, 'steps': 247, 'loss/train': 6.112414836883545} -09/20/2021 15:20:49 - INFO - __main__ - Step 3969: {'lr': 6.613333333333333e-05, 'samples': 127008, 'steps': 248, 'loss/train': 5.130025863647461} -09/20/2021 15:20:50 - INFO - __main__ - Step 3970: {'lr': 6.613333333333333e-05, 'samples': 127040, 'steps': 248, 'loss/train': 5.706536293029785} -09/20/2021 15:20:51 - INFO - __main__ - Step 3971: {'lr': 6.613333333333333e-05, 'samples': 127072, 'steps': 248, 'loss/train': 5.652656078338623} -09/20/2021 15:20:51 - INFO - __main__ - Step 3972: {'lr': 6.613333333333333e-05, 'samples': 127104, 'steps': 248, 'loss/train': 4.984909534454346} -09/20/2021 15:20:52 - INFO - __main__ - Step 3973: {'lr': 6.613333333333333e-05, 'samples': 127136, 'steps': 248, 'loss/train': 5.473530292510986} -09/20/2021 15:20:53 - INFO - __main__ - Step 3974: {'lr': 6.613333333333333e-05, 'samples': 127168, 'steps': 248, 'loss/train': 5.188750267028809} -09/20/2021 15:20:54 - INFO - __main__ - Step 3975: {'lr': 6.613333333333333e-05, 'samples': 127200, 'steps': 248, 'loss/train': 5.261286735534668} -09/20/2021 15:20:54 - INFO - __main__ - Step 3976: {'lr': 6.613333333333333e-05, 'samples': 127232, 'steps': 248, 'loss/train': 5.169721603393555} -09/20/2021 15:20:55 - INFO - __main__ - Step 3977: {'lr': 6.613333333333333e-05, 'samples': 127264, 'steps': 248, 'loss/train': 5.235636234283447} -09/20/2021 15:20:56 - INFO - __main__ - Step 3978: {'lr': 6.613333333333333e-05, 'samples': 127296, 'steps': 248, 'loss/train': 4.956790447235107} -09/20/2021 15:20:57 - INFO - __main__ - Step 3979: {'lr': 6.613333333333333e-05, 'samples': 127328, 'steps': 248, 'loss/train': 5.456563949584961} -09/20/2021 15:20:57 - INFO - __main__ - Step 3980: {'lr': 6.613333333333333e-05, 'samples': 127360, 'steps': 248, 'loss/train': 0.8804845809936523} -09/20/2021 15:20:58 - INFO - __main__ - Step 3981: {'lr': 6.613333333333333e-05, 'samples': 127392, 'steps': 248, 'loss/train': 5.57061243057251} -09/20/2021 15:20:59 - INFO - __main__ - Step 3982: {'lr': 6.613333333333333e-05, 'samples': 127424, 'steps': 248, 'loss/train': 5.958280086517334} -09/20/2021 15:21:00 - INFO - __main__ - Step 3983: {'lr': 6.613333333333333e-05, 'samples': 127456, 'steps': 248, 'loss/train': 6.192836284637451} -09/20/2021 15:21:00 - INFO - __main__ - Step 3984: {'lr': 6.613333333333333e-05, 'samples': 127488, 'steps': 248, 'loss/train': 5.164173126220703} -09/20/2021 15:21:01 - INFO - __main__ - Step 3985: {'lr': 6.64e-05, 'samples': 127520, 'steps': 249, 'loss/train': 5.34039831161499} -09/20/2021 15:21:02 - INFO - __main__ - Step 3986: {'lr': 6.64e-05, 'samples': 127552, 'steps': 249, 'loss/train': 5.445080757141113} -09/20/2021 15:21:03 - INFO - __main__ - Step 3987: {'lr': 6.64e-05, 'samples': 127584, 'steps': 249, 'loss/train': 7.247925758361816} -09/20/2021 15:21:04 - INFO - __main__ - Step 3988: {'lr': 6.64e-05, 'samples': 127616, 'steps': 249, 'loss/train': 7.255225658416748} -09/20/2021 15:21:04 - INFO - __main__ - Step 3989: {'lr': 6.64e-05, 'samples': 127648, 'steps': 249, 'loss/train': 7.350756645202637} -09/20/2021 15:21:05 - INFO - __main__ - Step 3990: {'lr': 6.64e-05, 'samples': 127680, 'steps': 249, 'loss/train': 7.396363258361816} -09/20/2021 15:21:06 - INFO - __main__ - Step 3991: {'lr': 6.64e-05, 'samples': 127712, 'steps': 249, 'loss/train': 6.256543159484863} -09/20/2021 15:21:07 - INFO - __main__ - Step 3992: {'lr': 6.64e-05, 'samples': 127744, 'steps': 249, 'loss/train': 7.552675247192383} -09/20/2021 15:21:07 - INFO - __main__ - Step 3993: {'lr': 6.64e-05, 'samples': 127776, 'steps': 249, 'loss/train': 5.495728969573975} -09/20/2021 15:21:08 - INFO - __main__ - Step 3994: {'lr': 6.64e-05, 'samples': 127808, 'steps': 249, 'loss/train': 5.988507270812988} -09/20/2021 15:21:09 - INFO - __main__ - Step 3995: {'lr': 6.64e-05, 'samples': 127840, 'steps': 249, 'loss/train': 5.899311542510986} -09/20/2021 15:21:10 - INFO - __main__ - Step 3996: {'lr': 6.64e-05, 'samples': 127872, 'steps': 249, 'loss/train': 5.673116683959961} -09/20/2021 15:21:10 - INFO - __main__ - Step 3997: {'lr': 6.64e-05, 'samples': 127904, 'steps': 249, 'loss/train': 4.572505950927734} -09/20/2021 15:21:11 - INFO - __main__ - Step 3998: {'lr': 6.64e-05, 'samples': 127936, 'steps': 249, 'loss/train': 6.698160648345947} -09/20/2021 15:21:12 - INFO - __main__ - Step 3999: {'lr': 6.64e-05, 'samples': 127968, 'steps': 249, 'loss/train': 6.2935404777526855} -09/20/2021 15:21:13 - INFO - __main__ - Step 4000: {'lr': 6.64e-05, 'samples': 128000, 'steps': 249, 'loss/train': 5.559673309326172} -09/20/2021 15:21:13 - INFO - __main__ - Step 4001: {'lr': 6.666666666666667e-05, 'samples': 128032, 'steps': 250, 'loss/train': 5.60994291305542} -09/20/2021 15:21:14 - INFO - __main__ - Step 4002: {'lr': 6.666666666666667e-05, 'samples': 128064, 'steps': 250, 'loss/train': 5.810640811920166} -09/20/2021 15:21:16 - INFO - __main__ - Step 4003: {'lr': 6.666666666666667e-05, 'samples': 128096, 'steps': 250, 'loss/train': 6.066250801086426} -09/20/2021 15:21:16 - INFO - __main__ - Step 4004: {'lr': 6.666666666666667e-05, 'samples': 128128, 'steps': 250, 'loss/train': 4.050546646118164} -09/20/2021 15:21:17 - INFO - __main__ - Step 4005: {'lr': 6.666666666666667e-05, 'samples': 128160, 'steps': 250, 'loss/train': 6.59076452255249} -09/20/2021 15:21:18 - INFO - __main__ - Step 4006: {'lr': 6.666666666666667e-05, 'samples': 128192, 'steps': 250, 'loss/train': 5.26745080947876} -09/20/2021 15:21:19 - INFO - __main__ - Step 4007: {'lr': 6.666666666666667e-05, 'samples': 128224, 'steps': 250, 'loss/train': 5.264621734619141} -09/20/2021 15:21:19 - INFO - __main__ - Step 4008: {'lr': 6.666666666666667e-05, 'samples': 128256, 'steps': 250, 'loss/train': 5.742919445037842} -09/20/2021 15:21:20 - INFO - __main__ - Step 4009: {'lr': 6.666666666666667e-05, 'samples': 128288, 'steps': 250, 'loss/train': 6.226856708526611} -09/20/2021 15:21:21 - INFO - __main__ - Step 4010: {'lr': 6.666666666666667e-05, 'samples': 128320, 'steps': 250, 'loss/train': 5.710068225860596} -09/20/2021 15:21:22 - INFO - __main__ - Step 4011: {'lr': 6.666666666666667e-05, 'samples': 128352, 'steps': 250, 'loss/train': 5.83457088470459} -09/20/2021 15:21:22 - INFO - __main__ - Step 4012: {'lr': 6.666666666666667e-05, 'samples': 128384, 'steps': 250, 'loss/train': 5.628114700317383} -09/20/2021 15:21:23 - INFO - __main__ - Step 4013: {'lr': 6.666666666666667e-05, 'samples': 128416, 'steps': 250, 'loss/train': 5.373640537261963} -09/20/2021 15:21:24 - INFO - __main__ - Step 4014: {'lr': 6.666666666666667e-05, 'samples': 128448, 'steps': 250, 'loss/train': 6.741521835327148} -09/20/2021 15:21:25 - INFO - __main__ - Step 4015: {'lr': 6.666666666666667e-05, 'samples': 128480, 'steps': 250, 'loss/train': 6.691746234893799} -09/20/2021 15:21:25 - INFO - __main__ - Step 4016: {'lr': 6.666666666666667e-05, 'samples': 128512, 'steps': 250, 'loss/train': 5.019698619842529} -09/20/2021 15:21:26 - INFO - __main__ - Step 4017: {'lr': 6.693333333333334e-05, 'samples': 128544, 'steps': 251, 'loss/train': 5.571440696716309} -09/20/2021 15:21:27 - INFO - __main__ - Step 4018: {'lr': 6.693333333333334e-05, 'samples': 128576, 'steps': 251, 'loss/train': 5.410815238952637} -09/20/2021 15:21:28 - INFO - __main__ - Step 4019: {'lr': 6.693333333333334e-05, 'samples': 128608, 'steps': 251, 'loss/train': 4.535571098327637} -09/20/2021 15:21:28 - INFO - __main__ - Step 4020: {'lr': 6.693333333333334e-05, 'samples': 128640, 'steps': 251, 'loss/train': 5.160256385803223} -09/20/2021 15:21:29 - INFO - __main__ - Step 4021: {'lr': 6.693333333333334e-05, 'samples': 128672, 'steps': 251, 'loss/train': 6.713772773742676} -09/20/2021 15:21:30 - INFO - __main__ - Step 4022: {'lr': 6.693333333333334e-05, 'samples': 128704, 'steps': 251, 'loss/train': 5.712887287139893} -09/20/2021 15:21:31 - INFO - __main__ - Step 4023: {'lr': 6.693333333333334e-05, 'samples': 128736, 'steps': 251, 'loss/train': 5.840760231018066} -09/20/2021 15:21:31 - INFO - __main__ - Step 4024: {'lr': 6.693333333333334e-05, 'samples': 128768, 'steps': 251, 'loss/train': 5.073295593261719} -09/20/2021 15:21:32 - INFO - __main__ - Step 4025: {'lr': 6.693333333333334e-05, 'samples': 128800, 'steps': 251, 'loss/train': 5.2835516929626465} -09/20/2021 15:21:33 - INFO - __main__ - Step 4026: {'lr': 6.693333333333334e-05, 'samples': 128832, 'steps': 251, 'loss/train': 5.827837944030762} -09/20/2021 15:21:34 - INFO - __main__ - Step 4027: {'lr': 6.693333333333334e-05, 'samples': 128864, 'steps': 251, 'loss/train': 5.367954730987549} -09/20/2021 15:21:34 - INFO - __main__ - Step 4028: {'lr': 6.693333333333334e-05, 'samples': 128896, 'steps': 251, 'loss/train': 4.827786922454834} -09/20/2021 15:21:35 - INFO - __main__ - Step 4029: {'lr': 6.693333333333334e-05, 'samples': 128928, 'steps': 251, 'loss/train': 5.162095546722412} -09/20/2021 15:21:36 - INFO - __main__ - Step 4030: {'lr': 6.693333333333334e-05, 'samples': 128960, 'steps': 251, 'loss/train': 5.611853122711182} -09/20/2021 15:21:37 - INFO - __main__ - Step 4031: {'lr': 6.693333333333334e-05, 'samples': 128992, 'steps': 251, 'loss/train': 6.061139106750488} -09/20/2021 15:21:37 - INFO - __main__ - Step 4032: {'lr': 6.693333333333334e-05, 'samples': 129024, 'steps': 251, 'loss/train': 5.201991558074951} -09/20/2021 15:21:38 - INFO - __main__ - Step 4033: {'lr': 6.720000000000001e-05, 'samples': 129056, 'steps': 252, 'loss/train': 5.572150230407715} -09/20/2021 15:21:39 - INFO - __main__ - Step 4034: {'lr': 6.720000000000001e-05, 'samples': 129088, 'steps': 252, 'loss/train': 5.564417839050293} -09/20/2021 15:21:40 - INFO - __main__ - Step 4035: {'lr': 6.720000000000001e-05, 'samples': 129120, 'steps': 252, 'loss/train': 3.9955079555511475} -09/20/2021 15:21:41 - INFO - __main__ - Step 4036: {'lr': 6.720000000000001e-05, 'samples': 129152, 'steps': 252, 'loss/train': 5.05230188369751} -09/20/2021 15:21:42 - INFO - __main__ - Step 4037: {'lr': 6.720000000000001e-05, 'samples': 129184, 'steps': 252, 'loss/train': 6.420419692993164} -09/20/2021 15:21:43 - INFO - __main__ - Step 4038: {'lr': 6.720000000000001e-05, 'samples': 129216, 'steps': 252, 'loss/train': 5.189384460449219} -09/20/2021 15:21:43 - INFO - __main__ - Step 4039: {'lr': 6.720000000000001e-05, 'samples': 129248, 'steps': 252, 'loss/train': 6.025969505310059} -09/20/2021 15:21:44 - INFO - __main__ - Step 4040: {'lr': 6.720000000000001e-05, 'samples': 129280, 'steps': 252, 'loss/train': 6.382761001586914} -09/20/2021 15:21:45 - INFO - __main__ - Step 4041: {'lr': 6.720000000000001e-05, 'samples': 129312, 'steps': 252, 'loss/train': 5.552805423736572} -09/20/2021 15:21:46 - INFO - __main__ - Step 4042: {'lr': 6.720000000000001e-05, 'samples': 129344, 'steps': 252, 'loss/train': 5.247740268707275} -09/20/2021 15:21:46 - INFO - __main__ - Step 4043: {'lr': 6.720000000000001e-05, 'samples': 129376, 'steps': 252, 'loss/train': 6.131734848022461} -09/20/2021 15:21:47 - INFO - __main__ - Step 4044: {'lr': 6.720000000000001e-05, 'samples': 129408, 'steps': 252, 'loss/train': 4.576050758361816} -09/20/2021 15:21:48 - INFO - __main__ - Step 4045: {'lr': 6.720000000000001e-05, 'samples': 129440, 'steps': 252, 'loss/train': 5.433841228485107} -09/20/2021 15:21:49 - INFO - __main__ - Step 4046: {'lr': 6.720000000000001e-05, 'samples': 129472, 'steps': 252, 'loss/train': 5.593077182769775} -09/20/2021 15:21:49 - INFO - __main__ - Step 4047: {'lr': 6.720000000000001e-05, 'samples': 129504, 'steps': 252, 'loss/train': 5.776475429534912} -09/20/2021 15:21:50 - INFO - __main__ - Step 4048: {'lr': 6.720000000000001e-05, 'samples': 129536, 'steps': 252, 'loss/train': 5.565225124359131} -09/20/2021 15:21:51 - INFO - __main__ - Step 4049: {'lr': 6.746666666666666e-05, 'samples': 129568, 'steps': 253, 'loss/train': 5.481166362762451} -09/20/2021 15:21:52 - INFO - __main__ - Step 4050: {'lr': 6.746666666666666e-05, 'samples': 129600, 'steps': 253, 'loss/train': 5.439233303070068} -09/20/2021 15:21:52 - INFO - __main__ - Step 4051: {'lr': 6.746666666666666e-05, 'samples': 129632, 'steps': 253, 'loss/train': 6.002931118011475} -09/20/2021 15:21:53 - INFO - __main__ - Step 4052: {'lr': 6.746666666666666e-05, 'samples': 129664, 'steps': 253, 'loss/train': 6.014723300933838} -09/20/2021 15:21:54 - INFO - __main__ - Step 4053: {'lr': 6.746666666666666e-05, 'samples': 129696, 'steps': 253, 'loss/train': 5.135450839996338} -09/20/2021 15:21:55 - INFO - __main__ - Step 4054: {'lr': 6.746666666666666e-05, 'samples': 129728, 'steps': 253, 'loss/train': 6.105199337005615} -09/20/2021 15:21:55 - INFO - __main__ - Step 4055: {'lr': 6.746666666666666e-05, 'samples': 129760, 'steps': 253, 'loss/train': 6.009659290313721} -09/20/2021 15:21:56 - INFO - __main__ - Step 4056: {'lr': 6.746666666666666e-05, 'samples': 129792, 'steps': 253, 'loss/train': 5.432352542877197} -09/20/2021 15:21:57 - INFO - __main__ - Step 4057: {'lr': 6.746666666666666e-05, 'samples': 129824, 'steps': 253, 'loss/train': 5.74725341796875} -09/20/2021 15:21:58 - INFO - __main__ - Step 4058: {'lr': 6.746666666666666e-05, 'samples': 129856, 'steps': 253, 'loss/train': 6.352019786834717} -09/20/2021 15:21:58 - INFO - __main__ - Step 4059: {'lr': 6.746666666666666e-05, 'samples': 129888, 'steps': 253, 'loss/train': 5.294723987579346} -09/20/2021 15:21:59 - INFO - __main__ - Step 4060: {'lr': 6.746666666666666e-05, 'samples': 129920, 'steps': 253, 'loss/train': 5.791189670562744} -09/20/2021 15:22:00 - INFO - __main__ - Step 4061: {'lr': 6.746666666666666e-05, 'samples': 129952, 'steps': 253, 'loss/train': 4.939887046813965} -09/20/2021 15:22:01 - INFO - __main__ - Step 4062: {'lr': 6.746666666666666e-05, 'samples': 129984, 'steps': 253, 'loss/train': 6.236031532287598} -09/20/2021 15:22:01 - INFO - __main__ - Step 4063: {'lr': 6.746666666666666e-05, 'samples': 130016, 'steps': 253, 'loss/train': 6.293827056884766} -09/20/2021 15:22:02 - INFO - __main__ - Step 4064: {'lr': 6.746666666666666e-05, 'samples': 130048, 'steps': 253, 'loss/train': 6.449406147003174} -09/20/2021 15:22:03 - INFO - __main__ - Step 4065: {'lr': 6.773333333333333e-05, 'samples': 130080, 'steps': 254, 'loss/train': 6.005726337432861} -09/20/2021 15:22:04 - INFO - __main__ - Step 4066: {'lr': 6.773333333333333e-05, 'samples': 130112, 'steps': 254, 'loss/train': 5.719218730926514} -09/20/2021 15:22:05 - INFO - __main__ - Step 4067: {'lr': 6.773333333333333e-05, 'samples': 130144, 'steps': 254, 'loss/train': 4.915843963623047} -09/20/2021 15:22:06 - INFO - __main__ - Step 4068: {'lr': 6.773333333333333e-05, 'samples': 130176, 'steps': 254, 'loss/train': 5.564783096313477} -09/20/2021 15:22:07 - INFO - __main__ - Step 4069: {'lr': 6.773333333333333e-05, 'samples': 130208, 'steps': 254, 'loss/train': 5.946286678314209} -09/20/2021 15:22:07 - INFO - __main__ - Step 4070: {'lr': 6.773333333333333e-05, 'samples': 130240, 'steps': 254, 'loss/train': 6.8529372215271} -09/20/2021 15:22:08 - INFO - __main__ - Step 4071: {'lr': 6.773333333333333e-05, 'samples': 130272, 'steps': 254, 'loss/train': 5.795254707336426} -09/20/2021 15:22:09 - INFO - __main__ - Step 4072: {'lr': 6.773333333333333e-05, 'samples': 130304, 'steps': 254, 'loss/train': 5.262046813964844} -09/20/2021 15:22:10 - INFO - __main__ - Step 4073: {'lr': 6.773333333333333e-05, 'samples': 130336, 'steps': 254, 'loss/train': 5.437093257904053} -09/20/2021 15:22:10 - INFO - __main__ - Step 4074: {'lr': 6.773333333333333e-05, 'samples': 130368, 'steps': 254, 'loss/train': 5.808574199676514} -09/20/2021 15:22:11 - INFO - __main__ - Step 4075: {'lr': 6.773333333333333e-05, 'samples': 130400, 'steps': 254, 'loss/train': 5.83043098449707} -09/20/2021 15:22:12 - INFO - __main__ - Step 4076: {'lr': 6.773333333333333e-05, 'samples': 130432, 'steps': 254, 'loss/train': 5.709782600402832} -09/20/2021 15:22:13 - INFO - __main__ - Step 4077: {'lr': 6.773333333333333e-05, 'samples': 130464, 'steps': 254, 'loss/train': 5.062604904174805} -09/20/2021 15:22:13 - INFO - __main__ - Step 4078: {'lr': 6.773333333333333e-05, 'samples': 130496, 'steps': 254, 'loss/train': 5.439661502838135} -09/20/2021 15:22:14 - INFO - __main__ - Step 4079: {'lr': 6.773333333333333e-05, 'samples': 130528, 'steps': 254, 'loss/train': 5.505727291107178} -09/20/2021 15:22:15 - INFO - __main__ - Step 4080: {'lr': 6.773333333333333e-05, 'samples': 130560, 'steps': 254, 'loss/train': 5.987401008605957} -09/20/2021 15:22:16 - INFO - __main__ - Step 4081: {'lr': 6.800000000000001e-05, 'samples': 130592, 'steps': 255, 'loss/train': 5.7451653480529785} -09/20/2021 15:22:17 - INFO - __main__ - Step 4082: {'lr': 6.800000000000001e-05, 'samples': 130624, 'steps': 255, 'loss/train': 6.262058734893799} -09/20/2021 15:22:17 - INFO - __main__ - Step 4083: {'lr': 6.800000000000001e-05, 'samples': 130656, 'steps': 255, 'loss/train': 5.378565788269043} -09/20/2021 15:22:18 - INFO - __main__ - Step 4084: {'lr': 6.800000000000001e-05, 'samples': 130688, 'steps': 255, 'loss/train': 5.351409912109375} -09/20/2021 15:22:19 - INFO - __main__ - Step 4085: {'lr': 6.800000000000001e-05, 'samples': 130720, 'steps': 255, 'loss/train': 5.580038070678711} -09/20/2021 15:22:20 - INFO - __main__ - Step 4086: {'lr': 6.800000000000001e-05, 'samples': 130752, 'steps': 255, 'loss/train': 5.533458232879639} -09/20/2021 15:22:20 - INFO - __main__ - Step 4087: {'lr': 6.800000000000001e-05, 'samples': 130784, 'steps': 255, 'loss/train': 6.133034706115723} -09/20/2021 15:22:21 - INFO - __main__ - Step 4088: {'lr': 6.800000000000001e-05, 'samples': 130816, 'steps': 255, 'loss/train': 5.872997760772705} -09/20/2021 15:22:22 - INFO - __main__ - Step 4089: {'lr': 6.800000000000001e-05, 'samples': 130848, 'steps': 255, 'loss/train': 6.100282192230225} -09/20/2021 15:22:23 - INFO - __main__ - Step 4090: {'lr': 6.800000000000001e-05, 'samples': 130880, 'steps': 255, 'loss/train': 4.915903091430664} -09/20/2021 15:22:23 - INFO - __main__ - Step 4091: {'lr': 6.800000000000001e-05, 'samples': 130912, 'steps': 255, 'loss/train': 5.353174686431885} -09/20/2021 15:22:24 - INFO - __main__ - Step 4092: {'lr': 6.800000000000001e-05, 'samples': 130944, 'steps': 255, 'loss/train': 5.194579124450684} -09/20/2021 15:22:25 - INFO - __main__ - Step 4093: {'lr': 6.800000000000001e-05, 'samples': 130976, 'steps': 255, 'loss/train': 3.46362566947937} -09/20/2021 15:22:26 - INFO - __main__ - Step 4094: {'lr': 6.800000000000001e-05, 'samples': 131008, 'steps': 255, 'loss/train': 4.846240997314453} -09/20/2021 15:22:26 - INFO - __main__ - Step 4095: {'lr': 6.800000000000001e-05, 'samples': 131040, 'steps': 255, 'loss/train': 5.457118988037109} -09/20/2021 15:22:28 - INFO - __main__ - Step 4096: {'lr': 6.800000000000001e-05, 'samples': 131072, 'steps': 255, 'loss/train': 5.718449115753174} -09/20/2021 15:22:29 - INFO - __main__ - Step 4097: {'lr': 6.826666666666667e-05, 'samples': 131104, 'steps': 256, 'loss/train': 5.391017913818359} -09/20/2021 15:22:30 - INFO - __main__ - Step 4098: {'lr': 6.826666666666667e-05, 'samples': 131136, 'steps': 256, 'loss/train': 5.014470100402832} -09/20/2021 15:22:30 - INFO - __main__ - Step 4099: {'lr': 6.826666666666667e-05, 'samples': 131168, 'steps': 256, 'loss/train': 6.627771854400635} -09/20/2021 15:22:31 - INFO - __main__ - Step 4100: {'lr': 6.826666666666667e-05, 'samples': 131200, 'steps': 256, 'loss/train': 5.09644889831543} -09/20/2021 15:22:32 - INFO - __main__ - Step 4101: {'lr': 6.826666666666667e-05, 'samples': 131232, 'steps': 256, 'loss/train': 5.357210636138916} -09/20/2021 15:22:33 - INFO - __main__ - Step 4102: {'lr': 6.826666666666667e-05, 'samples': 131264, 'steps': 256, 'loss/train': 4.9082136154174805} -09/20/2021 15:22:33 - INFO - __main__ - Step 4103: {'lr': 6.826666666666667e-05, 'samples': 131296, 'steps': 256, 'loss/train': 5.505955696105957} -09/20/2021 15:22:34 - INFO - __main__ - Step 4104: {'lr': 6.826666666666667e-05, 'samples': 131328, 'steps': 256, 'loss/train': 5.367413520812988} -09/20/2021 15:22:35 - INFO - __main__ - Step 4105: {'lr': 6.826666666666667e-05, 'samples': 131360, 'steps': 256, 'loss/train': 5.514647483825684} -09/20/2021 15:22:36 - INFO - __main__ - Step 4106: {'lr': 6.826666666666667e-05, 'samples': 131392, 'steps': 256, 'loss/train': 5.69857120513916} -09/20/2021 15:22:36 - INFO - __main__ - Step 4107: {'lr': 6.826666666666667e-05, 'samples': 131424, 'steps': 256, 'loss/train': 5.02207612991333} -09/20/2021 15:22:37 - INFO - __main__ - Step 4108: {'lr': 6.826666666666667e-05, 'samples': 131456, 'steps': 256, 'loss/train': 6.219720363616943} -09/20/2021 15:22:38 - INFO - __main__ - Step 4109: {'lr': 6.826666666666667e-05, 'samples': 131488, 'steps': 256, 'loss/train': 4.627923488616943} -09/20/2021 15:22:39 - INFO - __main__ - Step 4110: {'lr': 6.826666666666667e-05, 'samples': 131520, 'steps': 256, 'loss/train': 5.437260150909424} -09/20/2021 15:22:39 - INFO - __main__ - Step 4111: {'lr': 6.826666666666667e-05, 'samples': 131552, 'steps': 256, 'loss/train': 5.339524745941162} -09/20/2021 15:22:40 - INFO - __main__ - Step 4112: {'lr': 6.826666666666667e-05, 'samples': 131584, 'steps': 256, 'loss/train': 5.747112274169922} -09/20/2021 15:22:41 - INFO - __main__ - Step 4113: {'lr': 6.853333333333334e-05, 'samples': 131616, 'steps': 257, 'loss/train': 4.8740339279174805} -09/20/2021 15:22:42 - INFO - __main__ - Step 4114: {'lr': 6.853333333333334e-05, 'samples': 131648, 'steps': 257, 'loss/train': 5.478601455688477} -09/20/2021 15:22:42 - INFO - __main__ - Step 4115: {'lr': 6.853333333333334e-05, 'samples': 131680, 'steps': 257, 'loss/train': 7.246883392333984} -09/20/2021 15:22:43 - INFO - __main__ - Step 4116: {'lr': 6.853333333333334e-05, 'samples': 131712, 'steps': 257, 'loss/train': 6.985013008117676} -09/20/2021 15:22:44 - INFO - __main__ - Step 4117: {'lr': 6.853333333333334e-05, 'samples': 131744, 'steps': 257, 'loss/train': 6.964136600494385} -09/20/2021 15:22:45 - INFO - __main__ - Step 4118: {'lr': 6.853333333333334e-05, 'samples': 131776, 'steps': 257, 'loss/train': 6.842834949493408} -09/20/2021 15:22:45 - INFO - __main__ - Step 4119: {'lr': 6.853333333333334e-05, 'samples': 131808, 'steps': 257, 'loss/train': 6.491487979888916} -09/20/2021 15:22:46 - INFO - __main__ - Step 4120: {'lr': 6.853333333333334e-05, 'samples': 131840, 'steps': 257, 'loss/train': 6.653123378753662} -09/20/2021 15:22:47 - INFO - __main__ - Step 4121: {'lr': 6.853333333333334e-05, 'samples': 131872, 'steps': 257, 'loss/train': 6.697238445281982} -09/20/2021 15:22:48 - INFO - __main__ - Step 4122: {'lr': 6.853333333333334e-05, 'samples': 131904, 'steps': 257, 'loss/train': 5.717917442321777} -09/20/2021 15:22:48 - INFO - __main__ - Step 4123: {'lr': 6.853333333333334e-05, 'samples': 131936, 'steps': 257, 'loss/train': 5.945523738861084} -09/20/2021 15:22:49 - INFO - __main__ - Step 4124: {'lr': 6.853333333333334e-05, 'samples': 131968, 'steps': 257, 'loss/train': 5.312764644622803} -09/20/2021 15:22:50 - INFO - __main__ - Step 4125: {'lr': 6.853333333333334e-05, 'samples': 132000, 'steps': 257, 'loss/train': 5.9600749015808105} -09/20/2021 15:22:51 - INFO - __main__ - Step 4126: {'lr': 6.853333333333334e-05, 'samples': 132032, 'steps': 257, 'loss/train': 4.904303550720215} -09/20/2021 15:22:51 - INFO - __main__ - Step 4127: {'lr': 6.853333333333334e-05, 'samples': 132064, 'steps': 257, 'loss/train': 5.77440071105957} -09/20/2021 15:22:52 - INFO - __main__ - Step 4128: {'lr': 6.853333333333334e-05, 'samples': 132096, 'steps': 257, 'loss/train': 5.203930854797363} -09/20/2021 15:22:54 - INFO - __main__ - Step 4129: {'lr': 6.879999999999999e-05, 'samples': 132128, 'steps': 258, 'loss/train': 5.131797790527344} -09/20/2021 15:22:54 - INFO - __main__ - Step 4130: {'lr': 6.879999999999999e-05, 'samples': 132160, 'steps': 258, 'loss/train': 5.465910911560059} -09/20/2021 15:22:55 - INFO - __main__ - Step 4131: {'lr': 6.879999999999999e-05, 'samples': 132192, 'steps': 258, 'loss/train': 5.5232977867126465} -09/20/2021 15:22:56 - INFO - __main__ - Step 4132: {'lr': 6.879999999999999e-05, 'samples': 132224, 'steps': 258, 'loss/train': 5.546286106109619} -09/20/2021 15:22:57 - INFO - __main__ - Step 4133: {'lr': 6.879999999999999e-05, 'samples': 132256, 'steps': 258, 'loss/train': 5.621540546417236} -09/20/2021 15:22:57 - INFO - __main__ - Step 4134: {'lr': 6.879999999999999e-05, 'samples': 132288, 'steps': 258, 'loss/train': 5.363887310028076} -09/20/2021 15:22:58 - INFO - __main__ - Step 4135: {'lr': 6.879999999999999e-05, 'samples': 132320, 'steps': 258, 'loss/train': 5.456352710723877} -09/20/2021 15:22:59 - INFO - __main__ - Step 4136: {'lr': 6.879999999999999e-05, 'samples': 132352, 'steps': 258, 'loss/train': 5.08817720413208} -09/20/2021 15:23:00 - INFO - __main__ - Step 4137: {'lr': 6.879999999999999e-05, 'samples': 132384, 'steps': 258, 'loss/train': 6.151931285858154} -09/20/2021 15:23:00 - INFO - __main__ - Step 4138: {'lr': 6.879999999999999e-05, 'samples': 132416, 'steps': 258, 'loss/train': 5.248673915863037} -09/20/2021 15:23:01 - INFO - __main__ - Step 4139: {'lr': 6.879999999999999e-05, 'samples': 132448, 'steps': 258, 'loss/train': 5.021778106689453} -09/20/2021 15:23:02 - INFO - __main__ - Step 4140: {'lr': 6.879999999999999e-05, 'samples': 132480, 'steps': 258, 'loss/train': 6.002615928649902} -09/20/2021 15:23:03 - INFO - __main__ - Step 4141: {'lr': 6.879999999999999e-05, 'samples': 132512, 'steps': 258, 'loss/train': 5.298261642456055} -09/20/2021 15:23:03 - INFO - __main__ - Step 4142: {'lr': 6.879999999999999e-05, 'samples': 132544, 'steps': 258, 'loss/train': 5.604989528656006} -09/20/2021 15:23:04 - INFO - __main__ - Step 4143: {'lr': 6.879999999999999e-05, 'samples': 132576, 'steps': 258, 'loss/train': 6.057802200317383} -09/20/2021 15:23:05 - INFO - __main__ - Step 4144: {'lr': 6.879999999999999e-05, 'samples': 132608, 'steps': 258, 'loss/train': 5.983456134796143} -09/20/2021 15:23:06 - INFO - __main__ - Step 4145: {'lr': 6.906666666666667e-05, 'samples': 132640, 'steps': 259, 'loss/train': 5.987879753112793} -09/20/2021 15:23:07 - INFO - __main__ - Step 4146: {'lr': 6.906666666666667e-05, 'samples': 132672, 'steps': 259, 'loss/train': 5.705751895904541} -09/20/2021 15:23:07 - INFO - __main__ - Step 4147: {'lr': 6.906666666666667e-05, 'samples': 132704, 'steps': 259, 'loss/train': 6.152171611785889} -09/20/2021 15:23:08 - INFO - __main__ - Step 4148: {'lr': 6.906666666666667e-05, 'samples': 132736, 'steps': 259, 'loss/train': 4.678244113922119} -09/20/2021 15:23:09 - INFO - __main__ - Step 4149: {'lr': 6.906666666666667e-05, 'samples': 132768, 'steps': 259, 'loss/train': 6.235036849975586} -09/20/2021 15:23:10 - INFO - __main__ - Step 4150: {'lr': 6.906666666666667e-05, 'samples': 132800, 'steps': 259, 'loss/train': 5.395657539367676} -09/20/2021 15:23:10 - INFO - __main__ - Step 4151: {'lr': 6.906666666666667e-05, 'samples': 132832, 'steps': 259, 'loss/train': 5.282878875732422} -09/20/2021 15:23:11 - INFO - __main__ - Step 4152: {'lr': 6.906666666666667e-05, 'samples': 132864, 'steps': 259, 'loss/train': 6.0751776695251465} -09/20/2021 15:23:12 - INFO - __main__ - Step 4153: {'lr': 6.906666666666667e-05, 'samples': 132896, 'steps': 259, 'loss/train': 5.646658897399902} -09/20/2021 15:23:13 - INFO - __main__ - Step 4154: {'lr': 6.906666666666667e-05, 'samples': 132928, 'steps': 259, 'loss/train': 6.600839614868164} -09/20/2021 15:23:13 - INFO - __main__ - Step 4155: {'lr': 6.906666666666667e-05, 'samples': 132960, 'steps': 259, 'loss/train': 5.51961088180542} -09/20/2021 15:23:14 - INFO - __main__ - Step 4156: {'lr': 6.906666666666667e-05, 'samples': 132992, 'steps': 259, 'loss/train': 5.588998317718506} -09/20/2021 15:23:15 - INFO - __main__ - Step 4157: {'lr': 6.906666666666667e-05, 'samples': 133024, 'steps': 259, 'loss/train': 6.036911964416504} -09/20/2021 15:23:16 - INFO - __main__ - Step 4158: {'lr': 6.906666666666667e-05, 'samples': 133056, 'steps': 259, 'loss/train': 4.791509628295898} -09/20/2021 15:23:17 - INFO - __main__ - Step 4159: {'lr': 6.906666666666667e-05, 'samples': 133088, 'steps': 259, 'loss/train': 5.681788444519043} -09/20/2021 15:23:18 - INFO - __main__ - Step 4160: {'lr': 6.906666666666667e-05, 'samples': 133120, 'steps': 259, 'loss/train': 6.037106990814209} -09/20/2021 15:23:19 - INFO - __main__ - Step 4161: {'lr': 6.933333333333334e-05, 'samples': 133152, 'steps': 260, 'loss/train': 5.508028507232666} -09/20/2021 15:23:19 - INFO - __main__ - Step 4162: {'lr': 6.933333333333334e-05, 'samples': 133184, 'steps': 260, 'loss/train': 5.3469977378845215} -09/20/2021 15:23:20 - INFO - __main__ - Step 4163: {'lr': 6.933333333333334e-05, 'samples': 133216, 'steps': 260, 'loss/train': 3.5061402320861816} -09/20/2021 15:23:21 - INFO - __main__ - Step 4164: {'lr': 6.933333333333334e-05, 'samples': 133248, 'steps': 260, 'loss/train': 5.454527378082275} -09/20/2021 15:23:22 - INFO - __main__ - Step 4165: {'lr': 6.933333333333334e-05, 'samples': 133280, 'steps': 260, 'loss/train': 5.500779628753662} -09/20/2021 15:23:22 - INFO - __main__ - Step 4166: {'lr': 6.933333333333334e-05, 'samples': 133312, 'steps': 260, 'loss/train': 6.532834529876709} -09/20/2021 15:23:23 - INFO - __main__ - Step 4167: {'lr': 6.933333333333334e-05, 'samples': 133344, 'steps': 260, 'loss/train': 5.795638084411621} -09/20/2021 15:23:24 - INFO - __main__ - Step 4168: {'lr': 6.933333333333334e-05, 'samples': 133376, 'steps': 260, 'loss/train': 7.434771537780762} -09/20/2021 15:23:25 - INFO - __main__ - Step 4169: {'lr': 6.933333333333334e-05, 'samples': 133408, 'steps': 260, 'loss/train': 6.789015769958496} -09/20/2021 15:23:25 - INFO - __main__ - Step 4170: {'lr': 6.933333333333334e-05, 'samples': 133440, 'steps': 260, 'loss/train': 5.115960121154785} -09/20/2021 15:23:26 - INFO - __main__ - Step 4171: {'lr': 6.933333333333334e-05, 'samples': 133472, 'steps': 260, 'loss/train': 4.848780632019043} -09/20/2021 15:23:27 - INFO - __main__ - Step 4172: {'lr': 6.933333333333334e-05, 'samples': 133504, 'steps': 260, 'loss/train': 6.249265670776367} -09/20/2021 15:23:28 - INFO - __main__ - Step 4173: {'lr': 6.933333333333334e-05, 'samples': 133536, 'steps': 260, 'loss/train': 5.474110126495361} -09/20/2021 15:23:28 - INFO - __main__ - Step 4174: {'lr': 6.933333333333334e-05, 'samples': 133568, 'steps': 260, 'loss/train': 6.401390075683594} -09/20/2021 15:23:29 - INFO - __main__ - Step 4175: {'lr': 6.933333333333334e-05, 'samples': 133600, 'steps': 260, 'loss/train': 4.926366806030273} -09/20/2021 15:23:30 - INFO - __main__ - Step 4176: {'lr': 6.933333333333334e-05, 'samples': 133632, 'steps': 260, 'loss/train': 5.6097893714904785} -09/20/2021 15:23:31 - INFO - __main__ - Step 4177: {'lr': 6.96e-05, 'samples': 133664, 'steps': 261, 'loss/train': 4.731888294219971} -09/20/2021 15:23:31 - INFO - __main__ - Step 4178: {'lr': 6.96e-05, 'samples': 133696, 'steps': 261, 'loss/train': 7.738072872161865} -09/20/2021 15:23:32 - INFO - __main__ - Step 4179: {'lr': 6.96e-05, 'samples': 133728, 'steps': 261, 'loss/train': 5.439280033111572} -09/20/2021 15:23:33 - INFO - __main__ - Step 4180: {'lr': 6.96e-05, 'samples': 133760, 'steps': 261, 'loss/train': 6.012444496154785} -09/20/2021 15:23:34 - INFO - __main__ - Step 4181: {'lr': 6.96e-05, 'samples': 133792, 'steps': 261, 'loss/train': 5.3555097579956055} -09/20/2021 15:23:34 - INFO - __main__ - Step 4182: {'lr': 6.96e-05, 'samples': 133824, 'steps': 261, 'loss/train': 5.797379970550537} -09/20/2021 15:23:35 - INFO - __main__ - Step 4183: {'lr': 6.96e-05, 'samples': 133856, 'steps': 261, 'loss/train': 5.114512920379639} -09/20/2021 15:23:36 - INFO - __main__ - Step 4184: {'lr': 6.96e-05, 'samples': 133888, 'steps': 261, 'loss/train': 6.187909126281738} -09/20/2021 15:23:37 - INFO - __main__ - Step 4185: {'lr': 6.96e-05, 'samples': 133920, 'steps': 261, 'loss/train': 6.2139573097229} -09/20/2021 15:23:37 - INFO - __main__ - Step 4186: {'lr': 6.96e-05, 'samples': 133952, 'steps': 261, 'loss/train': 5.785510540008545} -09/20/2021 15:23:38 - INFO - __main__ - Step 4187: {'lr': 6.96e-05, 'samples': 133984, 'steps': 261, 'loss/train': 6.226385116577148} -09/20/2021 15:23:39 - INFO - __main__ - Step 4188: {'lr': 6.96e-05, 'samples': 134016, 'steps': 261, 'loss/train': 6.105184078216553} -09/20/2021 15:23:40 - INFO - __main__ - Step 4189: {'lr': 6.96e-05, 'samples': 134048, 'steps': 261, 'loss/train': 5.38762092590332} -09/20/2021 15:23:40 - INFO - __main__ - Step 4190: {'lr': 6.96e-05, 'samples': 134080, 'steps': 261, 'loss/train': 5.981031894683838} -09/20/2021 15:23:42 - INFO - __main__ - Step 4191: {'lr': 6.96e-05, 'samples': 134112, 'steps': 261, 'loss/train': 4.759799957275391} -09/20/2021 15:23:43 - INFO - __main__ - Step 4192: {'lr': 6.96e-05, 'samples': 134144, 'steps': 261, 'loss/train': 5.518543243408203} -09/20/2021 15:23:43 - INFO - __main__ - Step 4193: {'lr': 6.986666666666667e-05, 'samples': 134176, 'steps': 262, 'loss/train': 5.994354724884033} -09/20/2021 15:23:44 - INFO - __main__ - Step 4194: {'lr': 6.986666666666667e-05, 'samples': 134208, 'steps': 262, 'loss/train': 5.021031856536865} -09/20/2021 15:23:45 - INFO - __main__ - Step 4195: {'lr': 6.986666666666667e-05, 'samples': 134240, 'steps': 262, 'loss/train': 5.653661251068115} -09/20/2021 15:23:46 - INFO - __main__ - Step 4196: {'lr': 6.986666666666667e-05, 'samples': 134272, 'steps': 262, 'loss/train': 5.246338367462158} -09/20/2021 15:23:46 - INFO - __main__ - Step 4197: {'lr': 6.986666666666667e-05, 'samples': 134304, 'steps': 262, 'loss/train': 5.279577732086182} -09/20/2021 15:23:47 - INFO - __main__ - Step 4198: {'lr': 6.986666666666667e-05, 'samples': 134336, 'steps': 262, 'loss/train': 4.715202808380127} -09/20/2021 15:23:48 - INFO - __main__ - Step 4199: {'lr': 6.986666666666667e-05, 'samples': 134368, 'steps': 262, 'loss/train': 5.1149091720581055} -09/20/2021 15:23:49 - INFO - __main__ - Step 4200: {'lr': 6.986666666666667e-05, 'samples': 134400, 'steps': 262, 'loss/train': 5.78434944152832} -09/20/2021 15:23:49 - INFO - __main__ - Step 4201: {'lr': 6.986666666666667e-05, 'samples': 134432, 'steps': 262, 'loss/train': 4.953207015991211} -09/20/2021 15:23:50 - INFO - __main__ - Step 4202: {'lr': 6.986666666666667e-05, 'samples': 134464, 'steps': 262, 'loss/train': 5.089198112487793} -09/20/2021 15:23:51 - INFO - __main__ - Step 4203: {'lr': 6.986666666666667e-05, 'samples': 134496, 'steps': 262, 'loss/train': 6.4155964851379395} -09/20/2021 15:23:52 - INFO - __main__ - Step 4204: {'lr': 6.986666666666667e-05, 'samples': 134528, 'steps': 262, 'loss/train': 5.450276851654053} -09/20/2021 15:23:52 - INFO - __main__ - Step 4205: {'lr': 6.986666666666667e-05, 'samples': 134560, 'steps': 262, 'loss/train': 5.848806381225586} -09/20/2021 15:23:53 - INFO - __main__ - Step 4206: {'lr': 6.986666666666667e-05, 'samples': 134592, 'steps': 262, 'loss/train': 5.342129707336426} -09/20/2021 15:23:54 - INFO - __main__ - Step 4207: {'lr': 6.986666666666667e-05, 'samples': 134624, 'steps': 262, 'loss/train': 4.943987846374512} -09/20/2021 15:23:55 - INFO - __main__ - Step 4208: {'lr': 6.986666666666667e-05, 'samples': 134656, 'steps': 262, 'loss/train': 6.13270378112793} -09/20/2021 15:23:56 - INFO - __main__ - Step 4209: {'lr': 7.013333333333333e-05, 'samples': 134688, 'steps': 263, 'loss/train': 6.6532511711120605} -09/20/2021 15:23:56 - INFO - __main__ - Step 4210: {'lr': 7.013333333333333e-05, 'samples': 134720, 'steps': 263, 'loss/train': 4.814615249633789} -09/20/2021 15:23:57 - INFO - __main__ - Step 4211: {'lr': 7.013333333333333e-05, 'samples': 134752, 'steps': 263, 'loss/train': 6.262118816375732} -09/20/2021 15:23:58 - INFO - __main__ - Step 4212: {'lr': 7.013333333333333e-05, 'samples': 134784, 'steps': 263, 'loss/train': 5.991631984710693} -09/20/2021 15:23:59 - INFO - __main__ - Step 4213: {'lr': 7.013333333333333e-05, 'samples': 134816, 'steps': 263, 'loss/train': 5.462632656097412} -09/20/2021 15:23:59 - INFO - __main__ - Step 4214: {'lr': 7.013333333333333e-05, 'samples': 134848, 'steps': 263, 'loss/train': 5.521574974060059} -09/20/2021 15:24:00 - INFO - __main__ - Step 4215: {'lr': 7.013333333333333e-05, 'samples': 134880, 'steps': 263, 'loss/train': 5.842101573944092} -09/20/2021 15:24:01 - INFO - __main__ - Step 4216: {'lr': 7.013333333333333e-05, 'samples': 134912, 'steps': 263, 'loss/train': 5.541849613189697} -09/20/2021 15:24:02 - INFO - __main__ - Step 4217: {'lr': 7.013333333333333e-05, 'samples': 134944, 'steps': 263, 'loss/train': 6.52003812789917} -09/20/2021 15:24:02 - INFO - __main__ - Step 4218: {'lr': 7.013333333333333e-05, 'samples': 134976, 'steps': 263, 'loss/train': 6.130032062530518} -09/20/2021 15:24:03 - INFO - __main__ - Step 4219: {'lr': 7.013333333333333e-05, 'samples': 135008, 'steps': 263, 'loss/train': 5.688045024871826} -09/20/2021 15:24:04 - INFO - __main__ - Step 4220: {'lr': 7.013333333333333e-05, 'samples': 135040, 'steps': 263, 'loss/train': 6.195140361785889} -09/20/2021 15:24:06 - INFO - __main__ - Step 4221: {'lr': 7.013333333333333e-05, 'samples': 135072, 'steps': 263, 'loss/train': 5.604165554046631} -09/20/2021 15:24:06 - INFO - __main__ - Step 4222: {'lr': 7.013333333333333e-05, 'samples': 135104, 'steps': 263, 'loss/train': 5.127861499786377} -09/20/2021 15:24:07 - INFO - __main__ - Step 4223: {'lr': 7.013333333333333e-05, 'samples': 135136, 'steps': 263, 'loss/train': 5.559274673461914} -09/20/2021 15:24:08 - INFO - __main__ - Step 4224: {'lr': 7.013333333333333e-05, 'samples': 135168, 'steps': 263, 'loss/train': 5.426085472106934} -09/20/2021 15:24:09 - INFO - __main__ - Step 4225: {'lr': 7.04e-05, 'samples': 135200, 'steps': 264, 'loss/train': 5.340009689331055} -09/20/2021 15:24:10 - INFO - __main__ - Step 4226: {'lr': 7.04e-05, 'samples': 135232, 'steps': 264, 'loss/train': 6.191738605499268} -09/20/2021 15:24:10 - INFO - __main__ - Step 4227: {'lr': 7.04e-05, 'samples': 135264, 'steps': 264, 'loss/train': 4.358558177947998} -09/20/2021 15:24:11 - INFO - __main__ - Step 4228: {'lr': 7.04e-05, 'samples': 135296, 'steps': 264, 'loss/train': 3.8846676349639893} -09/20/2021 15:24:12 - INFO - __main__ - Step 4229: {'lr': 7.04e-05, 'samples': 135328, 'steps': 264, 'loss/train': 3.5488617420196533} -09/20/2021 15:24:13 - INFO - __main__ - Step 4230: {'lr': 7.04e-05, 'samples': 135360, 'steps': 264, 'loss/train': 6.333919525146484} -09/20/2021 15:24:13 - INFO - __main__ - Step 4231: {'lr': 7.04e-05, 'samples': 135392, 'steps': 264, 'loss/train': 5.574543476104736} -09/20/2021 15:24:14 - INFO - __main__ - Step 4232: {'lr': 7.04e-05, 'samples': 135424, 'steps': 264, 'loss/train': 4.784530162811279} -09/20/2021 15:24:15 - INFO - __main__ - Step 4233: {'lr': 7.04e-05, 'samples': 135456, 'steps': 264, 'loss/train': 5.670361042022705} -09/20/2021 15:24:16 - INFO - __main__ - Step 4234: {'lr': 7.04e-05, 'samples': 135488, 'steps': 264, 'loss/train': 5.23295259475708} -09/20/2021 15:24:16 - INFO - __main__ - Step 4235: {'lr': 7.04e-05, 'samples': 135520, 'steps': 264, 'loss/train': 5.358185768127441} -09/20/2021 15:24:17 - INFO - __main__ - Step 4236: {'lr': 7.04e-05, 'samples': 135552, 'steps': 264, 'loss/train': 5.6967244148254395} -09/20/2021 15:24:18 - INFO - __main__ - Step 4237: {'lr': 7.04e-05, 'samples': 135584, 'steps': 264, 'loss/train': 5.783092498779297} -09/20/2021 15:24:19 - INFO - __main__ - Step 4238: {'lr': 7.04e-05, 'samples': 135616, 'steps': 264, 'loss/train': 5.291306495666504} -09/20/2021 15:24:19 - INFO - __main__ - Step 4239: {'lr': 7.04e-05, 'samples': 135648, 'steps': 264, 'loss/train': 5.515512466430664} -09/20/2021 15:24:20 - INFO - __main__ - Step 4240: {'lr': 7.04e-05, 'samples': 135680, 'steps': 264, 'loss/train': 5.26078462600708} -09/20/2021 15:24:21 - INFO - __main__ - Step 4241: {'lr': 7.066666666666667e-05, 'samples': 135712, 'steps': 265, 'loss/train': 6.456225872039795} -09/20/2021 15:24:22 - INFO - __main__ - Step 4242: {'lr': 7.066666666666667e-05, 'samples': 135744, 'steps': 265, 'loss/train': 5.305810451507568} -09/20/2021 15:24:22 - INFO - __main__ - Step 4243: {'lr': 7.066666666666667e-05, 'samples': 135776, 'steps': 265, 'loss/train': 5.179373264312744} -09/20/2021 15:24:23 - INFO - __main__ - Step 4244: {'lr': 7.066666666666667e-05, 'samples': 135808, 'steps': 265, 'loss/train': 4.591829299926758} -09/20/2021 15:24:24 - INFO - __main__ - Step 4245: {'lr': 7.066666666666667e-05, 'samples': 135840, 'steps': 265, 'loss/train': 5.3407721519470215} -09/20/2021 15:24:25 - INFO - __main__ - Step 4246: {'lr': 7.066666666666667e-05, 'samples': 135872, 'steps': 265, 'loss/train': 4.6069111824035645} -09/20/2021 15:24:25 - INFO - __main__ - Step 4247: {'lr': 7.066666666666667e-05, 'samples': 135904, 'steps': 265, 'loss/train': 5.60190486907959} -09/20/2021 15:24:26 - INFO - __main__ - Step 4248: {'lr': 7.066666666666667e-05, 'samples': 135936, 'steps': 265, 'loss/train': 5.460510730743408} -09/20/2021 15:24:27 - INFO - __main__ - Step 4249: {'lr': 7.066666666666667e-05, 'samples': 135968, 'steps': 265, 'loss/train': 5.194378852844238} -09/20/2021 15:24:28 - INFO - __main__ - Step 4250: {'lr': 7.066666666666667e-05, 'samples': 136000, 'steps': 265, 'loss/train': 5.612444877624512} -09/20/2021 15:24:28 - INFO - __main__ - Step 4251: {'lr': 7.066666666666667e-05, 'samples': 136032, 'steps': 265, 'loss/train': 5.849413871765137} -09/20/2021 15:24:30 - INFO - __main__ - Step 4252: {'lr': 7.066666666666667e-05, 'samples': 136064, 'steps': 265, 'loss/train': 5.2577900886535645} -09/20/2021 15:24:31 - INFO - __main__ - Step 4253: {'lr': 7.066666666666667e-05, 'samples': 136096, 'steps': 265, 'loss/train': 4.788538455963135} -09/20/2021 15:24:31 - INFO - __main__ - Step 4254: {'lr': 7.066666666666667e-05, 'samples': 136128, 'steps': 265, 'loss/train': 5.343808650970459} -09/20/2021 15:24:32 - INFO - __main__ - Step 4255: {'lr': 7.066666666666667e-05, 'samples': 136160, 'steps': 265, 'loss/train': 6.303623676300049} -09/20/2021 15:24:33 - INFO - __main__ - Step 4256: {'lr': 7.066666666666667e-05, 'samples': 136192, 'steps': 265, 'loss/train': 6.433369159698486} -09/20/2021 15:24:34 - INFO - __main__ - Step 4257: {'lr': 7.093333333333334e-05, 'samples': 136224, 'steps': 266, 'loss/train': 5.737975120544434} -09/20/2021 15:24:34 - INFO - __main__ - Step 4258: {'lr': 7.093333333333334e-05, 'samples': 136256, 'steps': 266, 'loss/train': 6.0682291984558105} -09/20/2021 15:24:35 - INFO - __main__ - Step 4259: {'lr': 7.093333333333334e-05, 'samples': 136288, 'steps': 266, 'loss/train': 5.8183794021606445} -09/20/2021 15:24:36 - INFO - __main__ - Step 4260: {'lr': 7.093333333333334e-05, 'samples': 136320, 'steps': 266, 'loss/train': 4.584500789642334} -09/20/2021 15:24:37 - INFO - __main__ - Step 4261: {'lr': 7.093333333333334e-05, 'samples': 136352, 'steps': 266, 'loss/train': 5.817342281341553} -09/20/2021 15:24:37 - INFO - __main__ - Step 4262: {'lr': 7.093333333333334e-05, 'samples': 136384, 'steps': 266, 'loss/train': 4.6508588790893555} -09/20/2021 15:24:38 - INFO - __main__ - Step 4263: {'lr': 7.093333333333334e-05, 'samples': 136416, 'steps': 266, 'loss/train': 6.416836738586426} -09/20/2021 15:24:39 - INFO - __main__ - Step 4264: {'lr': 7.093333333333334e-05, 'samples': 136448, 'steps': 266, 'loss/train': 5.836806297302246} -09/20/2021 15:24:40 - INFO - __main__ - Step 4265: {'lr': 7.093333333333334e-05, 'samples': 136480, 'steps': 266, 'loss/train': 5.667080402374268} -09/20/2021 15:24:40 - INFO - __main__ - Step 4266: {'lr': 7.093333333333334e-05, 'samples': 136512, 'steps': 266, 'loss/train': 5.683448791503906} -09/20/2021 15:24:41 - INFO - __main__ - Step 4267: {'lr': 7.093333333333334e-05, 'samples': 136544, 'steps': 266, 'loss/train': 5.561091899871826} -09/20/2021 15:24:42 - INFO - __main__ - Step 4268: {'lr': 7.093333333333334e-05, 'samples': 136576, 'steps': 266, 'loss/train': 5.653260707855225} -09/20/2021 15:24:43 - INFO - __main__ - Step 4269: {'lr': 7.093333333333334e-05, 'samples': 136608, 'steps': 266, 'loss/train': 5.439690113067627} -09/20/2021 15:24:43 - INFO - __main__ - Step 4270: {'lr': 7.093333333333334e-05, 'samples': 136640, 'steps': 266, 'loss/train': 4.507430553436279} -09/20/2021 15:24:44 - INFO - __main__ - Step 4271: {'lr': 7.093333333333334e-05, 'samples': 136672, 'steps': 266, 'loss/train': 2.9228830337524414} -09/20/2021 15:24:45 - INFO - __main__ - Step 4272: {'lr': 7.093333333333334e-05, 'samples': 136704, 'steps': 266, 'loss/train': 7.248995780944824} -09/20/2021 15:24:46 - INFO - __main__ - Step 4273: {'lr': 7.12e-05, 'samples': 136736, 'steps': 267, 'loss/train': 5.676933288574219} -09/20/2021 15:24:47 - INFO - __main__ - Step 4274: {'lr': 7.12e-05, 'samples': 136768, 'steps': 267, 'loss/train': 5.664374828338623} -09/20/2021 15:24:47 - INFO - __main__ - Step 4275: {'lr': 7.12e-05, 'samples': 136800, 'steps': 267, 'loss/train': 5.0975542068481445} -09/20/2021 15:24:48 - INFO - __main__ - Step 4276: {'lr': 7.12e-05, 'samples': 136832, 'steps': 267, 'loss/train': 6.4589409828186035} -09/20/2021 15:24:49 - INFO - __main__ - Step 4277: {'lr': 7.12e-05, 'samples': 136864, 'steps': 267, 'loss/train': 5.608900547027588} -09/20/2021 15:24:50 - INFO - __main__ - Step 4278: {'lr': 7.12e-05, 'samples': 136896, 'steps': 267, 'loss/train': 6.023500442504883} -09/20/2021 15:24:50 - INFO - __main__ - Step 4279: {'lr': 7.12e-05, 'samples': 136928, 'steps': 267, 'loss/train': 5.106395721435547} -09/20/2021 15:24:51 - INFO - __main__ - Step 4280: {'lr': 7.12e-05, 'samples': 136960, 'steps': 267, 'loss/train': 5.132558822631836} -09/20/2021 15:24:52 - INFO - __main__ - Step 4281: {'lr': 7.12e-05, 'samples': 136992, 'steps': 267, 'loss/train': 5.438318252563477} -09/20/2021 15:24:53 - INFO - __main__ - Step 4282: {'lr': 7.12e-05, 'samples': 137024, 'steps': 267, 'loss/train': 4.172806739807129} -09/20/2021 15:24:53 - INFO - __main__ - Step 4283: {'lr': 7.12e-05, 'samples': 137056, 'steps': 267, 'loss/train': 3.6428616046905518} -09/20/2021 15:24:55 - INFO - __main__ - Step 4284: {'lr': 7.12e-05, 'samples': 137088, 'steps': 267, 'loss/train': 3.3894455432891846} -09/20/2021 15:24:55 - INFO - __main__ - Step 4285: {'lr': 7.12e-05, 'samples': 137120, 'steps': 267, 'loss/train': 5.329221248626709} -09/20/2021 15:24:56 - INFO - __main__ - Step 4286: {'lr': 7.12e-05, 'samples': 137152, 'steps': 267, 'loss/train': 6.089878559112549} -09/20/2021 15:24:57 - INFO - __main__ - Step 4287: {'lr': 7.12e-05, 'samples': 137184, 'steps': 267, 'loss/train': 5.001715660095215} -09/20/2021 15:24:58 - INFO - __main__ - Step 4288: {'lr': 7.12e-05, 'samples': 137216, 'steps': 267, 'loss/train': 6.468151092529297} -09/20/2021 15:24:59 - INFO - __main__ - Step 4289: {'lr': 7.146666666666666e-05, 'samples': 137248, 'steps': 268, 'loss/train': 5.45476770401001} -09/20/2021 15:24:59 - INFO - __main__ - Step 4290: {'lr': 7.146666666666666e-05, 'samples': 137280, 'steps': 268, 'loss/train': 5.852313995361328} -09/20/2021 15:25:00 - INFO - __main__ - Step 4291: {'lr': 7.146666666666666e-05, 'samples': 137312, 'steps': 268, 'loss/train': 5.896988868713379} -09/20/2021 15:25:01 - INFO - __main__ - Step 4292: {'lr': 7.146666666666666e-05, 'samples': 137344, 'steps': 268, 'loss/train': 5.142933368682861} -09/20/2021 15:25:02 - INFO - __main__ - Step 4293: {'lr': 7.146666666666666e-05, 'samples': 137376, 'steps': 268, 'loss/train': 6.47316837310791} -09/20/2021 15:25:02 - INFO - __main__ - Step 4294: {'lr': 7.146666666666666e-05, 'samples': 137408, 'steps': 268, 'loss/train': 6.016228675842285} -09/20/2021 15:25:03 - INFO - __main__ - Step 4295: {'lr': 7.146666666666666e-05, 'samples': 137440, 'steps': 268, 'loss/train': 4.857963562011719} -09/20/2021 15:25:04 - INFO - __main__ - Step 4296: {'lr': 7.146666666666666e-05, 'samples': 137472, 'steps': 268, 'loss/train': 5.935636520385742} -09/20/2021 15:25:05 - INFO - __main__ - Step 4297: {'lr': 7.146666666666666e-05, 'samples': 137504, 'steps': 268, 'loss/train': 5.282544136047363} -09/20/2021 15:25:05 - INFO - __main__ - Step 4298: {'lr': 7.146666666666666e-05, 'samples': 137536, 'steps': 268, 'loss/train': 5.875457286834717} -09/20/2021 15:25:06 - INFO - __main__ - Step 4299: {'lr': 7.146666666666666e-05, 'samples': 137568, 'steps': 268, 'loss/train': 7.177484035491943} -09/20/2021 15:25:07 - INFO - __main__ - Step 4300: {'lr': 7.146666666666666e-05, 'samples': 137600, 'steps': 268, 'loss/train': 7.080787658691406} -09/20/2021 15:25:08 - INFO - __main__ - Step 4301: {'lr': 7.146666666666666e-05, 'samples': 137632, 'steps': 268, 'loss/train': 5.505031585693359} -09/20/2021 15:25:08 - INFO - __main__ - Step 4302: {'lr': 7.146666666666666e-05, 'samples': 137664, 'steps': 268, 'loss/train': 5.391508102416992} -09/20/2021 15:25:09 - INFO - __main__ - Step 4303: {'lr': 7.146666666666666e-05, 'samples': 137696, 'steps': 268, 'loss/train': 5.4578046798706055} -09/20/2021 15:25:10 - INFO - __main__ - Step 4304: {'lr': 7.146666666666666e-05, 'samples': 137728, 'steps': 268, 'loss/train': 6.104618072509766} -09/20/2021 15:25:11 - INFO - __main__ - Step 4305: {'lr': 7.173333333333335e-05, 'samples': 137760, 'steps': 269, 'loss/train': 5.4191508293151855} -09/20/2021 15:25:11 - INFO - __main__ - Step 4306: {'lr': 7.173333333333335e-05, 'samples': 137792, 'steps': 269, 'loss/train': 5.015893459320068} -09/20/2021 15:25:12 - INFO - __main__ - Step 4307: {'lr': 7.173333333333335e-05, 'samples': 137824, 'steps': 269, 'loss/train': 5.5131516456604} -09/20/2021 15:25:13 - INFO - __main__ - Step 4308: {'lr': 7.173333333333335e-05, 'samples': 137856, 'steps': 269, 'loss/train': 5.497686862945557} -09/20/2021 15:25:14 - INFO - __main__ - Step 4309: {'lr': 7.173333333333335e-05, 'samples': 137888, 'steps': 269, 'loss/train': 5.179861068725586} -09/20/2021 15:25:14 - INFO - __main__ - Step 4310: {'lr': 7.173333333333335e-05, 'samples': 137920, 'steps': 269, 'loss/train': 5.321877479553223} -09/20/2021 15:25:15 - INFO - __main__ - Step 4311: {'lr': 7.173333333333335e-05, 'samples': 137952, 'steps': 269, 'loss/train': 5.549623489379883} -09/20/2021 15:25:16 - INFO - __main__ - Step 4312: {'lr': 7.173333333333335e-05, 'samples': 137984, 'steps': 269, 'loss/train': 4.43431282043457} -09/20/2021 15:25:17 - INFO - __main__ - Step 4313: {'lr': 7.173333333333335e-05, 'samples': 138016, 'steps': 269, 'loss/train': 7.2113261222839355} -09/20/2021 15:25:18 - INFO - __main__ - Step 4314: {'lr': 7.173333333333335e-05, 'samples': 138048, 'steps': 269, 'loss/train': 5.777760982513428} -09/20/2021 15:25:19 - INFO - __main__ - Step 4315: {'lr': 7.173333333333335e-05, 'samples': 138080, 'steps': 269, 'loss/train': 5.900177478790283} -09/20/2021 15:25:19 - INFO - __main__ - Step 4316: {'lr': 7.173333333333335e-05, 'samples': 138112, 'steps': 269, 'loss/train': 5.426130294799805} -09/20/2021 15:25:20 - INFO - __main__ - Step 4317: {'lr': 7.173333333333335e-05, 'samples': 138144, 'steps': 269, 'loss/train': 5.714654922485352} -09/20/2021 15:25:21 - INFO - __main__ - Step 4318: {'lr': 7.173333333333335e-05, 'samples': 138176, 'steps': 269, 'loss/train': 5.3993000984191895} -09/20/2021 15:25:22 - INFO - __main__ - Step 4319: {'lr': 7.173333333333335e-05, 'samples': 138208, 'steps': 269, 'loss/train': 5.943475246429443} -09/20/2021 15:25:22 - INFO - __main__ - Step 4320: {'lr': 7.173333333333335e-05, 'samples': 138240, 'steps': 269, 'loss/train': 5.464844703674316} -09/20/2021 15:25:23 - INFO - __main__ - Step 4321: {'lr': 7.2e-05, 'samples': 138272, 'steps': 270, 'loss/train': 4.777159214019775} -09/20/2021 15:25:24 - INFO - __main__ - Step 4322: {'lr': 7.2e-05, 'samples': 138304, 'steps': 270, 'loss/train': 5.82138204574585} -09/20/2021 15:25:25 - INFO - __main__ - Step 4323: {'lr': 7.2e-05, 'samples': 138336, 'steps': 270, 'loss/train': 5.083676815032959} -09/20/2021 15:25:26 - INFO - __main__ - Step 4324: {'lr': 7.2e-05, 'samples': 138368, 'steps': 270, 'loss/train': 5.053329944610596} -09/20/2021 15:25:26 - INFO - __main__ - Step 4325: {'lr': 7.2e-05, 'samples': 138400, 'steps': 270, 'loss/train': 5.775004863739014} -09/20/2021 15:25:27 - INFO - __main__ - Step 4326: {'lr': 7.2e-05, 'samples': 138432, 'steps': 270, 'loss/train': 5.337765693664551} -09/20/2021 15:25:28 - INFO - __main__ - Step 4327: {'lr': 7.2e-05, 'samples': 138464, 'steps': 270, 'loss/train': 5.6400065422058105} -09/20/2021 15:25:29 - INFO - __main__ - Step 4328: {'lr': 7.2e-05, 'samples': 138496, 'steps': 270, 'loss/train': 5.342634201049805} -09/20/2021 15:25:29 - INFO - __main__ - Step 4329: {'lr': 7.2e-05, 'samples': 138528, 'steps': 270, 'loss/train': 5.781447410583496} -09/20/2021 15:25:30 - INFO - __main__ - Step 4330: {'lr': 7.2e-05, 'samples': 138560, 'steps': 270, 'loss/train': 6.090068817138672} -09/20/2021 15:25:31 - INFO - __main__ - Step 4331: {'lr': 7.2e-05, 'samples': 138592, 'steps': 270, 'loss/train': 5.4315185546875} -09/20/2021 15:25:32 - INFO - __main__ - Step 4332: {'lr': 7.2e-05, 'samples': 138624, 'steps': 270, 'loss/train': 6.51323938369751} -09/20/2021 15:25:32 - INFO - __main__ - Step 4333: {'lr': 7.2e-05, 'samples': 138656, 'steps': 270, 'loss/train': 6.132203578948975} -09/20/2021 15:25:33 - INFO - __main__ - Step 4334: {'lr': 7.2e-05, 'samples': 138688, 'steps': 270, 'loss/train': 5.8709397315979} -09/20/2021 15:25:34 - INFO - __main__ - Step 4335: {'lr': 7.2e-05, 'samples': 138720, 'steps': 270, 'loss/train': 5.86212158203125} -09/20/2021 15:25:35 - INFO - __main__ - Step 4336: {'lr': 7.2e-05, 'samples': 138752, 'steps': 270, 'loss/train': 5.500588417053223} -09/20/2021 15:25:35 - INFO - __main__ - Step 4337: {'lr': 7.226666666666667e-05, 'samples': 138784, 'steps': 271, 'loss/train': 5.399415493011475} -09/20/2021 15:25:36 - INFO - __main__ - Step 4338: {'lr': 7.226666666666667e-05, 'samples': 138816, 'steps': 271, 'loss/train': 5.796328067779541} -09/20/2021 15:25:37 - INFO - __main__ - Step 4339: {'lr': 7.226666666666667e-05, 'samples': 138848, 'steps': 271, 'loss/train': 2.847156047821045} -09/20/2021 15:25:38 - INFO - __main__ - Step 4340: {'lr': 7.226666666666667e-05, 'samples': 138880, 'steps': 271, 'loss/train': 5.659191131591797} -09/20/2021 15:25:38 - INFO - __main__ - Step 4341: {'lr': 7.226666666666667e-05, 'samples': 138912, 'steps': 271, 'loss/train': 4.6568684577941895} -09/20/2021 15:25:39 - INFO - __main__ - Step 4342: {'lr': 7.226666666666667e-05, 'samples': 138944, 'steps': 271, 'loss/train': 5.167910575866699} -09/20/2021 15:25:40 - INFO - __main__ - Step 4343: {'lr': 7.226666666666667e-05, 'samples': 138976, 'steps': 271, 'loss/train': 5.451864242553711} -09/20/2021 15:25:41 - INFO - __main__ - Step 4344: {'lr': 7.226666666666667e-05, 'samples': 139008, 'steps': 271, 'loss/train': 5.507290840148926} -09/20/2021 15:25:42 - INFO - __main__ - Step 4345: {'lr': 7.226666666666667e-05, 'samples': 139040, 'steps': 271, 'loss/train': 5.70491886138916} -09/20/2021 15:25:43 - INFO - __main__ - Step 4346: {'lr': 7.226666666666667e-05, 'samples': 139072, 'steps': 271, 'loss/train': 6.109258651733398} -09/20/2021 15:25:43 - INFO - __main__ - Step 4347: {'lr': 7.226666666666667e-05, 'samples': 139104, 'steps': 271, 'loss/train': 5.482288837432861} -09/20/2021 15:25:44 - INFO - __main__ - Step 4348: {'lr': 7.226666666666667e-05, 'samples': 139136, 'steps': 271, 'loss/train': 4.820034503936768} -09/20/2021 15:25:45 - INFO - __main__ - Step 4349: {'lr': 7.226666666666667e-05, 'samples': 139168, 'steps': 271, 'loss/train': 5.7791948318481445} -09/20/2021 15:25:46 - INFO - __main__ - Step 4350: {'lr': 7.226666666666667e-05, 'samples': 139200, 'steps': 271, 'loss/train': 6.120129108428955} -09/20/2021 15:25:46 - INFO - __main__ - Step 4351: {'lr': 7.226666666666667e-05, 'samples': 139232, 'steps': 271, 'loss/train': 5.1846699714660645} -09/20/2021 15:25:47 - INFO - __main__ - Step 4352: {'lr': 7.226666666666667e-05, 'samples': 139264, 'steps': 271, 'loss/train': 5.301422119140625} -09/20/2021 15:25:48 - INFO - __main__ - Step 4353: {'lr': 7.253333333333334e-05, 'samples': 139296, 'steps': 272, 'loss/train': 4.954637050628662} -09/20/2021 15:25:49 - INFO - __main__ - Step 4354: {'lr': 7.253333333333334e-05, 'samples': 139328, 'steps': 272, 'loss/train': 5.186250686645508} -09/20/2021 15:25:50 - INFO - __main__ - Step 4355: {'lr': 7.253333333333334e-05, 'samples': 139360, 'steps': 272, 'loss/train': 5.17704439163208} -09/20/2021 15:25:50 - INFO - __main__ - Step 4356: {'lr': 7.253333333333334e-05, 'samples': 139392, 'steps': 272, 'loss/train': 4.7883501052856445} -09/20/2021 15:25:51 - INFO - __main__ - Step 4357: {'lr': 7.253333333333334e-05, 'samples': 139424, 'steps': 272, 'loss/train': 5.239960670471191} -09/20/2021 15:25:52 - INFO - __main__ - Step 4358: {'lr': 7.253333333333334e-05, 'samples': 139456, 'steps': 272, 'loss/train': 2.640453338623047} -09/20/2021 15:25:53 - INFO - __main__ - Step 4359: {'lr': 7.253333333333334e-05, 'samples': 139488, 'steps': 272, 'loss/train': 4.7996673583984375} -09/20/2021 15:25:53 - INFO - __main__ - Step 4360: {'lr': 7.253333333333334e-05, 'samples': 139520, 'steps': 272, 'loss/train': 7.006623268127441} -09/20/2021 15:25:54 - INFO - __main__ - Step 4361: {'lr': 7.253333333333334e-05, 'samples': 139552, 'steps': 272, 'loss/train': 5.1884870529174805} -09/20/2021 15:25:55 - INFO - __main__ - Step 4362: {'lr': 7.253333333333334e-05, 'samples': 139584, 'steps': 272, 'loss/train': 5.034470081329346} -09/20/2021 15:25:56 - INFO - __main__ - Step 4363: {'lr': 7.253333333333334e-05, 'samples': 139616, 'steps': 272, 'loss/train': 5.844695091247559} -09/20/2021 15:25:56 - INFO - __main__ - Step 4364: {'lr': 7.253333333333334e-05, 'samples': 139648, 'steps': 272, 'loss/train': 5.5514912605285645} -09/20/2021 15:25:57 - INFO - __main__ - Step 4365: {'lr': 7.253333333333334e-05, 'samples': 139680, 'steps': 272, 'loss/train': 5.056936264038086} -09/20/2021 15:25:58 - INFO - __main__ - Step 4366: {'lr': 7.253333333333334e-05, 'samples': 139712, 'steps': 272, 'loss/train': 2.9658641815185547} -09/20/2021 15:25:59 - INFO - __main__ - Step 4367: {'lr': 7.253333333333334e-05, 'samples': 139744, 'steps': 272, 'loss/train': 5.062161445617676} -09/20/2021 15:25:59 - INFO - __main__ - Step 4368: {'lr': 7.253333333333334e-05, 'samples': 139776, 'steps': 272, 'loss/train': 5.560389995574951} -09/20/2021 15:26:00 - INFO - __main__ - Step 4369: {'lr': 7.280000000000001e-05, 'samples': 139808, 'steps': 273, 'loss/train': 5.316586017608643} -09/20/2021 15:26:01 - INFO - __main__ - Step 4370: {'lr': 7.280000000000001e-05, 'samples': 139840, 'steps': 273, 'loss/train': 4.710814952850342} -09/20/2021 15:26:02 - INFO - __main__ - Step 4371: {'lr': 7.280000000000001e-05, 'samples': 139872, 'steps': 273, 'loss/train': 5.337206840515137} -09/20/2021 15:26:03 - INFO - __main__ - Step 4372: {'lr': 7.280000000000001e-05, 'samples': 139904, 'steps': 273, 'loss/train': 5.220736980438232} -09/20/2021 15:26:03 - INFO - __main__ - Step 4373: {'lr': 7.280000000000001e-05, 'samples': 139936, 'steps': 273, 'loss/train': 5.952816486358643} -09/20/2021 15:26:04 - INFO - __main__ - Step 4374: {'lr': 7.280000000000001e-05, 'samples': 139968, 'steps': 273, 'loss/train': 5.094738006591797} -09/20/2021 15:26:05 - INFO - __main__ - Step 4375: {'lr': 7.280000000000001e-05, 'samples': 140000, 'steps': 273, 'loss/train': 5.615108489990234} -09/20/2021 15:26:06 - INFO - __main__ - Step 4376: {'lr': 7.280000000000001e-05, 'samples': 140032, 'steps': 273, 'loss/train': 4.552473545074463} -09/20/2021 15:26:07 - INFO - __main__ - Step 4377: {'lr': 7.280000000000001e-05, 'samples': 140064, 'steps': 273, 'loss/train': 5.698679447174072} -09/20/2021 15:26:08 - INFO - __main__ - Step 4378: {'lr': 7.280000000000001e-05, 'samples': 140096, 'steps': 273, 'loss/train': 7.223032474517822} -09/20/2021 15:26:08 - INFO - __main__ - Step 4379: {'lr': 7.280000000000001e-05, 'samples': 140128, 'steps': 273, 'loss/train': 7.296456336975098} -09/20/2021 15:26:09 - INFO - __main__ - Step 4380: {'lr': 7.280000000000001e-05, 'samples': 140160, 'steps': 273, 'loss/train': 5.412067890167236} -09/20/2021 15:26:10 - INFO - __main__ - Step 4381: {'lr': 7.280000000000001e-05, 'samples': 140192, 'steps': 273, 'loss/train': 6.106313228607178} -09/20/2021 15:26:11 - INFO - __main__ - Step 4382: {'lr': 7.280000000000001e-05, 'samples': 140224, 'steps': 273, 'loss/train': 5.294243335723877} -09/20/2021 15:26:11 - INFO - __main__ - Step 4383: {'lr': 7.280000000000001e-05, 'samples': 140256, 'steps': 273, 'loss/train': 3.4666154384613037} -09/20/2021 15:26:12 - INFO - __main__ - Step 4384: {'lr': 7.280000000000001e-05, 'samples': 140288, 'steps': 273, 'loss/train': 5.987436771392822} -09/20/2021 15:26:13 - INFO - __main__ - Step 4385: {'lr': 7.306666666666668e-05, 'samples': 140320, 'steps': 274, 'loss/train': 5.631346702575684} -09/20/2021 15:26:14 - INFO - __main__ - Step 4386: {'lr': 7.306666666666668e-05, 'samples': 140352, 'steps': 274, 'loss/train': 4.450146198272705} -09/20/2021 15:26:15 - INFO - __main__ - Step 4387: {'lr': 7.306666666666668e-05, 'samples': 140384, 'steps': 274, 'loss/train': 5.2248005867004395} -09/20/2021 15:26:15 - INFO - __main__ - Step 4388: {'lr': 7.306666666666668e-05, 'samples': 140416, 'steps': 274, 'loss/train': 5.806710720062256} -09/20/2021 15:26:16 - INFO - __main__ - Step 4389: {'lr': 7.306666666666668e-05, 'samples': 140448, 'steps': 274, 'loss/train': 5.573002815246582} -09/20/2021 15:26:17 - INFO - __main__ - Step 4390: {'lr': 7.306666666666668e-05, 'samples': 140480, 'steps': 274, 'loss/train': 4.676459312438965} -09/20/2021 15:26:18 - INFO - __main__ - Step 4391: {'lr': 7.306666666666668e-05, 'samples': 140512, 'steps': 274, 'loss/train': 4.755455493927002} -09/20/2021 15:26:18 - INFO - __main__ - Step 4392: {'lr': 7.306666666666668e-05, 'samples': 140544, 'steps': 274, 'loss/train': 4.501762390136719} -09/20/2021 15:26:19 - INFO - __main__ - Step 4393: {'lr': 7.306666666666668e-05, 'samples': 140576, 'steps': 274, 'loss/train': 5.858189582824707} -09/20/2021 15:26:20 - INFO - __main__ - Step 4394: {'lr': 7.306666666666668e-05, 'samples': 140608, 'steps': 274, 'loss/train': 5.0169596672058105} -09/20/2021 15:26:21 - INFO - __main__ - Step 4395: {'lr': 7.306666666666668e-05, 'samples': 140640, 'steps': 274, 'loss/train': 5.366095066070557} -09/20/2021 15:26:21 - INFO - __main__ - Step 4396: {'lr': 7.306666666666668e-05, 'samples': 140672, 'steps': 274, 'loss/train': 5.182440757751465} -09/20/2021 15:26:22 - INFO - __main__ - Step 4397: {'lr': 7.306666666666668e-05, 'samples': 140704, 'steps': 274, 'loss/train': 4.986732006072998} -09/20/2021 15:26:23 - INFO - __main__ - Step 4398: {'lr': 7.306666666666668e-05, 'samples': 140736, 'steps': 274, 'loss/train': 6.203718662261963} -09/20/2021 15:26:24 - INFO - __main__ - Step 4399: {'lr': 7.306666666666668e-05, 'samples': 140768, 'steps': 274, 'loss/train': 5.483407974243164} -09/20/2021 15:26:24 - INFO - __main__ - Step 4400: {'lr': 7.306666666666668e-05, 'samples': 140800, 'steps': 274, 'loss/train': 5.878673553466797} -09/20/2021 15:26:25 - INFO - __main__ - Step 4401: {'lr': 7.333333333333333e-05, 'samples': 140832, 'steps': 275, 'loss/train': 5.623448371887207} -09/20/2021 15:26:26 - INFO - __main__ - Step 4402: {'lr': 7.333333333333333e-05, 'samples': 140864, 'steps': 275, 'loss/train': 4.673789024353027} -09/20/2021 15:26:27 - INFO - __main__ - Step 4403: {'lr': 7.333333333333333e-05, 'samples': 140896, 'steps': 275, 'loss/train': 6.814786911010742} -09/20/2021 15:26:27 - INFO - __main__ - Step 4404: {'lr': 7.333333333333333e-05, 'samples': 140928, 'steps': 275, 'loss/train': 5.844600677490234} -09/20/2021 15:26:28 - INFO - __main__ - Step 4405: {'lr': 7.333333333333333e-05, 'samples': 140960, 'steps': 275, 'loss/train': 6.425435543060303} -09/20/2021 15:26:30 - INFO - __main__ - Step 4406: {'lr': 7.333333333333333e-05, 'samples': 140992, 'steps': 275, 'loss/train': 5.449148178100586} -09/20/2021 15:26:30 - INFO - __main__ - Step 4407: {'lr': 7.333333333333333e-05, 'samples': 141024, 'steps': 275, 'loss/train': 5.420917510986328} -09/20/2021 15:26:31 - INFO - __main__ - Step 4408: {'lr': 7.333333333333333e-05, 'samples': 141056, 'steps': 275, 'loss/train': 5.639200687408447} -09/20/2021 15:26:32 - INFO - __main__ - Step 4409: {'lr': 7.333333333333333e-05, 'samples': 141088, 'steps': 275, 'loss/train': 5.225945949554443} -09/20/2021 15:26:33 - INFO - __main__ - Step 4410: {'lr': 7.333333333333333e-05, 'samples': 141120, 'steps': 275, 'loss/train': 4.652252197265625} -09/20/2021 15:26:33 - INFO - __main__ - Step 4411: {'lr': 7.333333333333333e-05, 'samples': 141152, 'steps': 275, 'loss/train': 5.952761173248291} -09/20/2021 15:26:34 - INFO - __main__ - Step 4412: {'lr': 7.333333333333333e-05, 'samples': 141184, 'steps': 275, 'loss/train': 5.410816669464111} -09/20/2021 15:26:35 - INFO - __main__ - Step 4413: {'lr': 7.333333333333333e-05, 'samples': 141216, 'steps': 275, 'loss/train': 5.78819465637207} -09/20/2021 15:26:36 - INFO - __main__ - Step 4414: {'lr': 7.333333333333333e-05, 'samples': 141248, 'steps': 275, 'loss/train': 5.976875305175781} -09/20/2021 15:26:36 - INFO - __main__ - Step 4415: {'lr': 7.333333333333333e-05, 'samples': 141280, 'steps': 275, 'loss/train': 5.619223117828369} -09/20/2021 15:26:37 - INFO - __main__ - Step 4416: {'lr': 7.333333333333333e-05, 'samples': 141312, 'steps': 275, 'loss/train': 5.492790222167969} -09/20/2021 15:26:38 - INFO - __main__ - Step 4417: {'lr': 7.36e-05, 'samples': 141344, 'steps': 276, 'loss/train': 6.370048522949219} -09/20/2021 15:26:39 - INFO - __main__ - Step 4418: {'lr': 7.36e-05, 'samples': 141376, 'steps': 276, 'loss/train': 6.223494052886963} -09/20/2021 15:26:39 - INFO - __main__ - Step 4419: {'lr': 7.36e-05, 'samples': 141408, 'steps': 276, 'loss/train': 5.633800506591797} -09/20/2021 15:26:40 - INFO - __main__ - Step 4420: {'lr': 7.36e-05, 'samples': 141440, 'steps': 276, 'loss/train': 5.234057903289795} -09/20/2021 15:26:41 - INFO - __main__ - Step 4421: {'lr': 7.36e-05, 'samples': 141472, 'steps': 276, 'loss/train': 5.1244964599609375} -09/20/2021 15:26:42 - INFO - __main__ - Step 4422: {'lr': 7.36e-05, 'samples': 141504, 'steps': 276, 'loss/train': 0.8499786853790283} -09/20/2021 15:26:42 - INFO - __main__ - Step 4423: {'lr': 7.36e-05, 'samples': 141536, 'steps': 276, 'loss/train': 6.017881393432617} -09/20/2021 15:26:43 - INFO - __main__ - Step 4424: {'lr': 7.36e-05, 'samples': 141568, 'steps': 276, 'loss/train': 5.0001630783081055} -09/20/2021 15:26:44 - INFO - __main__ - Step 4425: {'lr': 7.36e-05, 'samples': 141600, 'steps': 276, 'loss/train': 4.891355991363525} -09/20/2021 15:26:45 - INFO - __main__ - Step 4426: {'lr': 7.36e-05, 'samples': 141632, 'steps': 276, 'loss/train': 5.032819747924805} -09/20/2021 15:26:45 - INFO - __main__ - Step 4427: {'lr': 7.36e-05, 'samples': 141664, 'steps': 276, 'loss/train': 4.592894554138184} -09/20/2021 15:26:46 - INFO - __main__ - Step 4428: {'lr': 7.36e-05, 'samples': 141696, 'steps': 276, 'loss/train': 5.531311511993408} -09/20/2021 15:26:47 - INFO - __main__ - Step 4429: {'lr': 7.36e-05, 'samples': 141728, 'steps': 276, 'loss/train': 5.0564117431640625} -09/20/2021 15:26:48 - INFO - __main__ - Step 4430: {'lr': 7.36e-05, 'samples': 141760, 'steps': 276, 'loss/train': 5.255195140838623} -09/20/2021 15:26:48 - INFO - __main__ - Step 4431: {'lr': 7.36e-05, 'samples': 141792, 'steps': 276, 'loss/train': 4.772751808166504} -09/20/2021 15:26:49 - INFO - __main__ - Step 4432: {'lr': 7.36e-05, 'samples': 141824, 'steps': 276, 'loss/train': 5.685938835144043} -09/20/2021 15:26:50 - INFO - __main__ - Step 4433: {'lr': 7.386666666666667e-05, 'samples': 141856, 'steps': 277, 'loss/train': 6.912177085876465} -09/20/2021 15:26:51 - INFO - __main__ - Step 4434: {'lr': 7.386666666666667e-05, 'samples': 141888, 'steps': 277, 'loss/train': 5.441844463348389} -09/20/2021 15:26:52 - INFO - __main__ - Step 4435: {'lr': 7.386666666666667e-05, 'samples': 141920, 'steps': 277, 'loss/train': 6.669328689575195} -09/20/2021 15:26:52 - INFO - __main__ - Step 4436: {'lr': 7.386666666666667e-05, 'samples': 141952, 'steps': 277, 'loss/train': 5.691988945007324} -09/20/2021 15:26:53 - INFO - __main__ - Step 4437: {'lr': 7.386666666666667e-05, 'samples': 141984, 'steps': 277, 'loss/train': 5.570296287536621} -09/20/2021 15:26:55 - INFO - __main__ - Step 4438: {'lr': 7.386666666666667e-05, 'samples': 142016, 'steps': 277, 'loss/train': 5.408724308013916} -09/20/2021 15:26:55 - INFO - __main__ - Step 4439: {'lr': 7.386666666666667e-05, 'samples': 142048, 'steps': 277, 'loss/train': 5.343891620635986} -09/20/2021 15:26:56 - INFO - __main__ - Step 4440: {'lr': 7.386666666666667e-05, 'samples': 142080, 'steps': 277, 'loss/train': 5.197979927062988} -09/20/2021 15:26:57 - INFO - __main__ - Step 4441: {'lr': 7.386666666666667e-05, 'samples': 142112, 'steps': 277, 'loss/train': 5.108036518096924} -09/20/2021 15:26:58 - INFO - __main__ - Step 4442: {'lr': 7.386666666666667e-05, 'samples': 142144, 'steps': 277, 'loss/train': 4.634382724761963} -09/20/2021 15:26:58 - INFO - __main__ - Step 4443: {'lr': 7.386666666666667e-05, 'samples': 142176, 'steps': 277, 'loss/train': 6.329591751098633} -09/20/2021 15:26:59 - INFO - __main__ - Step 4444: {'lr': 7.386666666666667e-05, 'samples': 142208, 'steps': 277, 'loss/train': 6.4089250564575195} -09/20/2021 15:27:00 - INFO - __main__ - Step 4445: {'lr': 7.386666666666667e-05, 'samples': 142240, 'steps': 277, 'loss/train': 5.720455169677734} -09/20/2021 15:27:01 - INFO - __main__ - Step 4446: {'lr': 7.386666666666667e-05, 'samples': 142272, 'steps': 277, 'loss/train': 5.8252387046813965} -09/20/2021 15:27:01 - INFO - __main__ - Step 4447: {'lr': 7.386666666666667e-05, 'samples': 142304, 'steps': 277, 'loss/train': 5.060269832611084} -09/20/2021 15:27:02 - INFO - __main__ - Step 4448: {'lr': 7.386666666666667e-05, 'samples': 142336, 'steps': 277, 'loss/train': 5.710058212280273} -09/20/2021 15:27:03 - INFO - __main__ - Step 4449: {'lr': 7.413333333333334e-05, 'samples': 142368, 'steps': 278, 'loss/train': 6.556556224822998} -09/20/2021 15:27:04 - INFO - __main__ - Step 4450: {'lr': 7.413333333333334e-05, 'samples': 142400, 'steps': 278, 'loss/train': 4.786515712738037} -09/20/2021 15:27:05 - INFO - __main__ - Step 4451: {'lr': 7.413333333333334e-05, 'samples': 142432, 'steps': 278, 'loss/train': 5.498515605926514} -09/20/2021 15:27:05 - INFO - __main__ - Step 4452: {'lr': 7.413333333333334e-05, 'samples': 142464, 'steps': 278, 'loss/train': 5.998151779174805} -09/20/2021 15:27:06 - INFO - __main__ - Step 4453: {'lr': 7.413333333333334e-05, 'samples': 142496, 'steps': 278, 'loss/train': 5.150630950927734} -09/20/2021 15:27:07 - INFO - __main__ - Step 4454: {'lr': 7.413333333333334e-05, 'samples': 142528, 'steps': 278, 'loss/train': 4.732308864593506} -09/20/2021 15:27:08 - INFO - __main__ - Step 4455: {'lr': 7.413333333333334e-05, 'samples': 142560, 'steps': 278, 'loss/train': 5.783046245574951} -09/20/2021 15:27:08 - INFO - __main__ - Step 4456: {'lr': 7.413333333333334e-05, 'samples': 142592, 'steps': 278, 'loss/train': 6.448365211486816} -09/20/2021 15:27:09 - INFO - __main__ - Step 4457: {'lr': 7.413333333333334e-05, 'samples': 142624, 'steps': 278, 'loss/train': 4.857707977294922} -09/20/2021 15:27:10 - INFO - __main__ - Step 4458: {'lr': 7.413333333333334e-05, 'samples': 142656, 'steps': 278, 'loss/train': 6.080463886260986} -09/20/2021 15:27:11 - INFO - __main__ - Step 4459: {'lr': 7.413333333333334e-05, 'samples': 142688, 'steps': 278, 'loss/train': 5.249147891998291} -09/20/2021 15:27:11 - INFO - __main__ - Step 4460: {'lr': 7.413333333333334e-05, 'samples': 142720, 'steps': 278, 'loss/train': 5.392813205718994} -09/20/2021 15:27:12 - INFO - __main__ - Step 4461: {'lr': 7.413333333333334e-05, 'samples': 142752, 'steps': 278, 'loss/train': 3.716857433319092} -09/20/2021 15:27:13 - INFO - __main__ - Step 4462: {'lr': 7.413333333333334e-05, 'samples': 142784, 'steps': 278, 'loss/train': 3.507577419281006} -09/20/2021 15:27:14 - INFO - __main__ - Step 4463: {'lr': 7.413333333333334e-05, 'samples': 142816, 'steps': 278, 'loss/train': 3.5955069065093994} -09/20/2021 15:27:14 - INFO - __main__ - Step 4464: {'lr': 7.413333333333334e-05, 'samples': 142848, 'steps': 278, 'loss/train': 5.515825271606445} -09/20/2021 15:27:15 - INFO - __main__ - Step 4465: {'lr': 7.44e-05, 'samples': 142880, 'steps': 279, 'loss/train': 5.284401893615723} -09/20/2021 15:27:16 - INFO - __main__ - Step 4466: {'lr': 7.44e-05, 'samples': 142912, 'steps': 279, 'loss/train': 5.240123271942139} -09/20/2021 15:27:17 - INFO - __main__ - Step 4467: {'lr': 7.44e-05, 'samples': 142944, 'steps': 279, 'loss/train': 6.741515159606934} -09/20/2021 15:27:17 - INFO - __main__ - Step 4468: {'lr': 7.44e-05, 'samples': 142976, 'steps': 279, 'loss/train': 0.9987664818763733} -09/20/2021 15:27:19 - INFO - __main__ - Step 4469: {'lr': 7.44e-05, 'samples': 143008, 'steps': 279, 'loss/train': 5.176795482635498} -09/20/2021 15:27:20 - INFO - __main__ - Step 4470: {'lr': 7.44e-05, 'samples': 143040, 'steps': 279, 'loss/train': 5.923036575317383} -09/20/2021 15:27:20 - INFO - __main__ - Step 4471: {'lr': 7.44e-05, 'samples': 143072, 'steps': 279, 'loss/train': 5.8013763427734375} -09/20/2021 15:27:21 - INFO - __main__ - Step 4472: {'lr': 7.44e-05, 'samples': 143104, 'steps': 279, 'loss/train': 4.916594505310059} -09/20/2021 15:27:22 - INFO - __main__ - Step 4473: {'lr': 7.44e-05, 'samples': 143136, 'steps': 279, 'loss/train': 5.944260120391846} -09/20/2021 15:27:23 - INFO - __main__ - Step 4474: {'lr': 7.44e-05, 'samples': 143168, 'steps': 279, 'loss/train': 5.501603603363037} -09/20/2021 15:27:23 - INFO - __main__ - Step 4475: {'lr': 7.44e-05, 'samples': 143200, 'steps': 279, 'loss/train': 4.625901222229004} -09/20/2021 15:27:24 - INFO - __main__ - Step 4476: {'lr': 7.44e-05, 'samples': 143232, 'steps': 279, 'loss/train': 5.0746564865112305} -09/20/2021 15:27:25 - INFO - __main__ - Step 4477: {'lr': 7.44e-05, 'samples': 143264, 'steps': 279, 'loss/train': 5.534459590911865} -09/20/2021 15:27:26 - INFO - __main__ - Step 4478: {'lr': 7.44e-05, 'samples': 143296, 'steps': 279, 'loss/train': 4.3213114738464355} -09/20/2021 15:27:26 - INFO - __main__ - Step 4479: {'lr': 7.44e-05, 'samples': 143328, 'steps': 279, 'loss/train': 6.209096431732178} -09/20/2021 15:27:27 - INFO - __main__ - Step 4480: {'lr': 7.44e-05, 'samples': 143360, 'steps': 279, 'loss/train': 6.030097484588623} -09/20/2021 15:27:28 - INFO - __main__ - Step 4481: {'lr': 7.466666666666667e-05, 'samples': 143392, 'steps': 280, 'loss/train': 3.9112188816070557} -09/20/2021 15:27:29 - INFO - __main__ - Step 4482: {'lr': 7.466666666666667e-05, 'samples': 143424, 'steps': 280, 'loss/train': 5.276439189910889} -09/20/2021 15:27:29 - INFO - __main__ - Step 4483: {'lr': 7.466666666666667e-05, 'samples': 143456, 'steps': 280, 'loss/train': 4.714699745178223} -09/20/2021 15:27:30 - INFO - __main__ - Step 4484: {'lr': 7.466666666666667e-05, 'samples': 143488, 'steps': 280, 'loss/train': 5.6290364265441895} -09/20/2021 15:27:31 - INFO - __main__ - Step 4485: {'lr': 7.466666666666667e-05, 'samples': 143520, 'steps': 280, 'loss/train': 5.034501552581787} -09/20/2021 15:27:32 - INFO - __main__ - Step 4486: {'lr': 7.466666666666667e-05, 'samples': 143552, 'steps': 280, 'loss/train': 5.175933837890625} -09/20/2021 15:27:32 - INFO - __main__ - Step 4487: {'lr': 7.466666666666667e-05, 'samples': 143584, 'steps': 280, 'loss/train': 4.956721305847168} -09/20/2021 15:27:33 - INFO - __main__ - Step 4488: {'lr': 7.466666666666667e-05, 'samples': 143616, 'steps': 280, 'loss/train': 5.182989120483398} -09/20/2021 15:27:34 - INFO - __main__ - Step 4489: {'lr': 7.466666666666667e-05, 'samples': 143648, 'steps': 280, 'loss/train': 2.417292356491089} -09/20/2021 15:27:35 - INFO - __main__ - Step 4490: {'lr': 7.466666666666667e-05, 'samples': 143680, 'steps': 280, 'loss/train': 5.985912322998047} -09/20/2021 15:27:35 - INFO - __main__ - Step 4491: {'lr': 7.466666666666667e-05, 'samples': 143712, 'steps': 280, 'loss/train': 5.971760272979736} -09/20/2021 15:27:36 - INFO - __main__ - Step 4492: {'lr': 7.466666666666667e-05, 'samples': 143744, 'steps': 280, 'loss/train': 5.230867862701416} -09/20/2021 15:27:37 - INFO - __main__ - Step 4493: {'lr': 7.466666666666667e-05, 'samples': 143776, 'steps': 280, 'loss/train': 5.408276081085205} -09/20/2021 15:27:38 - INFO - __main__ - Step 4494: {'lr': 7.466666666666667e-05, 'samples': 143808, 'steps': 280, 'loss/train': 6.385995864868164} -09/20/2021 15:27:38 - INFO - __main__ - Step 4495: {'lr': 7.466666666666667e-05, 'samples': 143840, 'steps': 280, 'loss/train': 4.50820255279541} -09/20/2021 15:27:39 - INFO - __main__ - Step 4496: {'lr': 7.466666666666667e-05, 'samples': 143872, 'steps': 280, 'loss/train': 5.33376932144165} -09/20/2021 15:27:40 - INFO - __main__ - Step 4497: {'lr': 7.493333333333333e-05, 'samples': 143904, 'steps': 281, 'loss/train': 5.294809818267822} -09/20/2021 15:27:41 - INFO - __main__ - Step 4498: {'lr': 7.493333333333333e-05, 'samples': 143936, 'steps': 281, 'loss/train': 4.853035926818848} -09/20/2021 15:27:42 - INFO - __main__ - Step 4499: {'lr': 7.493333333333333e-05, 'samples': 143968, 'steps': 281, 'loss/train': 6.304806232452393} -09/20/2021 15:27:43 - INFO - __main__ - Step 4500: {'lr': 7.493333333333333e-05, 'samples': 144000, 'steps': 281, 'loss/train': 5.32348108291626} -09/20/2021 15:27:44 - INFO - __main__ - Step 4501: {'lr': 7.493333333333333e-05, 'samples': 144032, 'steps': 281, 'loss/train': 6.226818561553955} -09/20/2021 15:27:44 - INFO - __main__ - Step 4502: {'lr': 7.493333333333333e-05, 'samples': 144064, 'steps': 281, 'loss/train': 5.2326531410217285} -09/20/2021 15:27:45 - INFO - __main__ - Step 4503: {'lr': 7.493333333333333e-05, 'samples': 144096, 'steps': 281, 'loss/train': 5.571634769439697} -09/20/2021 15:27:46 - INFO - __main__ - Step 4504: {'lr': 7.493333333333333e-05, 'samples': 144128, 'steps': 281, 'loss/train': 5.966563701629639} -09/20/2021 15:27:47 - INFO - __main__ - Step 4505: {'lr': 7.493333333333333e-05, 'samples': 144160, 'steps': 281, 'loss/train': 2.9852139949798584} -09/20/2021 15:27:47 - INFO - __main__ - Step 4506: {'lr': 7.493333333333333e-05, 'samples': 144192, 'steps': 281, 'loss/train': 2.8812475204467773} -09/20/2021 15:27:48 - INFO - __main__ - Step 4507: {'lr': 7.493333333333333e-05, 'samples': 144224, 'steps': 281, 'loss/train': 3.0040342807769775} -09/20/2021 15:27:49 - INFO - __main__ - Step 4508: {'lr': 7.493333333333333e-05, 'samples': 144256, 'steps': 281, 'loss/train': 4.591525554656982} -09/20/2021 15:27:50 - INFO - __main__ - Step 4509: {'lr': 7.493333333333333e-05, 'samples': 144288, 'steps': 281, 'loss/train': 5.598766803741455} -09/20/2021 15:27:50 - INFO - __main__ - Step 4510: {'lr': 7.493333333333333e-05, 'samples': 144320, 'steps': 281, 'loss/train': 5.244665622711182} -09/20/2021 15:27:51 - INFO - __main__ - Step 4511: {'lr': 7.493333333333333e-05, 'samples': 144352, 'steps': 281, 'loss/train': 5.2986741065979} -09/20/2021 15:27:52 - INFO - __main__ - Step 4512: {'lr': 7.493333333333333e-05, 'samples': 144384, 'steps': 281, 'loss/train': 5.414282321929932} -09/20/2021 15:27:53 - INFO - __main__ - Step 4513: {'lr': 7.52e-05, 'samples': 144416, 'steps': 282, 'loss/train': 5.992149829864502} -09/20/2021 15:27:54 - INFO - __main__ - Step 4514: {'lr': 7.52e-05, 'samples': 144448, 'steps': 282, 'loss/train': 5.15747594833374} -09/20/2021 15:27:54 - INFO - __main__ - Step 4515: {'lr': 7.52e-05, 'samples': 144480, 'steps': 282, 'loss/train': 4.523283004760742} -09/20/2021 15:27:55 - INFO - __main__ - Step 4516: {'lr': 7.52e-05, 'samples': 144512, 'steps': 282, 'loss/train': 4.340363025665283} -09/20/2021 15:27:56 - INFO - __main__ - Step 4517: {'lr': 7.52e-05, 'samples': 144544, 'steps': 282, 'loss/train': 5.919661521911621} -09/20/2021 15:27:57 - INFO - __main__ - Step 4518: {'lr': 7.52e-05, 'samples': 144576, 'steps': 282, 'loss/train': 6.082365036010742} -09/20/2021 15:27:57 - INFO - __main__ - Step 4519: {'lr': 7.52e-05, 'samples': 144608, 'steps': 282, 'loss/train': 5.389665603637695} -09/20/2021 15:27:58 - INFO - __main__ - Step 4520: {'lr': 7.52e-05, 'samples': 144640, 'steps': 282, 'loss/train': 6.104410171508789} -09/20/2021 15:27:59 - INFO - __main__ - Step 4521: {'lr': 7.52e-05, 'samples': 144672, 'steps': 282, 'loss/train': 5.017051696777344} -09/20/2021 15:28:00 - INFO - __main__ - Step 4522: {'lr': 7.52e-05, 'samples': 144704, 'steps': 282, 'loss/train': 6.673102855682373} -09/20/2021 15:28:00 - INFO - __main__ - Step 4523: {'lr': 7.52e-05, 'samples': 144736, 'steps': 282, 'loss/train': 5.938574314117432} -09/20/2021 15:28:01 - INFO - __main__ - Step 4524: {'lr': 7.52e-05, 'samples': 144768, 'steps': 282, 'loss/train': 5.700127124786377} -09/20/2021 15:28:02 - INFO - __main__ - Step 4525: {'lr': 7.52e-05, 'samples': 144800, 'steps': 282, 'loss/train': 5.213598251342773} -09/20/2021 15:28:03 - INFO - __main__ - Step 4526: {'lr': 7.52e-05, 'samples': 144832, 'steps': 282, 'loss/train': 5.8693528175354} -09/20/2021 15:28:03 - INFO - __main__ - Step 4527: {'lr': 7.52e-05, 'samples': 144864, 'steps': 282, 'loss/train': 5.71565055847168} -09/20/2021 15:28:04 - INFO - __main__ - Step 4528: {'lr': 7.52e-05, 'samples': 144896, 'steps': 282, 'loss/train': 5.112179756164551} -09/20/2021 15:28:05 - INFO - __main__ - Step 4529: {'lr': 7.546666666666668e-05, 'samples': 144928, 'steps': 283, 'loss/train': 5.3100972175598145} -09/20/2021 15:28:06 - INFO - __main__ - Step 4530: {'lr': 7.546666666666668e-05, 'samples': 144960, 'steps': 283, 'loss/train': 5.533773422241211} -09/20/2021 15:28:08 - INFO - __main__ - Step 4531: {'lr': 7.546666666666668e-05, 'samples': 144992, 'steps': 283, 'loss/train': 5.522866725921631} -09/20/2021 15:28:08 - INFO - __main__ - Step 4532: {'lr': 7.546666666666668e-05, 'samples': 145024, 'steps': 283, 'loss/train': 5.461336135864258} -09/20/2021 15:28:09 - INFO - __main__ - Step 4533: {'lr': 7.546666666666668e-05, 'samples': 145056, 'steps': 283, 'loss/train': 5.639922142028809} -09/20/2021 15:28:10 - INFO - __main__ - Step 4534: {'lr': 7.546666666666668e-05, 'samples': 145088, 'steps': 283, 'loss/train': 5.675043106079102} -09/20/2021 15:28:11 - INFO - __main__ - Step 4535: {'lr': 7.546666666666668e-05, 'samples': 145120, 'steps': 283, 'loss/train': 5.5247416496276855} -09/20/2021 15:28:11 - INFO - __main__ - Step 4536: {'lr': 7.546666666666668e-05, 'samples': 145152, 'steps': 283, 'loss/train': 6.001149654388428} -09/20/2021 15:28:12 - INFO - __main__ - Step 4537: {'lr': 7.546666666666668e-05, 'samples': 145184, 'steps': 283, 'loss/train': 5.5872416496276855} -09/20/2021 15:28:13 - INFO - __main__ - Step 4538: {'lr': 7.546666666666668e-05, 'samples': 145216, 'steps': 283, 'loss/train': 5.716784477233887} -09/20/2021 15:28:14 - INFO - __main__ - Step 4539: {'lr': 7.546666666666668e-05, 'samples': 145248, 'steps': 283, 'loss/train': 5.189687728881836} -09/20/2021 15:28:14 - INFO - __main__ - Step 4540: {'lr': 7.546666666666668e-05, 'samples': 145280, 'steps': 283, 'loss/train': 5.317867279052734} -09/20/2021 15:28:15 - INFO - __main__ - Step 4541: {'lr': 7.546666666666668e-05, 'samples': 145312, 'steps': 283, 'loss/train': 5.160130500793457} -09/20/2021 15:28:16 - INFO - __main__ - Step 4542: {'lr': 7.546666666666668e-05, 'samples': 145344, 'steps': 283, 'loss/train': 5.73743200302124} -09/20/2021 15:28:17 - INFO - __main__ - Step 4543: {'lr': 7.546666666666668e-05, 'samples': 145376, 'steps': 283, 'loss/train': 4.244842529296875} -09/20/2021 15:28:17 - INFO - __main__ - Step 4544: {'lr': 7.546666666666668e-05, 'samples': 145408, 'steps': 283, 'loss/train': 5.430264949798584} -09/20/2021 15:28:18 - INFO - __main__ - Step 4545: {'lr': 7.573333333333334e-05, 'samples': 145440, 'steps': 284, 'loss/train': 4.818701267242432} -09/20/2021 15:28:19 - INFO - __main__ - Step 4546: {'lr': 7.573333333333334e-05, 'samples': 145472, 'steps': 284, 'loss/train': 5.506748199462891} -09/20/2021 15:28:20 - INFO - __main__ - Step 4547: {'lr': 7.573333333333334e-05, 'samples': 145504, 'steps': 284, 'loss/train': 5.716595649719238} -09/20/2021 15:28:20 - INFO - __main__ - Step 4548: {'lr': 7.573333333333334e-05, 'samples': 145536, 'steps': 284, 'loss/train': 5.885504722595215} -09/20/2021 15:28:21 - INFO - __main__ - Step 4549: {'lr': 7.573333333333334e-05, 'samples': 145568, 'steps': 284, 'loss/train': 5.14340353012085} -09/20/2021 15:28:22 - INFO - __main__ - Step 4550: {'lr': 7.573333333333334e-05, 'samples': 145600, 'steps': 284, 'loss/train': 6.733628273010254} -09/20/2021 15:28:23 - INFO - __main__ - Step 4551: {'lr': 7.573333333333334e-05, 'samples': 145632, 'steps': 284, 'loss/train': 6.095855236053467} -09/20/2021 15:28:23 - INFO - __main__ - Step 4552: {'lr': 7.573333333333334e-05, 'samples': 145664, 'steps': 284, 'loss/train': 4.861330986022949} -09/20/2021 15:28:24 - INFO - __main__ - Step 4553: {'lr': 7.573333333333334e-05, 'samples': 145696, 'steps': 284, 'loss/train': 6.212584972381592} -09/20/2021 15:28:25 - INFO - __main__ - Step 4554: {'lr': 7.573333333333334e-05, 'samples': 145728, 'steps': 284, 'loss/train': 5.266475677490234} -09/20/2021 15:28:26 - INFO - __main__ - Step 4555: {'lr': 7.573333333333334e-05, 'samples': 145760, 'steps': 284, 'loss/train': 5.267995357513428} -09/20/2021 15:28:26 - INFO - __main__ - Step 4556: {'lr': 7.573333333333334e-05, 'samples': 145792, 'steps': 284, 'loss/train': 4.718427658081055} -09/20/2021 15:28:27 - INFO - __main__ - Step 4557: {'lr': 7.573333333333334e-05, 'samples': 145824, 'steps': 284, 'loss/train': 4.892198085784912} -09/20/2021 15:28:28 - INFO - __main__ - Step 4558: {'lr': 7.573333333333334e-05, 'samples': 145856, 'steps': 284, 'loss/train': 5.547525405883789} -09/20/2021 15:28:29 - INFO - __main__ - Step 4559: {'lr': 7.573333333333334e-05, 'samples': 145888, 'steps': 284, 'loss/train': 8.552312850952148} -09/20/2021 15:28:29 - INFO - __main__ - Step 4560: {'lr': 7.573333333333334e-05, 'samples': 145920, 'steps': 284, 'loss/train': 3.909783124923706} -09/20/2021 15:28:30 - INFO - __main__ - Step 4561: {'lr': 7.6e-05, 'samples': 145952, 'steps': 285, 'loss/train': 4.5409979820251465} -09/20/2021 15:28:32 - INFO - __main__ - Step 4562: {'lr': 7.6e-05, 'samples': 145984, 'steps': 285, 'loss/train': 5.218264579772949} -09/20/2021 15:28:32 - INFO - __main__ - Step 4563: {'lr': 7.6e-05, 'samples': 146016, 'steps': 285, 'loss/train': 4.7978644371032715} -09/20/2021 15:28:33 - INFO - __main__ - Step 4564: {'lr': 7.6e-05, 'samples': 146048, 'steps': 285, 'loss/train': 5.112090110778809} -09/20/2021 15:28:34 - INFO - __main__ - Step 4565: {'lr': 7.6e-05, 'samples': 146080, 'steps': 285, 'loss/train': 5.7730393409729} -09/20/2021 15:28:35 - INFO - __main__ - Step 4566: {'lr': 7.6e-05, 'samples': 146112, 'steps': 285, 'loss/train': 5.431302547454834} -09/20/2021 15:28:35 - INFO - __main__ - Step 4567: {'lr': 7.6e-05, 'samples': 146144, 'steps': 285, 'loss/train': 5.522546768188477} -09/20/2021 15:28:36 - INFO - __main__ - Step 4568: {'lr': 7.6e-05, 'samples': 146176, 'steps': 285, 'loss/train': 6.060423374176025} -09/20/2021 15:28:37 - INFO - __main__ - Step 4569: {'lr': 7.6e-05, 'samples': 146208, 'steps': 285, 'loss/train': 5.534214496612549} -09/20/2021 15:28:38 - INFO - __main__ - Step 4570: {'lr': 7.6e-05, 'samples': 146240, 'steps': 285, 'loss/train': 5.171018600463867} -09/20/2021 15:28:38 - INFO - __main__ - Step 4571: {'lr': 7.6e-05, 'samples': 146272, 'steps': 285, 'loss/train': 5.480294704437256} -09/20/2021 15:28:39 - INFO - __main__ - Step 4572: {'lr': 7.6e-05, 'samples': 146304, 'steps': 285, 'loss/train': 7.340632915496826} -09/20/2021 15:28:40 - INFO - __main__ - Step 4573: {'lr': 7.6e-05, 'samples': 146336, 'steps': 285, 'loss/train': 5.485751628875732} -09/20/2021 15:28:41 - INFO - __main__ - Step 4574: {'lr': 7.6e-05, 'samples': 146368, 'steps': 285, 'loss/train': 5.504886627197266} -09/20/2021 15:28:41 - INFO - __main__ - Step 4575: {'lr': 7.6e-05, 'samples': 146400, 'steps': 285, 'loss/train': 4.130813121795654} -09/20/2021 15:28:42 - INFO - __main__ - Step 4576: {'lr': 7.6e-05, 'samples': 146432, 'steps': 285, 'loss/train': 6.337793350219727} -09/20/2021 15:28:43 - INFO - __main__ - Step 4577: {'lr': 7.626666666666667e-05, 'samples': 146464, 'steps': 286, 'loss/train': 5.352132320404053} -09/20/2021 15:28:44 - INFO - __main__ - Step 4578: {'lr': 7.626666666666667e-05, 'samples': 146496, 'steps': 286, 'loss/train': 5.152563571929932} -09/20/2021 15:28:45 - INFO - __main__ - Step 4579: {'lr': 7.626666666666667e-05, 'samples': 146528, 'steps': 286, 'loss/train': 2.8517394065856934} -09/20/2021 15:28:45 - INFO - __main__ - Step 4580: {'lr': 7.626666666666667e-05, 'samples': 146560, 'steps': 286, 'loss/train': 3.4678893089294434} -09/20/2021 15:28:46 - INFO - __main__ - Step 4581: {'lr': 7.626666666666667e-05, 'samples': 146592, 'steps': 286, 'loss/train': 5.236100673675537} -09/20/2021 15:28:47 - INFO - __main__ - Step 4582: {'lr': 7.626666666666667e-05, 'samples': 146624, 'steps': 286, 'loss/train': 5.350886344909668} -09/20/2021 15:28:48 - INFO - __main__ - Step 4583: {'lr': 7.626666666666667e-05, 'samples': 146656, 'steps': 286, 'loss/train': 6.018505573272705} -09/20/2021 15:28:48 - INFO - __main__ - Step 4584: {'lr': 7.626666666666667e-05, 'samples': 146688, 'steps': 286, 'loss/train': 5.662903785705566} -09/20/2021 15:28:49 - INFO - __main__ - Step 4585: {'lr': 7.626666666666667e-05, 'samples': 146720, 'steps': 286, 'loss/train': 5.319450378417969} -09/20/2021 15:28:50 - INFO - __main__ - Step 4586: {'lr': 7.626666666666667e-05, 'samples': 146752, 'steps': 286, 'loss/train': 5.7806854248046875} -09/20/2021 15:28:51 - INFO - __main__ - Step 4587: {'lr': 7.626666666666667e-05, 'samples': 146784, 'steps': 286, 'loss/train': 3.0301079750061035} -09/20/2021 15:28:51 - INFO - __main__ - Step 4588: {'lr': 7.626666666666667e-05, 'samples': 146816, 'steps': 286, 'loss/train': 4.942442417144775} -09/20/2021 15:28:52 - INFO - __main__ - Step 4589: {'lr': 7.626666666666667e-05, 'samples': 146848, 'steps': 286, 'loss/train': 5.400108337402344} -09/20/2021 15:28:53 - INFO - __main__ - Step 4590: {'lr': 7.626666666666667e-05, 'samples': 146880, 'steps': 286, 'loss/train': 5.246940612792969} -09/20/2021 15:28:54 - INFO - __main__ - Step 4591: {'lr': 7.626666666666667e-05, 'samples': 146912, 'steps': 286, 'loss/train': 3.7298552989959717} -09/20/2021 15:28:54 - INFO - __main__ - Step 4592: {'lr': 7.626666666666667e-05, 'samples': 146944, 'steps': 286, 'loss/train': 5.223062515258789} -09/20/2021 15:28:56 - INFO - __main__ - Step 4593: {'lr': 7.653333333333333e-05, 'samples': 146976, 'steps': 287, 'loss/train': 5.011385440826416} -09/20/2021 15:28:57 - INFO - __main__ - Step 4594: {'lr': 7.653333333333333e-05, 'samples': 147008, 'steps': 287, 'loss/train': 6.070590496063232} -09/20/2021 15:28:57 - INFO - __main__ - Step 4595: {'lr': 7.653333333333333e-05, 'samples': 147040, 'steps': 287, 'loss/train': 5.317637920379639} -09/20/2021 15:28:58 - INFO - __main__ - Step 4596: {'lr': 7.653333333333333e-05, 'samples': 147072, 'steps': 287, 'loss/train': 4.938673973083496} -09/20/2021 15:28:59 - INFO - __main__ - Step 4597: {'lr': 7.653333333333333e-05, 'samples': 147104, 'steps': 287, 'loss/train': 4.99381160736084} -09/20/2021 15:29:00 - INFO - __main__ - Step 4598: {'lr': 7.653333333333333e-05, 'samples': 147136, 'steps': 287, 'loss/train': 4.9808149337768555} -09/20/2021 15:29:00 - INFO - __main__ - Step 4599: {'lr': 7.653333333333333e-05, 'samples': 147168, 'steps': 287, 'loss/train': 5.8042402267456055} -09/20/2021 15:29:01 - INFO - __main__ - Step 4600: {'lr': 7.653333333333333e-05, 'samples': 147200, 'steps': 287, 'loss/train': 5.4022979736328125} -09/20/2021 15:29:02 - INFO - __main__ - Step 4601: {'lr': 7.653333333333333e-05, 'samples': 147232, 'steps': 287, 'loss/train': 4.90098762512207} -09/20/2021 15:29:03 - INFO - __main__ - Step 4602: {'lr': 7.653333333333333e-05, 'samples': 147264, 'steps': 287, 'loss/train': 6.532174587249756} -09/20/2021 15:29:03 - INFO - __main__ - Step 4603: {'lr': 7.653333333333333e-05, 'samples': 147296, 'steps': 287, 'loss/train': 6.101161479949951} -09/20/2021 15:29:04 - INFO - __main__ - Step 4604: {'lr': 7.653333333333333e-05, 'samples': 147328, 'steps': 287, 'loss/train': 4.653881072998047} -09/20/2021 15:29:05 - INFO - __main__ - Step 4605: {'lr': 7.653333333333333e-05, 'samples': 147360, 'steps': 287, 'loss/train': 4.766629219055176} -09/20/2021 15:29:06 - INFO - __main__ - Step 4606: {'lr': 7.653333333333333e-05, 'samples': 147392, 'steps': 287, 'loss/train': 5.521703720092773} -09/20/2021 15:29:06 - INFO - __main__ - Step 4607: {'lr': 7.653333333333333e-05, 'samples': 147424, 'steps': 287, 'loss/train': 5.096555233001709} -09/20/2021 15:29:07 - INFO - __main__ - Step 4608: {'lr': 7.653333333333333e-05, 'samples': 147456, 'steps': 287, 'loss/train': 6.664859294891357} -09/20/2021 15:29:08 - INFO - __main__ - Step 4609: {'lr': 7.680000000000001e-05, 'samples': 147488, 'steps': 288, 'loss/train': 5.852946758270264} -09/20/2021 15:29:09 - INFO - __main__ - Step 4610: {'lr': 7.680000000000001e-05, 'samples': 147520, 'steps': 288, 'loss/train': 6.343890190124512} -09/20/2021 15:29:10 - INFO - __main__ - Step 4611: {'lr': 7.680000000000001e-05, 'samples': 147552, 'steps': 288, 'loss/train': 6.092362880706787} -09/20/2021 15:29:10 - INFO - __main__ - Step 4612: {'lr': 7.680000000000001e-05, 'samples': 147584, 'steps': 288, 'loss/train': 5.298228740692139} -09/20/2021 15:29:11 - INFO - __main__ - Step 4613: {'lr': 7.680000000000001e-05, 'samples': 147616, 'steps': 288, 'loss/train': 4.659576416015625} -09/20/2021 15:29:12 - INFO - __main__ - Step 4614: {'lr': 7.680000000000001e-05, 'samples': 147648, 'steps': 288, 'loss/train': 5.680912971496582} -09/20/2021 15:29:13 - INFO - __main__ - Step 4615: {'lr': 7.680000000000001e-05, 'samples': 147680, 'steps': 288, 'loss/train': 5.4541473388671875} -09/20/2021 15:29:13 - INFO - __main__ - Step 4616: {'lr': 7.680000000000001e-05, 'samples': 147712, 'steps': 288, 'loss/train': 5.578554630279541} -09/20/2021 15:29:14 - INFO - __main__ - Step 4617: {'lr': 7.680000000000001e-05, 'samples': 147744, 'steps': 288, 'loss/train': 6.005313396453857} -09/20/2021 15:29:15 - INFO - __main__ - Step 4618: {'lr': 7.680000000000001e-05, 'samples': 147776, 'steps': 288, 'loss/train': 5.745676517486572} -09/20/2021 15:29:16 - INFO - __main__ - Step 4619: {'lr': 7.680000000000001e-05, 'samples': 147808, 'steps': 288, 'loss/train': 5.835874080657959} -09/20/2021 15:29:16 - INFO - __main__ - Step 4620: {'lr': 7.680000000000001e-05, 'samples': 147840, 'steps': 288, 'loss/train': 3.707944631576538} -09/20/2021 15:29:17 - INFO - __main__ - Step 4621: {'lr': 7.680000000000001e-05, 'samples': 147872, 'steps': 288, 'loss/train': 2.737013578414917} -09/20/2021 15:29:18 - INFO - __main__ - Step 4622: {'lr': 7.680000000000001e-05, 'samples': 147904, 'steps': 288, 'loss/train': 2.5688443183898926} -09/20/2021 15:29:19 - INFO - __main__ - Step 4623: {'lr': 7.680000000000001e-05, 'samples': 147936, 'steps': 288, 'loss/train': 2.8841090202331543} -09/20/2021 15:29:20 - INFO - __main__ - Step 4624: {'lr': 7.680000000000001e-05, 'samples': 147968, 'steps': 288, 'loss/train': 5.352253437042236} -09/20/2021 15:29:21 - INFO - __main__ - Step 4625: {'lr': 7.706666666666668e-05, 'samples': 148000, 'steps': 289, 'loss/train': 6.144937038421631} -09/20/2021 15:29:22 - INFO - __main__ - Step 4626: {'lr': 7.706666666666668e-05, 'samples': 148032, 'steps': 289, 'loss/train': 5.805943012237549} -09/20/2021 15:29:22 - INFO - __main__ - Step 4627: {'lr': 7.706666666666668e-05, 'samples': 148064, 'steps': 289, 'loss/train': 6.055062770843506} -09/20/2021 15:29:23 - INFO - __main__ - Step 4628: {'lr': 7.706666666666668e-05, 'samples': 148096, 'steps': 289, 'loss/train': 5.134720802307129} -09/20/2021 15:29:24 - INFO - __main__ - Step 4629: {'lr': 7.706666666666668e-05, 'samples': 148128, 'steps': 289, 'loss/train': 6.021145820617676} -09/20/2021 15:29:25 - INFO - __main__ - Step 4630: {'lr': 7.706666666666668e-05, 'samples': 148160, 'steps': 289, 'loss/train': 5.5235700607299805} -09/20/2021 15:29:25 - INFO - __main__ - Step 4631: {'lr': 7.706666666666668e-05, 'samples': 148192, 'steps': 289, 'loss/train': 4.292232513427734} -09/20/2021 15:29:26 - INFO - __main__ - Step 4632: {'lr': 7.706666666666668e-05, 'samples': 148224, 'steps': 289, 'loss/train': 4.9766716957092285} -09/20/2021 15:29:27 - INFO - __main__ - Step 4633: {'lr': 7.706666666666668e-05, 'samples': 148256, 'steps': 289, 'loss/train': 4.963958740234375} -09/20/2021 15:29:28 - INFO - __main__ - Step 4634: {'lr': 7.706666666666668e-05, 'samples': 148288, 'steps': 289, 'loss/train': 2.700479507446289} -09/20/2021 15:29:28 - INFO - __main__ - Step 4635: {'lr': 7.706666666666668e-05, 'samples': 148320, 'steps': 289, 'loss/train': 5.89247989654541} -09/20/2021 15:29:29 - INFO - __main__ - Step 4636: {'lr': 7.706666666666668e-05, 'samples': 148352, 'steps': 289, 'loss/train': 5.426644802093506} -09/20/2021 15:29:30 - INFO - __main__ - Step 4637: {'lr': 7.706666666666668e-05, 'samples': 148384, 'steps': 289, 'loss/train': 4.169192790985107} -09/20/2021 15:29:31 - INFO - __main__ - Step 4638: {'lr': 7.706666666666668e-05, 'samples': 148416, 'steps': 289, 'loss/train': 5.7880706787109375} -09/20/2021 15:29:31 - INFO - __main__ - Step 4639: {'lr': 7.706666666666668e-05, 'samples': 148448, 'steps': 289, 'loss/train': 4.780680179595947} -09/20/2021 15:29:32 - INFO - __main__ - Step 4640: {'lr': 7.706666666666668e-05, 'samples': 148480, 'steps': 289, 'loss/train': 5.556665420532227} -09/20/2021 15:29:33 - INFO - __main__ - Step 4641: {'lr': 7.733333333333333e-05, 'samples': 148512, 'steps': 290, 'loss/train': 5.388270378112793} -09/20/2021 15:29:34 - INFO - __main__ - Step 4642: {'lr': 7.733333333333333e-05, 'samples': 148544, 'steps': 290, 'loss/train': 4.886449337005615} -09/20/2021 15:29:34 - INFO - __main__ - Step 4643: {'lr': 7.733333333333333e-05, 'samples': 148576, 'steps': 290, 'loss/train': 5.328670024871826} -09/20/2021 15:29:35 - INFO - __main__ - Step 4644: {'lr': 7.733333333333333e-05, 'samples': 148608, 'steps': 290, 'loss/train': 4.604154109954834} -09/20/2021 15:29:36 - INFO - __main__ - Step 4645: {'lr': 7.733333333333333e-05, 'samples': 148640, 'steps': 290, 'loss/train': 5.415585994720459} -09/20/2021 15:29:37 - INFO - __main__ - Step 4646: {'lr': 7.733333333333333e-05, 'samples': 148672, 'steps': 290, 'loss/train': 4.612975597381592} -09/20/2021 15:29:37 - INFO - __main__ - Step 4647: {'lr': 7.733333333333333e-05, 'samples': 148704, 'steps': 290, 'loss/train': 5.312697887420654} -09/20/2021 15:29:38 - INFO - __main__ - Step 4648: {'lr': 7.733333333333333e-05, 'samples': 148736, 'steps': 290, 'loss/train': 5.780230522155762} -09/20/2021 15:29:39 - INFO - __main__ - Step 4649: {'lr': 7.733333333333333e-05, 'samples': 148768, 'steps': 290, 'loss/train': 5.465467929840088} -09/20/2021 15:29:40 - INFO - __main__ - Step 4650: {'lr': 7.733333333333333e-05, 'samples': 148800, 'steps': 290, 'loss/train': 4.6212477684021} -09/20/2021 15:29:40 - INFO - __main__ - Step 4651: {'lr': 7.733333333333333e-05, 'samples': 148832, 'steps': 290, 'loss/train': 5.719583511352539} -09/20/2021 15:29:41 - INFO - __main__ - Step 4652: {'lr': 7.733333333333333e-05, 'samples': 148864, 'steps': 290, 'loss/train': 5.571081638336182} -09/20/2021 15:29:42 - INFO - __main__ - Step 4653: {'lr': 7.733333333333333e-05, 'samples': 148896, 'steps': 290, 'loss/train': 5.192627429962158} -09/20/2021 15:29:43 - INFO - __main__ - Step 4654: {'lr': 7.733333333333333e-05, 'samples': 148928, 'steps': 290, 'loss/train': 7.301811218261719} -09/20/2021 15:29:44 - INFO - __main__ - Step 4655: {'lr': 7.733333333333333e-05, 'samples': 148960, 'steps': 290, 'loss/train': 4.966060161590576} -09/20/2021 15:29:45 - INFO - __main__ - Step 4656: {'lr': 7.733333333333333e-05, 'samples': 148992, 'steps': 290, 'loss/train': 5.498871803283691} -09/20/2021 15:29:46 - INFO - __main__ - Step 4657: {'lr': 7.76e-05, 'samples': 149024, 'steps': 291, 'loss/train': 5.672582149505615} -09/20/2021 15:29:46 - INFO - __main__ - Step 4658: {'lr': 7.76e-05, 'samples': 149056, 'steps': 291, 'loss/train': 4.476406574249268} -09/20/2021 15:29:47 - INFO - __main__ - Step 4659: {'lr': 7.76e-05, 'samples': 149088, 'steps': 291, 'loss/train': 6.259646892547607} -09/20/2021 15:29:48 - INFO - __main__ - Step 4660: {'lr': 7.76e-05, 'samples': 149120, 'steps': 291, 'loss/train': 5.202132225036621} -09/20/2021 15:29:49 - INFO - __main__ - Step 4661: {'lr': 7.76e-05, 'samples': 149152, 'steps': 291, 'loss/train': 4.736645698547363} -09/20/2021 15:29:49 - INFO - __main__ - Step 4662: {'lr': 7.76e-05, 'samples': 149184, 'steps': 291, 'loss/train': 5.352738857269287} -09/20/2021 15:29:50 - INFO - __main__ - Step 4663: {'lr': 7.76e-05, 'samples': 149216, 'steps': 291, 'loss/train': 3.1918842792510986} -09/20/2021 15:29:51 - INFO - __main__ - Step 4664: {'lr': 7.76e-05, 'samples': 149248, 'steps': 291, 'loss/train': 5.997156620025635} -09/20/2021 15:29:52 - INFO - __main__ - Step 4665: {'lr': 7.76e-05, 'samples': 149280, 'steps': 291, 'loss/train': 5.295978546142578} -09/20/2021 15:29:52 - INFO - __main__ - Step 4666: {'lr': 7.76e-05, 'samples': 149312, 'steps': 291, 'loss/train': 5.499514579772949} -09/20/2021 15:29:53 - INFO - __main__ - Step 4667: {'lr': 7.76e-05, 'samples': 149344, 'steps': 291, 'loss/train': 3.8125429153442383} -09/20/2021 15:29:54 - INFO - __main__ - Step 4668: {'lr': 7.76e-05, 'samples': 149376, 'steps': 291, 'loss/train': 2.5117874145507812} -09/20/2021 15:29:55 - INFO - __main__ - Step 4669: {'lr': 7.76e-05, 'samples': 149408, 'steps': 291, 'loss/train': 5.562502861022949} -09/20/2021 15:29:55 - INFO - __main__ - Step 4670: {'lr': 7.76e-05, 'samples': 149440, 'steps': 291, 'loss/train': 7.199620723724365} -09/20/2021 15:29:56 - INFO - __main__ - Step 4671: {'lr': 7.76e-05, 'samples': 149472, 'steps': 291, 'loss/train': 5.854090213775635} -09/20/2021 15:29:57 - INFO - __main__ - Step 4672: {'lr': 7.76e-05, 'samples': 149504, 'steps': 291, 'loss/train': 5.31201696395874} -09/20/2021 15:29:58 - INFO - __main__ - Step 4673: {'lr': 7.786666666666667e-05, 'samples': 149536, 'steps': 292, 'loss/train': 4.967014312744141} -09/20/2021 15:29:59 - INFO - __main__ - Step 4674: {'lr': 7.786666666666667e-05, 'samples': 149568, 'steps': 292, 'loss/train': 4.322098255157471} -09/20/2021 15:29:59 - INFO - __main__ - Step 4675: {'lr': 7.786666666666667e-05, 'samples': 149600, 'steps': 292, 'loss/train': 4.972704887390137} -09/20/2021 15:30:00 - INFO - __main__ - Step 4676: {'lr': 7.786666666666667e-05, 'samples': 149632, 'steps': 292, 'loss/train': 4.937442779541016} -09/20/2021 15:30:01 - INFO - __main__ - Step 4677: {'lr': 7.786666666666667e-05, 'samples': 149664, 'steps': 292, 'loss/train': 5.688011646270752} -09/20/2021 15:30:02 - INFO - __main__ - Step 4678: {'lr': 7.786666666666667e-05, 'samples': 149696, 'steps': 292, 'loss/train': 5.359736442565918} -09/20/2021 15:30:02 - INFO - __main__ - Step 4679: {'lr': 7.786666666666667e-05, 'samples': 149728, 'steps': 292, 'loss/train': 4.970710754394531} -09/20/2021 15:30:03 - INFO - __main__ - Step 4680: {'lr': 7.786666666666667e-05, 'samples': 149760, 'steps': 292, 'loss/train': 4.789140701293945} -09/20/2021 15:30:04 - INFO - __main__ - Step 4681: {'lr': 7.786666666666667e-05, 'samples': 149792, 'steps': 292, 'loss/train': 6.190579891204834} -09/20/2021 15:30:05 - INFO - __main__ - Step 4682: {'lr': 7.786666666666667e-05, 'samples': 149824, 'steps': 292, 'loss/train': 5.180537223815918} -09/20/2021 15:30:05 - INFO - __main__ - Step 4683: {'lr': 7.786666666666667e-05, 'samples': 149856, 'steps': 292, 'loss/train': 5.427474498748779} -09/20/2021 15:30:06 - INFO - __main__ - Step 4684: {'lr': 7.786666666666667e-05, 'samples': 149888, 'steps': 292, 'loss/train': 5.262916564941406} -09/20/2021 15:30:07 - INFO - __main__ - Step 4685: {'lr': 7.786666666666667e-05, 'samples': 149920, 'steps': 292, 'loss/train': 6.338757514953613} -09/20/2021 15:30:08 - INFO - __main__ - Step 4686: {'lr': 7.786666666666667e-05, 'samples': 149952, 'steps': 292, 'loss/train': 4.719053268432617} -09/20/2021 15:30:09 - INFO - __main__ - Step 4687: {'lr': 7.786666666666667e-05, 'samples': 149984, 'steps': 292, 'loss/train': 5.31782341003418} -09/20/2021 15:30:10 - INFO - __main__ - Step 4688: {'lr': 7.786666666666667e-05, 'samples': 150016, 'steps': 292, 'loss/train': 4.96221399307251} -09/20/2021 15:30:11 - INFO - __main__ - Step 4689: {'lr': 7.813333333333334e-05, 'samples': 150048, 'steps': 293, 'loss/train': 5.295232772827148} -09/20/2021 15:30:11 - INFO - __main__ - Step 4690: {'lr': 7.813333333333334e-05, 'samples': 150080, 'steps': 293, 'loss/train': 5.534135341644287} -09/20/2021 15:30:12 - INFO - __main__ - Step 4691: {'lr': 7.813333333333334e-05, 'samples': 150112, 'steps': 293, 'loss/train': 4.9918060302734375} -09/20/2021 15:30:13 - INFO - __main__ - Step 4692: {'lr': 7.813333333333334e-05, 'samples': 150144, 'steps': 293, 'loss/train': 5.397793292999268} -09/20/2021 15:30:14 - INFO - __main__ - Step 4693: {'lr': 7.813333333333334e-05, 'samples': 150176, 'steps': 293, 'loss/train': 5.3243408203125} -09/20/2021 15:30:14 - INFO - __main__ - Step 4694: {'lr': 7.813333333333334e-05, 'samples': 150208, 'steps': 293, 'loss/train': 5.520057678222656} -09/20/2021 15:30:15 - INFO - __main__ - Step 4695: {'lr': 7.813333333333334e-05, 'samples': 150240, 'steps': 293, 'loss/train': 5.326910972595215} -09/20/2021 15:30:16 - INFO - __main__ - Step 4696: {'lr': 7.813333333333334e-05, 'samples': 150272, 'steps': 293, 'loss/train': 4.788662910461426} -09/20/2021 15:30:17 - INFO - __main__ - Step 4697: {'lr': 7.813333333333334e-05, 'samples': 150304, 'steps': 293, 'loss/train': 5.666843891143799} -09/20/2021 15:30:17 - INFO - __main__ - Step 4698: {'lr': 7.813333333333334e-05, 'samples': 150336, 'steps': 293, 'loss/train': 5.670262813568115} -09/20/2021 15:30:18 - INFO - __main__ - Step 4699: {'lr': 7.813333333333334e-05, 'samples': 150368, 'steps': 293, 'loss/train': 4.8939127922058105} -09/20/2021 15:30:19 - INFO - __main__ - Step 4700: {'lr': 7.813333333333334e-05, 'samples': 150400, 'steps': 293, 'loss/train': 5.904105186462402} -09/20/2021 15:30:20 - INFO - __main__ - Step 4701: {'lr': 7.813333333333334e-05, 'samples': 150432, 'steps': 293, 'loss/train': 6.406614780426025} -09/20/2021 15:30:20 - INFO - __main__ - Step 4702: {'lr': 7.813333333333334e-05, 'samples': 150464, 'steps': 293, 'loss/train': 5.399034023284912} -09/20/2021 15:30:21 - INFO - __main__ - Step 4703: {'lr': 7.813333333333334e-05, 'samples': 150496, 'steps': 293, 'loss/train': 5.344061851501465} -09/20/2021 15:30:22 - INFO - __main__ - Step 4704: {'lr': 7.813333333333334e-05, 'samples': 150528, 'steps': 293, 'loss/train': 5.824329853057861} -09/20/2021 15:30:23 - INFO - __main__ - Step 4705: {'lr': 7.840000000000001e-05, 'samples': 150560, 'steps': 294, 'loss/train': 5.400763511657715} -09/20/2021 15:30:23 - INFO - __main__ - Step 4706: {'lr': 7.840000000000001e-05, 'samples': 150592, 'steps': 294, 'loss/train': 5.802358150482178} -09/20/2021 15:30:24 - INFO - __main__ - Step 4707: {'lr': 7.840000000000001e-05, 'samples': 150624, 'steps': 294, 'loss/train': 5.324863910675049} -09/20/2021 15:30:25 - INFO - __main__ - Step 4708: {'lr': 7.840000000000001e-05, 'samples': 150656, 'steps': 294, 'loss/train': 5.32637882232666} -09/20/2021 15:30:26 - INFO - __main__ - Step 4709: {'lr': 7.840000000000001e-05, 'samples': 150688, 'steps': 294, 'loss/train': 6.097682476043701} -09/20/2021 15:30:26 - INFO - __main__ - Step 4710: {'lr': 7.840000000000001e-05, 'samples': 150720, 'steps': 294, 'loss/train': 5.124694347381592} -09/20/2021 15:30:27 - INFO - __main__ - Step 4711: {'lr': 7.840000000000001e-05, 'samples': 150752, 'steps': 294, 'loss/train': 5.353367328643799} -09/20/2021 15:30:28 - INFO - __main__ - Step 4712: {'lr': 7.840000000000001e-05, 'samples': 150784, 'steps': 294, 'loss/train': 5.494429111480713} -09/20/2021 15:30:29 - INFO - __main__ - Step 4713: {'lr': 7.840000000000001e-05, 'samples': 150816, 'steps': 294, 'loss/train': 4.694206237792969} -09/20/2021 15:30:29 - INFO - __main__ - Step 4714: {'lr': 7.840000000000001e-05, 'samples': 150848, 'steps': 294, 'loss/train': 5.410038471221924} -09/20/2021 15:30:30 - INFO - __main__ - Step 4715: {'lr': 7.840000000000001e-05, 'samples': 150880, 'steps': 294, 'loss/train': 5.392768859863281} -09/20/2021 15:30:31 - INFO - __main__ - Step 4716: {'lr': 7.840000000000001e-05, 'samples': 150912, 'steps': 294, 'loss/train': 4.988758563995361} -09/20/2021 15:30:32 - INFO - __main__ - Step 4717: {'lr': 7.840000000000001e-05, 'samples': 150944, 'steps': 294, 'loss/train': 6.897923469543457} -09/20/2021 15:30:33 - INFO - __main__ - Step 4718: {'lr': 7.840000000000001e-05, 'samples': 150976, 'steps': 294, 'loss/train': 5.387388706207275} -09/20/2021 15:30:34 - INFO - __main__ - Step 4719: {'lr': 7.840000000000001e-05, 'samples': 151008, 'steps': 294, 'loss/train': 5.4693074226379395} -09/20/2021 15:30:35 - INFO - __main__ - Step 4720: {'lr': 7.840000000000001e-05, 'samples': 151040, 'steps': 294, 'loss/train': 4.523196697235107} -09/20/2021 15:30:35 - INFO - __main__ - Step 4721: {'lr': 7.866666666666666e-05, 'samples': 151072, 'steps': 295, 'loss/train': 4.919972896575928} -09/20/2021 15:30:36 - INFO - __main__ - Step 4722: {'lr': 7.866666666666666e-05, 'samples': 151104, 'steps': 295, 'loss/train': 5.014980792999268} -09/20/2021 15:30:37 - INFO - __main__ - Step 4723: {'lr': 7.866666666666666e-05, 'samples': 151136, 'steps': 295, 'loss/train': 5.302999496459961} -09/20/2021 15:30:38 - INFO - __main__ - Step 4724: {'lr': 7.866666666666666e-05, 'samples': 151168, 'steps': 295, 'loss/train': 4.9534831047058105} -09/20/2021 15:30:38 - INFO - __main__ - Step 4725: {'lr': 7.866666666666666e-05, 'samples': 151200, 'steps': 295, 'loss/train': 5.071728229522705} -09/20/2021 15:30:39 - INFO - __main__ - Step 4726: {'lr': 7.866666666666666e-05, 'samples': 151232, 'steps': 295, 'loss/train': 4.917537212371826} -09/20/2021 15:30:40 - INFO - __main__ - Step 4727: {'lr': 7.866666666666666e-05, 'samples': 151264, 'steps': 295, 'loss/train': 5.168331623077393} -09/20/2021 15:30:41 - INFO - __main__ - Step 4728: {'lr': 7.866666666666666e-05, 'samples': 151296, 'steps': 295, 'loss/train': 3.6410915851593018} -09/20/2021 15:30:41 - INFO - __main__ - Step 4729: {'lr': 7.866666666666666e-05, 'samples': 151328, 'steps': 295, 'loss/train': 5.465755939483643} -09/20/2021 15:30:42 - INFO - __main__ - Step 4730: {'lr': 7.866666666666666e-05, 'samples': 151360, 'steps': 295, 'loss/train': 4.966460227966309} -09/20/2021 15:30:43 - INFO - __main__ - Step 4731: {'lr': 7.866666666666666e-05, 'samples': 151392, 'steps': 295, 'loss/train': 5.760241985321045} -09/20/2021 15:30:44 - INFO - __main__ - Step 4732: {'lr': 7.866666666666666e-05, 'samples': 151424, 'steps': 295, 'loss/train': 3.8709356784820557} -09/20/2021 15:30:44 - INFO - __main__ - Step 4733: {'lr': 7.866666666666666e-05, 'samples': 151456, 'steps': 295, 'loss/train': 5.53029203414917} -09/20/2021 15:30:45 - INFO - __main__ - Step 4734: {'lr': 7.866666666666666e-05, 'samples': 151488, 'steps': 295, 'loss/train': 5.155550479888916} -09/20/2021 15:30:46 - INFO - __main__ - Step 4735: {'lr': 7.866666666666666e-05, 'samples': 151520, 'steps': 295, 'loss/train': 6.1695661544799805} -09/20/2021 15:30:47 - INFO - __main__ - Step 4736: {'lr': 7.866666666666666e-05, 'samples': 151552, 'steps': 295, 'loss/train': 5.377432346343994} -09/20/2021 15:30:48 - INFO - __main__ - Step 4737: {'lr': 7.893333333333333e-05, 'samples': 151584, 'steps': 296, 'loss/train': 5.639698028564453} -09/20/2021 15:30:48 - INFO - __main__ - Step 4738: {'lr': 7.893333333333333e-05, 'samples': 151616, 'steps': 296, 'loss/train': 4.915383815765381} -09/20/2021 15:30:49 - INFO - __main__ - Step 4739: {'lr': 7.893333333333333e-05, 'samples': 151648, 'steps': 296, 'loss/train': 5.575832843780518} -09/20/2021 15:30:50 - INFO - __main__ - Step 4740: {'lr': 7.893333333333333e-05, 'samples': 151680, 'steps': 296, 'loss/train': 5.428203105926514} -09/20/2021 15:30:51 - INFO - __main__ - Step 4741: {'lr': 7.893333333333333e-05, 'samples': 151712, 'steps': 296, 'loss/train': 4.287022590637207} -09/20/2021 15:30:51 - INFO - __main__ - Step 4742: {'lr': 7.893333333333333e-05, 'samples': 151744, 'steps': 296, 'loss/train': 4.878973007202148} -09/20/2021 15:30:52 - INFO - __main__ - Step 4743: {'lr': 7.893333333333333e-05, 'samples': 151776, 'steps': 296, 'loss/train': 5.262876510620117} -09/20/2021 15:30:53 - INFO - __main__ - Step 4744: {'lr': 7.893333333333333e-05, 'samples': 151808, 'steps': 296, 'loss/train': 6.180769920349121} -09/20/2021 15:30:54 - INFO - __main__ - Step 4745: {'lr': 7.893333333333333e-05, 'samples': 151840, 'steps': 296, 'loss/train': 6.408411502838135} -09/20/2021 15:30:54 - INFO - __main__ - Step 4746: {'lr': 7.893333333333333e-05, 'samples': 151872, 'steps': 296, 'loss/train': 4.6819939613342285} -09/20/2021 15:30:56 - INFO - __main__ - Step 4747: {'lr': 7.893333333333333e-05, 'samples': 151904, 'steps': 296, 'loss/train': 5.126769542694092} -09/20/2021 15:30:56 - INFO - __main__ - Step 4748: {'lr': 7.893333333333333e-05, 'samples': 151936, 'steps': 296, 'loss/train': 5.734513759613037} -09/20/2021 15:30:57 - INFO - __main__ - Step 4749: {'lr': 7.893333333333333e-05, 'samples': 151968, 'steps': 296, 'loss/train': 5.773078441619873} -09/20/2021 15:30:58 - INFO - __main__ - Step 4750: {'lr': 7.893333333333333e-05, 'samples': 152000, 'steps': 296, 'loss/train': 6.912895202636719} -09/20/2021 15:30:59 - INFO - __main__ - Step 4751: {'lr': 7.893333333333333e-05, 'samples': 152032, 'steps': 296, 'loss/train': 5.784300327301025} -09/20/2021 15:30:59 - INFO - __main__ - Step 4752: {'lr': 7.893333333333333e-05, 'samples': 152064, 'steps': 296, 'loss/train': 5.614590167999268} -09/20/2021 15:31:00 - INFO - __main__ - Step 4753: {'lr': 7.920000000000001e-05, 'samples': 152096, 'steps': 297, 'loss/train': 5.476154804229736} -09/20/2021 15:31:01 - INFO - __main__ - Step 4754: {'lr': 7.920000000000001e-05, 'samples': 152128, 'steps': 297, 'loss/train': 4.11313009262085} -09/20/2021 15:31:02 - INFO - __main__ - Step 4755: {'lr': 7.920000000000001e-05, 'samples': 152160, 'steps': 297, 'loss/train': 5.325584411621094} -09/20/2021 15:31:02 - INFO - __main__ - Step 4756: {'lr': 7.920000000000001e-05, 'samples': 152192, 'steps': 297, 'loss/train': 4.472682952880859} -09/20/2021 15:31:03 - INFO - __main__ - Step 4757: {'lr': 7.920000000000001e-05, 'samples': 152224, 'steps': 297, 'loss/train': 5.204057693481445} -09/20/2021 15:31:04 - INFO - __main__ - Step 4758: {'lr': 7.920000000000001e-05, 'samples': 152256, 'steps': 297, 'loss/train': 5.3257904052734375} -09/20/2021 15:31:05 - INFO - __main__ - Step 4759: {'lr': 7.920000000000001e-05, 'samples': 152288, 'steps': 297, 'loss/train': 6.127524375915527} -09/20/2021 15:31:05 - INFO - __main__ - Step 4760: {'lr': 7.920000000000001e-05, 'samples': 152320, 'steps': 297, 'loss/train': 5.276191711425781} -09/20/2021 15:31:06 - INFO - __main__ - Step 4761: {'lr': 7.920000000000001e-05, 'samples': 152352, 'steps': 297, 'loss/train': 6.3362135887146} -09/20/2021 15:31:07 - INFO - __main__ - Step 4762: {'lr': 7.920000000000001e-05, 'samples': 152384, 'steps': 297, 'loss/train': 5.460935115814209} -09/20/2021 15:31:08 - INFO - __main__ - Step 4763: {'lr': 7.920000000000001e-05, 'samples': 152416, 'steps': 297, 'loss/train': 4.184385299682617} -09/20/2021 15:31:08 - INFO - __main__ - Step 4764: {'lr': 7.920000000000001e-05, 'samples': 152448, 'steps': 297, 'loss/train': 5.794515132904053} -09/20/2021 15:31:09 - INFO - __main__ - Step 4765: {'lr': 7.920000000000001e-05, 'samples': 152480, 'steps': 297, 'loss/train': 6.5190958976745605} -09/20/2021 15:31:10 - INFO - __main__ - Step 4766: {'lr': 7.920000000000001e-05, 'samples': 152512, 'steps': 297, 'loss/train': 7.318321704864502} -09/20/2021 15:31:11 - INFO - __main__ - Step 4767: {'lr': 7.920000000000001e-05, 'samples': 152544, 'steps': 297, 'loss/train': 5.686529636383057} -09/20/2021 15:31:11 - INFO - __main__ - Step 4768: {'lr': 7.920000000000001e-05, 'samples': 152576, 'steps': 297, 'loss/train': 5.607117176055908} -09/20/2021 15:31:12 - INFO - __main__ - Step 4769: {'lr': 7.946666666666667e-05, 'samples': 152608, 'steps': 298, 'loss/train': 4.5747904777526855} -09/20/2021 15:31:13 - INFO - __main__ - Step 4770: {'lr': 7.946666666666667e-05, 'samples': 152640, 'steps': 298, 'loss/train': 5.36928653717041} -09/20/2021 15:31:14 - INFO - __main__ - Step 4771: {'lr': 7.946666666666667e-05, 'samples': 152672, 'steps': 298, 'loss/train': 5.442177772521973} -09/20/2021 15:31:15 - INFO - __main__ - Step 4772: {'lr': 7.946666666666667e-05, 'samples': 152704, 'steps': 298, 'loss/train': 5.641175270080566} -09/20/2021 15:31:15 - INFO - __main__ - Step 4773: {'lr': 7.946666666666667e-05, 'samples': 152736, 'steps': 298, 'loss/train': 5.518006324768066} -09/20/2021 15:31:16 - INFO - __main__ - Step 4774: {'lr': 7.946666666666667e-05, 'samples': 152768, 'steps': 298, 'loss/train': 5.434079170227051} -09/20/2021 15:31:17 - INFO - __main__ - Step 4775: {'lr': 7.946666666666667e-05, 'samples': 152800, 'steps': 298, 'loss/train': 4.957564830780029} -09/20/2021 15:31:18 - INFO - __main__ - Step 4776: {'lr': 7.946666666666667e-05, 'samples': 152832, 'steps': 298, 'loss/train': 5.7759175300598145} -09/20/2021 15:31:19 - INFO - __main__ - Step 4777: {'lr': 7.946666666666667e-05, 'samples': 152864, 'steps': 298, 'loss/train': 4.746893882751465} -09/20/2021 15:31:20 - INFO - __main__ - Step 4778: {'lr': 7.946666666666667e-05, 'samples': 152896, 'steps': 298, 'loss/train': 5.356778621673584} -09/20/2021 15:31:20 - INFO - __main__ - Step 4779: {'lr': 7.946666666666667e-05, 'samples': 152928, 'steps': 298, 'loss/train': 5.848897933959961} -09/20/2021 15:31:21 - INFO - __main__ - Step 4780: {'lr': 7.946666666666667e-05, 'samples': 152960, 'steps': 298, 'loss/train': 4.9499897956848145} -09/20/2021 15:31:22 - INFO - __main__ - Step 4781: {'lr': 7.946666666666667e-05, 'samples': 152992, 'steps': 298, 'loss/train': 5.248047351837158} -09/20/2021 15:31:23 - INFO - __main__ - Step 4782: {'lr': 7.946666666666667e-05, 'samples': 153024, 'steps': 298, 'loss/train': 5.36011266708374} -09/20/2021 15:31:23 - INFO - __main__ - Step 4783: {'lr': 7.946666666666667e-05, 'samples': 153056, 'steps': 298, 'loss/train': 5.533944129943848} -09/20/2021 15:31:24 - INFO - __main__ - Step 4784: {'lr': 7.946666666666667e-05, 'samples': 153088, 'steps': 298, 'loss/train': 5.574655055999756} -09/20/2021 15:31:25 - INFO - __main__ - Step 4785: {'lr': 7.973333333333334e-05, 'samples': 153120, 'steps': 299, 'loss/train': 4.953268527984619} -09/20/2021 15:31:26 - INFO - __main__ - Step 4786: {'lr': 7.973333333333334e-05, 'samples': 153152, 'steps': 299, 'loss/train': 5.209625244140625} -09/20/2021 15:31:27 - INFO - __main__ - Step 4787: {'lr': 7.973333333333334e-05, 'samples': 153184, 'steps': 299, 'loss/train': 6.903402328491211} -09/20/2021 15:31:27 - INFO - __main__ - Step 4788: {'lr': 7.973333333333334e-05, 'samples': 153216, 'steps': 299, 'loss/train': 6.762294292449951} -09/20/2021 15:31:28 - INFO - __main__ - Step 4789: {'lr': 7.973333333333334e-05, 'samples': 153248, 'steps': 299, 'loss/train': 5.727801322937012} -09/20/2021 15:31:29 - INFO - __main__ - Step 4790: {'lr': 7.973333333333334e-05, 'samples': 153280, 'steps': 299, 'loss/train': 5.714907169342041} -09/20/2021 15:31:30 - INFO - __main__ - Step 4791: {'lr': 7.973333333333334e-05, 'samples': 153312, 'steps': 299, 'loss/train': 5.1351637840271} -09/20/2021 15:31:30 - INFO - __main__ - Step 4792: {'lr': 7.973333333333334e-05, 'samples': 153344, 'steps': 299, 'loss/train': 5.174346446990967} -09/20/2021 15:31:31 - INFO - __main__ - Step 4793: {'lr': 7.973333333333334e-05, 'samples': 153376, 'steps': 299, 'loss/train': 5.065070152282715} -09/20/2021 15:31:32 - INFO - __main__ - Step 4794: {'lr': 7.973333333333334e-05, 'samples': 153408, 'steps': 299, 'loss/train': 5.062902450561523} -09/20/2021 15:31:33 - INFO - __main__ - Step 4795: {'lr': 7.973333333333334e-05, 'samples': 153440, 'steps': 299, 'loss/train': 4.9183478355407715} -09/20/2021 15:31:33 - INFO - __main__ - Step 4796: {'lr': 7.973333333333334e-05, 'samples': 153472, 'steps': 299, 'loss/train': 5.8664069175720215} -09/20/2021 15:31:34 - INFO - __main__ - Step 4797: {'lr': 7.973333333333334e-05, 'samples': 153504, 'steps': 299, 'loss/train': 5.524677276611328} -09/20/2021 15:31:35 - INFO - __main__ - Step 4798: {'lr': 7.973333333333334e-05, 'samples': 153536, 'steps': 299, 'loss/train': 5.555685997009277} -09/20/2021 15:31:36 - INFO - __main__ - Step 4799: {'lr': 7.973333333333334e-05, 'samples': 153568, 'steps': 299, 'loss/train': 5.298201084136963} -09/20/2021 15:31:36 - INFO - __main__ - Step 4800: {'lr': 7.973333333333334e-05, 'samples': 153600, 'steps': 299, 'loss/train': 5.800741672515869} -09/20/2021 15:31:37 - INFO - __main__ - Step 4801: {'lr': 8e-05, 'samples': 153632, 'steps': 300, 'loss/train': 5.461219310760498} -09/20/2021 15:31:38 - INFO - __main__ - Step 4802: {'lr': 8e-05, 'samples': 153664, 'steps': 300, 'loss/train': 5.326870918273926} -09/20/2021 15:31:39 - INFO - __main__ - Step 4803: {'lr': 8e-05, 'samples': 153696, 'steps': 300, 'loss/train': 6.173565864562988} -09/20/2021 15:31:39 - INFO - __main__ - Step 4804: {'lr': 8e-05, 'samples': 153728, 'steps': 300, 'loss/train': 4.502365589141846} -09/20/2021 15:31:40 - INFO - __main__ - Step 4805: {'lr': 8e-05, 'samples': 153760, 'steps': 300, 'loss/train': 5.477347373962402} -09/20/2021 15:31:41 - INFO - __main__ - Step 4806: {'lr': 8e-05, 'samples': 153792, 'steps': 300, 'loss/train': 4.939754486083984} -09/20/2021 15:31:42 - INFO - __main__ - Step 4807: {'lr': 8e-05, 'samples': 153824, 'steps': 300, 'loss/train': 4.689521789550781} -09/20/2021 15:31:43 - INFO - __main__ - Step 4808: {'lr': 8e-05, 'samples': 153856, 'steps': 300, 'loss/train': 3.529254198074341} -09/20/2021 15:31:44 - INFO - __main__ - Step 4809: {'lr': 8e-05, 'samples': 153888, 'steps': 300, 'loss/train': 6.038878440856934} -09/20/2021 15:31:45 - INFO - __main__ - Step 4810: {'lr': 8e-05, 'samples': 153920, 'steps': 300, 'loss/train': 6.218875885009766} -09/20/2021 15:31:46 - INFO - __main__ - Step 4811: {'lr': 8e-05, 'samples': 153952, 'steps': 300, 'loss/train': 4.896056652069092} -09/20/2021 15:31:46 - INFO - __main__ - Step 4812: {'lr': 8e-05, 'samples': 153984, 'steps': 300, 'loss/train': 5.398807048797607} -09/20/2021 15:31:47 - INFO - __main__ - Step 4813: {'lr': 8e-05, 'samples': 154016, 'steps': 300, 'loss/train': 4.950446605682373} -09/20/2021 15:31:48 - INFO - __main__ - Step 4814: {'lr': 8e-05, 'samples': 154048, 'steps': 300, 'loss/train': 6.201563358306885} -09/20/2021 15:31:49 - INFO - __main__ - Step 4815: {'lr': 8e-05, 'samples': 154080, 'steps': 300, 'loss/train': 5.764690399169922} -09/20/2021 15:31:49 - INFO - __main__ - Step 4816: {'lr': 8e-05, 'samples': 154112, 'steps': 300, 'loss/train': 5.39171028137207} -09/20/2021 15:31:50 - INFO - __main__ - Step 4817: {'lr': 8.026666666666666e-05, 'samples': 154144, 'steps': 301, 'loss/train': 2.9365763664245605} -09/20/2021 15:31:51 - INFO - __main__ - Step 4818: {'lr': 8.026666666666666e-05, 'samples': 154176, 'steps': 301, 'loss/train': 5.377200603485107} -09/20/2021 15:31:52 - INFO - __main__ - Step 4819: {'lr': 8.026666666666666e-05, 'samples': 154208, 'steps': 301, 'loss/train': 5.386132717132568} -09/20/2021 15:31:52 - INFO - __main__ - Step 4820: {'lr': 8.026666666666666e-05, 'samples': 154240, 'steps': 301, 'loss/train': 6.210172176361084} -09/20/2021 15:31:53 - INFO - __main__ - Step 4821: {'lr': 8.026666666666666e-05, 'samples': 154272, 'steps': 301, 'loss/train': 4.727843284606934} -09/20/2021 15:31:54 - INFO - __main__ - Step 4822: {'lr': 8.026666666666666e-05, 'samples': 154304, 'steps': 301, 'loss/train': 4.56445837020874} -09/20/2021 15:31:55 - INFO - __main__ - Step 4823: {'lr': 8.026666666666666e-05, 'samples': 154336, 'steps': 301, 'loss/train': 4.524242877960205} -09/20/2021 15:31:55 - INFO - __main__ - Step 4824: {'lr': 8.026666666666666e-05, 'samples': 154368, 'steps': 301, 'loss/train': 4.486336708068848} -09/20/2021 15:31:56 - INFO - __main__ - Step 4825: {'lr': 8.026666666666666e-05, 'samples': 154400, 'steps': 301, 'loss/train': 4.507199764251709} -09/20/2021 15:31:57 - INFO - __main__ - Step 4826: {'lr': 8.026666666666666e-05, 'samples': 154432, 'steps': 301, 'loss/train': 4.436805248260498} -09/20/2021 15:31:58 - INFO - __main__ - Step 4827: {'lr': 8.026666666666666e-05, 'samples': 154464, 'steps': 301, 'loss/train': 4.543234348297119} -09/20/2021 15:31:58 - INFO - __main__ - Step 4828: {'lr': 8.026666666666666e-05, 'samples': 154496, 'steps': 301, 'loss/train': 4.50554895401001} -09/20/2021 15:31:59 - INFO - __main__ - Step 4829: {'lr': 8.026666666666666e-05, 'samples': 154528, 'steps': 301, 'loss/train': 4.51401948928833} -09/20/2021 15:32:00 - INFO - __main__ - Step 4830: {'lr': 8.026666666666666e-05, 'samples': 154560, 'steps': 301, 'loss/train': 4.496257781982422} -09/20/2021 15:32:01 - INFO - __main__ - Step 4831: {'lr': 8.026666666666666e-05, 'samples': 154592, 'steps': 301, 'loss/train': 5.024193286895752} -09/20/2021 15:32:01 - INFO - __main__ - Step 4832: {'lr': 8.026666666666666e-05, 'samples': 154624, 'steps': 301, 'loss/train': 5.308282852172852} -09/20/2021 15:32:02 - INFO - __main__ - Step 4833: {'lr': 8.053333333333334e-05, 'samples': 154656, 'steps': 302, 'loss/train': 4.830345630645752} -09/20/2021 15:32:03 - INFO - __main__ - Step 4834: {'lr': 8.053333333333334e-05, 'samples': 154688, 'steps': 302, 'loss/train': 4.739180564880371} -09/20/2021 15:32:04 - INFO - __main__ - Step 4835: {'lr': 8.053333333333334e-05, 'samples': 154720, 'steps': 302, 'loss/train': 5.410952568054199} -09/20/2021 15:32:05 - INFO - __main__ - Step 4836: {'lr': 8.053333333333334e-05, 'samples': 154752, 'steps': 302, 'loss/train': 5.620928764343262} -09/20/2021 15:32:05 - INFO - __main__ - Step 4837: {'lr': 8.053333333333334e-05, 'samples': 154784, 'steps': 302, 'loss/train': 8.163758277893066} -09/20/2021 15:32:06 - INFO - __main__ - Step 4838: {'lr': 8.053333333333334e-05, 'samples': 154816, 'steps': 302, 'loss/train': 8.37623119354248} -09/20/2021 15:32:07 - INFO - __main__ - Step 4839: {'lr': 8.053333333333334e-05, 'samples': 154848, 'steps': 302, 'loss/train': 8.63700008392334} -09/20/2021 15:32:08 - INFO - __main__ - Step 4840: {'lr': 8.053333333333334e-05, 'samples': 154880, 'steps': 302, 'loss/train': 8.696738243103027} -09/20/2021 15:32:08 - INFO - __main__ - Step 4841: {'lr': 8.053333333333334e-05, 'samples': 154912, 'steps': 302, 'loss/train': 4.934760570526123} -09/20/2021 15:32:09 - INFO - __main__ - Step 4842: {'lr': 8.053333333333334e-05, 'samples': 154944, 'steps': 302, 'loss/train': 5.17291784286499} -09/20/2021 15:32:10 - INFO - __main__ - Step 4843: {'lr': 8.053333333333334e-05, 'samples': 154976, 'steps': 302, 'loss/train': 5.477624893188477} -09/20/2021 15:32:11 - INFO - __main__ - Step 4844: {'lr': 8.053333333333334e-05, 'samples': 155008, 'steps': 302, 'loss/train': 5.395003795623779} -09/20/2021 15:32:11 - INFO - __main__ - Step 4845: {'lr': 8.053333333333334e-05, 'samples': 155040, 'steps': 302, 'loss/train': 5.044056415557861} -09/20/2021 15:32:13 - INFO - __main__ - Step 4846: {'lr': 8.053333333333334e-05, 'samples': 155072, 'steps': 302, 'loss/train': 6.346251487731934} -09/20/2021 15:32:14 - INFO - __main__ - Step 4847: {'lr': 8.053333333333334e-05, 'samples': 155104, 'steps': 302, 'loss/train': 5.382023811340332} -09/20/2021 15:32:15 - INFO - __main__ - Step 4848: {'lr': 8.053333333333334e-05, 'samples': 155136, 'steps': 302, 'loss/train': 5.6117448806762695} -09/20/2021 15:32:16 - INFO - __main__ - Step 4849: {'lr': 8.080000000000001e-05, 'samples': 155168, 'steps': 303, 'loss/train': 6.404287338256836} -09/20/2021 15:32:16 - INFO - __main__ - Step 4850: {'lr': 8.080000000000001e-05, 'samples': 155200, 'steps': 303, 'loss/train': 6.368414402008057} -09/20/2021 15:32:17 - INFO - __main__ - Step 4851: {'lr': 8.080000000000001e-05, 'samples': 155232, 'steps': 303, 'loss/train': 4.56447696685791} -09/20/2021 15:32:18 - INFO - __main__ - Step 4852: {'lr': 8.080000000000001e-05, 'samples': 155264, 'steps': 303, 'loss/train': 5.808920383453369} -09/20/2021 15:32:19 - INFO - __main__ - Step 4853: {'lr': 8.080000000000001e-05, 'samples': 155296, 'steps': 303, 'loss/train': 5.551543235778809} -09/20/2021 15:32:19 - INFO - __main__ - Step 4854: {'lr': 8.080000000000001e-05, 'samples': 155328, 'steps': 303, 'loss/train': 6.149200916290283} -09/20/2021 15:32:20 - INFO - __main__ - Step 4855: {'lr': 8.080000000000001e-05, 'samples': 155360, 'steps': 303, 'loss/train': 5.950965881347656} -09/20/2021 15:32:21 - INFO - __main__ - Step 4856: {'lr': 8.080000000000001e-05, 'samples': 155392, 'steps': 303, 'loss/train': 5.80861234664917} -09/20/2021 15:32:22 - INFO - __main__ - Step 4857: {'lr': 8.080000000000001e-05, 'samples': 155424, 'steps': 303, 'loss/train': 5.395907402038574} -09/20/2021 15:32:22 - INFO - __main__ - Step 4858: {'lr': 8.080000000000001e-05, 'samples': 155456, 'steps': 303, 'loss/train': 5.718006610870361} -09/20/2021 15:32:23 - INFO - __main__ - Step 4859: {'lr': 8.080000000000001e-05, 'samples': 155488, 'steps': 303, 'loss/train': 3.0555012226104736} -09/20/2021 15:32:24 - INFO - __main__ - Step 4860: {'lr': 8.080000000000001e-05, 'samples': 155520, 'steps': 303, 'loss/train': 5.22431755065918} -09/20/2021 15:32:25 - INFO - __main__ - Step 4861: {'lr': 8.080000000000001e-05, 'samples': 155552, 'steps': 303, 'loss/train': 5.395984172821045} -09/20/2021 15:32:25 - INFO - __main__ - Step 4862: {'lr': 8.080000000000001e-05, 'samples': 155584, 'steps': 303, 'loss/train': 4.793773174285889} -09/20/2021 15:32:26 - INFO - __main__ - Step 4863: {'lr': 8.080000000000001e-05, 'samples': 155616, 'steps': 303, 'loss/train': 6.285000801086426} -09/20/2021 15:32:27 - INFO - __main__ - Step 4864: {'lr': 8.080000000000001e-05, 'samples': 155648, 'steps': 303, 'loss/train': 6.080304145812988} -09/20/2021 15:32:28 - INFO - __main__ - Step 4865: {'lr': 8.106666666666667e-05, 'samples': 155680, 'steps': 304, 'loss/train': 5.209150791168213} -09/20/2021 15:32:28 - INFO - __main__ - Step 4866: {'lr': 8.106666666666667e-05, 'samples': 155712, 'steps': 304, 'loss/train': 5.931151390075684} -09/20/2021 15:32:29 - INFO - __main__ - Step 4867: {'lr': 8.106666666666667e-05, 'samples': 155744, 'steps': 304, 'loss/train': 5.683284759521484} -09/20/2021 15:32:30 - INFO - __main__ - Step 4868: {'lr': 8.106666666666667e-05, 'samples': 155776, 'steps': 304, 'loss/train': 5.162135124206543} -09/20/2021 15:32:31 - INFO - __main__ - Step 4869: {'lr': 8.106666666666667e-05, 'samples': 155808, 'steps': 304, 'loss/train': 5.363882541656494} -09/20/2021 15:32:31 - INFO - __main__ - Step 4870: {'lr': 8.106666666666667e-05, 'samples': 155840, 'steps': 304, 'loss/train': 4.758358478546143} -09/20/2021 15:32:32 - INFO - __main__ - Step 4871: {'lr': 8.106666666666667e-05, 'samples': 155872, 'steps': 304, 'loss/train': 5.76579475402832} -09/20/2021 15:32:33 - INFO - __main__ - Step 4872: {'lr': 8.106666666666667e-05, 'samples': 155904, 'steps': 304, 'loss/train': 4.7786431312561035} -09/20/2021 15:32:34 - INFO - __main__ - Step 4873: {'lr': 8.106666666666667e-05, 'samples': 155936, 'steps': 304, 'loss/train': 5.2358551025390625} -09/20/2021 15:32:34 - INFO - __main__ - Step 4874: {'lr': 8.106666666666667e-05, 'samples': 155968, 'steps': 304, 'loss/train': 5.131595611572266} -09/20/2021 15:32:35 - INFO - __main__ - Step 4875: {'lr': 8.106666666666667e-05, 'samples': 156000, 'steps': 304, 'loss/train': 5.454939365386963} -09/20/2021 15:32:37 - INFO - __main__ - Step 4876: {'lr': 8.106666666666667e-05, 'samples': 156032, 'steps': 304, 'loss/train': 4.669661521911621} -09/20/2021 15:32:37 - INFO - __main__ - Step 4877: {'lr': 8.106666666666667e-05, 'samples': 156064, 'steps': 304, 'loss/train': 5.870526313781738} -09/20/2021 15:32:38 - INFO - __main__ - Step 4878: {'lr': 8.106666666666667e-05, 'samples': 156096, 'steps': 304, 'loss/train': 4.827754497528076} -09/20/2021 15:32:39 - INFO - __main__ - Step 4879: {'lr': 8.106666666666667e-05, 'samples': 156128, 'steps': 304, 'loss/train': 5.734160423278809} -09/20/2021 15:32:40 - INFO - __main__ - Step 4880: {'lr': 8.106666666666667e-05, 'samples': 156160, 'steps': 304, 'loss/train': 5.26615047454834} -09/20/2021 15:32:40 - INFO - __main__ - Step 4881: {'lr': 8.133333333333334e-05, 'samples': 156192, 'steps': 305, 'loss/train': 5.930915355682373} -09/20/2021 15:32:41 - INFO - __main__ - Step 4882: {'lr': 8.133333333333334e-05, 'samples': 156224, 'steps': 305, 'loss/train': 4.224565029144287} -09/20/2021 15:32:42 - INFO - __main__ - Step 4883: {'lr': 8.133333333333334e-05, 'samples': 156256, 'steps': 305, 'loss/train': 4.127201557159424} -09/20/2021 15:32:43 - INFO - __main__ - Step 4884: {'lr': 8.133333333333334e-05, 'samples': 156288, 'steps': 305, 'loss/train': 5.04114294052124} -09/20/2021 15:32:43 - INFO - __main__ - Step 4885: {'lr': 8.133333333333334e-05, 'samples': 156320, 'steps': 305, 'loss/train': 4.5057878494262695} -09/20/2021 15:32:44 - INFO - __main__ - Step 4886: {'lr': 8.133333333333334e-05, 'samples': 156352, 'steps': 305, 'loss/train': 5.087780475616455} -09/20/2021 15:32:45 - INFO - __main__ - Step 4887: {'lr': 8.133333333333334e-05, 'samples': 156384, 'steps': 305, 'loss/train': 7.728635787963867} -09/20/2021 15:32:46 - INFO - __main__ - Step 4888: {'lr': 8.133333333333334e-05, 'samples': 156416, 'steps': 305, 'loss/train': 4.937198638916016} -09/20/2021 15:32:46 - INFO - __main__ - Step 4889: {'lr': 8.133333333333334e-05, 'samples': 156448, 'steps': 305, 'loss/train': 5.604025363922119} -09/20/2021 15:32:47 - INFO - __main__ - Step 4890: {'lr': 8.133333333333334e-05, 'samples': 156480, 'steps': 305, 'loss/train': 5.433679580688477} -09/20/2021 15:32:48 - INFO - __main__ - Step 4891: {'lr': 8.133333333333334e-05, 'samples': 156512, 'steps': 305, 'loss/train': 4.679986953735352} -09/20/2021 15:32:49 - INFO - __main__ - Step 4892: {'lr': 8.133333333333334e-05, 'samples': 156544, 'steps': 305, 'loss/train': 6.211657524108887} -09/20/2021 15:32:49 - INFO - __main__ - Step 4893: {'lr': 8.133333333333334e-05, 'samples': 156576, 'steps': 305, 'loss/train': 5.4820051193237305} -09/20/2021 15:32:50 - INFO - __main__ - Step 4894: {'lr': 8.133333333333334e-05, 'samples': 156608, 'steps': 305, 'loss/train': 5.89391565322876} -09/20/2021 15:32:51 - INFO - __main__ - Step 4895: {'lr': 8.133333333333334e-05, 'samples': 156640, 'steps': 305, 'loss/train': 5.564783096313477} -09/20/2021 15:32:52 - INFO - __main__ - Step 4896: {'lr': 8.133333333333334e-05, 'samples': 156672, 'steps': 305, 'loss/train': 5.129359722137451} -09/20/2021 15:32:53 - INFO - __main__ - Step 4897: {'lr': 8.16e-05, 'samples': 156704, 'steps': 306, 'loss/train': 2.2188477516174316} -09/20/2021 15:32:53 - INFO - __main__ - Step 4898: {'lr': 8.16e-05, 'samples': 156736, 'steps': 306, 'loss/train': 5.721442699432373} -09/20/2021 15:32:54 - INFO - __main__ - Step 4899: {'lr': 8.16e-05, 'samples': 156768, 'steps': 306, 'loss/train': 5.1500115394592285} -09/20/2021 15:32:55 - INFO - __main__ - Step 4900: {'lr': 8.16e-05, 'samples': 156800, 'steps': 306, 'loss/train': 3.2524161338806152} -09/20/2021 15:32:56 - INFO - __main__ - Step 4901: {'lr': 8.16e-05, 'samples': 156832, 'steps': 306, 'loss/train': 5.292043209075928} -09/20/2021 15:32:56 - INFO - __main__ - Step 4902: {'lr': 8.16e-05, 'samples': 156864, 'steps': 306, 'loss/train': 4.642873764038086} -09/20/2021 15:32:57 - INFO - __main__ - Step 4903: {'lr': 8.16e-05, 'samples': 156896, 'steps': 306, 'loss/train': 4.942684173583984} -09/20/2021 15:32:58 - INFO - __main__ - Step 4904: {'lr': 8.16e-05, 'samples': 156928, 'steps': 306, 'loss/train': 5.347644805908203} -09/20/2021 15:32:59 - INFO - __main__ - Step 4905: {'lr': 8.16e-05, 'samples': 156960, 'steps': 306, 'loss/train': 5.321578502655029} -09/20/2021 15:32:59 - INFO - __main__ - Step 4906: {'lr': 8.16e-05, 'samples': 156992, 'steps': 306, 'loss/train': 5.690346717834473} -09/20/2021 15:33:01 - INFO - __main__ - Step 4907: {'lr': 8.16e-05, 'samples': 157024, 'steps': 306, 'loss/train': 2.6573290824890137} -09/20/2021 15:33:01 - INFO - __main__ - Step 4908: {'lr': 8.16e-05, 'samples': 157056, 'steps': 306, 'loss/train': 6.068639278411865} -09/20/2021 15:33:02 - INFO - __main__ - Step 4909: {'lr': 8.16e-05, 'samples': 157088, 'steps': 306, 'loss/train': 5.2399420738220215} -09/20/2021 15:33:03 - INFO - __main__ - Step 4910: {'lr': 8.16e-05, 'samples': 157120, 'steps': 306, 'loss/train': 5.884511947631836} -09/20/2021 15:33:04 - INFO - __main__ - Step 4911: {'lr': 8.16e-05, 'samples': 157152, 'steps': 306, 'loss/train': 6.307431221008301} -09/20/2021 15:33:04 - INFO - __main__ - Step 4912: {'lr': 8.16e-05, 'samples': 157184, 'steps': 306, 'loss/train': 5.927221298217773} -09/20/2021 15:33:05 - INFO - __main__ - Step 4913: {'lr': 8.186666666666667e-05, 'samples': 157216, 'steps': 307, 'loss/train': 5.942783832550049} -09/20/2021 15:33:06 - INFO - __main__ - Step 4914: {'lr': 8.186666666666667e-05, 'samples': 157248, 'steps': 307, 'loss/train': 5.270291328430176} -09/20/2021 15:33:07 - INFO - __main__ - Step 4915: {'lr': 8.186666666666667e-05, 'samples': 157280, 'steps': 307, 'loss/train': 5.263009548187256} -09/20/2021 15:33:08 - INFO - __main__ - Step 4916: {'lr': 8.186666666666667e-05, 'samples': 157312, 'steps': 307, 'loss/train': 5.589785099029541} -09/20/2021 15:33:08 - INFO - __main__ - Step 4917: {'lr': 8.186666666666667e-05, 'samples': 157344, 'steps': 307, 'loss/train': 5.986478805541992} -09/20/2021 15:33:09 - INFO - __main__ - Step 4918: {'lr': 8.186666666666667e-05, 'samples': 157376, 'steps': 307, 'loss/train': 5.794854164123535} -09/20/2021 15:33:10 - INFO - __main__ - Step 4919: {'lr': 8.186666666666667e-05, 'samples': 157408, 'steps': 307, 'loss/train': 4.557121753692627} -09/20/2021 15:33:11 - INFO - __main__ - Step 4920: {'lr': 8.186666666666667e-05, 'samples': 157440, 'steps': 307, 'loss/train': 5.125516891479492} -09/20/2021 15:33:11 - INFO - __main__ - Step 4921: {'lr': 8.186666666666667e-05, 'samples': 157472, 'steps': 307, 'loss/train': 4.612670421600342} -09/20/2021 15:33:12 - INFO - __main__ - Step 4922: {'lr': 8.186666666666667e-05, 'samples': 157504, 'steps': 307, 'loss/train': 5.829664707183838} -09/20/2021 15:33:13 - INFO - __main__ - Step 4923: {'lr': 8.186666666666667e-05, 'samples': 157536, 'steps': 307, 'loss/train': 4.854950904846191} -09/20/2021 15:33:14 - INFO - __main__ - Step 4924: {'lr': 8.186666666666667e-05, 'samples': 157568, 'steps': 307, 'loss/train': 5.032217502593994} -09/20/2021 15:33:14 - INFO - __main__ - Step 4925: {'lr': 8.186666666666667e-05, 'samples': 157600, 'steps': 307, 'loss/train': 5.467102527618408} -09/20/2021 15:33:15 - INFO - __main__ - Step 4926: {'lr': 8.186666666666667e-05, 'samples': 157632, 'steps': 307, 'loss/train': 5.331958770751953} -09/20/2021 15:33:16 - INFO - __main__ - Step 4927: {'lr': 8.186666666666667e-05, 'samples': 157664, 'steps': 307, 'loss/train': 5.495339393615723} -09/20/2021 15:33:17 - INFO - __main__ - Step 4928: {'lr': 8.186666666666667e-05, 'samples': 157696, 'steps': 307, 'loss/train': 4.254512786865234} -09/20/2021 15:33:17 - INFO - __main__ - Step 4929: {'lr': 8.213333333333334e-05, 'samples': 157728, 'steps': 308, 'loss/train': 4.912678241729736} -09/20/2021 15:33:18 - INFO - __main__ - Step 4930: {'lr': 8.213333333333334e-05, 'samples': 157760, 'steps': 308, 'loss/train': 5.342695236206055} -09/20/2021 15:33:19 - INFO - __main__ - Step 4931: {'lr': 8.213333333333334e-05, 'samples': 157792, 'steps': 308, 'loss/train': 5.931067943572998} -09/20/2021 15:33:20 - INFO - __main__ - Step 4932: {'lr': 8.213333333333334e-05, 'samples': 157824, 'steps': 308, 'loss/train': 5.470242977142334} -09/20/2021 15:33:20 - INFO - __main__ - Step 4933: {'lr': 8.213333333333334e-05, 'samples': 157856, 'steps': 308, 'loss/train': 5.573367595672607} -09/20/2021 15:33:21 - INFO - __main__ - Step 4934: {'lr': 8.213333333333334e-05, 'samples': 157888, 'steps': 308, 'loss/train': 6.6168131828308105} -09/20/2021 15:33:22 - INFO - __main__ - Step 4935: {'lr': 8.213333333333334e-05, 'samples': 157920, 'steps': 308, 'loss/train': 5.035292625427246} -09/20/2021 15:33:23 - INFO - __main__ - Step 4936: {'lr': 8.213333333333334e-05, 'samples': 157952, 'steps': 308, 'loss/train': 5.679954528808594} -09/20/2021 15:33:23 - INFO - __main__ - Step 4937: {'lr': 8.213333333333334e-05, 'samples': 157984, 'steps': 308, 'loss/train': 6.638424873352051} -09/20/2021 15:33:25 - INFO - __main__ - Step 4938: {'lr': 8.213333333333334e-05, 'samples': 158016, 'steps': 308, 'loss/train': 5.828599452972412} -09/20/2021 15:33:26 - INFO - __main__ - Step 4939: {'lr': 8.213333333333334e-05, 'samples': 158048, 'steps': 308, 'loss/train': 4.679985046386719} -09/20/2021 15:33:27 - INFO - __main__ - Step 4940: {'lr': 8.213333333333334e-05, 'samples': 158080, 'steps': 308, 'loss/train': 5.195011615753174} -09/20/2021 15:33:27 - INFO - __main__ - Step 4941: {'lr': 8.213333333333334e-05, 'samples': 158112, 'steps': 308, 'loss/train': 4.524921894073486} -09/20/2021 15:33:28 - INFO - __main__ - Step 4942: {'lr': 8.213333333333334e-05, 'samples': 158144, 'steps': 308, 'loss/train': 5.4266581535339355} -09/20/2021 15:33:29 - INFO - __main__ - Step 4943: {'lr': 8.213333333333334e-05, 'samples': 158176, 'steps': 308, 'loss/train': 5.08497953414917} -09/20/2021 15:33:30 - INFO - __main__ - Step 4944: {'lr': 8.213333333333334e-05, 'samples': 158208, 'steps': 308, 'loss/train': 5.977057933807373} -09/20/2021 15:33:30 - INFO - __main__ - Step 4945: {'lr': 8.24e-05, 'samples': 158240, 'steps': 309, 'loss/train': 5.19895076751709} -09/20/2021 15:33:31 - INFO - __main__ - Step 4946: {'lr': 8.24e-05, 'samples': 158272, 'steps': 309, 'loss/train': 4.899035930633545} -09/20/2021 15:33:32 - INFO - __main__ - Step 4947: {'lr': 8.24e-05, 'samples': 158304, 'steps': 309, 'loss/train': 4.726512908935547} -09/20/2021 15:33:33 - INFO - __main__ - Step 4948: {'lr': 8.24e-05, 'samples': 158336, 'steps': 309, 'loss/train': 4.714048385620117} -09/20/2021 15:33:33 - INFO - __main__ - Step 4949: {'lr': 8.24e-05, 'samples': 158368, 'steps': 309, 'loss/train': 4.1461968421936035} -09/20/2021 15:33:34 - INFO - __main__ - Step 4950: {'lr': 8.24e-05, 'samples': 158400, 'steps': 309, 'loss/train': 4.344832420349121} -09/20/2021 15:33:35 - INFO - __main__ - Step 4951: {'lr': 8.24e-05, 'samples': 158432, 'steps': 309, 'loss/train': 4.653172492980957} -09/20/2021 15:33:36 - INFO - __main__ - Step 4952: {'lr': 8.24e-05, 'samples': 158464, 'steps': 309, 'loss/train': 4.448892116546631} -09/20/2021 15:33:36 - INFO - __main__ - Step 4953: {'lr': 8.24e-05, 'samples': 158496, 'steps': 309, 'loss/train': 3.9997432231903076} -09/20/2021 15:33:37 - INFO - __main__ - Step 4954: {'lr': 8.24e-05, 'samples': 158528, 'steps': 309, 'loss/train': 5.4322309494018555} -09/20/2021 15:33:38 - INFO - __main__ - Step 4955: {'lr': 8.24e-05, 'samples': 158560, 'steps': 309, 'loss/train': 5.055183410644531} -09/20/2021 15:33:39 - INFO - __main__ - Step 4956: {'lr': 8.24e-05, 'samples': 158592, 'steps': 309, 'loss/train': 5.215583801269531} -09/20/2021 15:33:39 - INFO - __main__ - Step 4957: {'lr': 8.24e-05, 'samples': 158624, 'steps': 309, 'loss/train': 5.26240873336792} -09/20/2021 15:33:40 - INFO - __main__ - Step 4958: {'lr': 8.24e-05, 'samples': 158656, 'steps': 309, 'loss/train': 5.267985820770264} -09/20/2021 15:33:41 - INFO - __main__ - Step 4959: {'lr': 8.24e-05, 'samples': 158688, 'steps': 309, 'loss/train': 5.895720481872559} -09/20/2021 15:33:42 - INFO - __main__ - Step 4960: {'lr': 8.24e-05, 'samples': 158720, 'steps': 309, 'loss/train': 5.652649402618408} -09/20/2021 15:33:43 - INFO - __main__ - Step 4961: {'lr': 8.266666666666667e-05, 'samples': 158752, 'steps': 310, 'loss/train': 6.450252532958984} -09/20/2021 15:33:43 - INFO - __main__ - Step 4962: {'lr': 8.266666666666667e-05, 'samples': 158784, 'steps': 310, 'loss/train': 4.978530406951904} -09/20/2021 15:33:44 - INFO - __main__ - Step 4963: {'lr': 8.266666666666667e-05, 'samples': 158816, 'steps': 310, 'loss/train': 6.55708646774292} -09/20/2021 15:33:45 - INFO - __main__ - Step 4964: {'lr': 8.266666666666667e-05, 'samples': 158848, 'steps': 310, 'loss/train': 5.69425630569458} -09/20/2021 15:33:46 - INFO - __main__ - Step 4965: {'lr': 8.266666666666667e-05, 'samples': 158880, 'steps': 310, 'loss/train': 6.182365417480469} -09/20/2021 15:33:46 - INFO - __main__ - Step 4966: {'lr': 8.266666666666667e-05, 'samples': 158912, 'steps': 310, 'loss/train': 5.273046016693115} -09/20/2021 15:33:47 - INFO - __main__ - Step 4967: {'lr': 8.266666666666667e-05, 'samples': 158944, 'steps': 310, 'loss/train': 5.322258949279785} -09/20/2021 15:33:48 - INFO - __main__ - Step 4968: {'lr': 8.266666666666667e-05, 'samples': 158976, 'steps': 310, 'loss/train': 5.940856456756592} -09/20/2021 15:33:49 - INFO - __main__ - Step 4969: {'lr': 8.266666666666667e-05, 'samples': 159008, 'steps': 310, 'loss/train': 5.259368419647217} -09/20/2021 15:33:49 - INFO - __main__ - Step 4970: {'lr': 8.266666666666667e-05, 'samples': 159040, 'steps': 310, 'loss/train': 5.175925254821777} -09/20/2021 15:33:50 - INFO - __main__ - Step 4971: {'lr': 8.266666666666667e-05, 'samples': 159072, 'steps': 310, 'loss/train': 5.471467018127441} -09/20/2021 15:33:52 - INFO - __main__ - Step 4972: {'lr': 8.266666666666667e-05, 'samples': 159104, 'steps': 310, 'loss/train': 5.409620761871338} -09/20/2021 15:33:53 - INFO - __main__ - Step 4973: {'lr': 8.266666666666667e-05, 'samples': 159136, 'steps': 310, 'loss/train': 5.490121364593506} -09/20/2021 15:33:53 - INFO - __main__ - Step 4974: {'lr': 8.266666666666667e-05, 'samples': 159168, 'steps': 310, 'loss/train': 4.380381107330322} -09/20/2021 15:33:54 - INFO - __main__ - Step 4975: {'lr': 8.266666666666667e-05, 'samples': 159200, 'steps': 310, 'loss/train': 5.407658100128174} -09/20/2021 15:33:55 - INFO - __main__ - Step 4976: {'lr': 8.266666666666667e-05, 'samples': 159232, 'steps': 310, 'loss/train': 4.901230335235596} -09/20/2021 15:33:56 - INFO - __main__ - Step 4977: {'lr': 8.293333333333333e-05, 'samples': 159264, 'steps': 311, 'loss/train': 5.070281505584717} -09/20/2021 15:33:56 - INFO - __main__ - Step 4978: {'lr': 8.293333333333333e-05, 'samples': 159296, 'steps': 311, 'loss/train': 5.463735580444336} -09/20/2021 15:33:57 - INFO - __main__ - Step 4979: {'lr': 8.293333333333333e-05, 'samples': 159328, 'steps': 311, 'loss/train': 4.545314788818359} -09/20/2021 15:33:58 - INFO - __main__ - Step 4980: {'lr': 8.293333333333333e-05, 'samples': 159360, 'steps': 311, 'loss/train': 5.495726585388184} -09/20/2021 15:33:59 - INFO - __main__ - Step 4981: {'lr': 8.293333333333333e-05, 'samples': 159392, 'steps': 311, 'loss/train': 4.948739051818848} -09/20/2021 15:33:59 - INFO - __main__ - Step 4982: {'lr': 8.293333333333333e-05, 'samples': 159424, 'steps': 311, 'loss/train': 5.662156581878662} -09/20/2021 15:34:00 - INFO - __main__ - Step 4983: {'lr': 8.293333333333333e-05, 'samples': 159456, 'steps': 311, 'loss/train': 4.769741058349609} -09/20/2021 15:34:01 - INFO - __main__ - Step 4984: {'lr': 8.293333333333333e-05, 'samples': 159488, 'steps': 311, 'loss/train': 5.812058925628662} -09/20/2021 15:34:02 - INFO - __main__ - Step 4985: {'lr': 8.293333333333333e-05, 'samples': 159520, 'steps': 311, 'loss/train': 5.587367057800293} -09/20/2021 15:34:02 - INFO - __main__ - Step 4986: {'lr': 8.293333333333333e-05, 'samples': 159552, 'steps': 311, 'loss/train': 5.391585826873779} -09/20/2021 15:34:03 - INFO - __main__ - Step 4987: {'lr': 8.293333333333333e-05, 'samples': 159584, 'steps': 311, 'loss/train': 6.141360759735107} -09/20/2021 15:34:04 - INFO - __main__ - Step 4988: {'lr': 8.293333333333333e-05, 'samples': 159616, 'steps': 311, 'loss/train': 6.083409786224365} -09/20/2021 15:34:05 - INFO - __main__ - Step 4989: {'lr': 8.293333333333333e-05, 'samples': 159648, 'steps': 311, 'loss/train': 5.6486897468566895} -09/20/2021 15:34:05 - INFO - __main__ - Step 4990: {'lr': 8.293333333333333e-05, 'samples': 159680, 'steps': 311, 'loss/train': 7.16287088394165} -09/20/2021 15:34:06 - INFO - __main__ - Step 4991: {'lr': 8.293333333333333e-05, 'samples': 159712, 'steps': 311, 'loss/train': 7.126363277435303} -09/20/2021 15:34:07 - INFO - __main__ - Step 4992: {'lr': 8.293333333333333e-05, 'samples': 159744, 'steps': 311, 'loss/train': 5.469630241394043} -09/20/2021 15:34:08 - INFO - __main__ - Step 4993: {'lr': 8.32e-05, 'samples': 159776, 'steps': 312, 'loss/train': 5.122842311859131} -09/20/2021 15:34:09 - INFO - __main__ - Step 4994: {'lr': 8.32e-05, 'samples': 159808, 'steps': 312, 'loss/train': 6.134239673614502} -09/20/2021 15:34:09 - INFO - __main__ - Step 4995: {'lr': 8.32e-05, 'samples': 159840, 'steps': 312, 'loss/train': 6.646216869354248} -09/20/2021 15:34:10 - INFO - __main__ - Step 4996: {'lr': 8.32e-05, 'samples': 159872, 'steps': 312, 'loss/train': 6.411255359649658} -09/20/2021 15:34:11 - INFO - __main__ - Step 4997: {'lr': 8.32e-05, 'samples': 159904, 'steps': 312, 'loss/train': 5.434847354888916} -09/20/2021 15:34:12 - INFO - __main__ - Step 4998: {'lr': 8.32e-05, 'samples': 159936, 'steps': 312, 'loss/train': 5.394834041595459} -09/20/2021 15:34:12 - INFO - __main__ - Step 4999: {'lr': 8.32e-05, 'samples': 159968, 'steps': 312, 'loss/train': 6.0742645263671875} -09/20/2021 15:34:13 - INFO - __main__ - Step 5000: {'lr': 8.32e-05, 'samples': 160000, 'steps': 312, 'loss/train': 5.245609283447266} -09/20/2021 15:34:14 - INFO - __main__ - Step 5001: {'lr': 8.32e-05, 'samples': 160032, 'steps': 312, 'loss/train': 6.459341049194336} -09/20/2021 15:34:15 - INFO - __main__ - Step 5002: {'lr': 8.32e-05, 'samples': 160064, 'steps': 312, 'loss/train': 5.847132205963135} -09/20/2021 15:34:15 - INFO - __main__ - Step 5003: {'lr': 8.32e-05, 'samples': 160096, 'steps': 312, 'loss/train': 5.143341064453125} -09/20/2021 15:34:17 - INFO - __main__ - Step 5004: {'lr': 8.32e-05, 'samples': 160128, 'steps': 312, 'loss/train': 5.318739891052246} -09/20/2021 15:34:17 - INFO - __main__ - Step 5005: {'lr': 8.32e-05, 'samples': 160160, 'steps': 312, 'loss/train': 5.808629989624023} -09/20/2021 15:34:18 - INFO - __main__ - Step 5006: {'lr': 8.32e-05, 'samples': 160192, 'steps': 312, 'loss/train': 6.23284912109375} -09/20/2021 15:34:19 - INFO - __main__ - Step 5007: {'lr': 8.32e-05, 'samples': 160224, 'steps': 312, 'loss/train': 4.717723846435547} -09/20/2021 15:34:20 - INFO - __main__ - Step 5008: {'lr': 8.32e-05, 'samples': 160256, 'steps': 312, 'loss/train': 5.771354675292969} -09/20/2021 15:34:20 - INFO - __main__ - Step 5009: {'lr': 8.346666666666667e-05, 'samples': 160288, 'steps': 313, 'loss/train': 5.538119316101074} -09/20/2021 15:34:21 - INFO - __main__ - Step 5010: {'lr': 8.346666666666667e-05, 'samples': 160320, 'steps': 313, 'loss/train': 5.28618860244751} -09/20/2021 15:34:22 - INFO - __main__ - Step 5011: {'lr': 8.346666666666667e-05, 'samples': 160352, 'steps': 313, 'loss/train': 5.437012672424316} -09/20/2021 15:34:23 - INFO - __main__ - Step 5012: {'lr': 8.346666666666667e-05, 'samples': 160384, 'steps': 313, 'loss/train': 5.523421764373779} -09/20/2021 15:34:23 - INFO - __main__ - Step 5013: {'lr': 8.346666666666667e-05, 'samples': 160416, 'steps': 313, 'loss/train': 5.835803508758545} -09/20/2021 15:34:24 - INFO - __main__ - Step 5014: {'lr': 8.346666666666667e-05, 'samples': 160448, 'steps': 313, 'loss/train': 6.6528096199035645} -09/20/2021 15:34:25 - INFO - __main__ - Step 5015: {'lr': 8.346666666666667e-05, 'samples': 160480, 'steps': 313, 'loss/train': 5.188760280609131} -09/20/2021 15:34:26 - INFO - __main__ - Step 5016: {'lr': 8.346666666666667e-05, 'samples': 160512, 'steps': 313, 'loss/train': 4.725438117980957} -09/20/2021 15:34:26 - INFO - __main__ - Step 5017: {'lr': 8.346666666666667e-05, 'samples': 160544, 'steps': 313, 'loss/train': 5.2730631828308105} -09/20/2021 15:34:27 - INFO - __main__ - Step 5018: {'lr': 8.346666666666667e-05, 'samples': 160576, 'steps': 313, 'loss/train': 5.29691219329834} -09/20/2021 15:34:28 - INFO - __main__ - Step 5019: {'lr': 8.346666666666667e-05, 'samples': 160608, 'steps': 313, 'loss/train': 5.405783176422119} -09/20/2021 15:34:29 - INFO - __main__ - Step 5020: {'lr': 8.346666666666667e-05, 'samples': 160640, 'steps': 313, 'loss/train': 5.385033130645752} -09/20/2021 15:34:29 - INFO - __main__ - Step 5021: {'lr': 8.346666666666667e-05, 'samples': 160672, 'steps': 313, 'loss/train': 5.711709499359131} -09/20/2021 15:34:30 - INFO - __main__ - Step 5022: {'lr': 8.346666666666667e-05, 'samples': 160704, 'steps': 313, 'loss/train': 5.824969291687012} -09/20/2021 15:34:31 - INFO - __main__ - Step 5023: {'lr': 8.346666666666667e-05, 'samples': 160736, 'steps': 313, 'loss/train': 4.993965148925781} -09/20/2021 15:34:32 - INFO - __main__ - Step 5024: {'lr': 8.346666666666667e-05, 'samples': 160768, 'steps': 313, 'loss/train': 5.512783050537109} -09/20/2021 15:34:33 - INFO - __main__ - Step 5025: {'lr': 8.373333333333334e-05, 'samples': 160800, 'steps': 314, 'loss/train': 4.335443496704102} -09/20/2021 15:34:33 - INFO - __main__ - Step 5026: {'lr': 8.373333333333334e-05, 'samples': 160832, 'steps': 314, 'loss/train': 5.237396717071533} -09/20/2021 15:34:34 - INFO - __main__ - Step 5027: {'lr': 8.373333333333334e-05, 'samples': 160864, 'steps': 314, 'loss/train': 5.570058345794678} -09/20/2021 15:34:35 - INFO - __main__ - Step 5028: {'lr': 8.373333333333334e-05, 'samples': 160896, 'steps': 314, 'loss/train': 6.2638750076293945} -09/20/2021 15:34:36 - INFO - __main__ - Step 5029: {'lr': 8.373333333333334e-05, 'samples': 160928, 'steps': 314, 'loss/train': 5.585598945617676} -09/20/2021 15:34:36 - INFO - __main__ - Step 5030: {'lr': 8.373333333333334e-05, 'samples': 160960, 'steps': 314, 'loss/train': 4.912350177764893} -09/20/2021 15:34:37 - INFO - __main__ - Step 5031: {'lr': 8.373333333333334e-05, 'samples': 160992, 'steps': 314, 'loss/train': 6.322399139404297} -09/20/2021 15:34:38 - INFO - __main__ - Step 5032: {'lr': 8.373333333333334e-05, 'samples': 161024, 'steps': 314, 'loss/train': 5.1755290031433105} -09/20/2021 15:34:39 - INFO - __main__ - Step 5033: {'lr': 8.373333333333334e-05, 'samples': 161056, 'steps': 314, 'loss/train': 5.260529518127441} -09/20/2021 15:34:40 - INFO - __main__ - Step 5034: {'lr': 8.373333333333334e-05, 'samples': 161088, 'steps': 314, 'loss/train': 5.568716049194336} -09/20/2021 15:34:41 - INFO - __main__ - Step 5035: {'lr': 8.373333333333334e-05, 'samples': 161120, 'steps': 314, 'loss/train': 4.194021701812744} -09/20/2021 15:34:41 - INFO - __main__ - Step 5036: {'lr': 8.373333333333334e-05, 'samples': 161152, 'steps': 314, 'loss/train': 4.787336826324463} -09/20/2021 15:34:42 - INFO - __main__ - Step 5037: {'lr': 8.373333333333334e-05, 'samples': 161184, 'steps': 314, 'loss/train': 5.1836323738098145} -09/20/2021 15:34:43 - INFO - __main__ - Step 5038: {'lr': 8.373333333333334e-05, 'samples': 161216, 'steps': 314, 'loss/train': 4.7610931396484375} -09/20/2021 15:34:44 - INFO - __main__ - Step 5039: {'lr': 8.373333333333334e-05, 'samples': 161248, 'steps': 314, 'loss/train': 6.322079658508301} -09/20/2021 15:34:44 - INFO - __main__ - Step 5040: {'lr': 8.373333333333334e-05, 'samples': 161280, 'steps': 314, 'loss/train': 5.5370354652404785} -09/20/2021 15:34:45 - INFO - __main__ - Step 5041: {'lr': 8.4e-05, 'samples': 161312, 'steps': 315, 'loss/train': 4.721248149871826} -09/20/2021 15:34:46 - INFO - __main__ - Step 5042: {'lr': 8.4e-05, 'samples': 161344, 'steps': 315, 'loss/train': 5.199637413024902} -09/20/2021 15:34:47 - INFO - __main__ - Step 5043: {'lr': 8.4e-05, 'samples': 161376, 'steps': 315, 'loss/train': 5.113504409790039} -09/20/2021 15:34:48 - INFO - __main__ - Step 5044: {'lr': 8.4e-05, 'samples': 161408, 'steps': 315, 'loss/train': 5.96085786819458} -09/20/2021 15:34:48 - INFO - __main__ - Step 5045: {'lr': 8.4e-05, 'samples': 161440, 'steps': 315, 'loss/train': 5.497251033782959} -09/20/2021 15:34:49 - INFO - __main__ - Step 5046: {'lr': 8.4e-05, 'samples': 161472, 'steps': 315, 'loss/train': 5.924946308135986} -09/20/2021 15:34:50 - INFO - __main__ - Step 5047: {'lr': 8.4e-05, 'samples': 161504, 'steps': 315, 'loss/train': 5.515246391296387} -09/20/2021 15:34:51 - INFO - __main__ - Step 5048: {'lr': 8.4e-05, 'samples': 161536, 'steps': 315, 'loss/train': 6.943782329559326} -09/20/2021 15:34:51 - INFO - __main__ - Step 5049: {'lr': 8.4e-05, 'samples': 161568, 'steps': 315, 'loss/train': 6.021889686584473} -09/20/2021 15:34:52 - INFO - __main__ - Step 5050: {'lr': 8.4e-05, 'samples': 161600, 'steps': 315, 'loss/train': 5.0048346519470215} -09/20/2021 15:34:53 - INFO - __main__ - Step 5051: {'lr': 8.4e-05, 'samples': 161632, 'steps': 315, 'loss/train': 2.972905158996582} -09/20/2021 15:34:54 - INFO - __main__ - Step 5052: {'lr': 8.4e-05, 'samples': 161664, 'steps': 315, 'loss/train': 5.529110431671143} -09/20/2021 15:34:54 - INFO - __main__ - Step 5053: {'lr': 8.4e-05, 'samples': 161696, 'steps': 315, 'loss/train': 6.171061992645264} -09/20/2021 15:34:55 - INFO - __main__ - Step 5054: {'lr': 8.4e-05, 'samples': 161728, 'steps': 315, 'loss/train': 4.817800521850586} -09/20/2021 15:34:56 - INFO - __main__ - Step 5055: {'lr': 8.4e-05, 'samples': 161760, 'steps': 315, 'loss/train': 5.964092254638672} -09/20/2021 15:34:57 - INFO - __main__ - Step 5056: {'lr': 8.4e-05, 'samples': 161792, 'steps': 315, 'loss/train': 5.8363776206970215} -09/20/2021 15:34:57 - INFO - __main__ - Step 5057: {'lr': 8.426666666666668e-05, 'samples': 161824, 'steps': 316, 'loss/train': 6.171299457550049} -09/20/2021 15:34:58 - INFO - __main__ - Step 5058: {'lr': 8.426666666666668e-05, 'samples': 161856, 'steps': 316, 'loss/train': 3.8766391277313232} -09/20/2021 15:34:59 - INFO - __main__ - Step 5059: {'lr': 8.426666666666668e-05, 'samples': 161888, 'steps': 316, 'loss/train': 5.624577045440674} -09/20/2021 15:35:00 - INFO - __main__ - Step 5060: {'lr': 8.426666666666668e-05, 'samples': 161920, 'steps': 316, 'loss/train': 4.875378608703613} -09/20/2021 15:35:00 - INFO - __main__ - Step 5061: {'lr': 8.426666666666668e-05, 'samples': 161952, 'steps': 316, 'loss/train': 5.318624019622803} -09/20/2021 15:35:01 - INFO - __main__ - Step 5062: {'lr': 8.426666666666668e-05, 'samples': 161984, 'steps': 316, 'loss/train': 5.119989395141602} -09/20/2021 15:35:02 - INFO - __main__ - Step 5063: {'lr': 8.426666666666668e-05, 'samples': 162016, 'steps': 316, 'loss/train': 5.734781742095947} -09/20/2021 15:35:03 - INFO - __main__ - Step 5064: {'lr': 8.426666666666668e-05, 'samples': 162048, 'steps': 316, 'loss/train': 5.15579080581665} -09/20/2021 15:35:03 - INFO - __main__ - Step 5065: {'lr': 8.426666666666668e-05, 'samples': 162080, 'steps': 316, 'loss/train': 3.355437755584717} -09/20/2021 15:35:05 - INFO - __main__ - Step 5066: {'lr': 8.426666666666668e-05, 'samples': 162112, 'steps': 316, 'loss/train': 5.987334251403809} -09/20/2021 15:35:05 - INFO - __main__ - Step 5067: {'lr': 8.426666666666668e-05, 'samples': 162144, 'steps': 316, 'loss/train': 5.735702037811279} -09/20/2021 15:35:06 - INFO - __main__ - Step 5068: {'lr': 8.426666666666668e-05, 'samples': 162176, 'steps': 316, 'loss/train': 5.8129706382751465} -09/20/2021 15:35:07 - INFO - __main__ - Step 5069: {'lr': 8.426666666666668e-05, 'samples': 162208, 'steps': 316, 'loss/train': 5.04066276550293} -09/20/2021 15:35:08 - INFO - __main__ - Step 5070: {'lr': 8.426666666666668e-05, 'samples': 162240, 'steps': 316, 'loss/train': 5.633821487426758} -09/20/2021 15:35:08 - INFO - __main__ - Step 5071: {'lr': 8.426666666666668e-05, 'samples': 162272, 'steps': 316, 'loss/train': 5.705963134765625} -09/20/2021 15:35:09 - INFO - __main__ - Step 5072: {'lr': 8.426666666666668e-05, 'samples': 162304, 'steps': 316, 'loss/train': 5.335928916931152} -09/20/2021 15:35:10 - INFO - __main__ - Step 5073: {'lr': 8.453333333333335e-05, 'samples': 162336, 'steps': 317, 'loss/train': 5.779125213623047} -09/20/2021 15:35:11 - INFO - __main__ - Step 5074: {'lr': 8.453333333333335e-05, 'samples': 162368, 'steps': 317, 'loss/train': 7.122903823852539} -09/20/2021 15:35:12 - INFO - __main__ - Step 5075: {'lr': 8.453333333333335e-05, 'samples': 162400, 'steps': 317, 'loss/train': 6.390419006347656} -09/20/2021 15:35:12 - INFO - __main__ - Step 5076: {'lr': 8.453333333333335e-05, 'samples': 162432, 'steps': 317, 'loss/train': 5.3561015129089355} -09/20/2021 15:35:13 - INFO - __main__ - Step 5077: {'lr': 8.453333333333335e-05, 'samples': 162464, 'steps': 317, 'loss/train': 5.134406566619873} -09/20/2021 15:35:14 - INFO - __main__ - Step 5078: {'lr': 8.453333333333335e-05, 'samples': 162496, 'steps': 317, 'loss/train': 5.356337070465088} -09/20/2021 15:35:15 - INFO - __main__ - Step 5079: {'lr': 8.453333333333335e-05, 'samples': 162528, 'steps': 317, 'loss/train': 5.404959201812744} -09/20/2021 15:35:15 - INFO - __main__ - Step 5080: {'lr': 8.453333333333335e-05, 'samples': 162560, 'steps': 317, 'loss/train': 5.462782382965088} -09/20/2021 15:35:16 - INFO - __main__ - Step 5081: {'lr': 8.453333333333335e-05, 'samples': 162592, 'steps': 317, 'loss/train': 4.7108049392700195} -09/20/2021 15:35:17 - INFO - __main__ - Step 5082: {'lr': 8.453333333333335e-05, 'samples': 162624, 'steps': 317, 'loss/train': 5.215411186218262} -09/20/2021 15:35:18 - INFO - __main__ - Step 5083: {'lr': 8.453333333333335e-05, 'samples': 162656, 'steps': 317, 'loss/train': 4.436779022216797} -09/20/2021 15:35:18 - INFO - __main__ - Step 5084: {'lr': 8.453333333333335e-05, 'samples': 162688, 'steps': 317, 'loss/train': 5.0834527015686035} -09/20/2021 15:35:19 - INFO - __main__ - Step 5085: {'lr': 8.453333333333335e-05, 'samples': 162720, 'steps': 317, 'loss/train': 4.857250690460205} -09/20/2021 15:35:20 - INFO - __main__ - Step 5086: {'lr': 8.453333333333335e-05, 'samples': 162752, 'steps': 317, 'loss/train': 4.949643135070801} -09/20/2021 15:35:21 - INFO - __main__ - Step 5087: {'lr': 8.453333333333335e-05, 'samples': 162784, 'steps': 317, 'loss/train': 5.7210469245910645} -09/20/2021 15:35:21 - INFO - __main__ - Step 5088: {'lr': 8.453333333333335e-05, 'samples': 162816, 'steps': 317, 'loss/train': 5.2745842933654785} -09/20/2021 15:35:22 - INFO - __main__ - Step 5089: {'lr': 8.48e-05, 'samples': 162848, 'steps': 318, 'loss/train': 5.524744033813477} -09/20/2021 15:35:23 - INFO - __main__ - Step 5090: {'lr': 8.48e-05, 'samples': 162880, 'steps': 318, 'loss/train': 4.9716691970825195} -09/20/2021 15:35:24 - INFO - __main__ - Step 5091: {'lr': 8.48e-05, 'samples': 162912, 'steps': 318, 'loss/train': 5.205618381500244} -09/20/2021 15:35:25 - INFO - __main__ - Step 5092: {'lr': 8.48e-05, 'samples': 162944, 'steps': 318, 'loss/train': 5.3136091232299805} -09/20/2021 15:35:25 - INFO - __main__ - Step 5093: {'lr': 8.48e-05, 'samples': 162976, 'steps': 318, 'loss/train': 5.380957126617432} -09/20/2021 15:35:26 - INFO - __main__ - Step 5094: {'lr': 8.48e-05, 'samples': 163008, 'steps': 318, 'loss/train': 5.0631794929504395} -09/20/2021 15:35:27 - INFO - __main__ - Step 5095: {'lr': 8.48e-05, 'samples': 163040, 'steps': 318, 'loss/train': 5.422647476196289} -09/20/2021 15:35:28 - INFO - __main__ - Step 5096: {'lr': 8.48e-05, 'samples': 163072, 'steps': 318, 'loss/train': 5.732766628265381} -09/20/2021 15:35:28 - INFO - __main__ - Step 5097: {'lr': 8.48e-05, 'samples': 163104, 'steps': 318, 'loss/train': 5.442637920379639} -09/20/2021 15:35:30 - INFO - __main__ - Step 5098: {'lr': 8.48e-05, 'samples': 163136, 'steps': 318, 'loss/train': 5.624783515930176} -09/20/2021 15:35:30 - INFO - __main__ - Step 5099: {'lr': 8.48e-05, 'samples': 163168, 'steps': 318, 'loss/train': 5.599978446960449} -09/20/2021 15:35:31 - INFO - __main__ - Step 5100: {'lr': 8.48e-05, 'samples': 163200, 'steps': 318, 'loss/train': 5.061368942260742} -09/20/2021 15:35:32 - INFO - __main__ - Step 5101: {'lr': 8.48e-05, 'samples': 163232, 'steps': 318, 'loss/train': 3.7235727310180664} -09/20/2021 15:35:33 - INFO - __main__ - Step 5102: {'lr': 8.48e-05, 'samples': 163264, 'steps': 318, 'loss/train': 5.246706485748291} -09/20/2021 15:35:33 - INFO - __main__ - Step 5103: {'lr': 8.48e-05, 'samples': 163296, 'steps': 318, 'loss/train': 6.00968074798584} -09/20/2021 15:35:34 - INFO - __main__ - Step 5104: {'lr': 8.48e-05, 'samples': 163328, 'steps': 318, 'loss/train': 5.607043266296387} -09/20/2021 15:35:35 - INFO - __main__ - Step 5105: {'lr': 8.506666666666667e-05, 'samples': 163360, 'steps': 319, 'loss/train': 5.627413749694824} -09/20/2021 15:35:36 - INFO - __main__ - Step 5106: {'lr': 8.506666666666667e-05, 'samples': 163392, 'steps': 319, 'loss/train': 5.118913173675537} -09/20/2021 15:35:36 - INFO - __main__ - Step 5107: {'lr': 8.506666666666667e-05, 'samples': 163424, 'steps': 319, 'loss/train': 5.470493316650391} -09/20/2021 15:35:37 - INFO - __main__ - Step 5108: {'lr': 8.506666666666667e-05, 'samples': 163456, 'steps': 319, 'loss/train': 6.350721836090088} -09/20/2021 15:35:38 - INFO - __main__ - Step 5109: {'lr': 8.506666666666667e-05, 'samples': 163488, 'steps': 319, 'loss/train': 4.359514236450195} -09/20/2021 15:35:39 - INFO - __main__ - Step 5110: {'lr': 8.506666666666667e-05, 'samples': 163520, 'steps': 319, 'loss/train': 5.8953776359558105} -09/20/2021 15:35:40 - INFO - __main__ - Step 5111: {'lr': 8.506666666666667e-05, 'samples': 163552, 'steps': 319, 'loss/train': 5.253284454345703} -09/20/2021 15:35:40 - INFO - __main__ - Step 5112: {'lr': 8.506666666666667e-05, 'samples': 163584, 'steps': 319, 'loss/train': 4.691274642944336} -09/20/2021 15:35:41 - INFO - __main__ - Step 5113: {'lr': 8.506666666666667e-05, 'samples': 163616, 'steps': 319, 'loss/train': 5.58586311340332} -09/20/2021 15:35:42 - INFO - __main__ - Step 5114: {'lr': 8.506666666666667e-05, 'samples': 163648, 'steps': 319, 'loss/train': 6.0749735832214355} -09/20/2021 15:35:43 - INFO - __main__ - Step 5115: {'lr': 8.506666666666667e-05, 'samples': 163680, 'steps': 319, 'loss/train': 4.7787675857543945} -09/20/2021 15:35:43 - INFO - __main__ - Step 5116: {'lr': 8.506666666666667e-05, 'samples': 163712, 'steps': 319, 'loss/train': 5.538918495178223} -09/20/2021 15:35:44 - INFO - __main__ - Step 5117: {'lr': 8.506666666666667e-05, 'samples': 163744, 'steps': 319, 'loss/train': 2.6033873558044434} -09/20/2021 15:35:45 - INFO - __main__ - Step 5118: {'lr': 8.506666666666667e-05, 'samples': 163776, 'steps': 319, 'loss/train': 4.180036544799805} -09/20/2021 15:35:46 - INFO - __main__ - Step 5119: {'lr': 8.506666666666667e-05, 'samples': 163808, 'steps': 319, 'loss/train': 5.460844039916992} -09/20/2021 15:35:46 - INFO - __main__ - Step 5120: {'lr': 8.506666666666667e-05, 'samples': 163840, 'steps': 319, 'loss/train': 6.003149032592773} -09/20/2021 15:35:47 - INFO - __main__ - Step 5121: {'lr': 8.533333333333334e-05, 'samples': 163872, 'steps': 320, 'loss/train': 5.5347723960876465} -09/20/2021 15:35:48 - INFO - __main__ - Step 5122: {'lr': 8.533333333333334e-05, 'samples': 163904, 'steps': 320, 'loss/train': 5.986757755279541} -09/20/2021 15:35:49 - INFO - __main__ - Step 5123: {'lr': 8.533333333333334e-05, 'samples': 163936, 'steps': 320, 'loss/train': 5.390974044799805} -09/20/2021 15:35:49 - INFO - __main__ - Step 5124: {'lr': 8.533333333333334e-05, 'samples': 163968, 'steps': 320, 'loss/train': 6.002465724945068} -09/20/2021 15:35:50 - INFO - __main__ - Step 5125: {'lr': 8.533333333333334e-05, 'samples': 164000, 'steps': 320, 'loss/train': 4.3669047355651855} -09/20/2021 15:35:51 - INFO - __main__ - Step 5126: {'lr': 8.533333333333334e-05, 'samples': 164032, 'steps': 320, 'loss/train': 5.2672343254089355} -09/20/2021 15:35:52 - INFO - __main__ - Step 5127: {'lr': 8.533333333333334e-05, 'samples': 164064, 'steps': 320, 'loss/train': 4.651850700378418} -09/20/2021 15:35:52 - INFO - __main__ - Step 5128: {'lr': 8.533333333333334e-05, 'samples': 164096, 'steps': 320, 'loss/train': 5.360902309417725} -09/20/2021 15:35:54 - INFO - __main__ - Step 5129: {'lr': 8.533333333333334e-05, 'samples': 164128, 'steps': 320, 'loss/train': 6.142908096313477} -09/20/2021 15:35:54 - INFO - __main__ - Step 5130: {'lr': 8.533333333333334e-05, 'samples': 164160, 'steps': 320, 'loss/train': 4.186105728149414} -09/20/2021 15:35:55 - INFO - __main__ - Step 5131: {'lr': 8.533333333333334e-05, 'samples': 164192, 'steps': 320, 'loss/train': 4.799931526184082} -09/20/2021 15:35:56 - INFO - __main__ - Step 5132: {'lr': 8.533333333333334e-05, 'samples': 164224, 'steps': 320, 'loss/train': 5.280296802520752} -09/20/2021 15:35:57 - INFO - __main__ - Step 5133: {'lr': 8.533333333333334e-05, 'samples': 164256, 'steps': 320, 'loss/train': 5.596061706542969} -09/20/2021 15:35:57 - INFO - __main__ - Step 5134: {'lr': 8.533333333333334e-05, 'samples': 164288, 'steps': 320, 'loss/train': 5.267591953277588} -09/20/2021 15:35:58 - INFO - __main__ - Step 5135: {'lr': 8.533333333333334e-05, 'samples': 164320, 'steps': 320, 'loss/train': 0.8359435796737671} -09/20/2021 15:35:59 - INFO - __main__ - Step 5136: {'lr': 8.533333333333334e-05, 'samples': 164352, 'steps': 320, 'loss/train': 4.2832841873168945} -09/20/2021 15:36:00 - INFO - __main__ - Step 5137: {'lr': 8.560000000000001e-05, 'samples': 164384, 'steps': 321, 'loss/train': 4.563912868499756} -09/20/2021 15:36:01 - INFO - __main__ - Step 5138: {'lr': 8.560000000000001e-05, 'samples': 164416, 'steps': 321, 'loss/train': 5.219320297241211} -09/20/2021 15:36:01 - INFO - __main__ - Step 5139: {'lr': 8.560000000000001e-05, 'samples': 164448, 'steps': 321, 'loss/train': 5.057872295379639} -09/20/2021 15:36:02 - INFO - __main__ - Step 5140: {'lr': 8.560000000000001e-05, 'samples': 164480, 'steps': 321, 'loss/train': 5.011388778686523} -09/20/2021 15:36:03 - INFO - __main__ - Step 5141: {'lr': 8.560000000000001e-05, 'samples': 164512, 'steps': 321, 'loss/train': 5.247156143188477} -09/20/2021 15:36:04 - INFO - __main__ - Step 5142: {'lr': 8.560000000000001e-05, 'samples': 164544, 'steps': 321, 'loss/train': 5.219557762145996} -09/20/2021 15:36:04 - INFO - __main__ - Step 5143: {'lr': 8.560000000000001e-05, 'samples': 164576, 'steps': 321, 'loss/train': 5.484218120574951} -09/20/2021 15:36:05 - INFO - __main__ - Step 5144: {'lr': 8.560000000000001e-05, 'samples': 164608, 'steps': 321, 'loss/train': 5.513405799865723} -09/20/2021 15:36:06 - INFO - __main__ - Step 5145: {'lr': 8.560000000000001e-05, 'samples': 164640, 'steps': 321, 'loss/train': 5.329002380371094} -09/20/2021 15:36:07 - INFO - __main__ - Step 5146: {'lr': 8.560000000000001e-05, 'samples': 164672, 'steps': 321, 'loss/train': 4.852018356323242} -09/20/2021 15:36:07 - INFO - __main__ - Step 5147: {'lr': 8.560000000000001e-05, 'samples': 164704, 'steps': 321, 'loss/train': 5.778067588806152} -09/20/2021 15:36:08 - INFO - __main__ - Step 5148: {'lr': 8.560000000000001e-05, 'samples': 164736, 'steps': 321, 'loss/train': 5.266128063201904} -09/20/2021 15:36:09 - INFO - __main__ - Step 5149: {'lr': 8.560000000000001e-05, 'samples': 164768, 'steps': 321, 'loss/train': 5.566220760345459} -09/20/2021 15:36:10 - INFO - __main__ - Step 5150: {'lr': 8.560000000000001e-05, 'samples': 164800, 'steps': 321, 'loss/train': 5.8382039070129395} -09/20/2021 15:36:10 - INFO - __main__ - Step 5151: {'lr': 8.560000000000001e-05, 'samples': 164832, 'steps': 321, 'loss/train': 4.253618240356445} -09/20/2021 15:36:11 - INFO - __main__ - Step 5152: {'lr': 8.560000000000001e-05, 'samples': 164864, 'steps': 321, 'loss/train': 4.986343860626221} -09/20/2021 15:36:12 - INFO - __main__ - Step 5153: {'lr': 8.586666666666668e-05, 'samples': 164896, 'steps': 322, 'loss/train': 6.054279804229736} -09/20/2021 15:36:13 - INFO - __main__ - Step 5154: {'lr': 8.586666666666668e-05, 'samples': 164928, 'steps': 322, 'loss/train': 5.005774974822998} -09/20/2021 15:36:13 - INFO - __main__ - Step 5155: {'lr': 8.586666666666668e-05, 'samples': 164960, 'steps': 322, 'loss/train': 6.666849136352539} -09/20/2021 15:36:14 - INFO - __main__ - Step 5156: {'lr': 8.586666666666668e-05, 'samples': 164992, 'steps': 322, 'loss/train': 5.319088935852051} -09/20/2021 15:36:15 - INFO - __main__ - Step 5157: {'lr': 8.586666666666668e-05, 'samples': 165024, 'steps': 322, 'loss/train': 5.864902019500732} -09/20/2021 15:36:16 - INFO - __main__ - Step 5158: {'lr': 8.586666666666668e-05, 'samples': 165056, 'steps': 322, 'loss/train': 4.877961158752441} -09/20/2021 15:36:16 - INFO - __main__ - Step 5159: {'lr': 8.586666666666668e-05, 'samples': 165088, 'steps': 322, 'loss/train': 5.0973429679870605} -09/20/2021 15:36:18 - INFO - __main__ - Step 5160: {'lr': 8.586666666666668e-05, 'samples': 165120, 'steps': 322, 'loss/train': 6.081110000610352} -09/20/2021 15:36:18 - INFO - __main__ - Step 5161: {'lr': 8.586666666666668e-05, 'samples': 165152, 'steps': 322, 'loss/train': 5.104872226715088} -09/20/2021 15:36:19 - INFO - __main__ - Step 5162: {'lr': 8.586666666666668e-05, 'samples': 165184, 'steps': 322, 'loss/train': 6.567409515380859} -09/20/2021 15:36:20 - INFO - __main__ - Step 5163: {'lr': 8.586666666666668e-05, 'samples': 165216, 'steps': 322, 'loss/train': 7.066905498504639} -09/20/2021 15:36:21 - INFO - __main__ - Step 5164: {'lr': 8.586666666666668e-05, 'samples': 165248, 'steps': 322, 'loss/train': 5.577068328857422} -09/20/2021 15:36:21 - INFO - __main__ - Step 5165: {'lr': 8.586666666666668e-05, 'samples': 165280, 'steps': 322, 'loss/train': 5.3379597663879395} -09/20/2021 15:36:22 - INFO - __main__ - Step 5166: {'lr': 8.586666666666668e-05, 'samples': 165312, 'steps': 322, 'loss/train': 4.981297969818115} -09/20/2021 15:36:23 - INFO - __main__ - Step 5167: {'lr': 8.586666666666668e-05, 'samples': 165344, 'steps': 322, 'loss/train': 5.227582931518555} -09/20/2021 15:36:24 - INFO - __main__ - Step 5168: {'lr': 8.586666666666668e-05, 'samples': 165376, 'steps': 322, 'loss/train': 6.078490257263184} -09/20/2021 15:36:25 - INFO - __main__ - Step 5169: {'lr': 8.613333333333333e-05, 'samples': 165408, 'steps': 323, 'loss/train': 4.923445224761963} -09/20/2021 15:36:25 - INFO - __main__ - Step 5170: {'lr': 8.613333333333333e-05, 'samples': 165440, 'steps': 323, 'loss/train': 5.407360553741455} -09/20/2021 15:36:26 - INFO - __main__ - Step 5171: {'lr': 8.613333333333333e-05, 'samples': 165472, 'steps': 323, 'loss/train': 2.4063544273376465} -09/20/2021 15:36:27 - INFO - __main__ - Step 5172: {'lr': 8.613333333333333e-05, 'samples': 165504, 'steps': 323, 'loss/train': 5.599913597106934} -09/20/2021 15:36:28 - INFO - __main__ - Step 5173: {'lr': 8.613333333333333e-05, 'samples': 165536, 'steps': 323, 'loss/train': 5.922239780426025} -09/20/2021 15:36:28 - INFO - __main__ - Step 5174: {'lr': 8.613333333333333e-05, 'samples': 165568, 'steps': 323, 'loss/train': 6.694727897644043} -09/20/2021 15:36:29 - INFO - __main__ - Step 5175: {'lr': 8.613333333333333e-05, 'samples': 165600, 'steps': 323, 'loss/train': 5.207618236541748} -09/20/2021 15:36:30 - INFO - __main__ - Step 5176: {'lr': 8.613333333333333e-05, 'samples': 165632, 'steps': 323, 'loss/train': 5.450159549713135} -09/20/2021 15:36:31 - INFO - __main__ - Step 5177: {'lr': 8.613333333333333e-05, 'samples': 165664, 'steps': 323, 'loss/train': 5.470453262329102} -09/20/2021 15:36:31 - INFO - __main__ - Step 5178: {'lr': 8.613333333333333e-05, 'samples': 165696, 'steps': 323, 'loss/train': 5.510370254516602} -09/20/2021 15:36:32 - INFO - __main__ - Step 5179: {'lr': 8.613333333333333e-05, 'samples': 165728, 'steps': 323, 'loss/train': 6.0023512840271} -09/20/2021 15:36:33 - INFO - __main__ - Step 5180: {'lr': 8.613333333333333e-05, 'samples': 165760, 'steps': 323, 'loss/train': 5.418008804321289} -09/20/2021 15:36:34 - INFO - __main__ - Step 5181: {'lr': 8.613333333333333e-05, 'samples': 165792, 'steps': 323, 'loss/train': 4.85176420211792} -09/20/2021 15:36:34 - INFO - __main__ - Step 5182: {'lr': 8.613333333333333e-05, 'samples': 165824, 'steps': 323, 'loss/train': 5.309209823608398} -09/20/2021 15:36:35 - INFO - __main__ - Step 5183: {'lr': 8.613333333333333e-05, 'samples': 165856, 'steps': 323, 'loss/train': 4.896228313446045} -09/20/2021 15:36:36 - INFO - __main__ - Step 5184: {'lr': 8.613333333333333e-05, 'samples': 165888, 'steps': 323, 'loss/train': 4.995411396026611} -09/20/2021 15:36:37 - INFO - __main__ - Step 5185: {'lr': 8.64e-05, 'samples': 165920, 'steps': 324, 'loss/train': 6.038274765014648} -09/20/2021 15:36:37 - INFO - __main__ - Step 5186: {'lr': 8.64e-05, 'samples': 165952, 'steps': 324, 'loss/train': 5.489011764526367} -09/20/2021 15:36:38 - INFO - __main__ - Step 5187: {'lr': 8.64e-05, 'samples': 165984, 'steps': 324, 'loss/train': 5.202978610992432} -09/20/2021 15:36:39 - INFO - __main__ - Step 5188: {'lr': 8.64e-05, 'samples': 166016, 'steps': 324, 'loss/train': 4.947934150695801} -09/20/2021 15:36:40 - INFO - __main__ - Step 5189: {'lr': 8.64e-05, 'samples': 166048, 'steps': 324, 'loss/train': 4.675381183624268} -09/20/2021 15:36:40 - INFO - __main__ - Step 5190: {'lr': 8.64e-05, 'samples': 166080, 'steps': 324, 'loss/train': 5.577156066894531} -09/20/2021 15:36:42 - INFO - __main__ - Step 5191: {'lr': 8.64e-05, 'samples': 166112, 'steps': 324, 'loss/train': 6.034795761108398} -09/20/2021 15:36:43 - INFO - __main__ - Step 5192: {'lr': 8.64e-05, 'samples': 166144, 'steps': 324, 'loss/train': 4.850050449371338} -09/20/2021 15:36:44 - INFO - __main__ - Step 5193: {'lr': 8.64e-05, 'samples': 166176, 'steps': 324, 'loss/train': 6.015021800994873} -09/20/2021 15:36:45 - INFO - __main__ - Step 5194: {'lr': 8.64e-05, 'samples': 166208, 'steps': 324, 'loss/train': 4.9926676750183105} -09/20/2021 15:36:45 - INFO - __main__ - Step 5195: {'lr': 8.64e-05, 'samples': 166240, 'steps': 324, 'loss/train': 4.863858699798584} -09/20/2021 15:36:46 - INFO - __main__ - Step 5196: {'lr': 8.64e-05, 'samples': 166272, 'steps': 324, 'loss/train': 4.961506366729736} -09/20/2021 15:36:47 - INFO - __main__ - Step 5197: {'lr': 8.64e-05, 'samples': 166304, 'steps': 324, 'loss/train': 5.635996341705322} -09/20/2021 15:36:48 - INFO - __main__ - Step 5198: {'lr': 8.64e-05, 'samples': 166336, 'steps': 324, 'loss/train': 4.907844066619873} -09/20/2021 15:36:48 - INFO - __main__ - Step 5199: {'lr': 8.64e-05, 'samples': 166368, 'steps': 324, 'loss/train': 4.637810230255127} -09/20/2021 15:36:49 - INFO - __main__ - Step 5200: {'lr': 8.64e-05, 'samples': 166400, 'steps': 324, 'loss/train': 4.029851913452148} -09/20/2021 15:36:50 - INFO - __main__ - Step 5201: {'lr': 8.666666666666667e-05, 'samples': 166432, 'steps': 325, 'loss/train': 4.905083656311035} -09/20/2021 15:36:51 - INFO - __main__ - Step 5202: {'lr': 8.666666666666667e-05, 'samples': 166464, 'steps': 325, 'loss/train': 5.5549702644348145} -09/20/2021 15:36:52 - INFO - __main__ - Step 5203: {'lr': 8.666666666666667e-05, 'samples': 166496, 'steps': 325, 'loss/train': 4.506026268005371} -09/20/2021 15:36:52 - INFO - __main__ - Step 5204: {'lr': 8.666666666666667e-05, 'samples': 166528, 'steps': 325, 'loss/train': 5.979297637939453} -09/20/2021 15:36:53 - INFO - __main__ - Step 5205: {'lr': 8.666666666666667e-05, 'samples': 166560, 'steps': 325, 'loss/train': 5.092284679412842} -09/20/2021 15:36:54 - INFO - __main__ - Step 5206: {'lr': 8.666666666666667e-05, 'samples': 166592, 'steps': 325, 'loss/train': 5.195693492889404} -09/20/2021 15:36:55 - INFO - __main__ - Step 5207: {'lr': 8.666666666666667e-05, 'samples': 166624, 'steps': 325, 'loss/train': 5.4162187576293945} -09/20/2021 15:36:55 - INFO - __main__ - Step 5208: {'lr': 8.666666666666667e-05, 'samples': 166656, 'steps': 325, 'loss/train': 4.958937644958496} -09/20/2021 15:36:56 - INFO - __main__ - Step 5209: {'lr': 8.666666666666667e-05, 'samples': 166688, 'steps': 325, 'loss/train': 5.403204441070557} -09/20/2021 15:36:57 - INFO - __main__ - Step 5210: {'lr': 8.666666666666667e-05, 'samples': 166720, 'steps': 325, 'loss/train': 5.418917655944824} -09/20/2021 15:36:58 - INFO - __main__ - Step 5211: {'lr': 8.666666666666667e-05, 'samples': 166752, 'steps': 325, 'loss/train': 6.31798791885376} -09/20/2021 15:36:58 - INFO - __main__ - Step 5212: {'lr': 8.666666666666667e-05, 'samples': 166784, 'steps': 325, 'loss/train': 5.007986068725586} -09/20/2021 15:36:59 - INFO - __main__ - Step 5213: {'lr': 8.666666666666667e-05, 'samples': 166816, 'steps': 325, 'loss/train': 4.988232612609863} -09/20/2021 15:37:00 - INFO - __main__ - Step 5214: {'lr': 8.666666666666667e-05, 'samples': 166848, 'steps': 325, 'loss/train': 5.69333553314209} -09/20/2021 15:37:01 - INFO - __main__ - Step 5215: {'lr': 8.666666666666667e-05, 'samples': 166880, 'steps': 325, 'loss/train': 5.470671653747559} -09/20/2021 15:37:01 - INFO - __main__ - Step 5216: {'lr': 8.666666666666667e-05, 'samples': 166912, 'steps': 325, 'loss/train': 8.176532745361328} -09/20/2021 15:37:02 - INFO - __main__ - Step 5217: {'lr': 8.693333333333334e-05, 'samples': 166944, 'steps': 326, 'loss/train': 5.012099266052246} -09/20/2021 15:37:03 - INFO - __main__ - Step 5218: {'lr': 8.693333333333334e-05, 'samples': 166976, 'steps': 326, 'loss/train': 5.438204765319824} -09/20/2021 15:37:04 - INFO - __main__ - Step 5219: {'lr': 8.693333333333334e-05, 'samples': 167008, 'steps': 326, 'loss/train': 5.249156951904297} -09/20/2021 15:37:04 - INFO - __main__ - Step 5220: {'lr': 8.693333333333334e-05, 'samples': 167040, 'steps': 326, 'loss/train': 4.9942731857299805} -09/20/2021 15:37:05 - INFO - __main__ - Step 5221: {'lr': 8.693333333333334e-05, 'samples': 167072, 'steps': 326, 'loss/train': 5.82078742980957} -09/20/2021 15:37:06 - INFO - __main__ - Step 5222: {'lr': 8.693333333333334e-05, 'samples': 167104, 'steps': 326, 'loss/train': 5.139018535614014} -09/20/2021 15:37:07 - INFO - __main__ - Step 5223: {'lr': 8.693333333333334e-05, 'samples': 167136, 'steps': 326, 'loss/train': 5.410138130187988} -09/20/2021 15:37:08 - INFO - __main__ - Step 5224: {'lr': 8.693333333333334e-05, 'samples': 167168, 'steps': 326, 'loss/train': 5.322451591491699} -09/20/2021 15:37:09 - INFO - __main__ - Step 5225: {'lr': 8.693333333333334e-05, 'samples': 167200, 'steps': 326, 'loss/train': 5.200402736663818} -09/20/2021 15:37:09 - INFO - __main__ - Step 5226: {'lr': 8.693333333333334e-05, 'samples': 167232, 'steps': 326, 'loss/train': 4.573403835296631} -09/20/2021 15:37:10 - INFO - __main__ - Step 5227: {'lr': 8.693333333333334e-05, 'samples': 167264, 'steps': 326, 'loss/train': 3.6500749588012695} -09/20/2021 15:37:11 - INFO - __main__ - Step 5228: {'lr': 8.693333333333334e-05, 'samples': 167296, 'steps': 326, 'loss/train': 4.809553146362305} -09/20/2021 15:37:12 - INFO - __main__ - Step 5229: {'lr': 8.693333333333334e-05, 'samples': 167328, 'steps': 326, 'loss/train': 5.441408634185791} -09/20/2021 15:37:12 - INFO - __main__ - Step 5230: {'lr': 8.693333333333334e-05, 'samples': 167360, 'steps': 326, 'loss/train': 5.16029691696167} -09/20/2021 15:37:13 - INFO - __main__ - Step 5231: {'lr': 8.693333333333334e-05, 'samples': 167392, 'steps': 326, 'loss/train': 5.02158260345459} -09/20/2021 15:37:14 - INFO - __main__ - Step 5232: {'lr': 8.693333333333334e-05, 'samples': 167424, 'steps': 326, 'loss/train': 4.682781219482422} -09/20/2021 15:37:15 - INFO - __main__ - Step 5233: {'lr': 8.72e-05, 'samples': 167456, 'steps': 327, 'loss/train': 5.436874866485596} -09/20/2021 15:37:16 - INFO - __main__ - Step 5234: {'lr': 8.72e-05, 'samples': 167488, 'steps': 327, 'loss/train': 5.099582672119141} -09/20/2021 15:37:16 - INFO - __main__ - Step 5235: {'lr': 8.72e-05, 'samples': 167520, 'steps': 327, 'loss/train': 5.837403774261475} -09/20/2021 15:37:17 - INFO - __main__ - Step 5236: {'lr': 8.72e-05, 'samples': 167552, 'steps': 327, 'loss/train': 5.7780561447143555} -09/20/2021 15:37:18 - INFO - __main__ - Step 5237: {'lr': 8.72e-05, 'samples': 167584, 'steps': 327, 'loss/train': 5.038455963134766} -09/20/2021 15:37:19 - INFO - __main__ - Step 5238: {'lr': 8.72e-05, 'samples': 167616, 'steps': 327, 'loss/train': 4.838837146759033} -09/20/2021 15:37:19 - INFO - __main__ - Step 5239: {'lr': 8.72e-05, 'samples': 167648, 'steps': 327, 'loss/train': 5.03202486038208} -09/20/2021 15:37:20 - INFO - __main__ - Step 5240: {'lr': 8.72e-05, 'samples': 167680, 'steps': 327, 'loss/train': 5.0728583335876465} -09/20/2021 15:37:21 - INFO - __main__ - Step 5241: {'lr': 8.72e-05, 'samples': 167712, 'steps': 327, 'loss/train': 5.698490619659424} -09/20/2021 15:37:22 - INFO - __main__ - Step 5242: {'lr': 8.72e-05, 'samples': 167744, 'steps': 327, 'loss/train': 3.7840869426727295} -09/20/2021 15:37:22 - INFO - __main__ - Step 5243: {'lr': 8.72e-05, 'samples': 167776, 'steps': 327, 'loss/train': 6.30916690826416} -09/20/2021 15:37:23 - INFO - __main__ - Step 5244: {'lr': 8.72e-05, 'samples': 167808, 'steps': 327, 'loss/train': 4.981746673583984} -09/20/2021 15:37:24 - INFO - __main__ - Step 5245: {'lr': 8.72e-05, 'samples': 167840, 'steps': 327, 'loss/train': 4.774704933166504} -09/20/2021 15:37:25 - INFO - __main__ - Step 5246: {'lr': 8.72e-05, 'samples': 167872, 'steps': 327, 'loss/train': 5.9609246253967285} -09/20/2021 15:37:25 - INFO - __main__ - Step 5247: {'lr': 8.72e-05, 'samples': 167904, 'steps': 327, 'loss/train': 5.513268947601318} -09/20/2021 15:37:26 - INFO - __main__ - Step 5248: {'lr': 8.72e-05, 'samples': 167936, 'steps': 327, 'loss/train': 4.461359024047852} -09/20/2021 15:37:27 - INFO - __main__ - Step 5249: {'lr': 8.746666666666667e-05, 'samples': 167968, 'steps': 328, 'loss/train': 6.1433539390563965} -09/20/2021 15:37:28 - INFO - __main__ - Step 5250: {'lr': 8.746666666666667e-05, 'samples': 168000, 'steps': 328, 'loss/train': 6.038671493530273} -09/20/2021 15:37:28 - INFO - __main__ - Step 5251: {'lr': 8.746666666666667e-05, 'samples': 168032, 'steps': 328, 'loss/train': 5.855745792388916} -09/20/2021 15:37:29 - INFO - __main__ - Step 5252: {'lr': 8.746666666666667e-05, 'samples': 168064, 'steps': 328, 'loss/train': 5.424520969390869} -09/20/2021 15:37:30 - INFO - __main__ - Step 5253: {'lr': 8.746666666666667e-05, 'samples': 168096, 'steps': 328, 'loss/train': 4.927320957183838} -09/20/2021 15:37:31 - INFO - __main__ - Step 5254: {'lr': 8.746666666666667e-05, 'samples': 168128, 'steps': 328, 'loss/train': 4.907266616821289} -09/20/2021 15:37:32 - INFO - __main__ - Step 5255: {'lr': 8.746666666666667e-05, 'samples': 168160, 'steps': 328, 'loss/train': 5.6278767585754395} -09/20/2021 15:37:33 - INFO - __main__ - Step 5256: {'lr': 8.746666666666667e-05, 'samples': 168192, 'steps': 328, 'loss/train': 4.685969352722168} -09/20/2021 15:37:34 - INFO - __main__ - Step 5257: {'lr': 8.746666666666667e-05, 'samples': 168224, 'steps': 328, 'loss/train': 5.391820430755615} -09/20/2021 15:37:34 - INFO - __main__ - Step 5258: {'lr': 8.746666666666667e-05, 'samples': 168256, 'steps': 328, 'loss/train': 5.068077564239502} -09/20/2021 15:37:35 - INFO - __main__ - Step 5259: {'lr': 8.746666666666667e-05, 'samples': 168288, 'steps': 328, 'loss/train': 5.063651084899902} -09/20/2021 15:37:36 - INFO - __main__ - Step 5260: {'lr': 8.746666666666667e-05, 'samples': 168320, 'steps': 328, 'loss/train': 4.730585098266602} -09/20/2021 15:37:37 - INFO - __main__ - Step 5261: {'lr': 8.746666666666667e-05, 'samples': 168352, 'steps': 328, 'loss/train': 6.28800106048584} -09/20/2021 15:37:37 - INFO - __main__ - Step 5262: {'lr': 8.746666666666667e-05, 'samples': 168384, 'steps': 328, 'loss/train': 6.633399963378906} -09/20/2021 15:37:38 - INFO - __main__ - Step 5263: {'lr': 8.746666666666667e-05, 'samples': 168416, 'steps': 328, 'loss/train': 5.4110870361328125} -09/20/2021 15:37:39 - INFO - __main__ - Step 5264: {'lr': 8.746666666666667e-05, 'samples': 168448, 'steps': 328, 'loss/train': 4.31696891784668} -09/20/2021 15:37:40 - INFO - __main__ - Step 5265: {'lr': 8.773333333333333e-05, 'samples': 168480, 'steps': 329, 'loss/train': 4.942706108093262} -09/20/2021 15:37:40 - INFO - __main__ - Step 5266: {'lr': 8.773333333333333e-05, 'samples': 168512, 'steps': 329, 'loss/train': 6.439427375793457} -09/20/2021 15:37:41 - INFO - __main__ - Step 5267: {'lr': 8.773333333333333e-05, 'samples': 168544, 'steps': 329, 'loss/train': 6.52621603012085} -09/20/2021 15:37:42 - INFO - __main__ - Step 5268: {'lr': 8.773333333333333e-05, 'samples': 168576, 'steps': 329, 'loss/train': 5.067740440368652} -09/20/2021 15:37:43 - INFO - __main__ - Step 5269: {'lr': 8.773333333333333e-05, 'samples': 168608, 'steps': 329, 'loss/train': 5.277476787567139} -09/20/2021 15:37:43 - INFO - __main__ - Step 5270: {'lr': 8.773333333333333e-05, 'samples': 168640, 'steps': 329, 'loss/train': 6.277835369110107} -09/20/2021 15:37:44 - INFO - __main__ - Step 5271: {'lr': 8.773333333333333e-05, 'samples': 168672, 'steps': 329, 'loss/train': 5.019824504852295} -09/20/2021 15:37:45 - INFO - __main__ - Step 5272: {'lr': 8.773333333333333e-05, 'samples': 168704, 'steps': 329, 'loss/train': 5.689580917358398} -09/20/2021 15:37:46 - INFO - __main__ - Step 5273: {'lr': 8.773333333333333e-05, 'samples': 168736, 'steps': 329, 'loss/train': 4.310647487640381} -09/20/2021 15:37:46 - INFO - __main__ - Step 5274: {'lr': 8.773333333333333e-05, 'samples': 168768, 'steps': 329, 'loss/train': 4.97784948348999} -09/20/2021 15:37:47 - INFO - __main__ - Step 5275: {'lr': 8.773333333333333e-05, 'samples': 168800, 'steps': 329, 'loss/train': 4.846078872680664} -09/20/2021 15:37:48 - INFO - __main__ - Step 5276: {'lr': 8.773333333333333e-05, 'samples': 168832, 'steps': 329, 'loss/train': 4.933518409729004} -09/20/2021 15:37:49 - INFO - __main__ - Step 5277: {'lr': 8.773333333333333e-05, 'samples': 168864, 'steps': 329, 'loss/train': 5.737600326538086} -09/20/2021 15:37:49 - INFO - __main__ - Step 5278: {'lr': 8.773333333333333e-05, 'samples': 168896, 'steps': 329, 'loss/train': 4.870748043060303} -09/20/2021 15:37:50 - INFO - __main__ - Step 5279: {'lr': 8.773333333333333e-05, 'samples': 168928, 'steps': 329, 'loss/train': 4.446191310882568} -09/20/2021 15:37:51 - INFO - __main__ - Step 5280: {'lr': 8.773333333333333e-05, 'samples': 168960, 'steps': 329, 'loss/train': 4.72280216217041} -09/20/2021 15:37:52 - INFO - __main__ - Step 5281: {'lr': 8.800000000000001e-05, 'samples': 168992, 'steps': 330, 'loss/train': 4.4386420249938965} -09/20/2021 15:37:53 - INFO - __main__ - Step 5282: {'lr': 8.800000000000001e-05, 'samples': 169024, 'steps': 330, 'loss/train': 4.882461071014404} -09/20/2021 15:37:53 - INFO - __main__ - Step 5283: {'lr': 8.800000000000001e-05, 'samples': 169056, 'steps': 330, 'loss/train': 5.476904392242432} -09/20/2021 15:37:54 - INFO - __main__ - Step 5284: {'lr': 8.800000000000001e-05, 'samples': 169088, 'steps': 330, 'loss/train': 5.1650800704956055} -09/20/2021 15:37:56 - INFO - __main__ - Step 5285: {'lr': 8.800000000000001e-05, 'samples': 169120, 'steps': 330, 'loss/train': 4.523749828338623} -09/20/2021 15:37:56 - INFO - __main__ - Step 5286: {'lr': 8.800000000000001e-05, 'samples': 169152, 'steps': 330, 'loss/train': 4.576113224029541} -09/20/2021 15:37:57 - INFO - __main__ - Step 5287: {'lr': 8.800000000000001e-05, 'samples': 169184, 'steps': 330, 'loss/train': 5.30133056640625} -09/20/2021 15:37:58 - INFO - __main__ - Step 5288: {'lr': 8.800000000000001e-05, 'samples': 169216, 'steps': 330, 'loss/train': 5.246250152587891} -09/20/2021 15:37:59 - INFO - __main__ - Step 5289: {'lr': 8.800000000000001e-05, 'samples': 169248, 'steps': 330, 'loss/train': 5.593227863311768} -09/20/2021 15:37:59 - INFO - __main__ - Step 5290: {'lr': 8.800000000000001e-05, 'samples': 169280, 'steps': 330, 'loss/train': 5.107081890106201} -09/20/2021 15:38:00 - INFO - __main__ - Step 5291: {'lr': 8.800000000000001e-05, 'samples': 169312, 'steps': 330, 'loss/train': 5.280956745147705} -09/20/2021 15:38:01 - INFO - __main__ - Step 5292: {'lr': 8.800000000000001e-05, 'samples': 169344, 'steps': 330, 'loss/train': 4.985455513000488} -09/20/2021 15:38:01 - INFO - __main__ - Step 5293: {'lr': 8.800000000000001e-05, 'samples': 169376, 'steps': 330, 'loss/train': 4.80440092086792} -09/20/2021 15:38:02 - INFO - __main__ - Step 5294: {'lr': 8.800000000000001e-05, 'samples': 169408, 'steps': 330, 'loss/train': 5.9704766273498535} -09/20/2021 15:38:03 - INFO - __main__ - Step 5295: {'lr': 8.800000000000001e-05, 'samples': 169440, 'steps': 330, 'loss/train': 5.057896137237549} -09/20/2021 15:38:04 - INFO - __main__ - Step 5296: {'lr': 8.800000000000001e-05, 'samples': 169472, 'steps': 330, 'loss/train': 5.659877300262451} -09/20/2021 15:38:05 - INFO - __main__ - Step 5297: {'lr': 8.826666666666668e-05, 'samples': 169504, 'steps': 331, 'loss/train': 4.387518882751465} -09/20/2021 15:38:05 - INFO - __main__ - Step 5298: {'lr': 8.826666666666668e-05, 'samples': 169536, 'steps': 331, 'loss/train': 6.451919078826904} -09/20/2021 15:38:06 - INFO - __main__ - Step 5299: {'lr': 8.826666666666668e-05, 'samples': 169568, 'steps': 331, 'loss/train': 5.250624179840088} -09/20/2021 15:38:07 - INFO - __main__ - Step 5300: {'lr': 8.826666666666668e-05, 'samples': 169600, 'steps': 331, 'loss/train': 4.805203914642334} -09/20/2021 15:38:08 - INFO - __main__ - Step 5301: {'lr': 8.826666666666668e-05, 'samples': 169632, 'steps': 331, 'loss/train': 5.607056617736816} -09/20/2021 15:38:08 - INFO - __main__ - Step 5302: {'lr': 8.826666666666668e-05, 'samples': 169664, 'steps': 331, 'loss/train': 4.472409248352051} -09/20/2021 15:38:09 - INFO - __main__ - Step 5303: {'lr': 8.826666666666668e-05, 'samples': 169696, 'steps': 331, 'loss/train': 5.794991493225098} -09/20/2021 15:38:10 - INFO - __main__ - Step 5304: {'lr': 8.826666666666668e-05, 'samples': 169728, 'steps': 331, 'loss/train': 5.588009834289551} -09/20/2021 15:38:11 - INFO - __main__ - Step 5305: {'lr': 8.826666666666668e-05, 'samples': 169760, 'steps': 331, 'loss/train': 6.010107517242432} -09/20/2021 15:38:11 - INFO - __main__ - Step 5306: {'lr': 8.826666666666668e-05, 'samples': 169792, 'steps': 331, 'loss/train': 4.729619026184082} -09/20/2021 15:38:12 - INFO - __main__ - Step 5307: {'lr': 8.826666666666668e-05, 'samples': 169824, 'steps': 331, 'loss/train': 6.00990104675293} -09/20/2021 15:38:13 - INFO - __main__ - Step 5308: {'lr': 8.826666666666668e-05, 'samples': 169856, 'steps': 331, 'loss/train': 5.942558288574219} -09/20/2021 15:38:14 - INFO - __main__ - Step 5309: {'lr': 8.826666666666668e-05, 'samples': 169888, 'steps': 331, 'loss/train': 5.519227504730225} -09/20/2021 15:38:14 - INFO - __main__ - Step 5310: {'lr': 8.826666666666668e-05, 'samples': 169920, 'steps': 331, 'loss/train': 5.10587739944458} -09/20/2021 15:38:15 - INFO - __main__ - Step 5311: {'lr': 8.826666666666668e-05, 'samples': 169952, 'steps': 331, 'loss/train': 5.246811866760254} -09/20/2021 15:38:16 - INFO - __main__ - Step 5312: {'lr': 8.826666666666668e-05, 'samples': 169984, 'steps': 331, 'loss/train': 5.156370162963867} -09/20/2021 15:38:17 - INFO - __main__ - Step 5313: {'lr': 8.853333333333333e-05, 'samples': 170016, 'steps': 332, 'loss/train': 4.932613849639893} -09/20/2021 15:38:18 - INFO - __main__ - Step 5314: {'lr': 8.853333333333333e-05, 'samples': 170048, 'steps': 332, 'loss/train': 3.5865397453308105} -09/20/2021 15:38:18 - INFO - __main__ - Step 5315: {'lr': 8.853333333333333e-05, 'samples': 170080, 'steps': 332, 'loss/train': 3.742985486984253} -09/20/2021 15:38:19 - INFO - __main__ - Step 5316: {'lr': 8.853333333333333e-05, 'samples': 170112, 'steps': 332, 'loss/train': 2.7622811794281006} -09/20/2021 15:38:20 - INFO - __main__ - Step 5317: {'lr': 8.853333333333333e-05, 'samples': 170144, 'steps': 332, 'loss/train': 2.8106682300567627} -09/20/2021 15:38:21 - INFO - __main__ - Step 5318: {'lr': 8.853333333333333e-05, 'samples': 170176, 'steps': 332, 'loss/train': 4.990001201629639} -09/20/2021 15:38:22 - INFO - __main__ - Step 5319: {'lr': 8.853333333333333e-05, 'samples': 170208, 'steps': 332, 'loss/train': 4.912141799926758} -09/20/2021 15:38:23 - INFO - __main__ - Step 5320: {'lr': 8.853333333333333e-05, 'samples': 170240, 'steps': 332, 'loss/train': 5.510341167449951} -09/20/2021 15:38:23 - INFO - __main__ - Step 5321: {'lr': 8.853333333333333e-05, 'samples': 170272, 'steps': 332, 'loss/train': 4.934590816497803} -09/20/2021 15:38:24 - INFO - __main__ - Step 5322: {'lr': 8.853333333333333e-05, 'samples': 170304, 'steps': 332, 'loss/train': 4.8396477699279785} -09/20/2021 15:38:25 - INFO - __main__ - Step 5323: {'lr': 8.853333333333333e-05, 'samples': 170336, 'steps': 332, 'loss/train': 5.769136428833008} -09/20/2021 15:38:26 - INFO - __main__ - Step 5324: {'lr': 8.853333333333333e-05, 'samples': 170368, 'steps': 332, 'loss/train': 7.028635501861572} -09/20/2021 15:38:26 - INFO - __main__ - Step 5325: {'lr': 8.853333333333333e-05, 'samples': 170400, 'steps': 332, 'loss/train': 5.219059467315674} -09/20/2021 15:38:27 - INFO - __main__ - Step 5326: {'lr': 8.853333333333333e-05, 'samples': 170432, 'steps': 332, 'loss/train': 3.740135669708252} -09/20/2021 15:38:28 - INFO - __main__ - Step 5327: {'lr': 8.853333333333333e-05, 'samples': 170464, 'steps': 332, 'loss/train': 5.46777868270874} -09/20/2021 15:38:29 - INFO - __main__ - Step 5328: {'lr': 8.853333333333333e-05, 'samples': 170496, 'steps': 332, 'loss/train': 5.218826770782471} -09/20/2021 15:38:29 - INFO - __main__ - Step 5329: {'lr': 8.88e-05, 'samples': 170528, 'steps': 333, 'loss/train': 4.8543314933776855} -09/20/2021 15:38:30 - INFO - __main__ - Step 5330: {'lr': 8.88e-05, 'samples': 170560, 'steps': 333, 'loss/train': 5.027904033660889} -09/20/2021 15:38:31 - INFO - __main__ - Step 5331: {'lr': 8.88e-05, 'samples': 170592, 'steps': 333, 'loss/train': 5.226142406463623} -09/20/2021 15:38:32 - INFO - __main__ - Step 5332: {'lr': 8.88e-05, 'samples': 170624, 'steps': 333, 'loss/train': 1.1535699367523193} -09/20/2021 15:38:32 - INFO - __main__ - Step 5333: {'lr': 8.88e-05, 'samples': 170656, 'steps': 333, 'loss/train': 6.15641450881958} -09/20/2021 15:38:33 - INFO - __main__ - Step 5334: {'lr': 8.88e-05, 'samples': 170688, 'steps': 333, 'loss/train': 6.222715377807617} -09/20/2021 15:38:34 - INFO - __main__ - Step 5335: {'lr': 8.88e-05, 'samples': 170720, 'steps': 333, 'loss/train': 5.756054401397705} -09/20/2021 15:38:35 - INFO - __main__ - Step 5336: {'lr': 8.88e-05, 'samples': 170752, 'steps': 333, 'loss/train': 5.061765193939209} -09/20/2021 15:38:35 - INFO - __main__ - Step 5337: {'lr': 8.88e-05, 'samples': 170784, 'steps': 333, 'loss/train': 5.536533832550049} -09/20/2021 15:38:36 - INFO - __main__ - Step 5338: {'lr': 8.88e-05, 'samples': 170816, 'steps': 333, 'loss/train': 5.870750904083252} -09/20/2021 15:38:37 - INFO - __main__ - Step 5339: {'lr': 8.88e-05, 'samples': 170848, 'steps': 333, 'loss/train': 5.4005632400512695} -09/20/2021 15:38:38 - INFO - __main__ - Step 5340: {'lr': 8.88e-05, 'samples': 170880, 'steps': 333, 'loss/train': 4.412332534790039} -09/20/2021 15:38:38 - INFO - __main__ - Step 5341: {'lr': 8.88e-05, 'samples': 170912, 'steps': 333, 'loss/train': 6.8268256187438965} -09/20/2021 15:38:39 - INFO - __main__ - Step 5342: {'lr': 8.88e-05, 'samples': 170944, 'steps': 333, 'loss/train': 5.451417446136475} -09/20/2021 15:38:40 - INFO - __main__ - Step 5343: {'lr': 8.88e-05, 'samples': 170976, 'steps': 333, 'loss/train': 5.5988569259643555} -09/20/2021 15:38:41 - INFO - __main__ - Step 5344: {'lr': 8.88e-05, 'samples': 171008, 'steps': 333, 'loss/train': 5.168604850769043} -09/20/2021 15:38:42 - INFO - __main__ - Step 5345: {'lr': 8.906666666666667e-05, 'samples': 171040, 'steps': 334, 'loss/train': 4.386437892913818} -09/20/2021 15:38:42 - INFO - __main__ - Step 5346: {'lr': 8.906666666666667e-05, 'samples': 171072, 'steps': 334, 'loss/train': 7.805311679840088} -09/20/2021 15:38:43 - INFO - __main__ - Step 5347: {'lr': 8.906666666666667e-05, 'samples': 171104, 'steps': 334, 'loss/train': 5.172269344329834} -09/20/2021 15:38:45 - INFO - __main__ - Step 5348: {'lr': 8.906666666666667e-05, 'samples': 171136, 'steps': 334, 'loss/train': 3.2226903438568115} -09/20/2021 15:38:46 - INFO - __main__ - Step 5349: {'lr': 8.906666666666667e-05, 'samples': 171168, 'steps': 334, 'loss/train': 5.747156143188477} -09/20/2021 15:38:46 - INFO - __main__ - Step 5350: {'lr': 8.906666666666667e-05, 'samples': 171200, 'steps': 334, 'loss/train': 5.47934103012085} -09/20/2021 15:38:47 - INFO - __main__ - Step 5351: {'lr': 8.906666666666667e-05, 'samples': 171232, 'steps': 334, 'loss/train': 4.940749645233154} -09/20/2021 15:38:48 - INFO - __main__ - Step 5352: {'lr': 8.906666666666667e-05, 'samples': 171264, 'steps': 334, 'loss/train': 5.420544624328613} -09/20/2021 15:38:49 - INFO - __main__ - Step 5353: {'lr': 8.906666666666667e-05, 'samples': 171296, 'steps': 334, 'loss/train': 5.387659072875977} -09/20/2021 15:38:49 - INFO - __main__ - Step 5354: {'lr': 8.906666666666667e-05, 'samples': 171328, 'steps': 334, 'loss/train': 5.917086124420166} -09/20/2021 15:38:50 - INFO - __main__ - Step 5355: {'lr': 8.906666666666667e-05, 'samples': 171360, 'steps': 334, 'loss/train': 5.029798984527588} -09/20/2021 15:38:51 - INFO - __main__ - Step 5356: {'lr': 8.906666666666667e-05, 'samples': 171392, 'steps': 334, 'loss/train': 5.1629486083984375} -09/20/2021 15:38:52 - INFO - __main__ - Step 5357: {'lr': 8.906666666666667e-05, 'samples': 171424, 'steps': 334, 'loss/train': 5.154572486877441} -09/20/2021 15:38:52 - INFO - __main__ - Step 5358: {'lr': 8.906666666666667e-05, 'samples': 171456, 'steps': 334, 'loss/train': 4.443328380584717} -09/20/2021 15:38:53 - INFO - __main__ - Step 5359: {'lr': 8.906666666666667e-05, 'samples': 171488, 'steps': 334, 'loss/train': 5.157140731811523} -09/20/2021 15:38:54 - INFO - __main__ - Step 5360: {'lr': 8.906666666666667e-05, 'samples': 171520, 'steps': 334, 'loss/train': 5.15903902053833} -09/20/2021 15:38:55 - INFO - __main__ - Step 5361: {'lr': 8.933333333333334e-05, 'samples': 171552, 'steps': 335, 'loss/train': 5.975949287414551} -09/20/2021 15:38:55 - INFO - __main__ - Step 5362: {'lr': 8.933333333333334e-05, 'samples': 171584, 'steps': 335, 'loss/train': 5.454341888427734} -09/20/2021 15:38:56 - INFO - __main__ - Step 5363: {'lr': 8.933333333333334e-05, 'samples': 171616, 'steps': 335, 'loss/train': 5.5160393714904785} -09/20/2021 15:38:57 - INFO - __main__ - Step 5364: {'lr': 8.933333333333334e-05, 'samples': 171648, 'steps': 335, 'loss/train': 5.157174587249756} -09/20/2021 15:38:58 - INFO - __main__ - Step 5365: {'lr': 8.933333333333334e-05, 'samples': 171680, 'steps': 335, 'loss/train': 5.8018798828125} -09/20/2021 15:38:58 - INFO - __main__ - Step 5366: {'lr': 8.933333333333334e-05, 'samples': 171712, 'steps': 335, 'loss/train': 5.047683238983154} -09/20/2021 15:38:59 - INFO - __main__ - Step 5367: {'lr': 8.933333333333334e-05, 'samples': 171744, 'steps': 335, 'loss/train': 5.147966384887695} -09/20/2021 15:39:00 - INFO - __main__ - Step 5368: {'lr': 8.933333333333334e-05, 'samples': 171776, 'steps': 335, 'loss/train': 6.149035930633545} -09/20/2021 15:39:01 - INFO - __main__ - Step 5369: {'lr': 8.933333333333334e-05, 'samples': 171808, 'steps': 335, 'loss/train': 4.872036457061768} -09/20/2021 15:39:01 - INFO - __main__ - Step 5370: {'lr': 8.933333333333334e-05, 'samples': 171840, 'steps': 335, 'loss/train': 4.96161413192749} -09/20/2021 15:39:02 - INFO - __main__ - Step 5371: {'lr': 8.933333333333334e-05, 'samples': 171872, 'steps': 335, 'loss/train': 5.198007583618164} -09/20/2021 15:39:03 - INFO - __main__ - Step 5372: {'lr': 8.933333333333334e-05, 'samples': 171904, 'steps': 335, 'loss/train': 5.703723907470703} -09/20/2021 15:39:04 - INFO - __main__ - Step 5373: {'lr': 8.933333333333334e-05, 'samples': 171936, 'steps': 335, 'loss/train': 5.15649938583374} -09/20/2021 15:39:04 - INFO - __main__ - Step 5374: {'lr': 8.933333333333334e-05, 'samples': 171968, 'steps': 335, 'loss/train': 4.630349636077881} -09/20/2021 15:39:05 - INFO - __main__ - Step 5375: {'lr': 8.933333333333334e-05, 'samples': 172000, 'steps': 335, 'loss/train': 3.270676612854004} -09/20/2021 15:39:06 - INFO - __main__ - Step 5376: {'lr': 8.933333333333334e-05, 'samples': 172032, 'steps': 335, 'loss/train': 3.44616436958313} -09/20/2021 15:39:07 - INFO - __main__ - Step 5377: {'lr': 8.960000000000001e-05, 'samples': 172064, 'steps': 336, 'loss/train': 3.7435779571533203} -09/20/2021 15:39:08 - INFO - __main__ - Step 5378: {'lr': 8.960000000000001e-05, 'samples': 172096, 'steps': 336, 'loss/train': 3.462674379348755} -09/20/2021 15:39:08 - INFO - __main__ - Step 5379: {'lr': 8.960000000000001e-05, 'samples': 172128, 'steps': 336, 'loss/train': 3.3298075199127197} -09/20/2021 15:39:10 - INFO - __main__ - Step 5380: {'lr': 8.960000000000001e-05, 'samples': 172160, 'steps': 336, 'loss/train': 3.606199264526367} -09/20/2021 15:39:11 - INFO - __main__ - Step 5381: {'lr': 8.960000000000001e-05, 'samples': 172192, 'steps': 336, 'loss/train': 3.39673113822937} -09/20/2021 15:39:11 - INFO - __main__ - Step 5382: {'lr': 8.960000000000001e-05, 'samples': 172224, 'steps': 336, 'loss/train': 5.232377052307129} -09/20/2021 15:39:12 - INFO - __main__ - Step 5383: {'lr': 8.960000000000001e-05, 'samples': 172256, 'steps': 336, 'loss/train': 3.7610843181610107} -09/20/2021 15:39:13 - INFO - __main__ - Step 5384: {'lr': 8.960000000000001e-05, 'samples': 172288, 'steps': 336, 'loss/train': 3.9665544033050537} -09/20/2021 15:39:14 - INFO - __main__ - Step 5385: {'lr': 8.960000000000001e-05, 'samples': 172320, 'steps': 336, 'loss/train': 3.211268186569214} -09/20/2021 15:39:14 - INFO - __main__ - Step 5386: {'lr': 8.960000000000001e-05, 'samples': 172352, 'steps': 336, 'loss/train': 3.527982473373413} -09/20/2021 15:39:15 - INFO - __main__ - Step 5387: {'lr': 8.960000000000001e-05, 'samples': 172384, 'steps': 336, 'loss/train': 6.054114818572998} -09/20/2021 15:39:16 - INFO - __main__ - Step 5388: {'lr': 8.960000000000001e-05, 'samples': 172416, 'steps': 336, 'loss/train': 5.108172416687012} -09/20/2021 15:39:17 - INFO - __main__ - Step 5389: {'lr': 8.960000000000001e-05, 'samples': 172448, 'steps': 336, 'loss/train': 3.492576837539673} -09/20/2021 15:39:17 - INFO - __main__ - Step 5390: {'lr': 8.960000000000001e-05, 'samples': 172480, 'steps': 336, 'loss/train': 4.934604644775391} -09/20/2021 15:39:18 - INFO - __main__ - Step 5391: {'lr': 8.960000000000001e-05, 'samples': 172512, 'steps': 336, 'loss/train': 5.532989025115967} -09/20/2021 15:39:19 - INFO - __main__ - Step 5392: {'lr': 8.960000000000001e-05, 'samples': 172544, 'steps': 336, 'loss/train': 5.128441333770752} -09/20/2021 15:39:20 - INFO - __main__ - Step 5393: {'lr': 8.986666666666666e-05, 'samples': 172576, 'steps': 337, 'loss/train': 4.81084680557251} -09/20/2021 15:39:21 - INFO - __main__ - Step 5394: {'lr': 8.986666666666666e-05, 'samples': 172608, 'steps': 337, 'loss/train': 5.644200325012207} -09/20/2021 15:39:21 - INFO - __main__ - Step 5395: {'lr': 8.986666666666666e-05, 'samples': 172640, 'steps': 337, 'loss/train': 3.2287020683288574} -09/20/2021 15:39:22 - INFO - __main__ - Step 5396: {'lr': 8.986666666666666e-05, 'samples': 172672, 'steps': 337, 'loss/train': 5.425690174102783} -09/20/2021 15:39:23 - INFO - __main__ - Step 5397: {'lr': 8.986666666666666e-05, 'samples': 172704, 'steps': 337, 'loss/train': 5.208451747894287} -09/20/2021 15:39:24 - INFO - __main__ - Step 5398: {'lr': 8.986666666666666e-05, 'samples': 172736, 'steps': 337, 'loss/train': 4.451248645782471} -09/20/2021 15:39:24 - INFO - __main__ - Step 5399: {'lr': 8.986666666666666e-05, 'samples': 172768, 'steps': 337, 'loss/train': 5.345738410949707} -09/20/2021 15:39:25 - INFO - __main__ - Step 5400: {'lr': 8.986666666666666e-05, 'samples': 172800, 'steps': 337, 'loss/train': 4.483436107635498} -09/20/2021 15:39:26 - INFO - __main__ - Step 5401: {'lr': 8.986666666666666e-05, 'samples': 172832, 'steps': 337, 'loss/train': 3.140005350112915} -09/20/2021 15:39:27 - INFO - __main__ - Step 5402: {'lr': 8.986666666666666e-05, 'samples': 172864, 'steps': 337, 'loss/train': 5.264571189880371} -09/20/2021 15:39:27 - INFO - __main__ - Step 5403: {'lr': 8.986666666666666e-05, 'samples': 172896, 'steps': 337, 'loss/train': 4.808784484863281} -09/20/2021 15:39:28 - INFO - __main__ - Step 5404: {'lr': 8.986666666666666e-05, 'samples': 172928, 'steps': 337, 'loss/train': 5.12804651260376} -09/20/2021 15:39:29 - INFO - __main__ - Step 5405: {'lr': 8.986666666666666e-05, 'samples': 172960, 'steps': 337, 'loss/train': 6.242219924926758} -09/20/2021 15:39:30 - INFO - __main__ - Step 5406: {'lr': 8.986666666666666e-05, 'samples': 172992, 'steps': 337, 'loss/train': 5.308853626251221} -09/20/2021 15:39:30 - INFO - __main__ - Step 5407: {'lr': 8.986666666666666e-05, 'samples': 173024, 'steps': 337, 'loss/train': 4.396137714385986} -09/20/2021 15:39:31 - INFO - __main__ - Step 5408: {'lr': 8.986666666666666e-05, 'samples': 173056, 'steps': 337, 'loss/train': 5.199435234069824} -09/20/2021 15:39:32 - INFO - __main__ - Step 5409: {'lr': 9.013333333333333e-05, 'samples': 173088, 'steps': 338, 'loss/train': 4.572367191314697} -09/20/2021 15:39:33 - INFO - __main__ - Step 5410: {'lr': 9.013333333333333e-05, 'samples': 173120, 'steps': 338, 'loss/train': 5.277188301086426} -09/20/2021 15:39:33 - INFO - __main__ - Step 5411: {'lr': 9.013333333333333e-05, 'samples': 173152, 'steps': 338, 'loss/train': 5.678586483001709} -09/20/2021 15:39:34 - INFO - __main__ - Step 5412: {'lr': 9.013333333333333e-05, 'samples': 173184, 'steps': 338, 'loss/train': 5.498887062072754} -09/20/2021 15:39:35 - INFO - __main__ - Step 5413: {'lr': 9.013333333333333e-05, 'samples': 173216, 'steps': 338, 'loss/train': 6.1488423347473145} -09/20/2021 15:39:36 - INFO - __main__ - Step 5414: {'lr': 9.013333333333333e-05, 'samples': 173248, 'steps': 338, 'loss/train': 4.910859107971191} -09/20/2021 15:39:36 - INFO - __main__ - Step 5415: {'lr': 9.013333333333333e-05, 'samples': 173280, 'steps': 338, 'loss/train': 5.999706268310547} -09/20/2021 15:39:37 - INFO - __main__ - Step 5416: {'lr': 9.013333333333333e-05, 'samples': 173312, 'steps': 338, 'loss/train': 4.861234664916992} -09/20/2021 15:39:39 - INFO - __main__ - Step 5417: {'lr': 9.013333333333333e-05, 'samples': 173344, 'steps': 338, 'loss/train': 5.558713912963867} -09/20/2021 15:39:39 - INFO - __main__ - Step 5418: {'lr': 9.013333333333333e-05, 'samples': 173376, 'steps': 338, 'loss/train': 6.1789937019348145} -09/20/2021 15:39:40 - INFO - __main__ - Step 5419: {'lr': 9.013333333333333e-05, 'samples': 173408, 'steps': 338, 'loss/train': 5.712224960327148} -09/20/2021 15:39:41 - INFO - __main__ - Step 5420: {'lr': 9.013333333333333e-05, 'samples': 173440, 'steps': 338, 'loss/train': 5.447385787963867} -09/20/2021 15:39:42 - INFO - __main__ - Step 5421: {'lr': 9.013333333333333e-05, 'samples': 173472, 'steps': 338, 'loss/train': 5.258033752441406} -09/20/2021 15:39:42 - INFO - __main__ - Step 5422: {'lr': 9.013333333333333e-05, 'samples': 173504, 'steps': 338, 'loss/train': 5.465023517608643} -09/20/2021 15:39:43 - INFO - __main__ - Step 5423: {'lr': 9.013333333333333e-05, 'samples': 173536, 'steps': 338, 'loss/train': 5.288208961486816} -09/20/2021 15:39:44 - INFO - __main__ - Step 5424: {'lr': 9.013333333333333e-05, 'samples': 173568, 'steps': 338, 'loss/train': 6.0776519775390625} -09/20/2021 15:39:45 - INFO - __main__ - Step 5425: {'lr': 9.04e-05, 'samples': 173600, 'steps': 339, 'loss/train': 5.747385025024414} -09/20/2021 15:39:45 - INFO - __main__ - Step 5426: {'lr': 9.04e-05, 'samples': 173632, 'steps': 339, 'loss/train': 5.4006757736206055} -09/20/2021 15:39:46 - INFO - __main__ - Step 5427: {'lr': 9.04e-05, 'samples': 173664, 'steps': 339, 'loss/train': 5.422842979431152} -09/20/2021 15:39:47 - INFO - __main__ - Step 5428: {'lr': 9.04e-05, 'samples': 173696, 'steps': 339, 'loss/train': 5.21320915222168} -09/20/2021 15:39:48 - INFO - __main__ - Step 5429: {'lr': 9.04e-05, 'samples': 173728, 'steps': 339, 'loss/train': 6.408205509185791} -09/20/2021 15:39:48 - INFO - __main__ - Step 5430: {'lr': 9.04e-05, 'samples': 173760, 'steps': 339, 'loss/train': 4.535247802734375} -09/20/2021 15:39:49 - INFO - __main__ - Step 5431: {'lr': 9.04e-05, 'samples': 173792, 'steps': 339, 'loss/train': 5.632444858551025} -09/20/2021 15:39:50 - INFO - __main__ - Step 5432: {'lr': 9.04e-05, 'samples': 173824, 'steps': 339, 'loss/train': 6.282907962799072} -09/20/2021 15:39:51 - INFO - __main__ - Step 5433: {'lr': 9.04e-05, 'samples': 173856, 'steps': 339, 'loss/train': 4.395140171051025} -09/20/2021 15:39:51 - INFO - __main__ - Step 5434: {'lr': 9.04e-05, 'samples': 173888, 'steps': 339, 'loss/train': 5.409454345703125} -09/20/2021 15:39:52 - INFO - __main__ - Step 5435: {'lr': 9.04e-05, 'samples': 173920, 'steps': 339, 'loss/train': 4.4227423667907715} -09/20/2021 15:39:53 - INFO - __main__ - Step 5436: {'lr': 9.04e-05, 'samples': 173952, 'steps': 339, 'loss/train': 6.337096214294434} -09/20/2021 15:39:54 - INFO - __main__ - Step 5437: {'lr': 9.04e-05, 'samples': 173984, 'steps': 339, 'loss/train': 5.819645404815674} -09/20/2021 15:39:54 - INFO - __main__ - Step 5438: {'lr': 9.04e-05, 'samples': 174016, 'steps': 339, 'loss/train': 5.175497531890869} -09/20/2021 15:39:55 - INFO - __main__ - Step 5439: {'lr': 9.04e-05, 'samples': 174048, 'steps': 339, 'loss/train': 4.996785640716553} -09/20/2021 15:39:56 - INFO - __main__ - Step 5440: {'lr': 9.04e-05, 'samples': 174080, 'steps': 339, 'loss/train': 5.028481960296631} -09/20/2021 15:39:57 - INFO - __main__ - Step 5441: {'lr': 9.066666666666667e-05, 'samples': 174112, 'steps': 340, 'loss/train': 5.042288303375244} -09/20/2021 15:39:58 - INFO - __main__ - Step 5442: {'lr': 9.066666666666667e-05, 'samples': 174144, 'steps': 340, 'loss/train': 3.05120849609375} -09/20/2021 15:39:58 - INFO - __main__ - Step 5443: {'lr': 9.066666666666667e-05, 'samples': 174176, 'steps': 340, 'loss/train': 4.070204734802246} -09/20/2021 15:39:59 - INFO - __main__ - Step 5444: {'lr': 9.066666666666667e-05, 'samples': 174208, 'steps': 340, 'loss/train': 4.319990158081055} -09/20/2021 15:40:00 - INFO - __main__ - Step 5445: {'lr': 9.066666666666667e-05, 'samples': 174240, 'steps': 340, 'loss/train': 0.79044109582901} -09/20/2021 15:40:01 - INFO - __main__ - Step 5446: {'lr': 9.066666666666667e-05, 'samples': 174272, 'steps': 340, 'loss/train': 4.365241050720215} -09/20/2021 15:40:01 - INFO - __main__ - Step 5447: {'lr': 9.066666666666667e-05, 'samples': 174304, 'steps': 340, 'loss/train': 5.225815773010254} -09/20/2021 15:40:03 - INFO - __main__ - Step 5448: {'lr': 9.066666666666667e-05, 'samples': 174336, 'steps': 340, 'loss/train': 5.723926544189453} -09/20/2021 15:40:04 - INFO - __main__ - Step 5449: {'lr': 9.066666666666667e-05, 'samples': 174368, 'steps': 340, 'loss/train': 4.663421630859375} -09/20/2021 15:40:04 - INFO - __main__ - Step 5450: {'lr': 9.066666666666667e-05, 'samples': 174400, 'steps': 340, 'loss/train': 5.811573505401611} -09/20/2021 15:40:05 - INFO - __main__ - Step 5451: {'lr': 9.066666666666667e-05, 'samples': 174432, 'steps': 340, 'loss/train': 5.870090007781982} -09/20/2021 15:40:06 - INFO - __main__ - Step 5452: {'lr': 9.066666666666667e-05, 'samples': 174464, 'steps': 340, 'loss/train': 5.60637903213501} -09/20/2021 15:40:07 - INFO - __main__ - Step 5453: {'lr': 9.066666666666667e-05, 'samples': 174496, 'steps': 340, 'loss/train': 5.391072750091553} -09/20/2021 15:40:07 - INFO - __main__ - Step 5454: {'lr': 9.066666666666667e-05, 'samples': 174528, 'steps': 340, 'loss/train': 4.837014675140381} -09/20/2021 15:40:08 - INFO - __main__ - Step 5455: {'lr': 9.066666666666667e-05, 'samples': 174560, 'steps': 340, 'loss/train': 8.686563491821289} -09/20/2021 15:40:09 - INFO - __main__ - Step 5456: {'lr': 9.066666666666667e-05, 'samples': 174592, 'steps': 340, 'loss/train': 5.090390205383301} -09/20/2021 15:40:10 - INFO - __main__ - Step 5457: {'lr': 9.093333333333334e-05, 'samples': 174624, 'steps': 341, 'loss/train': 4.2689032554626465} -09/20/2021 15:40:10 - INFO - __main__ - Step 5458: {'lr': 9.093333333333334e-05, 'samples': 174656, 'steps': 341, 'loss/train': 5.1582536697387695} -09/20/2021 15:40:11 - INFO - __main__ - Step 5459: {'lr': 9.093333333333334e-05, 'samples': 174688, 'steps': 341, 'loss/train': 5.231231212615967} -09/20/2021 15:40:12 - INFO - __main__ - Step 5460: {'lr': 9.093333333333334e-05, 'samples': 174720, 'steps': 341, 'loss/train': 3.0525286197662354} -09/20/2021 15:40:13 - INFO - __main__ - Step 5461: {'lr': 9.093333333333334e-05, 'samples': 174752, 'steps': 341, 'loss/train': 4.288314342498779} -09/20/2021 15:40:13 - INFO - __main__ - Step 5462: {'lr': 9.093333333333334e-05, 'samples': 174784, 'steps': 341, 'loss/train': 3.0058088302612305} -09/20/2021 15:40:14 - INFO - __main__ - Step 5463: {'lr': 9.093333333333334e-05, 'samples': 174816, 'steps': 341, 'loss/train': 2.792443037033081} -09/20/2021 15:40:15 - INFO - __main__ - Step 5464: {'lr': 9.093333333333334e-05, 'samples': 174848, 'steps': 341, 'loss/train': 3.778219223022461} -09/20/2021 15:40:16 - INFO - __main__ - Step 5465: {'lr': 9.093333333333334e-05, 'samples': 174880, 'steps': 341, 'loss/train': 3.0269505977630615} -09/20/2021 15:40:16 - INFO - __main__ - Step 5466: {'lr': 9.093333333333334e-05, 'samples': 174912, 'steps': 341, 'loss/train': 2.786797285079956} -09/20/2021 15:40:17 - INFO - __main__ - Step 5467: {'lr': 9.093333333333334e-05, 'samples': 174944, 'steps': 341, 'loss/train': 5.774354934692383} -09/20/2021 15:40:18 - INFO - __main__ - Step 5468: {'lr': 9.093333333333334e-05, 'samples': 174976, 'steps': 341, 'loss/train': 6.457828044891357} -09/20/2021 15:40:19 - INFO - __main__ - Step 5469: {'lr': 9.093333333333334e-05, 'samples': 175008, 'steps': 341, 'loss/train': 5.144443988800049} -09/20/2021 15:40:19 - INFO - __main__ - Step 5470: {'lr': 9.093333333333334e-05, 'samples': 175040, 'steps': 341, 'loss/train': 4.734076023101807} -09/20/2021 15:40:20 - INFO - __main__ - Step 5471: {'lr': 9.093333333333334e-05, 'samples': 175072, 'steps': 341, 'loss/train': 6.414511203765869} -09/20/2021 15:40:21 - INFO - __main__ - Step 5472: {'lr': 9.093333333333334e-05, 'samples': 175104, 'steps': 341, 'loss/train': 5.26296854019165} -09/20/2021 15:40:22 - INFO - __main__ - Step 5473: {'lr': 9.120000000000001e-05, 'samples': 175136, 'steps': 342, 'loss/train': 3.9741015434265137} -09/20/2021 15:40:23 - INFO - __main__ - Step 5474: {'lr': 9.120000000000001e-05, 'samples': 175168, 'steps': 342, 'loss/train': 5.563560962677002} -09/20/2021 15:40:23 - INFO - __main__ - Step 5475: {'lr': 9.120000000000001e-05, 'samples': 175200, 'steps': 342, 'loss/train': 5.5657572746276855} -09/20/2021 15:40:24 - INFO - __main__ - Step 5476: {'lr': 9.120000000000001e-05, 'samples': 175232, 'steps': 342, 'loss/train': 3.7923474311828613} -09/20/2021 15:40:25 - INFO - __main__ - Step 5477: {'lr': 9.120000000000001e-05, 'samples': 175264, 'steps': 342, 'loss/train': 3.815202236175537} -09/20/2021 15:40:26 - INFO - __main__ - Step 5478: {'lr': 9.120000000000001e-05, 'samples': 175296, 'steps': 342, 'loss/train': 6.279961109161377} -09/20/2021 15:40:26 - INFO - __main__ - Step 5479: {'lr': 9.120000000000001e-05, 'samples': 175328, 'steps': 342, 'loss/train': 4.906879425048828} -09/20/2021 15:40:27 - INFO - __main__ - Step 5480: {'lr': 9.120000000000001e-05, 'samples': 175360, 'steps': 342, 'loss/train': 5.348393440246582} -09/20/2021 15:40:28 - INFO - __main__ - Step 5481: {'lr': 9.120000000000001e-05, 'samples': 175392, 'steps': 342, 'loss/train': 6.18222713470459} -09/20/2021 15:40:29 - INFO - __main__ - Step 5482: {'lr': 9.120000000000001e-05, 'samples': 175424, 'steps': 342, 'loss/train': 5.1833672523498535} -09/20/2021 15:40:30 - INFO - __main__ - Step 5483: {'lr': 9.120000000000001e-05, 'samples': 175456, 'steps': 342, 'loss/train': 5.424426078796387} -09/20/2021 15:40:31 - INFO - __main__ - Step 5484: {'lr': 9.120000000000001e-05, 'samples': 175488, 'steps': 342, 'loss/train': 6.072707653045654} -09/20/2021 15:40:31 - INFO - __main__ - Step 5485: {'lr': 9.120000000000001e-05, 'samples': 175520, 'steps': 342, 'loss/train': 5.357459545135498} -09/20/2021 15:40:32 - INFO - __main__ - Step 5486: {'lr': 9.120000000000001e-05, 'samples': 175552, 'steps': 342, 'loss/train': 5.035484313964844} -09/20/2021 15:40:33 - INFO - __main__ - Step 5487: {'lr': 9.120000000000001e-05, 'samples': 175584, 'steps': 342, 'loss/train': 5.874192714691162} -09/20/2021 15:40:34 - INFO - __main__ - Step 5488: {'lr': 9.120000000000001e-05, 'samples': 175616, 'steps': 342, 'loss/train': 4.668027877807617} -09/20/2021 15:40:35 - INFO - __main__ - Step 5489: {'lr': 9.146666666666666e-05, 'samples': 175648, 'steps': 343, 'loss/train': 5.027698516845703} -09/20/2021 15:40:35 - INFO - __main__ - Step 5490: {'lr': 9.146666666666666e-05, 'samples': 175680, 'steps': 343, 'loss/train': 5.347578525543213} -09/20/2021 15:40:36 - INFO - __main__ - Step 5491: {'lr': 9.146666666666666e-05, 'samples': 175712, 'steps': 343, 'loss/train': 5.973912715911865} -09/20/2021 15:40:37 - INFO - __main__ - Step 5492: {'lr': 9.146666666666666e-05, 'samples': 175744, 'steps': 343, 'loss/train': 5.637224197387695} -09/20/2021 15:40:38 - INFO - __main__ - Step 5493: {'lr': 9.146666666666666e-05, 'samples': 175776, 'steps': 343, 'loss/train': 4.953136444091797} -09/20/2021 15:40:38 - INFO - __main__ - Step 5494: {'lr': 9.146666666666666e-05, 'samples': 175808, 'steps': 343, 'loss/train': 5.500664234161377} -09/20/2021 15:40:39 - INFO - __main__ - Step 5495: {'lr': 9.146666666666666e-05, 'samples': 175840, 'steps': 343, 'loss/train': 5.905028820037842} -09/20/2021 15:40:40 - INFO - __main__ - Step 5496: {'lr': 9.146666666666666e-05, 'samples': 175872, 'steps': 343, 'loss/train': 5.066688060760498} -09/20/2021 15:40:41 - INFO - __main__ - Step 5497: {'lr': 9.146666666666666e-05, 'samples': 175904, 'steps': 343, 'loss/train': 5.592641830444336} -09/20/2021 15:40:41 - INFO - __main__ - Step 5498: {'lr': 9.146666666666666e-05, 'samples': 175936, 'steps': 343, 'loss/train': 5.193167686462402} -09/20/2021 15:40:42 - INFO - __main__ - Step 5499: {'lr': 9.146666666666666e-05, 'samples': 175968, 'steps': 343, 'loss/train': 5.746843338012695} -09/20/2021 15:40:43 - INFO - __main__ - Step 5500: {'lr': 9.146666666666666e-05, 'samples': 176000, 'steps': 343, 'loss/train': 4.314781188964844} -09/20/2021 15:40:44 - INFO - __main__ - Step 5501: {'lr': 9.146666666666666e-05, 'samples': 176032, 'steps': 343, 'loss/train': 5.571049690246582} -09/20/2021 15:40:44 - INFO - __main__ - Step 5502: {'lr': 9.146666666666666e-05, 'samples': 176064, 'steps': 343, 'loss/train': 5.3748698234558105} -09/20/2021 15:40:45 - INFO - __main__ - Step 5503: {'lr': 9.146666666666666e-05, 'samples': 176096, 'steps': 343, 'loss/train': 5.348785877227783} -09/20/2021 15:40:46 - INFO - __main__ - Step 5504: {'lr': 9.146666666666666e-05, 'samples': 176128, 'steps': 343, 'loss/train': 6.266200542449951} -09/20/2021 15:40:47 - INFO - __main__ - Step 5505: {'lr': 9.173333333333333e-05, 'samples': 176160, 'steps': 344, 'loss/train': 5.019848823547363} -09/20/2021 15:40:48 - INFO - __main__ - Step 5506: {'lr': 9.173333333333333e-05, 'samples': 176192, 'steps': 344, 'loss/train': 6.520395755767822} -09/20/2021 15:40:48 - INFO - __main__ - Step 5507: {'lr': 9.173333333333333e-05, 'samples': 176224, 'steps': 344, 'loss/train': 3.338437795639038} -09/20/2021 15:40:49 - INFO - __main__ - Step 5508: {'lr': 9.173333333333333e-05, 'samples': 176256, 'steps': 344, 'loss/train': 5.440505027770996} -09/20/2021 15:40:50 - INFO - __main__ - Step 5509: {'lr': 9.173333333333333e-05, 'samples': 176288, 'steps': 344, 'loss/train': 5.432440280914307} -09/20/2021 15:40:51 - INFO - __main__ - Step 5510: {'lr': 9.173333333333333e-05, 'samples': 176320, 'steps': 344, 'loss/train': 5.015069484710693} -09/20/2021 15:40:51 - INFO - __main__ - Step 5511: {'lr': 9.173333333333333e-05, 'samples': 176352, 'steps': 344, 'loss/train': 2.7534196376800537} -09/20/2021 15:40:54 - INFO - __main__ - Step 5512: {'lr': 9.173333333333333e-05, 'samples': 176384, 'steps': 344, 'loss/train': 2.905034303665161} -09/20/2021 15:40:55 - INFO - __main__ - Step 5513: {'lr': 9.173333333333333e-05, 'samples': 176416, 'steps': 344, 'loss/train': 5.491565227508545} -09/20/2021 15:40:55 - INFO - __main__ - Step 5514: {'lr': 9.173333333333333e-05, 'samples': 176448, 'steps': 344, 'loss/train': 5.437163829803467} -09/20/2021 15:40:56 - INFO - __main__ - Step 5515: {'lr': 9.173333333333333e-05, 'samples': 176480, 'steps': 344, 'loss/train': 5.731266975402832} -09/20/2021 15:40:57 - INFO - __main__ - Step 5516: {'lr': 9.173333333333333e-05, 'samples': 176512, 'steps': 344, 'loss/train': 5.799922466278076} -09/20/2021 15:40:58 - INFO - __main__ - Step 5517: {'lr': 9.173333333333333e-05, 'samples': 176544, 'steps': 344, 'loss/train': 5.506438255310059} -09/20/2021 15:40:58 - INFO - __main__ - Step 5518: {'lr': 9.173333333333333e-05, 'samples': 176576, 'steps': 344, 'loss/train': 4.860450744628906} -09/20/2021 15:40:59 - INFO - __main__ - Step 5519: {'lr': 9.173333333333333e-05, 'samples': 176608, 'steps': 344, 'loss/train': 4.5448431968688965} -09/20/2021 15:41:00 - INFO - __main__ - Step 5520: {'lr': 9.173333333333333e-05, 'samples': 176640, 'steps': 344, 'loss/train': 5.547249794006348} -09/20/2021 15:41:01 - INFO - __main__ - Step 5521: {'lr': 9.200000000000001e-05, 'samples': 176672, 'steps': 345, 'loss/train': 5.1532464027404785} -09/20/2021 15:41:01 - INFO - __main__ - Step 5522: {'lr': 9.200000000000001e-05, 'samples': 176704, 'steps': 345, 'loss/train': 5.389433860778809} -09/20/2021 15:41:02 - INFO - __main__ - Step 5523: {'lr': 9.200000000000001e-05, 'samples': 176736, 'steps': 345, 'loss/train': 5.264421463012695} -09/20/2021 15:41:03 - INFO - __main__ - Step 5524: {'lr': 9.200000000000001e-05, 'samples': 176768, 'steps': 345, 'loss/train': 5.114089012145996} -09/20/2021 15:41:04 - INFO - __main__ - Step 5525: {'lr': 9.200000000000001e-05, 'samples': 176800, 'steps': 345, 'loss/train': 5.102212429046631} -09/20/2021 15:41:04 - INFO - __main__ - Step 5526: {'lr': 9.200000000000001e-05, 'samples': 176832, 'steps': 345, 'loss/train': 5.101009845733643} -09/20/2021 15:41:05 - INFO - __main__ - Step 5527: {'lr': 9.200000000000001e-05, 'samples': 176864, 'steps': 345, 'loss/train': 5.327374458312988} -09/20/2021 15:41:06 - INFO - __main__ - Step 5528: {'lr': 9.200000000000001e-05, 'samples': 176896, 'steps': 345, 'loss/train': 5.215038299560547} -09/20/2021 15:41:07 - INFO - __main__ - Step 5529: {'lr': 9.200000000000001e-05, 'samples': 176928, 'steps': 345, 'loss/train': 5.563596248626709} -09/20/2021 15:41:07 - INFO - __main__ - Step 5530: {'lr': 9.200000000000001e-05, 'samples': 176960, 'steps': 345, 'loss/train': 5.593835353851318} -09/20/2021 15:41:08 - INFO - __main__ - Step 5531: {'lr': 9.200000000000001e-05, 'samples': 176992, 'steps': 345, 'loss/train': 5.430323123931885} -09/20/2021 15:41:09 - INFO - __main__ - Step 5532: {'lr': 9.200000000000001e-05, 'samples': 177024, 'steps': 345, 'loss/train': 5.432932376861572} -09/20/2021 15:41:10 - INFO - __main__ - Step 5533: {'lr': 9.200000000000001e-05, 'samples': 177056, 'steps': 345, 'loss/train': 5.214032173156738} -09/20/2021 15:41:10 - INFO - __main__ - Step 5534: {'lr': 9.200000000000001e-05, 'samples': 177088, 'steps': 345, 'loss/train': 4.882608413696289} -09/20/2021 15:41:11 - INFO - __main__ - Step 5535: {'lr': 9.200000000000001e-05, 'samples': 177120, 'steps': 345, 'loss/train': 5.227992534637451} -09/20/2021 15:41:12 - INFO - __main__ - Step 5536: {'lr': 9.200000000000001e-05, 'samples': 177152, 'steps': 345, 'loss/train': 5.827428817749023} -09/20/2021 15:41:13 - INFO - __main__ - Step 5537: {'lr': 9.226666666666667e-05, 'samples': 177184, 'steps': 346, 'loss/train': 5.71653413772583} -09/20/2021 15:41:14 - INFO - __main__ - Step 5538: {'lr': 9.226666666666667e-05, 'samples': 177216, 'steps': 346, 'loss/train': 5.346329212188721} -09/20/2021 15:41:14 - INFO - __main__ - Step 5539: {'lr': 9.226666666666667e-05, 'samples': 177248, 'steps': 346, 'loss/train': 3.822739362716675} -09/20/2021 15:41:15 - INFO - __main__ - Step 5540: {'lr': 9.226666666666667e-05, 'samples': 177280, 'steps': 346, 'loss/train': 3.8205432891845703} -09/20/2021 15:41:16 - INFO - __main__ - Step 5541: {'lr': 9.226666666666667e-05, 'samples': 177312, 'steps': 346, 'loss/train': 3.8150229454040527} -09/20/2021 15:41:17 - INFO - __main__ - Step 5542: {'lr': 9.226666666666667e-05, 'samples': 177344, 'steps': 346, 'loss/train': 5.280844688415527} -09/20/2021 15:41:17 - INFO - __main__ - Step 5543: {'lr': 9.226666666666667e-05, 'samples': 177376, 'steps': 346, 'loss/train': 5.203717231750488} -09/20/2021 15:41:18 - INFO - __main__ - Step 5544: {'lr': 9.226666666666667e-05, 'samples': 177408, 'steps': 346, 'loss/train': 5.3951191902160645} -09/20/2021 15:41:19 - INFO - __main__ - Step 5545: {'lr': 9.226666666666667e-05, 'samples': 177440, 'steps': 346, 'loss/train': 5.56262731552124} -09/20/2021 15:41:20 - INFO - __main__ - Step 5546: {'lr': 9.226666666666667e-05, 'samples': 177472, 'steps': 346, 'loss/train': 5.205550193786621} -09/20/2021 15:41:20 - INFO - __main__ - Step 5547: {'lr': 9.226666666666667e-05, 'samples': 177504, 'steps': 346, 'loss/train': 5.739883899688721} -09/20/2021 15:41:21 - INFO - __main__ - Step 5548: {'lr': 9.226666666666667e-05, 'samples': 177536, 'steps': 346, 'loss/train': 4.655445575714111} -09/20/2021 15:41:22 - INFO - __main__ - Step 5549: {'lr': 9.226666666666667e-05, 'samples': 177568, 'steps': 346, 'loss/train': 6.046304225921631} -09/20/2021 15:41:23 - INFO - __main__ - Step 5550: {'lr': 9.226666666666667e-05, 'samples': 177600, 'steps': 346, 'loss/train': 4.951590538024902} -09/20/2021 15:41:24 - INFO - __main__ - Step 5551: {'lr': 9.226666666666667e-05, 'samples': 177632, 'steps': 346, 'loss/train': 5.4689459800720215} -09/20/2021 15:41:25 - INFO - __main__ - Step 5552: {'lr': 9.226666666666667e-05, 'samples': 177664, 'steps': 346, 'loss/train': 5.03894567489624} -09/20/2021 15:41:26 - INFO - __main__ - Step 5553: {'lr': 9.253333333333334e-05, 'samples': 177696, 'steps': 347, 'loss/train': 6.014812469482422} -09/20/2021 15:41:26 - INFO - __main__ - Step 5554: {'lr': 9.253333333333334e-05, 'samples': 177728, 'steps': 347, 'loss/train': 5.676041603088379} -09/20/2021 15:41:27 - INFO - __main__ - Step 5555: {'lr': 9.253333333333334e-05, 'samples': 177760, 'steps': 347, 'loss/train': 5.2041168212890625} -09/20/2021 15:41:28 - INFO - __main__ - Step 5556: {'lr': 9.253333333333334e-05, 'samples': 177792, 'steps': 347, 'loss/train': 5.748292446136475} -09/20/2021 15:41:29 - INFO - __main__ - Step 5557: {'lr': 9.253333333333334e-05, 'samples': 177824, 'steps': 347, 'loss/train': 5.339812278747559} -09/20/2021 15:41:29 - INFO - __main__ - Step 5558: {'lr': 9.253333333333334e-05, 'samples': 177856, 'steps': 347, 'loss/train': 5.330984592437744} -09/20/2021 15:41:30 - INFO - __main__ - Step 5559: {'lr': 9.253333333333334e-05, 'samples': 177888, 'steps': 347, 'loss/train': 5.789372444152832} -09/20/2021 15:41:31 - INFO - __main__ - Step 5560: {'lr': 9.253333333333334e-05, 'samples': 177920, 'steps': 347, 'loss/train': 5.302978038787842} -09/20/2021 15:41:32 - INFO - __main__ - Step 5561: {'lr': 9.253333333333334e-05, 'samples': 177952, 'steps': 347, 'loss/train': 6.00895357131958} -09/20/2021 15:41:32 - INFO - __main__ - Step 5562: {'lr': 9.253333333333334e-05, 'samples': 177984, 'steps': 347, 'loss/train': 4.645674228668213} -09/20/2021 15:41:33 - INFO - __main__ - Step 5563: {'lr': 9.253333333333334e-05, 'samples': 178016, 'steps': 347, 'loss/train': 5.512679100036621} -09/20/2021 15:41:34 - INFO - __main__ - Step 5564: {'lr': 9.253333333333334e-05, 'samples': 178048, 'steps': 347, 'loss/train': 5.9419379234313965} -09/20/2021 15:41:35 - INFO - __main__ - Step 5565: {'lr': 9.253333333333334e-05, 'samples': 178080, 'steps': 347, 'loss/train': 3.1105146408081055} -09/20/2021 15:41:36 - INFO - __main__ - Step 5566: {'lr': 9.253333333333334e-05, 'samples': 178112, 'steps': 347, 'loss/train': 3.0075032711029053} -09/20/2021 15:41:36 - INFO - __main__ - Step 5567: {'lr': 9.253333333333334e-05, 'samples': 178144, 'steps': 347, 'loss/train': 2.8887717723846436} -09/20/2021 15:41:37 - INFO - __main__ - Step 5568: {'lr': 9.253333333333334e-05, 'samples': 178176, 'steps': 347, 'loss/train': 5.608914852142334} -09/20/2021 15:41:38 - INFO - __main__ - Step 5569: {'lr': 9.28e-05, 'samples': 178208, 'steps': 348, 'loss/train': 6.040829181671143} -09/20/2021 15:41:39 - INFO - __main__ - Step 5570: {'lr': 9.28e-05, 'samples': 178240, 'steps': 348, 'loss/train': 5.449212074279785} -09/20/2021 15:41:39 - INFO - __main__ - Step 5571: {'lr': 9.28e-05, 'samples': 178272, 'steps': 348, 'loss/train': 4.975844383239746} -09/20/2021 15:41:40 - INFO - __main__ - Step 5572: {'lr': 9.28e-05, 'samples': 178304, 'steps': 348, 'loss/train': 5.733387470245361} -09/20/2021 15:41:41 - INFO - __main__ - Step 5573: {'lr': 9.28e-05, 'samples': 178336, 'steps': 348, 'loss/train': 5.796306133270264} -09/20/2021 15:41:42 - INFO - __main__ - Step 5574: {'lr': 9.28e-05, 'samples': 178368, 'steps': 348, 'loss/train': 4.927916526794434} -09/20/2021 15:41:42 - INFO - __main__ - Step 5575: {'lr': 9.28e-05, 'samples': 178400, 'steps': 348, 'loss/train': 4.8048481941223145} -09/20/2021 15:41:43 - INFO - __main__ - Step 5576: {'lr': 9.28e-05, 'samples': 178432, 'steps': 348, 'loss/train': 5.8723320960998535} -09/20/2021 15:41:44 - INFO - __main__ - Step 5577: {'lr': 9.28e-05, 'samples': 178464, 'steps': 348, 'loss/train': 4.99798059463501} -09/20/2021 15:41:45 - INFO - __main__ - Step 5578: {'lr': 9.28e-05, 'samples': 178496, 'steps': 348, 'loss/train': 4.907747745513916} -09/20/2021 15:41:45 - INFO - __main__ - Step 5579: {'lr': 9.28e-05, 'samples': 178528, 'steps': 348, 'loss/train': 6.255158424377441} -09/20/2021 15:41:46 - INFO - __main__ - Step 5580: {'lr': 9.28e-05, 'samples': 178560, 'steps': 348, 'loss/train': 4.368497848510742} -09/20/2021 15:41:47 - INFO - __main__ - Step 5581: {'lr': 9.28e-05, 'samples': 178592, 'steps': 348, 'loss/train': 4.673708438873291} -09/20/2021 15:41:48 - INFO - __main__ - Step 5582: {'lr': 9.28e-05, 'samples': 178624, 'steps': 348, 'loss/train': 4.3714470863342285} -09/20/2021 15:41:49 - INFO - __main__ - Step 5583: {'lr': 9.28e-05, 'samples': 178656, 'steps': 348, 'loss/train': 5.492004871368408} -09/20/2021 15:41:50 - INFO - __main__ - Step 5584: {'lr': 9.28e-05, 'samples': 178688, 'steps': 348, 'loss/train': 5.2347941398620605} -09/20/2021 15:41:51 - INFO - __main__ - Step 5585: {'lr': 9.306666666666667e-05, 'samples': 178720, 'steps': 349, 'loss/train': 5.52326774597168} -09/20/2021 15:41:51 - INFO - __main__ - Step 5586: {'lr': 9.306666666666667e-05, 'samples': 178752, 'steps': 349, 'loss/train': 5.168998718261719} -09/20/2021 15:41:52 - INFO - __main__ - Step 5587: {'lr': 9.306666666666667e-05, 'samples': 178784, 'steps': 349, 'loss/train': 5.387095928192139} -09/20/2021 15:41:53 - INFO - __main__ - Step 5588: {'lr': 9.306666666666667e-05, 'samples': 178816, 'steps': 349, 'loss/train': 6.600735664367676} -09/20/2021 15:41:54 - INFO - __main__ - Step 5589: {'lr': 9.306666666666667e-05, 'samples': 178848, 'steps': 349, 'loss/train': 5.348033428192139} -09/20/2021 15:41:54 - INFO - __main__ - Step 5590: {'lr': 9.306666666666667e-05, 'samples': 178880, 'steps': 349, 'loss/train': 5.064727306365967} -09/20/2021 15:41:55 - INFO - __main__ - Step 5591: {'lr': 9.306666666666667e-05, 'samples': 178912, 'steps': 349, 'loss/train': 5.199248790740967} -09/20/2021 15:41:56 - INFO - __main__ - Step 5592: {'lr': 9.306666666666667e-05, 'samples': 178944, 'steps': 349, 'loss/train': 3.6228835582733154} -09/20/2021 15:41:57 - INFO - __main__ - Step 5593: {'lr': 9.306666666666667e-05, 'samples': 178976, 'steps': 349, 'loss/train': 4.655359268188477} -09/20/2021 15:41:57 - INFO - __main__ - Step 5594: {'lr': 9.306666666666667e-05, 'samples': 179008, 'steps': 349, 'loss/train': 5.7903523445129395} -09/20/2021 15:41:58 - INFO - __main__ - Step 5595: {'lr': 9.306666666666667e-05, 'samples': 179040, 'steps': 349, 'loss/train': 5.156915664672852} -09/20/2021 15:41:59 - INFO - __main__ - Step 5596: {'lr': 9.306666666666667e-05, 'samples': 179072, 'steps': 349, 'loss/train': 5.207408905029297} -09/20/2021 15:42:00 - INFO - __main__ - Step 5597: {'lr': 9.306666666666667e-05, 'samples': 179104, 'steps': 349, 'loss/train': 5.719457149505615} -09/20/2021 15:42:00 - INFO - __main__ - Step 5598: {'lr': 9.306666666666667e-05, 'samples': 179136, 'steps': 349, 'loss/train': 5.580404758453369} -09/20/2021 15:42:01 - INFO - __main__ - Step 5599: {'lr': 9.306666666666667e-05, 'samples': 179168, 'steps': 349, 'loss/train': 5.844814777374268} -09/20/2021 15:42:02 - INFO - __main__ - Step 5600: {'lr': 9.306666666666667e-05, 'samples': 179200, 'steps': 349, 'loss/train': 5.466605186462402} -09/20/2021 15:42:03 - INFO - __main__ - Step 5601: {'lr': 9.333333333333334e-05, 'samples': 179232, 'steps': 350, 'loss/train': 5.680483818054199} -09/20/2021 15:42:04 - INFO - __main__ - Step 5602: {'lr': 9.333333333333334e-05, 'samples': 179264, 'steps': 350, 'loss/train': 5.718944549560547} -09/20/2021 15:42:04 - INFO - __main__ - Step 5603: {'lr': 9.333333333333334e-05, 'samples': 179296, 'steps': 350, 'loss/train': 9.51846981048584} -09/20/2021 15:42:05 - INFO - __main__ - Step 5604: {'lr': 9.333333333333334e-05, 'samples': 179328, 'steps': 350, 'loss/train': 5.7753777503967285} -09/20/2021 15:42:06 - INFO - __main__ - Step 5605: {'lr': 9.333333333333334e-05, 'samples': 179360, 'steps': 350, 'loss/train': 5.53237771987915} -09/20/2021 15:42:07 - INFO - __main__ - Step 5606: {'lr': 9.333333333333334e-05, 'samples': 179392, 'steps': 350, 'loss/train': 4.430092811584473} -09/20/2021 15:42:07 - INFO - __main__ - Step 5607: {'lr': 9.333333333333334e-05, 'samples': 179424, 'steps': 350, 'loss/train': 7.190914630889893} -09/20/2021 15:42:08 - INFO - __main__ - Step 5608: {'lr': 9.333333333333334e-05, 'samples': 179456, 'steps': 350, 'loss/train': 7.138641357421875} -09/20/2021 15:42:09 - INFO - __main__ - Step 5609: {'lr': 9.333333333333334e-05, 'samples': 179488, 'steps': 350, 'loss/train': 7.302279949188232} -09/20/2021 15:42:10 - INFO - __main__ - Step 5610: {'lr': 9.333333333333334e-05, 'samples': 179520, 'steps': 350, 'loss/train': 7.175479412078857} -09/20/2021 15:42:10 - INFO - __main__ - Step 5611: {'lr': 9.333333333333334e-05, 'samples': 179552, 'steps': 350, 'loss/train': 7.285817623138428} -09/20/2021 15:42:11 - INFO - __main__ - Step 5612: {'lr': 9.333333333333334e-05, 'samples': 179584, 'steps': 350, 'loss/train': 5.456872463226318} -09/20/2021 15:42:12 - INFO - __main__ - Step 5613: {'lr': 9.333333333333334e-05, 'samples': 179616, 'steps': 350, 'loss/train': 6.060328006744385} -09/20/2021 15:42:13 - INFO - __main__ - Step 5614: {'lr': 9.333333333333334e-05, 'samples': 179648, 'steps': 350, 'loss/train': 5.770284175872803} -09/20/2021 15:42:13 - INFO - __main__ - Step 5615: {'lr': 9.333333333333334e-05, 'samples': 179680, 'steps': 350, 'loss/train': 5.315225124359131} -09/20/2021 15:42:14 - INFO - __main__ - Step 5616: {'lr': 9.333333333333334e-05, 'samples': 179712, 'steps': 350, 'loss/train': 4.870311737060547} -09/20/2021 15:42:15 - INFO - __main__ - Step 5617: {'lr': 9.360000000000001e-05, 'samples': 179744, 'steps': 351, 'loss/train': 4.766963958740234} -09/20/2021 15:42:16 - INFO - __main__ - Step 5618: {'lr': 9.360000000000001e-05, 'samples': 179776, 'steps': 351, 'loss/train': 5.025938987731934} -09/20/2021 15:42:17 - INFO - __main__ - Step 5619: {'lr': 9.360000000000001e-05, 'samples': 179808, 'steps': 351, 'loss/train': 5.023279190063477} -09/20/2021 15:42:18 - INFO - __main__ - Step 5620: {'lr': 9.360000000000001e-05, 'samples': 179840, 'steps': 351, 'loss/train': 5.94888162612915} -09/20/2021 15:42:18 - INFO - __main__ - Step 5621: {'lr': 9.360000000000001e-05, 'samples': 179872, 'steps': 351, 'loss/train': 4.599450588226318} -09/20/2021 15:42:19 - INFO - __main__ - Step 5622: {'lr': 9.360000000000001e-05, 'samples': 179904, 'steps': 351, 'loss/train': 4.716702461242676} -09/20/2021 15:42:20 - INFO - __main__ - Step 5623: {'lr': 9.360000000000001e-05, 'samples': 179936, 'steps': 351, 'loss/train': 5.668166160583496} -09/20/2021 15:42:21 - INFO - __main__ - Step 5624: {'lr': 9.360000000000001e-05, 'samples': 179968, 'steps': 351, 'loss/train': 5.123833656311035} -09/20/2021 15:42:21 - INFO - __main__ - Step 5625: {'lr': 9.360000000000001e-05, 'samples': 180000, 'steps': 351, 'loss/train': 5.297661781311035} -09/20/2021 15:42:22 - INFO - __main__ - Step 5626: {'lr': 9.360000000000001e-05, 'samples': 180032, 'steps': 351, 'loss/train': 5.055722236633301} -09/20/2021 15:42:23 - INFO - __main__ - Step 5627: {'lr': 9.360000000000001e-05, 'samples': 180064, 'steps': 351, 'loss/train': 3.9614734649658203} -09/20/2021 15:42:24 - INFO - __main__ - Step 5628: {'lr': 9.360000000000001e-05, 'samples': 180096, 'steps': 351, 'loss/train': 5.633477210998535} -09/20/2021 15:42:24 - INFO - __main__ - Step 5629: {'lr': 9.360000000000001e-05, 'samples': 180128, 'steps': 351, 'loss/train': 5.089399337768555} -09/20/2021 15:42:25 - INFO - __main__ - Step 5630: {'lr': 9.360000000000001e-05, 'samples': 180160, 'steps': 351, 'loss/train': 5.754918575286865} -09/20/2021 15:42:26 - INFO - __main__ - Step 5631: {'lr': 9.360000000000001e-05, 'samples': 180192, 'steps': 351, 'loss/train': 5.5740838050842285} -09/20/2021 15:42:27 - INFO - __main__ - Step 5632: {'lr': 9.360000000000001e-05, 'samples': 180224, 'steps': 351, 'loss/train': 5.948805809020996} -09/20/2021 15:42:28 - INFO - __main__ - Step 5633: {'lr': 9.386666666666667e-05, 'samples': 180256, 'steps': 352, 'loss/train': 5.671315670013428} -09/20/2021 15:42:28 - INFO - __main__ - Step 5634: {'lr': 9.386666666666667e-05, 'samples': 180288, 'steps': 352, 'loss/train': 5.004700183868408} -09/20/2021 15:42:29 - INFO - __main__ - Step 5635: {'lr': 9.386666666666667e-05, 'samples': 180320, 'steps': 352, 'loss/train': 5.758557319641113} -09/20/2021 15:42:30 - INFO - __main__ - Step 5636: {'lr': 9.386666666666667e-05, 'samples': 180352, 'steps': 352, 'loss/train': 3.1684606075286865} -09/20/2021 15:42:31 - INFO - __main__ - Step 5637: {'lr': 9.386666666666667e-05, 'samples': 180384, 'steps': 352, 'loss/train': 4.73129415512085} -09/20/2021 15:42:31 - INFO - __main__ - Step 5638: {'lr': 9.386666666666667e-05, 'samples': 180416, 'steps': 352, 'loss/train': 5.586840629577637} -09/20/2021 15:42:32 - INFO - __main__ - Step 5639: {'lr': 9.386666666666667e-05, 'samples': 180448, 'steps': 352, 'loss/train': 5.304491996765137} -09/20/2021 15:42:33 - INFO - __main__ - Step 5640: {'lr': 9.386666666666667e-05, 'samples': 180480, 'steps': 352, 'loss/train': 0.7812522649765015} -09/20/2021 15:42:34 - INFO - __main__ - Step 5641: {'lr': 9.386666666666667e-05, 'samples': 180512, 'steps': 352, 'loss/train': 5.680932521820068} -09/20/2021 15:42:34 - INFO - __main__ - Step 5642: {'lr': 9.386666666666667e-05, 'samples': 180544, 'steps': 352, 'loss/train': 5.422125339508057} -09/20/2021 15:42:35 - INFO - __main__ - Step 5643: {'lr': 9.386666666666667e-05, 'samples': 180576, 'steps': 352, 'loss/train': 4.479362964630127} -09/20/2021 15:42:36 - INFO - __main__ - Step 5644: {'lr': 9.386666666666667e-05, 'samples': 180608, 'steps': 352, 'loss/train': 4.7793965339660645} -09/20/2021 15:42:37 - INFO - __main__ - Step 5645: {'lr': 9.386666666666667e-05, 'samples': 180640, 'steps': 352, 'loss/train': 5.4366278648376465} -09/20/2021 15:42:37 - INFO - __main__ - Step 5646: {'lr': 9.386666666666667e-05, 'samples': 180672, 'steps': 352, 'loss/train': 5.637180805206299} -09/20/2021 15:42:38 - INFO - __main__ - Step 5647: {'lr': 9.386666666666667e-05, 'samples': 180704, 'steps': 352, 'loss/train': 4.616225719451904} -09/20/2021 15:42:39 - INFO - __main__ - Step 5648: {'lr': 9.386666666666667e-05, 'samples': 180736, 'steps': 352, 'loss/train': 4.370076656341553} -09/20/2021 15:42:41 - INFO - __main__ - Step 5649: {'lr': 9.413333333333334e-05, 'samples': 180768, 'steps': 353, 'loss/train': 5.53543758392334} -09/20/2021 15:42:41 - INFO - __main__ - Step 5650: {'lr': 9.413333333333334e-05, 'samples': 180800, 'steps': 353, 'loss/train': 6.163289546966553} -09/20/2021 15:42:42 - INFO - __main__ - Step 5651: {'lr': 9.413333333333334e-05, 'samples': 180832, 'steps': 353, 'loss/train': 5.363085746765137} -09/20/2021 15:42:43 - INFO - __main__ - Step 5652: {'lr': 9.413333333333334e-05, 'samples': 180864, 'steps': 353, 'loss/train': 4.78127908706665} -09/20/2021 15:42:44 - INFO - __main__ - Step 5653: {'lr': 9.413333333333334e-05, 'samples': 180896, 'steps': 353, 'loss/train': 5.166905879974365} -09/20/2021 15:42:44 - INFO - __main__ - Step 5654: {'lr': 9.413333333333334e-05, 'samples': 180928, 'steps': 353, 'loss/train': 5.171432018280029} -09/20/2021 15:42:45 - INFO - __main__ - Step 5655: {'lr': 9.413333333333334e-05, 'samples': 180960, 'steps': 353, 'loss/train': 4.9827775955200195} -09/20/2021 15:42:46 - INFO - __main__ - Step 5656: {'lr': 9.413333333333334e-05, 'samples': 180992, 'steps': 353, 'loss/train': 5.383551120758057} -09/20/2021 15:42:47 - INFO - __main__ - Step 5657: {'lr': 9.413333333333334e-05, 'samples': 181024, 'steps': 353, 'loss/train': 5.136074542999268} -09/20/2021 15:42:47 - INFO - __main__ - Step 5658: {'lr': 9.413333333333334e-05, 'samples': 181056, 'steps': 353, 'loss/train': 6.080063819885254} -09/20/2021 15:42:48 - INFO - __main__ - Step 5659: {'lr': 9.413333333333334e-05, 'samples': 181088, 'steps': 353, 'loss/train': 7.462455749511719} -09/20/2021 15:42:49 - INFO - __main__ - Step 5660: {'lr': 9.413333333333334e-05, 'samples': 181120, 'steps': 353, 'loss/train': 4.6756978034973145} -09/20/2021 15:42:50 - INFO - __main__ - Step 5661: {'lr': 9.413333333333334e-05, 'samples': 181152, 'steps': 353, 'loss/train': 4.964842796325684} -09/20/2021 15:42:50 - INFO - __main__ - Step 5662: {'lr': 9.413333333333334e-05, 'samples': 181184, 'steps': 353, 'loss/train': 4.537538528442383} -09/20/2021 15:42:51 - INFO - __main__ - Step 5663: {'lr': 9.413333333333334e-05, 'samples': 181216, 'steps': 353, 'loss/train': 5.558237552642822} -09/20/2021 15:42:52 - INFO - __main__ - Step 5664: {'lr': 9.413333333333334e-05, 'samples': 181248, 'steps': 353, 'loss/train': 2.9045636653900146} -09/20/2021 15:42:53 - INFO - __main__ - Step 5665: {'lr': 9.44e-05, 'samples': 181280, 'steps': 354, 'loss/train': 5.69777250289917} -09/20/2021 15:42:54 - INFO - __main__ - Step 5666: {'lr': 9.44e-05, 'samples': 181312, 'steps': 354, 'loss/train': 3.213541030883789} -09/20/2021 15:42:54 - INFO - __main__ - Step 5667: {'lr': 9.44e-05, 'samples': 181344, 'steps': 354, 'loss/train': 4.373147010803223} -09/20/2021 15:42:55 - INFO - __main__ - Step 5668: {'lr': 9.44e-05, 'samples': 181376, 'steps': 354, 'loss/train': 4.320862770080566} -09/20/2021 15:42:56 - INFO - __main__ - Step 5669: {'lr': 9.44e-05, 'samples': 181408, 'steps': 354, 'loss/train': 3.5052289962768555} -09/20/2021 15:42:57 - INFO - __main__ - Step 5670: {'lr': 9.44e-05, 'samples': 181440, 'steps': 354, 'loss/train': 3.7658369541168213} -09/20/2021 15:42:57 - INFO - __main__ - Step 5671: {'lr': 9.44e-05, 'samples': 181472, 'steps': 354, 'loss/train': 5.356414794921875} -09/20/2021 15:42:58 - INFO - __main__ - Step 5672: {'lr': 9.44e-05, 'samples': 181504, 'steps': 354, 'loss/train': 3.9586780071258545} -09/20/2021 15:42:59 - INFO - __main__ - Step 5673: {'lr': 9.44e-05, 'samples': 181536, 'steps': 354, 'loss/train': 5.290148735046387} -09/20/2021 15:43:00 - INFO - __main__ - Step 5674: {'lr': 9.44e-05, 'samples': 181568, 'steps': 354, 'loss/train': 5.545540809631348} -09/20/2021 15:43:00 - INFO - __main__ - Step 5675: {'lr': 9.44e-05, 'samples': 181600, 'steps': 354, 'loss/train': 5.512177467346191} -09/20/2021 15:43:01 - INFO - __main__ - Step 5676: {'lr': 9.44e-05, 'samples': 181632, 'steps': 354, 'loss/train': 4.64142370223999} -09/20/2021 15:43:02 - INFO - __main__ - Step 5677: {'lr': 9.44e-05, 'samples': 181664, 'steps': 354, 'loss/train': 4.884592056274414} -09/20/2021 15:43:03 - INFO - __main__ - Step 5678: {'lr': 9.44e-05, 'samples': 181696, 'steps': 354, 'loss/train': 5.2332377433776855} -09/20/2021 15:43:03 - INFO - __main__ - Step 5679: {'lr': 9.44e-05, 'samples': 181728, 'steps': 354, 'loss/train': 5.558607578277588} -09/20/2021 15:43:04 - INFO - __main__ - Step 5680: {'lr': 9.44e-05, 'samples': 181760, 'steps': 354, 'loss/train': 5.283943176269531} -09/20/2021 15:43:05 - INFO - __main__ - Step 5681: {'lr': 9.466666666666667e-05, 'samples': 181792, 'steps': 355, 'loss/train': 5.3767595291137695} -09/20/2021 15:43:06 - INFO - __main__ - Step 5682: {'lr': 9.466666666666667e-05, 'samples': 181824, 'steps': 355, 'loss/train': 5.749292373657227} -09/20/2021 15:43:06 - INFO - __main__ - Step 5683: {'lr': 9.466666666666667e-05, 'samples': 181856, 'steps': 355, 'loss/train': 4.683923721313477} -09/20/2021 15:43:07 - INFO - __main__ - Step 5684: {'lr': 9.466666666666667e-05, 'samples': 181888, 'steps': 355, 'loss/train': 5.566446304321289} -09/20/2021 15:43:09 - INFO - __main__ - Step 5685: {'lr': 9.466666666666667e-05, 'samples': 181920, 'steps': 355, 'loss/train': 6.7790398597717285} -09/20/2021 15:43:10 - INFO - __main__ - Step 5686: {'lr': 9.466666666666667e-05, 'samples': 181952, 'steps': 355, 'loss/train': 5.289785861968994} -09/20/2021 15:43:10 - INFO - __main__ - Step 5687: {'lr': 9.466666666666667e-05, 'samples': 181984, 'steps': 355, 'loss/train': 4.7890753746032715} -09/20/2021 15:43:11 - INFO - __main__ - Step 5688: {'lr': 9.466666666666667e-05, 'samples': 182016, 'steps': 355, 'loss/train': 6.233094215393066} -09/20/2021 15:43:12 - INFO - __main__ - Step 5689: {'lr': 9.466666666666667e-05, 'samples': 182048, 'steps': 355, 'loss/train': 5.094099044799805} -09/20/2021 15:43:13 - INFO - __main__ - Step 5690: {'lr': 9.466666666666667e-05, 'samples': 182080, 'steps': 355, 'loss/train': 5.675225734710693} -09/20/2021 15:43:13 - INFO - __main__ - Step 5691: {'lr': 9.466666666666667e-05, 'samples': 182112, 'steps': 355, 'loss/train': 5.214225769042969} -09/20/2021 15:43:14 - INFO - __main__ - Step 5692: {'lr': 9.466666666666667e-05, 'samples': 182144, 'steps': 355, 'loss/train': 6.041398048400879} -09/20/2021 15:43:15 - INFO - __main__ - Step 5693: {'lr': 9.466666666666667e-05, 'samples': 182176, 'steps': 355, 'loss/train': 5.734488010406494} -09/20/2021 15:43:16 - INFO - __main__ - Step 5694: {'lr': 9.466666666666667e-05, 'samples': 182208, 'steps': 355, 'loss/train': 4.5238847732543945} -09/20/2021 15:43:16 - INFO - __main__ - Step 5695: {'lr': 9.466666666666667e-05, 'samples': 182240, 'steps': 355, 'loss/train': 5.672013759613037} -09/20/2021 15:43:17 - INFO - __main__ - Step 5696: {'lr': 9.466666666666667e-05, 'samples': 182272, 'steps': 355, 'loss/train': 5.261446952819824} -09/20/2021 15:43:18 - INFO - __main__ - Step 5697: {'lr': 9.493333333333334e-05, 'samples': 182304, 'steps': 356, 'loss/train': 5.091126441955566} -09/20/2021 15:43:19 - INFO - __main__ - Step 5698: {'lr': 9.493333333333334e-05, 'samples': 182336, 'steps': 356, 'loss/train': 4.888518333435059} -09/20/2021 15:43:19 - INFO - __main__ - Step 5699: {'lr': 9.493333333333334e-05, 'samples': 182368, 'steps': 356, 'loss/train': 5.185174942016602} -09/20/2021 15:43:20 - INFO - __main__ - Step 5700: {'lr': 9.493333333333334e-05, 'samples': 182400, 'steps': 356, 'loss/train': 5.2123703956604} -09/20/2021 15:43:21 - INFO - __main__ - Step 5701: {'lr': 9.493333333333334e-05, 'samples': 182432, 'steps': 356, 'loss/train': 2.8831467628479004} -09/20/2021 15:43:22 - INFO - __main__ - Step 5702: {'lr': 9.493333333333334e-05, 'samples': 182464, 'steps': 356, 'loss/train': 2.7337443828582764} -09/20/2021 15:43:22 - INFO - __main__ - Step 5703: {'lr': 9.493333333333334e-05, 'samples': 182496, 'steps': 356, 'loss/train': 2.5218026638031006} -09/20/2021 15:43:23 - INFO - __main__ - Step 5704: {'lr': 9.493333333333334e-05, 'samples': 182528, 'steps': 356, 'loss/train': 2.992769479751587} -09/20/2021 15:43:24 - INFO - __main__ - Step 5705: {'lr': 9.493333333333334e-05, 'samples': 182560, 'steps': 356, 'loss/train': 2.5331101417541504} -09/20/2021 15:43:25 - INFO - __main__ - Step 5706: {'lr': 9.493333333333334e-05, 'samples': 182592, 'steps': 356, 'loss/train': 5.129531383514404} -09/20/2021 15:43:25 - INFO - __main__ - Step 5707: {'lr': 9.493333333333334e-05, 'samples': 182624, 'steps': 356, 'loss/train': 5.3639960289001465} -09/20/2021 15:43:26 - INFO - __main__ - Step 5708: {'lr': 9.493333333333334e-05, 'samples': 182656, 'steps': 356, 'loss/train': 5.911093711853027} -09/20/2021 15:43:27 - INFO - __main__ - Step 5709: {'lr': 9.493333333333334e-05, 'samples': 182688, 'steps': 356, 'loss/train': 5.334080696105957} -09/20/2021 15:43:28 - INFO - __main__ - Step 5710: {'lr': 9.493333333333334e-05, 'samples': 182720, 'steps': 356, 'loss/train': 4.821935653686523} -09/20/2021 15:43:28 - INFO - __main__ - Step 5711: {'lr': 9.493333333333334e-05, 'samples': 182752, 'steps': 356, 'loss/train': 2.982029914855957} -09/20/2021 15:43:29 - INFO - __main__ - Step 5712: {'lr': 9.493333333333334e-05, 'samples': 182784, 'steps': 356, 'loss/train': 4.61350154876709} -09/20/2021 15:43:30 - INFO - __main__ - Step 5713: {'lr': 9.52e-05, 'samples': 182816, 'steps': 357, 'loss/train': 5.670671463012695} -09/20/2021 15:43:31 - INFO - __main__ - Step 5714: {'lr': 9.52e-05, 'samples': 182848, 'steps': 357, 'loss/train': 6.074394226074219} -09/20/2021 15:43:32 - INFO - __main__ - Step 5715: {'lr': 9.52e-05, 'samples': 182880, 'steps': 357, 'loss/train': 5.062023162841797} -09/20/2021 15:43:33 - INFO - __main__ - Step 5716: {'lr': 9.52e-05, 'samples': 182912, 'steps': 357, 'loss/train': 5.4630255699157715} -09/20/2021 15:43:34 - INFO - __main__ - Step 5717: {'lr': 9.52e-05, 'samples': 182944, 'steps': 357, 'loss/train': 5.686028957366943} -09/20/2021 15:43:34 - INFO - __main__ - Step 5718: {'lr': 9.52e-05, 'samples': 182976, 'steps': 357, 'loss/train': 5.1090803146362305} -09/20/2021 15:43:35 - INFO - __main__ - Step 5719: {'lr': 9.52e-05, 'samples': 183008, 'steps': 357, 'loss/train': 4.310811996459961} -09/20/2021 15:43:36 - INFO - __main__ - Step 5720: {'lr': 9.52e-05, 'samples': 183040, 'steps': 357, 'loss/train': 6.54330587387085} -09/20/2021 15:43:37 - INFO - __main__ - Step 5721: {'lr': 9.52e-05, 'samples': 183072, 'steps': 357, 'loss/train': 6.288913726806641} -09/20/2021 15:43:37 - INFO - __main__ - Step 5722: {'lr': 9.52e-05, 'samples': 183104, 'steps': 357, 'loss/train': 5.196284770965576} -09/20/2021 15:43:38 - INFO - __main__ - Step 5723: {'lr': 9.52e-05, 'samples': 183136, 'steps': 357, 'loss/train': 4.689889430999756} -09/20/2021 15:43:39 - INFO - __main__ - Step 5724: {'lr': 9.52e-05, 'samples': 183168, 'steps': 357, 'loss/train': 4.53674840927124} -09/20/2021 15:43:40 - INFO - __main__ - Step 5725: {'lr': 9.52e-05, 'samples': 183200, 'steps': 357, 'loss/train': 5.116604804992676} -09/20/2021 15:43:40 - INFO - __main__ - Step 5726: {'lr': 9.52e-05, 'samples': 183232, 'steps': 357, 'loss/train': 5.0671563148498535} -09/20/2021 15:43:41 - INFO - __main__ - Step 5727: {'lr': 9.52e-05, 'samples': 183264, 'steps': 357, 'loss/train': 5.027673721313477} -09/20/2021 15:43:42 - INFO - __main__ - Step 5728: {'lr': 9.52e-05, 'samples': 183296, 'steps': 357, 'loss/train': 5.892348289489746} -09/20/2021 15:43:43 - INFO - __main__ - Step 5729: {'lr': 9.546666666666667e-05, 'samples': 183328, 'steps': 358, 'loss/train': 5.256833553314209} -09/20/2021 15:43:44 - INFO - __main__ - Step 5730: {'lr': 9.546666666666667e-05, 'samples': 183360, 'steps': 358, 'loss/train': 5.214798927307129} -09/20/2021 15:43:44 - INFO - __main__ - Step 5731: {'lr': 9.546666666666667e-05, 'samples': 183392, 'steps': 358, 'loss/train': 6.0174384117126465} -09/20/2021 15:43:45 - INFO - __main__ - Step 5732: {'lr': 9.546666666666667e-05, 'samples': 183424, 'steps': 358, 'loss/train': 5.038745880126953} -09/20/2021 15:43:46 - INFO - __main__ - Step 5733: {'lr': 9.546666666666667e-05, 'samples': 183456, 'steps': 358, 'loss/train': 5.926299095153809} -09/20/2021 15:43:47 - INFO - __main__ - Step 5734: {'lr': 9.546666666666667e-05, 'samples': 183488, 'steps': 358, 'loss/train': 5.01640510559082} -09/20/2021 15:43:47 - INFO - __main__ - Step 5735: {'lr': 9.546666666666667e-05, 'samples': 183520, 'steps': 358, 'loss/train': 5.784521579742432} -09/20/2021 15:43:48 - INFO - __main__ - Step 5736: {'lr': 9.546666666666667e-05, 'samples': 183552, 'steps': 358, 'loss/train': 5.035879135131836} -09/20/2021 15:43:49 - INFO - __main__ - Step 5737: {'lr': 9.546666666666667e-05, 'samples': 183584, 'steps': 358, 'loss/train': 5.25081205368042} -09/20/2021 15:43:50 - INFO - __main__ - Step 5738: {'lr': 9.546666666666667e-05, 'samples': 183616, 'steps': 358, 'loss/train': 5.182352542877197} -09/20/2021 15:43:50 - INFO - __main__ - Step 5739: {'lr': 9.546666666666667e-05, 'samples': 183648, 'steps': 358, 'loss/train': 4.672657012939453} -09/20/2021 15:43:51 - INFO - __main__ - Step 5740: {'lr': 9.546666666666667e-05, 'samples': 183680, 'steps': 358, 'loss/train': 5.350667476654053} -09/20/2021 15:43:52 - INFO - __main__ - Step 5741: {'lr': 9.546666666666667e-05, 'samples': 183712, 'steps': 358, 'loss/train': 5.035157680511475} -09/20/2021 15:43:53 - INFO - __main__ - Step 5742: {'lr': 9.546666666666667e-05, 'samples': 183744, 'steps': 358, 'loss/train': 5.0502848625183105} -09/20/2021 15:43:53 - INFO - __main__ - Step 5743: {'lr': 9.546666666666667e-05, 'samples': 183776, 'steps': 358, 'loss/train': 4.492086887359619} -09/20/2021 15:43:54 - INFO - __main__ - Step 5744: {'lr': 9.546666666666667e-05, 'samples': 183808, 'steps': 358, 'loss/train': 5.95350980758667} -09/20/2021 15:43:55 - INFO - __main__ - Step 5745: {'lr': 9.573333333333335e-05, 'samples': 183840, 'steps': 359, 'loss/train': 6.753674507141113} -09/20/2021 15:43:56 - INFO - __main__ - Step 5746: {'lr': 9.573333333333335e-05, 'samples': 183872, 'steps': 359, 'loss/train': 7.485476493835449} -09/20/2021 15:43:57 - INFO - __main__ - Step 5747: {'lr': 9.573333333333335e-05, 'samples': 183904, 'steps': 359, 'loss/train': 5.255486488342285} -09/20/2021 15:43:58 - INFO - __main__ - Step 5748: {'lr': 9.573333333333335e-05, 'samples': 183936, 'steps': 359, 'loss/train': 5.073253631591797} -09/20/2021 15:43:58 - INFO - __main__ - Step 5749: {'lr': 9.573333333333335e-05, 'samples': 183968, 'steps': 359, 'loss/train': 4.417145729064941} -09/20/2021 15:43:59 - INFO - __main__ - Step 5750: {'lr': 9.573333333333335e-05, 'samples': 184000, 'steps': 359, 'loss/train': 5.569635391235352} -09/20/2021 15:44:00 - INFO - __main__ - Step 5751: {'lr': 9.573333333333335e-05, 'samples': 184032, 'steps': 359, 'loss/train': 4.9120001792907715} -09/20/2021 15:44:01 - INFO - __main__ - Step 5752: {'lr': 9.573333333333335e-05, 'samples': 184064, 'steps': 359, 'loss/train': 4.878974437713623} -09/20/2021 15:44:01 - INFO - __main__ - Step 5753: {'lr': 9.573333333333335e-05, 'samples': 184096, 'steps': 359, 'loss/train': 5.667460918426514} -09/20/2021 15:44:02 - INFO - __main__ - Step 5754: {'lr': 9.573333333333335e-05, 'samples': 184128, 'steps': 359, 'loss/train': 5.790393829345703} -09/20/2021 15:44:03 - INFO - __main__ - Step 5755: {'lr': 9.573333333333335e-05, 'samples': 184160, 'steps': 359, 'loss/train': 5.845137119293213} -09/20/2021 15:44:04 - INFO - __main__ - Step 5756: {'lr': 9.573333333333335e-05, 'samples': 184192, 'steps': 359, 'loss/train': 5.265115261077881} -09/20/2021 15:44:04 - INFO - __main__ - Step 5757: {'lr': 9.573333333333335e-05, 'samples': 184224, 'steps': 359, 'loss/train': 4.982673645019531} -09/20/2021 15:44:05 - INFO - __main__ - Step 5758: {'lr': 9.573333333333335e-05, 'samples': 184256, 'steps': 359, 'loss/train': 6.164405822753906} -09/20/2021 15:44:06 - INFO - __main__ - Step 5759: {'lr': 9.573333333333335e-05, 'samples': 184288, 'steps': 359, 'loss/train': 5.355983734130859} -09/20/2021 15:44:07 - INFO - __main__ - Step 5760: {'lr': 9.573333333333335e-05, 'samples': 184320, 'steps': 359, 'loss/train': 5.488994121551514} -09/20/2021 15:44:08 - INFO - __main__ - Step 5761: {'lr': 9.6e-05, 'samples': 184352, 'steps': 360, 'loss/train': 5.6793928146362305} -09/20/2021 15:44:08 - INFO - __main__ - Step 5762: {'lr': 9.6e-05, 'samples': 184384, 'steps': 360, 'loss/train': 5.358819007873535} -09/20/2021 15:44:09 - INFO - __main__ - Step 5763: {'lr': 9.6e-05, 'samples': 184416, 'steps': 360, 'loss/train': 4.534496784210205} -09/20/2021 15:44:10 - INFO - __main__ - Step 5764: {'lr': 9.6e-05, 'samples': 184448, 'steps': 360, 'loss/train': 3.1907145977020264} -09/20/2021 15:44:11 - INFO - __main__ - Step 5765: {'lr': 9.6e-05, 'samples': 184480, 'steps': 360, 'loss/train': 5.79475212097168} -09/20/2021 15:44:11 - INFO - __main__ - Step 5766: {'lr': 9.6e-05, 'samples': 184512, 'steps': 360, 'loss/train': 5.229329586029053} -09/20/2021 15:44:12 - INFO - __main__ - Step 5767: {'lr': 9.6e-05, 'samples': 184544, 'steps': 360, 'loss/train': 5.433714389801025} -09/20/2021 15:44:13 - INFO - __main__ - Step 5768: {'lr': 9.6e-05, 'samples': 184576, 'steps': 360, 'loss/train': 5.363348960876465} -09/20/2021 15:44:14 - INFO - __main__ - Step 5769: {'lr': 9.6e-05, 'samples': 184608, 'steps': 360, 'loss/train': 6.241818428039551} -09/20/2021 15:44:14 - INFO - __main__ - Step 5770: {'lr': 9.6e-05, 'samples': 184640, 'steps': 360, 'loss/train': 5.047175407409668} -09/20/2021 15:44:15 - INFO - __main__ - Step 5771: {'lr': 9.6e-05, 'samples': 184672, 'steps': 360, 'loss/train': 4.4104437828063965} -09/20/2021 15:44:16 - INFO - __main__ - Step 5772: {'lr': 9.6e-05, 'samples': 184704, 'steps': 360, 'loss/train': 5.531053066253662} -09/20/2021 15:44:17 - INFO - __main__ - Step 5773: {'lr': 9.6e-05, 'samples': 184736, 'steps': 360, 'loss/train': 4.941449165344238} -09/20/2021 15:44:17 - INFO - __main__ - Step 5774: {'lr': 9.6e-05, 'samples': 184768, 'steps': 360, 'loss/train': 5.643054008483887} -09/20/2021 15:44:18 - INFO - __main__ - Step 5775: {'lr': 9.6e-05, 'samples': 184800, 'steps': 360, 'loss/train': 4.4953131675720215} -09/20/2021 15:44:19 - INFO - __main__ - Step 5776: {'lr': 9.6e-05, 'samples': 184832, 'steps': 360, 'loss/train': 5.568892955780029} -09/20/2021 15:44:20 - INFO - __main__ - Step 5777: {'lr': 9.626666666666667e-05, 'samples': 184864, 'steps': 361, 'loss/train': 5.417667388916016} -09/20/2021 15:44:21 - INFO - __main__ - Step 5778: {'lr': 9.626666666666667e-05, 'samples': 184896, 'steps': 361, 'loss/train': 6.624860763549805} -09/20/2021 15:44:22 - INFO - __main__ - Step 5779: {'lr': 9.626666666666667e-05, 'samples': 184928, 'steps': 361, 'loss/train': 5.288095474243164} -09/20/2021 15:44:23 - INFO - __main__ - Step 5780: {'lr': 9.626666666666667e-05, 'samples': 184960, 'steps': 361, 'loss/train': 4.780955791473389} -09/20/2021 15:44:23 - INFO - __main__ - Step 5781: {'lr': 9.626666666666667e-05, 'samples': 184992, 'steps': 361, 'loss/train': 4.857607364654541} -09/20/2021 15:44:24 - INFO - __main__ - Step 5782: {'lr': 9.626666666666667e-05, 'samples': 185024, 'steps': 361, 'loss/train': 5.637740135192871} -09/20/2021 15:44:25 - INFO - __main__ - Step 5783: {'lr': 9.626666666666667e-05, 'samples': 185056, 'steps': 361, 'loss/train': 4.551308631896973} -09/20/2021 15:44:26 - INFO - __main__ - Step 5784: {'lr': 9.626666666666667e-05, 'samples': 185088, 'steps': 361, 'loss/train': 5.310695648193359} -09/20/2021 15:44:26 - INFO - __main__ - Step 5785: {'lr': 9.626666666666667e-05, 'samples': 185120, 'steps': 361, 'loss/train': 5.769985675811768} -09/20/2021 15:44:27 - INFO - __main__ - Step 5786: {'lr': 9.626666666666667e-05, 'samples': 185152, 'steps': 361, 'loss/train': 4.679082870483398} -09/20/2021 15:44:28 - INFO - __main__ - Step 5787: {'lr': 9.626666666666667e-05, 'samples': 185184, 'steps': 361, 'loss/train': 5.777172565460205} -09/20/2021 15:44:29 - INFO - __main__ - Step 5788: {'lr': 9.626666666666667e-05, 'samples': 185216, 'steps': 361, 'loss/train': 5.9438371658325195} -09/20/2021 15:44:29 - INFO - __main__ - Step 5789: {'lr': 9.626666666666667e-05, 'samples': 185248, 'steps': 361, 'loss/train': 5.657427787780762} -09/20/2021 15:44:30 - INFO - __main__ - Step 5790: {'lr': 9.626666666666667e-05, 'samples': 185280, 'steps': 361, 'loss/train': 5.672704219818115} -09/20/2021 15:44:31 - INFO - __main__ - Step 5791: {'lr': 9.626666666666667e-05, 'samples': 185312, 'steps': 361, 'loss/train': 4.529938697814941} -09/20/2021 15:44:32 - INFO - __main__ - Step 5792: {'lr': 9.626666666666667e-05, 'samples': 185344, 'steps': 361, 'loss/train': 6.051026821136475} -09/20/2021 15:44:33 - INFO - __main__ - Step 5793: {'lr': 9.653333333333334e-05, 'samples': 185376, 'steps': 362, 'loss/train': 5.1762542724609375} -09/20/2021 15:44:33 - INFO - __main__ - Step 5794: {'lr': 9.653333333333334e-05, 'samples': 185408, 'steps': 362, 'loss/train': 4.965038776397705} -09/20/2021 15:44:34 - INFO - __main__ - Step 5795: {'lr': 9.653333333333334e-05, 'samples': 185440, 'steps': 362, 'loss/train': 5.530971050262451} -09/20/2021 15:44:35 - INFO - __main__ - Step 5796: {'lr': 9.653333333333334e-05, 'samples': 185472, 'steps': 362, 'loss/train': 5.194446563720703} -09/20/2021 15:44:36 - INFO - __main__ - Step 5797: {'lr': 9.653333333333334e-05, 'samples': 185504, 'steps': 362, 'loss/train': 5.085996150970459} -09/20/2021 15:44:36 - INFO - __main__ - Step 5798: {'lr': 9.653333333333334e-05, 'samples': 185536, 'steps': 362, 'loss/train': 4.479193210601807} -09/20/2021 15:44:37 - INFO - __main__ - Step 5799: {'lr': 9.653333333333334e-05, 'samples': 185568, 'steps': 362, 'loss/train': 3.1109232902526855} -09/20/2021 15:44:38 - INFO - __main__ - Step 5800: {'lr': 9.653333333333334e-05, 'samples': 185600, 'steps': 362, 'loss/train': 3.4219260215759277} -09/20/2021 15:44:39 - INFO - __main__ - Step 5801: {'lr': 9.653333333333334e-05, 'samples': 185632, 'steps': 362, 'loss/train': 2.818716049194336} -09/20/2021 15:44:39 - INFO - __main__ - Step 5802: {'lr': 9.653333333333334e-05, 'samples': 185664, 'steps': 362, 'loss/train': 5.246437072753906} -09/20/2021 15:44:40 - INFO - __main__ - Step 5803: {'lr': 9.653333333333334e-05, 'samples': 185696, 'steps': 362, 'loss/train': 6.38890266418457} -09/20/2021 15:44:41 - INFO - __main__ - Step 5804: {'lr': 9.653333333333334e-05, 'samples': 185728, 'steps': 362, 'loss/train': 4.204047203063965} -09/20/2021 15:44:42 - INFO - __main__ - Step 5805: {'lr': 9.653333333333334e-05, 'samples': 185760, 'steps': 362, 'loss/train': 5.842275619506836} -09/20/2021 15:44:42 - INFO - __main__ - Step 5806: {'lr': 9.653333333333334e-05, 'samples': 185792, 'steps': 362, 'loss/train': 5.572460651397705} -09/20/2021 15:44:44 - INFO - __main__ - Step 5807: {'lr': 9.653333333333334e-05, 'samples': 185824, 'steps': 362, 'loss/train': 5.31003475189209} -09/20/2021 15:44:45 - INFO - __main__ - Step 5808: {'lr': 9.653333333333334e-05, 'samples': 185856, 'steps': 362, 'loss/train': 4.420400142669678} -09/20/2021 15:44:45 - INFO - __main__ - Step 5809: {'lr': 9.680000000000001e-05, 'samples': 185888, 'steps': 363, 'loss/train': 4.117995738983154} -09/20/2021 15:44:46 - INFO - __main__ - Step 5810: {'lr': 9.680000000000001e-05, 'samples': 185920, 'steps': 363, 'loss/train': 4.375681400299072} -09/20/2021 15:44:47 - INFO - __main__ - Step 5811: {'lr': 9.680000000000001e-05, 'samples': 185952, 'steps': 363, 'loss/train': 4.359973907470703} -09/20/2021 15:44:48 - INFO - __main__ - Step 5812: {'lr': 9.680000000000001e-05, 'samples': 185984, 'steps': 363, 'loss/train': 6.111325263977051} -09/20/2021 15:44:48 - INFO - __main__ - Step 5813: {'lr': 9.680000000000001e-05, 'samples': 186016, 'steps': 363, 'loss/train': 5.089745044708252} -09/20/2021 15:44:49 - INFO - __main__ - Step 5814: {'lr': 9.680000000000001e-05, 'samples': 186048, 'steps': 363, 'loss/train': 5.182774066925049} -09/20/2021 15:44:50 - INFO - __main__ - Step 5815: {'lr': 9.680000000000001e-05, 'samples': 186080, 'steps': 363, 'loss/train': 2.3397321701049805} -09/20/2021 15:44:51 - INFO - __main__ - Step 5816: {'lr': 9.680000000000001e-05, 'samples': 186112, 'steps': 363, 'loss/train': 3.711796283721924} -09/20/2021 15:44:51 - INFO - __main__ - Step 5817: {'lr': 9.680000000000001e-05, 'samples': 186144, 'steps': 363, 'loss/train': 2.5479214191436768} -09/20/2021 15:44:52 - INFO - __main__ - Step 5818: {'lr': 9.680000000000001e-05, 'samples': 186176, 'steps': 363, 'loss/train': 2.4476191997528076} -09/20/2021 15:44:53 - INFO - __main__ - Step 5819: {'lr': 9.680000000000001e-05, 'samples': 186208, 'steps': 363, 'loss/train': 4.6217427253723145} -09/20/2021 15:44:54 - INFO - __main__ - Step 5820: {'lr': 9.680000000000001e-05, 'samples': 186240, 'steps': 363, 'loss/train': 5.356381893157959} -09/20/2021 15:44:54 - INFO - __main__ - Step 5821: {'lr': 9.680000000000001e-05, 'samples': 186272, 'steps': 363, 'loss/train': 2.641495943069458} -09/20/2021 15:44:55 - INFO - __main__ - Step 5822: {'lr': 9.680000000000001e-05, 'samples': 186304, 'steps': 363, 'loss/train': 4.579079627990723} -09/20/2021 15:44:56 - INFO - __main__ - Step 5823: {'lr': 9.680000000000001e-05, 'samples': 186336, 'steps': 363, 'loss/train': 2.7443554401397705} -09/20/2021 15:44:57 - INFO - __main__ - Step 5824: {'lr': 9.680000000000001e-05, 'samples': 186368, 'steps': 363, 'loss/train': 5.089821815490723} -09/20/2021 15:44:58 - INFO - __main__ - Step 5825: {'lr': 9.706666666666668e-05, 'samples': 186400, 'steps': 364, 'loss/train': 4.864007949829102} -09/20/2021 15:44:58 - INFO - __main__ - Step 5826: {'lr': 9.706666666666668e-05, 'samples': 186432, 'steps': 364, 'loss/train': 4.9144487380981445} -09/20/2021 15:44:59 - INFO - __main__ - Step 5827: {'lr': 9.706666666666668e-05, 'samples': 186464, 'steps': 364, 'loss/train': 8.061260223388672} -09/20/2021 15:45:00 - INFO - __main__ - Step 5828: {'lr': 9.706666666666668e-05, 'samples': 186496, 'steps': 364, 'loss/train': 8.553977012634277} -09/20/2021 15:45:01 - INFO - __main__ - Step 5829: {'lr': 9.706666666666668e-05, 'samples': 186528, 'steps': 364, 'loss/train': 8.883248329162598} -09/20/2021 15:45:01 - INFO - __main__ - Step 5830: {'lr': 9.706666666666668e-05, 'samples': 186560, 'steps': 364, 'loss/train': 5.495733737945557} -09/20/2021 15:45:02 - INFO - __main__ - Step 5831: {'lr': 9.706666666666668e-05, 'samples': 186592, 'steps': 364, 'loss/train': 4.9168701171875} -09/20/2021 15:45:03 - INFO - __main__ - Step 5832: {'lr': 9.706666666666668e-05, 'samples': 186624, 'steps': 364, 'loss/train': 4.869269371032715} -09/20/2021 15:45:04 - INFO - __main__ - Step 5833: {'lr': 9.706666666666668e-05, 'samples': 186656, 'steps': 364, 'loss/train': 7.109536647796631} -09/20/2021 15:45:04 - INFO - __main__ - Step 5834: {'lr': 9.706666666666668e-05, 'samples': 186688, 'steps': 364, 'loss/train': 5.173968315124512} -09/20/2021 15:45:05 - INFO - __main__ - Step 5835: {'lr': 9.706666666666668e-05, 'samples': 186720, 'steps': 364, 'loss/train': 4.87672233581543} -09/20/2021 15:45:06 - INFO - __main__ - Step 5836: {'lr': 9.706666666666668e-05, 'samples': 186752, 'steps': 364, 'loss/train': 7.588232517242432} -09/20/2021 15:45:07 - INFO - __main__ - Step 5837: {'lr': 9.706666666666668e-05, 'samples': 186784, 'steps': 364, 'loss/train': 5.298622131347656} -09/20/2021 15:45:07 - INFO - __main__ - Step 5838: {'lr': 9.706666666666668e-05, 'samples': 186816, 'steps': 364, 'loss/train': 5.294812202453613} -09/20/2021 15:45:09 - INFO - __main__ - Step 5839: {'lr': 9.706666666666668e-05, 'samples': 186848, 'steps': 364, 'loss/train': 5.348281383514404} -09/20/2021 15:45:09 - INFO - __main__ - Step 5840: {'lr': 9.706666666666668e-05, 'samples': 186880, 'steps': 364, 'loss/train': 5.116253852844238} -09/20/2021 15:45:10 - INFO - __main__ - Step 5841: {'lr': 9.733333333333335e-05, 'samples': 186912, 'steps': 365, 'loss/train': 6.285698413848877} -09/20/2021 15:45:11 - INFO - __main__ - Step 5842: {'lr': 9.733333333333335e-05, 'samples': 186944, 'steps': 365, 'loss/train': 5.175037384033203} -09/20/2021 15:45:12 - INFO - __main__ - Step 5843: {'lr': 9.733333333333335e-05, 'samples': 186976, 'steps': 365, 'loss/train': 5.198854923248291} -09/20/2021 15:45:13 - INFO - __main__ - Step 5844: {'lr': 9.733333333333335e-05, 'samples': 187008, 'steps': 365, 'loss/train': 4.824155807495117} -09/20/2021 15:45:13 - INFO - __main__ - Step 5845: {'lr': 9.733333333333335e-05, 'samples': 187040, 'steps': 365, 'loss/train': 5.146164894104004} -09/20/2021 15:45:14 - INFO - __main__ - Step 5846: {'lr': 9.733333333333335e-05, 'samples': 187072, 'steps': 365, 'loss/train': 6.057418346405029} -09/20/2021 15:45:15 - INFO - __main__ - Step 5847: {'lr': 9.733333333333335e-05, 'samples': 187104, 'steps': 365, 'loss/train': 1.244922399520874} -09/20/2021 15:45:16 - INFO - __main__ - Step 5848: {'lr': 9.733333333333335e-05, 'samples': 187136, 'steps': 365, 'loss/train': 5.275058746337891} -09/20/2021 15:45:16 - INFO - __main__ - Step 5849: {'lr': 9.733333333333335e-05, 'samples': 187168, 'steps': 365, 'loss/train': 4.833264350891113} -09/20/2021 15:45:17 - INFO - __main__ - Step 5850: {'lr': 9.733333333333335e-05, 'samples': 187200, 'steps': 365, 'loss/train': 4.81699800491333} -09/20/2021 15:45:18 - INFO - __main__ - Step 5851: {'lr': 9.733333333333335e-05, 'samples': 187232, 'steps': 365, 'loss/train': 5.9459147453308105} -09/20/2021 15:45:19 - INFO - __main__ - Step 5852: {'lr': 9.733333333333335e-05, 'samples': 187264, 'steps': 365, 'loss/train': 5.758338928222656} -09/20/2021 15:45:19 - INFO - __main__ - Step 5853: {'lr': 9.733333333333335e-05, 'samples': 187296, 'steps': 365, 'loss/train': 4.502868175506592} -09/20/2021 15:45:20 - INFO - __main__ - Step 5854: {'lr': 9.733333333333335e-05, 'samples': 187328, 'steps': 365, 'loss/train': 6.513943195343018} -09/20/2021 15:45:21 - INFO - __main__ - Step 5855: {'lr': 9.733333333333335e-05, 'samples': 187360, 'steps': 365, 'loss/train': 6.494300842285156} -09/20/2021 15:45:22 - INFO - __main__ - Step 5856: {'lr': 9.733333333333335e-05, 'samples': 187392, 'steps': 365, 'loss/train': 5.283069610595703} -09/20/2021 15:45:23 - INFO - __main__ - Step 5857: {'lr': 9.76e-05, 'samples': 187424, 'steps': 366, 'loss/train': 5.480412483215332} -09/20/2021 15:45:23 - INFO - __main__ - Step 5858: {'lr': 9.76e-05, 'samples': 187456, 'steps': 366, 'loss/train': 5.0783562660217285} -09/20/2021 15:45:24 - INFO - __main__ - Step 5859: {'lr': 9.76e-05, 'samples': 187488, 'steps': 366, 'loss/train': 5.382884502410889} -09/20/2021 15:45:25 - INFO - __main__ - Step 5860: {'lr': 9.76e-05, 'samples': 187520, 'steps': 366, 'loss/train': 5.546062469482422} -09/20/2021 15:45:26 - INFO - __main__ - Step 5861: {'lr': 9.76e-05, 'samples': 187552, 'steps': 366, 'loss/train': 2.6719088554382324} -09/20/2021 15:45:26 - INFO - __main__ - Step 5862: {'lr': 9.76e-05, 'samples': 187584, 'steps': 366, 'loss/train': 5.462378978729248} -09/20/2021 15:45:27 - INFO - __main__ - Step 5863: {'lr': 9.76e-05, 'samples': 187616, 'steps': 366, 'loss/train': 6.234832763671875} -09/20/2021 15:45:28 - INFO - __main__ - Step 5864: {'lr': 9.76e-05, 'samples': 187648, 'steps': 366, 'loss/train': 5.920791149139404} -09/20/2021 15:45:29 - INFO - __main__ - Step 5865: {'lr': 9.76e-05, 'samples': 187680, 'steps': 366, 'loss/train': 5.267902851104736} -09/20/2021 15:45:29 - INFO - __main__ - Step 5866: {'lr': 9.76e-05, 'samples': 187712, 'steps': 366, 'loss/train': 5.707048416137695} -09/20/2021 15:45:30 - INFO - __main__ - Step 5867: {'lr': 9.76e-05, 'samples': 187744, 'steps': 366, 'loss/train': 6.579422473907471} -09/20/2021 15:45:31 - INFO - __main__ - Step 5868: {'lr': 9.76e-05, 'samples': 187776, 'steps': 366, 'loss/train': 4.771958827972412} -09/20/2021 15:45:33 - INFO - __main__ - Step 5869: {'lr': 9.76e-05, 'samples': 187808, 'steps': 366, 'loss/train': 5.4213480949401855} -09/20/2021 15:45:33 - INFO - __main__ - Step 5870: {'lr': 9.76e-05, 'samples': 187840, 'steps': 366, 'loss/train': 5.279909133911133} -09/20/2021 15:45:34 - INFO - __main__ - Step 5871: {'lr': 9.76e-05, 'samples': 187872, 'steps': 366, 'loss/train': 5.013769149780273} -09/20/2021 15:45:35 - INFO - __main__ - Step 5872: {'lr': 9.76e-05, 'samples': 187904, 'steps': 366, 'loss/train': 5.469991207122803} -09/20/2021 15:45:36 - INFO - __main__ - Step 5873: {'lr': 9.786666666666667e-05, 'samples': 187936, 'steps': 367, 'loss/train': 5.886990070343018} -09/20/2021 15:45:36 - INFO - __main__ - Step 5874: {'lr': 9.786666666666667e-05, 'samples': 187968, 'steps': 367, 'loss/train': 5.337019443511963} -09/20/2021 15:45:37 - INFO - __main__ - Step 5875: {'lr': 9.786666666666667e-05, 'samples': 188000, 'steps': 367, 'loss/train': 4.9638142585754395} -09/20/2021 15:45:38 - INFO - __main__ - Step 5876: {'lr': 9.786666666666667e-05, 'samples': 188032, 'steps': 367, 'loss/train': 4.847799777984619} -09/20/2021 15:45:39 - INFO - __main__ - Step 5877: {'lr': 9.786666666666667e-05, 'samples': 188064, 'steps': 367, 'loss/train': 5.4103288650512695} -09/20/2021 15:45:39 - INFO - __main__ - Step 5878: {'lr': 9.786666666666667e-05, 'samples': 188096, 'steps': 367, 'loss/train': 6.11687707901001} -09/20/2021 15:45:40 - INFO - __main__ - Step 5879: {'lr': 9.786666666666667e-05, 'samples': 188128, 'steps': 367, 'loss/train': 3.983815908432007} -09/20/2021 15:45:41 - INFO - __main__ - Step 5880: {'lr': 9.786666666666667e-05, 'samples': 188160, 'steps': 367, 'loss/train': 5.388835906982422} -09/20/2021 15:45:42 - INFO - __main__ - Step 5881: {'lr': 9.786666666666667e-05, 'samples': 188192, 'steps': 367, 'loss/train': 5.107140064239502} -09/20/2021 15:45:42 - INFO - __main__ - Step 5882: {'lr': 9.786666666666667e-05, 'samples': 188224, 'steps': 367, 'loss/train': 4.947966575622559} -09/20/2021 15:45:43 - INFO - __main__ - Step 5883: {'lr': 9.786666666666667e-05, 'samples': 188256, 'steps': 367, 'loss/train': 5.052899360656738} -09/20/2021 15:45:44 - INFO - __main__ - Step 5884: {'lr': 9.786666666666667e-05, 'samples': 188288, 'steps': 367, 'loss/train': 4.454050064086914} -09/20/2021 15:45:45 - INFO - __main__ - Step 5885: {'lr': 9.786666666666667e-05, 'samples': 188320, 'steps': 367, 'loss/train': 5.954023361206055} -09/20/2021 15:45:45 - INFO - __main__ - Step 5886: {'lr': 9.786666666666667e-05, 'samples': 188352, 'steps': 367, 'loss/train': 4.89090633392334} -09/20/2021 15:45:46 - INFO - __main__ - Step 5887: {'lr': 9.786666666666667e-05, 'samples': 188384, 'steps': 367, 'loss/train': 6.11176061630249} -09/20/2021 15:45:47 - INFO - __main__ - Step 5888: {'lr': 9.786666666666667e-05, 'samples': 188416, 'steps': 367, 'loss/train': 4.9943389892578125} -09/20/2021 15:45:48 - INFO - __main__ - Step 5889: {'lr': 9.813333333333334e-05, 'samples': 188448, 'steps': 368, 'loss/train': 5.203802108764648} -09/20/2021 15:45:49 - INFO - __main__ - Step 5890: {'lr': 9.813333333333334e-05, 'samples': 188480, 'steps': 368, 'loss/train': 5.640717506408691} -09/20/2021 15:45:49 - INFO - __main__ - Step 5891: {'lr': 9.813333333333334e-05, 'samples': 188512, 'steps': 368, 'loss/train': 4.434488296508789} -09/20/2021 15:45:50 - INFO - __main__ - Step 5892: {'lr': 9.813333333333334e-05, 'samples': 188544, 'steps': 368, 'loss/train': 5.254718780517578} -09/20/2021 15:45:51 - INFO - __main__ - Step 5893: {'lr': 9.813333333333334e-05, 'samples': 188576, 'steps': 368, 'loss/train': 4.750726699829102} -09/20/2021 15:45:52 - INFO - __main__ - Step 5894: {'lr': 9.813333333333334e-05, 'samples': 188608, 'steps': 368, 'loss/train': 5.560751914978027} -09/20/2021 15:45:52 - INFO - __main__ - Step 5895: {'lr': 9.813333333333334e-05, 'samples': 188640, 'steps': 368, 'loss/train': 4.405080318450928} -09/20/2021 15:45:53 - INFO - __main__ - Step 5896: {'lr': 9.813333333333334e-05, 'samples': 188672, 'steps': 368, 'loss/train': 5.8132548332214355} -09/20/2021 15:45:54 - INFO - __main__ - Step 5897: {'lr': 9.813333333333334e-05, 'samples': 188704, 'steps': 368, 'loss/train': 4.229068756103516} -09/20/2021 15:45:55 - INFO - __main__ - Step 5898: {'lr': 9.813333333333334e-05, 'samples': 188736, 'steps': 368, 'loss/train': 6.278164386749268} -09/20/2021 15:45:55 - INFO - __main__ - Step 5899: {'lr': 9.813333333333334e-05, 'samples': 188768, 'steps': 368, 'loss/train': 6.142221927642822} -09/20/2021 15:45:56 - INFO - __main__ - Step 5900: {'lr': 9.813333333333334e-05, 'samples': 188800, 'steps': 368, 'loss/train': 6.0823073387146} -09/20/2021 15:45:57 - INFO - __main__ - Step 5901: {'lr': 9.813333333333334e-05, 'samples': 188832, 'steps': 368, 'loss/train': 6.667386531829834} -09/20/2021 15:45:58 - INFO - __main__ - Step 5902: {'lr': 9.813333333333334e-05, 'samples': 188864, 'steps': 368, 'loss/train': 5.394545555114746} -09/20/2021 15:45:59 - INFO - __main__ - Step 5903: {'lr': 9.813333333333334e-05, 'samples': 188896, 'steps': 368, 'loss/train': 5.255876541137695} -09/20/2021 15:46:00 - INFO - __main__ - Step 5904: {'lr': 9.813333333333334e-05, 'samples': 188928, 'steps': 368, 'loss/train': 6.175190448760986} -09/20/2021 15:46:01 - INFO - __main__ - Step 5905: {'lr': 9.84e-05, 'samples': 188960, 'steps': 369, 'loss/train': 5.050478458404541} -09/20/2021 15:46:01 - INFO - __main__ - Step 5906: {'lr': 9.84e-05, 'samples': 188992, 'steps': 369, 'loss/train': 5.604061603546143} -09/20/2021 15:46:02 - INFO - __main__ - Step 5907: {'lr': 9.84e-05, 'samples': 189024, 'steps': 369, 'loss/train': 5.885441303253174} -09/20/2021 15:46:03 - INFO - __main__ - Step 5908: {'lr': 9.84e-05, 'samples': 189056, 'steps': 369, 'loss/train': 5.288589954376221} -09/20/2021 15:46:04 - INFO - __main__ - Step 5909: {'lr': 9.84e-05, 'samples': 189088, 'steps': 369, 'loss/train': 4.787325859069824} -09/20/2021 15:46:04 - INFO - __main__ - Step 5910: {'lr': 9.84e-05, 'samples': 189120, 'steps': 369, 'loss/train': 5.899075984954834} -09/20/2021 15:46:05 - INFO - __main__ - Step 5911: {'lr': 9.84e-05, 'samples': 189152, 'steps': 369, 'loss/train': 6.227932453155518} -09/20/2021 15:46:06 - INFO - __main__ - Step 5912: {'lr': 9.84e-05, 'samples': 189184, 'steps': 369, 'loss/train': 5.2233195304870605} -09/20/2021 15:46:07 - INFO - __main__ - Step 5913: {'lr': 9.84e-05, 'samples': 189216, 'steps': 369, 'loss/train': 5.615755558013916} -09/20/2021 15:46:07 - INFO - __main__ - Step 5914: {'lr': 9.84e-05, 'samples': 189248, 'steps': 369, 'loss/train': 5.808330535888672} -09/20/2021 15:46:08 - INFO - __main__ - Step 5915: {'lr': 9.84e-05, 'samples': 189280, 'steps': 369, 'loss/train': 5.952569961547852} -09/20/2021 15:46:09 - INFO - __main__ - Step 5916: {'lr': 9.84e-05, 'samples': 189312, 'steps': 369, 'loss/train': 6.874939918518066} -09/20/2021 15:46:10 - INFO - __main__ - Step 5917: {'lr': 9.84e-05, 'samples': 189344, 'steps': 369, 'loss/train': 5.135202407836914} -09/20/2021 15:46:10 - INFO - __main__ - Step 5918: {'lr': 9.84e-05, 'samples': 189376, 'steps': 369, 'loss/train': 5.164813041687012} -09/20/2021 15:46:11 - INFO - __main__ - Step 5919: {'lr': 9.84e-05, 'samples': 189408, 'steps': 369, 'loss/train': 4.354457855224609} -09/20/2021 15:46:12 - INFO - __main__ - Step 5920: {'lr': 9.84e-05, 'samples': 189440, 'steps': 369, 'loss/train': 5.842540740966797} -09/20/2021 15:46:13 - INFO - __main__ - Step 5921: {'lr': 9.866666666666668e-05, 'samples': 189472, 'steps': 370, 'loss/train': 5.561306476593018} -09/20/2021 15:46:13 - INFO - __main__ - Step 5922: {'lr': 9.866666666666668e-05, 'samples': 189504, 'steps': 370, 'loss/train': 5.040521144866943} -09/20/2021 15:46:14 - INFO - __main__ - Step 5923: {'lr': 9.866666666666668e-05, 'samples': 189536, 'steps': 370, 'loss/train': 4.9681291580200195} -09/20/2021 15:46:15 - INFO - __main__ - Step 5924: {'lr': 9.866666666666668e-05, 'samples': 189568, 'steps': 370, 'loss/train': 6.828869819641113} -09/20/2021 15:46:16 - INFO - __main__ - Step 5925: {'lr': 9.866666666666668e-05, 'samples': 189600, 'steps': 370, 'loss/train': 5.448275089263916} -09/20/2021 15:46:16 - INFO - __main__ - Step 5926: {'lr': 9.866666666666668e-05, 'samples': 189632, 'steps': 370, 'loss/train': 5.057938098907471} -09/20/2021 15:46:17 - INFO - __main__ - Step 5927: {'lr': 9.866666666666668e-05, 'samples': 189664, 'steps': 370, 'loss/train': 4.913153171539307} -09/20/2021 15:46:18 - INFO - __main__ - Step 5928: {'lr': 9.866666666666668e-05, 'samples': 189696, 'steps': 370, 'loss/train': 5.319303035736084} -09/20/2021 15:46:19 - INFO - __main__ - Step 5929: {'lr': 9.866666666666668e-05, 'samples': 189728, 'steps': 370, 'loss/train': 4.937519550323486} -09/20/2021 15:46:19 - INFO - __main__ - Step 5930: {'lr': 9.866666666666668e-05, 'samples': 189760, 'steps': 370, 'loss/train': 5.610849857330322} -09/20/2021 15:46:20 - INFO - __main__ - Step 5931: {'lr': 9.866666666666668e-05, 'samples': 189792, 'steps': 370, 'loss/train': 3.6287174224853516} -09/20/2021 15:46:22 - INFO - __main__ - Step 5932: {'lr': 9.866666666666668e-05, 'samples': 189824, 'steps': 370, 'loss/train': 3.410391330718994} -09/20/2021 15:46:23 - INFO - __main__ - Step 5933: {'lr': 9.866666666666668e-05, 'samples': 189856, 'steps': 370, 'loss/train': 5.452162265777588} -09/20/2021 15:46:23 - INFO - __main__ - Step 5934: {'lr': 9.866666666666668e-05, 'samples': 189888, 'steps': 370, 'loss/train': 5.22625207901001} -09/20/2021 15:46:24 - INFO - __main__ - Step 5935: {'lr': 9.866666666666668e-05, 'samples': 189920, 'steps': 370, 'loss/train': 6.325603008270264} -09/20/2021 15:46:25 - INFO - __main__ - Step 5936: {'lr': 9.866666666666668e-05, 'samples': 189952, 'steps': 370, 'loss/train': 5.503579139709473} -09/20/2021 15:46:26 - INFO - __main__ - Step 5937: {'lr': 9.893333333333333e-05, 'samples': 189984, 'steps': 371, 'loss/train': 5.701339244842529} -09/20/2021 15:46:27 - INFO - __main__ - Step 5938: {'lr': 9.893333333333333e-05, 'samples': 190016, 'steps': 371, 'loss/train': 5.820974349975586} -09/20/2021 15:46:27 - INFO - __main__ - Step 5939: {'lr': 9.893333333333333e-05, 'samples': 190048, 'steps': 371, 'loss/train': 4.870793342590332} -09/20/2021 15:46:28 - INFO - __main__ - Step 5940: {'lr': 9.893333333333333e-05, 'samples': 190080, 'steps': 371, 'loss/train': 5.333955764770508} -09/20/2021 15:46:29 - INFO - __main__ - Step 5941: {'lr': 9.893333333333333e-05, 'samples': 190112, 'steps': 371, 'loss/train': 4.337048053741455} -09/20/2021 15:46:30 - INFO - __main__ - Step 5942: {'lr': 9.893333333333333e-05, 'samples': 190144, 'steps': 371, 'loss/train': 5.930741310119629} -09/20/2021 15:46:30 - INFO - __main__ - Step 5943: {'lr': 9.893333333333333e-05, 'samples': 190176, 'steps': 371, 'loss/train': 6.876955032348633} -09/20/2021 15:46:31 - INFO - __main__ - Step 5944: {'lr': 9.893333333333333e-05, 'samples': 190208, 'steps': 371, 'loss/train': 6.968448162078857} -09/20/2021 15:46:32 - INFO - __main__ - Step 5945: {'lr': 9.893333333333333e-05, 'samples': 190240, 'steps': 371, 'loss/train': 6.9425458908081055} -09/20/2021 15:46:33 - INFO - __main__ - Step 5946: {'lr': 9.893333333333333e-05, 'samples': 190272, 'steps': 371, 'loss/train': 6.858020305633545} -09/20/2021 15:46:33 - INFO - __main__ - Step 5947: {'lr': 9.893333333333333e-05, 'samples': 190304, 'steps': 371, 'loss/train': 7.7387309074401855} -09/20/2021 15:46:34 - INFO - __main__ - Step 5948: {'lr': 9.893333333333333e-05, 'samples': 190336, 'steps': 371, 'loss/train': 6.962184429168701} -09/20/2021 15:46:35 - INFO - __main__ - Step 5949: {'lr': 9.893333333333333e-05, 'samples': 190368, 'steps': 371, 'loss/train': 6.982465744018555} -09/20/2021 15:46:36 - INFO - __main__ - Step 5950: {'lr': 9.893333333333333e-05, 'samples': 190400, 'steps': 371, 'loss/train': 6.887677192687988} -09/20/2021 15:46:36 - INFO - __main__ - Step 5951: {'lr': 9.893333333333333e-05, 'samples': 190432, 'steps': 371, 'loss/train': 6.889347553253174} -09/20/2021 15:46:37 - INFO - __main__ - Step 5952: {'lr': 9.893333333333333e-05, 'samples': 190464, 'steps': 371, 'loss/train': 6.988802433013916} -09/20/2021 15:46:38 - INFO - __main__ - Step 5953: {'lr': 9.92e-05, 'samples': 190496, 'steps': 372, 'loss/train': 7.259624481201172} -09/20/2021 15:46:39 - INFO - __main__ - Step 5954: {'lr': 9.92e-05, 'samples': 190528, 'steps': 372, 'loss/train': 7.111927509307861} -09/20/2021 15:46:39 - INFO - __main__ - Step 5955: {'lr': 9.92e-05, 'samples': 190560, 'steps': 372, 'loss/train': 5.967763900756836} -09/20/2021 15:46:40 - INFO - __main__ - Step 5956: {'lr': 9.92e-05, 'samples': 190592, 'steps': 372, 'loss/train': 5.683143615722656} -09/20/2021 15:46:41 - INFO - __main__ - Step 5957: {'lr': 9.92e-05, 'samples': 190624, 'steps': 372, 'loss/train': 5.621729373931885} -09/20/2021 15:46:42 - INFO - __main__ - Step 5958: {'lr': 9.92e-05, 'samples': 190656, 'steps': 372, 'loss/train': 4.0822834968566895} -09/20/2021 15:46:42 - INFO - __main__ - Step 5959: {'lr': 9.92e-05, 'samples': 190688, 'steps': 372, 'loss/train': 4.934310436248779} -09/20/2021 15:46:43 - INFO - __main__ - Step 5960: {'lr': 9.92e-05, 'samples': 190720, 'steps': 372, 'loss/train': 4.881924152374268} -09/20/2021 15:46:44 - INFO - __main__ - Step 5961: {'lr': 9.92e-05, 'samples': 190752, 'steps': 372, 'loss/train': 5.942986488342285} -09/20/2021 15:46:45 - INFO - __main__ - Step 5962: {'lr': 9.92e-05, 'samples': 190784, 'steps': 372, 'loss/train': 4.603703022003174} -09/20/2021 15:46:45 - INFO - __main__ - Step 5963: {'lr': 9.92e-05, 'samples': 190816, 'steps': 372, 'loss/train': 5.2580156326293945} -09/20/2021 15:46:46 - INFO - __main__ - Step 5964: {'lr': 9.92e-05, 'samples': 190848, 'steps': 372, 'loss/train': 6.329211711883545} -09/20/2021 15:46:47 - INFO - __main__ - Step 5965: {'lr': 9.92e-05, 'samples': 190880, 'steps': 372, 'loss/train': 5.674756050109863} -09/20/2021 15:46:48 - INFO - __main__ - Step 5966: {'lr': 9.92e-05, 'samples': 190912, 'steps': 372, 'loss/train': 6.012346267700195} -09/20/2021 15:46:48 - INFO - __main__ - Step 5967: {'lr': 9.92e-05, 'samples': 190944, 'steps': 372, 'loss/train': 7.228067398071289} -09/20/2021 15:46:49 - INFO - __main__ - Step 5968: {'lr': 9.92e-05, 'samples': 190976, 'steps': 372, 'loss/train': 5.5510640144348145} -09/20/2021 15:46:50 - INFO - __main__ - Step 5969: {'lr': 9.946666666666668e-05, 'samples': 191008, 'steps': 373, 'loss/train': 5.274379730224609} -09/20/2021 15:46:51 - INFO - __main__ - Step 5970: {'lr': 9.946666666666668e-05, 'samples': 191040, 'steps': 373, 'loss/train': 5.028403282165527} -09/20/2021 15:46:52 - INFO - __main__ - Step 5971: {'lr': 9.946666666666668e-05, 'samples': 191072, 'steps': 373, 'loss/train': 5.13372802734375} -09/20/2021 15:46:53 - INFO - __main__ - Step 5972: {'lr': 9.946666666666668e-05, 'samples': 191104, 'steps': 373, 'loss/train': 4.644721031188965} -09/20/2021 15:46:54 - INFO - __main__ - Step 5973: {'lr': 9.946666666666668e-05, 'samples': 191136, 'steps': 373, 'loss/train': 4.6556878089904785} -09/20/2021 15:46:54 - INFO - __main__ - Step 5974: {'lr': 9.946666666666668e-05, 'samples': 191168, 'steps': 373, 'loss/train': 5.04736328125} -09/20/2021 15:46:55 - INFO - __main__ - Step 5975: {'lr': 9.946666666666668e-05, 'samples': 191200, 'steps': 373, 'loss/train': 5.8285064697265625} -09/20/2021 15:46:56 - INFO - __main__ - Step 5976: {'lr': 9.946666666666668e-05, 'samples': 191232, 'steps': 373, 'loss/train': 4.878609657287598} -09/20/2021 15:46:57 - INFO - __main__ - Step 5977: {'lr': 9.946666666666668e-05, 'samples': 191264, 'steps': 373, 'loss/train': 5.332126617431641} -09/20/2021 15:46:57 - INFO - __main__ - Step 5978: {'lr': 9.946666666666668e-05, 'samples': 191296, 'steps': 373, 'loss/train': 5.869365215301514} -09/20/2021 15:46:58 - INFO - __main__ - Step 5979: {'lr': 9.946666666666668e-05, 'samples': 191328, 'steps': 373, 'loss/train': 5.005349159240723} -09/20/2021 15:46:59 - INFO - __main__ - Step 5980: {'lr': 9.946666666666668e-05, 'samples': 191360, 'steps': 373, 'loss/train': 6.086219787597656} -09/20/2021 15:47:00 - INFO - __main__ - Step 5981: {'lr': 9.946666666666668e-05, 'samples': 191392, 'steps': 373, 'loss/train': 4.52787446975708} -09/20/2021 15:47:00 - INFO - __main__ - Step 5982: {'lr': 9.946666666666668e-05, 'samples': 191424, 'steps': 373, 'loss/train': 5.008665561676025} -09/20/2021 15:47:01 - INFO - __main__ - Step 5983: {'lr': 9.946666666666668e-05, 'samples': 191456, 'steps': 373, 'loss/train': 5.517675399780273} -09/20/2021 15:47:02 - INFO - __main__ - Step 5984: {'lr': 9.946666666666668e-05, 'samples': 191488, 'steps': 373, 'loss/train': 4.8827056884765625} -09/20/2021 15:47:03 - INFO - __main__ - Step 5985: {'lr': 9.973333333333334e-05, 'samples': 191520, 'steps': 374, 'loss/train': 3.0746335983276367} -09/20/2021 15:47:03 - INFO - __main__ - Step 5986: {'lr': 9.973333333333334e-05, 'samples': 191552, 'steps': 374, 'loss/train': 5.229404449462891} -09/20/2021 15:47:04 - INFO - __main__ - Step 5987: {'lr': 9.973333333333334e-05, 'samples': 191584, 'steps': 374, 'loss/train': 3.4257190227508545} -09/20/2021 15:47:05 - INFO - __main__ - Step 5988: {'lr': 9.973333333333334e-05, 'samples': 191616, 'steps': 374, 'loss/train': 5.492071628570557} -09/20/2021 15:47:06 - INFO - __main__ - Step 5989: {'lr': 9.973333333333334e-05, 'samples': 191648, 'steps': 374, 'loss/train': 4.9915452003479} -09/20/2021 15:47:06 - INFO - __main__ - Step 5990: {'lr': 9.973333333333334e-05, 'samples': 191680, 'steps': 374, 'loss/train': 6.091172695159912} -09/20/2021 15:47:07 - INFO - __main__ - Step 5991: {'lr': 9.973333333333334e-05, 'samples': 191712, 'steps': 374, 'loss/train': 4.869424343109131} -09/20/2021 15:47:08 - INFO - __main__ - Step 5992: {'lr': 9.973333333333334e-05, 'samples': 191744, 'steps': 374, 'loss/train': 4.555848598480225} -09/20/2021 15:47:09 - INFO - __main__ - Step 5993: {'lr': 9.973333333333334e-05, 'samples': 191776, 'steps': 374, 'loss/train': 4.700955390930176} -09/20/2021 15:47:09 - INFO - __main__ - Step 5994: {'lr': 9.973333333333334e-05, 'samples': 191808, 'steps': 374, 'loss/train': 4.87289571762085} -09/20/2021 15:47:10 - INFO - __main__ - Step 5995: {'lr': 9.973333333333334e-05, 'samples': 191840, 'steps': 374, 'loss/train': 5.23130989074707} -09/20/2021 15:47:11 - INFO - __main__ - Step 5996: {'lr': 9.973333333333334e-05, 'samples': 191872, 'steps': 374, 'loss/train': 6.113896369934082} -09/20/2021 15:47:12 - INFO - __main__ - Step 5997: {'lr': 9.973333333333334e-05, 'samples': 191904, 'steps': 374, 'loss/train': 4.953559875488281} -09/20/2021 15:47:12 - INFO - __main__ - Step 5998: {'lr': 9.973333333333334e-05, 'samples': 191936, 'steps': 374, 'loss/train': 5.590534210205078} -09/20/2021 15:47:13 - INFO - __main__ - Step 5999: {'lr': 9.973333333333334e-05, 'samples': 191968, 'steps': 374, 'loss/train': 4.628453731536865} -09/20/2021 15:47:14 - INFO - __main__ - Step 6000: {'lr': 9.973333333333334e-05, 'samples': 192000, 'steps': 374, 'loss/train': 4.975855827331543} -09/20/2021 15:47:15 - INFO - __main__ - Step 6001: {'lr': 0.0001, 'samples': 192032, 'steps': 375, 'loss/train': 5.733121395111084} -09/20/2021 15:47:16 - INFO - __main__ - Step 6002: {'lr': 0.0001, 'samples': 192064, 'steps': 375, 'loss/train': 5.325373649597168} -09/20/2021 15:47:17 - INFO - __main__ - Step 6003: {'lr': 0.0001, 'samples': 192096, 'steps': 375, 'loss/train': 6.471938610076904} -09/20/2021 15:47:18 - INFO - __main__ - Step 6004: {'lr': 0.0001, 'samples': 192128, 'steps': 375, 'loss/train': 5.345799446105957} -09/20/2021 15:47:18 - INFO - __main__ - Step 6005: {'lr': 0.0001, 'samples': 192160, 'steps': 375, 'loss/train': 5.5114922523498535} -09/20/2021 15:47:19 - INFO - __main__ - Step 6006: {'lr': 0.0001, 'samples': 192192, 'steps': 375, 'loss/train': 5.1240081787109375} -09/20/2021 15:47:20 - INFO - __main__ - Step 6007: {'lr': 0.0001, 'samples': 192224, 'steps': 375, 'loss/train': 5.198154449462891} -09/20/2021 15:47:21 - INFO - __main__ - Step 6008: {'lr': 0.0001, 'samples': 192256, 'steps': 375, 'loss/train': 5.125683307647705} -09/20/2021 15:47:21 - INFO - __main__ - Step 6009: {'lr': 0.0001, 'samples': 192288, 'steps': 375, 'loss/train': 6.01994514465332} -09/20/2021 15:47:22 - INFO - __main__ - Step 6010: {'lr': 0.0001, 'samples': 192320, 'steps': 375, 'loss/train': 5.328632354736328} -09/20/2021 15:47:23 - INFO - __main__ - Step 6011: {'lr': 0.0001, 'samples': 192352, 'steps': 375, 'loss/train': 5.044973373413086} -09/20/2021 15:47:24 - INFO - __main__ - Step 6012: {'lr': 0.0001, 'samples': 192384, 'steps': 375, 'loss/train': 5.307803153991699} -09/20/2021 15:47:24 - INFO - __main__ - Step 6013: {'lr': 0.0001, 'samples': 192416, 'steps': 375, 'loss/train': 4.943833827972412} -09/20/2021 15:47:25 - INFO - __main__ - Step 6014: {'lr': 0.0001, 'samples': 192448, 'steps': 375, 'loss/train': 4.9387617111206055} -09/20/2021 15:47:26 - INFO - __main__ - Step 6015: {'lr': 0.0001, 'samples': 192480, 'steps': 375, 'loss/train': 5.478773593902588} -09/20/2021 15:47:27 - INFO - __main__ - Step 6016: {'lr': 0.0001, 'samples': 192512, 'steps': 375, 'loss/train': 5.289918899536133} -09/20/2021 15:47:28 - INFO - __main__ - Step 6017: {'lr': 0.00010026666666666666, 'samples': 192544, 'steps': 376, 'loss/train': 5.727816104888916} -09/20/2021 15:47:28 - INFO - __main__ - Step 6018: {'lr': 0.00010026666666666666, 'samples': 192576, 'steps': 376, 'loss/train': 5.283658504486084} -09/20/2021 15:47:29 - INFO - __main__ - Step 6019: {'lr': 0.00010026666666666666, 'samples': 192608, 'steps': 376, 'loss/train': 5.025421619415283} -09/20/2021 15:47:30 - INFO - __main__ - Step 6020: {'lr': 0.00010026666666666666, 'samples': 192640, 'steps': 376, 'loss/train': 5.300779819488525} -09/20/2021 15:47:31 - INFO - __main__ - Step 6021: {'lr': 0.00010026666666666666, 'samples': 192672, 'steps': 376, 'loss/train': 4.851236343383789} -09/20/2021 15:47:31 - INFO - __main__ - Step 6022: {'lr': 0.00010026666666666666, 'samples': 192704, 'steps': 376, 'loss/train': 4.904393672943115} -09/20/2021 15:47:32 - INFO - __main__ - Step 6023: {'lr': 0.00010026666666666666, 'samples': 192736, 'steps': 376, 'loss/train': 6.123940944671631} -09/20/2021 15:47:33 - INFO - __main__ - Step 6024: {'lr': 0.00010026666666666666, 'samples': 192768, 'steps': 376, 'loss/train': 5.748961925506592} -09/20/2021 15:47:34 - INFO - __main__ - Step 6025: {'lr': 0.00010026666666666666, 'samples': 192800, 'steps': 376, 'loss/train': 5.045909404754639} -09/20/2021 15:47:34 - INFO - __main__ - Step 6026: {'lr': 0.00010026666666666666, 'samples': 192832, 'steps': 376, 'loss/train': 6.087928771972656} -09/20/2021 15:47:35 - INFO - __main__ - Step 6027: {'lr': 0.00010026666666666666, 'samples': 192864, 'steps': 376, 'loss/train': 5.652730941772461} -09/20/2021 15:47:36 - INFO - __main__ - Step 6028: {'lr': 0.00010026666666666666, 'samples': 192896, 'steps': 376, 'loss/train': 5.72726583480835} -09/20/2021 15:47:37 - INFO - __main__ - Step 6029: {'lr': 0.00010026666666666666, 'samples': 192928, 'steps': 376, 'loss/train': 3.9474070072174072} -09/20/2021 15:47:37 - INFO - __main__ - Step 6030: {'lr': 0.00010026666666666666, 'samples': 192960, 'steps': 376, 'loss/train': 5.246128559112549} -09/20/2021 15:47:39 - INFO - __main__ - Step 6031: {'lr': 0.00010026666666666666, 'samples': 192992, 'steps': 376, 'loss/train': 5.353104114532471} -09/20/2021 15:47:40 - INFO - __main__ - Step 6032: {'lr': 0.00010026666666666666, 'samples': 193024, 'steps': 376, 'loss/train': 4.88531494140625} -09/20/2021 15:47:41 - INFO - __main__ - Step 6033: {'lr': 0.00010053333333333334, 'samples': 193056, 'steps': 377, 'loss/train': 4.301018238067627} -09/20/2021 15:47:41 - INFO - __main__ - Step 6034: {'lr': 0.00010053333333333334, 'samples': 193088, 'steps': 377, 'loss/train': 5.479100227355957} -09/20/2021 15:47:42 - INFO - __main__ - Step 6035: {'lr': 0.00010053333333333334, 'samples': 193120, 'steps': 377, 'loss/train': 4.849815368652344} -09/20/2021 15:47:43 - INFO - __main__ - Step 6036: {'lr': 0.00010053333333333334, 'samples': 193152, 'steps': 377, 'loss/train': 4.871247291564941} -09/20/2021 15:47:44 - INFO - __main__ - Step 6037: {'lr': 0.00010053333333333334, 'samples': 193184, 'steps': 377, 'loss/train': 4.7861809730529785} -09/20/2021 15:47:44 - INFO - __main__ - Step 6038: {'lr': 0.00010053333333333334, 'samples': 193216, 'steps': 377, 'loss/train': 4.929915428161621} -09/20/2021 15:47:45 - INFO - __main__ - Step 6039: {'lr': 0.00010053333333333334, 'samples': 193248, 'steps': 377, 'loss/train': 7.012317180633545} -09/20/2021 15:47:46 - INFO - __main__ - Step 6040: {'lr': 0.00010053333333333334, 'samples': 193280, 'steps': 377, 'loss/train': 5.411402702331543} -09/20/2021 15:47:47 - INFO - __main__ - Step 6041: {'lr': 0.00010053333333333334, 'samples': 193312, 'steps': 377, 'loss/train': 5.2774152755737305} -09/20/2021 15:47:47 - INFO - __main__ - Step 6042: {'lr': 0.00010053333333333334, 'samples': 193344, 'steps': 377, 'loss/train': 4.697407245635986} -09/20/2021 15:47:48 - INFO - __main__ - Step 6043: {'lr': 0.00010053333333333334, 'samples': 193376, 'steps': 377, 'loss/train': 5.117120265960693} -09/20/2021 15:47:49 - INFO - __main__ - Step 6044: {'lr': 0.00010053333333333334, 'samples': 193408, 'steps': 377, 'loss/train': 4.2448015213012695} -09/20/2021 15:47:50 - INFO - __main__ - Step 6045: {'lr': 0.00010053333333333334, 'samples': 193440, 'steps': 377, 'loss/train': 4.252785682678223} -09/20/2021 15:47:50 - INFO - __main__ - Step 6046: {'lr': 0.00010053333333333334, 'samples': 193472, 'steps': 377, 'loss/train': 4.554966449737549} -09/20/2021 15:47:51 - INFO - __main__ - Step 6047: {'lr': 0.00010053333333333334, 'samples': 193504, 'steps': 377, 'loss/train': 5.715235233306885} -09/20/2021 15:47:52 - INFO - __main__ - Step 6048: {'lr': 0.00010053333333333334, 'samples': 193536, 'steps': 377, 'loss/train': 5.032104015350342} -09/20/2021 15:47:53 - INFO - __main__ - Step 6049: {'lr': 0.00010080000000000001, 'samples': 193568, 'steps': 378, 'loss/train': 4.878632545471191} -09/20/2021 15:47:53 - INFO - __main__ - Step 6050: {'lr': 0.00010080000000000001, 'samples': 193600, 'steps': 378, 'loss/train': 4.839878082275391} -09/20/2021 15:47:54 - INFO - __main__ - Step 6051: {'lr': 0.00010080000000000001, 'samples': 193632, 'steps': 378, 'loss/train': 3.7266387939453125} -09/20/2021 15:47:55 - INFO - __main__ - Step 6052: {'lr': 0.00010080000000000001, 'samples': 193664, 'steps': 378, 'loss/train': 3.70971417427063} -09/20/2021 15:47:56 - INFO - __main__ - Step 6053: {'lr': 0.00010080000000000001, 'samples': 193696, 'steps': 378, 'loss/train': 3.7122368812561035} -09/20/2021 15:47:56 - INFO - __main__ - Step 6054: {'lr': 0.00010080000000000001, 'samples': 193728, 'steps': 378, 'loss/train': 3.7184345722198486} -09/20/2021 15:47:57 - INFO - __main__ - Step 6055: {'lr': 0.00010080000000000001, 'samples': 193760, 'steps': 378, 'loss/train': 3.5171046257019043} -09/20/2021 15:47:58 - INFO - __main__ - Step 6056: {'lr': 0.00010080000000000001, 'samples': 193792, 'steps': 378, 'loss/train': 3.5292630195617676} -09/20/2021 15:47:59 - INFO - __main__ - Step 6057: {'lr': 0.00010080000000000001, 'samples': 193824, 'steps': 378, 'loss/train': 3.7158432006835938} -09/20/2021 15:47:59 - INFO - __main__ - Step 6058: {'lr': 0.00010080000000000001, 'samples': 193856, 'steps': 378, 'loss/train': 3.680220603942871} -09/20/2021 15:48:00 - INFO - __main__ - Step 6059: {'lr': 0.00010080000000000001, 'samples': 193888, 'steps': 378, 'loss/train': 5.681966304779053} -09/20/2021 15:48:01 - INFO - __main__ - Step 6060: {'lr': 0.00010080000000000001, 'samples': 193920, 'steps': 378, 'loss/train': 5.791448593139648} -09/20/2021 15:48:02 - INFO - __main__ - Step 6061: {'lr': 0.00010080000000000001, 'samples': 193952, 'steps': 378, 'loss/train': 3.8763349056243896} -09/20/2021 15:48:02 - INFO - __main__ - Step 6062: {'lr': 0.00010080000000000001, 'samples': 193984, 'steps': 378, 'loss/train': 5.045027732849121} -09/20/2021 15:48:03 - INFO - __main__ - Step 6063: {'lr': 0.00010080000000000001, 'samples': 194016, 'steps': 378, 'loss/train': 4.879772663116455} -09/20/2021 15:48:04 - INFO - __main__ - Step 6064: {'lr': 0.00010080000000000001, 'samples': 194048, 'steps': 378, 'loss/train': 5.000495910644531} -09/20/2021 15:48:05 - INFO - __main__ - Step 6065: {'lr': 0.00010106666666666667, 'samples': 194080, 'steps': 379, 'loss/train': 6.646951198577881} -09/20/2021 15:48:06 - INFO - __main__ - Step 6066: {'lr': 0.00010106666666666667, 'samples': 194112, 'steps': 379, 'loss/train': 6.253330707550049} -09/20/2021 15:48:06 - INFO - __main__ - Step 6067: {'lr': 0.00010106666666666667, 'samples': 194144, 'steps': 379, 'loss/train': 6.175625801086426} -09/20/2021 15:48:08 - INFO - __main__ - Step 6068: {'lr': 0.00010106666666666667, 'samples': 194176, 'steps': 379, 'loss/train': 5.028749942779541} -09/20/2021 15:48:08 - INFO - __main__ - Step 6069: {'lr': 0.00010106666666666667, 'samples': 194208, 'steps': 379, 'loss/train': 5.5613555908203125} -09/20/2021 15:48:09 - INFO - __main__ - Step 6070: {'lr': 0.00010106666666666667, 'samples': 194240, 'steps': 379, 'loss/train': 5.2388482093811035} -09/20/2021 15:48:10 - INFO - __main__ - Step 6071: {'lr': 0.00010106666666666667, 'samples': 194272, 'steps': 379, 'loss/train': 6.068282127380371} -09/20/2021 15:48:11 - INFO - __main__ - Step 6072: {'lr': 0.00010106666666666667, 'samples': 194304, 'steps': 379, 'loss/train': 5.5268473625183105} -09/20/2021 15:48:11 - INFO - __main__ - Step 6073: {'lr': 0.00010106666666666667, 'samples': 194336, 'steps': 379, 'loss/train': 5.351179122924805} -09/20/2021 15:48:12 - INFO - __main__ - Step 6074: {'lr': 0.00010106666666666667, 'samples': 194368, 'steps': 379, 'loss/train': 3.0322015285491943} -09/20/2021 15:48:13 - INFO - __main__ - Step 6075: {'lr': 0.00010106666666666667, 'samples': 194400, 'steps': 379, 'loss/train': 5.060859203338623} -09/20/2021 15:48:14 - INFO - __main__ - Step 6076: {'lr': 0.00010106666666666667, 'samples': 194432, 'steps': 379, 'loss/train': 4.910289287567139} -09/20/2021 15:48:14 - INFO - __main__ - Step 6077: {'lr': 0.00010106666666666667, 'samples': 194464, 'steps': 379, 'loss/train': 4.860773086547852} -09/20/2021 15:48:15 - INFO - __main__ - Step 6078: {'lr': 0.00010106666666666667, 'samples': 194496, 'steps': 379, 'loss/train': 5.232768535614014} -09/20/2021 15:48:16 - INFO - __main__ - Step 6079: {'lr': 0.00010106666666666667, 'samples': 194528, 'steps': 379, 'loss/train': 4.854548454284668} -09/20/2021 15:48:17 - INFO - __main__ - Step 6080: {'lr': 0.00010106666666666667, 'samples': 194560, 'steps': 379, 'loss/train': 5.05911922454834} -09/20/2021 15:48:18 - INFO - __main__ - Step 6081: {'lr': 0.00010133333333333335, 'samples': 194592, 'steps': 380, 'loss/train': 6.378683090209961} -09/20/2021 15:48:18 - INFO - __main__ - Step 6082: {'lr': 0.00010133333333333335, 'samples': 194624, 'steps': 380, 'loss/train': 5.3230462074279785} -09/20/2021 15:48:19 - INFO - __main__ - Step 6083: {'lr': 0.00010133333333333335, 'samples': 194656, 'steps': 380, 'loss/train': 7.64207124710083} -09/20/2021 15:48:20 - INFO - __main__ - Step 6084: {'lr': 0.00010133333333333335, 'samples': 194688, 'steps': 380, 'loss/train': 7.36376428604126} -09/20/2021 15:48:21 - INFO - __main__ - Step 6085: {'lr': 0.00010133333333333335, 'samples': 194720, 'steps': 380, 'loss/train': 8.015669822692871} -09/20/2021 15:48:21 - INFO - __main__ - Step 6086: {'lr': 0.00010133333333333335, 'samples': 194752, 'steps': 380, 'loss/train': 5.460724830627441} -09/20/2021 15:48:22 - INFO - __main__ - Step 6087: {'lr': 0.00010133333333333335, 'samples': 194784, 'steps': 380, 'loss/train': 4.773585319519043} -09/20/2021 15:48:23 - INFO - __main__ - Step 6088: {'lr': 0.00010133333333333335, 'samples': 194816, 'steps': 380, 'loss/train': 5.649134159088135} -09/20/2021 15:48:24 - INFO - __main__ - Step 6089: {'lr': 0.00010133333333333335, 'samples': 194848, 'steps': 380, 'loss/train': 5.836554527282715} -09/20/2021 15:48:24 - INFO - __main__ - Step 6090: {'lr': 0.00010133333333333335, 'samples': 194880, 'steps': 380, 'loss/train': 4.3396711349487305} -09/20/2021 15:48:25 - INFO - __main__ - Step 6091: {'lr': 0.00010133333333333335, 'samples': 194912, 'steps': 380, 'loss/train': 4.911440372467041} -09/20/2021 15:48:26 - INFO - __main__ - Step 6092: {'lr': 0.00010133333333333335, 'samples': 194944, 'steps': 380, 'loss/train': 4.705105781555176} -09/20/2021 15:48:27 - INFO - __main__ - Step 6093: {'lr': 0.00010133333333333335, 'samples': 194976, 'steps': 380, 'loss/train': 6.2248992919921875} -09/20/2021 15:48:27 - INFO - __main__ - Step 6094: {'lr': 0.00010133333333333335, 'samples': 195008, 'steps': 380, 'loss/train': 4.972703456878662} -09/20/2021 15:48:28 - INFO - __main__ - Step 6095: {'lr': 0.00010133333333333335, 'samples': 195040, 'steps': 380, 'loss/train': 5.992672443389893} -09/20/2021 15:48:29 - INFO - __main__ - Step 6096: {'lr': 0.00010133333333333335, 'samples': 195072, 'steps': 380, 'loss/train': 5.220491886138916} -09/20/2021 15:48:30 - INFO - __main__ - Step 6097: {'lr': 0.0001016, 'samples': 195104, 'steps': 381, 'loss/train': 5.721402168273926} -09/20/2021 15:48:30 - INFO - __main__ - Step 6098: {'lr': 0.0001016, 'samples': 195136, 'steps': 381, 'loss/train': 5.145596504211426} -09/20/2021 15:48:31 - INFO - __main__ - Step 6099: {'lr': 0.0001016, 'samples': 195168, 'steps': 381, 'loss/train': 5.042770862579346} -09/20/2021 15:48:33 - INFO - __main__ - Step 6100: {'lr': 0.0001016, 'samples': 195200, 'steps': 381, 'loss/train': 5.184782028198242} -09/20/2021 15:48:33 - INFO - __main__ - Step 6101: {'lr': 0.0001016, 'samples': 195232, 'steps': 381, 'loss/train': 5.228471755981445} -09/20/2021 15:48:34 - INFO - __main__ - Step 6102: {'lr': 0.0001016, 'samples': 195264, 'steps': 381, 'loss/train': 5.084226608276367} -09/20/2021 15:48:35 - INFO - __main__ - Step 6103: {'lr': 0.0001016, 'samples': 195296, 'steps': 381, 'loss/train': 5.9989166259765625} -09/20/2021 15:48:36 - INFO - __main__ - Step 6104: {'lr': 0.0001016, 'samples': 195328, 'steps': 381, 'loss/train': 5.844771385192871} -09/20/2021 15:48:36 - INFO - __main__ - Step 6105: {'lr': 0.0001016, 'samples': 195360, 'steps': 381, 'loss/train': 4.758748531341553} -09/20/2021 15:48:37 - INFO - __main__ - Step 6106: {'lr': 0.0001016, 'samples': 195392, 'steps': 381, 'loss/train': 4.032096862792969} -09/20/2021 15:48:38 - INFO - __main__ - Step 6107: {'lr': 0.0001016, 'samples': 195424, 'steps': 381, 'loss/train': 4.601985454559326} -09/20/2021 15:48:39 - INFO - __main__ - Step 6108: {'lr': 0.0001016, 'samples': 195456, 'steps': 381, 'loss/train': 5.793426990509033} -09/20/2021 15:48:39 - INFO - __main__ - Step 6109: {'lr': 0.0001016, 'samples': 195488, 'steps': 381, 'loss/train': 5.445920467376709} -09/20/2021 15:48:40 - INFO - __main__ - Step 6110: {'lr': 0.0001016, 'samples': 195520, 'steps': 381, 'loss/train': 4.950735092163086} -09/20/2021 15:48:41 - INFO - __main__ - Step 6111: {'lr': 0.0001016, 'samples': 195552, 'steps': 381, 'loss/train': 5.320648193359375} -09/20/2021 15:48:42 - INFO - __main__ - Step 6112: {'lr': 0.0001016, 'samples': 195584, 'steps': 381, 'loss/train': 5.848977565765381} -09/20/2021 15:48:42 - INFO - __main__ - Step 6113: {'lr': 0.00010186666666666667, 'samples': 195616, 'steps': 382, 'loss/train': 6.023468017578125} -09/20/2021 15:48:43 - INFO - __main__ - Step 6114: {'lr': 0.00010186666666666667, 'samples': 195648, 'steps': 382, 'loss/train': 4.9009480476379395} -09/20/2021 15:48:44 - INFO - __main__ - Step 6115: {'lr': 0.00010186666666666667, 'samples': 195680, 'steps': 382, 'loss/train': 6.89099645614624} -09/20/2021 15:48:45 - INFO - __main__ - Step 6116: {'lr': 0.00010186666666666667, 'samples': 195712, 'steps': 382, 'loss/train': 5.325668811798096} -09/20/2021 15:48:45 - INFO - __main__ - Step 6117: {'lr': 0.00010186666666666667, 'samples': 195744, 'steps': 382, 'loss/train': 5.591905117034912} -09/20/2021 15:48:46 - INFO - __main__ - Step 6118: {'lr': 0.00010186666666666667, 'samples': 195776, 'steps': 382, 'loss/train': 4.774571418762207} -09/20/2021 15:48:47 - INFO - __main__ - Step 6119: {'lr': 0.00010186666666666667, 'samples': 195808, 'steps': 382, 'loss/train': 4.957118511199951} -09/20/2021 15:48:48 - INFO - __main__ - Step 6120: {'lr': 0.00010186666666666667, 'samples': 195840, 'steps': 382, 'loss/train': 4.641545295715332} -09/20/2021 15:48:48 - INFO - __main__ - Step 6121: {'lr': 0.00010186666666666667, 'samples': 195872, 'steps': 382, 'loss/train': 4.59766149520874} -09/20/2021 15:48:49 - INFO - __main__ - Step 6122: {'lr': 0.00010186666666666667, 'samples': 195904, 'steps': 382, 'loss/train': 4.7825846672058105} -09/20/2021 15:48:50 - INFO - __main__ - Step 6123: {'lr': 0.00010186666666666667, 'samples': 195936, 'steps': 382, 'loss/train': 5.059673309326172} -09/20/2021 15:48:51 - INFO - __main__ - Step 6124: {'lr': 0.00010186666666666667, 'samples': 195968, 'steps': 382, 'loss/train': 7.174239635467529} -09/20/2021 15:48:51 - INFO - __main__ - Step 6125: {'lr': 0.00010186666666666667, 'samples': 196000, 'steps': 382, 'loss/train': 5.080442905426025} -09/20/2021 15:48:52 - INFO - __main__ - Step 6126: {'lr': 0.00010186666666666667, 'samples': 196032, 'steps': 382, 'loss/train': 5.1733856201171875} -09/20/2021 15:48:53 - INFO - __main__ - Step 6127: {'lr': 0.00010186666666666667, 'samples': 196064, 'steps': 382, 'loss/train': 5.057189464569092} -09/20/2021 15:48:54 - INFO - __main__ - Step 6128: {'lr': 0.00010186666666666667, 'samples': 196096, 'steps': 382, 'loss/train': 6.333260536193848} -09/20/2021 15:48:55 - INFO - __main__ - Step 6129: {'lr': 0.00010213333333333335, 'samples': 196128, 'steps': 383, 'loss/train': 6.151083946228027} -09/20/2021 15:48:56 - INFO - __main__ - Step 6130: {'lr': 0.00010213333333333335, 'samples': 196160, 'steps': 383, 'loss/train': 4.958632946014404} -09/20/2021 15:48:57 - INFO - __main__ - Step 6131: {'lr': 0.00010213333333333335, 'samples': 196192, 'steps': 383, 'loss/train': 5.200196743011475} -09/20/2021 15:48:57 - INFO - __main__ - Step 6132: {'lr': 0.00010213333333333335, 'samples': 196224, 'steps': 383, 'loss/train': 4.623350620269775} -09/20/2021 15:48:58 - INFO - __main__ - Step 6133: {'lr': 0.00010213333333333335, 'samples': 196256, 'steps': 383, 'loss/train': 4.554861545562744} -09/20/2021 15:48:59 - INFO - __main__ - Step 6134: {'lr': 0.00010213333333333335, 'samples': 196288, 'steps': 383, 'loss/train': 5.286263942718506} -09/20/2021 15:49:00 - INFO - __main__ - Step 6135: {'lr': 0.00010213333333333335, 'samples': 196320, 'steps': 383, 'loss/train': 4.873608589172363} -09/20/2021 15:49:00 - INFO - __main__ - Step 6136: {'lr': 0.00010213333333333335, 'samples': 196352, 'steps': 383, 'loss/train': 4.5388078689575195} -09/20/2021 15:49:01 - INFO - __main__ - Step 6137: {'lr': 0.00010213333333333335, 'samples': 196384, 'steps': 383, 'loss/train': 4.32119607925415} -09/20/2021 15:49:02 - INFO - __main__ - Step 6138: {'lr': 0.00010213333333333335, 'samples': 196416, 'steps': 383, 'loss/train': 4.831181049346924} -09/20/2021 15:49:03 - INFO - __main__ - Step 6139: {'lr': 0.00010213333333333335, 'samples': 196448, 'steps': 383, 'loss/train': 5.188840866088867} -09/20/2021 15:49:03 - INFO - __main__ - Step 6140: {'lr': 0.00010213333333333335, 'samples': 196480, 'steps': 383, 'loss/train': 4.532480716705322} -09/20/2021 15:49:04 - INFO - __main__ - Step 6141: {'lr': 0.00010213333333333335, 'samples': 196512, 'steps': 383, 'loss/train': 5.113681793212891} -09/20/2021 15:49:05 - INFO - __main__ - Step 6142: {'lr': 0.00010213333333333335, 'samples': 196544, 'steps': 383, 'loss/train': 5.260409832000732} -09/20/2021 15:49:06 - INFO - __main__ - Step 6143: {'lr': 0.00010213333333333335, 'samples': 196576, 'steps': 383, 'loss/train': 5.574301242828369} -09/20/2021 15:49:06 - INFO - __main__ - Step 6144: {'lr': 0.00010213333333333335, 'samples': 196608, 'steps': 383, 'loss/train': 4.0589280128479} -09/20/2021 15:49:07 - INFO - __main__ - Step 6145: {'lr': 0.00010240000000000001, 'samples': 196640, 'steps': 384, 'loss/train': 7.647355079650879} -09/20/2021 15:49:08 - INFO - __main__ - Step 6146: {'lr': 0.00010240000000000001, 'samples': 196672, 'steps': 384, 'loss/train': 5.01049280166626} -09/20/2021 15:49:09 - INFO - __main__ - Step 6147: {'lr': 0.00010240000000000001, 'samples': 196704, 'steps': 384, 'loss/train': 5.937919616699219} -09/20/2021 15:49:10 - INFO - __main__ - Step 6148: {'lr': 0.00010240000000000001, 'samples': 196736, 'steps': 384, 'loss/train': 5.562115669250488} -09/20/2021 15:49:10 - INFO - __main__ - Step 6149: {'lr': 0.00010240000000000001, 'samples': 196768, 'steps': 384, 'loss/train': 4.818474769592285} -09/20/2021 15:49:11 - INFO - __main__ - Step 6150: {'lr': 0.00010240000000000001, 'samples': 196800, 'steps': 384, 'loss/train': 5.212122440338135} -09/20/2021 15:49:12 - INFO - __main__ - Step 6151: {'lr': 0.00010240000000000001, 'samples': 196832, 'steps': 384, 'loss/train': 4.467218399047852} -09/20/2021 15:49:13 - INFO - __main__ - Step 6152: {'lr': 0.00010240000000000001, 'samples': 196864, 'steps': 384, 'loss/train': 5.354669570922852} -09/20/2021 15:49:13 - INFO - __main__ - Step 6153: {'lr': 0.00010240000000000001, 'samples': 196896, 'steps': 384, 'loss/train': 5.357248306274414} -09/20/2021 15:49:14 - INFO - __main__ - Step 6154: {'lr': 0.00010240000000000001, 'samples': 196928, 'steps': 384, 'loss/train': 5.070106029510498} -09/20/2021 15:49:15 - INFO - __main__ - Step 6155: {'lr': 0.00010240000000000001, 'samples': 196960, 'steps': 384, 'loss/train': 5.204556465148926} -09/20/2021 15:49:16 - INFO - __main__ - Step 6156: {'lr': 0.00010240000000000001, 'samples': 196992, 'steps': 384, 'loss/train': 3.18607759475708} -09/20/2021 15:49:16 - INFO - __main__ - Step 6157: {'lr': 0.00010240000000000001, 'samples': 197024, 'steps': 384, 'loss/train': 4.513599872589111} -09/20/2021 15:49:17 - INFO - __main__ - Step 6158: {'lr': 0.00010240000000000001, 'samples': 197056, 'steps': 384, 'loss/train': 5.1787214279174805} -09/20/2021 15:49:18 - INFO - __main__ - Step 6159: {'lr': 0.00010240000000000001, 'samples': 197088, 'steps': 384, 'loss/train': 5.245896339416504} -09/20/2021 15:49:19 - INFO - __main__ - Step 6160: {'lr': 0.00010240000000000001, 'samples': 197120, 'steps': 384, 'loss/train': 4.607112407684326} -09/20/2021 15:49:20 - INFO - __main__ - Step 6161: {'lr': 0.00010266666666666666, 'samples': 197152, 'steps': 385, 'loss/train': 5.8492560386657715} -09/20/2021 15:49:21 - INFO - __main__ - Step 6162: {'lr': 0.00010266666666666666, 'samples': 197184, 'steps': 385, 'loss/train': 4.981241703033447} -09/20/2021 15:49:22 - INFO - __main__ - Step 6163: {'lr': 0.00010266666666666666, 'samples': 197216, 'steps': 385, 'loss/train': 6.784089088439941} -09/20/2021 15:49:23 - INFO - __main__ - Step 6164: {'lr': 0.00010266666666666666, 'samples': 197248, 'steps': 385, 'loss/train': 5.284665107727051} -09/20/2021 15:49:23 - INFO - __main__ - Step 6165: {'lr': 0.00010266666666666666, 'samples': 197280, 'steps': 385, 'loss/train': 5.19978141784668} -09/20/2021 15:49:24 - INFO - __main__ - Step 6166: {'lr': 0.00010266666666666666, 'samples': 197312, 'steps': 385, 'loss/train': 5.178034782409668} -09/20/2021 15:49:25 - INFO - __main__ - Step 6167: {'lr': 0.00010266666666666666, 'samples': 197344, 'steps': 385, 'loss/train': 4.700356483459473} -09/20/2021 15:49:26 - INFO - __main__ - Step 6168: {'lr': 0.00010266666666666666, 'samples': 197376, 'steps': 385, 'loss/train': 5.9459547996521} -09/20/2021 15:49:26 - INFO - __main__ - Step 6169: {'lr': 0.00010266666666666666, 'samples': 197408, 'steps': 385, 'loss/train': 5.476052284240723} -09/20/2021 15:49:27 - INFO - __main__ - Step 6170: {'lr': 0.00010266666666666666, 'samples': 197440, 'steps': 385, 'loss/train': 3.819770097732544} -09/20/2021 15:49:28 - INFO - __main__ - Step 6171: {'lr': 0.00010266666666666666, 'samples': 197472, 'steps': 385, 'loss/train': 2.774310350418091} -09/20/2021 15:49:29 - INFO - __main__ - Step 6172: {'lr': 0.00010266666666666666, 'samples': 197504, 'steps': 385, 'loss/train': 3.0360918045043945} -09/20/2021 15:49:29 - INFO - __main__ - Step 6173: {'lr': 0.00010266666666666666, 'samples': 197536, 'steps': 385, 'loss/train': 4.076735496520996} -09/20/2021 15:49:30 - INFO - __main__ - Step 6174: {'lr': 0.00010266666666666666, 'samples': 197568, 'steps': 385, 'loss/train': 3.2034189701080322} -09/20/2021 15:49:31 - INFO - __main__ - Step 6175: {'lr': 0.00010266666666666666, 'samples': 197600, 'steps': 385, 'loss/train': 3.994899272918701} -09/20/2021 15:49:32 - INFO - __main__ - Step 6176: {'lr': 0.00010266666666666666, 'samples': 197632, 'steps': 385, 'loss/train': 5.024319171905518} -09/20/2021 15:49:32 - INFO - __main__ - Step 6177: {'lr': 0.00010293333333333335, 'samples': 197664, 'steps': 386, 'loss/train': 5.214025020599365} -09/20/2021 15:49:33 - INFO - __main__ - Step 6178: {'lr': 0.00010293333333333335, 'samples': 197696, 'steps': 386, 'loss/train': 4.948516368865967} -09/20/2021 15:49:34 - INFO - __main__ - Step 6179: {'lr': 0.00010293333333333335, 'samples': 197728, 'steps': 386, 'loss/train': 4.319981098175049} -09/20/2021 15:49:35 - INFO - __main__ - Step 6180: {'lr': 0.00010293333333333335, 'samples': 197760, 'steps': 386, 'loss/train': 5.286691188812256} -09/20/2021 15:49:36 - INFO - __main__ - Step 6181: {'lr': 0.00010293333333333335, 'samples': 197792, 'steps': 386, 'loss/train': 4.986863136291504} -09/20/2021 15:49:36 - INFO - __main__ - Step 6182: {'lr': 0.00010293333333333335, 'samples': 197824, 'steps': 386, 'loss/train': 5.588137149810791} -09/20/2021 15:49:37 - INFO - __main__ - Step 6183: {'lr': 0.00010293333333333335, 'samples': 197856, 'steps': 386, 'loss/train': 5.07297945022583} -09/20/2021 15:49:38 - INFO - __main__ - Step 6184: {'lr': 0.00010293333333333335, 'samples': 197888, 'steps': 386, 'loss/train': 5.872481346130371} -09/20/2021 15:49:39 - INFO - __main__ - Step 6185: {'lr': 0.00010293333333333335, 'samples': 197920, 'steps': 386, 'loss/train': 5.446286201477051} -09/20/2021 15:49:39 - INFO - __main__ - Step 6186: {'lr': 0.00010293333333333335, 'samples': 197952, 'steps': 386, 'loss/train': 4.974415302276611} -09/20/2021 15:49:40 - INFO - __main__ - Step 6187: {'lr': 0.00010293333333333335, 'samples': 197984, 'steps': 386, 'loss/train': 5.382274627685547} -09/20/2021 15:49:41 - INFO - __main__ - Step 6188: {'lr': 0.00010293333333333335, 'samples': 198016, 'steps': 386, 'loss/train': 4.949905872344971} -09/20/2021 15:49:42 - INFO - __main__ - Step 6189: {'lr': 0.00010293333333333335, 'samples': 198048, 'steps': 386, 'loss/train': 5.225276470184326} -09/20/2021 15:49:42 - INFO - __main__ - Step 6190: {'lr': 0.00010293333333333335, 'samples': 198080, 'steps': 386, 'loss/train': 5.520069599151611} -09/20/2021 15:49:43 - INFO - __main__ - Step 6191: {'lr': 0.00010293333333333335, 'samples': 198112, 'steps': 386, 'loss/train': 4.820483684539795} -09/20/2021 15:49:45 - INFO - __main__ - Step 6192: {'lr': 0.00010293333333333335, 'samples': 198144, 'steps': 386, 'loss/train': 5.07861328125} -09/20/2021 15:49:46 - INFO - __main__ - Step 6193: {'lr': 0.0001032, 'samples': 198176, 'steps': 387, 'loss/train': 5.3809967041015625} -09/20/2021 15:49:46 - INFO - __main__ - Step 6194: {'lr': 0.0001032, 'samples': 198208, 'steps': 387, 'loss/train': 5.138727188110352} -09/20/2021 15:49:47 - INFO - __main__ - Step 6195: {'lr': 0.0001032, 'samples': 198240, 'steps': 387, 'loss/train': 5.715369701385498} -09/20/2021 15:49:48 - INFO - __main__ - Step 6196: {'lr': 0.0001032, 'samples': 198272, 'steps': 387, 'loss/train': 4.7869367599487305} -09/20/2021 15:49:49 - INFO - __main__ - Step 6197: {'lr': 0.0001032, 'samples': 198304, 'steps': 387, 'loss/train': 4.950803756713867} -09/20/2021 15:49:49 - INFO - __main__ - Step 6198: {'lr': 0.0001032, 'samples': 198336, 'steps': 387, 'loss/train': 4.83839750289917} -09/20/2021 15:49:50 - INFO - __main__ - Step 6199: {'lr': 0.0001032, 'samples': 198368, 'steps': 387, 'loss/train': 5.966403007507324} -09/20/2021 15:49:51 - INFO - __main__ - Step 6200: {'lr': 0.0001032, 'samples': 198400, 'steps': 387, 'loss/train': 6.54057502746582} -09/20/2021 15:49:52 - INFO - __main__ - Step 6201: {'lr': 0.0001032, 'samples': 198432, 'steps': 387, 'loss/train': 5.509919166564941} -09/20/2021 15:49:52 - INFO - __main__ - Step 6202: {'lr': 0.0001032, 'samples': 198464, 'steps': 387, 'loss/train': 4.817920207977295} -09/20/2021 15:49:53 - INFO - __main__ - Step 6203: {'lr': 0.0001032, 'samples': 198496, 'steps': 387, 'loss/train': 5.506747245788574} -09/20/2021 15:49:54 - INFO - __main__ - Step 6204: {'lr': 0.0001032, 'samples': 198528, 'steps': 387, 'loss/train': 6.955705165863037} -09/20/2021 15:49:55 - INFO - __main__ - Step 6205: {'lr': 0.0001032, 'samples': 198560, 'steps': 387, 'loss/train': 5.184272766113281} -09/20/2021 15:49:55 - INFO - __main__ - Step 6206: {'lr': 0.0001032, 'samples': 198592, 'steps': 387, 'loss/train': 4.574939250946045} -09/20/2021 15:49:56 - INFO - __main__ - Step 6207: {'lr': 0.0001032, 'samples': 198624, 'steps': 387, 'loss/train': 5.460910797119141} -09/20/2021 15:49:57 - INFO - __main__ - Step 6208: {'lr': 0.0001032, 'samples': 198656, 'steps': 387, 'loss/train': 6.7585601806640625} -09/20/2021 15:49:58 - INFO - __main__ - Step 6209: {'lr': 0.00010346666666666667, 'samples': 198688, 'steps': 388, 'loss/train': 5.054930210113525} -09/20/2021 15:49:59 - INFO - __main__ - Step 6210: {'lr': 0.00010346666666666667, 'samples': 198720, 'steps': 388, 'loss/train': 6.342729568481445} -09/20/2021 15:49:59 - INFO - __main__ - Step 6211: {'lr': 0.00010346666666666667, 'samples': 198752, 'steps': 388, 'loss/train': 6.623684406280518} -09/20/2021 15:50:00 - INFO - __main__ - Step 6212: {'lr': 0.00010346666666666667, 'samples': 198784, 'steps': 388, 'loss/train': 2.7116286754608154} -09/20/2021 15:50:01 - INFO - __main__ - Step 6213: {'lr': 0.00010346666666666667, 'samples': 198816, 'steps': 388, 'loss/train': 5.201048851013184} -09/20/2021 15:50:02 - INFO - __main__ - Step 6214: {'lr': 0.00010346666666666667, 'samples': 198848, 'steps': 388, 'loss/train': 5.220352649688721} -09/20/2021 15:50:02 - INFO - __main__ - Step 6215: {'lr': 0.00010346666666666667, 'samples': 198880, 'steps': 388, 'loss/train': 4.813627243041992} -09/20/2021 15:50:03 - INFO - __main__ - Step 6216: {'lr': 0.00010346666666666667, 'samples': 198912, 'steps': 388, 'loss/train': 6.198338985443115} -09/20/2021 15:50:04 - INFO - __main__ - Step 6217: {'lr': 0.00010346666666666667, 'samples': 198944, 'steps': 388, 'loss/train': 4.971668720245361} -09/20/2021 15:50:05 - INFO - __main__ - Step 6218: {'lr': 0.00010346666666666667, 'samples': 198976, 'steps': 388, 'loss/train': 3.8249166011810303} -09/20/2021 15:50:05 - INFO - __main__ - Step 6219: {'lr': 0.00010346666666666667, 'samples': 199008, 'steps': 388, 'loss/train': 5.324762344360352} -09/20/2021 15:50:06 - INFO - __main__ - Step 6220: {'lr': 0.00010346666666666667, 'samples': 199040, 'steps': 388, 'loss/train': 5.737759113311768} -09/20/2021 15:50:07 - INFO - __main__ - Step 6221: {'lr': 0.00010346666666666667, 'samples': 199072, 'steps': 388, 'loss/train': 5.098987102508545} -09/20/2021 15:50:08 - INFO - __main__ - Step 6222: {'lr': 0.00010346666666666667, 'samples': 199104, 'steps': 388, 'loss/train': 5.876335144042969} -09/20/2021 15:50:09 - INFO - __main__ - Step 6223: {'lr': 0.00010346666666666667, 'samples': 199136, 'steps': 388, 'loss/train': 5.157642364501953} -09/20/2021 15:50:10 - INFO - __main__ - Step 6224: {'lr': 0.00010346666666666667, 'samples': 199168, 'steps': 388, 'loss/train': 5.077480792999268} -09/20/2021 15:50:10 - INFO - __main__ - Step 6225: {'lr': 0.00010373333333333335, 'samples': 199200, 'steps': 389, 'loss/train': 5.270542144775391} -09/20/2021 15:50:11 - INFO - __main__ - Step 6226: {'lr': 0.00010373333333333335, 'samples': 199232, 'steps': 389, 'loss/train': 5.423245906829834} -09/20/2021 15:50:12 - INFO - __main__ - Step 6227: {'lr': 0.00010373333333333335, 'samples': 199264, 'steps': 389, 'loss/train': 4.705164909362793} -09/20/2021 15:50:13 - INFO - __main__ - Step 6228: {'lr': 0.00010373333333333335, 'samples': 199296, 'steps': 389, 'loss/train': 5.041686058044434} -09/20/2021 15:50:13 - INFO - __main__ - Step 6229: {'lr': 0.00010373333333333335, 'samples': 199328, 'steps': 389, 'loss/train': 4.914275646209717} -09/20/2021 15:50:14 - INFO - __main__ - Step 6230: {'lr': 0.00010373333333333335, 'samples': 199360, 'steps': 389, 'loss/train': 1.0372064113616943} -09/20/2021 15:50:15 - INFO - __main__ - Step 6231: {'lr': 0.00010373333333333335, 'samples': 199392, 'steps': 389, 'loss/train': 5.8744940757751465} -09/20/2021 15:50:16 - INFO - __main__ - Step 6232: {'lr': 0.00010373333333333335, 'samples': 199424, 'steps': 389, 'loss/train': 8.674612998962402} -09/20/2021 15:50:16 - INFO - __main__ - Step 6233: {'lr': 0.00010373333333333335, 'samples': 199456, 'steps': 389, 'loss/train': 4.572208881378174} -09/20/2021 15:50:17 - INFO - __main__ - Step 6234: {'lr': 0.00010373333333333335, 'samples': 199488, 'steps': 389, 'loss/train': 5.099900722503662} -09/20/2021 15:50:18 - INFO - __main__ - Step 6235: {'lr': 0.00010373333333333335, 'samples': 199520, 'steps': 389, 'loss/train': 4.861019611358643} -09/20/2021 15:50:19 - INFO - __main__ - Step 6236: {'lr': 0.00010373333333333335, 'samples': 199552, 'steps': 389, 'loss/train': 1.595914602279663} -09/20/2021 15:50:19 - INFO - __main__ - Step 6237: {'lr': 0.00010373333333333335, 'samples': 199584, 'steps': 389, 'loss/train': 4.843727111816406} -09/20/2021 15:50:20 - INFO - __main__ - Step 6238: {'lr': 0.00010373333333333335, 'samples': 199616, 'steps': 389, 'loss/train': 5.283071517944336} -09/20/2021 15:50:21 - INFO - __main__ - Step 6239: {'lr': 0.00010373333333333335, 'samples': 199648, 'steps': 389, 'loss/train': 5.281555652618408} -09/20/2021 15:50:22 - INFO - __main__ - Step 6240: {'lr': 0.00010373333333333335, 'samples': 199680, 'steps': 389, 'loss/train': 5.77042818069458} -09/20/2021 15:50:23 - INFO - __main__ - Step 6241: {'lr': 0.00010400000000000001, 'samples': 199712, 'steps': 390, 'loss/train': 4.787271022796631} -09/20/2021 15:50:23 - INFO - __main__ - Step 6242: {'lr': 0.00010400000000000001, 'samples': 199744, 'steps': 390, 'loss/train': 5.206768989562988} -09/20/2021 15:50:24 - INFO - __main__ - Step 6243: {'lr': 0.00010400000000000001, 'samples': 199776, 'steps': 390, 'loss/train': 5.133284568786621} -09/20/2021 15:50:25 - INFO - __main__ - Step 6244: {'lr': 0.00010400000000000001, 'samples': 199808, 'steps': 390, 'loss/train': 5.636648178100586} -09/20/2021 15:50:26 - INFO - __main__ - Step 6245: {'lr': 0.00010400000000000001, 'samples': 199840, 'steps': 390, 'loss/train': 5.517178058624268} -09/20/2021 15:50:26 - INFO - __main__ - Step 6246: {'lr': 0.00010400000000000001, 'samples': 199872, 'steps': 390, 'loss/train': 4.85926628112793} -09/20/2021 15:50:27 - INFO - __main__ - Step 6247: {'lr': 0.00010400000000000001, 'samples': 199904, 'steps': 390, 'loss/train': 4.996678829193115} -09/20/2021 15:50:28 - INFO - __main__ - Step 6248: {'lr': 0.00010400000000000001, 'samples': 199936, 'steps': 390, 'loss/train': 5.696592807769775} -09/20/2021 15:50:29 - INFO - __main__ - Step 6249: {'lr': 0.00010400000000000001, 'samples': 199968, 'steps': 390, 'loss/train': 5.136824607849121} -09/20/2021 15:50:29 - INFO - __main__ - Step 6250: {'lr': 0.00010400000000000001, 'samples': 200000, 'steps': 390, 'loss/train': 4.8619513511657715} -09/20/2021 15:50:30 - INFO - __main__ - Step 6251: {'lr': 0.00010400000000000001, 'samples': 200032, 'steps': 390, 'loss/train': 5.198021411895752} -09/20/2021 15:50:31 - INFO - __main__ - Step 6252: {'lr': 0.00010400000000000001, 'samples': 200064, 'steps': 390, 'loss/train': 4.730133533477783} -09/20/2021 15:50:32 - INFO - __main__ - Step 6253: {'lr': 0.00010400000000000001, 'samples': 200096, 'steps': 390, 'loss/train': 5.3002824783325195} -09/20/2021 15:50:33 - INFO - __main__ - Step 6254: {'lr': 0.00010400000000000001, 'samples': 200128, 'steps': 390, 'loss/train': 5.34547758102417} -09/20/2021 15:50:34 - INFO - __main__ - Step 6255: {'lr': 0.00010400000000000001, 'samples': 200160, 'steps': 390, 'loss/train': 5.047243595123291} -09/20/2021 15:50:34 - INFO - __main__ - Step 6256: {'lr': 0.00010400000000000001, 'samples': 200192, 'steps': 390, 'loss/train': 5.673645973205566} -09/20/2021 15:50:35 - INFO - __main__ - Step 6257: {'lr': 0.00010426666666666666, 'samples': 200224, 'steps': 391, 'loss/train': 4.9926347732543945} -09/20/2021 15:50:36 - INFO - __main__ - Step 6258: {'lr': 0.00010426666666666666, 'samples': 200256, 'steps': 391, 'loss/train': 4.908750057220459} -09/20/2021 15:50:37 - INFO - __main__ - Step 6259: {'lr': 0.00010426666666666666, 'samples': 200288, 'steps': 391, 'loss/train': 6.055606842041016} -09/20/2021 15:50:38 - INFO - __main__ - Step 6260: {'lr': 0.00010426666666666666, 'samples': 200320, 'steps': 391, 'loss/train': 5.286067008972168} -09/20/2021 15:50:38 - INFO - __main__ - Step 6261: {'lr': 0.00010426666666666666, 'samples': 200352, 'steps': 391, 'loss/train': 4.918385982513428} -09/20/2021 15:50:39 - INFO - __main__ - Step 6262: {'lr': 0.00010426666666666666, 'samples': 200384, 'steps': 391, 'loss/train': 5.047978401184082} -09/20/2021 15:50:40 - INFO - __main__ - Step 6263: {'lr': 0.00010426666666666666, 'samples': 200416, 'steps': 391, 'loss/train': 6.011622905731201} -09/20/2021 15:50:41 - INFO - __main__ - Step 6264: {'lr': 0.00010426666666666666, 'samples': 200448, 'steps': 391, 'loss/train': 5.059463024139404} -09/20/2021 15:50:41 - INFO - __main__ - Step 6265: {'lr': 0.00010426666666666666, 'samples': 200480, 'steps': 391, 'loss/train': 5.134816646575928} -09/20/2021 15:50:42 - INFO - __main__ - Step 6266: {'lr': 0.00010426666666666666, 'samples': 200512, 'steps': 391, 'loss/train': 5.3093390464782715} -09/20/2021 15:50:43 - INFO - __main__ - Step 6267: {'lr': 0.00010426666666666666, 'samples': 200544, 'steps': 391, 'loss/train': 5.130618095397949} -09/20/2021 15:50:44 - INFO - __main__ - Step 6268: {'lr': 0.00010426666666666666, 'samples': 200576, 'steps': 391, 'loss/train': 5.663939952850342} -09/20/2021 15:50:44 - INFO - __main__ - Step 6269: {'lr': 0.00010426666666666666, 'samples': 200608, 'steps': 391, 'loss/train': 5.096347332000732} -09/20/2021 15:50:45 - INFO - __main__ - Step 6270: {'lr': 0.00010426666666666666, 'samples': 200640, 'steps': 391, 'loss/train': 5.010516166687012} -09/20/2021 15:50:46 - INFO - __main__ - Step 6271: {'lr': 0.00010426666666666666, 'samples': 200672, 'steps': 391, 'loss/train': 6.176682472229004} -09/20/2021 15:50:47 - INFO - __main__ - Step 6272: {'lr': 0.00010426666666666666, 'samples': 200704, 'steps': 391, 'loss/train': 4.433653354644775} -09/20/2021 15:50:47 - INFO - __main__ - Step 6273: {'lr': 0.00010453333333333333, 'samples': 200736, 'steps': 392, 'loss/train': 5.42526912689209} -09/20/2021 15:50:48 - INFO - __main__ - Step 6274: {'lr': 0.00010453333333333333, 'samples': 200768, 'steps': 392, 'loss/train': 5.485437870025635} -09/20/2021 15:50:49 - INFO - __main__ - Step 6275: {'lr': 0.00010453333333333333, 'samples': 200800, 'steps': 392, 'loss/train': 5.681934833526611} -09/20/2021 15:50:50 - INFO - __main__ - Step 6276: {'lr': 0.00010453333333333333, 'samples': 200832, 'steps': 392, 'loss/train': 5.089773654937744} -09/20/2021 15:50:50 - INFO - __main__ - Step 6277: {'lr': 0.00010453333333333333, 'samples': 200864, 'steps': 392, 'loss/train': 4.727214813232422} -09/20/2021 15:50:51 - INFO - __main__ - Step 6278: {'lr': 0.00010453333333333333, 'samples': 200896, 'steps': 392, 'loss/train': 5.117652416229248} -09/20/2021 15:50:52 - INFO - __main__ - Step 6279: {'lr': 0.00010453333333333333, 'samples': 200928, 'steps': 392, 'loss/train': 4.966012954711914} -09/20/2021 15:50:53 - INFO - __main__ - Step 6280: {'lr': 0.00010453333333333333, 'samples': 200960, 'steps': 392, 'loss/train': 5.085820198059082} -09/20/2021 15:50:53 - INFO - __main__ - Step 6281: {'lr': 0.00010453333333333333, 'samples': 200992, 'steps': 392, 'loss/train': 5.087268829345703} -09/20/2021 15:50:54 - INFO - __main__ - Step 6282: {'lr': 0.00010453333333333333, 'samples': 201024, 'steps': 392, 'loss/train': 4.6364359855651855} -09/20/2021 15:50:55 - INFO - __main__ - Step 6283: {'lr': 0.00010453333333333333, 'samples': 201056, 'steps': 392, 'loss/train': 6.5049591064453125} -09/20/2021 15:50:56 - INFO - __main__ - Step 6284: {'lr': 0.00010453333333333333, 'samples': 201088, 'steps': 392, 'loss/train': 5.278923034667969} -09/20/2021 15:50:57 - INFO - __main__ - Step 6285: {'lr': 0.00010453333333333333, 'samples': 201120, 'steps': 392, 'loss/train': 4.6279096603393555} -09/20/2021 15:50:58 - INFO - __main__ - Step 6286: {'lr': 0.00010453333333333333, 'samples': 201152, 'steps': 392, 'loss/train': 4.670717239379883} -09/20/2021 15:50:58 - INFO - __main__ - Step 6287: {'lr': 0.00010453333333333333, 'samples': 201184, 'steps': 392, 'loss/train': 4.8924665451049805} -09/20/2021 15:50:59 - INFO - __main__ - Step 6288: {'lr': 0.00010453333333333333, 'samples': 201216, 'steps': 392, 'loss/train': 5.246464252471924} -09/20/2021 15:51:00 - INFO - __main__ - Step 6289: {'lr': 0.00010480000000000001, 'samples': 201248, 'steps': 393, 'loss/train': 5.001348972320557} -09/20/2021 15:51:01 - INFO - __main__ - Step 6290: {'lr': 0.00010480000000000001, 'samples': 201280, 'steps': 393, 'loss/train': 5.841858863830566} -09/20/2021 15:51:02 - INFO - __main__ - Step 6291: {'lr': 0.00010480000000000001, 'samples': 201312, 'steps': 393, 'loss/train': 4.398216724395752} -09/20/2021 15:51:02 - INFO - __main__ - Step 6292: {'lr': 0.00010480000000000001, 'samples': 201344, 'steps': 393, 'loss/train': 5.1156182289123535} -09/20/2021 15:51:03 - INFO - __main__ - Step 6293: {'lr': 0.00010480000000000001, 'samples': 201376, 'steps': 393, 'loss/train': 5.050980567932129} -09/20/2021 15:51:04 - INFO - __main__ - Step 6294: {'lr': 0.00010480000000000001, 'samples': 201408, 'steps': 393, 'loss/train': 4.851740837097168} -09/20/2021 15:51:05 - INFO - __main__ - Step 6295: {'lr': 0.00010480000000000001, 'samples': 201440, 'steps': 393, 'loss/train': 4.597358703613281} -09/20/2021 15:51:05 - INFO - __main__ - Step 6296: {'lr': 0.00010480000000000001, 'samples': 201472, 'steps': 393, 'loss/train': 4.912489414215088} -09/20/2021 15:51:06 - INFO - __main__ - Step 6297: {'lr': 0.00010480000000000001, 'samples': 201504, 'steps': 393, 'loss/train': 4.529915809631348} -09/20/2021 15:51:07 - INFO - __main__ - Step 6298: {'lr': 0.00010480000000000001, 'samples': 201536, 'steps': 393, 'loss/train': 4.291790962219238} -09/20/2021 15:51:08 - INFO - __main__ - Step 6299: {'lr': 0.00010480000000000001, 'samples': 201568, 'steps': 393, 'loss/train': 5.325258731842041} -09/20/2021 15:51:08 - INFO - __main__ - Step 6300: {'lr': 0.00010480000000000001, 'samples': 201600, 'steps': 393, 'loss/train': 4.811532974243164} -09/20/2021 15:51:09 - INFO - __main__ - Step 6301: {'lr': 0.00010480000000000001, 'samples': 201632, 'steps': 393, 'loss/train': 5.281351566314697} -09/20/2021 15:51:10 - INFO - __main__ - Step 6302: {'lr': 0.00010480000000000001, 'samples': 201664, 'steps': 393, 'loss/train': 5.526342868804932} -09/20/2021 15:51:11 - INFO - __main__ - Step 6303: {'lr': 0.00010480000000000001, 'samples': 201696, 'steps': 393, 'loss/train': 5.908514499664307} -09/20/2021 15:51:11 - INFO - __main__ - Step 6304: {'lr': 0.00010480000000000001, 'samples': 201728, 'steps': 393, 'loss/train': 5.987160682678223} -09/20/2021 15:51:12 - INFO - __main__ - Step 6305: {'lr': 0.00010506666666666667, 'samples': 201760, 'steps': 394, 'loss/train': 4.33823823928833} -09/20/2021 15:51:13 - INFO - __main__ - Step 6306: {'lr': 0.00010506666666666667, 'samples': 201792, 'steps': 394, 'loss/train': 5.495689868927002} -09/20/2021 15:51:14 - INFO - __main__ - Step 6307: {'lr': 0.00010506666666666667, 'samples': 201824, 'steps': 394, 'loss/train': 5.97475004196167} -09/20/2021 15:51:14 - INFO - __main__ - Step 6308: {'lr': 0.00010506666666666667, 'samples': 201856, 'steps': 394, 'loss/train': 5.324914455413818} -09/20/2021 15:51:15 - INFO - __main__ - Step 6309: {'lr': 0.00010506666666666667, 'samples': 201888, 'steps': 394, 'loss/train': 4.37912130355835} -09/20/2021 15:51:16 - INFO - __main__ - Step 6310: {'lr': 0.00010506666666666667, 'samples': 201920, 'steps': 394, 'loss/train': 5.394744396209717} -09/20/2021 15:51:17 - INFO - __main__ - Step 6311: {'lr': 0.00010506666666666667, 'samples': 201952, 'steps': 394, 'loss/train': 5.357307434082031} -09/20/2021 15:51:17 - INFO - __main__ - Step 6312: {'lr': 0.00010506666666666667, 'samples': 201984, 'steps': 394, 'loss/train': 5.212714672088623} -09/20/2021 15:51:18 - INFO - __main__ - Step 6313: {'lr': 0.00010506666666666667, 'samples': 202016, 'steps': 394, 'loss/train': 4.979619979858398} -09/20/2021 15:51:19 - INFO - __main__ - Step 6314: {'lr': 0.00010506666666666667, 'samples': 202048, 'steps': 394, 'loss/train': 5.071383953094482} -09/20/2021 15:51:20 - INFO - __main__ - Step 6315: {'lr': 0.00010506666666666667, 'samples': 202080, 'steps': 394, 'loss/train': 0.9841877818107605} -09/20/2021 15:51:21 - INFO - __main__ - Step 6316: {'lr': 0.00010506666666666667, 'samples': 202112, 'steps': 394, 'loss/train': 5.290858268737793} -09/20/2021 15:51:22 - INFO - __main__ - Step 6317: {'lr': 0.00010506666666666667, 'samples': 202144, 'steps': 394, 'loss/train': 5.27586030960083} -09/20/2021 15:51:23 - INFO - __main__ - Step 6318: {'lr': 0.00010506666666666667, 'samples': 202176, 'steps': 394, 'loss/train': 6.608367919921875} -09/20/2021 15:51:23 - INFO - __main__ - Step 6319: {'lr': 0.00010506666666666667, 'samples': 202208, 'steps': 394, 'loss/train': 5.118356227874756} -09/20/2021 15:51:24 - INFO - __main__ - Step 6320: {'lr': 0.00010506666666666667, 'samples': 202240, 'steps': 394, 'loss/train': 5.103254795074463} -09/20/2021 15:51:25 - INFO - __main__ - Step 6321: {'lr': 0.00010533333333333332, 'samples': 202272, 'steps': 395, 'loss/train': 4.732451915740967} -09/20/2021 15:51:26 - INFO - __main__ - Step 6322: {'lr': 0.00010533333333333332, 'samples': 202304, 'steps': 395, 'loss/train': 5.15871524810791} -09/20/2021 15:51:26 - INFO - __main__ - Step 6323: {'lr': 0.00010533333333333332, 'samples': 202336, 'steps': 395, 'loss/train': 4.700324535369873} -09/20/2021 15:51:27 - INFO - __main__ - Step 6324: {'lr': 0.00010533333333333332, 'samples': 202368, 'steps': 395, 'loss/train': 4.781498908996582} -09/20/2021 15:51:28 - INFO - __main__ - Step 6325: {'lr': 0.00010533333333333332, 'samples': 202400, 'steps': 395, 'loss/train': 4.469964027404785} -09/20/2021 15:51:29 - INFO - __main__ - Step 6326: {'lr': 0.00010533333333333332, 'samples': 202432, 'steps': 395, 'loss/train': 4.571869373321533} -09/20/2021 15:51:29 - INFO - __main__ - Step 6327: {'lr': 0.00010533333333333332, 'samples': 202464, 'steps': 395, 'loss/train': 5.25010347366333} -09/20/2021 15:51:30 - INFO - __main__ - Step 6328: {'lr': 0.00010533333333333332, 'samples': 202496, 'steps': 395, 'loss/train': 5.269396781921387} -09/20/2021 15:51:31 - INFO - __main__ - Step 6329: {'lr': 0.00010533333333333332, 'samples': 202528, 'steps': 395, 'loss/train': 5.669257164001465} -09/20/2021 15:51:32 - INFO - __main__ - Step 6330: {'lr': 0.00010533333333333332, 'samples': 202560, 'steps': 395, 'loss/train': 5.8207879066467285} -09/20/2021 15:51:32 - INFO - __main__ - Step 6331: {'lr': 0.00010533333333333332, 'samples': 202592, 'steps': 395, 'loss/train': 5.073752403259277} -09/20/2021 15:51:33 - INFO - __main__ - Step 6332: {'lr': 0.00010533333333333332, 'samples': 202624, 'steps': 395, 'loss/train': 4.699794292449951} -09/20/2021 15:51:34 - INFO - __main__ - Step 6333: {'lr': 0.00010533333333333332, 'samples': 202656, 'steps': 395, 'loss/train': 4.9629693031311035} -09/20/2021 15:51:35 - INFO - __main__ - Step 6334: {'lr': 0.00010533333333333332, 'samples': 202688, 'steps': 395, 'loss/train': 5.507871627807617} -09/20/2021 15:51:35 - INFO - __main__ - Step 6335: {'lr': 0.00010533333333333332, 'samples': 202720, 'steps': 395, 'loss/train': 4.649709224700928} -09/20/2021 15:51:36 - INFO - __main__ - Step 6336: {'lr': 0.00010533333333333332, 'samples': 202752, 'steps': 395, 'loss/train': 4.782787322998047} -09/20/2021 15:51:37 - INFO - __main__ - Step 6337: {'lr': 0.0001056, 'samples': 202784, 'steps': 396, 'loss/train': 4.921724319458008} -09/20/2021 15:51:38 - INFO - __main__ - Step 6338: {'lr': 0.0001056, 'samples': 202816, 'steps': 396, 'loss/train': 5.00670051574707} -09/20/2021 15:51:39 - INFO - __main__ - Step 6339: {'lr': 0.0001056, 'samples': 202848, 'steps': 396, 'loss/train': 4.1114068031311035} -09/20/2021 15:51:39 - INFO - __main__ - Step 6340: {'lr': 0.0001056, 'samples': 202880, 'steps': 396, 'loss/train': 6.010355472564697} -09/20/2021 15:51:40 - INFO - __main__ - Step 6341: {'lr': 0.0001056, 'samples': 202912, 'steps': 396, 'loss/train': 5.199075698852539} -09/20/2021 15:51:41 - INFO - __main__ - Step 6342: {'lr': 0.0001056, 'samples': 202944, 'steps': 396, 'loss/train': 4.889699935913086} -09/20/2021 15:51:42 - INFO - __main__ - Step 6343: {'lr': 0.0001056, 'samples': 202976, 'steps': 396, 'loss/train': 5.207945823669434} -09/20/2021 15:51:42 - INFO - __main__ - Step 6344: {'lr': 0.0001056, 'samples': 203008, 'steps': 396, 'loss/train': 4.213631629943848} -09/20/2021 15:51:43 - INFO - __main__ - Step 6345: {'lr': 0.0001056, 'samples': 203040, 'steps': 396, 'loss/train': 4.7476806640625} -09/20/2021 15:51:44 - INFO - __main__ - Step 6346: {'lr': 0.0001056, 'samples': 203072, 'steps': 396, 'loss/train': 4.936276912689209} -09/20/2021 15:51:45 - INFO - __main__ - Step 6347: {'lr': 0.0001056, 'samples': 203104, 'steps': 396, 'loss/train': 5.179327964782715} -09/20/2021 15:51:46 - INFO - __main__ - Step 6348: {'lr': 0.0001056, 'samples': 203136, 'steps': 396, 'loss/train': 4.997227668762207} -09/20/2021 15:51:47 - INFO - __main__ - Step 6349: {'lr': 0.0001056, 'samples': 203168, 'steps': 396, 'loss/train': 5.506021499633789} -09/20/2021 15:51:47 - INFO - __main__ - Step 6350: {'lr': 0.0001056, 'samples': 203200, 'steps': 396, 'loss/train': 5.188838958740234} -09/20/2021 15:51:48 - INFO - __main__ - Step 6351: {'lr': 0.0001056, 'samples': 203232, 'steps': 396, 'loss/train': 5.255263328552246} -09/20/2021 15:51:49 - INFO - __main__ - Step 6352: {'lr': 0.0001056, 'samples': 203264, 'steps': 396, 'loss/train': 5.498103141784668} -09/20/2021 15:51:50 - INFO - __main__ - Step 6353: {'lr': 0.00010586666666666667, 'samples': 203296, 'steps': 397, 'loss/train': 3.8619749546051025} -09/20/2021 15:51:50 - INFO - __main__ - Step 6354: {'lr': 0.00010586666666666667, 'samples': 203328, 'steps': 397, 'loss/train': 5.304193019866943} -09/20/2021 15:51:51 - INFO - __main__ - Step 6355: {'lr': 0.00010586666666666667, 'samples': 203360, 'steps': 397, 'loss/train': 5.025384902954102} -09/20/2021 15:51:52 - INFO - __main__ - Step 6356: {'lr': 0.00010586666666666667, 'samples': 203392, 'steps': 397, 'loss/train': 4.836343288421631} -09/20/2021 15:51:53 - INFO - __main__ - Step 6357: {'lr': 0.00010586666666666667, 'samples': 203424, 'steps': 397, 'loss/train': 5.827605724334717} -09/20/2021 15:51:53 - INFO - __main__ - Step 6358: {'lr': 0.00010586666666666667, 'samples': 203456, 'steps': 397, 'loss/train': 7.30184268951416} -09/20/2021 15:51:54 - INFO - __main__ - Step 6359: {'lr': 0.00010586666666666667, 'samples': 203488, 'steps': 397, 'loss/train': 5.192502021789551} -09/20/2021 15:51:55 - INFO - __main__ - Step 6360: {'lr': 0.00010586666666666667, 'samples': 203520, 'steps': 397, 'loss/train': 5.384901523590088} -09/20/2021 15:51:56 - INFO - __main__ - Step 6361: {'lr': 0.00010586666666666667, 'samples': 203552, 'steps': 397, 'loss/train': 5.189207077026367} -09/20/2021 15:51:56 - INFO - __main__ - Step 6362: {'lr': 0.00010586666666666667, 'samples': 203584, 'steps': 397, 'loss/train': 6.270502090454102} -09/20/2021 15:51:57 - INFO - __main__ - Step 6363: {'lr': 0.00010586666666666667, 'samples': 203616, 'steps': 397, 'loss/train': 5.573006629943848} -09/20/2021 15:51:58 - INFO - __main__ - Step 6364: {'lr': 0.00010586666666666667, 'samples': 203648, 'steps': 397, 'loss/train': 4.933098793029785} -09/20/2021 15:51:59 - INFO - __main__ - Step 6365: {'lr': 0.00010586666666666667, 'samples': 203680, 'steps': 397, 'loss/train': 2.9888217449188232} -09/20/2021 15:51:59 - INFO - __main__ - Step 6366: {'lr': 0.00010586666666666667, 'samples': 203712, 'steps': 397, 'loss/train': 5.100575923919678} -09/20/2021 15:52:00 - INFO - __main__ - Step 6367: {'lr': 0.00010586666666666667, 'samples': 203744, 'steps': 397, 'loss/train': 4.1568522453308105} -09/20/2021 15:52:01 - INFO - __main__ - Step 6368: {'lr': 0.00010586666666666667, 'samples': 203776, 'steps': 397, 'loss/train': 4.955411434173584} -09/20/2021 15:52:02 - INFO - __main__ - Step 6369: {'lr': 0.00010613333333333333, 'samples': 203808, 'steps': 398, 'loss/train': 5.214855194091797} -09/20/2021 15:52:03 - INFO - __main__ - Step 6370: {'lr': 0.00010613333333333333, 'samples': 203840, 'steps': 398, 'loss/train': 5.301117897033691} -09/20/2021 15:52:03 - INFO - __main__ - Step 6371: {'lr': 0.00010613333333333333, 'samples': 203872, 'steps': 398, 'loss/train': 5.994975566864014} -09/20/2021 15:52:04 - INFO - __main__ - Step 6372: {'lr': 0.00010613333333333333, 'samples': 203904, 'steps': 398, 'loss/train': 5.2167439460754395} -09/20/2021 15:52:05 - INFO - __main__ - Step 6373: {'lr': 0.00010613333333333333, 'samples': 203936, 'steps': 398, 'loss/train': 4.141780853271484} -09/20/2021 15:52:06 - INFO - __main__ - Step 6374: {'lr': 0.00010613333333333333, 'samples': 203968, 'steps': 398, 'loss/train': 5.4655256271362305} -09/20/2021 15:52:06 - INFO - __main__ - Step 6375: {'lr': 0.00010613333333333333, 'samples': 204000, 'steps': 398, 'loss/train': 5.153753757476807} -09/20/2021 15:52:07 - INFO - __main__ - Step 6376: {'lr': 0.00010613333333333333, 'samples': 204032, 'steps': 398, 'loss/train': 4.787028789520264} -09/20/2021 15:52:08 - INFO - __main__ - Step 6377: {'lr': 0.00010613333333333333, 'samples': 204064, 'steps': 398, 'loss/train': 5.862005710601807} -09/20/2021 15:52:09 - INFO - __main__ - Step 6378: {'lr': 0.00010613333333333333, 'samples': 204096, 'steps': 398, 'loss/train': 5.528008460998535} -09/20/2021 15:52:10 - INFO - __main__ - Step 6379: {'lr': 0.00010613333333333333, 'samples': 204128, 'steps': 398, 'loss/train': 4.9887847900390625} -09/20/2021 15:52:11 - INFO - __main__ - Step 6380: {'lr': 0.00010613333333333333, 'samples': 204160, 'steps': 398, 'loss/train': 5.152680397033691} -09/20/2021 15:52:11 - INFO - __main__ - Step 6381: {'lr': 0.00010613333333333333, 'samples': 204192, 'steps': 398, 'loss/train': 3.6932125091552734} -09/20/2021 15:52:12 - INFO - __main__ - Step 6382: {'lr': 0.00010613333333333333, 'samples': 204224, 'steps': 398, 'loss/train': 5.414663314819336} -09/20/2021 15:52:13 - INFO - __main__ - Step 6383: {'lr': 0.00010613333333333333, 'samples': 204256, 'steps': 398, 'loss/train': 4.82857608795166} -09/20/2021 15:52:14 - INFO - __main__ - Step 6384: {'lr': 0.00010613333333333333, 'samples': 204288, 'steps': 398, 'loss/train': 4.868615627288818} -09/20/2021 15:52:15 - INFO - __main__ - Step 6385: {'lr': 0.00010640000000000001, 'samples': 204320, 'steps': 399, 'loss/train': 2.2629761695861816} -09/20/2021 15:52:15 - INFO - __main__ - Step 6386: {'lr': 0.00010640000000000001, 'samples': 204352, 'steps': 399, 'loss/train': 6.394118785858154} -09/20/2021 15:52:16 - INFO - __main__ - Step 6387: {'lr': 0.00010640000000000001, 'samples': 204384, 'steps': 399, 'loss/train': 5.766390800476074} -09/20/2021 15:52:17 - INFO - __main__ - Step 6388: {'lr': 0.00010640000000000001, 'samples': 204416, 'steps': 399, 'loss/train': 5.074295520782471} -09/20/2021 15:52:18 - INFO - __main__ - Step 6389: {'lr': 0.00010640000000000001, 'samples': 204448, 'steps': 399, 'loss/train': 5.438939571380615} -09/20/2021 15:52:18 - INFO - __main__ - Step 6390: {'lr': 0.00010640000000000001, 'samples': 204480, 'steps': 399, 'loss/train': 5.531443119049072} -09/20/2021 15:52:19 - INFO - __main__ - Step 6391: {'lr': 0.00010640000000000001, 'samples': 204512, 'steps': 399, 'loss/train': 4.63358736038208} -09/20/2021 15:52:20 - INFO - __main__ - Step 6392: {'lr': 0.00010640000000000001, 'samples': 204544, 'steps': 399, 'loss/train': 6.148521423339844} -09/20/2021 15:52:21 - INFO - __main__ - Step 6393: {'lr': 0.00010640000000000001, 'samples': 204576, 'steps': 399, 'loss/train': 5.137456893920898} -09/20/2021 15:52:21 - INFO - __main__ - Step 6394: {'lr': 0.00010640000000000001, 'samples': 204608, 'steps': 399, 'loss/train': 4.828500270843506} -09/20/2021 15:52:22 - INFO - __main__ - Step 6395: {'lr': 0.00010640000000000001, 'samples': 204640, 'steps': 399, 'loss/train': 5.039977073669434} -09/20/2021 15:52:23 - INFO - __main__ - Step 6396: {'lr': 0.00010640000000000001, 'samples': 204672, 'steps': 399, 'loss/train': 4.5675153732299805} -09/20/2021 15:52:24 - INFO - __main__ - Step 6397: {'lr': 0.00010640000000000001, 'samples': 204704, 'steps': 399, 'loss/train': 5.0735673904418945} -09/20/2021 15:52:24 - INFO - __main__ - Step 6398: {'lr': 0.00010640000000000001, 'samples': 204736, 'steps': 399, 'loss/train': 4.803854942321777} -09/20/2021 15:52:25 - INFO - __main__ - Step 6399: {'lr': 0.00010640000000000001, 'samples': 204768, 'steps': 399, 'loss/train': 4.026212215423584} -09/20/2021 15:52:26 - INFO - __main__ - Step 6400: {'lr': 0.00010640000000000001, 'samples': 204800, 'steps': 399, 'loss/train': 5.0979437828063965} -09/20/2021 15:52:27 - INFO - __main__ - Step 6401: {'lr': 0.00010666666666666667, 'samples': 204832, 'steps': 400, 'loss/train': 6.051360130310059} -09/20/2021 15:52:27 - INFO - __main__ - Step 6402: {'lr': 0.00010666666666666667, 'samples': 204864, 'steps': 400, 'loss/train': 4.524413108825684} -09/20/2021 15:52:28 - INFO - __main__ - Step 6403: {'lr': 0.00010666666666666667, 'samples': 204896, 'steps': 400, 'loss/train': 3.940487861633301} -09/20/2021 15:52:29 - INFO - __main__ - Step 6404: {'lr': 0.00010666666666666667, 'samples': 204928, 'steps': 400, 'loss/train': 4.171616554260254} -09/20/2021 15:52:30 - INFO - __main__ - Step 6405: {'lr': 0.00010666666666666667, 'samples': 204960, 'steps': 400, 'loss/train': 4.226556777954102} -09/20/2021 15:52:30 - INFO - __main__ - Step 6406: {'lr': 0.00010666666666666667, 'samples': 204992, 'steps': 400, 'loss/train': 5.0221147537231445} -09/20/2021 15:52:32 - INFO - __main__ - Step 6407: {'lr': 0.00010666666666666667, 'samples': 205024, 'steps': 400, 'loss/train': 4.599175453186035} -09/20/2021 15:52:33 - INFO - __main__ - Step 6408: {'lr': 0.00010666666666666667, 'samples': 205056, 'steps': 400, 'loss/train': 5.146554470062256} -09/20/2021 15:52:33 - INFO - __main__ - Step 6409: {'lr': 0.00010666666666666667, 'samples': 205088, 'steps': 400, 'loss/train': 6.61536979675293} -09/20/2021 15:52:34 - INFO - __main__ - Step 6410: {'lr': 0.00010666666666666667, 'samples': 205120, 'steps': 400, 'loss/train': 5.005630016326904} -09/20/2021 15:52:35 - INFO - __main__ - Step 6411: {'lr': 0.00010666666666666667, 'samples': 205152, 'steps': 400, 'loss/train': 5.596896171569824} -09/20/2021 15:52:36 - INFO - __main__ - Step 6412: {'lr': 0.00010666666666666667, 'samples': 205184, 'steps': 400, 'loss/train': 4.946610450744629} -09/20/2021 15:52:36 - INFO - __main__ - Step 6413: {'lr': 0.00010666666666666667, 'samples': 205216, 'steps': 400, 'loss/train': 4.961913108825684} -09/20/2021 15:52:37 - INFO - __main__ - Step 6414: {'lr': 0.00010666666666666667, 'samples': 205248, 'steps': 400, 'loss/train': 5.084519386291504} -09/20/2021 15:52:38 - INFO - __main__ - Step 6415: {'lr': 0.00010666666666666667, 'samples': 205280, 'steps': 400, 'loss/train': 5.578676700592041} -09/20/2021 15:52:39 - INFO - __main__ - Step 6416: {'lr': 0.00010666666666666667, 'samples': 205312, 'steps': 400, 'loss/train': 4.5453386306762695} -09/20/2021 15:52:39 - INFO - __main__ - Step 6417: {'lr': 0.00010693333333333333, 'samples': 205344, 'steps': 401, 'loss/train': 5.084810733795166} -09/20/2021 15:52:40 - INFO - __main__ - Step 6418: {'lr': 0.00010693333333333333, 'samples': 205376, 'steps': 401, 'loss/train': 4.521391868591309} -09/20/2021 15:52:41 - INFO - __main__ - Step 6419: {'lr': 0.00010693333333333333, 'samples': 205408, 'steps': 401, 'loss/train': 5.114582538604736} -09/20/2021 15:52:42 - INFO - __main__ - Step 6420: {'lr': 0.00010693333333333333, 'samples': 205440, 'steps': 401, 'loss/train': 5.991066932678223} -09/20/2021 15:52:42 - INFO - __main__ - Step 6421: {'lr': 0.00010693333333333333, 'samples': 205472, 'steps': 401, 'loss/train': 5.8051629066467285} -09/20/2021 15:52:43 - INFO - __main__ - Step 6422: {'lr': 0.00010693333333333333, 'samples': 205504, 'steps': 401, 'loss/train': 6.876168251037598} -09/20/2021 15:52:44 - INFO - __main__ - Step 6423: {'lr': 0.00010693333333333333, 'samples': 205536, 'steps': 401, 'loss/train': 5.378902912139893} -09/20/2021 15:52:45 - INFO - __main__ - Step 6424: {'lr': 0.00010693333333333333, 'samples': 205568, 'steps': 401, 'loss/train': 5.682559967041016} -09/20/2021 15:52:45 - INFO - __main__ - Step 6425: {'lr': 0.00010693333333333333, 'samples': 205600, 'steps': 401, 'loss/train': 4.3661088943481445} -09/20/2021 15:52:46 - INFO - __main__ - Step 6426: {'lr': 0.00010693333333333333, 'samples': 205632, 'steps': 401, 'loss/train': 4.979681968688965} -09/20/2021 15:52:47 - INFO - __main__ - Step 6427: {'lr': 0.00010693333333333333, 'samples': 205664, 'steps': 401, 'loss/train': 4.840137004852295} -09/20/2021 15:52:48 - INFO - __main__ - Step 6428: {'lr': 0.00010693333333333333, 'samples': 205696, 'steps': 401, 'loss/train': 0.595072865486145} -09/20/2021 15:52:48 - INFO - __main__ - Step 6429: {'lr': 0.00010693333333333333, 'samples': 205728, 'steps': 401, 'loss/train': 2.535289764404297} -09/20/2021 15:52:49 - INFO - __main__ - Step 6430: {'lr': 0.00010693333333333333, 'samples': 205760, 'steps': 401, 'loss/train': 2.503962278366089} -09/20/2021 15:52:50 - INFO - __main__ - Step 6431: {'lr': 0.00010693333333333333, 'samples': 205792, 'steps': 401, 'loss/train': 3.3082661628723145} -09/20/2021 15:52:51 - INFO - __main__ - Step 6432: {'lr': 0.00010693333333333333, 'samples': 205824, 'steps': 401, 'loss/train': 5.239477634429932} -09/20/2021 15:52:52 - INFO - __main__ - Step 6433: {'lr': 0.00010720000000000002, 'samples': 205856, 'steps': 402, 'loss/train': 5.098870754241943} -09/20/2021 15:52:52 - INFO - __main__ - Step 6434: {'lr': 0.00010720000000000002, 'samples': 205888, 'steps': 402, 'loss/train': 4.812989711761475} -09/20/2021 15:52:53 - INFO - __main__ - Step 6435: {'lr': 0.00010720000000000002, 'samples': 205920, 'steps': 402, 'loss/train': 4.976877689361572} -09/20/2021 15:52:54 - INFO - __main__ - Step 6436: {'lr': 0.00010720000000000002, 'samples': 205952, 'steps': 402, 'loss/train': 2.0965781211853027} -09/20/2021 15:52:55 - INFO - __main__ - Step 6437: {'lr': 0.00010720000000000002, 'samples': 205984, 'steps': 402, 'loss/train': 2.609896659851074} -09/20/2021 15:52:56 - INFO - __main__ - Step 6438: {'lr': 0.00010720000000000002, 'samples': 206016, 'steps': 402, 'loss/train': 2.577000856399536} -09/20/2021 15:52:57 - INFO - __main__ - Step 6439: {'lr': 0.00010720000000000002, 'samples': 206048, 'steps': 402, 'loss/train': 4.494433879852295} -09/20/2021 15:52:57 - INFO - __main__ - Step 6440: {'lr': 0.00010720000000000002, 'samples': 206080, 'steps': 402, 'loss/train': 5.1631388664245605} -09/20/2021 15:52:58 - INFO - __main__ - Step 6441: {'lr': 0.00010720000000000002, 'samples': 206112, 'steps': 402, 'loss/train': 5.3799638748168945} -09/20/2021 15:52:59 - INFO - __main__ - Step 6442: {'lr': 0.00010720000000000002, 'samples': 206144, 'steps': 402, 'loss/train': 5.509840965270996} -09/20/2021 15:53:00 - INFO - __main__ - Step 6443: {'lr': 0.00010720000000000002, 'samples': 206176, 'steps': 402, 'loss/train': 4.7045745849609375} -09/20/2021 15:53:00 - INFO - __main__ - Step 6444: {'lr': 0.00010720000000000002, 'samples': 206208, 'steps': 402, 'loss/train': 5.26876163482666} -09/20/2021 15:53:01 - INFO - __main__ - Step 6445: {'lr': 0.00010720000000000002, 'samples': 206240, 'steps': 402, 'loss/train': 4.710333347320557} -09/20/2021 15:53:02 - INFO - __main__ - Step 6446: {'lr': 0.00010720000000000002, 'samples': 206272, 'steps': 402, 'loss/train': 5.445194244384766} -09/20/2021 15:53:03 - INFO - __main__ - Step 6447: {'lr': 0.00010720000000000002, 'samples': 206304, 'steps': 402, 'loss/train': 5.51575231552124} -09/20/2021 15:53:03 - INFO - __main__ - Step 6448: {'lr': 0.00010720000000000002, 'samples': 206336, 'steps': 402, 'loss/train': 4.61784553527832} -09/20/2021 15:53:04 - INFO - __main__ - Step 6449: {'lr': 0.00010746666666666667, 'samples': 206368, 'steps': 403, 'loss/train': 5.790551662445068} -09/20/2021 15:53:05 - INFO - __main__ - Step 6450: {'lr': 0.00010746666666666667, 'samples': 206400, 'steps': 403, 'loss/train': 3.5542185306549072} -09/20/2021 15:53:06 - INFO - __main__ - Step 6451: {'lr': 0.00010746666666666667, 'samples': 206432, 'steps': 403, 'loss/train': 4.579967498779297} -09/20/2021 15:53:06 - INFO - __main__ - Step 6452: {'lr': 0.00010746666666666667, 'samples': 206464, 'steps': 403, 'loss/train': 4.422189712524414} -09/20/2021 15:53:07 - INFO - __main__ - Step 6453: {'lr': 0.00010746666666666667, 'samples': 206496, 'steps': 403, 'loss/train': 4.816019058227539} -09/20/2021 15:53:08 - INFO - __main__ - Step 6454: {'lr': 0.00010746666666666667, 'samples': 206528, 'steps': 403, 'loss/train': 4.7611002922058105} -09/20/2021 15:53:09 - INFO - __main__ - Step 6455: {'lr': 0.00010746666666666667, 'samples': 206560, 'steps': 403, 'loss/train': 4.342095851898193} -09/20/2021 15:53:09 - INFO - __main__ - Step 6456: {'lr': 0.00010746666666666667, 'samples': 206592, 'steps': 403, 'loss/train': 5.293024063110352} -09/20/2021 15:53:10 - INFO - __main__ - Step 6457: {'lr': 0.00010746666666666667, 'samples': 206624, 'steps': 403, 'loss/train': 4.570538520812988} -09/20/2021 15:53:11 - INFO - __main__ - Step 6458: {'lr': 0.00010746666666666667, 'samples': 206656, 'steps': 403, 'loss/train': 5.097640037536621} -09/20/2021 15:53:12 - INFO - __main__ - Step 6459: {'lr': 0.00010746666666666667, 'samples': 206688, 'steps': 403, 'loss/train': 5.015421390533447} -09/20/2021 15:53:12 - INFO - __main__ - Step 6460: {'lr': 0.00010746666666666667, 'samples': 206720, 'steps': 403, 'loss/train': 6.400839328765869} -09/20/2021 15:53:13 - INFO - __main__ - Step 6461: {'lr': 0.00010746666666666667, 'samples': 206752, 'steps': 403, 'loss/train': 6.07536506652832} -09/20/2021 15:53:14 - INFO - __main__ - Step 6462: {'lr': 0.00010746666666666667, 'samples': 206784, 'steps': 403, 'loss/train': 4.8806962966918945} -09/20/2021 15:53:15 - INFO - __main__ - Step 6463: {'lr': 0.00010746666666666667, 'samples': 206816, 'steps': 403, 'loss/train': 5.2104058265686035} -09/20/2021 15:53:15 - INFO - __main__ - Step 6464: {'lr': 0.00010746666666666667, 'samples': 206848, 'steps': 403, 'loss/train': 3.8066530227661133} -09/20/2021 15:53:16 - INFO - __main__ - Step 6465: {'lr': 0.00010773333333333333, 'samples': 206880, 'steps': 404, 'loss/train': 5.82191801071167} -09/20/2021 15:53:17 - INFO - __main__ - Step 6466: {'lr': 0.00010773333333333333, 'samples': 206912, 'steps': 404, 'loss/train': 5.786263465881348} -09/20/2021 15:53:18 - INFO - __main__ - Step 6467: {'lr': 0.00010773333333333333, 'samples': 206944, 'steps': 404, 'loss/train': 5.989168167114258} -09/20/2021 15:53:19 - INFO - __main__ - Step 6468: {'lr': 0.00010773333333333333, 'samples': 206976, 'steps': 404, 'loss/train': 4.962606906890869} -09/20/2021 15:53:20 - INFO - __main__ - Step 6469: {'lr': 0.00010773333333333333, 'samples': 207008, 'steps': 404, 'loss/train': 5.501187324523926} -09/20/2021 15:53:21 - INFO - __main__ - Step 6470: {'lr': 0.00010773333333333333, 'samples': 207040, 'steps': 404, 'loss/train': 5.029437065124512} -09/20/2021 15:53:21 - INFO - __main__ - Step 6471: {'lr': 0.00010773333333333333, 'samples': 207072, 'steps': 404, 'loss/train': 5.12761926651001} -09/20/2021 15:53:22 - INFO - __main__ - Step 6472: {'lr': 0.00010773333333333333, 'samples': 207104, 'steps': 404, 'loss/train': 5.624192714691162} -09/20/2021 15:53:23 - INFO - __main__ - Step 6473: {'lr': 0.00010773333333333333, 'samples': 207136, 'steps': 404, 'loss/train': 5.355924606323242} -09/20/2021 15:53:24 - INFO - __main__ - Step 6474: {'lr': 0.00010773333333333333, 'samples': 207168, 'steps': 404, 'loss/train': 5.081484317779541} -09/20/2021 15:53:24 - INFO - __main__ - Step 6475: {'lr': 0.00010773333333333333, 'samples': 207200, 'steps': 404, 'loss/train': 5.373753070831299} -09/20/2021 15:53:25 - INFO - __main__ - Step 6476: {'lr': 0.00010773333333333333, 'samples': 207232, 'steps': 404, 'loss/train': 5.096464157104492} -09/20/2021 15:53:26 - INFO - __main__ - Step 6477: {'lr': 0.00010773333333333333, 'samples': 207264, 'steps': 404, 'loss/train': 4.569275856018066} -09/20/2021 15:53:27 - INFO - __main__ - Step 6478: {'lr': 0.00010773333333333333, 'samples': 207296, 'steps': 404, 'loss/train': 5.079554080963135} -09/20/2021 15:53:27 - INFO - __main__ - Step 6479: {'lr': 0.00010773333333333333, 'samples': 207328, 'steps': 404, 'loss/train': 5.151605129241943} -09/20/2021 15:53:28 - INFO - __main__ - Step 6480: {'lr': 0.00010773333333333333, 'samples': 207360, 'steps': 404, 'loss/train': 5.3397440910339355} -09/20/2021 15:53:29 - INFO - __main__ - Step 6481: {'lr': 0.00010800000000000001, 'samples': 207392, 'steps': 405, 'loss/train': 5.098344326019287} -09/20/2021 15:53:30 - INFO - __main__ - Step 6482: {'lr': 0.00010800000000000001, 'samples': 207424, 'steps': 405, 'loss/train': 5.9224138259887695} -09/20/2021 15:53:31 - INFO - __main__ - Step 6483: {'lr': 0.00010800000000000001, 'samples': 207456, 'steps': 405, 'loss/train': 5.134453773498535} -09/20/2021 15:53:31 - INFO - __main__ - Step 6484: {'lr': 0.00010800000000000001, 'samples': 207488, 'steps': 405, 'loss/train': 4.396368980407715} -09/20/2021 15:53:32 - INFO - __main__ - Step 6485: {'lr': 0.00010800000000000001, 'samples': 207520, 'steps': 405, 'loss/train': 5.106194019317627} -09/20/2021 15:53:33 - INFO - __main__ - Step 6486: {'lr': 0.00010800000000000001, 'samples': 207552, 'steps': 405, 'loss/train': 5.740379333496094} -09/20/2021 15:53:34 - INFO - __main__ - Step 6487: {'lr': 0.00010800000000000001, 'samples': 207584, 'steps': 405, 'loss/train': 5.0180888175964355} -09/20/2021 15:53:34 - INFO - __main__ - Step 6488: {'lr': 0.00010800000000000001, 'samples': 207616, 'steps': 405, 'loss/train': 5.7042412757873535} -09/20/2021 15:53:35 - INFO - __main__ - Step 6489: {'lr': 0.00010800000000000001, 'samples': 207648, 'steps': 405, 'loss/train': 4.915680885314941} -09/20/2021 15:53:36 - INFO - __main__ - Step 6490: {'lr': 0.00010800000000000001, 'samples': 207680, 'steps': 405, 'loss/train': 5.368072509765625} -09/20/2021 15:53:37 - INFO - __main__ - Step 6491: {'lr': 0.00010800000000000001, 'samples': 207712, 'steps': 405, 'loss/train': 5.893815994262695} -09/20/2021 15:53:37 - INFO - __main__ - Step 6492: {'lr': 0.00010800000000000001, 'samples': 207744, 'steps': 405, 'loss/train': 5.183209419250488} -09/20/2021 15:53:38 - INFO - __main__ - Step 6493: {'lr': 0.00010800000000000001, 'samples': 207776, 'steps': 405, 'loss/train': 4.995182037353516} -09/20/2021 15:53:39 - INFO - __main__ - Step 6494: {'lr': 0.00010800000000000001, 'samples': 207808, 'steps': 405, 'loss/train': 5.564706325531006} -09/20/2021 15:53:40 - INFO - __main__ - Step 6495: {'lr': 0.00010800000000000001, 'samples': 207840, 'steps': 405, 'loss/train': 4.588360786437988} -09/20/2021 15:53:40 - INFO - __main__ - Step 6496: {'lr': 0.00010800000000000001, 'samples': 207872, 'steps': 405, 'loss/train': 6.861678123474121} -09/20/2021 15:53:41 - INFO - __main__ - Step 6497: {'lr': 0.00010826666666666668, 'samples': 207904, 'steps': 406, 'loss/train': 4.30963134765625} -09/20/2021 15:53:42 - INFO - __main__ - Step 6498: {'lr': 0.00010826666666666668, 'samples': 207936, 'steps': 406, 'loss/train': 5.684950828552246} -09/20/2021 15:53:43 - INFO - __main__ - Step 6499: {'lr': 0.00010826666666666668, 'samples': 207968, 'steps': 406, 'loss/train': 5.421882152557373} -09/20/2021 15:53:44 - INFO - __main__ - Step 6500: {'lr': 0.00010826666666666668, 'samples': 208000, 'steps': 406, 'loss/train': 4.861454963684082} -09/20/2021 15:53:45 - INFO - __main__ - Step 6501: {'lr': 0.00010826666666666668, 'samples': 208032, 'steps': 406, 'loss/train': 4.42271089553833} -09/20/2021 15:53:46 - INFO - __main__ - Step 6502: {'lr': 0.00010826666666666668, 'samples': 208064, 'steps': 406, 'loss/train': 6.293734073638916} -09/20/2021 15:53:46 - INFO - __main__ - Step 6503: {'lr': 0.00010826666666666668, 'samples': 208096, 'steps': 406, 'loss/train': 5.1356329917907715} -09/20/2021 15:53:47 - INFO - __main__ - Step 6504: {'lr': 0.00010826666666666668, 'samples': 208128, 'steps': 406, 'loss/train': 4.788565635681152} -09/20/2021 15:53:48 - INFO - __main__ - Step 6505: {'lr': 0.00010826666666666668, 'samples': 208160, 'steps': 406, 'loss/train': 2.8208529949188232} -09/20/2021 15:53:49 - INFO - __main__ - Step 6506: {'lr': 0.00010826666666666668, 'samples': 208192, 'steps': 406, 'loss/train': 5.0316386222839355} -09/20/2021 15:53:49 - INFO - __main__ - Step 6507: {'lr': 0.00010826666666666668, 'samples': 208224, 'steps': 406, 'loss/train': 2.187880516052246} -09/20/2021 15:53:50 - INFO - __main__ - Step 6508: {'lr': 0.00010826666666666668, 'samples': 208256, 'steps': 406, 'loss/train': 2.7476143836975098} -09/20/2021 15:53:51 - INFO - __main__ - Step 6509: {'lr': 0.00010826666666666668, 'samples': 208288, 'steps': 406, 'loss/train': 2.4375152587890625} -09/20/2021 15:53:52 - INFO - __main__ - Step 6510: {'lr': 0.00010826666666666668, 'samples': 208320, 'steps': 406, 'loss/train': 4.601317405700684} -09/20/2021 15:53:52 - INFO - __main__ - Step 6511: {'lr': 0.00010826666666666668, 'samples': 208352, 'steps': 406, 'loss/train': 4.986715793609619} -09/20/2021 15:53:53 - INFO - __main__ - Step 6512: {'lr': 0.00010826666666666668, 'samples': 208384, 'steps': 406, 'loss/train': 4.708186626434326} -09/20/2021 15:53:54 - INFO - __main__ - Step 6513: {'lr': 0.00010853333333333333, 'samples': 208416, 'steps': 407, 'loss/train': 5.493370056152344} -09/20/2021 15:53:55 - INFO - __main__ - Step 6514: {'lr': 0.00010853333333333333, 'samples': 208448, 'steps': 407, 'loss/train': 4.648984432220459} -09/20/2021 15:53:55 - INFO - __main__ - Step 6515: {'lr': 0.00010853333333333333, 'samples': 208480, 'steps': 407, 'loss/train': 5.483673572540283} -09/20/2021 15:53:56 - INFO - __main__ - Step 6516: {'lr': 0.00010853333333333333, 'samples': 208512, 'steps': 407, 'loss/train': 5.449950218200684} -09/20/2021 15:53:57 - INFO - __main__ - Step 6517: {'lr': 0.00010853333333333333, 'samples': 208544, 'steps': 407, 'loss/train': 5.599679946899414} -09/20/2021 15:53:58 - INFO - __main__ - Step 6518: {'lr': 0.00010853333333333333, 'samples': 208576, 'steps': 407, 'loss/train': 5.790879249572754} -09/20/2021 15:53:58 - INFO - __main__ - Step 6519: {'lr': 0.00010853333333333333, 'samples': 208608, 'steps': 407, 'loss/train': 6.424349308013916} -09/20/2021 15:53:59 - INFO - __main__ - Step 6520: {'lr': 0.00010853333333333333, 'samples': 208640, 'steps': 407, 'loss/train': 4.835176467895508} -09/20/2021 15:54:00 - INFO - __main__ - Step 6521: {'lr': 0.00010853333333333333, 'samples': 208672, 'steps': 407, 'loss/train': 4.907838821411133} -09/20/2021 15:54:01 - INFO - __main__ - Step 6522: {'lr': 0.00010853333333333333, 'samples': 208704, 'steps': 407, 'loss/train': 2.9297842979431152} -09/20/2021 15:54:01 - INFO - __main__ - Step 6523: {'lr': 0.00010853333333333333, 'samples': 208736, 'steps': 407, 'loss/train': 4.899796962738037} -09/20/2021 15:54:02 - INFO - __main__ - Step 6524: {'lr': 0.00010853333333333333, 'samples': 208768, 'steps': 407, 'loss/train': 6.299516201019287} -09/20/2021 15:54:03 - INFO - __main__ - Step 6525: {'lr': 0.00010853333333333333, 'samples': 208800, 'steps': 407, 'loss/train': 4.4461493492126465} -09/20/2021 15:54:04 - INFO - __main__ - Step 6526: {'lr': 0.00010853333333333333, 'samples': 208832, 'steps': 407, 'loss/train': 2.8803231716156006} -09/20/2021 15:54:04 - INFO - __main__ - Step 6527: {'lr': 0.00010853333333333333, 'samples': 208864, 'steps': 407, 'loss/train': 1.8633601665496826} -09/20/2021 15:54:05 - INFO - __main__ - Step 6528: {'lr': 0.00010853333333333333, 'samples': 208896, 'steps': 407, 'loss/train': 5.524704933166504} -09/20/2021 15:54:06 - INFO - __main__ - Step 6529: {'lr': 0.00010880000000000002, 'samples': 208928, 'steps': 408, 'loss/train': 5.88223123550415} -09/20/2021 15:54:07 - INFO - __main__ - Step 6530: {'lr': 0.00010880000000000002, 'samples': 208960, 'steps': 408, 'loss/train': 5.500226974487305} -09/20/2021 15:54:09 - INFO - __main__ - Step 6531: {'lr': 0.00010880000000000002, 'samples': 208992, 'steps': 408, 'loss/train': 5.055667400360107} -09/20/2021 15:54:09 - INFO - __main__ - Step 6532: {'lr': 0.00010880000000000002, 'samples': 209024, 'steps': 408, 'loss/train': 5.6848344802856445} -09/20/2021 15:54:10 - INFO - __main__ - Step 6533: {'lr': 0.00010880000000000002, 'samples': 209056, 'steps': 408, 'loss/train': 5.379434585571289} -09/20/2021 15:54:11 - INFO - __main__ - Step 6534: {'lr': 0.00010880000000000002, 'samples': 209088, 'steps': 408, 'loss/train': 5.1803388595581055} -09/20/2021 15:54:12 - INFO - __main__ - Step 6535: {'lr': 0.00010880000000000002, 'samples': 209120, 'steps': 408, 'loss/train': 4.762481212615967} -09/20/2021 15:54:12 - INFO - __main__ - Step 6536: {'lr': 0.00010880000000000002, 'samples': 209152, 'steps': 408, 'loss/train': 5.67367696762085} -09/20/2021 15:54:13 - INFO - __main__ - Step 6537: {'lr': 0.00010880000000000002, 'samples': 209184, 'steps': 408, 'loss/train': 4.276095867156982} -09/20/2021 15:54:14 - INFO - __main__ - Step 6538: {'lr': 0.00010880000000000002, 'samples': 209216, 'steps': 408, 'loss/train': 5.318968296051025} -09/20/2021 15:54:15 - INFO - __main__ - Step 6539: {'lr': 0.00010880000000000002, 'samples': 209248, 'steps': 408, 'loss/train': 4.995871543884277} -09/20/2021 15:54:15 - INFO - __main__ - Step 6540: {'lr': 0.00010880000000000002, 'samples': 209280, 'steps': 408, 'loss/train': 5.260360240936279} -09/20/2021 15:54:16 - INFO - __main__ - Step 6541: {'lr': 0.00010880000000000002, 'samples': 209312, 'steps': 408, 'loss/train': 5.065194129943848} -09/20/2021 15:54:17 - INFO - __main__ - Step 6542: {'lr': 0.00010880000000000002, 'samples': 209344, 'steps': 408, 'loss/train': 5.55816125869751} -09/20/2021 15:54:18 - INFO - __main__ - Step 6543: {'lr': 0.00010880000000000002, 'samples': 209376, 'steps': 408, 'loss/train': 5.0273847579956055} -09/20/2021 15:54:18 - INFO - __main__ - Step 6544: {'lr': 0.00010880000000000002, 'samples': 209408, 'steps': 408, 'loss/train': 4.945597171783447} -09/20/2021 15:54:19 - INFO - __main__ - Step 6545: {'lr': 0.00010906666666666667, 'samples': 209440, 'steps': 409, 'loss/train': 5.399755954742432} -09/20/2021 15:54:20 - INFO - __main__ - Step 6546: {'lr': 0.00010906666666666667, 'samples': 209472, 'steps': 409, 'loss/train': 4.326019763946533} -09/20/2021 15:54:21 - INFO - __main__ - Step 6547: {'lr': 0.00010906666666666667, 'samples': 209504, 'steps': 409, 'loss/train': 5.572659492492676} -09/20/2021 15:54:22 - INFO - __main__ - Step 6548: {'lr': 0.00010906666666666667, 'samples': 209536, 'steps': 409, 'loss/train': 4.749759674072266} -09/20/2021 15:54:22 - INFO - __main__ - Step 6549: {'lr': 0.00010906666666666667, 'samples': 209568, 'steps': 409, 'loss/train': 5.1258063316345215} -09/20/2021 15:54:23 - INFO - __main__ - Step 6550: {'lr': 0.00010906666666666667, 'samples': 209600, 'steps': 409, 'loss/train': 4.666409969329834} -09/20/2021 15:54:24 - INFO - __main__ - Step 6551: {'lr': 0.00010906666666666667, 'samples': 209632, 'steps': 409, 'loss/train': 4.775618076324463} -09/20/2021 15:54:25 - INFO - __main__ - Step 6552: {'lr': 0.00010906666666666667, 'samples': 209664, 'steps': 409, 'loss/train': 5.501824378967285} -09/20/2021 15:54:25 - INFO - __main__ - Step 6553: {'lr': 0.00010906666666666667, 'samples': 209696, 'steps': 409, 'loss/train': 5.974086284637451} -09/20/2021 15:54:26 - INFO - __main__ - Step 6554: {'lr': 0.00010906666666666667, 'samples': 209728, 'steps': 409, 'loss/train': 4.756568908691406} -09/20/2021 15:54:27 - INFO - __main__ - Step 6555: {'lr': 0.00010906666666666667, 'samples': 209760, 'steps': 409, 'loss/train': 5.286856174468994} -09/20/2021 15:54:28 - INFO - __main__ - Step 6556: {'lr': 0.00010906666666666667, 'samples': 209792, 'steps': 409, 'loss/train': 4.491393566131592} -09/20/2021 15:54:28 - INFO - __main__ - Step 6557: {'lr': 0.00010906666666666667, 'samples': 209824, 'steps': 409, 'loss/train': 4.698129177093506} -09/20/2021 15:54:29 - INFO - __main__ - Step 6558: {'lr': 0.00010906666666666667, 'samples': 209856, 'steps': 409, 'loss/train': 5.971731185913086} -09/20/2021 15:54:30 - INFO - __main__ - Step 6559: {'lr': 0.00010906666666666667, 'samples': 209888, 'steps': 409, 'loss/train': 4.95283842086792} -09/20/2021 15:54:31 - INFO - __main__ - Step 6560: {'lr': 0.00010906666666666667, 'samples': 209920, 'steps': 409, 'loss/train': 4.654728889465332} -09/20/2021 15:54:32 - INFO - __main__ - Step 6561: {'lr': 0.00010933333333333333, 'samples': 209952, 'steps': 410, 'loss/train': 4.931030750274658} -09/20/2021 15:54:33 - INFO - __main__ - Step 6562: {'lr': 0.00010933333333333333, 'samples': 209984, 'steps': 410, 'loss/train': 5.732258319854736} -09/20/2021 15:54:33 - INFO - __main__ - Step 6563: {'lr': 0.00010933333333333333, 'samples': 210016, 'steps': 410, 'loss/train': 4.749716758728027} -09/20/2021 15:54:34 - INFO - __main__ - Step 6564: {'lr': 0.00010933333333333333, 'samples': 210048, 'steps': 410, 'loss/train': 5.079720973968506} -09/20/2021 15:54:35 - INFO - __main__ - Step 6565: {'lr': 0.00010933333333333333, 'samples': 210080, 'steps': 410, 'loss/train': 5.2320237159729} -09/20/2021 15:54:36 - INFO - __main__ - Step 6566: {'lr': 0.00010933333333333333, 'samples': 210112, 'steps': 410, 'loss/train': 4.7926154136657715} -09/20/2021 15:54:36 - INFO - __main__ - Step 6567: {'lr': 0.00010933333333333333, 'samples': 210144, 'steps': 410, 'loss/train': 5.207075119018555} -09/20/2021 15:54:37 - INFO - __main__ - Step 6568: {'lr': 0.00010933333333333333, 'samples': 210176, 'steps': 410, 'loss/train': 4.979766845703125} -09/20/2021 15:54:38 - INFO - __main__ - Step 6569: {'lr': 0.00010933333333333333, 'samples': 210208, 'steps': 410, 'loss/train': 4.456409931182861} -09/20/2021 15:54:39 - INFO - __main__ - Step 6570: {'lr': 0.00010933333333333333, 'samples': 210240, 'steps': 410, 'loss/train': 4.979555130004883} -09/20/2021 15:54:39 - INFO - __main__ - Step 6571: {'lr': 0.00010933333333333333, 'samples': 210272, 'steps': 410, 'loss/train': 4.971851348876953} -09/20/2021 15:54:40 - INFO - __main__ - Step 6572: {'lr': 0.00010933333333333333, 'samples': 210304, 'steps': 410, 'loss/train': 4.666993141174316} -09/20/2021 15:54:41 - INFO - __main__ - Step 6573: {'lr': 0.00010933333333333333, 'samples': 210336, 'steps': 410, 'loss/train': 5.884000778198242} -09/20/2021 15:54:42 - INFO - __main__ - Step 6574: {'lr': 0.00010933333333333333, 'samples': 210368, 'steps': 410, 'loss/train': 5.040315628051758} -09/20/2021 15:54:42 - INFO - __main__ - Step 6575: {'lr': 0.00010933333333333333, 'samples': 210400, 'steps': 410, 'loss/train': 5.29665470123291} -09/20/2021 15:54:43 - INFO - __main__ - Step 6576: {'lr': 0.00010933333333333333, 'samples': 210432, 'steps': 410, 'loss/train': 4.295209884643555} -09/20/2021 15:54:44 - INFO - __main__ - Step 6577: {'lr': 0.00010960000000000001, 'samples': 210464, 'steps': 411, 'loss/train': 5.452447414398193} -09/20/2021 15:54:45 - INFO - __main__ - Step 6578: {'lr': 0.00010960000000000001, 'samples': 210496, 'steps': 411, 'loss/train': 5.093515872955322} -09/20/2021 15:54:46 - INFO - __main__ - Step 6579: {'lr': 0.00010960000000000001, 'samples': 210528, 'steps': 411, 'loss/train': 5.333983898162842} -09/20/2021 15:54:46 - INFO - __main__ - Step 6580: {'lr': 0.00010960000000000001, 'samples': 210560, 'steps': 411, 'loss/train': 5.213863372802734} -09/20/2021 15:54:47 - INFO - __main__ - Step 6581: {'lr': 0.00010960000000000001, 'samples': 210592, 'steps': 411, 'loss/train': 4.604071140289307} -09/20/2021 15:54:48 - INFO - __main__ - Step 6582: {'lr': 0.00010960000000000001, 'samples': 210624, 'steps': 411, 'loss/train': 3.1099581718444824} -09/20/2021 15:54:49 - INFO - __main__ - Step 6583: {'lr': 0.00010960000000000001, 'samples': 210656, 'steps': 411, 'loss/train': 4.686581611633301} -09/20/2021 15:54:49 - INFO - __main__ - Step 6584: {'lr': 0.00010960000000000001, 'samples': 210688, 'steps': 411, 'loss/train': 5.5453314781188965} -09/20/2021 15:54:50 - INFO - __main__ - Step 6585: {'lr': 0.00010960000000000001, 'samples': 210720, 'steps': 411, 'loss/train': 5.887656211853027} -09/20/2021 15:54:51 - INFO - __main__ - Step 6586: {'lr': 0.00010960000000000001, 'samples': 210752, 'steps': 411, 'loss/train': 4.890100002288818} -09/20/2021 15:54:52 - INFO - __main__ - Step 6587: {'lr': 0.00010960000000000001, 'samples': 210784, 'steps': 411, 'loss/train': 4.246721267700195} -09/20/2021 15:54:52 - INFO - __main__ - Step 6588: {'lr': 0.00010960000000000001, 'samples': 210816, 'steps': 411, 'loss/train': 4.416571140289307} -09/20/2021 15:54:53 - INFO - __main__ - Step 6589: {'lr': 0.00010960000000000001, 'samples': 210848, 'steps': 411, 'loss/train': 4.764012336730957} -09/20/2021 15:54:54 - INFO - __main__ - Step 6590: {'lr': 0.00010960000000000001, 'samples': 210880, 'steps': 411, 'loss/train': 3.3443496227264404} -09/20/2021 15:54:55 - INFO - __main__ - Step 6591: {'lr': 0.00010960000000000001, 'samples': 210912, 'steps': 411, 'loss/train': 4.633081912994385} -09/20/2021 15:54:56 - INFO - __main__ - Step 6592: {'lr': 0.00010960000000000001, 'samples': 210944, 'steps': 411, 'loss/train': 5.289555549621582} -09/20/2021 15:54:57 - INFO - __main__ - Step 6593: {'lr': 0.00010986666666666668, 'samples': 210976, 'steps': 412, 'loss/train': 4.159301280975342} -09/20/2021 15:54:58 - INFO - __main__ - Step 6594: {'lr': 0.00010986666666666668, 'samples': 211008, 'steps': 412, 'loss/train': 4.973498821258545} -09/20/2021 15:54:58 - INFO - __main__ - Step 6595: {'lr': 0.00010986666666666668, 'samples': 211040, 'steps': 412, 'loss/train': 5.588534832000732} -09/20/2021 15:54:59 - INFO - __main__ - Step 6596: {'lr': 0.00010986666666666668, 'samples': 211072, 'steps': 412, 'loss/train': 4.973855972290039} -09/20/2021 15:55:00 - INFO - __main__ - Step 6597: {'lr': 0.00010986666666666668, 'samples': 211104, 'steps': 412, 'loss/train': 5.54953670501709} -09/20/2021 15:55:01 - INFO - __main__ - Step 6598: {'lr': 0.00010986666666666668, 'samples': 211136, 'steps': 412, 'loss/train': 5.154092311859131} -09/20/2021 15:55:01 - INFO - __main__ - Step 6599: {'lr': 0.00010986666666666668, 'samples': 211168, 'steps': 412, 'loss/train': 4.632680416107178} -09/20/2021 15:55:02 - INFO - __main__ - Step 6600: {'lr': 0.00010986666666666668, 'samples': 211200, 'steps': 412, 'loss/train': 5.035826683044434} -09/20/2021 15:55:03 - INFO - __main__ - Step 6601: {'lr': 0.00010986666666666668, 'samples': 211232, 'steps': 412, 'loss/train': 4.914887428283691} -09/20/2021 15:55:04 - INFO - __main__ - Step 6602: {'lr': 0.00010986666666666668, 'samples': 211264, 'steps': 412, 'loss/train': 4.895543098449707} -09/20/2021 15:55:04 - INFO - __main__ - Step 6603: {'lr': 0.00010986666666666668, 'samples': 211296, 'steps': 412, 'loss/train': 4.800352096557617} -09/20/2021 15:55:05 - INFO - __main__ - Step 6604: {'lr': 0.00010986666666666668, 'samples': 211328, 'steps': 412, 'loss/train': 5.881603717803955} -09/20/2021 15:55:06 - INFO - __main__ - Step 6605: {'lr': 0.00010986666666666668, 'samples': 211360, 'steps': 412, 'loss/train': 5.743620872497559} -09/20/2021 15:55:07 - INFO - __main__ - Step 6606: {'lr': 0.00010986666666666668, 'samples': 211392, 'steps': 412, 'loss/train': 5.656296253204346} -09/20/2021 15:55:07 - INFO - __main__ - Step 6607: {'lr': 0.00010986666666666668, 'samples': 211424, 'steps': 412, 'loss/train': 4.616331577301025} -09/20/2021 15:55:08 - INFO - __main__ - Step 6608: {'lr': 0.00010986666666666668, 'samples': 211456, 'steps': 412, 'loss/train': 6.575959205627441} -09/20/2021 15:55:09 - INFO - __main__ - Step 6609: {'lr': 0.00011013333333333333, 'samples': 211488, 'steps': 413, 'loss/train': 5.27940559387207} -09/20/2021 15:55:10 - INFO - __main__ - Step 6610: {'lr': 0.00011013333333333333, 'samples': 211520, 'steps': 413, 'loss/train': 5.677916049957275} -09/20/2021 15:55:11 - INFO - __main__ - Step 6611: {'lr': 0.00011013333333333333, 'samples': 211552, 'steps': 413, 'loss/train': 5.0995378494262695} -09/20/2021 15:55:11 - INFO - __main__ - Step 6612: {'lr': 0.00011013333333333333, 'samples': 211584, 'steps': 413, 'loss/train': 5.332212448120117} -09/20/2021 15:55:12 - INFO - __main__ - Step 6613: {'lr': 0.00011013333333333333, 'samples': 211616, 'steps': 413, 'loss/train': 4.448111534118652} -09/20/2021 15:55:13 - INFO - __main__ - Step 6614: {'lr': 0.00011013333333333333, 'samples': 211648, 'steps': 413, 'loss/train': 4.33376407623291} -09/20/2021 15:55:14 - INFO - __main__ - Step 6615: {'lr': 0.00011013333333333333, 'samples': 211680, 'steps': 413, 'loss/train': 4.8604936599731445} -09/20/2021 15:55:14 - INFO - __main__ - Step 6616: {'lr': 0.00011013333333333333, 'samples': 211712, 'steps': 413, 'loss/train': 5.506651878356934} -09/20/2021 15:55:15 - INFO - __main__ - Step 6617: {'lr': 0.00011013333333333333, 'samples': 211744, 'steps': 413, 'loss/train': 6.395086765289307} -09/20/2021 15:55:16 - INFO - __main__ - Step 6618: {'lr': 0.00011013333333333333, 'samples': 211776, 'steps': 413, 'loss/train': 6.531789779663086} -09/20/2021 15:55:17 - INFO - __main__ - Step 6619: {'lr': 0.00011013333333333333, 'samples': 211808, 'steps': 413, 'loss/train': 6.399831771850586} -09/20/2021 15:55:17 - INFO - __main__ - Step 6620: {'lr': 0.00011013333333333333, 'samples': 211840, 'steps': 413, 'loss/train': 6.443670749664307} -09/20/2021 15:55:18 - INFO - __main__ - Step 6621: {'lr': 0.00011013333333333333, 'samples': 211872, 'steps': 413, 'loss/train': 6.586544036865234} -09/20/2021 15:55:19 - INFO - __main__ - Step 6622: {'lr': 0.00011013333333333333, 'samples': 211904, 'steps': 413, 'loss/train': 5.040977954864502} -09/20/2021 15:55:20 - INFO - __main__ - Step 6623: {'lr': 0.00011013333333333333, 'samples': 211936, 'steps': 413, 'loss/train': 4.275781154632568} -09/20/2021 15:55:21 - INFO - __main__ - Step 6624: {'lr': 0.00011013333333333333, 'samples': 211968, 'steps': 413, 'loss/train': 4.124597072601318} -09/20/2021 15:55:22 - INFO - __main__ - Step 6625: {'lr': 0.00011040000000000001, 'samples': 212000, 'steps': 414, 'loss/train': 4.614504337310791} -09/20/2021 15:55:23 - INFO - __main__ - Step 6626: {'lr': 0.00011040000000000001, 'samples': 212032, 'steps': 414, 'loss/train': 5.088083267211914} -09/20/2021 15:55:23 - INFO - __main__ - Step 6627: {'lr': 0.00011040000000000001, 'samples': 212064, 'steps': 414, 'loss/train': 5.388031482696533} -09/20/2021 15:55:24 - INFO - __main__ - Step 6628: {'lr': 0.00011040000000000001, 'samples': 212096, 'steps': 414, 'loss/train': 4.380010604858398} -09/20/2021 15:55:25 - INFO - __main__ - Step 6629: {'lr': 0.00011040000000000001, 'samples': 212128, 'steps': 414, 'loss/train': 5.333324432373047} -09/20/2021 15:55:26 - INFO - __main__ - Step 6630: {'lr': 0.00011040000000000001, 'samples': 212160, 'steps': 414, 'loss/train': 5.509359836578369} -09/20/2021 15:55:26 - INFO - __main__ - Step 6631: {'lr': 0.00011040000000000001, 'samples': 212192, 'steps': 414, 'loss/train': 4.8417158126831055} -09/20/2021 15:55:27 - INFO - __main__ - Step 6632: {'lr': 0.00011040000000000001, 'samples': 212224, 'steps': 414, 'loss/train': 4.998599052429199} -09/20/2021 15:55:28 - INFO - __main__ - Step 6633: {'lr': 0.00011040000000000001, 'samples': 212256, 'steps': 414, 'loss/train': 4.789622783660889} -09/20/2021 15:55:29 - INFO - __main__ - Step 6634: {'lr': 0.00011040000000000001, 'samples': 212288, 'steps': 414, 'loss/train': 5.2329559326171875} -09/20/2021 15:55:29 - INFO - __main__ - Step 6635: {'lr': 0.00011040000000000001, 'samples': 212320, 'steps': 414, 'loss/train': 4.296838760375977} -09/20/2021 15:55:30 - INFO - __main__ - Step 6636: {'lr': 0.00011040000000000001, 'samples': 212352, 'steps': 414, 'loss/train': 0.6556114554405212} -09/20/2021 15:55:31 - INFO - __main__ - Step 6637: {'lr': 0.00011040000000000001, 'samples': 212384, 'steps': 414, 'loss/train': 4.784023284912109} -09/20/2021 15:55:32 - INFO - __main__ - Step 6638: {'lr': 0.00011040000000000001, 'samples': 212416, 'steps': 414, 'loss/train': 5.411656856536865} -09/20/2021 15:55:32 - INFO - __main__ - Step 6639: {'lr': 0.00011040000000000001, 'samples': 212448, 'steps': 414, 'loss/train': 5.064844131469727} -09/20/2021 15:55:33 - INFO - __main__ - Step 6640: {'lr': 0.00011040000000000001, 'samples': 212480, 'steps': 414, 'loss/train': 5.470262050628662} -09/20/2021 15:55:34 - INFO - __main__ - Step 6641: {'lr': 0.00011066666666666667, 'samples': 212512, 'steps': 415, 'loss/train': 5.544620513916016} -09/20/2021 15:55:35 - INFO - __main__ - Step 6642: {'lr': 0.00011066666666666667, 'samples': 212544, 'steps': 415, 'loss/train': 4.436079025268555} -09/20/2021 15:55:35 - INFO - __main__ - Step 6643: {'lr': 0.00011066666666666667, 'samples': 212576, 'steps': 415, 'loss/train': 4.764084339141846} -09/20/2021 15:55:36 - INFO - __main__ - Step 6644: {'lr': 0.00011066666666666667, 'samples': 212608, 'steps': 415, 'loss/train': 4.8628315925598145} -09/20/2021 15:55:37 - INFO - __main__ - Step 6645: {'lr': 0.00011066666666666667, 'samples': 212640, 'steps': 415, 'loss/train': 5.421824932098389} -09/20/2021 15:55:38 - INFO - __main__ - Step 6646: {'lr': 0.00011066666666666667, 'samples': 212672, 'steps': 415, 'loss/train': 4.469810962677002} -09/20/2021 15:55:38 - INFO - __main__ - Step 6647: {'lr': 0.00011066666666666667, 'samples': 212704, 'steps': 415, 'loss/train': 3.208173990249634} -09/20/2021 15:55:39 - INFO - __main__ - Step 6648: {'lr': 0.00011066666666666667, 'samples': 212736, 'steps': 415, 'loss/train': 4.083039283752441} -09/20/2021 15:55:40 - INFO - __main__ - Step 6649: {'lr': 0.00011066666666666667, 'samples': 212768, 'steps': 415, 'loss/train': 4.8219990730285645} -09/20/2021 15:55:41 - INFO - __main__ - Step 6650: {'lr': 0.00011066666666666667, 'samples': 212800, 'steps': 415, 'loss/train': 4.874783515930176} -09/20/2021 15:55:41 - INFO - __main__ - Step 6651: {'lr': 0.00011066666666666667, 'samples': 212832, 'steps': 415, 'loss/train': 5.170016288757324} -09/20/2021 15:55:42 - INFO - __main__ - Step 6652: {'lr': 0.00011066666666666667, 'samples': 212864, 'steps': 415, 'loss/train': 5.076542377471924} -09/20/2021 15:55:43 - INFO - __main__ - Step 6653: {'lr': 0.00011066666666666667, 'samples': 212896, 'steps': 415, 'loss/train': 4.692251682281494} -09/20/2021 15:55:44 - INFO - __main__ - Step 6654: {'lr': 0.00011066666666666667, 'samples': 212928, 'steps': 415, 'loss/train': 5.261285305023193} -09/20/2021 15:55:45 - INFO - __main__ - Step 6655: {'lr': 0.00011066666666666667, 'samples': 212960, 'steps': 415, 'loss/train': 4.533268451690674} -09/20/2021 15:55:46 - INFO - __main__ - Step 6656: {'lr': 0.00011066666666666667, 'samples': 212992, 'steps': 415, 'loss/train': 4.390631198883057} -09/20/2021 15:55:47 - INFO - __main__ - Step 6657: {'lr': 0.00011093333333333334, 'samples': 213024, 'steps': 416, 'loss/train': 5.134537696838379} -09/20/2021 15:55:48 - INFO - __main__ - Step 6658: {'lr': 0.00011093333333333334, 'samples': 213056, 'steps': 416, 'loss/train': 5.3143205642700195} -09/20/2021 15:55:48 - INFO - __main__ - Step 6659: {'lr': 0.00011093333333333334, 'samples': 213088, 'steps': 416, 'loss/train': 4.627806663513184} -09/20/2021 15:55:49 - INFO - __main__ - Step 6660: {'lr': 0.00011093333333333334, 'samples': 213120, 'steps': 416, 'loss/train': 5.050300598144531} -09/20/2021 15:55:50 - INFO - __main__ - Step 6661: {'lr': 0.00011093333333333334, 'samples': 213152, 'steps': 416, 'loss/train': 4.699406623840332} -09/20/2021 15:55:51 - INFO - __main__ - Step 6662: {'lr': 0.00011093333333333334, 'samples': 213184, 'steps': 416, 'loss/train': 6.003138065338135} -09/20/2021 15:55:51 - INFO - __main__ - Step 6663: {'lr': 0.00011093333333333334, 'samples': 213216, 'steps': 416, 'loss/train': 5.764217376708984} -09/20/2021 15:55:52 - INFO - __main__ - Step 6664: {'lr': 0.00011093333333333334, 'samples': 213248, 'steps': 416, 'loss/train': 5.904780387878418} -09/20/2021 15:55:53 - INFO - __main__ - Step 6665: {'lr': 0.00011093333333333334, 'samples': 213280, 'steps': 416, 'loss/train': 4.912280082702637} -09/20/2021 15:55:54 - INFO - __main__ - Step 6666: {'lr': 0.00011093333333333334, 'samples': 213312, 'steps': 416, 'loss/train': 5.146542549133301} -09/20/2021 15:55:54 - INFO - __main__ - Step 6667: {'lr': 0.00011093333333333334, 'samples': 213344, 'steps': 416, 'loss/train': 5.602182865142822} -09/20/2021 15:55:55 - INFO - __main__ - Step 6668: {'lr': 0.00011093333333333334, 'samples': 213376, 'steps': 416, 'loss/train': 5.592175006866455} -09/20/2021 15:55:56 - INFO - __main__ - Step 6669: {'lr': 0.00011093333333333334, 'samples': 213408, 'steps': 416, 'loss/train': 7.138521194458008} -09/20/2021 15:55:57 - INFO - __main__ - Step 6670: {'lr': 0.00011093333333333334, 'samples': 213440, 'steps': 416, 'loss/train': 5.0241241455078125} -09/20/2021 15:55:57 - INFO - __main__ - Step 6671: {'lr': 0.00011093333333333334, 'samples': 213472, 'steps': 416, 'loss/train': 5.156890869140625} -09/20/2021 15:55:58 - INFO - __main__ - Step 6672: {'lr': 0.00011093333333333334, 'samples': 213504, 'steps': 416, 'loss/train': 5.703515529632568} -09/20/2021 15:55:59 - INFO - __main__ - Step 6673: {'lr': 0.00011120000000000002, 'samples': 213536, 'steps': 417, 'loss/train': 5.2076263427734375} -09/20/2021 15:56:00 - INFO - __main__ - Step 6674: {'lr': 0.00011120000000000002, 'samples': 213568, 'steps': 417, 'loss/train': 4.815072059631348} -09/20/2021 15:56:00 - INFO - __main__ - Step 6675: {'lr': 0.00011120000000000002, 'samples': 213600, 'steps': 417, 'loss/train': 6.132091045379639} -09/20/2021 15:56:01 - INFO - __main__ - Step 6676: {'lr': 0.00011120000000000002, 'samples': 213632, 'steps': 417, 'loss/train': 4.487865447998047} -09/20/2021 15:56:02 - INFO - __main__ - Step 6677: {'lr': 0.00011120000000000002, 'samples': 213664, 'steps': 417, 'loss/train': 4.865962982177734} -09/20/2021 15:56:03 - INFO - __main__ - Step 6678: {'lr': 0.00011120000000000002, 'samples': 213696, 'steps': 417, 'loss/train': 5.242199420928955} -09/20/2021 15:56:03 - INFO - __main__ - Step 6679: {'lr': 0.00011120000000000002, 'samples': 213728, 'steps': 417, 'loss/train': 5.284058570861816} -09/20/2021 15:56:04 - INFO - __main__ - Step 6680: {'lr': 0.00011120000000000002, 'samples': 213760, 'steps': 417, 'loss/train': 5.968560218811035} -09/20/2021 15:56:05 - INFO - __main__ - Step 6681: {'lr': 0.00011120000000000002, 'samples': 213792, 'steps': 417, 'loss/train': 5.73182487487793} -09/20/2021 15:56:06 - INFO - __main__ - Step 6682: {'lr': 0.00011120000000000002, 'samples': 213824, 'steps': 417, 'loss/train': 4.7747907638549805} -09/20/2021 15:56:06 - INFO - __main__ - Step 6683: {'lr': 0.00011120000000000002, 'samples': 213856, 'steps': 417, 'loss/train': 5.156219482421875} -09/20/2021 15:56:08 - INFO - __main__ - Step 6684: {'lr': 0.00011120000000000002, 'samples': 213888, 'steps': 417, 'loss/train': 4.222270965576172} -09/20/2021 15:56:08 - INFO - __main__ - Step 6685: {'lr': 0.00011120000000000002, 'samples': 213920, 'steps': 417, 'loss/train': 5.688076019287109} -09/20/2021 15:56:09 - INFO - __main__ - Step 6686: {'lr': 0.00011120000000000002, 'samples': 213952, 'steps': 417, 'loss/train': 8.099295616149902} -09/20/2021 15:56:10 - INFO - __main__ - Step 6687: {'lr': 0.00011120000000000002, 'samples': 213984, 'steps': 417, 'loss/train': 8.122645378112793} -09/20/2021 15:56:11 - INFO - __main__ - Step 6688: {'lr': 0.00011120000000000002, 'samples': 214016, 'steps': 417, 'loss/train': 8.111034393310547} -09/20/2021 15:56:12 - INFO - __main__ - Step 6689: {'lr': 0.00011146666666666667, 'samples': 214048, 'steps': 418, 'loss/train': 5.049685478210449} -09/20/2021 15:56:12 - INFO - __main__ - Step 6690: {'lr': 0.00011146666666666667, 'samples': 214080, 'steps': 418, 'loss/train': 5.772732257843018} -09/20/2021 15:56:13 - INFO - __main__ - Step 6691: {'lr': 0.00011146666666666667, 'samples': 214112, 'steps': 418, 'loss/train': 4.353865146636963} -09/20/2021 15:56:14 - INFO - __main__ - Step 6692: {'lr': 0.00011146666666666667, 'samples': 214144, 'steps': 418, 'loss/train': 4.658662796020508} -09/20/2021 15:56:15 - INFO - __main__ - Step 6693: {'lr': 0.00011146666666666667, 'samples': 214176, 'steps': 418, 'loss/train': 3.1348817348480225} -09/20/2021 15:56:15 - INFO - __main__ - Step 6694: {'lr': 0.00011146666666666667, 'samples': 214208, 'steps': 418, 'loss/train': 5.403960227966309} -09/20/2021 15:56:16 - INFO - __main__ - Step 6695: {'lr': 0.00011146666666666667, 'samples': 214240, 'steps': 418, 'loss/train': 4.7255072593688965} -09/20/2021 15:56:17 - INFO - __main__ - Step 6696: {'lr': 0.00011146666666666667, 'samples': 214272, 'steps': 418, 'loss/train': 3.9592137336730957} -09/20/2021 15:56:18 - INFO - __main__ - Step 6697: {'lr': 0.00011146666666666667, 'samples': 214304, 'steps': 418, 'loss/train': 4.740718364715576} -09/20/2021 15:56:18 - INFO - __main__ - Step 6698: {'lr': 0.00011146666666666667, 'samples': 214336, 'steps': 418, 'loss/train': 3.024895429611206} -09/20/2021 15:56:19 - INFO - __main__ - Step 6699: {'lr': 0.00011146666666666667, 'samples': 214368, 'steps': 418, 'loss/train': 5.684895992279053} -09/20/2021 15:56:20 - INFO - __main__ - Step 6700: {'lr': 0.00011146666666666667, 'samples': 214400, 'steps': 418, 'loss/train': 4.759124755859375} -09/20/2021 15:56:21 - INFO - __main__ - Step 6701: {'lr': 0.00011146666666666667, 'samples': 214432, 'steps': 418, 'loss/train': 4.3526997566223145} -09/20/2021 15:56:21 - INFO - __main__ - Step 6702: {'lr': 0.00011146666666666667, 'samples': 214464, 'steps': 418, 'loss/train': 5.118817329406738} -09/20/2021 15:56:22 - INFO - __main__ - Step 6703: {'lr': 0.00011146666666666667, 'samples': 214496, 'steps': 418, 'loss/train': 4.664594650268555} -09/20/2021 15:56:23 - INFO - __main__ - Step 6704: {'lr': 0.00011146666666666667, 'samples': 214528, 'steps': 418, 'loss/train': 5.181055068969727} -09/20/2021 15:56:24 - INFO - __main__ - Step 6705: {'lr': 0.00011173333333333333, 'samples': 214560, 'steps': 419, 'loss/train': 5.344329833984375} -09/20/2021 15:56:24 - INFO - __main__ - Step 6706: {'lr': 0.00011173333333333333, 'samples': 214592, 'steps': 419, 'loss/train': 5.209292888641357} -09/20/2021 15:56:25 - INFO - __main__ - Step 6707: {'lr': 0.00011173333333333333, 'samples': 214624, 'steps': 419, 'loss/train': 5.363424777984619} -09/20/2021 15:56:26 - INFO - __main__ - Step 6708: {'lr': 0.00011173333333333333, 'samples': 214656, 'steps': 419, 'loss/train': 5.163487911224365} -09/20/2021 15:56:27 - INFO - __main__ - Step 6709: {'lr': 0.00011173333333333333, 'samples': 214688, 'steps': 419, 'loss/train': 5.899084568023682} -09/20/2021 15:56:27 - INFO - __main__ - Step 6710: {'lr': 0.00011173333333333333, 'samples': 214720, 'steps': 419, 'loss/train': 4.8383283615112305} -09/20/2021 15:56:28 - INFO - __main__ - Step 6711: {'lr': 0.00011173333333333333, 'samples': 214752, 'steps': 419, 'loss/train': 2.9592466354370117} -09/20/2021 15:56:29 - INFO - __main__ - Step 6712: {'lr': 0.00011173333333333333, 'samples': 214784, 'steps': 419, 'loss/train': 5.269327163696289} -09/20/2021 15:56:30 - INFO - __main__ - Step 6713: {'lr': 0.00011173333333333333, 'samples': 214816, 'steps': 419, 'loss/train': 5.23960018157959} -09/20/2021 15:56:30 - INFO - __main__ - Step 6714: {'lr': 0.00011173333333333333, 'samples': 214848, 'steps': 419, 'loss/train': 4.833663463592529} -09/20/2021 15:56:31 - INFO - __main__ - Step 6715: {'lr': 0.00011173333333333333, 'samples': 214880, 'steps': 419, 'loss/train': 3.0720362663269043} -09/20/2021 15:56:33 - INFO - __main__ - Step 6716: {'lr': 0.00011173333333333333, 'samples': 214912, 'steps': 419, 'loss/train': 5.359171390533447} -09/20/2021 15:56:33 - INFO - __main__ - Step 6717: {'lr': 0.00011173333333333333, 'samples': 214944, 'steps': 419, 'loss/train': 4.67389440536499} -09/20/2021 15:56:34 - INFO - __main__ - Step 6718: {'lr': 0.00011173333333333333, 'samples': 214976, 'steps': 419, 'loss/train': 4.9795637130737305} -09/20/2021 15:56:35 - INFO - __main__ - Step 6719: {'lr': 0.00011173333333333333, 'samples': 215008, 'steps': 419, 'loss/train': 4.3680853843688965} -09/20/2021 15:56:36 - INFO - __main__ - Step 6720: {'lr': 0.00011173333333333333, 'samples': 215040, 'steps': 419, 'loss/train': 4.528225898742676} -09/20/2021 15:56:36 - INFO - __main__ - Step 6721: {'lr': 0.00011200000000000001, 'samples': 215072, 'steps': 420, 'loss/train': 4.590816020965576} -09/20/2021 15:56:37 - INFO - __main__ - Step 6722: {'lr': 0.00011200000000000001, 'samples': 215104, 'steps': 420, 'loss/train': 5.449955940246582} -09/20/2021 15:56:38 - INFO - __main__ - Step 6723: {'lr': 0.00011200000000000001, 'samples': 215136, 'steps': 420, 'loss/train': 4.8831305503845215} -09/20/2021 15:56:39 - INFO - __main__ - Step 6724: {'lr': 0.00011200000000000001, 'samples': 215168, 'steps': 420, 'loss/train': 4.835837364196777} -09/20/2021 15:56:39 - INFO - __main__ - Step 6725: {'lr': 0.00011200000000000001, 'samples': 215200, 'steps': 420, 'loss/train': 5.3719401359558105} -09/20/2021 15:56:40 - INFO - __main__ - Step 6726: {'lr': 0.00011200000000000001, 'samples': 215232, 'steps': 420, 'loss/train': 4.972078323364258} -09/20/2021 15:56:41 - INFO - __main__ - Step 6727: {'lr': 0.00011200000000000001, 'samples': 215264, 'steps': 420, 'loss/train': 5.694159030914307} -09/20/2021 15:56:42 - INFO - __main__ - Step 6728: {'lr': 0.00011200000000000001, 'samples': 215296, 'steps': 420, 'loss/train': 5.370009422302246} -09/20/2021 15:56:42 - INFO - __main__ - Step 6729: {'lr': 0.00011200000000000001, 'samples': 215328, 'steps': 420, 'loss/train': 6.217458248138428} -09/20/2021 15:56:43 - INFO - __main__ - Step 6730: {'lr': 0.00011200000000000001, 'samples': 215360, 'steps': 420, 'loss/train': 5.5015869140625} -09/20/2021 15:56:44 - INFO - __main__ - Step 6731: {'lr': 0.00011200000000000001, 'samples': 215392, 'steps': 420, 'loss/train': 3.084617853164673} -09/20/2021 15:56:45 - INFO - __main__ - Step 6732: {'lr': 0.00011200000000000001, 'samples': 215424, 'steps': 420, 'loss/train': 4.413370132446289} -09/20/2021 15:56:45 - INFO - __main__ - Step 6733: {'lr': 0.00011200000000000001, 'samples': 215456, 'steps': 420, 'loss/train': 5.344028472900391} -09/20/2021 15:56:46 - INFO - __main__ - Step 6734: {'lr': 0.00011200000000000001, 'samples': 215488, 'steps': 420, 'loss/train': 2.8845272064208984} -09/20/2021 15:56:47 - INFO - __main__ - Step 6735: {'lr': 0.00011200000000000001, 'samples': 215520, 'steps': 420, 'loss/train': 5.187143802642822} -09/20/2021 15:56:48 - INFO - __main__ - Step 6736: {'lr': 0.00011200000000000001, 'samples': 215552, 'steps': 420, 'loss/train': 5.034367561340332} -09/20/2021 15:56:49 - INFO - __main__ - Step 6737: {'lr': 0.00011226666666666668, 'samples': 215584, 'steps': 421, 'loss/train': 5.64532470703125} -09/20/2021 15:56:49 - INFO - __main__ - Step 6738: {'lr': 0.00011226666666666668, 'samples': 215616, 'steps': 421, 'loss/train': 4.730142116546631} -09/20/2021 15:56:50 - INFO - __main__ - Step 6739: {'lr': 0.00011226666666666668, 'samples': 215648, 'steps': 421, 'loss/train': 4.963594436645508} -09/20/2021 15:56:51 - INFO - __main__ - Step 6740: {'lr': 0.00011226666666666668, 'samples': 215680, 'steps': 421, 'loss/train': 4.800766468048096} -09/20/2021 15:56:52 - INFO - __main__ - Step 6741: {'lr': 0.00011226666666666668, 'samples': 215712, 'steps': 421, 'loss/train': 5.292637825012207} -09/20/2021 15:56:52 - INFO - __main__ - Step 6742: {'lr': 0.00011226666666666668, 'samples': 215744, 'steps': 421, 'loss/train': 5.143767833709717} -09/20/2021 15:56:53 - INFO - __main__ - Step 6743: {'lr': 0.00011226666666666668, 'samples': 215776, 'steps': 421, 'loss/train': 4.417198181152344} -09/20/2021 15:56:54 - INFO - __main__ - Step 6744: {'lr': 0.00011226666666666668, 'samples': 215808, 'steps': 421, 'loss/train': 4.218728542327881} -09/20/2021 15:56:55 - INFO - __main__ - Step 6745: {'lr': 0.00011226666666666668, 'samples': 215840, 'steps': 421, 'loss/train': 5.257081508636475} -09/20/2021 15:56:55 - INFO - __main__ - Step 6746: {'lr': 0.00011226666666666668, 'samples': 215872, 'steps': 421, 'loss/train': 5.371946811676025} -09/20/2021 15:56:57 - INFO - __main__ - Step 6747: {'lr': 0.00011226666666666668, 'samples': 215904, 'steps': 421, 'loss/train': 6.334212303161621} -09/20/2021 15:56:57 - INFO - __main__ - Step 6748: {'lr': 0.00011226666666666668, 'samples': 215936, 'steps': 421, 'loss/train': 6.026825428009033} -09/20/2021 15:56:58 - INFO - __main__ - Step 6749: {'lr': 0.00011226666666666668, 'samples': 215968, 'steps': 421, 'loss/train': 7.075463771820068} -09/20/2021 15:56:59 - INFO - __main__ - Step 6750: {'lr': 0.00011226666666666668, 'samples': 216000, 'steps': 421, 'loss/train': 5.407381057739258} -09/20/2021 15:57:00 - INFO - __main__ - Step 6751: {'lr': 0.00011226666666666668, 'samples': 216032, 'steps': 421, 'loss/train': 5.796195983886719} -09/20/2021 15:57:00 - INFO - __main__ - Step 6752: {'lr': 0.00011226666666666668, 'samples': 216064, 'steps': 421, 'loss/train': 4.929059028625488} -09/20/2021 15:57:01 - INFO - __main__ - Step 6753: {'lr': 0.00011253333333333334, 'samples': 216096, 'steps': 422, 'loss/train': 5.024047374725342} -09/20/2021 15:57:02 - INFO - __main__ - Step 6754: {'lr': 0.00011253333333333334, 'samples': 216128, 'steps': 422, 'loss/train': 5.1209635734558105} -09/20/2021 15:57:03 - INFO - __main__ - Step 6755: {'lr': 0.00011253333333333334, 'samples': 216160, 'steps': 422, 'loss/train': 5.279445648193359} -09/20/2021 15:57:04 - INFO - __main__ - Step 6756: {'lr': 0.00011253333333333334, 'samples': 216192, 'steps': 422, 'loss/train': 4.852492809295654} -09/20/2021 15:57:04 - INFO - __main__ - Step 6757: {'lr': 0.00011253333333333334, 'samples': 216224, 'steps': 422, 'loss/train': 5.036653995513916} -09/20/2021 15:57:05 - INFO - __main__ - Step 6758: {'lr': 0.00011253333333333334, 'samples': 216256, 'steps': 422, 'loss/train': 4.688997745513916} -09/20/2021 15:57:06 - INFO - __main__ - Step 6759: {'lr': 0.00011253333333333334, 'samples': 216288, 'steps': 422, 'loss/train': 6.221524238586426} -09/20/2021 15:57:07 - INFO - __main__ - Step 6760: {'lr': 0.00011253333333333334, 'samples': 216320, 'steps': 422, 'loss/train': 4.8998703956604} -09/20/2021 15:57:07 - INFO - __main__ - Step 6761: {'lr': 0.00011253333333333334, 'samples': 216352, 'steps': 422, 'loss/train': 6.640113830566406} -09/20/2021 15:57:08 - INFO - __main__ - Step 6762: {'lr': 0.00011253333333333334, 'samples': 216384, 'steps': 422, 'loss/train': 7.439425945281982} -09/20/2021 15:57:09 - INFO - __main__ - Step 6763: {'lr': 0.00011253333333333334, 'samples': 216416, 'steps': 422, 'loss/train': 7.3580827713012695} -09/20/2021 15:57:10 - INFO - __main__ - Step 6764: {'lr': 0.00011253333333333334, 'samples': 216448, 'steps': 422, 'loss/train': 5.074521541595459} -09/20/2021 15:57:10 - INFO - __main__ - Step 6765: {'lr': 0.00011253333333333334, 'samples': 216480, 'steps': 422, 'loss/train': 5.140573978424072} -09/20/2021 15:57:11 - INFO - __main__ - Step 6766: {'lr': 0.00011253333333333334, 'samples': 216512, 'steps': 422, 'loss/train': 5.432600498199463} -09/20/2021 15:57:12 - INFO - __main__ - Step 6767: {'lr': 0.00011253333333333334, 'samples': 216544, 'steps': 422, 'loss/train': 4.9380879402160645} -09/20/2021 15:57:13 - INFO - __main__ - Step 6768: {'lr': 0.00011253333333333334, 'samples': 216576, 'steps': 422, 'loss/train': 5.386763572692871} -09/20/2021 15:57:13 - INFO - __main__ - Step 6769: {'lr': 0.00011279999999999999, 'samples': 216608, 'steps': 423, 'loss/train': 4.983053684234619} -09/20/2021 15:57:14 - INFO - __main__ - Step 6770: {'lr': 0.00011279999999999999, 'samples': 216640, 'steps': 423, 'loss/train': 3.8515727519989014} -09/20/2021 15:57:15 - INFO - __main__ - Step 6771: {'lr': 0.00011279999999999999, 'samples': 216672, 'steps': 423, 'loss/train': 3.772268295288086} -09/20/2021 15:57:16 - INFO - __main__ - Step 6772: {'lr': 0.00011279999999999999, 'samples': 216704, 'steps': 423, 'loss/train': 3.5076088905334473} -09/20/2021 15:57:16 - INFO - __main__ - Step 6773: {'lr': 0.00011279999999999999, 'samples': 216736, 'steps': 423, 'loss/train': 4.82672119140625} -09/20/2021 15:57:17 - INFO - __main__ - Step 6774: {'lr': 0.00011279999999999999, 'samples': 216768, 'steps': 423, 'loss/train': 5.549027442932129} -09/20/2021 15:57:18 - INFO - __main__ - Step 6775: {'lr': 0.00011279999999999999, 'samples': 216800, 'steps': 423, 'loss/train': 5.479783058166504} -09/20/2021 15:57:19 - INFO - __main__ - Step 6776: {'lr': 0.00011279999999999999, 'samples': 216832, 'steps': 423, 'loss/train': 5.261926651000977} -09/20/2021 15:57:19 - INFO - __main__ - Step 6777: {'lr': 0.00011279999999999999, 'samples': 216864, 'steps': 423, 'loss/train': 4.946736812591553} -09/20/2021 15:57:21 - INFO - __main__ - Step 6778: {'lr': 0.00011279999999999999, 'samples': 216896, 'steps': 423, 'loss/train': 4.938838958740234} -09/20/2021 15:57:21 - INFO - __main__ - Step 6779: {'lr': 0.00011279999999999999, 'samples': 216928, 'steps': 423, 'loss/train': 5.294494152069092} -09/20/2021 15:57:22 - INFO - __main__ - Step 6780: {'lr': 0.00011279999999999999, 'samples': 216960, 'steps': 423, 'loss/train': 5.099812984466553} -09/20/2021 15:57:23 - INFO - __main__ - Step 6781: {'lr': 0.00011279999999999999, 'samples': 216992, 'steps': 423, 'loss/train': 4.1381635665893555} -09/20/2021 15:57:24 - INFO - __main__ - Step 6782: {'lr': 0.00011279999999999999, 'samples': 217024, 'steps': 423, 'loss/train': 4.8509392738342285} -09/20/2021 15:57:24 - INFO - __main__ - Step 6783: {'lr': 0.00011279999999999999, 'samples': 217056, 'steps': 423, 'loss/train': 4.422801971435547} -09/20/2021 15:57:25 - INFO - __main__ - Step 6784: {'lr': 0.00011279999999999999, 'samples': 217088, 'steps': 423, 'loss/train': 5.01191520690918} -09/20/2021 15:57:26 - INFO - __main__ - Step 6785: {'lr': 0.00011306666666666667, 'samples': 217120, 'steps': 424, 'loss/train': 5.031498432159424} -09/20/2021 15:57:27 - INFO - __main__ - Step 6786: {'lr': 0.00011306666666666667, 'samples': 217152, 'steps': 424, 'loss/train': 6.800312519073486} -09/20/2021 15:57:28 - INFO - __main__ - Step 6787: {'lr': 0.00011306666666666667, 'samples': 217184, 'steps': 424, 'loss/train': 4.651416778564453} -09/20/2021 15:57:28 - INFO - __main__ - Step 6788: {'lr': 0.00011306666666666667, 'samples': 217216, 'steps': 424, 'loss/train': 5.087191104888916} -09/20/2021 15:57:29 - INFO - __main__ - Step 6789: {'lr': 0.00011306666666666667, 'samples': 217248, 'steps': 424, 'loss/train': 4.635270595550537} -09/20/2021 15:57:30 - INFO - __main__ - Step 6790: {'lr': 0.00011306666666666667, 'samples': 217280, 'steps': 424, 'loss/train': 5.621965408325195} -09/20/2021 15:57:31 - INFO - __main__ - Step 6791: {'lr': 0.00011306666666666667, 'samples': 217312, 'steps': 424, 'loss/train': 5.423948764801025} -09/20/2021 15:57:31 - INFO - __main__ - Step 6792: {'lr': 0.00011306666666666667, 'samples': 217344, 'steps': 424, 'loss/train': 4.686850070953369} -09/20/2021 15:57:32 - INFO - __main__ - Step 6793: {'lr': 0.00011306666666666667, 'samples': 217376, 'steps': 424, 'loss/train': 4.672537326812744} -09/20/2021 15:57:33 - INFO - __main__ - Step 6794: {'lr': 0.00011306666666666667, 'samples': 217408, 'steps': 424, 'loss/train': 3.7964441776275635} -09/20/2021 15:57:34 - INFO - __main__ - Step 6795: {'lr': 0.00011306666666666667, 'samples': 217440, 'steps': 424, 'loss/train': 4.813160419464111} -09/20/2021 15:57:34 - INFO - __main__ - Step 6796: {'lr': 0.00011306666666666667, 'samples': 217472, 'steps': 424, 'loss/train': 5.061515808105469} -09/20/2021 15:57:35 - INFO - __main__ - Step 6797: {'lr': 0.00011306666666666667, 'samples': 217504, 'steps': 424, 'loss/train': 5.406384468078613} -09/20/2021 15:57:36 - INFO - __main__ - Step 6798: {'lr': 0.00011306666666666667, 'samples': 217536, 'steps': 424, 'loss/train': 5.051100254058838} -09/20/2021 15:57:37 - INFO - __main__ - Step 6799: {'lr': 0.00011306666666666667, 'samples': 217568, 'steps': 424, 'loss/train': 4.623842239379883} -09/20/2021 15:57:37 - INFO - __main__ - Step 6800: {'lr': 0.00011306666666666667, 'samples': 217600, 'steps': 424, 'loss/train': 5.053721904754639} -09/20/2021 15:57:38 - INFO - __main__ - Step 6801: {'lr': 0.00011333333333333334, 'samples': 217632, 'steps': 425, 'loss/train': 4.5989089012146} -09/20/2021 15:57:39 - INFO - __main__ - Step 6802: {'lr': 0.00011333333333333334, 'samples': 217664, 'steps': 425, 'loss/train': 3.2580764293670654} -09/20/2021 15:57:40 - INFO - __main__ - Step 6803: {'lr': 0.00011333333333333334, 'samples': 217696, 'steps': 425, 'loss/train': 4.437859535217285} -09/20/2021 15:57:40 - INFO - __main__ - Step 6804: {'lr': 0.00011333333333333334, 'samples': 217728, 'steps': 425, 'loss/train': 4.942420959472656} -09/20/2021 15:57:41 - INFO - __main__ - Step 6805: {'lr': 0.00011333333333333334, 'samples': 217760, 'steps': 425, 'loss/train': 5.211764812469482} -09/20/2021 15:57:42 - INFO - __main__ - Step 6806: {'lr': 0.00011333333333333334, 'samples': 217792, 'steps': 425, 'loss/train': 4.615809440612793} -09/20/2021 15:57:43 - INFO - __main__ - Step 6807: {'lr': 0.00011333333333333334, 'samples': 217824, 'steps': 425, 'loss/train': 4.912482738494873} -09/20/2021 15:57:43 - INFO - __main__ - Step 6808: {'lr': 0.00011333333333333334, 'samples': 217856, 'steps': 425, 'loss/train': 6.489677906036377} -09/20/2021 15:57:44 - INFO - __main__ - Step 6809: {'lr': 0.00011333333333333334, 'samples': 217888, 'steps': 425, 'loss/train': 4.992429733276367} -09/20/2021 15:57:46 - INFO - __main__ - Step 6810: {'lr': 0.00011333333333333334, 'samples': 217920, 'steps': 425, 'loss/train': 4.9045491218566895} -09/20/2021 15:57:46 - INFO - __main__ - Step 6811: {'lr': 0.00011333333333333334, 'samples': 217952, 'steps': 425, 'loss/train': 5.446518421173096} -09/20/2021 15:57:47 - INFO - __main__ - Step 6812: {'lr': 0.00011333333333333334, 'samples': 217984, 'steps': 425, 'loss/train': 4.746507167816162} -09/20/2021 15:57:48 - INFO - __main__ - Step 6813: {'lr': 0.00011333333333333334, 'samples': 218016, 'steps': 425, 'loss/train': 5.461071968078613} -09/20/2021 15:57:49 - INFO - __main__ - Step 6814: {'lr': 0.00011333333333333334, 'samples': 218048, 'steps': 425, 'loss/train': 5.215565204620361} -09/20/2021 15:57:49 - INFO - __main__ - Step 6815: {'lr': 0.00011333333333333334, 'samples': 218080, 'steps': 425, 'loss/train': 5.0476484298706055} -09/20/2021 15:57:50 - INFO - __main__ - Step 6816: {'lr': 0.00011333333333333334, 'samples': 218112, 'steps': 425, 'loss/train': 5.314855098724365} -09/20/2021 15:57:51 - INFO - __main__ - Step 6817: {'lr': 0.0001136, 'samples': 218144, 'steps': 426, 'loss/train': 4.614178657531738} -09/20/2021 15:57:52 - INFO - __main__ - Step 6818: {'lr': 0.0001136, 'samples': 218176, 'steps': 426, 'loss/train': 5.101551055908203} -09/20/2021 15:57:53 - INFO - __main__ - Step 6819: {'lr': 0.0001136, 'samples': 218208, 'steps': 426, 'loss/train': 5.157998561859131} -09/20/2021 15:57:53 - INFO - __main__ - Step 6820: {'lr': 0.0001136, 'samples': 218240, 'steps': 426, 'loss/train': 5.077305316925049} -09/20/2021 15:57:54 - INFO - __main__ - Step 6821: {'lr': 0.0001136, 'samples': 218272, 'steps': 426, 'loss/train': 5.233895301818848} -09/20/2021 15:57:55 - INFO - __main__ - Step 6822: {'lr': 0.0001136, 'samples': 218304, 'steps': 426, 'loss/train': 5.447694301605225} -09/20/2021 15:57:56 - INFO - __main__ - Step 6823: {'lr': 0.0001136, 'samples': 218336, 'steps': 426, 'loss/train': 5.493888854980469} -09/20/2021 15:57:56 - INFO - __main__ - Step 6824: {'lr': 0.0001136, 'samples': 218368, 'steps': 426, 'loss/train': 5.453551292419434} -09/20/2021 15:57:57 - INFO - __main__ - Step 6825: {'lr': 0.0001136, 'samples': 218400, 'steps': 426, 'loss/train': 5.3989033699035645} -09/20/2021 15:57:58 - INFO - __main__ - Step 6826: {'lr': 0.0001136, 'samples': 218432, 'steps': 426, 'loss/train': 5.160539627075195} -09/20/2021 15:57:59 - INFO - __main__ - Step 6827: {'lr': 0.0001136, 'samples': 218464, 'steps': 426, 'loss/train': 3.6581711769104004} -09/20/2021 15:57:59 - INFO - __main__ - Step 6828: {'lr': 0.0001136, 'samples': 218496, 'steps': 426, 'loss/train': 4.590479850769043} -09/20/2021 15:58:00 - INFO - __main__ - Step 6829: {'lr': 0.0001136, 'samples': 218528, 'steps': 426, 'loss/train': 3.981499671936035} -09/20/2021 15:58:01 - INFO - __main__ - Step 6830: {'lr': 0.0001136, 'samples': 218560, 'steps': 426, 'loss/train': 5.247864723205566} -09/20/2021 15:58:02 - INFO - __main__ - Step 6831: {'lr': 0.0001136, 'samples': 218592, 'steps': 426, 'loss/train': 7.427027225494385} -09/20/2021 15:58:02 - INFO - __main__ - Step 6832: {'lr': 0.0001136, 'samples': 218624, 'steps': 426, 'loss/train': 7.891445159912109} -09/20/2021 15:58:03 - INFO - __main__ - Step 6833: {'lr': 0.00011386666666666668, 'samples': 218656, 'steps': 427, 'loss/train': 7.359785556793213} -09/20/2021 15:58:04 - INFO - __main__ - Step 6834: {'lr': 0.00011386666666666668, 'samples': 218688, 'steps': 427, 'loss/train': 7.056912899017334} -09/20/2021 15:58:05 - INFO - __main__ - Step 6835: {'lr': 0.00011386666666666668, 'samples': 218720, 'steps': 427, 'loss/train': 7.487785816192627} -09/20/2021 15:58:06 - INFO - __main__ - Step 6836: {'lr': 0.00011386666666666668, 'samples': 218752, 'steps': 427, 'loss/train': 5.0979084968566895} -09/20/2021 15:58:06 - INFO - __main__ - Step 6837: {'lr': 0.00011386666666666668, 'samples': 218784, 'steps': 427, 'loss/train': 4.739347457885742} -09/20/2021 15:58:07 - INFO - __main__ - Step 6838: {'lr': 0.00011386666666666668, 'samples': 218816, 'steps': 427, 'loss/train': 6.998041152954102} -09/20/2021 15:58:08 - INFO - __main__ - Step 6839: {'lr': 0.00011386666666666668, 'samples': 218848, 'steps': 427, 'loss/train': 2.8922884464263916} -09/20/2021 15:58:09 - INFO - __main__ - Step 6840: {'lr': 0.00011386666666666668, 'samples': 218880, 'steps': 427, 'loss/train': 5.463291645050049} -09/20/2021 15:58:09 - INFO - __main__ - Step 6841: {'lr': 0.00011386666666666668, 'samples': 218912, 'steps': 427, 'loss/train': 5.381453037261963} -09/20/2021 15:58:10 - INFO - __main__ - Step 6842: {'lr': 0.00011386666666666668, 'samples': 218944, 'steps': 427, 'loss/train': 5.08977746963501} -09/20/2021 15:58:12 - INFO - __main__ - Step 6843: {'lr': 0.00011386666666666668, 'samples': 218976, 'steps': 427, 'loss/train': 5.427450180053711} -09/20/2021 15:58:13 - INFO - __main__ - Step 6844: {'lr': 0.00011386666666666668, 'samples': 219008, 'steps': 427, 'loss/train': 5.770097732543945} -09/20/2021 15:58:13 - INFO - __main__ - Step 6845: {'lr': 0.00011386666666666668, 'samples': 219040, 'steps': 427, 'loss/train': 5.00039005279541} -09/20/2021 15:58:14 - INFO - __main__ - Step 6846: {'lr': 0.00011386666666666668, 'samples': 219072, 'steps': 427, 'loss/train': 4.833428382873535} -09/20/2021 15:58:15 - INFO - __main__ - Step 6847: {'lr': 0.00011386666666666668, 'samples': 219104, 'steps': 427, 'loss/train': 4.852452278137207} -09/20/2021 15:58:16 - INFO - __main__ - Step 6848: {'lr': 0.00011386666666666668, 'samples': 219136, 'steps': 427, 'loss/train': 5.483060836791992} -09/20/2021 15:58:16 - INFO - __main__ - Step 6849: {'lr': 0.00011413333333333333, 'samples': 219168, 'steps': 428, 'loss/train': 5.830286502838135} -09/20/2021 15:58:17 - INFO - __main__ - Step 6850: {'lr': 0.00011413333333333333, 'samples': 219200, 'steps': 428, 'loss/train': 5.074123382568359} -09/20/2021 15:58:18 - INFO - __main__ - Step 6851: {'lr': 0.00011413333333333333, 'samples': 219232, 'steps': 428, 'loss/train': 0.699809730052948} -09/20/2021 15:58:19 - INFO - __main__ - Step 6852: {'lr': 0.00011413333333333333, 'samples': 219264, 'steps': 428, 'loss/train': 4.702761650085449} -09/20/2021 15:58:19 - INFO - __main__ - Step 6853: {'lr': 0.00011413333333333333, 'samples': 219296, 'steps': 428, 'loss/train': 5.496675491333008} -09/20/2021 15:58:20 - INFO - __main__ - Step 6854: {'lr': 0.00011413333333333333, 'samples': 219328, 'steps': 428, 'loss/train': 3.6868035793304443} -09/20/2021 15:58:21 - INFO - __main__ - Step 6855: {'lr': 0.00011413333333333333, 'samples': 219360, 'steps': 428, 'loss/train': 4.694363117218018} -09/20/2021 15:58:22 - INFO - __main__ - Step 6856: {'lr': 0.00011413333333333333, 'samples': 219392, 'steps': 428, 'loss/train': 4.68229341506958} -09/20/2021 15:58:22 - INFO - __main__ - Step 6857: {'lr': 0.00011413333333333333, 'samples': 219424, 'steps': 428, 'loss/train': 5.127723217010498} -09/20/2021 15:58:23 - INFO - __main__ - Step 6858: {'lr': 0.00011413333333333333, 'samples': 219456, 'steps': 428, 'loss/train': 5.240750789642334} -09/20/2021 15:58:24 - INFO - __main__ - Step 6859: {'lr': 0.00011413333333333333, 'samples': 219488, 'steps': 428, 'loss/train': 4.895044803619385} -09/20/2021 15:58:25 - INFO - __main__ - Step 6860: {'lr': 0.00011413333333333333, 'samples': 219520, 'steps': 428, 'loss/train': 4.842635154724121} -09/20/2021 15:58:25 - INFO - __main__ - Step 6861: {'lr': 0.00011413333333333333, 'samples': 219552, 'steps': 428, 'loss/train': 5.332630634307861} -09/20/2021 15:58:26 - INFO - __main__ - Step 6862: {'lr': 0.00011413333333333333, 'samples': 219584, 'steps': 428, 'loss/train': 4.865818500518799} -09/20/2021 15:58:27 - INFO - __main__ - Step 6863: {'lr': 0.00011413333333333333, 'samples': 219616, 'steps': 428, 'loss/train': 5.597419261932373} -09/20/2021 15:58:28 - INFO - __main__ - Step 6864: {'lr': 0.00011413333333333333, 'samples': 219648, 'steps': 428, 'loss/train': 4.999797821044922} -09/20/2021 15:58:29 - INFO - __main__ - Step 6865: {'lr': 0.0001144, 'samples': 219680, 'steps': 429, 'loss/train': 4.883028030395508} -09/20/2021 15:58:29 - INFO - __main__ - Step 6866: {'lr': 0.0001144, 'samples': 219712, 'steps': 429, 'loss/train': 5.186740875244141} -09/20/2021 15:58:30 - INFO - __main__ - Step 6867: {'lr': 0.0001144, 'samples': 219744, 'steps': 429, 'loss/train': 5.626510143280029} -09/20/2021 15:58:31 - INFO - __main__ - Step 6868: {'lr': 0.0001144, 'samples': 219776, 'steps': 429, 'loss/train': 4.87734842300415} -09/20/2021 15:58:32 - INFO - __main__ - Step 6869: {'lr': 0.0001144, 'samples': 219808, 'steps': 429, 'loss/train': 5.693902492523193} -09/20/2021 15:58:32 - INFO - __main__ - Step 6870: {'lr': 0.0001144, 'samples': 219840, 'steps': 429, 'loss/train': 4.980292797088623} -09/20/2021 15:58:33 - INFO - __main__ - Step 6871: {'lr': 0.0001144, 'samples': 219872, 'steps': 429, 'loss/train': 4.628477573394775} -09/20/2021 15:58:34 - INFO - __main__ - Step 6872: {'lr': 0.0001144, 'samples': 219904, 'steps': 429, 'loss/train': 4.994778156280518} -09/20/2021 15:58:35 - INFO - __main__ - Step 6873: {'lr': 0.0001144, 'samples': 219936, 'steps': 429, 'loss/train': 5.034818172454834} -09/20/2021 15:58:36 - INFO - __main__ - Step 6874: {'lr': 0.0001144, 'samples': 219968, 'steps': 429, 'loss/train': 4.892640590667725} -09/20/2021 15:58:37 - INFO - __main__ - Step 6875: {'lr': 0.0001144, 'samples': 220000, 'steps': 429, 'loss/train': 5.205986976623535} -09/20/2021 15:58:37 - INFO - __main__ - Step 6876: {'lr': 0.0001144, 'samples': 220032, 'steps': 429, 'loss/train': 5.085744857788086} -09/20/2021 15:58:38 - INFO - __main__ - Step 6877: {'lr': 0.0001144, 'samples': 220064, 'steps': 429, 'loss/train': 5.8406853675842285} -09/20/2021 15:58:39 - INFO - __main__ - Step 6878: {'lr': 0.0001144, 'samples': 220096, 'steps': 429, 'loss/train': 4.906833171844482} -09/20/2021 15:58:40 - INFO - __main__ - Step 6879: {'lr': 0.0001144, 'samples': 220128, 'steps': 429, 'loss/train': 4.985761642456055} -09/20/2021 15:58:40 - INFO - __main__ - Step 6880: {'lr': 0.0001144, 'samples': 220160, 'steps': 429, 'loss/train': 4.977330207824707} -09/20/2021 15:58:41 - INFO - __main__ - Step 6881: {'lr': 0.00011466666666666667, 'samples': 220192, 'steps': 430, 'loss/train': 6.315338134765625} -09/20/2021 15:58:42 - INFO - __main__ - Step 6882: {'lr': 0.00011466666666666667, 'samples': 220224, 'steps': 430, 'loss/train': 6.712274551391602} -09/20/2021 15:58:43 - INFO - __main__ - Step 6883: {'lr': 0.00011466666666666667, 'samples': 220256, 'steps': 430, 'loss/train': 5.64125919342041} -09/20/2021 15:58:43 - INFO - __main__ - Step 6884: {'lr': 0.00011466666666666667, 'samples': 220288, 'steps': 430, 'loss/train': 4.78389835357666} -09/20/2021 15:58:44 - INFO - __main__ - Step 6885: {'lr': 0.00011466666666666667, 'samples': 220320, 'steps': 430, 'loss/train': 4.964935302734375} -09/20/2021 15:58:45 - INFO - __main__ - Step 6886: {'lr': 0.00011466666666666667, 'samples': 220352, 'steps': 430, 'loss/train': 5.233120441436768} -09/20/2021 15:58:46 - INFO - __main__ - Step 6887: {'lr': 0.00011466666666666667, 'samples': 220384, 'steps': 430, 'loss/train': 5.047523498535156} -09/20/2021 15:58:46 - INFO - __main__ - Step 6888: {'lr': 0.00011466666666666667, 'samples': 220416, 'steps': 430, 'loss/train': 4.392302989959717} -09/20/2021 15:58:47 - INFO - __main__ - Step 6889: {'lr': 0.00011466666666666667, 'samples': 220448, 'steps': 430, 'loss/train': 5.046858787536621} -09/20/2021 15:58:48 - INFO - __main__ - Step 6890: {'lr': 0.00011466666666666667, 'samples': 220480, 'steps': 430, 'loss/train': 4.796978950500488} -09/20/2021 15:58:49 - INFO - __main__ - Step 6891: {'lr': 0.00011466666666666667, 'samples': 220512, 'steps': 430, 'loss/train': 5.275213241577148} -09/20/2021 15:58:49 - INFO - __main__ - Step 6892: {'lr': 0.00011466666666666667, 'samples': 220544, 'steps': 430, 'loss/train': 5.045446395874023} -09/20/2021 15:58:50 - INFO - __main__ - Step 6893: {'lr': 0.00011466666666666667, 'samples': 220576, 'steps': 430, 'loss/train': 4.955303192138672} -09/20/2021 15:58:51 - INFO - __main__ - Step 6894: {'lr': 0.00011466666666666667, 'samples': 220608, 'steps': 430, 'loss/train': 4.864318370819092} -09/20/2021 15:58:52 - INFO - __main__ - Step 6895: {'lr': 0.00011466666666666667, 'samples': 220640, 'steps': 430, 'loss/train': 2.8216428756713867} -09/20/2021 15:58:52 - INFO - __main__ - Step 6896: {'lr': 0.00011466666666666667, 'samples': 220672, 'steps': 430, 'loss/train': 4.483376979827881} -09/20/2021 15:58:53 - INFO - __main__ - Step 6897: {'lr': 0.00011493333333333334, 'samples': 220704, 'steps': 431, 'loss/train': 4.886142730712891} -09/20/2021 15:58:54 - INFO - __main__ - Step 6898: {'lr': 0.00011493333333333334, 'samples': 220736, 'steps': 431, 'loss/train': 4.876998424530029} -09/20/2021 15:58:55 - INFO - __main__ - Step 6899: {'lr': 0.00011493333333333334, 'samples': 220768, 'steps': 431, 'loss/train': 5.054596900939941} -09/20/2021 15:58:56 - INFO - __main__ - Step 6900: {'lr': 0.00011493333333333334, 'samples': 220800, 'steps': 431, 'loss/train': 5.166456699371338} -09/20/2021 15:58:56 - INFO - __main__ - Step 6901: {'lr': 0.00011493333333333334, 'samples': 220832, 'steps': 431, 'loss/train': 5.74151611328125} -09/20/2021 15:58:57 - INFO - __main__ - Step 6902: {'lr': 0.00011493333333333334, 'samples': 220864, 'steps': 431, 'loss/train': 5.187188625335693} -09/20/2021 15:58:58 - INFO - __main__ - Step 6903: {'lr': 0.00011493333333333334, 'samples': 220896, 'steps': 431, 'loss/train': 5.9586181640625} -09/20/2021 15:58:59 - INFO - __main__ - Step 6904: {'lr': 0.00011493333333333334, 'samples': 220928, 'steps': 431, 'loss/train': 5.07769775390625} -09/20/2021 15:59:00 - INFO - __main__ - Step 6905: {'lr': 0.00011493333333333334, 'samples': 220960, 'steps': 431, 'loss/train': 5.22812557220459} -09/20/2021 15:59:01 - INFO - __main__ - Step 6906: {'lr': 0.00011493333333333334, 'samples': 220992, 'steps': 431, 'loss/train': 4.830185413360596} -09/20/2021 15:59:02 - INFO - __main__ - Step 6907: {'lr': 0.00011493333333333334, 'samples': 221024, 'steps': 431, 'loss/train': 5.013248443603516} -09/20/2021 15:59:02 - INFO - __main__ - Step 6908: {'lr': 0.00011493333333333334, 'samples': 221056, 'steps': 431, 'loss/train': 4.776726722717285} -09/20/2021 15:59:03 - INFO - __main__ - Step 6909: {'lr': 0.00011493333333333334, 'samples': 221088, 'steps': 431, 'loss/train': 4.753328800201416} -09/20/2021 15:59:04 - INFO - __main__ - Step 6910: {'lr': 0.00011493333333333334, 'samples': 221120, 'steps': 431, 'loss/train': 4.938852310180664} -09/20/2021 15:59:05 - INFO - __main__ - Step 6911: {'lr': 0.00011493333333333334, 'samples': 221152, 'steps': 431, 'loss/train': 5.5810089111328125} -09/20/2021 15:59:05 - INFO - __main__ - Step 6912: {'lr': 0.00011493333333333334, 'samples': 221184, 'steps': 431, 'loss/train': 5.2089033126831055} -09/20/2021 15:59:06 - INFO - __main__ - Step 6913: {'lr': 0.0001152, 'samples': 221216, 'steps': 432, 'loss/train': 3.331202745437622} -09/20/2021 15:59:07 - INFO - __main__ - Step 6914: {'lr': 0.0001152, 'samples': 221248, 'steps': 432, 'loss/train': 3.1192047595977783} -09/20/2021 15:59:08 - INFO - __main__ - Step 6915: {'lr': 0.0001152, 'samples': 221280, 'steps': 432, 'loss/train': 4.774552822113037} -09/20/2021 15:59:08 - INFO - __main__ - Step 6916: {'lr': 0.0001152, 'samples': 221312, 'steps': 432, 'loss/train': 5.187729835510254} -09/20/2021 15:59:09 - INFO - __main__ - Step 6917: {'lr': 0.0001152, 'samples': 221344, 'steps': 432, 'loss/train': 5.221068859100342} -09/20/2021 15:59:10 - INFO - __main__ - Step 6918: {'lr': 0.0001152, 'samples': 221376, 'steps': 432, 'loss/train': 4.940755367279053} -09/20/2021 15:59:11 - INFO - __main__ - Step 6919: {'lr': 0.0001152, 'samples': 221408, 'steps': 432, 'loss/train': 5.071404933929443} -09/20/2021 15:59:11 - INFO - __main__ - Step 6920: {'lr': 0.0001152, 'samples': 221440, 'steps': 432, 'loss/train': 5.201576232910156} -09/20/2021 15:59:12 - INFO - __main__ - Step 6921: {'lr': 0.0001152, 'samples': 221472, 'steps': 432, 'loss/train': 5.010682582855225} -09/20/2021 15:59:13 - INFO - __main__ - Step 6922: {'lr': 0.0001152, 'samples': 221504, 'steps': 432, 'loss/train': 4.4057111740112305} -09/20/2021 15:59:14 - INFO - __main__ - Step 6923: {'lr': 0.0001152, 'samples': 221536, 'steps': 432, 'loss/train': 4.7127485275268555} -09/20/2021 15:59:14 - INFO - __main__ - Step 6924: {'lr': 0.0001152, 'samples': 221568, 'steps': 432, 'loss/train': 4.801892280578613} -09/20/2021 15:59:15 - INFO - __main__ - Step 6925: {'lr': 0.0001152, 'samples': 221600, 'steps': 432, 'loss/train': 5.1057233810424805} -09/20/2021 15:59:16 - INFO - __main__ - Step 6926: {'lr': 0.0001152, 'samples': 221632, 'steps': 432, 'loss/train': 4.656691074371338} -09/20/2021 15:59:17 - INFO - __main__ - Step 6927: {'lr': 0.0001152, 'samples': 221664, 'steps': 432, 'loss/train': 6.0676960945129395} -09/20/2021 15:59:17 - INFO - __main__ - Step 6928: {'lr': 0.0001152, 'samples': 221696, 'steps': 432, 'loss/train': 5.094420909881592} -09/20/2021 15:59:18 - INFO - __main__ - Step 6929: {'lr': 0.00011546666666666668, 'samples': 221728, 'steps': 433, 'loss/train': 4.497099876403809} -09/20/2021 15:59:19 - INFO - __main__ - Step 6930: {'lr': 0.00011546666666666668, 'samples': 221760, 'steps': 433, 'loss/train': 5.903721809387207} -09/20/2021 15:59:20 - INFO - __main__ - Step 6931: {'lr': 0.00011546666666666668, 'samples': 221792, 'steps': 433, 'loss/train': 6.287099361419678} -09/20/2021 15:59:21 - INFO - __main__ - Step 6932: {'lr': 0.00011546666666666668, 'samples': 221824, 'steps': 433, 'loss/train': 4.817792892456055} -09/20/2021 15:59:21 - INFO - __main__ - Step 6933: {'lr': 0.00011546666666666668, 'samples': 221856, 'steps': 433, 'loss/train': 5.2112932205200195} -09/20/2021 15:59:22 - INFO - __main__ - Step 6934: {'lr': 0.00011546666666666668, 'samples': 221888, 'steps': 433, 'loss/train': 4.337226390838623} -09/20/2021 15:59:23 - INFO - __main__ - Step 6935: {'lr': 0.00011546666666666668, 'samples': 221920, 'steps': 433, 'loss/train': 9.387563705444336} -09/20/2021 15:59:24 - INFO - __main__ - Step 6936: {'lr': 0.00011546666666666668, 'samples': 221952, 'steps': 433, 'loss/train': 9.365959167480469} -09/20/2021 15:59:24 - INFO - __main__ - Step 6937: {'lr': 0.00011546666666666668, 'samples': 221984, 'steps': 433, 'loss/train': 7.083222389221191} -09/20/2021 15:59:26 - INFO - __main__ - Step 6938: {'lr': 0.00011546666666666668, 'samples': 222016, 'steps': 433, 'loss/train': 6.414459705352783} -09/20/2021 15:59:26 - INFO - __main__ - Step 6939: {'lr': 0.00011546666666666668, 'samples': 222048, 'steps': 433, 'loss/train': 5.306549072265625} -09/20/2021 15:59:27 - INFO - __main__ - Step 6940: {'lr': 0.00011546666666666668, 'samples': 222080, 'steps': 433, 'loss/train': 3.8028416633605957} -09/20/2021 15:59:28 - INFO - __main__ - Step 6941: {'lr': 0.00011546666666666668, 'samples': 222112, 'steps': 433, 'loss/train': 5.090792179107666} -09/20/2021 15:59:29 - INFO - __main__ - Step 6942: {'lr': 0.00011546666666666668, 'samples': 222144, 'steps': 433, 'loss/train': 5.442928791046143} -09/20/2021 15:59:29 - INFO - __main__ - Step 6943: {'lr': 0.00011546666666666668, 'samples': 222176, 'steps': 433, 'loss/train': 5.0789947509765625} -09/20/2021 15:59:30 - INFO - __main__ - Step 6944: {'lr': 0.00011546666666666668, 'samples': 222208, 'steps': 433, 'loss/train': 5.677493095397949} -09/20/2021 15:59:31 - INFO - __main__ - Step 6945: {'lr': 0.00011573333333333333, 'samples': 222240, 'steps': 434, 'loss/train': 5.007058143615723} -09/20/2021 15:59:32 - INFO - __main__ - Step 6946: {'lr': 0.00011573333333333333, 'samples': 222272, 'steps': 434, 'loss/train': 4.698328495025635} -09/20/2021 15:59:33 - INFO - __main__ - Step 6947: {'lr': 0.00011573333333333333, 'samples': 222304, 'steps': 434, 'loss/train': 5.728270053863525} -09/20/2021 15:59:33 - INFO - __main__ - Step 6948: {'lr': 0.00011573333333333333, 'samples': 222336, 'steps': 434, 'loss/train': 6.100681781768799} -09/20/2021 15:59:34 - INFO - __main__ - Step 6949: {'lr': 0.00011573333333333333, 'samples': 222368, 'steps': 434, 'loss/train': 5.112281322479248} -09/20/2021 15:59:35 - INFO - __main__ - Step 6950: {'lr': 0.00011573333333333333, 'samples': 222400, 'steps': 434, 'loss/train': 5.350078105926514} -09/20/2021 15:59:36 - INFO - __main__ - Step 6951: {'lr': 0.00011573333333333333, 'samples': 222432, 'steps': 434, 'loss/train': 6.075608730316162} -09/20/2021 15:59:36 - INFO - __main__ - Step 6952: {'lr': 0.00011573333333333333, 'samples': 222464, 'steps': 434, 'loss/train': 4.956234455108643} -09/20/2021 15:59:37 - INFO - __main__ - Step 6953: {'lr': 0.00011573333333333333, 'samples': 222496, 'steps': 434, 'loss/train': 4.302507400512695} -09/20/2021 15:59:38 - INFO - __main__ - Step 6954: {'lr': 0.00011573333333333333, 'samples': 222528, 'steps': 434, 'loss/train': 5.048542022705078} -09/20/2021 15:59:39 - INFO - __main__ - Step 6955: {'lr': 0.00011573333333333333, 'samples': 222560, 'steps': 434, 'loss/train': 5.169127941131592} -09/20/2021 15:59:39 - INFO - __main__ - Step 6956: {'lr': 0.00011573333333333333, 'samples': 222592, 'steps': 434, 'loss/train': 6.403012752532959} -09/20/2021 15:59:40 - INFO - __main__ - Step 6957: {'lr': 0.00011573333333333333, 'samples': 222624, 'steps': 434, 'loss/train': 5.294203758239746} -09/20/2021 15:59:41 - INFO - __main__ - Step 6958: {'lr': 0.00011573333333333333, 'samples': 222656, 'steps': 434, 'loss/train': 5.664985656738281} -09/20/2021 15:59:42 - INFO - __main__ - Step 6959: {'lr': 0.00011573333333333333, 'samples': 222688, 'steps': 434, 'loss/train': 4.864521503448486} -09/20/2021 15:59:42 - INFO - __main__ - Step 6960: {'lr': 0.00011573333333333333, 'samples': 222720, 'steps': 434, 'loss/train': 5.040899276733398} -09/20/2021 15:59:43 - INFO - __main__ - Step 6961: {'lr': 0.000116, 'samples': 222752, 'steps': 435, 'loss/train': 5.277835369110107} -09/20/2021 15:59:44 - INFO - __main__ - Step 6962: {'lr': 0.000116, 'samples': 222784, 'steps': 435, 'loss/train': 0.722992479801178} -09/20/2021 15:59:45 - INFO - __main__ - Step 6963: {'lr': 0.000116, 'samples': 222816, 'steps': 435, 'loss/train': 4.608615398406982} -09/20/2021 15:59:45 - INFO - __main__ - Step 6964: {'lr': 0.000116, 'samples': 222848, 'steps': 435, 'loss/train': 5.272794246673584} -09/20/2021 15:59:46 - INFO - __main__ - Step 6965: {'lr': 0.000116, 'samples': 222880, 'steps': 435, 'loss/train': 4.79270601272583} -09/20/2021 15:59:47 - INFO - __main__ - Step 6966: {'lr': 0.000116, 'samples': 222912, 'steps': 435, 'loss/train': 4.084462642669678} -09/20/2021 15:59:48 - INFO - __main__ - Step 6967: {'lr': 0.000116, 'samples': 222944, 'steps': 435, 'loss/train': 4.802402019500732} -09/20/2021 15:59:48 - INFO - __main__ - Step 6968: {'lr': 0.000116, 'samples': 222976, 'steps': 435, 'loss/train': 4.984625339508057} -09/20/2021 15:59:50 - INFO - __main__ - Step 6969: {'lr': 0.000116, 'samples': 223008, 'steps': 435, 'loss/train': 5.267923355102539} -09/20/2021 15:59:51 - INFO - __main__ - Step 6970: {'lr': 0.000116, 'samples': 223040, 'steps': 435, 'loss/train': 5.453836441040039} -09/20/2021 15:59:51 - INFO - __main__ - Step 6971: {'lr': 0.000116, 'samples': 223072, 'steps': 435, 'loss/train': 6.764666557312012} -09/20/2021 15:59:52 - INFO - __main__ - Step 6972: {'lr': 0.000116, 'samples': 223104, 'steps': 435, 'loss/train': 2.5616557598114014} -09/20/2021 15:59:53 - INFO - __main__ - Step 6973: {'lr': 0.000116, 'samples': 223136, 'steps': 435, 'loss/train': 2.342466115951538} -09/20/2021 15:59:54 - INFO - __main__ - Step 6974: {'lr': 0.000116, 'samples': 223168, 'steps': 435, 'loss/train': 5.056408405303955} -09/20/2021 15:59:54 - INFO - __main__ - Step 6975: {'lr': 0.000116, 'samples': 223200, 'steps': 435, 'loss/train': 5.489850997924805} -09/20/2021 15:59:55 - INFO - __main__ - Step 6976: {'lr': 0.000116, 'samples': 223232, 'steps': 435, 'loss/train': 5.6012349128723145} -09/20/2021 15:59:56 - INFO - __main__ - Step 6977: {'lr': 0.00011626666666666668, 'samples': 223264, 'steps': 436, 'loss/train': 5.703437328338623} -09/20/2021 15:59:57 - INFO - __main__ - Step 6978: {'lr': 0.00011626666666666668, 'samples': 223296, 'steps': 436, 'loss/train': 5.007512092590332} -09/20/2021 15:59:57 - INFO - __main__ - Step 6979: {'lr': 0.00011626666666666668, 'samples': 223328, 'steps': 436, 'loss/train': 5.3844218254089355} -09/20/2021 15:59:58 - INFO - __main__ - Step 6980: {'lr': 0.00011626666666666668, 'samples': 223360, 'steps': 436, 'loss/train': 5.643062114715576} -09/20/2021 15:59:59 - INFO - __main__ - Step 6981: {'lr': 0.00011626666666666668, 'samples': 223392, 'steps': 436, 'loss/train': 4.76788854598999} -09/20/2021 16:00:00 - INFO - __main__ - Step 6982: {'lr': 0.00011626666666666668, 'samples': 223424, 'steps': 436, 'loss/train': 7.287636756896973} -09/20/2021 16:00:00 - INFO - __main__ - Step 6983: {'lr': 0.00011626666666666668, 'samples': 223456, 'steps': 436, 'loss/train': 5.296051979064941} -09/20/2021 16:00:01 - INFO - __main__ - Step 6984: {'lr': 0.00011626666666666668, 'samples': 223488, 'steps': 436, 'loss/train': 3.9019882678985596} -09/20/2021 16:00:02 - INFO - __main__ - Step 6985: {'lr': 0.00011626666666666668, 'samples': 223520, 'steps': 436, 'loss/train': 3.6100425720214844} -09/20/2021 16:00:03 - INFO - __main__ - Step 6986: {'lr': 0.00011626666666666668, 'samples': 223552, 'steps': 436, 'loss/train': 3.8937463760375977} -09/20/2021 16:00:03 - INFO - __main__ - Step 6987: {'lr': 0.00011626666666666668, 'samples': 223584, 'steps': 436, 'loss/train': 2.8997411727905273} -09/20/2021 16:00:04 - INFO - __main__ - Step 6988: {'lr': 0.00011626666666666668, 'samples': 223616, 'steps': 436, 'loss/train': 3.3762826919555664} -09/20/2021 16:00:05 - INFO - __main__ - Step 6989: {'lr': 0.00011626666666666668, 'samples': 223648, 'steps': 436, 'loss/train': 5.143653392791748} -09/20/2021 16:00:06 - INFO - __main__ - Step 6990: {'lr': 0.00011626666666666668, 'samples': 223680, 'steps': 436, 'loss/train': 4.8073811531066895} -09/20/2021 16:00:06 - INFO - __main__ - Step 6991: {'lr': 0.00011626666666666668, 'samples': 223712, 'steps': 436, 'loss/train': 4.870699882507324} -09/20/2021 16:00:07 - INFO - __main__ - Step 6992: {'lr': 0.00011626666666666668, 'samples': 223744, 'steps': 436, 'loss/train': 5.205853462219238} -09/20/2021 16:00:08 - INFO - __main__ - Step 6993: {'lr': 0.00011653333333333334, 'samples': 223776, 'steps': 437, 'loss/train': 4.473331451416016} -09/20/2021 16:00:09 - INFO - __main__ - Step 6994: {'lr': 0.00011653333333333334, 'samples': 223808, 'steps': 437, 'loss/train': 4.588613510131836} -09/20/2021 16:00:10 - INFO - __main__ - Step 6995: {'lr': 0.00011653333333333334, 'samples': 223840, 'steps': 437, 'loss/train': 4.42431640625} -09/20/2021 16:00:10 - INFO - __main__ - Step 6996: {'lr': 0.00011653333333333334, 'samples': 223872, 'steps': 437, 'loss/train': 4.502840995788574} -09/20/2021 16:00:11 - INFO - __main__ - Step 6997: {'lr': 0.00011653333333333334, 'samples': 223904, 'steps': 437, 'loss/train': 3.7248623371124268} -09/20/2021 16:00:12 - INFO - __main__ - Step 6998: {'lr': 0.00011653333333333334, 'samples': 223936, 'steps': 437, 'loss/train': 2.8713600635528564} -09/20/2021 16:00:13 - INFO - __main__ - Step 6999: {'lr': 0.00011653333333333334, 'samples': 223968, 'steps': 437, 'loss/train': 1.8780707120895386} -09/20/2021 16:00:14 - INFO - __main__ - Step 7000: {'lr': 0.00011653333333333334, 'samples': 224000, 'steps': 437, 'loss/train': 5.037160396575928} -09/20/2021 16:00:15 - INFO - __main__ - Step 7001: {'lr': 0.00011653333333333334, 'samples': 224032, 'steps': 437, 'loss/train': 4.8632731437683105} -09/20/2021 16:00:15 - INFO - __main__ - Step 7002: {'lr': 0.00011653333333333334, 'samples': 224064, 'steps': 437, 'loss/train': 5.301426887512207} -09/20/2021 16:00:16 - INFO - __main__ - Step 7003: {'lr': 0.00011653333333333334, 'samples': 224096, 'steps': 437, 'loss/train': 6.170408725738525} -09/20/2021 16:00:17 - INFO - __main__ - Step 7004: {'lr': 0.00011653333333333334, 'samples': 224128, 'steps': 437, 'loss/train': 4.792888164520264} -09/20/2021 16:00:18 - INFO - __main__ - Step 7005: {'lr': 0.00011653333333333334, 'samples': 224160, 'steps': 437, 'loss/train': 2.126154661178589} -09/20/2021 16:00:18 - INFO - __main__ - Step 7006: {'lr': 0.00011653333333333334, 'samples': 224192, 'steps': 437, 'loss/train': 4.724394798278809} -09/20/2021 16:00:19 - INFO - __main__ - Step 7007: {'lr': 0.00011653333333333334, 'samples': 224224, 'steps': 437, 'loss/train': 5.842303276062012} -09/20/2021 16:00:20 - INFO - __main__ - Step 7008: {'lr': 0.00011653333333333334, 'samples': 224256, 'steps': 437, 'loss/train': 5.8061299324035645} -09/20/2021 16:00:21 - INFO - __main__ - Step 7009: {'lr': 0.00011679999999999999, 'samples': 224288, 'steps': 438, 'loss/train': 4.8217010498046875} -09/20/2021 16:00:21 - INFO - __main__ - Step 7010: {'lr': 0.00011679999999999999, 'samples': 224320, 'steps': 438, 'loss/train': 5.088934421539307} -09/20/2021 16:00:22 - INFO - __main__ - Step 7011: {'lr': 0.00011679999999999999, 'samples': 224352, 'steps': 438, 'loss/train': 4.553540229797363} -09/20/2021 16:00:23 - INFO - __main__ - Step 7012: {'lr': 0.00011679999999999999, 'samples': 224384, 'steps': 438, 'loss/train': 5.467595100402832} -09/20/2021 16:00:24 - INFO - __main__ - Step 7013: {'lr': 0.00011679999999999999, 'samples': 224416, 'steps': 438, 'loss/train': 4.881397247314453} -09/20/2021 16:00:24 - INFO - __main__ - Step 7014: {'lr': 0.00011679999999999999, 'samples': 224448, 'steps': 438, 'loss/train': 5.315874099731445} -09/20/2021 16:00:25 - INFO - __main__ - Step 7015: {'lr': 0.00011679999999999999, 'samples': 224480, 'steps': 438, 'loss/train': 5.410292148590088} -09/20/2021 16:00:26 - INFO - __main__ - Step 7016: {'lr': 0.00011679999999999999, 'samples': 224512, 'steps': 438, 'loss/train': 5.467952251434326} -09/20/2021 16:00:27 - INFO - __main__ - Step 7017: {'lr': 0.00011679999999999999, 'samples': 224544, 'steps': 438, 'loss/train': 4.97040319442749} -09/20/2021 16:00:27 - INFO - __main__ - Step 7018: {'lr': 0.00011679999999999999, 'samples': 224576, 'steps': 438, 'loss/train': 5.224005222320557} -09/20/2021 16:00:28 - INFO - __main__ - Step 7019: {'lr': 0.00011679999999999999, 'samples': 224608, 'steps': 438, 'loss/train': 1.8452435731887817} -09/20/2021 16:00:29 - INFO - __main__ - Step 7020: {'lr': 0.00011679999999999999, 'samples': 224640, 'steps': 438, 'loss/train': 1.9864951372146606} -09/20/2021 16:00:30 - INFO - __main__ - Step 7021: {'lr': 0.00011679999999999999, 'samples': 224672, 'steps': 438, 'loss/train': 5.694334983825684} -09/20/2021 16:00:30 - INFO - __main__ - Step 7022: {'lr': 0.00011679999999999999, 'samples': 224704, 'steps': 438, 'loss/train': 5.1688337326049805} -09/20/2021 16:00:31 - INFO - __main__ - Step 7023: {'lr': 0.00011679999999999999, 'samples': 224736, 'steps': 438, 'loss/train': 4.830999851226807} -09/20/2021 16:00:32 - INFO - __main__ - Step 7024: {'lr': 0.00011679999999999999, 'samples': 224768, 'steps': 438, 'loss/train': 4.963718414306641} -09/20/2021 16:00:33 - INFO - __main__ - Step 7025: {'lr': 0.00011706666666666668, 'samples': 224800, 'steps': 439, 'loss/train': 5.137984275817871} -09/20/2021 16:00:34 - INFO - __main__ - Step 7026: {'lr': 0.00011706666666666668, 'samples': 224832, 'steps': 439, 'loss/train': 4.6200103759765625} -09/20/2021 16:00:34 - INFO - __main__ - Step 7027: {'lr': 0.00011706666666666668, 'samples': 224864, 'steps': 439, 'loss/train': 4.843639373779297} -09/20/2021 16:00:35 - INFO - __main__ - Step 7028: {'lr': 0.00011706666666666668, 'samples': 224896, 'steps': 439, 'loss/train': 5.596092700958252} -09/20/2021 16:00:36 - INFO - __main__ - Step 7029: {'lr': 0.00011706666666666668, 'samples': 224928, 'steps': 439, 'loss/train': 4.664041996002197} -09/20/2021 16:00:37 - INFO - __main__ - Step 7030: {'lr': 0.00011706666666666668, 'samples': 224960, 'steps': 439, 'loss/train': 5.297601222991943} -09/20/2021 16:00:38 - INFO - __main__ - Step 7031: {'lr': 0.00011706666666666668, 'samples': 224992, 'steps': 439, 'loss/train': 4.534040451049805} -09/20/2021 16:00:39 - INFO - __main__ - Step 7032: {'lr': 0.00011706666666666668, 'samples': 225024, 'steps': 439, 'loss/train': 2.8895716667175293} -09/20/2021 16:00:40 - INFO - __main__ - Step 7033: {'lr': 0.00011706666666666668, 'samples': 225056, 'steps': 439, 'loss/train': 2.4912233352661133} -09/20/2021 16:00:40 - INFO - __main__ - Step 7034: {'lr': 0.00011706666666666668, 'samples': 225088, 'steps': 439, 'loss/train': 4.806788921356201} -09/20/2021 16:00:41 - INFO - __main__ - Step 7035: {'lr': 0.00011706666666666668, 'samples': 225120, 'steps': 439, 'loss/train': 4.947830677032471} -09/20/2021 16:00:42 - INFO - __main__ - Step 7036: {'lr': 0.00011706666666666668, 'samples': 225152, 'steps': 439, 'loss/train': 5.422831058502197} -09/20/2021 16:00:43 - INFO - __main__ - Step 7037: {'lr': 0.00011706666666666668, 'samples': 225184, 'steps': 439, 'loss/train': 5.068739891052246} -09/20/2021 16:00:43 - INFO - __main__ - Step 7038: {'lr': 0.00011706666666666668, 'samples': 225216, 'steps': 439, 'loss/train': 5.339808940887451} -09/20/2021 16:00:44 - INFO - __main__ - Step 7039: {'lr': 0.00011706666666666668, 'samples': 225248, 'steps': 439, 'loss/train': 5.145984649658203} -09/20/2021 16:00:45 - INFO - __main__ - Step 7040: {'lr': 0.00011706666666666668, 'samples': 225280, 'steps': 439, 'loss/train': 5.732313632965088} -09/20/2021 16:00:46 - INFO - __main__ - Step 7041: {'lr': 0.00011733333333333334, 'samples': 225312, 'steps': 440, 'loss/train': 5.2493367195129395} -09/20/2021 16:00:47 - INFO - __main__ - Step 7042: {'lr': 0.00011733333333333334, 'samples': 225344, 'steps': 440, 'loss/train': 5.146507263183594} -09/20/2021 16:00:47 - INFO - __main__ - Step 7043: {'lr': 0.00011733333333333334, 'samples': 225376, 'steps': 440, 'loss/train': 5.023070812225342} -09/20/2021 16:00:48 - INFO - __main__ - Step 7044: {'lr': 0.00011733333333333334, 'samples': 225408, 'steps': 440, 'loss/train': 5.577686786651611} -09/20/2021 16:00:49 - INFO - __main__ - Step 7045: {'lr': 0.00011733333333333334, 'samples': 225440, 'steps': 440, 'loss/train': 5.360510349273682} -09/20/2021 16:00:50 - INFO - __main__ - Step 7046: {'lr': 0.00011733333333333334, 'samples': 225472, 'steps': 440, 'loss/train': 5.227387428283691} -09/20/2021 16:00:50 - INFO - __main__ - Step 7047: {'lr': 0.00011733333333333334, 'samples': 225504, 'steps': 440, 'loss/train': 4.781126976013184} -09/20/2021 16:00:51 - INFO - __main__ - Step 7048: {'lr': 0.00011733333333333334, 'samples': 225536, 'steps': 440, 'loss/train': 4.528456211090088} -09/20/2021 16:00:52 - INFO - __main__ - Step 7049: {'lr': 0.00011733333333333334, 'samples': 225568, 'steps': 440, 'loss/train': 4.895262718200684} -09/20/2021 16:00:53 - INFO - __main__ - Step 7050: {'lr': 0.00011733333333333334, 'samples': 225600, 'steps': 440, 'loss/train': 5.288473606109619} -09/20/2021 16:00:53 - INFO - __main__ - Step 7051: {'lr': 0.00011733333333333334, 'samples': 225632, 'steps': 440, 'loss/train': 4.5222249031066895} -09/20/2021 16:00:54 - INFO - __main__ - Step 7052: {'lr': 0.00011733333333333334, 'samples': 225664, 'steps': 440, 'loss/train': 5.049380302429199} -09/20/2021 16:00:55 - INFO - __main__ - Step 7053: {'lr': 0.00011733333333333334, 'samples': 225696, 'steps': 440, 'loss/train': 5.166492462158203} -09/20/2021 16:00:56 - INFO - __main__ - Step 7054: {'lr': 0.00011733333333333334, 'samples': 225728, 'steps': 440, 'loss/train': 5.49250602722168} -09/20/2021 16:00:56 - INFO - __main__ - Step 7055: {'lr': 0.00011733333333333334, 'samples': 225760, 'steps': 440, 'loss/train': 4.922379016876221} -09/20/2021 16:00:57 - INFO - __main__ - Step 7056: {'lr': 0.00011733333333333334, 'samples': 225792, 'steps': 440, 'loss/train': 5.116669178009033} -09/20/2021 16:00:58 - INFO - __main__ - Step 7057: {'lr': 0.0001176, 'samples': 225824, 'steps': 441, 'loss/train': 5.267856597900391} -09/20/2021 16:00:59 - INFO - __main__ - Step 7058: {'lr': 0.0001176, 'samples': 225856, 'steps': 441, 'loss/train': 4.94473934173584} -09/20/2021 16:00:59 - INFO - __main__ - Step 7059: {'lr': 0.0001176, 'samples': 225888, 'steps': 441, 'loss/train': 4.740016937255859} -09/20/2021 16:01:01 - INFO - __main__ - Step 7060: {'lr': 0.0001176, 'samples': 225920, 'steps': 441, 'loss/train': 4.199758529663086} -09/20/2021 16:01:02 - INFO - __main__ - Step 7061: {'lr': 0.0001176, 'samples': 225952, 'steps': 441, 'loss/train': 5.1118998527526855} -09/20/2021 16:01:02 - INFO - __main__ - Step 7062: {'lr': 0.0001176, 'samples': 225984, 'steps': 441, 'loss/train': 5.366971969604492} -09/20/2021 16:01:03 - INFO - __main__ - Step 7063: {'lr': 0.0001176, 'samples': 226016, 'steps': 441, 'loss/train': 5.096493721008301} -09/20/2021 16:01:04 - INFO - __main__ - Step 7064: {'lr': 0.0001176, 'samples': 226048, 'steps': 441, 'loss/train': 4.905974864959717} -09/20/2021 16:01:05 - INFO - __main__ - Step 7065: {'lr': 0.0001176, 'samples': 226080, 'steps': 441, 'loss/train': 4.903099536895752} -09/20/2021 16:01:05 - INFO - __main__ - Step 7066: {'lr': 0.0001176, 'samples': 226112, 'steps': 441, 'loss/train': 5.924293041229248} -09/20/2021 16:01:06 - INFO - __main__ - Step 7067: {'lr': 0.0001176, 'samples': 226144, 'steps': 441, 'loss/train': 6.242842674255371} -09/20/2021 16:01:07 - INFO - __main__ - Step 7068: {'lr': 0.0001176, 'samples': 226176, 'steps': 441, 'loss/train': 6.413668155670166} -09/20/2021 16:01:08 - INFO - __main__ - Step 7069: {'lr': 0.0001176, 'samples': 226208, 'steps': 441, 'loss/train': 5.36935567855835} -09/20/2021 16:01:08 - INFO - __main__ - Step 7070: {'lr': 0.0001176, 'samples': 226240, 'steps': 441, 'loss/train': 4.6209540367126465} -09/20/2021 16:01:09 - INFO - __main__ - Step 7071: {'lr': 0.0001176, 'samples': 226272, 'steps': 441, 'loss/train': 5.251248836517334} -09/20/2021 16:01:10 - INFO - __main__ - Step 7072: {'lr': 0.0001176, 'samples': 226304, 'steps': 441, 'loss/train': 4.147571086883545} -09/20/2021 16:01:11 - INFO - __main__ - Step 7073: {'lr': 0.00011786666666666668, 'samples': 226336, 'steps': 442, 'loss/train': 5.171285152435303} -09/20/2021 16:01:11 - INFO - __main__ - Step 7074: {'lr': 0.00011786666666666668, 'samples': 226368, 'steps': 442, 'loss/train': 5.885597229003906} -09/20/2021 16:01:12 - INFO - __main__ - Step 7075: {'lr': 0.00011786666666666668, 'samples': 226400, 'steps': 442, 'loss/train': 5.699315547943115} -09/20/2021 16:01:13 - INFO - __main__ - Step 7076: {'lr': 0.00011786666666666668, 'samples': 226432, 'steps': 442, 'loss/train': 5.36042594909668} -09/20/2021 16:01:14 - INFO - __main__ - Step 7077: {'lr': 0.00011786666666666668, 'samples': 226464, 'steps': 442, 'loss/train': 3.9054980278015137} -09/20/2021 16:01:14 - INFO - __main__ - Step 7078: {'lr': 0.00011786666666666668, 'samples': 226496, 'steps': 442, 'loss/train': 5.39531946182251} -09/20/2021 16:01:15 - INFO - __main__ - Step 7079: {'lr': 0.00011786666666666668, 'samples': 226528, 'steps': 442, 'loss/train': 5.110724925994873} -09/20/2021 16:01:16 - INFO - __main__ - Step 7080: {'lr': 0.00011786666666666668, 'samples': 226560, 'steps': 442, 'loss/train': 2.2588112354278564} -09/20/2021 16:01:17 - INFO - __main__ - Step 7081: {'lr': 0.00011786666666666668, 'samples': 226592, 'steps': 442, 'loss/train': 2.1295840740203857} -09/20/2021 16:01:17 - INFO - __main__ - Step 7082: {'lr': 0.00011786666666666668, 'samples': 226624, 'steps': 442, 'loss/train': 5.185661792755127} -09/20/2021 16:01:18 - INFO - __main__ - Step 7083: {'lr': 0.00011786666666666668, 'samples': 226656, 'steps': 442, 'loss/train': 4.782024383544922} -09/20/2021 16:01:19 - INFO - __main__ - Step 7084: {'lr': 0.00011786666666666668, 'samples': 226688, 'steps': 442, 'loss/train': 4.409018039703369} -09/20/2021 16:01:20 - INFO - __main__ - Step 7085: {'lr': 0.00011786666666666668, 'samples': 226720, 'steps': 442, 'loss/train': 4.665772914886475} -09/20/2021 16:01:20 - INFO - __main__ - Step 7086: {'lr': 0.00011786666666666668, 'samples': 226752, 'steps': 442, 'loss/train': 5.076434135437012} -09/20/2021 16:01:21 - INFO - __main__ - Step 7087: {'lr': 0.00011786666666666668, 'samples': 226784, 'steps': 442, 'loss/train': 5.0806660652160645} -09/20/2021 16:01:22 - INFO - __main__ - Step 7088: {'lr': 0.00011786666666666668, 'samples': 226816, 'steps': 442, 'loss/train': 5.743529319763184} -09/20/2021 16:01:23 - INFO - __main__ - Step 7089: {'lr': 0.00011813333333333334, 'samples': 226848, 'steps': 443, 'loss/train': 4.792573928833008} -09/20/2021 16:01:24 - INFO - __main__ - Step 7090: {'lr': 0.00011813333333333334, 'samples': 226880, 'steps': 443, 'loss/train': 4.7506327629089355} -09/20/2021 16:01:25 - INFO - __main__ - Step 7091: {'lr': 0.00011813333333333334, 'samples': 226912, 'steps': 443, 'loss/train': 4.714658260345459} -09/20/2021 16:01:26 - INFO - __main__ - Step 7092: {'lr': 0.00011813333333333334, 'samples': 226944, 'steps': 443, 'loss/train': 4.471029281616211} -09/20/2021 16:01:27 - INFO - __main__ - Step 7093: {'lr': 0.00011813333333333334, 'samples': 226976, 'steps': 443, 'loss/train': 5.154417037963867} -09/20/2021 16:01:27 - INFO - __main__ - Step 7094: {'lr': 0.00011813333333333334, 'samples': 227008, 'steps': 443, 'loss/train': 4.427051067352295} -09/20/2021 16:01:28 - INFO - __main__ - Step 7095: {'lr': 0.00011813333333333334, 'samples': 227040, 'steps': 443, 'loss/train': 4.483659744262695} -09/20/2021 16:01:29 - INFO - __main__ - Step 7096: {'lr': 0.00011813333333333334, 'samples': 227072, 'steps': 443, 'loss/train': 4.502241134643555} -09/20/2021 16:01:30 - INFO - __main__ - Step 7097: {'lr': 0.00011813333333333334, 'samples': 227104, 'steps': 443, 'loss/train': 4.985086917877197} -09/20/2021 16:01:30 - INFO - __main__ - Step 7098: {'lr': 0.00011813333333333334, 'samples': 227136, 'steps': 443, 'loss/train': 5.044963836669922} -09/20/2021 16:01:31 - INFO - __main__ - Step 7099: {'lr': 0.00011813333333333334, 'samples': 227168, 'steps': 443, 'loss/train': 4.5702223777771} -09/20/2021 16:01:32 - INFO - __main__ - Step 7100: {'lr': 0.00011813333333333334, 'samples': 227200, 'steps': 443, 'loss/train': 5.410682201385498} -09/20/2021 16:01:33 - INFO - __main__ - Step 7101: {'lr': 0.00011813333333333334, 'samples': 227232, 'steps': 443, 'loss/train': 5.837945938110352} -09/20/2021 16:01:34 - INFO - __main__ - Step 7102: {'lr': 0.00011813333333333334, 'samples': 227264, 'steps': 443, 'loss/train': 5.0072340965271} -09/20/2021 16:01:34 - INFO - __main__ - Step 7103: {'lr': 0.00011813333333333334, 'samples': 227296, 'steps': 443, 'loss/train': 4.828414440155029} -09/20/2021 16:01:35 - INFO - __main__ - Step 7104: {'lr': 0.00011813333333333334, 'samples': 227328, 'steps': 443, 'loss/train': 4.487966060638428} -09/20/2021 16:01:36 - INFO - __main__ - Step 7105: {'lr': 0.0001184, 'samples': 227360, 'steps': 444, 'loss/train': 4.589295387268066} -09/20/2021 16:01:37 - INFO - __main__ - Step 7106: {'lr': 0.0001184, 'samples': 227392, 'steps': 444, 'loss/train': 6.184419631958008} -09/20/2021 16:01:37 - INFO - __main__ - Step 7107: {'lr': 0.0001184, 'samples': 227424, 'steps': 444, 'loss/train': 4.7339186668396} -09/20/2021 16:01:38 - INFO - __main__ - Step 7108: {'lr': 0.0001184, 'samples': 227456, 'steps': 444, 'loss/train': 4.622530460357666} -09/20/2021 16:01:39 - INFO - __main__ - Step 7109: {'lr': 0.0001184, 'samples': 227488, 'steps': 444, 'loss/train': 4.277790069580078} -09/20/2021 16:01:40 - INFO - __main__ - Step 7110: {'lr': 0.0001184, 'samples': 227520, 'steps': 444, 'loss/train': 4.690971374511719} -09/20/2021 16:01:40 - INFO - __main__ - Step 7111: {'lr': 0.0001184, 'samples': 227552, 'steps': 444, 'loss/train': 3.183164358139038} -09/20/2021 16:01:41 - INFO - __main__ - Step 7112: {'lr': 0.0001184, 'samples': 227584, 'steps': 444, 'loss/train': 3.2345871925354004} -09/20/2021 16:01:42 - INFO - __main__ - Step 7113: {'lr': 0.0001184, 'samples': 227616, 'steps': 444, 'loss/train': 3.2658050060272217} -09/20/2021 16:01:43 - INFO - __main__ - Step 7114: {'lr': 0.0001184, 'samples': 227648, 'steps': 444, 'loss/train': 3.195596218109131} -09/20/2021 16:01:43 - INFO - __main__ - Step 7115: {'lr': 0.0001184, 'samples': 227680, 'steps': 444, 'loss/train': 3.219959020614624} -09/20/2021 16:01:44 - INFO - __main__ - Step 7116: {'lr': 0.0001184, 'samples': 227712, 'steps': 444, 'loss/train': 3.253535032272339} -09/20/2021 16:01:45 - INFO - __main__ - Step 7117: {'lr': 0.0001184, 'samples': 227744, 'steps': 444, 'loss/train': 3.2344555854797363} -09/20/2021 16:01:46 - INFO - __main__ - Step 7118: {'lr': 0.0001184, 'samples': 227776, 'steps': 444, 'loss/train': 3.280626058578491} -09/20/2021 16:01:46 - INFO - __main__ - Step 7119: {'lr': 0.0001184, 'samples': 227808, 'steps': 444, 'loss/train': 5.374937057495117} -09/20/2021 16:01:47 - INFO - __main__ - Step 7120: {'lr': 0.0001184, 'samples': 227840, 'steps': 444, 'loss/train': 5.445438861846924} -09/20/2021 16:01:48 - INFO - __main__ - Step 7121: {'lr': 0.00011866666666666669, 'samples': 227872, 'steps': 445, 'loss/train': 5.648751735687256} -09/20/2021 16:01:49 - INFO - __main__ - Step 7122: {'lr': 0.00011866666666666669, 'samples': 227904, 'steps': 445, 'loss/train': 4.643500328063965} -09/20/2021 16:01:50 - INFO - __main__ - Step 7123: {'lr': 0.00011866666666666669, 'samples': 227936, 'steps': 445, 'loss/train': 5.9120097160339355} -09/20/2021 16:01:50 - INFO - __main__ - Step 7124: {'lr': 0.00011866666666666669, 'samples': 227968, 'steps': 445, 'loss/train': 4.822029113769531} -09/20/2021 16:01:51 - INFO - __main__ - Step 7125: {'lr': 0.00011866666666666669, 'samples': 228000, 'steps': 445, 'loss/train': 5.4515461921691895} -09/20/2021 16:01:52 - INFO - __main__ - Step 7126: {'lr': 0.00011866666666666669, 'samples': 228032, 'steps': 445, 'loss/train': 4.840950012207031} -09/20/2021 16:01:53 - INFO - __main__ - Step 7127: {'lr': 0.00011866666666666669, 'samples': 228064, 'steps': 445, 'loss/train': 5.117909908294678} -09/20/2021 16:01:54 - INFO - __main__ - Step 7128: {'lr': 0.00011866666666666669, 'samples': 228096, 'steps': 445, 'loss/train': 4.394682884216309} -09/20/2021 16:01:55 - INFO - __main__ - Step 7129: {'lr': 0.00011866666666666669, 'samples': 228128, 'steps': 445, 'loss/train': 5.0585808753967285} -09/20/2021 16:01:55 - INFO - __main__ - Step 7130: {'lr': 0.00011866666666666669, 'samples': 228160, 'steps': 445, 'loss/train': 5.490981578826904} -09/20/2021 16:01:56 - INFO - __main__ - Step 7131: {'lr': 0.00011866666666666669, 'samples': 228192, 'steps': 445, 'loss/train': 5.187209129333496} -09/20/2021 16:01:57 - INFO - __main__ - Step 7132: {'lr': 0.00011866666666666669, 'samples': 228224, 'steps': 445, 'loss/train': 4.634932994842529} -09/20/2021 16:01:58 - INFO - __main__ - Step 7133: {'lr': 0.00011866666666666669, 'samples': 228256, 'steps': 445, 'loss/train': 4.617866039276123} -09/20/2021 16:01:58 - INFO - __main__ - Step 7134: {'lr': 0.00011866666666666669, 'samples': 228288, 'steps': 445, 'loss/train': 5.343010902404785} -09/20/2021 16:01:59 - INFO - __main__ - Step 7135: {'lr': 0.00011866666666666669, 'samples': 228320, 'steps': 445, 'loss/train': 5.474579811096191} -09/20/2021 16:02:00 - INFO - __main__ - Step 7136: {'lr': 0.00011866666666666669, 'samples': 228352, 'steps': 445, 'loss/train': 4.658284664154053} -09/20/2021 16:02:01 - INFO - __main__ - Step 7137: {'lr': 0.00011893333333333334, 'samples': 228384, 'steps': 446, 'loss/train': 5.607635974884033} -09/20/2021 16:02:01 - INFO - __main__ - Step 7138: {'lr': 0.00011893333333333334, 'samples': 228416, 'steps': 446, 'loss/train': 5.287203311920166} -09/20/2021 16:02:02 - INFO - __main__ - Step 7139: {'lr': 0.00011893333333333334, 'samples': 228448, 'steps': 446, 'loss/train': 5.336169242858887} -09/20/2021 16:02:03 - INFO - __main__ - Step 7140: {'lr': 0.00011893333333333334, 'samples': 228480, 'steps': 446, 'loss/train': 4.3090291023254395} -09/20/2021 16:02:04 - INFO - __main__ - Step 7141: {'lr': 0.00011893333333333334, 'samples': 228512, 'steps': 446, 'loss/train': 4.389971733093262} -09/20/2021 16:02:04 - INFO - __main__ - Step 7142: {'lr': 0.00011893333333333334, 'samples': 228544, 'steps': 446, 'loss/train': 5.056092739105225} -09/20/2021 16:02:05 - INFO - __main__ - Step 7143: {'lr': 0.00011893333333333334, 'samples': 228576, 'steps': 446, 'loss/train': 5.940206527709961} -09/20/2021 16:02:06 - INFO - __main__ - Step 7144: {'lr': 0.00011893333333333334, 'samples': 228608, 'steps': 446, 'loss/train': 5.028641700744629} -09/20/2021 16:02:07 - INFO - __main__ - Step 7145: {'lr': 0.00011893333333333334, 'samples': 228640, 'steps': 446, 'loss/train': 5.162530899047852} -09/20/2021 16:02:07 - INFO - __main__ - Step 7146: {'lr': 0.00011893333333333334, 'samples': 228672, 'steps': 446, 'loss/train': 1.0657004117965698} -09/20/2021 16:02:08 - INFO - __main__ - Step 7147: {'lr': 0.00011893333333333334, 'samples': 228704, 'steps': 446, 'loss/train': 4.569728851318359} -09/20/2021 16:02:09 - INFO - __main__ - Step 7148: {'lr': 0.00011893333333333334, 'samples': 228736, 'steps': 446, 'loss/train': 6.366339683532715} -09/20/2021 16:02:10 - INFO - __main__ - Step 7149: {'lr': 0.00011893333333333334, 'samples': 228768, 'steps': 446, 'loss/train': 2.5071589946746826} -09/20/2021 16:02:10 - INFO - __main__ - Step 7150: {'lr': 0.00011893333333333334, 'samples': 228800, 'steps': 446, 'loss/train': 5.309795379638672} -09/20/2021 16:02:11 - INFO - __main__ - Step 7151: {'lr': 0.00011893333333333334, 'samples': 228832, 'steps': 446, 'loss/train': 6.002483367919922} -09/20/2021 16:02:12 - INFO - __main__ - Step 7152: {'lr': 0.00011893333333333334, 'samples': 228864, 'steps': 446, 'loss/train': 5.193049430847168} -09/20/2021 16:02:13 - INFO - __main__ - Step 7153: {'lr': 0.0001192, 'samples': 228896, 'steps': 447, 'loss/train': 4.9358086585998535} -09/20/2021 16:02:14 - INFO - __main__ - Step 7154: {'lr': 0.0001192, 'samples': 228928, 'steps': 447, 'loss/train': 4.8753767013549805} -09/20/2021 16:02:14 - INFO - __main__ - Step 7155: {'lr': 0.0001192, 'samples': 228960, 'steps': 447, 'loss/train': 6.097005367279053} -09/20/2021 16:02:15 - INFO - __main__ - Step 7156: {'lr': 0.0001192, 'samples': 228992, 'steps': 447, 'loss/train': 6.409482479095459} -09/20/2021 16:02:17 - INFO - __main__ - Step 7157: {'lr': 0.0001192, 'samples': 229024, 'steps': 447, 'loss/train': 5.381659507751465} -09/20/2021 16:02:18 - INFO - __main__ - Step 7158: {'lr': 0.0001192, 'samples': 229056, 'steps': 447, 'loss/train': 5.642935276031494} -09/20/2021 16:02:19 - INFO - __main__ - Step 7159: {'lr': 0.0001192, 'samples': 229088, 'steps': 447, 'loss/train': 5.288673400878906} -09/20/2021 16:02:20 - INFO - __main__ - Step 7160: {'lr': 0.0001192, 'samples': 229120, 'steps': 447, 'loss/train': 7.622968673706055} -09/20/2021 16:02:20 - INFO - __main__ - Step 7161: {'lr': 0.0001192, 'samples': 229152, 'steps': 447, 'loss/train': 4.98046350479126} -09/20/2021 16:02:21 - INFO - __main__ - Step 7162: {'lr': 0.0001192, 'samples': 229184, 'steps': 447, 'loss/train': 5.292484760284424} -09/20/2021 16:02:22 - INFO - __main__ - Step 7163: {'lr': 0.0001192, 'samples': 229216, 'steps': 447, 'loss/train': 5.520038604736328} -09/20/2021 16:02:23 - INFO - __main__ - Step 7164: {'lr': 0.0001192, 'samples': 229248, 'steps': 447, 'loss/train': 5.821788311004639} -09/20/2021 16:02:23 - INFO - __main__ - Step 7165: {'lr': 0.0001192, 'samples': 229280, 'steps': 447, 'loss/train': 2.9537594318389893} -09/20/2021 16:02:24 - INFO - __main__ - Step 7166: {'lr': 0.0001192, 'samples': 229312, 'steps': 447, 'loss/train': 5.317448139190674} -09/20/2021 16:02:25 - INFO - __main__ - Step 7167: {'lr': 0.0001192, 'samples': 229344, 'steps': 447, 'loss/train': 4.779819488525391} -09/20/2021 16:02:26 - INFO - __main__ - Step 7168: {'lr': 0.0001192, 'samples': 229376, 'steps': 447, 'loss/train': 6.554901123046875} -09/20/2021 16:02:27 - INFO - __main__ - Step 7169: {'lr': 0.00011946666666666668, 'samples': 229408, 'steps': 448, 'loss/train': 5.1733479499816895} -09/20/2021 16:02:27 - INFO - __main__ - Step 7170: {'lr': 0.00011946666666666668, 'samples': 229440, 'steps': 448, 'loss/train': 4.516578674316406} -09/20/2021 16:02:28 - INFO - __main__ - Step 7171: {'lr': 0.00011946666666666668, 'samples': 229472, 'steps': 448, 'loss/train': 4.981825351715088} -09/20/2021 16:02:29 - INFO - __main__ - Step 7172: {'lr': 0.00011946666666666668, 'samples': 229504, 'steps': 448, 'loss/train': 5.45286226272583} -09/20/2021 16:02:30 - INFO - __main__ - Step 7173: {'lr': 0.00011946666666666668, 'samples': 229536, 'steps': 448, 'loss/train': 6.232016563415527} -09/20/2021 16:02:30 - INFO - __main__ - Step 7174: {'lr': 0.00011946666666666668, 'samples': 229568, 'steps': 448, 'loss/train': 5.154457092285156} -09/20/2021 16:02:31 - INFO - __main__ - Step 7175: {'lr': 0.00011946666666666668, 'samples': 229600, 'steps': 448, 'loss/train': 5.341779708862305} -09/20/2021 16:02:32 - INFO - __main__ - Step 7176: {'lr': 0.00011946666666666668, 'samples': 229632, 'steps': 448, 'loss/train': 4.872687339782715} -09/20/2021 16:02:33 - INFO - __main__ - Step 7177: {'lr': 0.00011946666666666668, 'samples': 229664, 'steps': 448, 'loss/train': 4.568483352661133} -09/20/2021 16:02:33 - INFO - __main__ - Step 7178: {'lr': 0.00011946666666666668, 'samples': 229696, 'steps': 448, 'loss/train': 4.771674156188965} -09/20/2021 16:02:34 - INFO - __main__ - Step 7179: {'lr': 0.00011946666666666668, 'samples': 229728, 'steps': 448, 'loss/train': 4.690338611602783} -09/20/2021 16:02:35 - INFO - __main__ - Step 7180: {'lr': 0.00011946666666666668, 'samples': 229760, 'steps': 448, 'loss/train': 4.782427787780762} -09/20/2021 16:02:36 - INFO - __main__ - Step 7181: {'lr': 0.00011946666666666668, 'samples': 229792, 'steps': 448, 'loss/train': 4.892975807189941} -09/20/2021 16:02:36 - INFO - __main__ - Step 7182: {'lr': 0.00011946666666666668, 'samples': 229824, 'steps': 448, 'loss/train': 4.624279499053955} -09/20/2021 16:02:37 - INFO - __main__ - Step 7183: {'lr': 0.00011946666666666668, 'samples': 229856, 'steps': 448, 'loss/train': 4.68069314956665} -09/20/2021 16:02:38 - INFO - __main__ - Step 7184: {'lr': 0.00011946666666666668, 'samples': 229888, 'steps': 448, 'loss/train': 5.2611613273620605} -09/20/2021 16:02:39 - INFO - __main__ - Step 7185: {'lr': 0.00011973333333333335, 'samples': 229920, 'steps': 449, 'loss/train': 4.984877109527588} -09/20/2021 16:02:39 - INFO - __main__ - Step 7186: {'lr': 0.00011973333333333335, 'samples': 229952, 'steps': 449, 'loss/train': 5.0888285636901855} -09/20/2021 16:02:40 - INFO - __main__ - Step 7187: {'lr': 0.00011973333333333335, 'samples': 229984, 'steps': 449, 'loss/train': 5.763420581817627} -09/20/2021 16:02:41 - INFO - __main__ - Step 7188: {'lr': 0.00011973333333333335, 'samples': 230016, 'steps': 449, 'loss/train': 4.745408535003662} -09/20/2021 16:02:42 - INFO - __main__ - Step 7189: {'lr': 0.00011973333333333335, 'samples': 230048, 'steps': 449, 'loss/train': 4.569273471832275} -09/20/2021 16:02:43 - INFO - __main__ - Step 7190: {'lr': 0.00011973333333333335, 'samples': 230080, 'steps': 449, 'loss/train': 4.170726776123047} -09/20/2021 16:02:44 - INFO - __main__ - Step 7191: {'lr': 0.00011973333333333335, 'samples': 230112, 'steps': 449, 'loss/train': 4.641967296600342} -09/20/2021 16:02:44 - INFO - __main__ - Step 7192: {'lr': 0.00011973333333333335, 'samples': 230144, 'steps': 449, 'loss/train': 4.947014331817627} -09/20/2021 16:02:45 - INFO - __main__ - Step 7193: {'lr': 0.00011973333333333335, 'samples': 230176, 'steps': 449, 'loss/train': 5.572672367095947} -09/20/2021 16:02:46 - INFO - __main__ - Step 7194: {'lr': 0.00011973333333333335, 'samples': 230208, 'steps': 449, 'loss/train': 4.328732490539551} -09/20/2021 16:02:47 - INFO - __main__ - Step 7195: {'lr': 0.00011973333333333335, 'samples': 230240, 'steps': 449, 'loss/train': 4.44368314743042} -09/20/2021 16:02:47 - INFO - __main__ - Step 7196: {'lr': 0.00011973333333333335, 'samples': 230272, 'steps': 449, 'loss/train': 4.815203666687012} -09/20/2021 16:02:48 - INFO - __main__ - Step 7197: {'lr': 0.00011973333333333335, 'samples': 230304, 'steps': 449, 'loss/train': 4.6420512199401855} -09/20/2021 16:02:49 - INFO - __main__ - Step 7198: {'lr': 0.00011973333333333335, 'samples': 230336, 'steps': 449, 'loss/train': 4.726474285125732} -09/20/2021 16:02:50 - INFO - __main__ - Step 7199: {'lr': 0.00011973333333333335, 'samples': 230368, 'steps': 449, 'loss/train': 4.467252254486084} -09/20/2021 16:02:50 - INFO - __main__ - Step 7200: {'lr': 0.00011973333333333335, 'samples': 230400, 'steps': 449, 'loss/train': 5.0026702880859375} -09/20/2021 16:02:51 - INFO - __main__ - Step 7201: {'lr': 0.00012, 'samples': 230432, 'steps': 450, 'loss/train': 5.2741899490356445} -09/20/2021 16:02:52 - INFO - __main__ - Step 7202: {'lr': 0.00012, 'samples': 230464, 'steps': 450, 'loss/train': 4.978912830352783} -09/20/2021 16:02:53 - INFO - __main__ - Step 7203: {'lr': 0.00012, 'samples': 230496, 'steps': 450, 'loss/train': 4.734591484069824} -09/20/2021 16:02:54 - INFO - __main__ - Step 7204: {'lr': 0.00012, 'samples': 230528, 'steps': 450, 'loss/train': 4.810159683227539} -09/20/2021 16:02:54 - INFO - __main__ - Step 7205: {'lr': 0.00012, 'samples': 230560, 'steps': 450, 'loss/train': 4.257649898529053} -09/20/2021 16:02:55 - INFO - __main__ - Step 7206: {'lr': 0.00012, 'samples': 230592, 'steps': 450, 'loss/train': 4.449889183044434} -09/20/2021 16:02:56 - INFO - __main__ - Step 7207: {'lr': 0.00012, 'samples': 230624, 'steps': 450, 'loss/train': 5.024677753448486} -09/20/2021 16:02:57 - INFO - __main__ - Step 7208: {'lr': 0.00012, 'samples': 230656, 'steps': 450, 'loss/train': 5.015509605407715} -09/20/2021 16:02:57 - INFO - __main__ - Step 7209: {'lr': 0.00012, 'samples': 230688, 'steps': 450, 'loss/train': 5.4484076499938965} -09/20/2021 16:02:58 - INFO - __main__ - Step 7210: {'lr': 0.00012, 'samples': 230720, 'steps': 450, 'loss/train': 4.919012069702148} -09/20/2021 16:02:59 - INFO - __main__ - Step 7211: {'lr': 0.00012, 'samples': 230752, 'steps': 450, 'loss/train': 5.438572406768799} -09/20/2021 16:03:00 - INFO - __main__ - Step 7212: {'lr': 0.00012, 'samples': 230784, 'steps': 450, 'loss/train': 4.9297404289245605} -09/20/2021 16:03:00 - INFO - __main__ - Step 7213: {'lr': 0.00012, 'samples': 230816, 'steps': 450, 'loss/train': 2.9956254959106445} -09/20/2021 16:03:01 - INFO - __main__ - Step 7214: {'lr': 0.00012, 'samples': 230848, 'steps': 450, 'loss/train': 3.236884593963623} -09/20/2021 16:03:02 - INFO - __main__ - Step 7215: {'lr': 0.00012, 'samples': 230880, 'steps': 450, 'loss/train': 4.765522480010986} -09/20/2021 16:03:03 - INFO - __main__ - Step 7216: {'lr': 0.00012, 'samples': 230912, 'steps': 450, 'loss/train': 4.031152248382568} -09/20/2021 16:03:04 - INFO - __main__ - Step 7217: {'lr': 0.00012026666666666669, 'samples': 230944, 'steps': 451, 'loss/train': 5.316596508026123} -09/20/2021 16:03:04 - INFO - __main__ - Step 7218: {'lr': 0.00012026666666666669, 'samples': 230976, 'steps': 451, 'loss/train': 4.228866100311279} -09/20/2021 16:03:05 - INFO - __main__ - Step 7219: {'lr': 0.00012026666666666669, 'samples': 231008, 'steps': 451, 'loss/train': 4.761346340179443} -09/20/2021 16:03:06 - INFO - __main__ - Step 7220: {'lr': 0.00012026666666666669, 'samples': 231040, 'steps': 451, 'loss/train': 5.0284929275512695} -09/20/2021 16:03:07 - INFO - __main__ - Step 7221: {'lr': 0.00012026666666666669, 'samples': 231072, 'steps': 451, 'loss/train': 4.709408283233643} -09/20/2021 16:03:08 - INFO - __main__ - Step 7222: {'lr': 0.00012026666666666669, 'samples': 231104, 'steps': 451, 'loss/train': 5.242715358734131} -09/20/2021 16:03:09 - INFO - __main__ - Step 7223: {'lr': 0.00012026666666666669, 'samples': 231136, 'steps': 451, 'loss/train': 5.237442493438721} -09/20/2021 16:03:09 - INFO - __main__ - Step 7224: {'lr': 0.00012026666666666669, 'samples': 231168, 'steps': 451, 'loss/train': 5.697751522064209} -09/20/2021 16:03:10 - INFO - __main__ - Step 7225: {'lr': 0.00012026666666666669, 'samples': 231200, 'steps': 451, 'loss/train': 5.007907390594482} -09/20/2021 16:03:11 - INFO - __main__ - Step 7226: {'lr': 0.00012026666666666669, 'samples': 231232, 'steps': 451, 'loss/train': 5.129699230194092} -09/20/2021 16:03:12 - INFO - __main__ - Step 7227: {'lr': 0.00012026666666666669, 'samples': 231264, 'steps': 451, 'loss/train': 5.303888320922852} -09/20/2021 16:03:12 - INFO - __main__ - Step 7228: {'lr': 0.00012026666666666669, 'samples': 231296, 'steps': 451, 'loss/train': 4.3009419441223145} -09/20/2021 16:03:13 - INFO - __main__ - Step 7229: {'lr': 0.00012026666666666669, 'samples': 231328, 'steps': 451, 'loss/train': 4.549489974975586} -09/20/2021 16:03:14 - INFO - __main__ - Step 7230: {'lr': 0.00012026666666666669, 'samples': 231360, 'steps': 451, 'loss/train': 5.590306282043457} -09/20/2021 16:03:15 - INFO - __main__ - Step 7231: {'lr': 0.00012026666666666669, 'samples': 231392, 'steps': 451, 'loss/train': 5.701260089874268} -09/20/2021 16:03:15 - INFO - __main__ - Step 7232: {'lr': 0.00012026666666666669, 'samples': 231424, 'steps': 451, 'loss/train': 5.349546432495117} -09/20/2021 16:03:16 - INFO - __main__ - Step 7233: {'lr': 0.00012053333333333334, 'samples': 231456, 'steps': 452, 'loss/train': 5.912286281585693} -09/20/2021 16:03:17 - INFO - __main__ - Step 7234: {'lr': 0.00012053333333333334, 'samples': 231488, 'steps': 452, 'loss/train': 4.383343696594238} -09/20/2021 16:03:18 - INFO - __main__ - Step 7235: {'lr': 0.00012053333333333334, 'samples': 231520, 'steps': 452, 'loss/train': 4.942287445068359} -09/20/2021 16:03:18 - INFO - __main__ - Step 7236: {'lr': 0.00012053333333333334, 'samples': 231552, 'steps': 452, 'loss/train': 4.864915370941162} -09/20/2021 16:03:19 - INFO - __main__ - Step 7237: {'lr': 0.00012053333333333334, 'samples': 231584, 'steps': 452, 'loss/train': 4.444822311401367} -09/20/2021 16:03:20 - INFO - __main__ - Step 7238: {'lr': 0.00012053333333333334, 'samples': 231616, 'steps': 452, 'loss/train': 4.209653377532959} -09/20/2021 16:03:21 - INFO - __main__ - Step 7239: {'lr': 0.00012053333333333334, 'samples': 231648, 'steps': 452, 'loss/train': 5.0812506675720215} -09/20/2021 16:03:21 - INFO - __main__ - Step 7240: {'lr': 0.00012053333333333334, 'samples': 231680, 'steps': 452, 'loss/train': 5.396887302398682} -09/20/2021 16:03:22 - INFO - __main__ - Step 7241: {'lr': 0.00012053333333333334, 'samples': 231712, 'steps': 452, 'loss/train': 4.560201644897461} -09/20/2021 16:03:23 - INFO - __main__ - Step 7242: {'lr': 0.00012053333333333334, 'samples': 231744, 'steps': 452, 'loss/train': 4.90788459777832} -09/20/2021 16:03:24 - INFO - __main__ - Step 7243: {'lr': 0.00012053333333333334, 'samples': 231776, 'steps': 452, 'loss/train': 5.173142910003662} -09/20/2021 16:03:24 - INFO - __main__ - Step 7244: {'lr': 0.00012053333333333334, 'samples': 231808, 'steps': 452, 'loss/train': 5.441556453704834} -09/20/2021 16:03:25 - INFO - __main__ - Step 7245: {'lr': 0.00012053333333333334, 'samples': 231840, 'steps': 452, 'loss/train': 5.864333152770996} -09/20/2021 16:03:26 - INFO - __main__ - Step 7246: {'lr': 0.00012053333333333334, 'samples': 231872, 'steps': 452, 'loss/train': 5.21150016784668} -09/20/2021 16:03:27 - INFO - __main__ - Step 7247: {'lr': 0.00012053333333333334, 'samples': 231904, 'steps': 452, 'loss/train': 5.1560492515563965} -09/20/2021 16:03:27 - INFO - __main__ - Step 7248: {'lr': 0.00012053333333333334, 'samples': 231936, 'steps': 452, 'loss/train': 4.561408042907715} -09/20/2021 16:03:28 - INFO - __main__ - Step 7249: {'lr': 0.0001208, 'samples': 231968, 'steps': 453, 'loss/train': 5.11685037612915} -09/20/2021 16:03:29 - INFO - __main__ - Step 7250: {'lr': 0.0001208, 'samples': 232000, 'steps': 453, 'loss/train': 5.227630615234375} -09/20/2021 16:03:30 - INFO - __main__ - Step 7251: {'lr': 0.0001208, 'samples': 232032, 'steps': 453, 'loss/train': 4.7109551429748535} -09/20/2021 16:03:31 - INFO - __main__ - Step 7252: {'lr': 0.0001208, 'samples': 232064, 'steps': 453, 'loss/train': 4.48485803604126} -09/20/2021 16:03:32 - INFO - __main__ - Step 7253: {'lr': 0.0001208, 'samples': 232096, 'steps': 453, 'loss/train': 5.078672885894775} -09/20/2021 16:03:33 - INFO - __main__ - Step 7254: {'lr': 0.0001208, 'samples': 232128, 'steps': 453, 'loss/train': 4.383066654205322} -09/20/2021 16:03:33 - INFO - __main__ - Step 7255: {'lr': 0.0001208, 'samples': 232160, 'steps': 453, 'loss/train': 5.908428192138672} -09/20/2021 16:03:34 - INFO - __main__ - Step 7256: {'lr': 0.0001208, 'samples': 232192, 'steps': 453, 'loss/train': 4.625698089599609} -09/20/2021 16:03:35 - INFO - __main__ - Step 7257: {'lr': 0.0001208, 'samples': 232224, 'steps': 453, 'loss/train': 5.775930404663086} -09/20/2021 16:03:36 - INFO - __main__ - Step 7258: {'lr': 0.0001208, 'samples': 232256, 'steps': 453, 'loss/train': 5.509486198425293} -09/20/2021 16:03:36 - INFO - __main__ - Step 7259: {'lr': 0.0001208, 'samples': 232288, 'steps': 453, 'loss/train': 5.706762790679932} -09/20/2021 16:03:37 - INFO - __main__ - Step 7260: {'lr': 0.0001208, 'samples': 232320, 'steps': 453, 'loss/train': 5.290687084197998} -09/20/2021 16:03:38 - INFO - __main__ - Step 7261: {'lr': 0.0001208, 'samples': 232352, 'steps': 453, 'loss/train': 5.445558547973633} -09/20/2021 16:03:39 - INFO - __main__ - Step 7262: {'lr': 0.0001208, 'samples': 232384, 'steps': 453, 'loss/train': 5.938233375549316} -09/20/2021 16:03:39 - INFO - __main__ - Step 7263: {'lr': 0.0001208, 'samples': 232416, 'steps': 453, 'loss/train': 4.720699310302734} -09/20/2021 16:03:40 - INFO - __main__ - Step 7264: {'lr': 0.0001208, 'samples': 232448, 'steps': 453, 'loss/train': 4.612132549285889} -09/20/2021 16:03:41 - INFO - __main__ - Step 7265: {'lr': 0.00012106666666666666, 'samples': 232480, 'steps': 454, 'loss/train': 4.994317054748535} -09/20/2021 16:03:42 - INFO - __main__ - Step 7266: {'lr': 0.00012106666666666666, 'samples': 232512, 'steps': 454, 'loss/train': 5.053410053253174} -09/20/2021 16:03:43 - INFO - __main__ - Step 7267: {'lr': 0.00012106666666666666, 'samples': 232544, 'steps': 454, 'loss/train': 4.197361946105957} -09/20/2021 16:03:43 - INFO - __main__ - Step 7268: {'lr': 0.00012106666666666666, 'samples': 232576, 'steps': 454, 'loss/train': 5.435714244842529} -09/20/2021 16:03:44 - INFO - __main__ - Step 7269: {'lr': 0.00012106666666666666, 'samples': 232608, 'steps': 454, 'loss/train': 6.045768737792969} -09/20/2021 16:03:45 - INFO - __main__ - Step 7270: {'lr': 0.00012106666666666666, 'samples': 232640, 'steps': 454, 'loss/train': 4.823723793029785} -09/20/2021 16:03:46 - INFO - __main__ - Step 7271: {'lr': 0.00012106666666666666, 'samples': 232672, 'steps': 454, 'loss/train': 5.00532865524292} -09/20/2021 16:03:46 - INFO - __main__ - Step 7272: {'lr': 0.00012106666666666666, 'samples': 232704, 'steps': 454, 'loss/train': 6.175492763519287} -09/20/2021 16:03:47 - INFO - __main__ - Step 7273: {'lr': 0.00012106666666666666, 'samples': 232736, 'steps': 454, 'loss/train': 5.132211208343506} -09/20/2021 16:03:48 - INFO - __main__ - Step 7274: {'lr': 0.00012106666666666666, 'samples': 232768, 'steps': 454, 'loss/train': 4.289505958557129} -09/20/2021 16:03:49 - INFO - __main__ - Step 7275: {'lr': 0.00012106666666666666, 'samples': 232800, 'steps': 454, 'loss/train': 4.03167724609375} -09/20/2021 16:03:49 - INFO - __main__ - Step 7276: {'lr': 0.00012106666666666666, 'samples': 232832, 'steps': 454, 'loss/train': 5.321635723114014} -09/20/2021 16:03:50 - INFO - __main__ - Step 7277: {'lr': 0.00012106666666666666, 'samples': 232864, 'steps': 454, 'loss/train': 4.400756359100342} -09/20/2021 16:03:51 - INFO - __main__ - Step 7278: {'lr': 0.00012106666666666666, 'samples': 232896, 'steps': 454, 'loss/train': 4.110419273376465} -09/20/2021 16:03:52 - INFO - __main__ - Step 7279: {'lr': 0.00012106666666666666, 'samples': 232928, 'steps': 454, 'loss/train': 3.5880887508392334} -09/20/2021 16:03:52 - INFO - __main__ - Step 7280: {'lr': 0.00012106666666666666, 'samples': 232960, 'steps': 454, 'loss/train': 5.318213939666748} -09/20/2021 16:03:53 - INFO - __main__ - Step 7281: {'lr': 0.00012133333333333335, 'samples': 232992, 'steps': 455, 'loss/train': 4.913898944854736} -09/20/2021 16:03:54 - INFO - __main__ - Step 7282: {'lr': 0.00012133333333333335, 'samples': 233024, 'steps': 455, 'loss/train': 4.900660037994385} -09/20/2021 16:03:55 - INFO - __main__ - Step 7283: {'lr': 0.00012133333333333335, 'samples': 233056, 'steps': 455, 'loss/train': 5.762563705444336} -09/20/2021 16:03:56 - INFO - __main__ - Step 7284: {'lr': 0.00012133333333333335, 'samples': 233088, 'steps': 455, 'loss/train': 4.725808620452881} -09/20/2021 16:03:57 - INFO - __main__ - Step 7285: {'lr': 0.00012133333333333335, 'samples': 233120, 'steps': 455, 'loss/train': 5.161486625671387} -09/20/2021 16:03:57 - INFO - __main__ - Step 7286: {'lr': 0.00012133333333333335, 'samples': 233152, 'steps': 455, 'loss/train': 4.309919834136963} -09/20/2021 16:03:58 - INFO - __main__ - Step 7287: {'lr': 0.00012133333333333335, 'samples': 233184, 'steps': 455, 'loss/train': 4.680462837219238} -09/20/2021 16:03:59 - INFO - __main__ - Step 7288: {'lr': 0.00012133333333333335, 'samples': 233216, 'steps': 455, 'loss/train': 4.333162307739258} -09/20/2021 16:04:00 - INFO - __main__ - Step 7289: {'lr': 0.00012133333333333335, 'samples': 233248, 'steps': 455, 'loss/train': 6.227027416229248} -09/20/2021 16:04:00 - INFO - __main__ - Step 7290: {'lr': 0.00012133333333333335, 'samples': 233280, 'steps': 455, 'loss/train': 4.915371417999268} -09/20/2021 16:04:01 - INFO - __main__ - Step 7291: {'lr': 0.00012133333333333335, 'samples': 233312, 'steps': 455, 'loss/train': 4.070094585418701} -09/20/2021 16:04:02 - INFO - __main__ - Step 7292: {'lr': 0.00012133333333333335, 'samples': 233344, 'steps': 455, 'loss/train': 5.090342044830322} -09/20/2021 16:04:03 - INFO - __main__ - Step 7293: {'lr': 0.00012133333333333335, 'samples': 233376, 'steps': 455, 'loss/train': 4.8827409744262695} -09/20/2021 16:04:03 - INFO - __main__ - Step 7294: {'lr': 0.00012133333333333335, 'samples': 233408, 'steps': 455, 'loss/train': 4.964282512664795} -09/20/2021 16:04:04 - INFO - __main__ - Step 7295: {'lr': 0.00012133333333333335, 'samples': 233440, 'steps': 455, 'loss/train': 4.792296886444092} -09/20/2021 16:04:05 - INFO - __main__ - Step 7296: {'lr': 0.00012133333333333335, 'samples': 233472, 'steps': 455, 'loss/train': 5.065532207489014} -09/20/2021 16:04:06 - INFO - __main__ - Step 7297: {'lr': 0.0001216, 'samples': 233504, 'steps': 456, 'loss/train': 5.269762992858887} -09/20/2021 16:04:07 - INFO - __main__ - Step 7298: {'lr': 0.0001216, 'samples': 233536, 'steps': 456, 'loss/train': 3.4835660457611084} -09/20/2021 16:04:07 - INFO - __main__ - Step 7299: {'lr': 0.0001216, 'samples': 233568, 'steps': 456, 'loss/train': 4.569561004638672} -09/20/2021 16:04:08 - INFO - __main__ - Step 7300: {'lr': 0.0001216, 'samples': 233600, 'steps': 456, 'loss/train': 5.217222213745117} -09/20/2021 16:04:09 - INFO - __main__ - Step 7301: {'lr': 0.0001216, 'samples': 233632, 'steps': 456, 'loss/train': 4.612789630889893} -09/20/2021 16:04:10 - INFO - __main__ - Step 7302: {'lr': 0.0001216, 'samples': 233664, 'steps': 456, 'loss/train': 5.412721633911133} -09/20/2021 16:04:10 - INFO - __main__ - Step 7303: {'lr': 0.0001216, 'samples': 233696, 'steps': 456, 'loss/train': 5.802995204925537} -09/20/2021 16:04:11 - INFO - __main__ - Step 7304: {'lr': 0.0001216, 'samples': 233728, 'steps': 456, 'loss/train': 4.920236110687256} -09/20/2021 16:04:12 - INFO - __main__ - Step 7305: {'lr': 0.0001216, 'samples': 233760, 'steps': 456, 'loss/train': 4.534509658813477} -09/20/2021 16:04:13 - INFO - __main__ - Step 7306: {'lr': 0.0001216, 'samples': 233792, 'steps': 456, 'loss/train': 5.960755825042725} -09/20/2021 16:04:13 - INFO - __main__ - Step 7307: {'lr': 0.0001216, 'samples': 233824, 'steps': 456, 'loss/train': 6.079678058624268} -09/20/2021 16:04:14 - INFO - __main__ - Step 7308: {'lr': 0.0001216, 'samples': 233856, 'steps': 456, 'loss/train': 6.335751533508301} -09/20/2021 16:04:15 - INFO - __main__ - Step 7309: {'lr': 0.0001216, 'samples': 233888, 'steps': 456, 'loss/train': 5.733253479003906} -09/20/2021 16:04:16 - INFO - __main__ - Step 7310: {'lr': 0.0001216, 'samples': 233920, 'steps': 456, 'loss/train': 4.847565174102783} -09/20/2021 16:04:16 - INFO - __main__ - Step 7311: {'lr': 0.0001216, 'samples': 233952, 'steps': 456, 'loss/train': 4.468441009521484} -09/20/2021 16:04:17 - INFO - __main__ - Step 7312: {'lr': 0.0001216, 'samples': 233984, 'steps': 456, 'loss/train': 5.267650604248047} -09/20/2021 16:04:19 - INFO - __main__ - Step 7313: {'lr': 0.00012186666666666666, 'samples': 234016, 'steps': 457, 'loss/train': 4.962606906890869} -09/20/2021 16:04:19 - INFO - __main__ - Step 7314: {'lr': 0.00012186666666666666, 'samples': 234048, 'steps': 457, 'loss/train': 4.570956707000732} -09/20/2021 16:04:20 - INFO - __main__ - Step 7315: {'lr': 0.00012186666666666666, 'samples': 234080, 'steps': 457, 'loss/train': 4.719027042388916} -09/20/2021 16:04:21 - INFO - __main__ - Step 7316: {'lr': 0.00012186666666666666, 'samples': 234112, 'steps': 457, 'loss/train': 3.877723455429077} -09/20/2021 16:04:22 - INFO - __main__ - Step 7317: {'lr': 0.00012186666666666666, 'samples': 234144, 'steps': 457, 'loss/train': 3.842893600463867} -09/20/2021 16:04:22 - INFO - __main__ - Step 7318: {'lr': 0.00012186666666666666, 'samples': 234176, 'steps': 457, 'loss/train': 5.197667121887207} -09/20/2021 16:04:23 - INFO - __main__ - Step 7319: {'lr': 0.00012186666666666666, 'samples': 234208, 'steps': 457, 'loss/train': 5.280219078063965} -09/20/2021 16:04:24 - INFO - __main__ - Step 7320: {'lr': 0.00012186666666666666, 'samples': 234240, 'steps': 457, 'loss/train': 4.776626110076904} -09/20/2021 16:04:25 - INFO - __main__ - Step 7321: {'lr': 0.00012186666666666666, 'samples': 234272, 'steps': 457, 'loss/train': 4.909165382385254} -09/20/2021 16:04:25 - INFO - __main__ - Step 7322: {'lr': 0.00012186666666666666, 'samples': 234304, 'steps': 457, 'loss/train': 5.311565399169922} -09/20/2021 16:04:26 - INFO - __main__ - Step 7323: {'lr': 0.00012186666666666666, 'samples': 234336, 'steps': 457, 'loss/train': 5.033533573150635} -09/20/2021 16:04:27 - INFO - __main__ - Step 7324: {'lr': 0.00012186666666666666, 'samples': 234368, 'steps': 457, 'loss/train': 5.373739719390869} -09/20/2021 16:04:28 - INFO - __main__ - Step 7325: {'lr': 0.00012186666666666666, 'samples': 234400, 'steps': 457, 'loss/train': 5.162104606628418} -09/20/2021 16:04:28 - INFO - __main__ - Step 7326: {'lr': 0.00012186666666666666, 'samples': 234432, 'steps': 457, 'loss/train': 5.71993350982666} -09/20/2021 16:04:29 - INFO - __main__ - Step 7327: {'lr': 0.00012186666666666666, 'samples': 234464, 'steps': 457, 'loss/train': 4.162580490112305} -09/20/2021 16:04:30 - INFO - __main__ - Step 7328: {'lr': 0.00012186666666666666, 'samples': 234496, 'steps': 457, 'loss/train': 4.775973320007324} -09/20/2021 16:04:31 - INFO - __main__ - Step 7329: {'lr': 0.00012213333333333334, 'samples': 234528, 'steps': 458, 'loss/train': 5.378231525421143} -09/20/2021 16:04:32 - INFO - __main__ - Step 7330: {'lr': 0.00012213333333333334, 'samples': 234560, 'steps': 458, 'loss/train': 6.8586835861206055} -09/20/2021 16:04:32 - INFO - __main__ - Step 7331: {'lr': 0.00012213333333333334, 'samples': 234592, 'steps': 458, 'loss/train': 4.97754430770874} -09/20/2021 16:04:33 - INFO - __main__ - Step 7332: {'lr': 0.00012213333333333334, 'samples': 234624, 'steps': 458, 'loss/train': 5.137783050537109} -09/20/2021 16:04:34 - INFO - __main__ - Step 7333: {'lr': 0.00012213333333333334, 'samples': 234656, 'steps': 458, 'loss/train': 5.023401737213135} -09/20/2021 16:04:35 - INFO - __main__ - Step 7334: {'lr': 0.00012213333333333334, 'samples': 234688, 'steps': 458, 'loss/train': 5.005176067352295} -09/20/2021 16:04:35 - INFO - __main__ - Step 7335: {'lr': 0.00012213333333333334, 'samples': 234720, 'steps': 458, 'loss/train': 4.661386489868164} -09/20/2021 16:04:36 - INFO - __main__ - Step 7336: {'lr': 0.00012213333333333334, 'samples': 234752, 'steps': 458, 'loss/train': 5.364800453186035} -09/20/2021 16:04:37 - INFO - __main__ - Step 7337: {'lr': 0.00012213333333333334, 'samples': 234784, 'steps': 458, 'loss/train': 4.671205043792725} -09/20/2021 16:04:38 - INFO - __main__ - Step 7338: {'lr': 0.00012213333333333334, 'samples': 234816, 'steps': 458, 'loss/train': 4.912260055541992} -09/20/2021 16:04:38 - INFO - __main__ - Step 7339: {'lr': 0.00012213333333333334, 'samples': 234848, 'steps': 458, 'loss/train': 4.806763172149658} -09/20/2021 16:04:39 - INFO - __main__ - Step 7340: {'lr': 0.00012213333333333334, 'samples': 234880, 'steps': 458, 'loss/train': 2.783954620361328} -09/20/2021 16:04:40 - INFO - __main__ - Step 7341: {'lr': 0.00012213333333333334, 'samples': 234912, 'steps': 458, 'loss/train': 2.6896533966064453} -09/20/2021 16:04:41 - INFO - __main__ - Step 7342: {'lr': 0.00012213333333333334, 'samples': 234944, 'steps': 458, 'loss/train': 4.819274425506592} -09/20/2021 16:04:41 - INFO - __main__ - Step 7343: {'lr': 0.00012213333333333334, 'samples': 234976, 'steps': 458, 'loss/train': 4.099838733673096} -09/20/2021 16:04:43 - INFO - __main__ - Step 7344: {'lr': 0.00012213333333333334, 'samples': 235008, 'steps': 458, 'loss/train': 5.307132244110107} -09/20/2021 16:04:43 - INFO - __main__ - Step 7345: {'lr': 0.0001224, 'samples': 235040, 'steps': 459, 'loss/train': 5.084747791290283} -09/20/2021 16:04:44 - INFO - __main__ - Step 7346: {'lr': 0.0001224, 'samples': 235072, 'steps': 459, 'loss/train': 5.358036994934082} -09/20/2021 16:04:45 - INFO - __main__ - Step 7347: {'lr': 0.0001224, 'samples': 235104, 'steps': 459, 'loss/train': 5.1944756507873535} -09/20/2021 16:04:46 - INFO - __main__ - Step 7348: {'lr': 0.0001224, 'samples': 235136, 'steps': 459, 'loss/train': 4.640199184417725} -09/20/2021 16:04:46 - INFO - __main__ - Step 7349: {'lr': 0.0001224, 'samples': 235168, 'steps': 459, 'loss/train': 5.4507012367248535} -09/20/2021 16:04:47 - INFO - __main__ - Step 7350: {'lr': 0.0001224, 'samples': 235200, 'steps': 459, 'loss/train': 5.420350551605225} -09/20/2021 16:04:48 - INFO - __main__ - Step 7351: {'lr': 0.0001224, 'samples': 235232, 'steps': 459, 'loss/train': 6.474308013916016} -09/20/2021 16:04:49 - INFO - __main__ - Step 7352: {'lr': 0.0001224, 'samples': 235264, 'steps': 459, 'loss/train': 4.488390922546387} -09/20/2021 16:04:49 - INFO - __main__ - Step 7353: {'lr': 0.0001224, 'samples': 235296, 'steps': 459, 'loss/train': 5.5905070304870605} -09/20/2021 16:04:50 - INFO - __main__ - Step 7354: {'lr': 0.0001224, 'samples': 235328, 'steps': 459, 'loss/train': 3.4725146293640137} -09/20/2021 16:04:51 - INFO - __main__ - Step 7355: {'lr': 0.0001224, 'samples': 235360, 'steps': 459, 'loss/train': 4.623347282409668} -09/20/2021 16:04:52 - INFO - __main__ - Step 7356: {'lr': 0.0001224, 'samples': 235392, 'steps': 459, 'loss/train': 4.064384460449219} -09/20/2021 16:04:52 - INFO - __main__ - Step 7357: {'lr': 0.0001224, 'samples': 235424, 'steps': 459, 'loss/train': 5.0202789306640625} -09/20/2021 16:04:53 - INFO - __main__ - Step 7358: {'lr': 0.0001224, 'samples': 235456, 'steps': 459, 'loss/train': 5.5171308517456055} -09/20/2021 16:04:54 - INFO - __main__ - Step 7359: {'lr': 0.0001224, 'samples': 235488, 'steps': 459, 'loss/train': 5.332603931427002} -09/20/2021 16:04:55 - INFO - __main__ - Step 7360: {'lr': 0.0001224, 'samples': 235520, 'steps': 459, 'loss/train': 4.943603992462158} -09/20/2021 16:04:56 - INFO - __main__ - Step 7361: {'lr': 0.00012266666666666668, 'samples': 235552, 'steps': 460, 'loss/train': 4.25240421295166} -09/20/2021 16:04:56 - INFO - __main__ - Step 7362: {'lr': 0.00012266666666666668, 'samples': 235584, 'steps': 460, 'loss/train': 4.971428871154785} -09/20/2021 16:04:57 - INFO - __main__ - Step 7363: {'lr': 0.00012266666666666668, 'samples': 235616, 'steps': 460, 'loss/train': 3.860258102416992} -09/20/2021 16:04:58 - INFO - __main__ - Step 7364: {'lr': 0.00012266666666666668, 'samples': 235648, 'steps': 460, 'loss/train': 4.6215620040893555} -09/20/2021 16:04:59 - INFO - __main__ - Step 7365: {'lr': 0.00012266666666666668, 'samples': 235680, 'steps': 460, 'loss/train': 5.235167980194092} -09/20/2021 16:04:59 - INFO - __main__ - Step 7366: {'lr': 0.00012266666666666668, 'samples': 235712, 'steps': 460, 'loss/train': 5.576355934143066} -09/20/2021 16:05:00 - INFO - __main__ - Step 7367: {'lr': 0.00012266666666666668, 'samples': 235744, 'steps': 460, 'loss/train': 5.153991222381592} -09/20/2021 16:05:01 - INFO - __main__ - Step 7368: {'lr': 0.00012266666666666668, 'samples': 235776, 'steps': 460, 'loss/train': 3.7525510787963867} -09/20/2021 16:05:02 - INFO - __main__ - Step 7369: {'lr': 0.00012266666666666668, 'samples': 235808, 'steps': 460, 'loss/train': 4.691175937652588} -09/20/2021 16:05:02 - INFO - __main__ - Step 7370: {'lr': 0.00012266666666666668, 'samples': 235840, 'steps': 460, 'loss/train': 4.447870254516602} -09/20/2021 16:05:03 - INFO - __main__ - Step 7371: {'lr': 0.00012266666666666668, 'samples': 235872, 'steps': 460, 'loss/train': 4.653221607208252} -09/20/2021 16:05:04 - INFO - __main__ - Step 7372: {'lr': 0.00012266666666666668, 'samples': 235904, 'steps': 460, 'loss/train': 5.207758903503418} -09/20/2021 16:05:05 - INFO - __main__ - Step 7373: {'lr': 0.00012266666666666668, 'samples': 235936, 'steps': 460, 'loss/train': 5.129505157470703} -09/20/2021 16:05:05 - INFO - __main__ - Step 7374: {'lr': 0.00012266666666666668, 'samples': 235968, 'steps': 460, 'loss/train': 6.064978122711182} -09/20/2021 16:05:07 - INFO - __main__ - Step 7375: {'lr': 0.00012266666666666668, 'samples': 236000, 'steps': 460, 'loss/train': 5.62080717086792} -09/20/2021 16:05:07 - INFO - __main__ - Step 7376: {'lr': 0.00012266666666666668, 'samples': 236032, 'steps': 460, 'loss/train': 5.098077774047852} -09/20/2021 16:05:08 - INFO - __main__ - Step 7377: {'lr': 0.00012293333333333336, 'samples': 236064, 'steps': 461, 'loss/train': 5.695276737213135} -09/20/2021 16:05:09 - INFO - __main__ - Step 7378: {'lr': 0.00012293333333333336, 'samples': 236096, 'steps': 461, 'loss/train': 4.331623554229736} -09/20/2021 16:05:10 - INFO - __main__ - Step 7379: {'lr': 0.00012293333333333336, 'samples': 236128, 'steps': 461, 'loss/train': 5.206715106964111} -09/20/2021 16:05:11 - INFO - __main__ - Step 7380: {'lr': 0.00012293333333333336, 'samples': 236160, 'steps': 461, 'loss/train': 4.436736583709717} -09/20/2021 16:05:11 - INFO - __main__ - Step 7381: {'lr': 0.00012293333333333336, 'samples': 236192, 'steps': 461, 'loss/train': 5.516878604888916} -09/20/2021 16:05:12 - INFO - __main__ - Step 7382: {'lr': 0.00012293333333333336, 'samples': 236224, 'steps': 461, 'loss/train': 6.327261924743652} -09/20/2021 16:05:13 - INFO - __main__ - Step 7383: {'lr': 0.00012293333333333336, 'samples': 236256, 'steps': 461, 'loss/train': 5.133607864379883} -09/20/2021 16:05:14 - INFO - __main__ - Step 7384: {'lr': 0.00012293333333333336, 'samples': 236288, 'steps': 461, 'loss/train': 6.14782190322876} -09/20/2021 16:05:14 - INFO - __main__ - Step 7385: {'lr': 0.00012293333333333336, 'samples': 236320, 'steps': 461, 'loss/train': 4.978664398193359} -09/20/2021 16:05:15 - INFO - __main__ - Step 7386: {'lr': 0.00012293333333333336, 'samples': 236352, 'steps': 461, 'loss/train': 4.6238508224487305} -09/20/2021 16:05:16 - INFO - __main__ - Step 7387: {'lr': 0.00012293333333333336, 'samples': 236384, 'steps': 461, 'loss/train': 5.571641445159912} -09/20/2021 16:05:17 - INFO - __main__ - Step 7388: {'lr': 0.00012293333333333336, 'samples': 236416, 'steps': 461, 'loss/train': 4.539444923400879} -09/20/2021 16:05:17 - INFO - __main__ - Step 7389: {'lr': 0.00012293333333333336, 'samples': 236448, 'steps': 461, 'loss/train': 5.493902206420898} -09/20/2021 16:05:18 - INFO - __main__ - Step 7390: {'lr': 0.00012293333333333336, 'samples': 236480, 'steps': 461, 'loss/train': 5.249922752380371} -09/20/2021 16:05:19 - INFO - __main__ - Step 7391: {'lr': 0.00012293333333333336, 'samples': 236512, 'steps': 461, 'loss/train': 4.158466815948486} -09/20/2021 16:05:20 - INFO - __main__ - Step 7392: {'lr': 0.00012293333333333336, 'samples': 236544, 'steps': 461, 'loss/train': 5.866281509399414} -09/20/2021 16:05:21 - INFO - __main__ - Step 7393: {'lr': 0.0001232, 'samples': 236576, 'steps': 462, 'loss/train': 5.250998497009277} -09/20/2021 16:05:21 - INFO - __main__ - Step 7394: {'lr': 0.0001232, 'samples': 236608, 'steps': 462, 'loss/train': 4.750932216644287} -09/20/2021 16:05:22 - INFO - __main__ - Step 7395: {'lr': 0.0001232, 'samples': 236640, 'steps': 462, 'loss/train': 6.296382427215576} -09/20/2021 16:05:23 - INFO - __main__ - Step 7396: {'lr': 0.0001232, 'samples': 236672, 'steps': 462, 'loss/train': 4.66579532623291} -09/20/2021 16:05:24 - INFO - __main__ - Step 7397: {'lr': 0.0001232, 'samples': 236704, 'steps': 462, 'loss/train': 4.785472869873047} -09/20/2021 16:05:24 - INFO - __main__ - Step 7398: {'lr': 0.0001232, 'samples': 236736, 'steps': 462, 'loss/train': 4.2269368171691895} -09/20/2021 16:05:25 - INFO - __main__ - Step 7399: {'lr': 0.0001232, 'samples': 236768, 'steps': 462, 'loss/train': 4.3915886878967285} -09/20/2021 16:05:26 - INFO - __main__ - Step 7400: {'lr': 0.0001232, 'samples': 236800, 'steps': 462, 'loss/train': 5.4484944343566895} -09/20/2021 16:05:27 - INFO - __main__ - Step 7401: {'lr': 0.0001232, 'samples': 236832, 'steps': 462, 'loss/train': 4.526267051696777} -09/20/2021 16:05:27 - INFO - __main__ - Step 7402: {'lr': 0.0001232, 'samples': 236864, 'steps': 462, 'loss/train': 4.8254923820495605} -09/20/2021 16:05:28 - INFO - __main__ - Step 7403: {'lr': 0.0001232, 'samples': 236896, 'steps': 462, 'loss/train': 4.748174667358398} -09/20/2021 16:05:29 - INFO - __main__ - Step 7404: {'lr': 0.0001232, 'samples': 236928, 'steps': 462, 'loss/train': 4.233503341674805} -09/20/2021 16:05:30 - INFO - __main__ - Step 7405: {'lr': 0.0001232, 'samples': 236960, 'steps': 462, 'loss/train': 4.789389133453369} -09/20/2021 16:05:31 - INFO - __main__ - Step 7406: {'lr': 0.0001232, 'samples': 236992, 'steps': 462, 'loss/train': 4.4197916984558105} -09/20/2021 16:05:32 - INFO - __main__ - Step 7407: {'lr': 0.0001232, 'samples': 237024, 'steps': 462, 'loss/train': 4.848060131072998} -09/20/2021 16:05:32 - INFO - __main__ - Step 7408: {'lr': 0.0001232, 'samples': 237056, 'steps': 462, 'loss/train': 4.781623363494873} -09/20/2021 16:05:33 - INFO - __main__ - Step 7409: {'lr': 0.00012346666666666667, 'samples': 237088, 'steps': 463, 'loss/train': 4.959803581237793} -09/20/2021 16:05:34 - INFO - __main__ - Step 7410: {'lr': 0.00012346666666666667, 'samples': 237120, 'steps': 463, 'loss/train': 2.2259764671325684} -09/20/2021 16:05:35 - INFO - __main__ - Step 7411: {'lr': 0.00012346666666666667, 'samples': 237152, 'steps': 463, 'loss/train': 2.091984987258911} -09/20/2021 16:05:35 - INFO - __main__ - Step 7412: {'lr': 0.00012346666666666667, 'samples': 237184, 'steps': 463, 'loss/train': 4.703676700592041} -09/20/2021 16:05:36 - INFO - __main__ - Step 7413: {'lr': 0.00012346666666666667, 'samples': 237216, 'steps': 463, 'loss/train': 5.491934299468994} -09/20/2021 16:05:37 - INFO - __main__ - Step 7414: {'lr': 0.00012346666666666667, 'samples': 237248, 'steps': 463, 'loss/train': 3.820615291595459} -09/20/2021 16:05:38 - INFO - __main__ - Step 7415: {'lr': 0.00012346666666666667, 'samples': 237280, 'steps': 463, 'loss/train': 4.62590217590332} -09/20/2021 16:05:38 - INFO - __main__ - Step 7416: {'lr': 0.00012346666666666667, 'samples': 237312, 'steps': 463, 'loss/train': 2.0193185806274414} -09/20/2021 16:05:39 - INFO - __main__ - Step 7417: {'lr': 0.00012346666666666667, 'samples': 237344, 'steps': 463, 'loss/train': 4.509789943695068} -09/20/2021 16:05:40 - INFO - __main__ - Step 7418: {'lr': 0.00012346666666666667, 'samples': 237376, 'steps': 463, 'loss/train': 4.620835781097412} -09/20/2021 16:05:41 - INFO - __main__ - Step 7419: {'lr': 0.00012346666666666667, 'samples': 237408, 'steps': 463, 'loss/train': 4.8717942237854} -09/20/2021 16:05:41 - INFO - __main__ - Step 7420: {'lr': 0.00012346666666666667, 'samples': 237440, 'steps': 463, 'loss/train': 4.9497880935668945} -09/20/2021 16:05:42 - INFO - __main__ - Step 7421: {'lr': 0.00012346666666666667, 'samples': 237472, 'steps': 463, 'loss/train': 4.516996383666992} -09/20/2021 16:05:43 - INFO - __main__ - Step 7422: {'lr': 0.00012346666666666667, 'samples': 237504, 'steps': 463, 'loss/train': 4.970673084259033} -09/20/2021 16:05:44 - INFO - __main__ - Step 7423: {'lr': 0.00012346666666666667, 'samples': 237536, 'steps': 463, 'loss/train': 5.352842807769775} -09/20/2021 16:05:44 - INFO - __main__ - Step 7424: {'lr': 0.00012346666666666667, 'samples': 237568, 'steps': 463, 'loss/train': 4.762048721313477} -09/20/2021 16:05:45 - INFO - __main__ - Step 7425: {'lr': 0.00012373333333333335, 'samples': 237600, 'steps': 464, 'loss/train': 4.239212512969971} -09/20/2021 16:05:46 - INFO - __main__ - Step 7426: {'lr': 0.00012373333333333335, 'samples': 237632, 'steps': 464, 'loss/train': 4.405455112457275} -09/20/2021 16:05:47 - INFO - __main__ - Step 7427: {'lr': 0.00012373333333333335, 'samples': 237664, 'steps': 464, 'loss/train': 4.630776882171631} -09/20/2021 16:05:48 - INFO - __main__ - Step 7428: {'lr': 0.00012373333333333335, 'samples': 237696, 'steps': 464, 'loss/train': 3.867370128631592} -09/20/2021 16:05:48 - INFO - __main__ - Step 7429: {'lr': 0.00012373333333333335, 'samples': 237728, 'steps': 464, 'loss/train': 4.577883243560791} -09/20/2021 16:05:49 - INFO - __main__ - Step 7430: {'lr': 0.00012373333333333335, 'samples': 237760, 'steps': 464, 'loss/train': 4.496367931365967} -09/20/2021 16:05:50 - INFO - __main__ - Step 7431: {'lr': 0.00012373333333333335, 'samples': 237792, 'steps': 464, 'loss/train': 4.099760055541992} -09/20/2021 16:05:51 - INFO - __main__ - Step 7432: {'lr': 0.00012373333333333335, 'samples': 237824, 'steps': 464, 'loss/train': 4.144007682800293} -09/20/2021 16:05:51 - INFO - __main__ - Step 7433: {'lr': 0.00012373333333333335, 'samples': 237856, 'steps': 464, 'loss/train': 4.983336925506592} -09/20/2021 16:05:52 - INFO - __main__ - Step 7434: {'lr': 0.00012373333333333335, 'samples': 237888, 'steps': 464, 'loss/train': 4.91481876373291} -09/20/2021 16:05:54 - INFO - __main__ - Step 7435: {'lr': 0.00012373333333333335, 'samples': 237920, 'steps': 464, 'loss/train': 5.584636211395264} -09/20/2021 16:05:54 - INFO - __main__ - Step 7436: {'lr': 0.00012373333333333335, 'samples': 237952, 'steps': 464, 'loss/train': 4.78622579574585} -09/20/2021 16:05:55 - INFO - __main__ - Step 7437: {'lr': 0.00012373333333333335, 'samples': 237984, 'steps': 464, 'loss/train': 5.869943141937256} -09/20/2021 16:05:56 - INFO - __main__ - Step 7438: {'lr': 0.00012373333333333335, 'samples': 238016, 'steps': 464, 'loss/train': 5.905243873596191} -09/20/2021 16:05:57 - INFO - __main__ - Step 7439: {'lr': 0.00012373333333333335, 'samples': 238048, 'steps': 464, 'loss/train': 5.133723735809326} -09/20/2021 16:05:57 - INFO - __main__ - Step 7440: {'lr': 0.00012373333333333335, 'samples': 238080, 'steps': 464, 'loss/train': 4.560364246368408} -09/20/2021 16:05:58 - INFO - __main__ - Step 7441: {'lr': 0.000124, 'samples': 238112, 'steps': 465, 'loss/train': 4.9699482917785645} -09/20/2021 16:05:59 - INFO - __main__ - Step 7442: {'lr': 0.000124, 'samples': 238144, 'steps': 465, 'loss/train': 4.839716911315918} -09/20/2021 16:06:00 - INFO - __main__ - Step 7443: {'lr': 0.000124, 'samples': 238176, 'steps': 465, 'loss/train': 4.41544771194458} -09/20/2021 16:06:00 - INFO - __main__ - Step 7444: {'lr': 0.000124, 'samples': 238208, 'steps': 465, 'loss/train': 4.994120121002197} -09/20/2021 16:06:01 - INFO - __main__ - Step 7445: {'lr': 0.000124, 'samples': 238240, 'steps': 465, 'loss/train': 4.741170406341553} -09/20/2021 16:06:02 - INFO - __main__ - Step 7446: {'lr': 0.000124, 'samples': 238272, 'steps': 465, 'loss/train': 3.6374056339263916} -09/20/2021 16:06:03 - INFO - __main__ - Step 7447: {'lr': 0.000124, 'samples': 238304, 'steps': 465, 'loss/train': 5.034252166748047} -09/20/2021 16:06:03 - INFO - __main__ - Step 7448: {'lr': 0.000124, 'samples': 238336, 'steps': 465, 'loss/train': 4.696845054626465} -09/20/2021 16:06:04 - INFO - __main__ - Step 7449: {'lr': 0.000124, 'samples': 238368, 'steps': 465, 'loss/train': 4.874663829803467} -09/20/2021 16:06:05 - INFO - __main__ - Step 7450: {'lr': 0.000124, 'samples': 238400, 'steps': 465, 'loss/train': 4.427073001861572} -09/20/2021 16:06:06 - INFO - __main__ - Step 7451: {'lr': 0.000124, 'samples': 238432, 'steps': 465, 'loss/train': 4.424759864807129} -09/20/2021 16:06:06 - INFO - __main__ - Step 7452: {'lr': 0.000124, 'samples': 238464, 'steps': 465, 'loss/train': 5.986752986907959} -09/20/2021 16:06:07 - INFO - __main__ - Step 7453: {'lr': 0.000124, 'samples': 238496, 'steps': 465, 'loss/train': 5.11374568939209} -09/20/2021 16:06:08 - INFO - __main__ - Step 7454: {'lr': 0.000124, 'samples': 238528, 'steps': 465, 'loss/train': 6.158735752105713} -09/20/2021 16:06:09 - INFO - __main__ - Step 7455: {'lr': 0.000124, 'samples': 238560, 'steps': 465, 'loss/train': 0.6167276501655579} -09/20/2021 16:06:09 - INFO - __main__ - Step 7456: {'lr': 0.000124, 'samples': 238592, 'steps': 465, 'loss/train': 4.775589942932129} -09/20/2021 16:06:10 - INFO - __main__ - Step 7457: {'lr': 0.00012426666666666666, 'samples': 238624, 'steps': 466, 'loss/train': 5.77016019821167} -09/20/2021 16:06:11 - INFO - __main__ - Step 7458: {'lr': 0.00012426666666666666, 'samples': 238656, 'steps': 466, 'loss/train': 4.8437275886535645} -09/20/2021 16:06:12 - INFO - __main__ - Step 7459: {'lr': 0.00012426666666666666, 'samples': 238688, 'steps': 466, 'loss/train': 4.917807102203369} -09/20/2021 16:06:13 - INFO - __main__ - Step 7460: {'lr': 0.00012426666666666666, 'samples': 238720, 'steps': 466, 'loss/train': 4.430678844451904} -09/20/2021 16:06:13 - INFO - __main__ - Step 7461: {'lr': 0.00012426666666666666, 'samples': 238752, 'steps': 466, 'loss/train': 3.999069929122925} -09/20/2021 16:06:14 - INFO - __main__ - Step 7462: {'lr': 0.00012426666666666666, 'samples': 238784, 'steps': 466, 'loss/train': 3.3355484008789062} -09/20/2021 16:06:15 - INFO - __main__ - Step 7463: {'lr': 0.00012426666666666666, 'samples': 238816, 'steps': 466, 'loss/train': 2.2365145683288574} -09/20/2021 16:06:16 - INFO - __main__ - Step 7464: {'lr': 0.00012426666666666666, 'samples': 238848, 'steps': 466, 'loss/train': 1.919191598892212} -09/20/2021 16:06:16 - INFO - __main__ - Step 7465: {'lr': 0.00012426666666666666, 'samples': 238880, 'steps': 466, 'loss/train': 4.612288951873779} -09/20/2021 16:06:18 - INFO - __main__ - Step 7466: {'lr': 0.00012426666666666666, 'samples': 238912, 'steps': 466, 'loss/train': 5.061590194702148} -09/20/2021 16:06:18 - INFO - __main__ - Step 7467: {'lr': 0.00012426666666666666, 'samples': 238944, 'steps': 466, 'loss/train': 5.602367401123047} -09/20/2021 16:06:19 - INFO - __main__ - Step 7468: {'lr': 0.00012426666666666666, 'samples': 238976, 'steps': 466, 'loss/train': 6.060081958770752} -09/20/2021 16:06:20 - INFO - __main__ - Step 7469: {'lr': 0.00012426666666666666, 'samples': 239008, 'steps': 466, 'loss/train': 5.049441814422607} -09/20/2021 16:06:21 - INFO - __main__ - Step 7470: {'lr': 0.00012426666666666666, 'samples': 239040, 'steps': 466, 'loss/train': 4.87510871887207} -09/20/2021 16:06:21 - INFO - __main__ - Step 7471: {'lr': 0.00012426666666666666, 'samples': 239072, 'steps': 466, 'loss/train': 4.593929290771484} -09/20/2021 16:06:22 - INFO - __main__ - Step 7472: {'lr': 0.00012426666666666666, 'samples': 239104, 'steps': 466, 'loss/train': 5.243465900421143} -09/20/2021 16:06:23 - INFO - __main__ - Step 7473: {'lr': 0.00012453333333333334, 'samples': 239136, 'steps': 467, 'loss/train': 5.164076328277588} -09/20/2021 16:06:24 - INFO - __main__ - Step 7474: {'lr': 0.00012453333333333334, 'samples': 239168, 'steps': 467, 'loss/train': 4.801425933837891} -09/20/2021 16:06:24 - INFO - __main__ - Step 7475: {'lr': 0.00012453333333333334, 'samples': 239200, 'steps': 467, 'loss/train': 4.119222164154053} -09/20/2021 16:06:25 - INFO - __main__ - Step 7476: {'lr': 0.00012453333333333334, 'samples': 239232, 'steps': 467, 'loss/train': 6.506728172302246} -09/20/2021 16:06:26 - INFO - __main__ - Step 7477: {'lr': 0.00012453333333333334, 'samples': 239264, 'steps': 467, 'loss/train': 4.916224479675293} -09/20/2021 16:06:27 - INFO - __main__ - Step 7478: {'lr': 0.00012453333333333334, 'samples': 239296, 'steps': 467, 'loss/train': 2.1623477935791016} -09/20/2021 16:06:27 - INFO - __main__ - Step 7479: {'lr': 0.00012453333333333334, 'samples': 239328, 'steps': 467, 'loss/train': 4.681838512420654} -09/20/2021 16:06:28 - INFO - __main__ - Step 7480: {'lr': 0.00012453333333333334, 'samples': 239360, 'steps': 467, 'loss/train': 4.57940673828125} -09/20/2021 16:06:29 - INFO - __main__ - Step 7481: {'lr': 0.00012453333333333334, 'samples': 239392, 'steps': 467, 'loss/train': 5.1125168800354} -09/20/2021 16:06:30 - INFO - __main__ - Step 7482: {'lr': 0.00012453333333333334, 'samples': 239424, 'steps': 467, 'loss/train': 5.670173645019531} -09/20/2021 16:06:30 - INFO - __main__ - Step 7483: {'lr': 0.00012453333333333334, 'samples': 239456, 'steps': 467, 'loss/train': 5.211643218994141} -09/20/2021 16:06:31 - INFO - __main__ - Step 7484: {'lr': 0.00012453333333333334, 'samples': 239488, 'steps': 467, 'loss/train': 4.780231475830078} -09/20/2021 16:06:32 - INFO - __main__ - Step 7485: {'lr': 0.00012453333333333334, 'samples': 239520, 'steps': 467, 'loss/train': 4.564001560211182} -09/20/2021 16:06:33 - INFO - __main__ - Step 7486: {'lr': 0.00012453333333333334, 'samples': 239552, 'steps': 467, 'loss/train': 3.9477741718292236} -09/20/2021 16:06:33 - INFO - __main__ - Step 7487: {'lr': 0.00012453333333333334, 'samples': 239584, 'steps': 467, 'loss/train': 5.272304534912109} -09/20/2021 16:06:34 - INFO - __main__ - Step 7488: {'lr': 0.00012453333333333334, 'samples': 239616, 'steps': 467, 'loss/train': 5.469486713409424} -09/20/2021 16:06:35 - INFO - __main__ - Step 7489: {'lr': 0.0001248, 'samples': 239648, 'steps': 468, 'loss/train': 4.649707317352295} -09/20/2021 16:06:36 - INFO - __main__ - Step 7490: {'lr': 0.0001248, 'samples': 239680, 'steps': 468, 'loss/train': 6.138578414916992} -09/20/2021 16:06:37 - INFO - __main__ - Step 7491: {'lr': 0.0001248, 'samples': 239712, 'steps': 468, 'loss/train': 4.670405387878418} -09/20/2021 16:06:37 - INFO - __main__ - Step 7492: {'lr': 0.0001248, 'samples': 239744, 'steps': 468, 'loss/train': 4.194469451904297} -09/20/2021 16:06:38 - INFO - __main__ - Step 7493: {'lr': 0.0001248, 'samples': 239776, 'steps': 468, 'loss/train': 5.027189254760742} -09/20/2021 16:06:39 - INFO - __main__ - Step 7494: {'lr': 0.0001248, 'samples': 239808, 'steps': 468, 'loss/train': 4.734976291656494} -09/20/2021 16:06:40 - INFO - __main__ - Step 7495: {'lr': 0.0001248, 'samples': 239840, 'steps': 468, 'loss/train': 5.062179088592529} -09/20/2021 16:06:41 - INFO - __main__ - Step 7496: {'lr': 0.0001248, 'samples': 239872, 'steps': 468, 'loss/train': 6.239749908447266} -09/20/2021 16:06:42 - INFO - __main__ - Step 7497: {'lr': 0.0001248, 'samples': 239904, 'steps': 468, 'loss/train': 6.0606513023376465} -09/20/2021 16:06:43 - INFO - __main__ - Step 7498: {'lr': 0.0001248, 'samples': 239936, 'steps': 468, 'loss/train': 5.2235002517700195} -09/20/2021 16:06:44 - INFO - __main__ - Step 7499: {'lr': 0.0001248, 'samples': 239968, 'steps': 468, 'loss/train': 4.337571620941162} -09/20/2021 16:06:44 - INFO - __main__ - Step 7500: {'lr': 0.0001248, 'samples': 240000, 'steps': 468, 'loss/train': 6.112304210662842} -09/20/2021 16:06:45 - INFO - __main__ - Step 7501: {'lr': 0.0001248, 'samples': 240032, 'steps': 468, 'loss/train': 2.2499423027038574} -09/20/2021 16:06:46 - INFO - __main__ - Step 7502: {'lr': 0.0001248, 'samples': 240064, 'steps': 468, 'loss/train': 6.111788272857666} -09/20/2021 16:06:47 - INFO - __main__ - Step 7503: {'lr': 0.0001248, 'samples': 240096, 'steps': 468, 'loss/train': 5.187572479248047} -09/20/2021 16:06:47 - INFO - __main__ - Step 7504: {'lr': 0.0001248, 'samples': 240128, 'steps': 468, 'loss/train': 4.600554943084717} -09/20/2021 16:06:48 - INFO - __main__ - Step 7505: {'lr': 0.00012506666666666665, 'samples': 240160, 'steps': 469, 'loss/train': 4.724011421203613} -09/20/2021 16:06:49 - INFO - __main__ - Step 7506: {'lr': 0.00012506666666666665, 'samples': 240192, 'steps': 469, 'loss/train': 5.153430938720703} -09/20/2021 16:06:50 - INFO - __main__ - Step 7507: {'lr': 0.00012506666666666665, 'samples': 240224, 'steps': 469, 'loss/train': 4.549210071563721} -09/20/2021 16:06:51 - INFO - __main__ - Step 7508: {'lr': 0.00012506666666666665, 'samples': 240256, 'steps': 469, 'loss/train': 4.496822357177734} -09/20/2021 16:06:51 - INFO - __main__ - Step 7509: {'lr': 0.00012506666666666665, 'samples': 240288, 'steps': 469, 'loss/train': 4.816986083984375} -09/20/2021 16:06:52 - INFO - __main__ - Step 7510: {'lr': 0.00012506666666666665, 'samples': 240320, 'steps': 469, 'loss/train': 3.8358097076416016} -09/20/2021 16:06:53 - INFO - __main__ - Step 7511: {'lr': 0.00012506666666666665, 'samples': 240352, 'steps': 469, 'loss/train': 5.316055774688721} -09/20/2021 16:06:54 - INFO - __main__ - Step 7512: {'lr': 0.00012506666666666665, 'samples': 240384, 'steps': 469, 'loss/train': 4.4113898277282715} -09/20/2021 16:06:54 - INFO - __main__ - Step 7513: {'lr': 0.00012506666666666665, 'samples': 240416, 'steps': 469, 'loss/train': 5.420957565307617} -09/20/2021 16:06:55 - INFO - __main__ - Step 7514: {'lr': 0.00012506666666666665, 'samples': 240448, 'steps': 469, 'loss/train': 3.960599184036255} -09/20/2021 16:06:56 - INFO - __main__ - Step 7515: {'lr': 0.00012506666666666665, 'samples': 240480, 'steps': 469, 'loss/train': 5.517866611480713} -09/20/2021 16:06:57 - INFO - __main__ - Step 7516: {'lr': 0.00012506666666666665, 'samples': 240512, 'steps': 469, 'loss/train': 5.742685794830322} -09/20/2021 16:06:57 - INFO - __main__ - Step 7517: {'lr': 0.00012506666666666665, 'samples': 240544, 'steps': 469, 'loss/train': 4.766600608825684} -09/20/2021 16:06:58 - INFO - __main__ - Step 7518: {'lr': 0.00012506666666666665, 'samples': 240576, 'steps': 469, 'loss/train': 5.126004219055176} -09/20/2021 16:06:59 - INFO - __main__ - Step 7519: {'lr': 0.00012506666666666665, 'samples': 240608, 'steps': 469, 'loss/train': 5.505195617675781} -09/20/2021 16:07:00 - INFO - __main__ - Step 7520: {'lr': 0.00012506666666666665, 'samples': 240640, 'steps': 469, 'loss/train': 5.769065856933594} -09/20/2021 16:07:00 - INFO - __main__ - Step 7521: {'lr': 0.00012533333333333334, 'samples': 240672, 'steps': 470, 'loss/train': 5.111444473266602} -09/20/2021 16:07:01 - INFO - __main__ - Step 7522: {'lr': 0.00012533333333333334, 'samples': 240704, 'steps': 470, 'loss/train': 4.839430809020996} -09/20/2021 16:07:02 - INFO - __main__ - Step 7523: {'lr': 0.00012533333333333334, 'samples': 240736, 'steps': 470, 'loss/train': 4.459171295166016} -09/20/2021 16:07:03 - INFO - __main__ - Step 7524: {'lr': 0.00012533333333333334, 'samples': 240768, 'steps': 470, 'loss/train': 4.819435119628906} -09/20/2021 16:07:03 - INFO - __main__ - Step 7525: {'lr': 0.00012533333333333334, 'samples': 240800, 'steps': 470, 'loss/train': 5.181318759918213} -09/20/2021 16:07:04 - INFO - __main__ - Step 7526: {'lr': 0.00012533333333333334, 'samples': 240832, 'steps': 470, 'loss/train': 5.514060020446777} -09/20/2021 16:07:05 - INFO - __main__ - Step 7527: {'lr': 0.00012533333333333334, 'samples': 240864, 'steps': 470, 'loss/train': 4.548046588897705} -09/20/2021 16:07:06 - INFO - __main__ - Step 7528: {'lr': 0.00012533333333333334, 'samples': 240896, 'steps': 470, 'loss/train': 4.185269355773926} -09/20/2021 16:07:07 - INFO - __main__ - Step 7529: {'lr': 0.00012533333333333334, 'samples': 240928, 'steps': 470, 'loss/train': 4.258167743682861} -09/20/2021 16:07:08 - INFO - __main__ - Step 7530: {'lr': 0.00012533333333333334, 'samples': 240960, 'steps': 470, 'loss/train': 5.368376731872559} -09/20/2021 16:07:09 - INFO - __main__ - Step 7531: {'lr': 0.00012533333333333334, 'samples': 240992, 'steps': 470, 'loss/train': 4.574673175811768} -09/20/2021 16:07:09 - INFO - __main__ - Step 7532: {'lr': 0.00012533333333333334, 'samples': 241024, 'steps': 470, 'loss/train': 3.8272106647491455} -09/20/2021 16:07:10 - INFO - __main__ - Step 7533: {'lr': 0.00012533333333333334, 'samples': 241056, 'steps': 470, 'loss/train': 4.543956756591797} -09/20/2021 16:07:11 - INFO - __main__ - Step 7534: {'lr': 0.00012533333333333334, 'samples': 241088, 'steps': 470, 'loss/train': 4.164019584655762} -09/20/2021 16:07:12 - INFO - __main__ - Step 7535: {'lr': 0.00012533333333333334, 'samples': 241120, 'steps': 470, 'loss/train': 5.258185386657715} -09/20/2021 16:07:12 - INFO - __main__ - Step 7536: {'lr': 0.00012533333333333334, 'samples': 241152, 'steps': 470, 'loss/train': 4.191833019256592} -09/20/2021 16:07:13 - INFO - __main__ - Step 7537: {'lr': 0.00012560000000000002, 'samples': 241184, 'steps': 471, 'loss/train': 5.181268215179443} -09/20/2021 16:07:14 - INFO - __main__ - Step 7538: {'lr': 0.00012560000000000002, 'samples': 241216, 'steps': 471, 'loss/train': 4.815582275390625} -09/20/2021 16:07:15 - INFO - __main__ - Step 7539: {'lr': 0.00012560000000000002, 'samples': 241248, 'steps': 471, 'loss/train': 4.622442722320557} -09/20/2021 16:07:15 - INFO - __main__ - Step 7540: {'lr': 0.00012560000000000002, 'samples': 241280, 'steps': 471, 'loss/train': 4.067703723907471} -09/20/2021 16:07:16 - INFO - __main__ - Step 7541: {'lr': 0.00012560000000000002, 'samples': 241312, 'steps': 471, 'loss/train': 4.961869239807129} -09/20/2021 16:07:17 - INFO - __main__ - Step 7542: {'lr': 0.00012560000000000002, 'samples': 241344, 'steps': 471, 'loss/train': 5.401642799377441} -09/20/2021 16:07:18 - INFO - __main__ - Step 7543: {'lr': 0.00012560000000000002, 'samples': 241376, 'steps': 471, 'loss/train': 4.72955846786499} -09/20/2021 16:07:18 - INFO - __main__ - Step 7544: {'lr': 0.00012560000000000002, 'samples': 241408, 'steps': 471, 'loss/train': 4.492173671722412} -09/20/2021 16:07:19 - INFO - __main__ - Step 7545: {'lr': 0.00012560000000000002, 'samples': 241440, 'steps': 471, 'loss/train': 5.035430431365967} -09/20/2021 16:07:20 - INFO - __main__ - Step 7546: {'lr': 0.00012560000000000002, 'samples': 241472, 'steps': 471, 'loss/train': 5.598487854003906} -09/20/2021 16:07:21 - INFO - __main__ - Step 7547: {'lr': 0.00012560000000000002, 'samples': 241504, 'steps': 471, 'loss/train': 4.917916297912598} -09/20/2021 16:07:21 - INFO - __main__ - Step 7548: {'lr': 0.00012560000000000002, 'samples': 241536, 'steps': 471, 'loss/train': 4.749343395233154} -09/20/2021 16:07:22 - INFO - __main__ - Step 7549: {'lr': 0.00012560000000000002, 'samples': 241568, 'steps': 471, 'loss/train': 5.470411777496338} -09/20/2021 16:07:23 - INFO - __main__ - Step 7550: {'lr': 0.00012560000000000002, 'samples': 241600, 'steps': 471, 'loss/train': 4.733547687530518} -09/20/2021 16:07:24 - INFO - __main__ - Step 7551: {'lr': 0.00012560000000000002, 'samples': 241632, 'steps': 471, 'loss/train': 4.18346643447876} -09/20/2021 16:07:24 - INFO - __main__ - Step 7552: {'lr': 0.00012560000000000002, 'samples': 241664, 'steps': 471, 'loss/train': 4.884097099304199} -09/20/2021 16:07:25 - INFO - __main__ - Step 7553: {'lr': 0.00012586666666666667, 'samples': 241696, 'steps': 472, 'loss/train': 5.638082504272461} -09/20/2021 16:07:26 - INFO - __main__ - Step 7554: {'lr': 0.00012586666666666667, 'samples': 241728, 'steps': 472, 'loss/train': 5.261865615844727} -09/20/2021 16:07:27 - INFO - __main__ - Step 7555: {'lr': 0.00012586666666666667, 'samples': 241760, 'steps': 472, 'loss/train': 5.329814434051514} -09/20/2021 16:07:28 - INFO - __main__ - Step 7556: {'lr': 0.00012586666666666667, 'samples': 241792, 'steps': 472, 'loss/train': 4.021989822387695} -09/20/2021 16:07:28 - INFO - __main__ - Step 7557: {'lr': 0.00012586666666666667, 'samples': 241824, 'steps': 472, 'loss/train': 5.10994291305542} -09/20/2021 16:07:29 - INFO - __main__ - Step 7558: {'lr': 0.00012586666666666667, 'samples': 241856, 'steps': 472, 'loss/train': 4.812422275543213} -09/20/2021 16:07:30 - INFO - __main__ - Step 7559: {'lr': 0.00012586666666666667, 'samples': 241888, 'steps': 472, 'loss/train': 5.49033784866333} -09/20/2021 16:07:31 - INFO - __main__ - Step 7560: {'lr': 0.00012586666666666667, 'samples': 241920, 'steps': 472, 'loss/train': 4.493945121765137} -09/20/2021 16:07:32 - INFO - __main__ - Step 7561: {'lr': 0.00012586666666666667, 'samples': 241952, 'steps': 472, 'loss/train': 5.687849521636963} -09/20/2021 16:07:33 - INFO - __main__ - Step 7562: {'lr': 0.00012586666666666667, 'samples': 241984, 'steps': 472, 'loss/train': 4.503575325012207} -09/20/2021 16:07:33 - INFO - __main__ - Step 7563: {'lr': 0.00012586666666666667, 'samples': 242016, 'steps': 472, 'loss/train': 5.250401020050049} -09/20/2021 16:07:34 - INFO - __main__ - Step 7564: {'lr': 0.00012586666666666667, 'samples': 242048, 'steps': 472, 'loss/train': 3.8084027767181396} -09/20/2021 16:07:35 - INFO - __main__ - Step 7565: {'lr': 0.00012586666666666667, 'samples': 242080, 'steps': 472, 'loss/train': 4.699249267578125} -09/20/2021 16:07:36 - INFO - __main__ - Step 7566: {'lr': 0.00012586666666666667, 'samples': 242112, 'steps': 472, 'loss/train': 4.9401936531066895} -09/20/2021 16:07:36 - INFO - __main__ - Step 7567: {'lr': 0.00012586666666666667, 'samples': 242144, 'steps': 472, 'loss/train': 4.578446388244629} -09/20/2021 16:07:37 - INFO - __main__ - Step 7568: {'lr': 0.00012586666666666667, 'samples': 242176, 'steps': 472, 'loss/train': 5.1786041259765625} -09/20/2021 16:07:38 - INFO - __main__ - Step 7569: {'lr': 0.00012613333333333335, 'samples': 242208, 'steps': 473, 'loss/train': 4.7546916007995605} -09/20/2021 16:07:39 - INFO - __main__ - Step 7570: {'lr': 0.00012613333333333335, 'samples': 242240, 'steps': 473, 'loss/train': 4.91250467300415} -09/20/2021 16:07:39 - INFO - __main__ - Step 7571: {'lr': 0.00012613333333333335, 'samples': 242272, 'steps': 473, 'loss/train': 5.207979202270508} -09/20/2021 16:07:40 - INFO - __main__ - Step 7572: {'lr': 0.00012613333333333335, 'samples': 242304, 'steps': 473, 'loss/train': 4.103402137756348} -09/20/2021 16:07:41 - INFO - __main__ - Step 7573: {'lr': 0.00012613333333333335, 'samples': 242336, 'steps': 473, 'loss/train': 4.952985763549805} -09/20/2021 16:07:42 - INFO - __main__ - Step 7574: {'lr': 0.00012613333333333335, 'samples': 242368, 'steps': 473, 'loss/train': 4.727346420288086} -09/20/2021 16:07:42 - INFO - __main__ - Step 7575: {'lr': 0.00012613333333333335, 'samples': 242400, 'steps': 473, 'loss/train': 5.987504482269287} -09/20/2021 16:07:43 - INFO - __main__ - Step 7576: {'lr': 0.00012613333333333335, 'samples': 242432, 'steps': 473, 'loss/train': 5.723267078399658} -09/20/2021 16:07:44 - INFO - __main__ - Step 7577: {'lr': 0.00012613333333333335, 'samples': 242464, 'steps': 473, 'loss/train': 4.979958534240723} -09/20/2021 16:07:45 - INFO - __main__ - Step 7578: {'lr': 0.00012613333333333335, 'samples': 242496, 'steps': 473, 'loss/train': 4.7519612312316895} -09/20/2021 16:07:45 - INFO - __main__ - Step 7579: {'lr': 0.00012613333333333335, 'samples': 242528, 'steps': 473, 'loss/train': 4.4600419998168945} -09/20/2021 16:07:46 - INFO - __main__ - Step 7580: {'lr': 0.00012613333333333335, 'samples': 242560, 'steps': 473, 'loss/train': 6.206377029418945} -09/20/2021 16:07:47 - INFO - __main__ - Step 7581: {'lr': 0.00012613333333333335, 'samples': 242592, 'steps': 473, 'loss/train': 5.469013690948486} -09/20/2021 16:07:48 - INFO - __main__ - Step 7582: {'lr': 0.00012613333333333335, 'samples': 242624, 'steps': 473, 'loss/train': 4.212704658508301} -09/20/2021 16:07:48 - INFO - __main__ - Step 7583: {'lr': 0.00012613333333333335, 'samples': 242656, 'steps': 473, 'loss/train': 4.710216045379639} -09/20/2021 16:07:49 - INFO - __main__ - Step 7584: {'lr': 0.00012613333333333335, 'samples': 242688, 'steps': 473, 'loss/train': 7.458829879760742} -09/20/2021 16:07:50 - INFO - __main__ - Step 7585: {'lr': 0.0001264, 'samples': 242720, 'steps': 474, 'loss/train': 4.408639907836914} -09/20/2021 16:07:51 - INFO - __main__ - Step 7586: {'lr': 0.0001264, 'samples': 242752, 'steps': 474, 'loss/train': 3.9734201431274414} -09/20/2021 16:07:52 - INFO - __main__ - Step 7587: {'lr': 0.0001264, 'samples': 242784, 'steps': 474, 'loss/train': 2.2446789741516113} -09/20/2021 16:07:52 - INFO - __main__ - Step 7588: {'lr': 0.0001264, 'samples': 242816, 'steps': 474, 'loss/train': 4.218580722808838} -09/20/2021 16:07:53 - INFO - __main__ - Step 7589: {'lr': 0.0001264, 'samples': 242848, 'steps': 474, 'loss/train': 5.120977401733398} -09/20/2021 16:07:54 - INFO - __main__ - Step 7590: {'lr': 0.0001264, 'samples': 242880, 'steps': 474, 'loss/train': 5.538987159729004} -09/20/2021 16:07:55 - INFO - __main__ - Step 7591: {'lr': 0.0001264, 'samples': 242912, 'steps': 474, 'loss/train': 5.657094478607178} -09/20/2021 16:07:56 - INFO - __main__ - Step 7592: {'lr': 0.0001264, 'samples': 242944, 'steps': 474, 'loss/train': 5.042112827301025} -09/20/2021 16:07:57 - INFO - __main__ - Step 7593: {'lr': 0.0001264, 'samples': 242976, 'steps': 474, 'loss/train': 5.116501331329346} -09/20/2021 16:07:57 - INFO - __main__ - Step 7594: {'lr': 0.0001264, 'samples': 243008, 'steps': 474, 'loss/train': 4.624953269958496} -09/20/2021 16:07:58 - INFO - __main__ - Step 7595: {'lr': 0.0001264, 'samples': 243040, 'steps': 474, 'loss/train': 4.350710868835449} -09/20/2021 16:07:59 - INFO - __main__ - Step 7596: {'lr': 0.0001264, 'samples': 243072, 'steps': 474, 'loss/train': 4.472692489624023} -09/20/2021 16:08:00 - INFO - __main__ - Step 7597: {'lr': 0.0001264, 'samples': 243104, 'steps': 474, 'loss/train': 4.118538856506348} -09/20/2021 16:08:00 - INFO - __main__ - Step 7598: {'lr': 0.0001264, 'samples': 243136, 'steps': 474, 'loss/train': 4.2376322746276855} -09/20/2021 16:08:01 - INFO - __main__ - Step 7599: {'lr': 0.0001264, 'samples': 243168, 'steps': 474, 'loss/train': 5.161502838134766} -09/20/2021 16:08:02 - INFO - __main__ - Step 7600: {'lr': 0.0001264, 'samples': 243200, 'steps': 474, 'loss/train': 6.3559136390686035} -09/20/2021 16:08:03 - INFO - __main__ - Step 7601: {'lr': 0.00012666666666666666, 'samples': 243232, 'steps': 475, 'loss/train': 4.428295612335205} -09/20/2021 16:08:04 - INFO - __main__ - Step 7602: {'lr': 0.00012666666666666666, 'samples': 243264, 'steps': 475, 'loss/train': 4.934238910675049} -09/20/2021 16:08:04 - INFO - __main__ - Step 7603: {'lr': 0.00012666666666666666, 'samples': 243296, 'steps': 475, 'loss/train': 4.292011737823486} -09/20/2021 16:08:05 - INFO - __main__ - Step 7604: {'lr': 0.00012666666666666666, 'samples': 243328, 'steps': 475, 'loss/train': 3.8141512870788574} -09/20/2021 16:08:06 - INFO - __main__ - Step 7605: {'lr': 0.00012666666666666666, 'samples': 243360, 'steps': 475, 'loss/train': 4.467144012451172} -09/20/2021 16:08:07 - INFO - __main__ - Step 7606: {'lr': 0.00012666666666666666, 'samples': 243392, 'steps': 475, 'loss/train': 5.745641708374023} -09/20/2021 16:08:07 - INFO - __main__ - Step 7607: {'lr': 0.00012666666666666666, 'samples': 243424, 'steps': 475, 'loss/train': 5.586683750152588} -09/20/2021 16:08:08 - INFO - __main__ - Step 7608: {'lr': 0.00012666666666666666, 'samples': 243456, 'steps': 475, 'loss/train': 5.357786178588867} -09/20/2021 16:08:09 - INFO - __main__ - Step 7609: {'lr': 0.00012666666666666666, 'samples': 243488, 'steps': 475, 'loss/train': 5.076363563537598} -09/20/2021 16:08:10 - INFO - __main__ - Step 7610: {'lr': 0.00012666666666666666, 'samples': 243520, 'steps': 475, 'loss/train': 4.79742956161499} -09/20/2021 16:08:10 - INFO - __main__ - Step 7611: {'lr': 0.00012666666666666666, 'samples': 243552, 'steps': 475, 'loss/train': 4.483051776885986} -09/20/2021 16:08:11 - INFO - __main__ - Step 7612: {'lr': 0.00012666666666666666, 'samples': 243584, 'steps': 475, 'loss/train': 4.719489097595215} -09/20/2021 16:08:12 - INFO - __main__ - Step 7613: {'lr': 0.00012666666666666666, 'samples': 243616, 'steps': 475, 'loss/train': 5.121277809143066} -09/20/2021 16:08:13 - INFO - __main__ - Step 7614: {'lr': 0.00012666666666666666, 'samples': 243648, 'steps': 475, 'loss/train': 4.673638820648193} -09/20/2021 16:08:13 - INFO - __main__ - Step 7615: {'lr': 0.00012666666666666666, 'samples': 243680, 'steps': 475, 'loss/train': 4.459590911865234} -09/20/2021 16:08:14 - INFO - __main__ - Step 7616: {'lr': 0.00012666666666666666, 'samples': 243712, 'steps': 475, 'loss/train': 4.966084957122803} -09/20/2021 16:08:15 - INFO - __main__ - Step 7617: {'lr': 0.00012693333333333335, 'samples': 243744, 'steps': 476, 'loss/train': 5.24279260635376} -09/20/2021 16:08:16 - INFO - __main__ - Step 7618: {'lr': 0.00012693333333333335, 'samples': 243776, 'steps': 476, 'loss/train': 4.988985538482666} -09/20/2021 16:08:16 - INFO - __main__ - Step 7619: {'lr': 0.00012693333333333335, 'samples': 243808, 'steps': 476, 'loss/train': 4.405672550201416} -09/20/2021 16:08:17 - INFO - __main__ - Step 7620: {'lr': 0.00012693333333333335, 'samples': 243840, 'steps': 476, 'loss/train': 5.358885765075684} -09/20/2021 16:08:18 - INFO - __main__ - Step 7621: {'lr': 0.00012693333333333335, 'samples': 243872, 'steps': 476, 'loss/train': 6.400119304656982} -09/20/2021 16:08:19 - INFO - __main__ - Step 7622: {'lr': 0.00012693333333333335, 'samples': 243904, 'steps': 476, 'loss/train': 4.348724365234375} -09/20/2021 16:08:19 - INFO - __main__ - Step 7623: {'lr': 0.00012693333333333335, 'samples': 243936, 'steps': 476, 'loss/train': 4.155511379241943} -09/20/2021 16:08:21 - INFO - __main__ - Step 7624: {'lr': 0.00012693333333333335, 'samples': 243968, 'steps': 476, 'loss/train': 4.823246955871582} -09/20/2021 16:08:22 - INFO - __main__ - Step 7625: {'lr': 0.00012693333333333335, 'samples': 244000, 'steps': 476, 'loss/train': 4.480041980743408} -09/20/2021 16:08:22 - INFO - __main__ - Step 7626: {'lr': 0.00012693333333333335, 'samples': 244032, 'steps': 476, 'loss/train': 4.7775187492370605} -09/20/2021 16:08:23 - INFO - __main__ - Step 7627: {'lr': 0.00012693333333333335, 'samples': 244064, 'steps': 476, 'loss/train': 4.709996700286865} -09/20/2021 16:08:24 - INFO - __main__ - Step 7628: {'lr': 0.00012693333333333335, 'samples': 244096, 'steps': 476, 'loss/train': 3.60941481590271} -09/20/2021 16:08:25 - INFO - __main__ - Step 7629: {'lr': 0.00012693333333333335, 'samples': 244128, 'steps': 476, 'loss/train': 4.704276084899902} -09/20/2021 16:08:25 - INFO - __main__ - Step 7630: {'lr': 0.00012693333333333335, 'samples': 244160, 'steps': 476, 'loss/train': 4.469223499298096} -09/20/2021 16:08:26 - INFO - __main__ - Step 7631: {'lr': 0.00012693333333333335, 'samples': 244192, 'steps': 476, 'loss/train': 4.421358108520508} -09/20/2021 16:08:27 - INFO - __main__ - Step 7632: {'lr': 0.00012693333333333335, 'samples': 244224, 'steps': 476, 'loss/train': 3.969928741455078} -09/20/2021 16:08:28 - INFO - __main__ - Step 7633: {'lr': 0.0001272, 'samples': 244256, 'steps': 477, 'loss/train': 4.698239803314209} -09/20/2021 16:08:28 - INFO - __main__ - Step 7634: {'lr': 0.0001272, 'samples': 244288, 'steps': 477, 'loss/train': 5.045013904571533} -09/20/2021 16:08:29 - INFO - __main__ - Step 7635: {'lr': 0.0001272, 'samples': 244320, 'steps': 477, 'loss/train': 4.975440979003906} -09/20/2021 16:08:30 - INFO - __main__ - Step 7636: {'lr': 0.0001272, 'samples': 244352, 'steps': 477, 'loss/train': 4.348126411437988} -09/20/2021 16:08:31 - INFO - __main__ - Step 7637: {'lr': 0.0001272, 'samples': 244384, 'steps': 477, 'loss/train': 5.2500529289245605} -09/20/2021 16:08:31 - INFO - __main__ - Step 7638: {'lr': 0.0001272, 'samples': 244416, 'steps': 477, 'loss/train': 4.706852436065674} -09/20/2021 16:08:32 - INFO - __main__ - Step 7639: {'lr': 0.0001272, 'samples': 244448, 'steps': 477, 'loss/train': 4.933978080749512} -09/20/2021 16:08:33 - INFO - __main__ - Step 7640: {'lr': 0.0001272, 'samples': 244480, 'steps': 477, 'loss/train': 4.286815166473389} -09/20/2021 16:08:34 - INFO - __main__ - Step 7641: {'lr': 0.0001272, 'samples': 244512, 'steps': 477, 'loss/train': 4.602852821350098} -09/20/2021 16:08:34 - INFO - __main__ - Step 7642: {'lr': 0.0001272, 'samples': 244544, 'steps': 477, 'loss/train': 4.46994686126709} -09/20/2021 16:08:35 - INFO - __main__ - Step 7643: {'lr': 0.0001272, 'samples': 244576, 'steps': 477, 'loss/train': 4.969522476196289} -09/20/2021 16:08:36 - INFO - __main__ - Step 7644: {'lr': 0.0001272, 'samples': 244608, 'steps': 477, 'loss/train': 2.132286310195923} -09/20/2021 16:08:37 - INFO - __main__ - Step 7645: {'lr': 0.0001272, 'samples': 244640, 'steps': 477, 'loss/train': 2.2108278274536133} -09/20/2021 16:08:37 - INFO - __main__ - Step 7646: {'lr': 0.0001272, 'samples': 244672, 'steps': 477, 'loss/train': 2.2714860439300537} -09/20/2021 16:08:38 - INFO - __main__ - Step 7647: {'lr': 0.0001272, 'samples': 244704, 'steps': 477, 'loss/train': 2.417067289352417} -09/20/2021 16:08:39 - INFO - __main__ - Step 7648: {'lr': 0.0001272, 'samples': 244736, 'steps': 477, 'loss/train': 4.961719036102295} -09/20/2021 16:08:40 - INFO - __main__ - Step 7649: {'lr': 0.00012746666666666666, 'samples': 244768, 'steps': 478, 'loss/train': 4.756503582000732} -09/20/2021 16:08:41 - INFO - __main__ - Step 7650: {'lr': 0.00012746666666666666, 'samples': 244800, 'steps': 478, 'loss/train': 5.076107978820801} -09/20/2021 16:08:41 - INFO - __main__ - Step 7651: {'lr': 0.00012746666666666666, 'samples': 244832, 'steps': 478, 'loss/train': 4.994014739990234} -09/20/2021 16:08:42 - INFO - __main__ - Step 7652: {'lr': 0.00012746666666666666, 'samples': 244864, 'steps': 478, 'loss/train': 4.1332573890686035} -09/20/2021 16:08:43 - INFO - __main__ - Step 7653: {'lr': 0.00012746666666666666, 'samples': 244896, 'steps': 478, 'loss/train': 6.243308067321777} -09/20/2021 16:08:44 - INFO - __main__ - Step 7654: {'lr': 0.00012746666666666666, 'samples': 244928, 'steps': 478, 'loss/train': 4.555246829986572} -09/20/2021 16:08:45 - INFO - __main__ - Step 7655: {'lr': 0.00012746666666666666, 'samples': 244960, 'steps': 478, 'loss/train': 4.689541816711426} -09/20/2021 16:08:46 - INFO - __main__ - Step 7656: {'lr': 0.00012746666666666666, 'samples': 244992, 'steps': 478, 'loss/train': 5.060683727264404} -09/20/2021 16:08:46 - INFO - __main__ - Step 7657: {'lr': 0.00012746666666666666, 'samples': 245024, 'steps': 478, 'loss/train': 4.519890785217285} -09/20/2021 16:08:47 - INFO - __main__ - Step 7658: {'lr': 0.00012746666666666666, 'samples': 245056, 'steps': 478, 'loss/train': 5.04747200012207} -09/20/2021 16:08:48 - INFO - __main__ - Step 7659: {'lr': 0.00012746666666666666, 'samples': 245088, 'steps': 478, 'loss/train': 4.765403747558594} -09/20/2021 16:08:49 - INFO - __main__ - Step 7660: {'lr': 0.00012746666666666666, 'samples': 245120, 'steps': 478, 'loss/train': 5.254444122314453} -09/20/2021 16:08:49 - INFO - __main__ - Step 7661: {'lr': 0.00012746666666666666, 'samples': 245152, 'steps': 478, 'loss/train': 4.420345306396484} -09/20/2021 16:08:50 - INFO - __main__ - Step 7662: {'lr': 0.00012746666666666666, 'samples': 245184, 'steps': 478, 'loss/train': 4.774374485015869} -09/20/2021 16:08:51 - INFO - __main__ - Step 7663: {'lr': 0.00012746666666666666, 'samples': 245216, 'steps': 478, 'loss/train': 5.159323215484619} -09/20/2021 16:08:52 - INFO - __main__ - Step 7664: {'lr': 0.00012746666666666666, 'samples': 245248, 'steps': 478, 'loss/train': 5.344122886657715} -09/20/2021 16:08:53 - INFO - __main__ - Step 7665: {'lr': 0.00012773333333333334, 'samples': 245280, 'steps': 479, 'loss/train': 4.70095157623291} -09/20/2021 16:08:53 - INFO - __main__ - Step 7666: {'lr': 0.00012773333333333334, 'samples': 245312, 'steps': 479, 'loss/train': 4.832871437072754} -09/20/2021 16:08:54 - INFO - __main__ - Step 7667: {'lr': 0.00012773333333333334, 'samples': 245344, 'steps': 479, 'loss/train': 5.0611443519592285} -09/20/2021 16:08:55 - INFO - __main__ - Step 7668: {'lr': 0.00012773333333333334, 'samples': 245376, 'steps': 479, 'loss/train': 5.858805179595947} -09/20/2021 16:08:56 - INFO - __main__ - Step 7669: {'lr': 0.00012773333333333334, 'samples': 245408, 'steps': 479, 'loss/train': 5.159914970397949} -09/20/2021 16:08:56 - INFO - __main__ - Step 7670: {'lr': 0.00012773333333333334, 'samples': 245440, 'steps': 479, 'loss/train': 5.311400890350342} -09/20/2021 16:08:57 - INFO - __main__ - Step 7671: {'lr': 0.00012773333333333334, 'samples': 245472, 'steps': 479, 'loss/train': 5.037092685699463} -09/20/2021 16:08:58 - INFO - __main__ - Step 7672: {'lr': 0.00012773333333333334, 'samples': 245504, 'steps': 479, 'loss/train': 4.253902912139893} -09/20/2021 16:08:59 - INFO - __main__ - Step 7673: {'lr': 0.00012773333333333334, 'samples': 245536, 'steps': 479, 'loss/train': 5.498553276062012} -09/20/2021 16:08:59 - INFO - __main__ - Step 7674: {'lr': 0.00012773333333333334, 'samples': 245568, 'steps': 479, 'loss/train': 5.1933441162109375} -09/20/2021 16:09:00 - INFO - __main__ - Step 7675: {'lr': 0.00012773333333333334, 'samples': 245600, 'steps': 479, 'loss/train': 5.188488006591797} -09/20/2021 16:09:01 - INFO - __main__ - Step 7676: {'lr': 0.00012773333333333334, 'samples': 245632, 'steps': 479, 'loss/train': 4.13588809967041} -09/20/2021 16:09:02 - INFO - __main__ - Step 7677: {'lr': 0.00012773333333333334, 'samples': 245664, 'steps': 479, 'loss/train': 4.75526237487793} -09/20/2021 16:09:02 - INFO - __main__ - Step 7678: {'lr': 0.00012773333333333334, 'samples': 245696, 'steps': 479, 'loss/train': 4.405651569366455} -09/20/2021 16:09:03 - INFO - __main__ - Step 7679: {'lr': 0.00012773333333333334, 'samples': 245728, 'steps': 479, 'loss/train': 5.593935012817383} -09/20/2021 16:09:04 - INFO - __main__ - Step 7680: {'lr': 0.00012773333333333334, 'samples': 245760, 'steps': 479, 'loss/train': 4.434133529663086} -09/20/2021 16:09:05 - INFO - __main__ - Step 7681: {'lr': 0.00012800000000000002, 'samples': 245792, 'steps': 480, 'loss/train': 5.11810302734375} -09/20/2021 16:09:06 - INFO - __main__ - Step 7682: {'lr': 0.00012800000000000002, 'samples': 245824, 'steps': 480, 'loss/train': 4.78603982925415} -09/20/2021 16:09:06 - INFO - __main__ - Step 7683: {'lr': 0.00012800000000000002, 'samples': 245856, 'steps': 480, 'loss/train': 4.475322723388672} -09/20/2021 16:09:07 - INFO - __main__ - Step 7684: {'lr': 0.00012800000000000002, 'samples': 245888, 'steps': 480, 'loss/train': 5.90109920501709} -09/20/2021 16:09:08 - INFO - __main__ - Step 7685: {'lr': 0.00012800000000000002, 'samples': 245920, 'steps': 480, 'loss/train': 5.023372650146484} -09/20/2021 16:09:09 - INFO - __main__ - Step 7686: {'lr': 0.00012800000000000002, 'samples': 245952, 'steps': 480, 'loss/train': 4.85098123550415} -09/20/2021 16:09:10 - INFO - __main__ - Step 7687: {'lr': 0.00012800000000000002, 'samples': 245984, 'steps': 480, 'loss/train': 5.103142738342285} -09/20/2021 16:09:11 - INFO - __main__ - Step 7688: {'lr': 0.00012800000000000002, 'samples': 246016, 'steps': 480, 'loss/train': 4.280885219573975} -09/20/2021 16:09:11 - INFO - __main__ - Step 7689: {'lr': 0.00012800000000000002, 'samples': 246048, 'steps': 480, 'loss/train': 4.310540199279785} -09/20/2021 16:09:12 - INFO - __main__ - Step 7690: {'lr': 0.00012800000000000002, 'samples': 246080, 'steps': 480, 'loss/train': 4.31424617767334} -09/20/2021 16:09:13 - INFO - __main__ - Step 7691: {'lr': 0.00012800000000000002, 'samples': 246112, 'steps': 480, 'loss/train': 5.594841957092285} -09/20/2021 16:09:14 - INFO - __main__ - Step 7692: {'lr': 0.00012800000000000002, 'samples': 246144, 'steps': 480, 'loss/train': 6.445462703704834} -09/20/2021 16:09:14 - INFO - __main__ - Step 7693: {'lr': 0.00012800000000000002, 'samples': 246176, 'steps': 480, 'loss/train': 4.764311790466309} -09/20/2021 16:09:15 - INFO - __main__ - Step 7694: {'lr': 0.00012800000000000002, 'samples': 246208, 'steps': 480, 'loss/train': 5.175570011138916} -09/20/2021 16:09:16 - INFO - __main__ - Step 7695: {'lr': 0.00012800000000000002, 'samples': 246240, 'steps': 480, 'loss/train': 5.059759140014648} -09/20/2021 16:09:17 - INFO - __main__ - Step 7696: {'lr': 0.00012800000000000002, 'samples': 246272, 'steps': 480, 'loss/train': 4.905330657958984} -09/20/2021 16:09:18 - INFO - __main__ - Step 7697: {'lr': 0.00012826666666666668, 'samples': 246304, 'steps': 481, 'loss/train': 5.738001823425293} -09/20/2021 16:09:18 - INFO - __main__ - Step 7698: {'lr': 0.00012826666666666668, 'samples': 246336, 'steps': 481, 'loss/train': 6.028079032897949} -09/20/2021 16:09:19 - INFO - __main__ - Step 7699: {'lr': 0.00012826666666666668, 'samples': 246368, 'steps': 481, 'loss/train': 4.333385944366455} -09/20/2021 16:09:20 - INFO - __main__ - Step 7700: {'lr': 0.00012826666666666668, 'samples': 246400, 'steps': 481, 'loss/train': 3.7117738723754883} -09/20/2021 16:09:21 - INFO - __main__ - Step 7701: {'lr': 0.00012826666666666668, 'samples': 246432, 'steps': 481, 'loss/train': 5.0190887451171875} -09/20/2021 16:09:21 - INFO - __main__ - Step 7702: {'lr': 0.00012826666666666668, 'samples': 246464, 'steps': 481, 'loss/train': 5.801809310913086} -09/20/2021 16:09:22 - INFO - __main__ - Step 7703: {'lr': 0.00012826666666666668, 'samples': 246496, 'steps': 481, 'loss/train': 4.533288955688477} -09/20/2021 16:09:23 - INFO - __main__ - Step 7704: {'lr': 0.00012826666666666668, 'samples': 246528, 'steps': 481, 'loss/train': 5.240228652954102} -09/20/2021 16:09:24 - INFO - __main__ - Step 7705: {'lr': 0.00012826666666666668, 'samples': 246560, 'steps': 481, 'loss/train': 4.642524242401123} -09/20/2021 16:09:24 - INFO - __main__ - Step 7706: {'lr': 0.00012826666666666668, 'samples': 246592, 'steps': 481, 'loss/train': 4.480901718139648} -09/20/2021 16:09:25 - INFO - __main__ - Step 7707: {'lr': 0.00012826666666666668, 'samples': 246624, 'steps': 481, 'loss/train': 4.617707252502441} -09/20/2021 16:09:26 - INFO - __main__ - Step 7708: {'lr': 0.00012826666666666668, 'samples': 246656, 'steps': 481, 'loss/train': 4.88523006439209} -09/20/2021 16:09:27 - INFO - __main__ - Step 7709: {'lr': 0.00012826666666666668, 'samples': 246688, 'steps': 481, 'loss/train': 5.232980728149414} -09/20/2021 16:09:27 - INFO - __main__ - Step 7710: {'lr': 0.00012826666666666668, 'samples': 246720, 'steps': 481, 'loss/train': 4.537715435028076} -09/20/2021 16:09:28 - INFO - __main__ - Step 7711: {'lr': 0.00012826666666666668, 'samples': 246752, 'steps': 481, 'loss/train': 5.680470943450928} -09/20/2021 16:09:29 - INFO - __main__ - Step 7712: {'lr': 0.00012826666666666668, 'samples': 246784, 'steps': 481, 'loss/train': 4.4717512130737305} -09/20/2021 16:09:30 - INFO - __main__ - Step 7713: {'lr': 0.00012853333333333336, 'samples': 246816, 'steps': 482, 'loss/train': 4.968825340270996} -09/20/2021 16:09:30 - INFO - __main__ - Step 7714: {'lr': 0.00012853333333333336, 'samples': 246848, 'steps': 482, 'loss/train': 5.236695766448975} -09/20/2021 16:09:31 - INFO - __main__ - Step 7715: {'lr': 0.00012853333333333336, 'samples': 246880, 'steps': 482, 'loss/train': 4.861998081207275} -09/20/2021 16:09:32 - INFO - __main__ - Step 7716: {'lr': 0.00012853333333333336, 'samples': 246912, 'steps': 482, 'loss/train': 5.105165958404541} -09/20/2021 16:09:33 - INFO - __main__ - Step 7717: {'lr': 0.00012853333333333336, 'samples': 246944, 'steps': 482, 'loss/train': 5.418693542480469} -09/20/2021 16:09:34 - INFO - __main__ - Step 7718: {'lr': 0.00012853333333333336, 'samples': 246976, 'steps': 482, 'loss/train': 5.719724178314209} -09/20/2021 16:09:35 - INFO - __main__ - Step 7719: {'lr': 0.00012853333333333336, 'samples': 247008, 'steps': 482, 'loss/train': 5.232754230499268} -09/20/2021 16:09:35 - INFO - __main__ - Step 7720: {'lr': 0.00012853333333333336, 'samples': 247040, 'steps': 482, 'loss/train': 4.406139373779297} -09/20/2021 16:09:36 - INFO - __main__ - Step 7721: {'lr': 0.00012853333333333336, 'samples': 247072, 'steps': 482, 'loss/train': 4.2305169105529785} -09/20/2021 16:09:37 - INFO - __main__ - Step 7722: {'lr': 0.00012853333333333336, 'samples': 247104, 'steps': 482, 'loss/train': 4.421037197113037} -09/20/2021 16:09:38 - INFO - __main__ - Step 7723: {'lr': 0.00012853333333333336, 'samples': 247136, 'steps': 482, 'loss/train': 5.338330268859863} -09/20/2021 16:09:38 - INFO - __main__ - Step 7724: {'lr': 0.00012853333333333336, 'samples': 247168, 'steps': 482, 'loss/train': 5.117246150970459} -09/20/2021 16:09:39 - INFO - __main__ - Step 7725: {'lr': 0.00012853333333333336, 'samples': 247200, 'steps': 482, 'loss/train': 5.545544147491455} -09/20/2021 16:09:40 - INFO - __main__ - Step 7726: {'lr': 0.00012853333333333336, 'samples': 247232, 'steps': 482, 'loss/train': 4.664307594299316} -09/20/2021 16:09:41 - INFO - __main__ - Step 7727: {'lr': 0.00012853333333333336, 'samples': 247264, 'steps': 482, 'loss/train': 4.778728485107422} -09/20/2021 16:09:41 - INFO - __main__ - Step 7728: {'lr': 0.00012853333333333336, 'samples': 247296, 'steps': 482, 'loss/train': 4.198953628540039} -09/20/2021 16:09:42 - INFO - __main__ - Step 7729: {'lr': 0.00012880000000000001, 'samples': 247328, 'steps': 483, 'loss/train': 4.948071479797363} -09/20/2021 16:09:43 - INFO - __main__ - Step 7730: {'lr': 0.00012880000000000001, 'samples': 247360, 'steps': 483, 'loss/train': 4.491260528564453} -09/20/2021 16:09:44 - INFO - __main__ - Step 7731: {'lr': 0.00012880000000000001, 'samples': 247392, 'steps': 483, 'loss/train': 5.148431777954102} -09/20/2021 16:09:45 - INFO - __main__ - Step 7732: {'lr': 0.00012880000000000001, 'samples': 247424, 'steps': 483, 'loss/train': 5.845170021057129} -09/20/2021 16:09:45 - INFO - __main__ - Step 7733: {'lr': 0.00012880000000000001, 'samples': 247456, 'steps': 483, 'loss/train': 4.846225738525391} -09/20/2021 16:09:46 - INFO - __main__ - Step 7734: {'lr': 0.00012880000000000001, 'samples': 247488, 'steps': 483, 'loss/train': 4.867334842681885} -09/20/2021 16:09:47 - INFO - __main__ - Step 7735: {'lr': 0.00012880000000000001, 'samples': 247520, 'steps': 483, 'loss/train': 3.2039458751678467} -09/20/2021 16:09:48 - INFO - __main__ - Step 7736: {'lr': 0.00012880000000000001, 'samples': 247552, 'steps': 483, 'loss/train': 5.6245951652526855} -09/20/2021 16:09:48 - INFO - __main__ - Step 7737: {'lr': 0.00012880000000000001, 'samples': 247584, 'steps': 483, 'loss/train': 5.245790481567383} -09/20/2021 16:09:49 - INFO - __main__ - Step 7738: {'lr': 0.00012880000000000001, 'samples': 247616, 'steps': 483, 'loss/train': 6.109390735626221} -09/20/2021 16:09:50 - INFO - __main__ - Step 7739: {'lr': 0.00012880000000000001, 'samples': 247648, 'steps': 483, 'loss/train': 5.70652961730957} -09/20/2021 16:09:51 - INFO - __main__ - Step 7740: {'lr': 0.00012880000000000001, 'samples': 247680, 'steps': 483, 'loss/train': 5.554479122161865} -09/20/2021 16:09:51 - INFO - __main__ - Step 7741: {'lr': 0.00012880000000000001, 'samples': 247712, 'steps': 483, 'loss/train': 4.735692024230957} -09/20/2021 16:09:52 - INFO - __main__ - Step 7742: {'lr': 0.00012880000000000001, 'samples': 247744, 'steps': 483, 'loss/train': 4.659004211425781} -09/20/2021 16:09:53 - INFO - __main__ - Step 7743: {'lr': 0.00012880000000000001, 'samples': 247776, 'steps': 483, 'loss/train': 5.561318397521973} -09/20/2021 16:09:54 - INFO - __main__ - Step 7744: {'lr': 0.00012880000000000001, 'samples': 247808, 'steps': 483, 'loss/train': 4.693902492523193} -09/20/2021 16:09:54 - INFO - __main__ - Step 7745: {'lr': 0.00012906666666666667, 'samples': 247840, 'steps': 484, 'loss/train': 5.361315727233887} -09/20/2021 16:09:55 - INFO - __main__ - Step 7746: {'lr': 0.00012906666666666667, 'samples': 247872, 'steps': 484, 'loss/train': 5.13009786605835} -09/20/2021 16:09:56 - INFO - __main__ - Step 7747: {'lr': 0.00012906666666666667, 'samples': 247904, 'steps': 484, 'loss/train': 4.335397243499756} -09/20/2021 16:09:57 - INFO - __main__ - Step 7748: {'lr': 0.00012906666666666667, 'samples': 247936, 'steps': 484, 'loss/train': 5.090139389038086} -09/20/2021 16:09:58 - INFO - __main__ - Step 7749: {'lr': 0.00012906666666666667, 'samples': 247968, 'steps': 484, 'loss/train': 4.854864597320557} -09/20/2021 16:09:59 - INFO - __main__ - Step 7750: {'lr': 0.00012906666666666667, 'samples': 248000, 'steps': 484, 'loss/train': 4.637014389038086} -09/20/2021 16:10:00 - INFO - __main__ - Step 7751: {'lr': 0.00012906666666666667, 'samples': 248032, 'steps': 484, 'loss/train': 2.4167637825012207} -09/20/2021 16:10:01 - INFO - __main__ - Step 7752: {'lr': 0.00012906666666666667, 'samples': 248064, 'steps': 484, 'loss/train': 3.8953442573547363} -09/20/2021 16:10:01 - INFO - __main__ - Step 7753: {'lr': 0.00012906666666666667, 'samples': 248096, 'steps': 484, 'loss/train': 5.456029891967773} -09/20/2021 16:10:02 - INFO - __main__ - Step 7754: {'lr': 0.00012906666666666667, 'samples': 248128, 'steps': 484, 'loss/train': 5.151153564453125} -09/20/2021 16:10:03 - INFO - __main__ - Step 7755: {'lr': 0.00012906666666666667, 'samples': 248160, 'steps': 484, 'loss/train': 4.813875198364258} -09/20/2021 16:10:04 - INFO - __main__ - Step 7756: {'lr': 0.00012906666666666667, 'samples': 248192, 'steps': 484, 'loss/train': 4.951108455657959} -09/20/2021 16:10:04 - INFO - __main__ - Step 7757: {'lr': 0.00012906666666666667, 'samples': 248224, 'steps': 484, 'loss/train': 4.397687911987305} -09/20/2021 16:10:05 - INFO - __main__ - Step 7758: {'lr': 0.00012906666666666667, 'samples': 248256, 'steps': 484, 'loss/train': 5.4804487228393555} -09/20/2021 16:10:06 - INFO - __main__ - Step 7759: {'lr': 0.00012906666666666667, 'samples': 248288, 'steps': 484, 'loss/train': 5.321675777435303} -09/20/2021 16:10:07 - INFO - __main__ - Step 7760: {'lr': 0.00012906666666666667, 'samples': 248320, 'steps': 484, 'loss/train': 6.522986888885498} -09/20/2021 16:10:07 - INFO - __main__ - Step 7761: {'lr': 0.00012933333333333332, 'samples': 248352, 'steps': 485, 'loss/train': 5.485047817230225} -09/20/2021 16:10:08 - INFO - __main__ - Step 7762: {'lr': 0.00012933333333333332, 'samples': 248384, 'steps': 485, 'loss/train': 5.199676990509033} -09/20/2021 16:10:09 - INFO - __main__ - Step 7763: {'lr': 0.00012933333333333332, 'samples': 248416, 'steps': 485, 'loss/train': 5.119121074676514} -09/20/2021 16:10:10 - INFO - __main__ - Step 7764: {'lr': 0.00012933333333333332, 'samples': 248448, 'steps': 485, 'loss/train': 5.225090980529785} -09/20/2021 16:10:10 - INFO - __main__ - Step 7765: {'lr': 0.00012933333333333332, 'samples': 248480, 'steps': 485, 'loss/train': 4.600152015686035} -09/20/2021 16:10:11 - INFO - __main__ - Step 7766: {'lr': 0.00012933333333333332, 'samples': 248512, 'steps': 485, 'loss/train': 4.451647758483887} -09/20/2021 16:10:12 - INFO - __main__ - Step 7767: {'lr': 0.00012933333333333332, 'samples': 248544, 'steps': 485, 'loss/train': 5.232996940612793} -09/20/2021 16:10:13 - INFO - __main__ - Step 7768: {'lr': 0.00012933333333333332, 'samples': 248576, 'steps': 485, 'loss/train': 4.859212398529053} -09/20/2021 16:10:13 - INFO - __main__ - Step 7769: {'lr': 0.00012933333333333332, 'samples': 248608, 'steps': 485, 'loss/train': 5.449426174163818} -09/20/2021 16:10:14 - INFO - __main__ - Step 7770: {'lr': 0.00012933333333333332, 'samples': 248640, 'steps': 485, 'loss/train': 0.8540747165679932} -09/20/2021 16:10:15 - INFO - __main__ - Step 7771: {'lr': 0.00012933333333333332, 'samples': 248672, 'steps': 485, 'loss/train': 4.564017295837402} -09/20/2021 16:10:16 - INFO - __main__ - Step 7772: {'lr': 0.00012933333333333332, 'samples': 248704, 'steps': 485, 'loss/train': 4.36898136138916} -09/20/2021 16:10:16 - INFO - __main__ - Step 7773: {'lr': 0.00012933333333333332, 'samples': 248736, 'steps': 485, 'loss/train': 4.641147136688232} -09/20/2021 16:10:17 - INFO - __main__ - Step 7774: {'lr': 0.00012933333333333332, 'samples': 248768, 'steps': 485, 'loss/train': 4.994087219238281} -09/20/2021 16:10:18 - INFO - __main__ - Step 7775: {'lr': 0.00012933333333333332, 'samples': 248800, 'steps': 485, 'loss/train': 4.63913106918335} -09/20/2021 16:10:19 - INFO - __main__ - Step 7776: {'lr': 0.00012933333333333332, 'samples': 248832, 'steps': 485, 'loss/train': 4.365682601928711} -09/20/2021 16:10:20 - INFO - __main__ - Step 7777: {'lr': 0.0001296, 'samples': 248864, 'steps': 486, 'loss/train': 4.665826320648193} -09/20/2021 16:10:20 - INFO - __main__ - Step 7778: {'lr': 0.0001296, 'samples': 248896, 'steps': 486, 'loss/train': 4.933258533477783} -09/20/2021 16:10:21 - INFO - __main__ - Step 7779: {'lr': 0.0001296, 'samples': 248928, 'steps': 486, 'loss/train': 5.303093910217285} -09/20/2021 16:10:22 - INFO - __main__ - Step 7780: {'lr': 0.0001296, 'samples': 248960, 'steps': 486, 'loss/train': 5.148040294647217} -09/20/2021 16:10:23 - INFO - __main__ - Step 7781: {'lr': 0.0001296, 'samples': 248992, 'steps': 486, 'loss/train': 4.71112585067749} -09/20/2021 16:10:24 - INFO - __main__ - Step 7782: {'lr': 0.0001296, 'samples': 249024, 'steps': 486, 'loss/train': 4.757824420928955} -09/20/2021 16:10:25 - INFO - __main__ - Step 7783: {'lr': 0.0001296, 'samples': 249056, 'steps': 486, 'loss/train': 4.698879241943359} -09/20/2021 16:10:25 - INFO - __main__ - Step 7784: {'lr': 0.0001296, 'samples': 249088, 'steps': 486, 'loss/train': 4.223826885223389} -09/20/2021 16:10:26 - INFO - __main__ - Step 7785: {'lr': 0.0001296, 'samples': 249120, 'steps': 486, 'loss/train': 5.225093364715576} -09/20/2021 16:10:27 - INFO - __main__ - Step 7786: {'lr': 0.0001296, 'samples': 249152, 'steps': 486, 'loss/train': 3.616945505142212} -09/20/2021 16:10:28 - INFO - __main__ - Step 7787: {'lr': 0.0001296, 'samples': 249184, 'steps': 486, 'loss/train': 5.510298252105713} -09/20/2021 16:10:28 - INFO - __main__ - Step 7788: {'lr': 0.0001296, 'samples': 249216, 'steps': 486, 'loss/train': 5.31577730178833} -09/20/2021 16:10:29 - INFO - __main__ - Step 7789: {'lr': 0.0001296, 'samples': 249248, 'steps': 486, 'loss/train': 4.4054460525512695} -09/20/2021 16:10:30 - INFO - __main__ - Step 7790: {'lr': 0.0001296, 'samples': 249280, 'steps': 486, 'loss/train': 5.413074970245361} -09/20/2021 16:10:31 - INFO - __main__ - Step 7791: {'lr': 0.0001296, 'samples': 249312, 'steps': 486, 'loss/train': 5.877654075622559} -09/20/2021 16:10:31 - INFO - __main__ - Step 7792: {'lr': 0.0001296, 'samples': 249344, 'steps': 486, 'loss/train': 4.310831546783447} -09/20/2021 16:10:32 - INFO - __main__ - Step 7793: {'lr': 0.00012986666666666666, 'samples': 249376, 'steps': 487, 'loss/train': 4.261581897735596} -09/20/2021 16:10:33 - INFO - __main__ - Step 7794: {'lr': 0.00012986666666666666, 'samples': 249408, 'steps': 487, 'loss/train': 4.997432231903076} -09/20/2021 16:10:34 - INFO - __main__ - Step 7795: {'lr': 0.00012986666666666666, 'samples': 249440, 'steps': 487, 'loss/train': 5.158768653869629} -09/20/2021 16:10:34 - INFO - __main__ - Step 7796: {'lr': 0.00012986666666666666, 'samples': 249472, 'steps': 487, 'loss/train': 4.538197040557861} -09/20/2021 16:10:35 - INFO - __main__ - Step 7797: {'lr': 0.00012986666666666666, 'samples': 249504, 'steps': 487, 'loss/train': 5.088677883148193} -09/20/2021 16:10:36 - INFO - __main__ - Step 7798: {'lr': 0.00012986666666666666, 'samples': 249536, 'steps': 487, 'loss/train': 5.101759433746338} -09/20/2021 16:10:37 - INFO - __main__ - Step 7799: {'lr': 0.00012986666666666666, 'samples': 249568, 'steps': 487, 'loss/train': 4.863611221313477} -09/20/2021 16:10:37 - INFO - __main__ - Step 7800: {'lr': 0.00012986666666666666, 'samples': 249600, 'steps': 487, 'loss/train': 4.978802680969238} -09/20/2021 16:10:38 - INFO - __main__ - Step 7801: {'lr': 0.00012986666666666666, 'samples': 249632, 'steps': 487, 'loss/train': 4.533084392547607} -09/20/2021 16:10:39 - INFO - __main__ - Step 7802: {'lr': 0.00012986666666666666, 'samples': 249664, 'steps': 487, 'loss/train': 5.053435325622559} -09/20/2021 16:10:40 - INFO - __main__ - Step 7803: {'lr': 0.00012986666666666666, 'samples': 249696, 'steps': 487, 'loss/train': 4.279356479644775} -09/20/2021 16:10:40 - INFO - __main__ - Step 7804: {'lr': 0.00012986666666666666, 'samples': 249728, 'steps': 487, 'loss/train': 5.105947494506836} -09/20/2021 16:10:41 - INFO - __main__ - Step 7805: {'lr': 0.00012986666666666666, 'samples': 249760, 'steps': 487, 'loss/train': 4.761768341064453} -09/20/2021 16:10:42 - INFO - __main__ - Step 7806: {'lr': 0.00012986666666666666, 'samples': 249792, 'steps': 487, 'loss/train': 5.674995422363281} -09/20/2021 16:10:43 - INFO - __main__ - Step 7807: {'lr': 0.00012986666666666666, 'samples': 249824, 'steps': 487, 'loss/train': 5.229672908782959} -09/20/2021 16:10:43 - INFO - __main__ - Step 7808: {'lr': 0.00012986666666666666, 'samples': 249856, 'steps': 487, 'loss/train': 4.1475090980529785} -09/20/2021 16:10:44 - INFO - __main__ - Step 7809: {'lr': 0.00013013333333333332, 'samples': 249888, 'steps': 488, 'loss/train': 4.494261741638184} -09/20/2021 16:10:46 - INFO - __main__ - Step 7810: {'lr': 0.00013013333333333332, 'samples': 249920, 'steps': 488, 'loss/train': 5.301942825317383} -09/20/2021 16:10:47 - INFO - __main__ - Step 7811: {'lr': 0.00013013333333333332, 'samples': 249952, 'steps': 488, 'loss/train': 5.217100143432617} -09/20/2021 16:10:48 - INFO - __main__ - Step 7812: {'lr': 0.00013013333333333332, 'samples': 249984, 'steps': 488, 'loss/train': 4.944485664367676} -09/20/2021 16:10:48 - INFO - __main__ - Step 7813: {'lr': 0.00013013333333333332, 'samples': 250016, 'steps': 488, 'loss/train': 4.790155410766602} -09/20/2021 16:10:49 - INFO - __main__ - Step 7814: {'lr': 0.00013013333333333332, 'samples': 250048, 'steps': 488, 'loss/train': 4.478643417358398} -09/20/2021 16:10:50 - INFO - __main__ - Step 7815: {'lr': 0.00013013333333333332, 'samples': 250080, 'steps': 488, 'loss/train': 4.832804203033447} -09/20/2021 16:10:51 - INFO - __main__ - Step 7816: {'lr': 0.00013013333333333332, 'samples': 250112, 'steps': 488, 'loss/train': 4.519772529602051} -09/20/2021 16:10:51 - INFO - __main__ - Step 7817: {'lr': 0.00013013333333333332, 'samples': 250144, 'steps': 488, 'loss/train': 6.196793556213379} -09/20/2021 16:10:52 - INFO - __main__ - Step 7818: {'lr': 0.00013013333333333332, 'samples': 250176, 'steps': 488, 'loss/train': 5.807190418243408} -09/20/2021 16:10:53 - INFO - __main__ - Step 7819: {'lr': 0.00013013333333333332, 'samples': 250208, 'steps': 488, 'loss/train': 4.5472588539123535} -09/20/2021 16:10:54 - INFO - __main__ - Step 7820: {'lr': 0.00013013333333333332, 'samples': 250240, 'steps': 488, 'loss/train': 5.08791446685791} -09/20/2021 16:10:54 - INFO - __main__ - Step 7821: {'lr': 0.00013013333333333332, 'samples': 250272, 'steps': 488, 'loss/train': 5.684513568878174} -09/20/2021 16:10:55 - INFO - __main__ - Step 7822: {'lr': 0.00013013333333333332, 'samples': 250304, 'steps': 488, 'loss/train': 5.902915000915527} -09/20/2021 16:10:56 - INFO - __main__ - Step 7823: {'lr': 0.00013013333333333332, 'samples': 250336, 'steps': 488, 'loss/train': 4.406017303466797} -09/20/2021 16:10:57 - INFO - __main__ - Step 7824: {'lr': 0.00013013333333333332, 'samples': 250368, 'steps': 488, 'loss/train': 4.0859599113464355} -09/20/2021 16:10:58 - INFO - __main__ - Step 7825: {'lr': 0.0001304, 'samples': 250400, 'steps': 489, 'loss/train': 5.190537452697754} -09/20/2021 16:10:58 - INFO - __main__ - Step 7826: {'lr': 0.0001304, 'samples': 250432, 'steps': 489, 'loss/train': 5.534895420074463} -09/20/2021 16:10:59 - INFO - __main__ - Step 7827: {'lr': 0.0001304, 'samples': 250464, 'steps': 489, 'loss/train': 5.025020122528076} -09/20/2021 16:11:00 - INFO - __main__ - Step 7828: {'lr': 0.0001304, 'samples': 250496, 'steps': 489, 'loss/train': 5.823399543762207} -09/20/2021 16:11:01 - INFO - __main__ - Step 7829: {'lr': 0.0001304, 'samples': 250528, 'steps': 489, 'loss/train': 4.508184909820557} -09/20/2021 16:11:01 - INFO - __main__ - Step 7830: {'lr': 0.0001304, 'samples': 250560, 'steps': 489, 'loss/train': 5.004680633544922} -09/20/2021 16:11:02 - INFO - __main__ - Step 7831: {'lr': 0.0001304, 'samples': 250592, 'steps': 489, 'loss/train': 4.728108882904053} -09/20/2021 16:11:03 - INFO - __main__ - Step 7832: {'lr': 0.0001304, 'samples': 250624, 'steps': 489, 'loss/train': 4.775350093841553} -09/20/2021 16:11:04 - INFO - __main__ - Step 7833: {'lr': 0.0001304, 'samples': 250656, 'steps': 489, 'loss/train': 4.516931533813477} -09/20/2021 16:11:04 - INFO - __main__ - Step 7834: {'lr': 0.0001304, 'samples': 250688, 'steps': 489, 'loss/train': 5.224084377288818} -09/20/2021 16:11:05 - INFO - __main__ - Step 7835: {'lr': 0.0001304, 'samples': 250720, 'steps': 489, 'loss/train': 2.925621271133423} -09/20/2021 16:11:06 - INFO - __main__ - Step 7836: {'lr': 0.0001304, 'samples': 250752, 'steps': 489, 'loss/train': 3.094294548034668} -09/20/2021 16:11:07 - INFO - __main__ - Step 7837: {'lr': 0.0001304, 'samples': 250784, 'steps': 489, 'loss/train': 4.88972806930542} -09/20/2021 16:11:07 - INFO - __main__ - Step 7838: {'lr': 0.0001304, 'samples': 250816, 'steps': 489, 'loss/train': 4.7059149742126465} -09/20/2021 16:11:08 - INFO - __main__ - Step 7839: {'lr': 0.0001304, 'samples': 250848, 'steps': 489, 'loss/train': 4.684230327606201} -09/20/2021 16:11:09 - INFO - __main__ - Step 7840: {'lr': 0.0001304, 'samples': 250880, 'steps': 489, 'loss/train': 4.409826278686523} -09/20/2021 16:11:10 - INFO - __main__ - Step 7841: {'lr': 0.00013066666666666668, 'samples': 250912, 'steps': 490, 'loss/train': 4.657246112823486} -09/20/2021 16:11:11 - INFO - __main__ - Step 7842: {'lr': 0.00013066666666666668, 'samples': 250944, 'steps': 490, 'loss/train': 6.0085883140563965} -09/20/2021 16:11:12 - INFO - __main__ - Step 7843: {'lr': 0.00013066666666666668, 'samples': 250976, 'steps': 490, 'loss/train': 5.314446449279785} -09/20/2021 16:11:12 - INFO - __main__ - Step 7844: {'lr': 0.00013066666666666668, 'samples': 251008, 'steps': 490, 'loss/train': 5.475388526916504} -09/20/2021 16:11:13 - INFO - __main__ - Step 7845: {'lr': 0.00013066666666666668, 'samples': 251040, 'steps': 490, 'loss/train': 5.956265926361084} -09/20/2021 16:11:14 - INFO - __main__ - Step 7846: {'lr': 0.00013066666666666668, 'samples': 251072, 'steps': 490, 'loss/train': 4.029618263244629} -09/20/2021 16:11:15 - INFO - __main__ - Step 7847: {'lr': 0.00013066666666666668, 'samples': 251104, 'steps': 490, 'loss/train': 5.135080814361572} -09/20/2021 16:11:15 - INFO - __main__ - Step 7848: {'lr': 0.00013066666666666668, 'samples': 251136, 'steps': 490, 'loss/train': 5.3769683837890625} -09/20/2021 16:11:16 - INFO - __main__ - Step 7849: {'lr': 0.00013066666666666668, 'samples': 251168, 'steps': 490, 'loss/train': 4.199297904968262} -09/20/2021 16:11:17 - INFO - __main__ - Step 7850: {'lr': 0.00013066666666666668, 'samples': 251200, 'steps': 490, 'loss/train': 4.773329734802246} -09/20/2021 16:11:18 - INFO - __main__ - Step 7851: {'lr': 0.00013066666666666668, 'samples': 251232, 'steps': 490, 'loss/train': 3.0820212364196777} -09/20/2021 16:11:18 - INFO - __main__ - Step 7852: {'lr': 0.00013066666666666668, 'samples': 251264, 'steps': 490, 'loss/train': 5.254916667938232} -09/20/2021 16:11:19 - INFO - __main__ - Step 7853: {'lr': 0.00013066666666666668, 'samples': 251296, 'steps': 490, 'loss/train': 4.272443771362305} -09/20/2021 16:11:20 - INFO - __main__ - Step 7854: {'lr': 0.00013066666666666668, 'samples': 251328, 'steps': 490, 'loss/train': 5.435953140258789} -09/20/2021 16:11:21 - INFO - __main__ - Step 7855: {'lr': 0.00013066666666666668, 'samples': 251360, 'steps': 490, 'loss/train': 4.362133979797363} -09/20/2021 16:11:21 - INFO - __main__ - Step 7856: {'lr': 0.00013066666666666668, 'samples': 251392, 'steps': 490, 'loss/train': 4.806246280670166} -09/20/2021 16:11:22 - INFO - __main__ - Step 7857: {'lr': 0.00013093333333333334, 'samples': 251424, 'steps': 491, 'loss/train': 4.678631782531738} -09/20/2021 16:11:23 - INFO - __main__ - Step 7858: {'lr': 0.00013093333333333334, 'samples': 251456, 'steps': 491, 'loss/train': 4.111815452575684} -09/20/2021 16:11:24 - INFO - __main__ - Step 7859: {'lr': 0.00013093333333333334, 'samples': 251488, 'steps': 491, 'loss/train': 4.176553249359131} -09/20/2021 16:11:25 - INFO - __main__ - Step 7860: {'lr': 0.00013093333333333334, 'samples': 251520, 'steps': 491, 'loss/train': 4.807948589324951} -09/20/2021 16:11:25 - INFO - __main__ - Step 7861: {'lr': 0.00013093333333333334, 'samples': 251552, 'steps': 491, 'loss/train': 4.967971324920654} -09/20/2021 16:11:26 - INFO - __main__ - Step 7862: {'lr': 0.00013093333333333334, 'samples': 251584, 'steps': 491, 'loss/train': 4.837158679962158} -09/20/2021 16:11:27 - INFO - __main__ - Step 7863: {'lr': 0.00013093333333333334, 'samples': 251616, 'steps': 491, 'loss/train': 4.8373284339904785} -09/20/2021 16:11:28 - INFO - __main__ - Step 7864: {'lr': 0.00013093333333333334, 'samples': 251648, 'steps': 491, 'loss/train': 4.637104511260986} -09/20/2021 16:11:28 - INFO - __main__ - Step 7865: {'lr': 0.00013093333333333334, 'samples': 251680, 'steps': 491, 'loss/train': 4.402001857757568} -09/20/2021 16:11:29 - INFO - __main__ - Step 7866: {'lr': 0.00013093333333333334, 'samples': 251712, 'steps': 491, 'loss/train': 4.340337753295898} -09/20/2021 16:11:30 - INFO - __main__ - Step 7867: {'lr': 0.00013093333333333334, 'samples': 251744, 'steps': 491, 'loss/train': 5.077282905578613} -09/20/2021 16:11:31 - INFO - __main__ - Step 7868: {'lr': 0.00013093333333333334, 'samples': 251776, 'steps': 491, 'loss/train': 4.618851184844971} -09/20/2021 16:11:31 - INFO - __main__ - Step 7869: {'lr': 0.00013093333333333334, 'samples': 251808, 'steps': 491, 'loss/train': 5.491179466247559} -09/20/2021 16:11:33 - INFO - __main__ - Step 7870: {'lr': 0.00013093333333333334, 'samples': 251840, 'steps': 491, 'loss/train': 5.48305082321167} -09/20/2021 16:11:33 - INFO - __main__ - Step 7871: {'lr': 0.00013093333333333334, 'samples': 251872, 'steps': 491, 'loss/train': 4.0972394943237305} -09/20/2021 16:11:34 - INFO - __main__ - Step 7872: {'lr': 0.00013093333333333334, 'samples': 251904, 'steps': 491, 'loss/train': 3.478243827819824} -09/20/2021 16:11:35 - INFO - __main__ - Step 7873: {'lr': 0.00013120000000000002, 'samples': 251936, 'steps': 492, 'loss/train': 4.781507968902588} -09/20/2021 16:11:36 - INFO - __main__ - Step 7874: {'lr': 0.00013120000000000002, 'samples': 251968, 'steps': 492, 'loss/train': 4.602396011352539} -09/20/2021 16:11:37 - INFO - __main__ - Step 7875: {'lr': 0.00013120000000000002, 'samples': 252000, 'steps': 492, 'loss/train': 4.643352508544922} -09/20/2021 16:11:37 - INFO - __main__ - Step 7876: {'lr': 0.00013120000000000002, 'samples': 252032, 'steps': 492, 'loss/train': 4.78187894821167} -09/20/2021 16:11:38 - INFO - __main__ - Step 7877: {'lr': 0.00013120000000000002, 'samples': 252064, 'steps': 492, 'loss/train': 4.54573917388916} -09/20/2021 16:11:39 - INFO - __main__ - Step 7878: {'lr': 0.00013120000000000002, 'samples': 252096, 'steps': 492, 'loss/train': 2.2354750633239746} -09/20/2021 16:11:40 - INFO - __main__ - Step 7879: {'lr': 0.00013120000000000002, 'samples': 252128, 'steps': 492, 'loss/train': 3.0203936100006104} -09/20/2021 16:11:40 - INFO - __main__ - Step 7880: {'lr': 0.00013120000000000002, 'samples': 252160, 'steps': 492, 'loss/train': 6.265031337738037} -09/20/2021 16:11:41 - INFO - __main__ - Step 7881: {'lr': 0.00013120000000000002, 'samples': 252192, 'steps': 492, 'loss/train': 5.1673150062561035} -09/20/2021 16:11:42 - INFO - __main__ - Step 7882: {'lr': 0.00013120000000000002, 'samples': 252224, 'steps': 492, 'loss/train': 5.24595308303833} -09/20/2021 16:11:43 - INFO - __main__ - Step 7883: {'lr': 0.00013120000000000002, 'samples': 252256, 'steps': 492, 'loss/train': 4.393604278564453} -09/20/2021 16:11:43 - INFO - __main__ - Step 7884: {'lr': 0.00013120000000000002, 'samples': 252288, 'steps': 492, 'loss/train': 4.272785186767578} -09/20/2021 16:11:44 - INFO - __main__ - Step 7885: {'lr': 0.00013120000000000002, 'samples': 252320, 'steps': 492, 'loss/train': 4.697671890258789} -09/20/2021 16:11:45 - INFO - __main__ - Step 7886: {'lr': 0.00013120000000000002, 'samples': 252352, 'steps': 492, 'loss/train': 6.202086448669434} -09/20/2021 16:11:46 - INFO - __main__ - Step 7887: {'lr': 0.00013120000000000002, 'samples': 252384, 'steps': 492, 'loss/train': 4.052656650543213} -09/20/2021 16:11:46 - INFO - __main__ - Step 7888: {'lr': 0.00013120000000000002, 'samples': 252416, 'steps': 492, 'loss/train': 5.530203819274902} -09/20/2021 16:11:47 - INFO - __main__ - Step 7889: {'lr': 0.00013146666666666667, 'samples': 252448, 'steps': 493, 'loss/train': 5.256258487701416} -09/20/2021 16:11:48 - INFO - __main__ - Step 7890: {'lr': 0.00013146666666666667, 'samples': 252480, 'steps': 493, 'loss/train': 5.047057628631592} -09/20/2021 16:11:49 - INFO - __main__ - Step 7891: {'lr': 0.00013146666666666667, 'samples': 252512, 'steps': 493, 'loss/train': 5.394242286682129} -09/20/2021 16:11:49 - INFO - __main__ - Step 7892: {'lr': 0.00013146666666666667, 'samples': 252544, 'steps': 493, 'loss/train': 5.498025417327881} -09/20/2021 16:11:50 - INFO - __main__ - Step 7893: {'lr': 0.00013146666666666667, 'samples': 252576, 'steps': 493, 'loss/train': 4.737252712249756} -09/20/2021 16:11:51 - INFO - __main__ - Step 7894: {'lr': 0.00013146666666666667, 'samples': 252608, 'steps': 493, 'loss/train': 5.02819299697876} -09/20/2021 16:11:52 - INFO - __main__ - Step 7895: {'lr': 0.00013146666666666667, 'samples': 252640, 'steps': 493, 'loss/train': 4.463802814483643} -09/20/2021 16:11:52 - INFO - __main__ - Step 7896: {'lr': 0.00013146666666666667, 'samples': 252672, 'steps': 493, 'loss/train': 4.371448040008545} -09/20/2021 16:11:53 - INFO - __main__ - Step 7897: {'lr': 0.00013146666666666667, 'samples': 252704, 'steps': 493, 'loss/train': 4.837845802307129} -09/20/2021 16:11:54 - INFO - __main__ - Step 7898: {'lr': 0.00013146666666666667, 'samples': 252736, 'steps': 493, 'loss/train': 4.714407444000244} -09/20/2021 16:11:55 - INFO - __main__ - Step 7899: {'lr': 0.00013146666666666667, 'samples': 252768, 'steps': 493, 'loss/train': 1.303999900817871} -09/20/2021 16:11:55 - INFO - __main__ - Step 7900: {'lr': 0.00013146666666666667, 'samples': 252800, 'steps': 493, 'loss/train': 4.775937557220459} -09/20/2021 16:11:57 - INFO - __main__ - Step 7901: {'lr': 0.00013146666666666667, 'samples': 252832, 'steps': 493, 'loss/train': 4.680009841918945} -09/20/2021 16:11:57 - INFO - __main__ - Step 7902: {'lr': 0.00013146666666666667, 'samples': 252864, 'steps': 493, 'loss/train': 5.772879600524902} -09/20/2021 16:11:58 - INFO - __main__ - Step 7903: {'lr': 0.00013146666666666667, 'samples': 252896, 'steps': 493, 'loss/train': 4.844300746917725} -09/20/2021 16:11:59 - INFO - __main__ - Step 7904: {'lr': 0.00013146666666666667, 'samples': 252928, 'steps': 493, 'loss/train': 4.898494720458984} -09/20/2021 16:12:00 - INFO - __main__ - Step 7905: {'lr': 0.00013173333333333333, 'samples': 252960, 'steps': 494, 'loss/train': 4.5233588218688965} -09/20/2021 16:12:01 - INFO - __main__ - Step 7906: {'lr': 0.00013173333333333333, 'samples': 252992, 'steps': 494, 'loss/train': 4.2702860832214355} -09/20/2021 16:12:01 - INFO - __main__ - Step 7907: {'lr': 0.00013173333333333333, 'samples': 253024, 'steps': 494, 'loss/train': 5.6844482421875} -09/20/2021 16:12:02 - INFO - __main__ - Step 7908: {'lr': 0.00013173333333333333, 'samples': 253056, 'steps': 494, 'loss/train': 5.254024505615234} -09/20/2021 16:12:03 - INFO - __main__ - Step 7909: {'lr': 0.00013173333333333333, 'samples': 253088, 'steps': 494, 'loss/train': 4.645874977111816} -09/20/2021 16:12:04 - INFO - __main__ - Step 7910: {'lr': 0.00013173333333333333, 'samples': 253120, 'steps': 494, 'loss/train': 5.089033126831055} -09/20/2021 16:12:04 - INFO - __main__ - Step 7911: {'lr': 0.00013173333333333333, 'samples': 253152, 'steps': 494, 'loss/train': 4.878950119018555} -09/20/2021 16:12:05 - INFO - __main__ - Step 7912: {'lr': 0.00013173333333333333, 'samples': 253184, 'steps': 494, 'loss/train': 4.242925643920898} -09/20/2021 16:12:06 - INFO - __main__ - Step 7913: {'lr': 0.00013173333333333333, 'samples': 253216, 'steps': 494, 'loss/train': 4.135544776916504} -09/20/2021 16:12:07 - INFO - __main__ - Step 7914: {'lr': 0.00013173333333333333, 'samples': 253248, 'steps': 494, 'loss/train': 4.755489349365234} -09/20/2021 16:12:07 - INFO - __main__ - Step 7915: {'lr': 0.00013173333333333333, 'samples': 253280, 'steps': 494, 'loss/train': 5.419590950012207} -09/20/2021 16:12:08 - INFO - __main__ - Step 7916: {'lr': 0.00013173333333333333, 'samples': 253312, 'steps': 494, 'loss/train': 5.138927936553955} -09/20/2021 16:12:09 - INFO - __main__ - Step 7917: {'lr': 0.00013173333333333333, 'samples': 253344, 'steps': 494, 'loss/train': 5.273261070251465} -09/20/2021 16:12:10 - INFO - __main__ - Step 7918: {'lr': 0.00013173333333333333, 'samples': 253376, 'steps': 494, 'loss/train': 5.038711071014404} -09/20/2021 16:12:10 - INFO - __main__ - Step 7919: {'lr': 0.00013173333333333333, 'samples': 253408, 'steps': 494, 'loss/train': 4.265824317932129} -09/20/2021 16:12:11 - INFO - __main__ - Step 7920: {'lr': 0.00013173333333333333, 'samples': 253440, 'steps': 494, 'loss/train': 5.046384811401367} -09/20/2021 16:12:12 - INFO - __main__ - Step 7921: {'lr': 0.000132, 'samples': 253472, 'steps': 495, 'loss/train': 4.805464744567871} -09/20/2021 16:12:13 - INFO - __main__ - Step 7922: {'lr': 0.000132, 'samples': 253504, 'steps': 495, 'loss/train': 4.7383503913879395} -09/20/2021 16:12:14 - INFO - __main__ - Step 7923: {'lr': 0.000132, 'samples': 253536, 'steps': 495, 'loss/train': 4.624204635620117} -09/20/2021 16:12:14 - INFO - __main__ - Step 7924: {'lr': 0.000132, 'samples': 253568, 'steps': 495, 'loss/train': 3.9876749515533447} -09/20/2021 16:12:15 - INFO - __main__ - Step 7925: {'lr': 0.000132, 'samples': 253600, 'steps': 495, 'loss/train': 4.827192783355713} -09/20/2021 16:12:16 - INFO - __main__ - Step 7926: {'lr': 0.000132, 'samples': 253632, 'steps': 495, 'loss/train': 5.727856159210205} -09/20/2021 16:12:17 - INFO - __main__ - Step 7927: {'lr': 0.000132, 'samples': 253664, 'steps': 495, 'loss/train': 2.1185476779937744} -09/20/2021 16:12:17 - INFO - __main__ - Step 7928: {'lr': 0.000132, 'samples': 253696, 'steps': 495, 'loss/train': 4.7183990478515625} -09/20/2021 16:12:18 - INFO - __main__ - Step 7929: {'lr': 0.000132, 'samples': 253728, 'steps': 495, 'loss/train': 5.014801025390625} -09/20/2021 16:12:19 - INFO - __main__ - Step 7930: {'lr': 0.000132, 'samples': 253760, 'steps': 495, 'loss/train': 5.129844665527344} -09/20/2021 16:12:20 - INFO - __main__ - Step 7931: {'lr': 0.000132, 'samples': 253792, 'steps': 495, 'loss/train': 5.5268874168396} -09/20/2021 16:12:21 - INFO - __main__ - Step 7932: {'lr': 0.000132, 'samples': 253824, 'steps': 495, 'loss/train': 5.887753009796143} -09/20/2021 16:12:22 - INFO - __main__ - Step 7933: {'lr': 0.000132, 'samples': 253856, 'steps': 495, 'loss/train': 5.616817951202393} -09/20/2021 16:12:22 - INFO - __main__ - Step 7934: {'lr': 0.000132, 'samples': 253888, 'steps': 495, 'loss/train': 5.466612815856934} -09/20/2021 16:12:23 - INFO - __main__ - Step 7935: {'lr': 0.000132, 'samples': 253920, 'steps': 495, 'loss/train': 4.695691108703613} -09/20/2021 16:12:24 - INFO - __main__ - Step 7936: {'lr': 0.000132, 'samples': 253952, 'steps': 495, 'loss/train': 5.403289318084717} -09/20/2021 16:12:25 - INFO - __main__ - Step 7937: {'lr': 0.00013226666666666667, 'samples': 253984, 'steps': 496, 'loss/train': 0.7284773588180542} -09/20/2021 16:12:25 - INFO - __main__ - Step 7938: {'lr': 0.00013226666666666667, 'samples': 254016, 'steps': 496, 'loss/train': 4.771432399749756} -09/20/2021 16:12:26 - INFO - __main__ - Step 7939: {'lr': 0.00013226666666666667, 'samples': 254048, 'steps': 496, 'loss/train': 5.095003604888916} -09/20/2021 16:12:27 - INFO - __main__ - Step 7940: {'lr': 0.00013226666666666667, 'samples': 254080, 'steps': 496, 'loss/train': 5.023282527923584} -09/20/2021 16:12:28 - INFO - __main__ - Step 7941: {'lr': 0.00013226666666666667, 'samples': 254112, 'steps': 496, 'loss/train': 4.663234233856201} -09/20/2021 16:12:28 - INFO - __main__ - Step 7942: {'lr': 0.00013226666666666667, 'samples': 254144, 'steps': 496, 'loss/train': 4.852288722991943} -09/20/2021 16:12:29 - INFO - __main__ - Step 7943: {'lr': 0.00013226666666666667, 'samples': 254176, 'steps': 496, 'loss/train': 4.559933662414551} -09/20/2021 16:12:30 - INFO - __main__ - Step 7944: {'lr': 0.00013226666666666667, 'samples': 254208, 'steps': 496, 'loss/train': 5.101560115814209} -09/20/2021 16:12:31 - INFO - __main__ - Step 7945: {'lr': 0.00013226666666666667, 'samples': 254240, 'steps': 496, 'loss/train': 2.5080630779266357} -09/20/2021 16:12:31 - INFO - __main__ - Step 7946: {'lr': 0.00013226666666666667, 'samples': 254272, 'steps': 496, 'loss/train': 4.973417282104492} -09/20/2021 16:12:32 - INFO - __main__ - Step 7947: {'lr': 0.00013226666666666667, 'samples': 254304, 'steps': 496, 'loss/train': 4.937849044799805} -09/20/2021 16:12:33 - INFO - __main__ - Step 7948: {'lr': 0.00013226666666666667, 'samples': 254336, 'steps': 496, 'loss/train': 5.123424053192139} -09/20/2021 16:12:34 - INFO - __main__ - Step 7949: {'lr': 0.00013226666666666667, 'samples': 254368, 'steps': 496, 'loss/train': 5.422667026519775} -09/20/2021 16:12:34 - INFO - __main__ - Step 7950: {'lr': 0.00013226666666666667, 'samples': 254400, 'steps': 496, 'loss/train': 4.934493064880371} -09/20/2021 16:12:35 - INFO - __main__ - Step 7951: {'lr': 0.00013226666666666667, 'samples': 254432, 'steps': 496, 'loss/train': 6.744475841522217} -09/20/2021 16:12:36 - INFO - __main__ - Step 7952: {'lr': 0.00013226666666666667, 'samples': 254464, 'steps': 496, 'loss/train': 6.669126510620117} -09/20/2021 16:12:37 - INFO - __main__ - Step 7953: {'lr': 0.00013253333333333332, 'samples': 254496, 'steps': 497, 'loss/train': 5.435420036315918} -09/20/2021 16:12:38 - INFO - __main__ - Step 7954: {'lr': 0.00013253333333333332, 'samples': 254528, 'steps': 497, 'loss/train': 4.705149173736572} -09/20/2021 16:12:38 - INFO - __main__ - Step 7955: {'lr': 0.00013253333333333332, 'samples': 254560, 'steps': 497, 'loss/train': 5.203330993652344} -09/20/2021 16:12:39 - INFO - __main__ - Step 7956: {'lr': 0.00013253333333333332, 'samples': 254592, 'steps': 497, 'loss/train': 4.521091938018799} -09/20/2021 16:12:40 - INFO - __main__ - Step 7957: {'lr': 0.00013253333333333332, 'samples': 254624, 'steps': 497, 'loss/train': 2.1297194957733154} -09/20/2021 16:12:41 - INFO - __main__ - Step 7958: {'lr': 0.00013253333333333332, 'samples': 254656, 'steps': 497, 'loss/train': 3.9752023220062256} -09/20/2021 16:12:41 - INFO - __main__ - Step 7959: {'lr': 0.00013253333333333332, 'samples': 254688, 'steps': 497, 'loss/train': 4.607245445251465} -09/20/2021 16:12:42 - INFO - __main__ - Step 7960: {'lr': 0.00013253333333333332, 'samples': 254720, 'steps': 497, 'loss/train': 5.2398905754089355} -09/20/2021 16:12:43 - INFO - __main__ - Step 7961: {'lr': 0.00013253333333333332, 'samples': 254752, 'steps': 497, 'loss/train': 4.231736660003662} -09/20/2021 16:12:44 - INFO - __main__ - Step 7962: {'lr': 0.00013253333333333332, 'samples': 254784, 'steps': 497, 'loss/train': 4.390438079833984} -09/20/2021 16:12:45 - INFO - __main__ - Step 7963: {'lr': 0.00013253333333333332, 'samples': 254816, 'steps': 497, 'loss/train': 5.592050075531006} -09/20/2021 16:12:46 - INFO - __main__ - Step 7964: {'lr': 0.00013253333333333332, 'samples': 254848, 'steps': 497, 'loss/train': 4.802499771118164} -09/20/2021 16:12:46 - INFO - __main__ - Step 7965: {'lr': 0.00013253333333333332, 'samples': 254880, 'steps': 497, 'loss/train': 4.761590003967285} -09/20/2021 16:12:47 - INFO - __main__ - Step 7966: {'lr': 0.00013253333333333332, 'samples': 254912, 'steps': 497, 'loss/train': 4.746912002563477} -09/20/2021 16:12:48 - INFO - __main__ - Step 7967: {'lr': 0.00013253333333333332, 'samples': 254944, 'steps': 497, 'loss/train': 4.575090408325195} -09/20/2021 16:12:49 - INFO - __main__ - Step 7968: {'lr': 0.00013253333333333332, 'samples': 254976, 'steps': 497, 'loss/train': 5.301072597503662} -09/20/2021 16:12:50 - INFO - __main__ - Step 7969: {'lr': 0.0001328, 'samples': 255008, 'steps': 498, 'loss/train': 5.160857677459717} -09/20/2021 16:12:50 - INFO - __main__ - Step 7970: {'lr': 0.0001328, 'samples': 255040, 'steps': 498, 'loss/train': 4.706794738769531} -09/20/2021 16:12:51 - INFO - __main__ - Step 7971: {'lr': 0.0001328, 'samples': 255072, 'steps': 498, 'loss/train': 4.758089542388916} -09/20/2021 16:12:52 - INFO - __main__ - Step 7972: {'lr': 0.0001328, 'samples': 255104, 'steps': 498, 'loss/train': 4.580460071563721} -09/20/2021 16:12:53 - INFO - __main__ - Step 7973: {'lr': 0.0001328, 'samples': 255136, 'steps': 498, 'loss/train': 5.471375465393066} -09/20/2021 16:12:53 - INFO - __main__ - Step 7974: {'lr': 0.0001328, 'samples': 255168, 'steps': 498, 'loss/train': 4.566463470458984} -09/20/2021 16:12:54 - INFO - __main__ - Step 7975: {'lr': 0.0001328, 'samples': 255200, 'steps': 498, 'loss/train': 6.256859302520752} -09/20/2021 16:12:55 - INFO - __main__ - Step 7976: {'lr': 0.0001328, 'samples': 255232, 'steps': 498, 'loss/train': 5.852092742919922} -09/20/2021 16:12:56 - INFO - __main__ - Step 7977: {'lr': 0.0001328, 'samples': 255264, 'steps': 498, 'loss/train': 5.360988140106201} -09/20/2021 16:12:56 - INFO - __main__ - Step 7978: {'lr': 0.0001328, 'samples': 255296, 'steps': 498, 'loss/train': 4.929738521575928} -09/20/2021 16:12:57 - INFO - __main__ - Step 7979: {'lr': 0.0001328, 'samples': 255328, 'steps': 498, 'loss/train': 5.803675651550293} -09/20/2021 16:12:58 - INFO - __main__ - Step 7980: {'lr': 0.0001328, 'samples': 255360, 'steps': 498, 'loss/train': 4.632200717926025} -09/20/2021 16:12:59 - INFO - __main__ - Step 7981: {'lr': 0.0001328, 'samples': 255392, 'steps': 498, 'loss/train': 7.568363666534424} -09/20/2021 16:12:59 - INFO - __main__ - Step 7982: {'lr': 0.0001328, 'samples': 255424, 'steps': 498, 'loss/train': 5.304202079772949} -09/20/2021 16:13:00 - INFO - __main__ - Step 7983: {'lr': 0.0001328, 'samples': 255456, 'steps': 498, 'loss/train': 5.3488030433654785} -09/20/2021 16:13:01 - INFO - __main__ - Step 7984: {'lr': 0.0001328, 'samples': 255488, 'steps': 498, 'loss/train': 5.054522514343262} -09/20/2021 16:13:02 - INFO - __main__ - Step 7985: {'lr': 0.00013306666666666668, 'samples': 255520, 'steps': 499, 'loss/train': 5.178238868713379} -09/20/2021 16:13:02 - INFO - __main__ - Step 7986: {'lr': 0.00013306666666666668, 'samples': 255552, 'steps': 499, 'loss/train': 4.551785469055176} -09/20/2021 16:13:03 - INFO - __main__ - Step 7987: {'lr': 0.00013306666666666668, 'samples': 255584, 'steps': 499, 'loss/train': 4.9538421630859375} -09/20/2021 16:13:04 - INFO - __main__ - Step 7988: {'lr': 0.00013306666666666668, 'samples': 255616, 'steps': 499, 'loss/train': 4.999790191650391} -09/20/2021 16:13:05 - INFO - __main__ - Step 7989: {'lr': 0.00013306666666666668, 'samples': 255648, 'steps': 499, 'loss/train': 4.204465866088867} -09/20/2021 16:13:05 - INFO - __main__ - Step 7990: {'lr': 0.00013306666666666668, 'samples': 255680, 'steps': 499, 'loss/train': 3.578065872192383} -09/20/2021 16:13:06 - INFO - __main__ - Step 7991: {'lr': 0.00013306666666666668, 'samples': 255712, 'steps': 499, 'loss/train': 4.81950569152832} -09/20/2021 16:13:07 - INFO - __main__ - Step 7992: {'lr': 0.00013306666666666668, 'samples': 255744, 'steps': 499, 'loss/train': 5.342745780944824} -09/20/2021 16:13:08 - INFO - __main__ - Step 7993: {'lr': 0.00013306666666666668, 'samples': 255776, 'steps': 499, 'loss/train': 4.694540023803711} -09/20/2021 16:13:09 - INFO - __main__ - Step 7994: {'lr': 0.00013306666666666668, 'samples': 255808, 'steps': 499, 'loss/train': 3.722822427749634} -09/20/2021 16:13:10 - INFO - __main__ - Step 7995: {'lr': 0.00013306666666666668, 'samples': 255840, 'steps': 499, 'loss/train': 4.848760604858398} -09/20/2021 16:13:11 - INFO - __main__ - Step 7996: {'lr': 0.00013306666666666668, 'samples': 255872, 'steps': 499, 'loss/train': 4.536911964416504} -09/20/2021 16:13:11 - INFO - __main__ - Step 7997: {'lr': 0.00013306666666666668, 'samples': 255904, 'steps': 499, 'loss/train': 5.274442195892334} -09/20/2021 16:13:12 - INFO - __main__ - Step 7998: {'lr': 0.00013306666666666668, 'samples': 255936, 'steps': 499, 'loss/train': 5.350534439086914} -09/20/2021 16:13:13 - INFO - __main__ - Step 7999: {'lr': 0.00013306666666666668, 'samples': 255968, 'steps': 499, 'loss/train': 4.693626403808594} -09/20/2021 16:13:14 - INFO - __main__ - Step 8000: {'lr': 0.00013306666666666668, 'samples': 256000, 'steps': 499, 'loss/train': 4.094519138336182} -09/20/2021 16:13:15 - INFO - __main__ - Step 8001: {'lr': 0.00013333333333333334, 'samples': 256032, 'steps': 500, 'loss/train': 4.268496513366699} -09/20/2021 16:13:15 - INFO - __main__ - Step 8002: {'lr': 0.00013333333333333334, 'samples': 256064, 'steps': 500, 'loss/train': 3.888932704925537} -09/20/2021 16:13:16 - INFO - __main__ - Step 8003: {'lr': 0.00013333333333333334, 'samples': 256096, 'steps': 500, 'loss/train': 4.3328046798706055} -09/20/2021 16:13:17 - INFO - __main__ - Step 8004: {'lr': 0.00013333333333333334, 'samples': 256128, 'steps': 500, 'loss/train': 4.7644267082214355} -09/20/2021 16:13:18 - INFO - __main__ - Step 8005: {'lr': 0.00013333333333333334, 'samples': 256160, 'steps': 500, 'loss/train': 4.49952507019043} -09/20/2021 16:13:18 - INFO - __main__ - Step 8006: {'lr': 0.00013333333333333334, 'samples': 256192, 'steps': 500, 'loss/train': 4.553197383880615} -09/20/2021 16:13:19 - INFO - __main__ - Step 8007: {'lr': 0.00013333333333333334, 'samples': 256224, 'steps': 500, 'loss/train': 3.622469186782837} -09/20/2021 16:13:20 - INFO - __main__ - Step 8008: {'lr': 0.00013333333333333334, 'samples': 256256, 'steps': 500, 'loss/train': 3.5808801651000977} -09/20/2021 16:13:21 - INFO - __main__ - Step 8009: {'lr': 0.00013333333333333334, 'samples': 256288, 'steps': 500, 'loss/train': 4.895234107971191} -09/20/2021 16:13:21 - INFO - __main__ - Step 8010: {'lr': 0.00013333333333333334, 'samples': 256320, 'steps': 500, 'loss/train': 4.859447956085205} -09/20/2021 16:13:22 - INFO - __main__ - Step 8011: {'lr': 0.00013333333333333334, 'samples': 256352, 'steps': 500, 'loss/train': 3.9976391792297363} -09/20/2021 16:13:23 - INFO - __main__ - Step 8012: {'lr': 0.00013333333333333334, 'samples': 256384, 'steps': 500, 'loss/train': 4.773595333099365} -09/20/2021 16:13:24 - INFO - __main__ - Step 8013: {'lr': 0.00013333333333333334, 'samples': 256416, 'steps': 500, 'loss/train': 5.03000020980835} -09/20/2021 16:13:24 - INFO - __main__ - Step 8014: {'lr': 0.00013333333333333334, 'samples': 256448, 'steps': 500, 'loss/train': 6.072232723236084} -09/20/2021 16:13:25 - INFO - __main__ - Step 8015: {'lr': 0.00013333333333333334, 'samples': 256480, 'steps': 500, 'loss/train': 5.0477519035339355} -09/20/2021 16:13:26 - INFO - __main__ - Step 8016: {'lr': 0.00013333333333333334, 'samples': 256512, 'steps': 500, 'loss/train': 4.503360271453857} -09/20/2021 16:13:27 - INFO - __main__ - Step 8017: {'lr': 0.00013360000000000002, 'samples': 256544, 'steps': 501, 'loss/train': 4.990461349487305} -09/20/2021 16:13:27 - INFO - __main__ - Step 8018: {'lr': 0.00013360000000000002, 'samples': 256576, 'steps': 501, 'loss/train': 4.943474769592285} -09/20/2021 16:13:28 - INFO - __main__ - Step 8019: {'lr': 0.00013360000000000002, 'samples': 256608, 'steps': 501, 'loss/train': 4.581838607788086} -09/20/2021 16:13:29 - INFO - __main__ - Step 8020: {'lr': 0.00013360000000000002, 'samples': 256640, 'steps': 501, 'loss/train': 4.2589569091796875} -09/20/2021 16:13:30 - INFO - __main__ - Step 8021: {'lr': 0.00013360000000000002, 'samples': 256672, 'steps': 501, 'loss/train': 4.4473557472229} -09/20/2021 16:13:30 - INFO - __main__ - Step 8022: {'lr': 0.00013360000000000002, 'samples': 256704, 'steps': 501, 'loss/train': 4.46104097366333} -09/20/2021 16:13:31 - INFO - __main__ - Step 8023: {'lr': 0.00013360000000000002, 'samples': 256736, 'steps': 501, 'loss/train': 4.999881744384766} -09/20/2021 16:13:32 - INFO - __main__ - Step 8024: {'lr': 0.00013360000000000002, 'samples': 256768, 'steps': 501, 'loss/train': 4.7594895362854} -09/20/2021 16:13:33 - INFO - __main__ - Step 8025: {'lr': 0.00013360000000000002, 'samples': 256800, 'steps': 501, 'loss/train': 5.667740345001221} -09/20/2021 16:13:34 - INFO - __main__ - Step 8026: {'lr': 0.00013360000000000002, 'samples': 256832, 'steps': 501, 'loss/train': 4.617949962615967} -09/20/2021 16:13:35 - INFO - __main__ - Step 8027: {'lr': 0.00013360000000000002, 'samples': 256864, 'steps': 501, 'loss/train': 4.114779949188232} -09/20/2021 16:13:35 - INFO - __main__ - Step 8028: {'lr': 0.00013360000000000002, 'samples': 256896, 'steps': 501, 'loss/train': 4.1675238609313965} -09/20/2021 16:13:36 - INFO - __main__ - Step 8029: {'lr': 0.00013360000000000002, 'samples': 256928, 'steps': 501, 'loss/train': 5.051292896270752} -09/20/2021 16:13:37 - INFO - __main__ - Step 8030: {'lr': 0.00013360000000000002, 'samples': 256960, 'steps': 501, 'loss/train': 4.3770365715026855} -09/20/2021 16:13:38 - INFO - __main__ - Step 8031: {'lr': 0.00013360000000000002, 'samples': 256992, 'steps': 501, 'loss/train': 4.954093933105469} -09/20/2021 16:13:38 - INFO - __main__ - Step 8032: {'lr': 0.00013360000000000002, 'samples': 257024, 'steps': 501, 'loss/train': 5.470209121704102} -09/20/2021 16:13:39 - INFO - __main__ - Step 8033: {'lr': 0.00013386666666666668, 'samples': 257056, 'steps': 502, 'loss/train': 4.461838722229004} -09/20/2021 16:13:40 - INFO - __main__ - Step 8034: {'lr': 0.00013386666666666668, 'samples': 257088, 'steps': 502, 'loss/train': 5.0109357833862305} -09/20/2021 16:13:41 - INFO - __main__ - Step 8035: {'lr': 0.00013386666666666668, 'samples': 257120, 'steps': 502, 'loss/train': 4.629079818725586} -09/20/2021 16:13:42 - INFO - __main__ - Step 8036: {'lr': 0.00013386666666666668, 'samples': 257152, 'steps': 502, 'loss/train': 4.6598992347717285} -09/20/2021 16:13:42 - INFO - __main__ - Step 8037: {'lr': 0.00013386666666666668, 'samples': 257184, 'steps': 502, 'loss/train': 5.516654968261719} -09/20/2021 16:13:43 - INFO - __main__ - Step 8038: {'lr': 0.00013386666666666668, 'samples': 257216, 'steps': 502, 'loss/train': 5.264680862426758} -09/20/2021 16:13:44 - INFO - __main__ - Step 8039: {'lr': 0.00013386666666666668, 'samples': 257248, 'steps': 502, 'loss/train': 4.357647895812988} -09/20/2021 16:13:45 - INFO - __main__ - Step 8040: {'lr': 0.00013386666666666668, 'samples': 257280, 'steps': 502, 'loss/train': 4.886534214019775} -09/20/2021 16:13:45 - INFO - __main__ - Step 8041: {'lr': 0.00013386666666666668, 'samples': 257312, 'steps': 502, 'loss/train': 4.613530158996582} -09/20/2021 16:13:46 - INFO - __main__ - Step 8042: {'lr': 0.00013386666666666668, 'samples': 257344, 'steps': 502, 'loss/train': 4.815621376037598} -09/20/2021 16:13:47 - INFO - __main__ - Step 8043: {'lr': 0.00013386666666666668, 'samples': 257376, 'steps': 502, 'loss/train': 5.485581398010254} -09/20/2021 16:13:48 - INFO - __main__ - Step 8044: {'lr': 0.00013386666666666668, 'samples': 257408, 'steps': 502, 'loss/train': 6.067444801330566} -09/20/2021 16:13:48 - INFO - __main__ - Step 8045: {'lr': 0.00013386666666666668, 'samples': 257440, 'steps': 502, 'loss/train': 4.465749263763428} -09/20/2021 16:13:49 - INFO - __main__ - Step 8046: {'lr': 0.00013386666666666668, 'samples': 257472, 'steps': 502, 'loss/train': 5.145448684692383} -09/20/2021 16:13:50 - INFO - __main__ - Step 8047: {'lr': 0.00013386666666666668, 'samples': 257504, 'steps': 502, 'loss/train': 4.104377269744873} -09/20/2021 16:13:51 - INFO - __main__ - Step 8048: {'lr': 0.00013386666666666668, 'samples': 257536, 'steps': 502, 'loss/train': 5.085182189941406} -09/20/2021 16:13:51 - INFO - __main__ - Step 8049: {'lr': 0.00013413333333333333, 'samples': 257568, 'steps': 503, 'loss/train': 4.683269500732422} -09/20/2021 16:13:52 - INFO - __main__ - Step 8050: {'lr': 0.00013413333333333333, 'samples': 257600, 'steps': 503, 'loss/train': 4.422253608703613} -09/20/2021 16:13:53 - INFO - __main__ - Step 8051: {'lr': 0.00013413333333333333, 'samples': 257632, 'steps': 503, 'loss/train': 4.7349748611450195} -09/20/2021 16:13:54 - INFO - __main__ - Step 8052: {'lr': 0.00013413333333333333, 'samples': 257664, 'steps': 503, 'loss/train': 4.286820411682129} -09/20/2021 16:13:54 - INFO - __main__ - Step 8053: {'lr': 0.00013413333333333333, 'samples': 257696, 'steps': 503, 'loss/train': 4.810722827911377} -09/20/2021 16:13:55 - INFO - __main__ - Step 8054: {'lr': 0.00013413333333333333, 'samples': 257728, 'steps': 503, 'loss/train': 4.961278438568115} -09/20/2021 16:13:56 - INFO - __main__ - Step 8055: {'lr': 0.00013413333333333333, 'samples': 257760, 'steps': 503, 'loss/train': 4.717992782592773} -09/20/2021 16:13:57 - INFO - __main__ - Step 8056: {'lr': 0.00013413333333333333, 'samples': 257792, 'steps': 503, 'loss/train': 3.4281272888183594} -09/20/2021 16:13:58 - INFO - __main__ - Step 8057: {'lr': 0.00013413333333333333, 'samples': 257824, 'steps': 503, 'loss/train': 4.834129333496094} -09/20/2021 16:13:59 - INFO - __main__ - Step 8058: {'lr': 0.00013413333333333333, 'samples': 257856, 'steps': 503, 'loss/train': 7.238846302032471} -09/20/2021 16:14:00 - INFO - __main__ - Step 8059: {'lr': 0.00013413333333333333, 'samples': 257888, 'steps': 503, 'loss/train': 6.039786338806152} -09/20/2021 16:14:00 - INFO - __main__ - Step 8060: {'lr': 0.00013413333333333333, 'samples': 257920, 'steps': 503, 'loss/train': 5.735358238220215} -09/20/2021 16:14:01 - INFO - __main__ - Step 8061: {'lr': 0.00013413333333333333, 'samples': 257952, 'steps': 503, 'loss/train': 4.44685697555542} -09/20/2021 16:14:02 - INFO - __main__ - Step 8062: {'lr': 0.00013413333333333333, 'samples': 257984, 'steps': 503, 'loss/train': 4.809537887573242} -09/20/2021 16:14:03 - INFO - __main__ - Step 8063: {'lr': 0.00013413333333333333, 'samples': 258016, 'steps': 503, 'loss/train': 3.955595016479492} -09/20/2021 16:14:03 - INFO - __main__ - Step 8064: {'lr': 0.00013413333333333333, 'samples': 258048, 'steps': 503, 'loss/train': 4.685600280761719} -09/20/2021 16:14:04 - INFO - __main__ - Step 8065: {'lr': 0.00013440000000000001, 'samples': 258080, 'steps': 504, 'loss/train': 5.07699728012085} -09/20/2021 16:14:05 - INFO - __main__ - Step 8066: {'lr': 0.00013440000000000001, 'samples': 258112, 'steps': 504, 'loss/train': 5.019253253936768} -09/20/2021 16:14:06 - INFO - __main__ - Step 8067: {'lr': 0.00013440000000000001, 'samples': 258144, 'steps': 504, 'loss/train': 4.499202728271484} -09/20/2021 16:14:06 - INFO - __main__ - Step 8068: {'lr': 0.00013440000000000001, 'samples': 258176, 'steps': 504, 'loss/train': 5.19895076751709} -09/20/2021 16:14:07 - INFO - __main__ - Step 8069: {'lr': 0.00013440000000000001, 'samples': 258208, 'steps': 504, 'loss/train': 4.397487640380859} -09/20/2021 16:14:08 - INFO - __main__ - Step 8070: {'lr': 0.00013440000000000001, 'samples': 258240, 'steps': 504, 'loss/train': 5.155936241149902} -09/20/2021 16:14:09 - INFO - __main__ - Step 8071: {'lr': 0.00013440000000000001, 'samples': 258272, 'steps': 504, 'loss/train': 4.550515651702881} -09/20/2021 16:14:09 - INFO - __main__ - Step 8072: {'lr': 0.00013440000000000001, 'samples': 258304, 'steps': 504, 'loss/train': 4.386971950531006} -09/20/2021 16:14:10 - INFO - __main__ - Step 8073: {'lr': 0.00013440000000000001, 'samples': 258336, 'steps': 504, 'loss/train': 5.138436794281006} -09/20/2021 16:14:11 - INFO - __main__ - Step 8074: {'lr': 0.00013440000000000001, 'samples': 258368, 'steps': 504, 'loss/train': 4.886171817779541} -09/20/2021 16:14:12 - INFO - __main__ - Step 8075: {'lr': 0.00013440000000000001, 'samples': 258400, 'steps': 504, 'loss/train': 4.83590841293335} -09/20/2021 16:14:12 - INFO - __main__ - Step 8076: {'lr': 0.00013440000000000001, 'samples': 258432, 'steps': 504, 'loss/train': 5.193584442138672} -09/20/2021 16:14:13 - INFO - __main__ - Step 8077: {'lr': 0.00013440000000000001, 'samples': 258464, 'steps': 504, 'loss/train': 4.3650593757629395} -09/20/2021 16:14:14 - INFO - __main__ - Step 8078: {'lr': 0.00013440000000000001, 'samples': 258496, 'steps': 504, 'loss/train': 6.547563076019287} -09/20/2021 16:14:15 - INFO - __main__ - Step 8079: {'lr': 0.00013440000000000001, 'samples': 258528, 'steps': 504, 'loss/train': 5.035971164703369} -09/20/2021 16:14:15 - INFO - __main__ - Step 8080: {'lr': 0.00013440000000000001, 'samples': 258560, 'steps': 504, 'loss/train': 3.99605655670166} -09/20/2021 16:14:16 - INFO - __main__ - Step 8081: {'lr': 0.00013466666666666667, 'samples': 258592, 'steps': 505, 'loss/train': 4.113707542419434} -09/20/2021 16:14:17 - INFO - __main__ - Step 8082: {'lr': 0.00013466666666666667, 'samples': 258624, 'steps': 505, 'loss/train': 4.8886213302612305} -09/20/2021 16:14:18 - INFO - __main__ - Step 8083: {'lr': 0.00013466666666666667, 'samples': 258656, 'steps': 505, 'loss/train': 5.1680779457092285} -09/20/2021 16:14:19 - INFO - __main__ - Step 8084: {'lr': 0.00013466666666666667, 'samples': 258688, 'steps': 505, 'loss/train': 4.571174144744873} -09/20/2021 16:14:19 - INFO - __main__ - Step 8085: {'lr': 0.00013466666666666667, 'samples': 258720, 'steps': 505, 'loss/train': 5.372359752655029} -09/20/2021 16:14:21 - INFO - __main__ - Step 8086: {'lr': 0.00013466666666666667, 'samples': 258752, 'steps': 505, 'loss/train': 5.088579177856445} -09/20/2021 16:14:21 - INFO - __main__ - Step 8087: {'lr': 0.00013466666666666667, 'samples': 258784, 'steps': 505, 'loss/train': 6.4174370765686035} -09/20/2021 16:14:22 - INFO - __main__ - Step 8088: {'lr': 0.00013466666666666667, 'samples': 258816, 'steps': 505, 'loss/train': 4.652072906494141} -09/20/2021 16:14:23 - INFO - __main__ - Step 8089: {'lr': 0.00013466666666666667, 'samples': 258848, 'steps': 505, 'loss/train': 4.090162754058838} -09/20/2021 16:14:24 - INFO - __main__ - Step 8090: {'lr': 0.00013466666666666667, 'samples': 258880, 'steps': 505, 'loss/train': 4.398613929748535} -09/20/2021 16:14:24 - INFO - __main__ - Step 8091: {'lr': 0.00013466666666666667, 'samples': 258912, 'steps': 505, 'loss/train': 2.4576117992401123} -09/20/2021 16:14:25 - INFO - __main__ - Step 8092: {'lr': 0.00013466666666666667, 'samples': 258944, 'steps': 505, 'loss/train': 2.5563557147979736} -09/20/2021 16:14:26 - INFO - __main__ - Step 8093: {'lr': 0.00013466666666666667, 'samples': 258976, 'steps': 505, 'loss/train': 5.04499626159668} -09/20/2021 16:14:27 - INFO - __main__ - Step 8094: {'lr': 0.00013466666666666667, 'samples': 259008, 'steps': 505, 'loss/train': 5.035996437072754} -09/20/2021 16:14:27 - INFO - __main__ - Step 8095: {'lr': 0.00013466666666666667, 'samples': 259040, 'steps': 505, 'loss/train': 4.754516124725342} -09/20/2021 16:14:28 - INFO - __main__ - Step 8096: {'lr': 0.00013466666666666667, 'samples': 259072, 'steps': 505, 'loss/train': 4.840994834899902} -09/20/2021 16:14:29 - INFO - __main__ - Step 8097: {'lr': 0.00013493333333333332, 'samples': 259104, 'steps': 506, 'loss/train': 3.974989414215088} -09/20/2021 16:14:30 - INFO - __main__ - Step 8098: {'lr': 0.00013493333333333332, 'samples': 259136, 'steps': 506, 'loss/train': 5.577053546905518} -09/20/2021 16:14:31 - INFO - __main__ - Step 8099: {'lr': 0.00013493333333333332, 'samples': 259168, 'steps': 506, 'loss/train': 5.393185615539551} -09/20/2021 16:14:31 - INFO - __main__ - Step 8100: {'lr': 0.00013493333333333332, 'samples': 259200, 'steps': 506, 'loss/train': 5.439890384674072} -09/20/2021 16:14:32 - INFO - __main__ - Step 8101: {'lr': 0.00013493333333333332, 'samples': 259232, 'steps': 506, 'loss/train': 4.932602405548096} -09/20/2021 16:14:33 - INFO - __main__ - Step 8102: {'lr': 0.00013493333333333332, 'samples': 259264, 'steps': 506, 'loss/train': 5.038383483886719} -09/20/2021 16:14:34 - INFO - __main__ - Step 8103: {'lr': 0.00013493333333333332, 'samples': 259296, 'steps': 506, 'loss/train': 4.480461120605469} -09/20/2021 16:14:34 - INFO - __main__ - Step 8104: {'lr': 0.00013493333333333332, 'samples': 259328, 'steps': 506, 'loss/train': 3.972581386566162} -09/20/2021 16:14:35 - INFO - __main__ - Step 8105: {'lr': 0.00013493333333333332, 'samples': 259360, 'steps': 506, 'loss/train': 4.783412933349609} -09/20/2021 16:14:36 - INFO - __main__ - Step 8106: {'lr': 0.00013493333333333332, 'samples': 259392, 'steps': 506, 'loss/train': 4.812092304229736} -09/20/2021 16:14:37 - INFO - __main__ - Step 8107: {'lr': 0.00013493333333333332, 'samples': 259424, 'steps': 506, 'loss/train': 4.9373579025268555} -09/20/2021 16:14:37 - INFO - __main__ - Step 8108: {'lr': 0.00013493333333333332, 'samples': 259456, 'steps': 506, 'loss/train': 4.77292013168335} -09/20/2021 16:14:38 - INFO - __main__ - Step 8109: {'lr': 0.00013493333333333332, 'samples': 259488, 'steps': 506, 'loss/train': 4.24783992767334} -09/20/2021 16:14:39 - INFO - __main__ - Step 8110: {'lr': 0.00013493333333333332, 'samples': 259520, 'steps': 506, 'loss/train': 2.9067916870117188} -09/20/2021 16:14:40 - INFO - __main__ - Step 8111: {'lr': 0.00013493333333333332, 'samples': 259552, 'steps': 506, 'loss/train': 5.426432132720947} -09/20/2021 16:14:40 - INFO - __main__ - Step 8112: {'lr': 0.00013493333333333332, 'samples': 259584, 'steps': 506, 'loss/train': 5.114521026611328} -09/20/2021 16:14:41 - INFO - __main__ - Step 8113: {'lr': 0.0001352, 'samples': 259616, 'steps': 507, 'loss/train': 5.066030502319336} -09/20/2021 16:14:42 - INFO - __main__ - Step 8114: {'lr': 0.0001352, 'samples': 259648, 'steps': 507, 'loss/train': 5.180427551269531} -09/20/2021 16:14:43 - INFO - __main__ - Step 8115: {'lr': 0.0001352, 'samples': 259680, 'steps': 507, 'loss/train': 6.408442497253418} -09/20/2021 16:14:43 - INFO - __main__ - Step 8116: {'lr': 0.0001352, 'samples': 259712, 'steps': 507, 'loss/train': 4.816753387451172} -09/20/2021 16:14:44 - INFO - __main__ - Step 8117: {'lr': 0.0001352, 'samples': 259744, 'steps': 507, 'loss/train': 5.127864360809326} -09/20/2021 16:14:45 - INFO - __main__ - Step 8118: {'lr': 0.0001352, 'samples': 259776, 'steps': 507, 'loss/train': 4.919224739074707} -09/20/2021 16:14:46 - INFO - __main__ - Step 8119: {'lr': 0.0001352, 'samples': 259808, 'steps': 507, 'loss/train': 4.5529866218566895} -09/20/2021 16:14:47 - INFO - __main__ - Step 8120: {'lr': 0.0001352, 'samples': 259840, 'steps': 507, 'loss/train': 5.0290679931640625} -09/20/2021 16:14:48 - INFO - __main__ - Step 8121: {'lr': 0.0001352, 'samples': 259872, 'steps': 507, 'loss/train': 5.491666316986084} -09/20/2021 16:14:48 - INFO - __main__ - Step 8122: {'lr': 0.0001352, 'samples': 259904, 'steps': 507, 'loss/train': 4.558452129364014} -09/20/2021 16:14:49 - INFO - __main__ - Step 8123: {'lr': 0.0001352, 'samples': 259936, 'steps': 507, 'loss/train': 4.753674030303955} -09/20/2021 16:14:50 - INFO - __main__ - Step 8124: {'lr': 0.0001352, 'samples': 259968, 'steps': 507, 'loss/train': 4.681117534637451} -09/20/2021 16:14:51 - INFO - __main__ - Step 8125: {'lr': 0.0001352, 'samples': 260000, 'steps': 507, 'loss/train': 4.26437520980835} -09/20/2021 16:14:51 - INFO - __main__ - Step 8126: {'lr': 0.0001352, 'samples': 260032, 'steps': 507, 'loss/train': 4.632114887237549} -09/20/2021 16:14:52 - INFO - __main__ - Step 8127: {'lr': 0.0001352, 'samples': 260064, 'steps': 507, 'loss/train': 4.628859519958496} -09/20/2021 16:14:53 - INFO - __main__ - Step 8128: {'lr': 0.0001352, 'samples': 260096, 'steps': 507, 'loss/train': 0.8551200032234192} -09/20/2021 16:14:54 - INFO - __main__ - Step 8129: {'lr': 0.00013546666666666666, 'samples': 260128, 'steps': 508, 'loss/train': 4.437031269073486} -09/20/2021 16:14:55 - INFO - __main__ - Step 8130: {'lr': 0.00013546666666666666, 'samples': 260160, 'steps': 508, 'loss/train': 4.438231945037842} -09/20/2021 16:14:55 - INFO - __main__ - Step 8131: {'lr': 0.00013546666666666666, 'samples': 260192, 'steps': 508, 'loss/train': 3.785069704055786} -09/20/2021 16:14:56 - INFO - __main__ - Step 8132: {'lr': 0.00013546666666666666, 'samples': 260224, 'steps': 508, 'loss/train': 5.029649257659912} -09/20/2021 16:14:57 - INFO - __main__ - Step 8133: {'lr': 0.00013546666666666666, 'samples': 260256, 'steps': 508, 'loss/train': 5.029013156890869} -09/20/2021 16:14:58 - INFO - __main__ - Step 8134: {'lr': 0.00013546666666666666, 'samples': 260288, 'steps': 508, 'loss/train': 5.7491044998168945} -09/20/2021 16:14:58 - INFO - __main__ - Step 8135: {'lr': 0.00013546666666666666, 'samples': 260320, 'steps': 508, 'loss/train': 4.83797550201416} -09/20/2021 16:14:59 - INFO - __main__ - Step 8136: {'lr': 0.00013546666666666666, 'samples': 260352, 'steps': 508, 'loss/train': 5.175710678100586} -09/20/2021 16:15:00 - INFO - __main__ - Step 8137: {'lr': 0.00013546666666666666, 'samples': 260384, 'steps': 508, 'loss/train': 5.078213691711426} -09/20/2021 16:15:01 - INFO - __main__ - Step 8138: {'lr': 0.00013546666666666666, 'samples': 260416, 'steps': 508, 'loss/train': 5.9627485275268555} -09/20/2021 16:15:01 - INFO - __main__ - Step 8139: {'lr': 0.00013546666666666666, 'samples': 260448, 'steps': 508, 'loss/train': 4.812012195587158} -09/20/2021 16:15:02 - INFO - __main__ - Step 8140: {'lr': 0.00013546666666666666, 'samples': 260480, 'steps': 508, 'loss/train': 5.156847953796387} -09/20/2021 16:15:03 - INFO - __main__ - Step 8141: {'lr': 0.00013546666666666666, 'samples': 260512, 'steps': 508, 'loss/train': 4.950094223022461} -09/20/2021 16:15:04 - INFO - __main__ - Step 8142: {'lr': 0.00013546666666666666, 'samples': 260544, 'steps': 508, 'loss/train': 6.048647880554199} -09/20/2021 16:15:04 - INFO - __main__ - Step 8143: {'lr': 0.00013546666666666666, 'samples': 260576, 'steps': 508, 'loss/train': 4.1268157958984375} -09/20/2021 16:15:05 - INFO - __main__ - Step 8144: {'lr': 0.00013546666666666666, 'samples': 260608, 'steps': 508, 'loss/train': 4.773965358734131} -09/20/2021 16:15:06 - INFO - __main__ - Step 8145: {'lr': 0.00013573333333333334, 'samples': 260640, 'steps': 509, 'loss/train': 4.486992835998535} -09/20/2021 16:15:07 - INFO - __main__ - Step 8146: {'lr': 0.00013573333333333334, 'samples': 260672, 'steps': 509, 'loss/train': 5.779450416564941} -09/20/2021 16:15:07 - INFO - __main__ - Step 8147: {'lr': 0.00013573333333333334, 'samples': 260704, 'steps': 509, 'loss/train': 2.7769856452941895} -09/20/2021 16:15:09 - INFO - __main__ - Step 8148: {'lr': 0.00013573333333333334, 'samples': 260736, 'steps': 509, 'loss/train': 4.050869941711426} -09/20/2021 16:15:10 - INFO - __main__ - Step 8149: {'lr': 0.00013573333333333334, 'samples': 260768, 'steps': 509, 'loss/train': 4.496238708496094} -09/20/2021 16:15:11 - INFO - __main__ - Step 8150: {'lr': 0.00013573333333333334, 'samples': 260800, 'steps': 509, 'loss/train': 4.687173843383789} -09/20/2021 16:15:12 - INFO - __main__ - Step 8151: {'lr': 0.00013573333333333334, 'samples': 260832, 'steps': 509, 'loss/train': 4.935514450073242} -09/20/2021 16:15:12 - INFO - __main__ - Step 8152: {'lr': 0.00013573333333333334, 'samples': 260864, 'steps': 509, 'loss/train': 5.854527473449707} -09/20/2021 16:15:13 - INFO - __main__ - Step 8153: {'lr': 0.00013573333333333334, 'samples': 260896, 'steps': 509, 'loss/train': 4.77799129486084} -09/20/2021 16:15:14 - INFO - __main__ - Step 8154: {'lr': 0.00013573333333333334, 'samples': 260928, 'steps': 509, 'loss/train': 5.2923994064331055} -09/20/2021 16:15:15 - INFO - __main__ - Step 8155: {'lr': 0.00013573333333333334, 'samples': 260960, 'steps': 509, 'loss/train': 4.158280372619629} -09/20/2021 16:15:15 - INFO - __main__ - Step 8156: {'lr': 0.00013573333333333334, 'samples': 260992, 'steps': 509, 'loss/train': 5.326257228851318} -09/20/2021 16:15:16 - INFO - __main__ - Step 8157: {'lr': 0.00013573333333333334, 'samples': 261024, 'steps': 509, 'loss/train': 5.390577793121338} -09/20/2021 16:15:17 - INFO - __main__ - Step 8158: {'lr': 0.00013573333333333334, 'samples': 261056, 'steps': 509, 'loss/train': 5.539467811584473} -09/20/2021 16:15:18 - INFO - __main__ - Step 8159: {'lr': 0.00013573333333333334, 'samples': 261088, 'steps': 509, 'loss/train': 5.127799034118652} -09/20/2021 16:15:18 - INFO - __main__ - Step 8160: {'lr': 0.00013573333333333334, 'samples': 261120, 'steps': 509, 'loss/train': 4.2862019538879395} -09/20/2021 16:15:19 - INFO - __main__ - Step 8161: {'lr': 0.00013600000000000003, 'samples': 261152, 'steps': 510, 'loss/train': 5.293164253234863} -09/20/2021 16:15:20 - INFO - __main__ - Step 8162: {'lr': 0.00013600000000000003, 'samples': 261184, 'steps': 510, 'loss/train': 5.077103137969971} -09/20/2021 16:15:21 - INFO - __main__ - Step 8163: {'lr': 0.00013600000000000003, 'samples': 261216, 'steps': 510, 'loss/train': 4.709159851074219} -09/20/2021 16:15:21 - INFO - __main__ - Step 8164: {'lr': 0.00013600000000000003, 'samples': 261248, 'steps': 510, 'loss/train': 3.4721593856811523} -09/20/2021 16:15:22 - INFO - __main__ - Step 8165: {'lr': 0.00013600000000000003, 'samples': 261280, 'steps': 510, 'loss/train': 3.7943549156188965} -09/20/2021 16:15:23 - INFO - __main__ - Step 8166: {'lr': 0.00013600000000000003, 'samples': 261312, 'steps': 510, 'loss/train': 4.421189785003662} -09/20/2021 16:15:24 - INFO - __main__ - Step 8167: {'lr': 0.00013600000000000003, 'samples': 261344, 'steps': 510, 'loss/train': 6.0911545753479} -09/20/2021 16:15:24 - INFO - __main__ - Step 8168: {'lr': 0.00013600000000000003, 'samples': 261376, 'steps': 510, 'loss/train': 4.498915195465088} -09/20/2021 16:15:25 - INFO - __main__ - Step 8169: {'lr': 0.00013600000000000003, 'samples': 261408, 'steps': 510, 'loss/train': 5.080559253692627} -09/20/2021 16:15:26 - INFO - __main__ - Step 8170: {'lr': 0.00013600000000000003, 'samples': 261440, 'steps': 510, 'loss/train': 5.042623043060303} -09/20/2021 16:15:27 - INFO - __main__ - Step 8171: {'lr': 0.00013600000000000003, 'samples': 261472, 'steps': 510, 'loss/train': 4.506575584411621} -09/20/2021 16:15:27 - INFO - __main__ - Step 8172: {'lr': 0.00013600000000000003, 'samples': 261504, 'steps': 510, 'loss/train': 5.100335121154785} -09/20/2021 16:15:28 - INFO - __main__ - Step 8173: {'lr': 0.00013600000000000003, 'samples': 261536, 'steps': 510, 'loss/train': 5.150991916656494} -09/20/2021 16:15:29 - INFO - __main__ - Step 8174: {'lr': 0.00013600000000000003, 'samples': 261568, 'steps': 510, 'loss/train': 4.774386882781982} -09/20/2021 16:15:30 - INFO - __main__ - Step 8175: {'lr': 0.00013600000000000003, 'samples': 261600, 'steps': 510, 'loss/train': 4.29871940612793} -09/20/2021 16:15:30 - INFO - __main__ - Step 8176: {'lr': 0.00013600000000000003, 'samples': 261632, 'steps': 510, 'loss/train': 4.784303665161133} -09/20/2021 16:15:31 - INFO - __main__ - Step 8177: {'lr': 0.00013626666666666668, 'samples': 261664, 'steps': 511, 'loss/train': 4.293397426605225} -09/20/2021 16:15:33 - INFO - __main__ - Step 8178: {'lr': 0.00013626666666666668, 'samples': 261696, 'steps': 511, 'loss/train': 4.8852643966674805} -09/20/2021 16:15:33 - INFO - __main__ - Step 8179: {'lr': 0.00013626666666666668, 'samples': 261728, 'steps': 511, 'loss/train': 4.80974817276001} -09/20/2021 16:15:34 - INFO - __main__ - Step 8180: {'lr': 0.00013626666666666668, 'samples': 261760, 'steps': 511, 'loss/train': 4.698880672454834} -09/20/2021 16:15:35 - INFO - __main__ - Step 8181: {'lr': 0.00013626666666666668, 'samples': 261792, 'steps': 511, 'loss/train': 6.136437892913818} -09/20/2021 16:15:36 - INFO - __main__ - Step 8182: {'lr': 0.00013626666666666668, 'samples': 261824, 'steps': 511, 'loss/train': 4.688915252685547} -09/20/2021 16:15:36 - INFO - __main__ - Step 8183: {'lr': 0.00013626666666666668, 'samples': 261856, 'steps': 511, 'loss/train': 4.955677509307861} -09/20/2021 16:15:37 - INFO - __main__ - Step 8184: {'lr': 0.00013626666666666668, 'samples': 261888, 'steps': 511, 'loss/train': 4.227379322052002} -09/20/2021 16:15:38 - INFO - __main__ - Step 8185: {'lr': 0.00013626666666666668, 'samples': 261920, 'steps': 511, 'loss/train': 4.158198356628418} -09/20/2021 16:15:39 - INFO - __main__ - Step 8186: {'lr': 0.00013626666666666668, 'samples': 261952, 'steps': 511, 'loss/train': 4.90410041809082} -09/20/2021 16:15:39 - INFO - __main__ - Step 8187: {'lr': 0.00013626666666666668, 'samples': 261984, 'steps': 511, 'loss/train': 4.581525802612305} -09/20/2021 16:15:40 - INFO - __main__ - Step 8188: {'lr': 0.00013626666666666668, 'samples': 262016, 'steps': 511, 'loss/train': 4.040858268737793} -09/20/2021 16:15:41 - INFO - __main__ - Step 8189: {'lr': 0.00013626666666666668, 'samples': 262048, 'steps': 511, 'loss/train': 4.022397994995117} -09/20/2021 16:15:42 - INFO - __main__ - Step 8190: {'lr': 0.00013626666666666668, 'samples': 262080, 'steps': 511, 'loss/train': 4.295567035675049} -09/20/2021 16:15:42 - INFO - __main__ - Step 8191: {'lr': 0.00013626666666666668, 'samples': 262112, 'steps': 511, 'loss/train': 5.0347795486450195} -09/20/2021 16:15:43 - INFO - __main__ - Step 8192: {'lr': 0.00013626666666666668, 'samples': 262144, 'steps': 511, 'loss/train': 5.310291767120361} -09/20/2021 16:15:44 - INFO - __main__ - Step 8193: {'lr': 0.00013653333333333334, 'samples': 262176, 'steps': 512, 'loss/train': 4.8740129470825195} -09/20/2021 16:15:45 - INFO - __main__ - Step 8194: {'lr': 0.00013653333333333334, 'samples': 262208, 'steps': 512, 'loss/train': 4.727631092071533} -09/20/2021 16:15:45 - INFO - __main__ - Step 8195: {'lr': 0.00013653333333333334, 'samples': 262240, 'steps': 512, 'loss/train': 4.933140277862549} -09/20/2021 16:15:46 - INFO - __main__ - Step 8196: {'lr': 0.00013653333333333334, 'samples': 262272, 'steps': 512, 'loss/train': 4.245588302612305} -09/20/2021 16:15:47 - INFO - __main__ - Step 8197: {'lr': 0.00013653333333333334, 'samples': 262304, 'steps': 512, 'loss/train': 5.288358211517334} -09/20/2021 16:15:48 - INFO - __main__ - Step 8198: {'lr': 0.00013653333333333334, 'samples': 262336, 'steps': 512, 'loss/train': 3.498425245285034} -09/20/2021 16:15:48 - INFO - __main__ - Step 8199: {'lr': 0.00013653333333333334, 'samples': 262368, 'steps': 512, 'loss/train': 4.413025856018066} -09/20/2021 16:15:49 - INFO - __main__ - Step 8200: {'lr': 0.00013653333333333334, 'samples': 262400, 'steps': 512, 'loss/train': 4.6172661781311035} -09/20/2021 16:15:50 - INFO - __main__ - Step 8201: {'lr': 0.00013653333333333334, 'samples': 262432, 'steps': 512, 'loss/train': 5.183291912078857} -09/20/2021 16:15:51 - INFO - __main__ - Step 8202: {'lr': 0.00013653333333333334, 'samples': 262464, 'steps': 512, 'loss/train': 5.258609294891357} -09/20/2021 16:15:51 - INFO - __main__ - Step 8203: {'lr': 0.00013653333333333334, 'samples': 262496, 'steps': 512, 'loss/train': 4.68743896484375} -09/20/2021 16:15:52 - INFO - __main__ - Step 8204: {'lr': 0.00013653333333333334, 'samples': 262528, 'steps': 512, 'loss/train': 4.589786529541016} -09/20/2021 16:15:53 - INFO - __main__ - Step 8205: {'lr': 0.00013653333333333334, 'samples': 262560, 'steps': 512, 'loss/train': 5.253440856933594} -09/20/2021 16:15:54 - INFO - __main__ - Step 8206: {'lr': 0.00013653333333333334, 'samples': 262592, 'steps': 512, 'loss/train': 4.751091957092285} -09/20/2021 16:15:54 - INFO - __main__ - Step 8207: {'lr': 0.00013653333333333334, 'samples': 262624, 'steps': 512, 'loss/train': 4.478692054748535} -09/20/2021 16:15:55 - INFO - __main__ - Step 8208: {'lr': 0.00013653333333333334, 'samples': 262656, 'steps': 512, 'loss/train': 5.335365295410156} -09/20/2021 16:15:57 - INFO - __main__ - Step 8209: {'lr': 0.00013680000000000002, 'samples': 262688, 'steps': 513, 'loss/train': 4.487216472625732} -09/20/2021 16:15:57 - INFO - __main__ - Step 8210: {'lr': 0.00013680000000000002, 'samples': 262720, 'steps': 513, 'loss/train': 7.940284252166748} -09/20/2021 16:15:58 - INFO - __main__ - Step 8211: {'lr': 0.00013680000000000002, 'samples': 262752, 'steps': 513, 'loss/train': 5.423533916473389} -09/20/2021 16:15:59 - INFO - __main__ - Step 8212: {'lr': 0.00013680000000000002, 'samples': 262784, 'steps': 513, 'loss/train': 5.913768768310547} -09/20/2021 16:16:00 - INFO - __main__ - Step 8213: {'lr': 0.00013680000000000002, 'samples': 262816, 'steps': 513, 'loss/train': 5.1036834716796875} -09/20/2021 16:16:00 - INFO - __main__ - Step 8214: {'lr': 0.00013680000000000002, 'samples': 262848, 'steps': 513, 'loss/train': 4.485924243927002} -09/20/2021 16:16:01 - INFO - __main__ - Step 8215: {'lr': 0.00013680000000000002, 'samples': 262880, 'steps': 513, 'loss/train': 4.718984127044678} -09/20/2021 16:16:02 - INFO - __main__ - Step 8216: {'lr': 0.00013680000000000002, 'samples': 262912, 'steps': 513, 'loss/train': 4.489046096801758} -09/20/2021 16:16:03 - INFO - __main__ - Step 8217: {'lr': 0.00013680000000000002, 'samples': 262944, 'steps': 513, 'loss/train': 4.915503978729248} -09/20/2021 16:16:03 - INFO - __main__ - Step 8218: {'lr': 0.00013680000000000002, 'samples': 262976, 'steps': 513, 'loss/train': 4.74362325668335} -09/20/2021 16:16:04 - INFO - __main__ - Step 8219: {'lr': 0.00013680000000000002, 'samples': 263008, 'steps': 513, 'loss/train': 5.297684192657471} -09/20/2021 16:16:05 - INFO - __main__ - Step 8220: {'lr': 0.00013680000000000002, 'samples': 263040, 'steps': 513, 'loss/train': 6.06379508972168} -09/20/2021 16:16:06 - INFO - __main__ - Step 8221: {'lr': 0.00013680000000000002, 'samples': 263072, 'steps': 513, 'loss/train': 4.4706501960754395} -09/20/2021 16:16:06 - INFO - __main__ - Step 8222: {'lr': 0.00013680000000000002, 'samples': 263104, 'steps': 513, 'loss/train': 5.603203773498535} -09/20/2021 16:16:07 - INFO - __main__ - Step 8223: {'lr': 0.00013680000000000002, 'samples': 263136, 'steps': 513, 'loss/train': 4.691197872161865} -09/20/2021 16:16:08 - INFO - __main__ - Step 8224: {'lr': 0.00013680000000000002, 'samples': 263168, 'steps': 513, 'loss/train': 5.3788228034973145} -09/20/2021 16:16:09 - INFO - __main__ - Step 8225: {'lr': 0.00013706666666666667, 'samples': 263200, 'steps': 514, 'loss/train': 6.353540897369385} -09/20/2021 16:16:10 - INFO - __main__ - Step 8226: {'lr': 0.00013706666666666667, 'samples': 263232, 'steps': 514, 'loss/train': 5.064422607421875} -09/20/2021 16:16:10 - INFO - __main__ - Step 8227: {'lr': 0.00013706666666666667, 'samples': 263264, 'steps': 514, 'loss/train': 5.0379719734191895} -09/20/2021 16:16:11 - INFO - __main__ - Step 8228: {'lr': 0.00013706666666666667, 'samples': 263296, 'steps': 514, 'loss/train': 4.327494144439697} -09/20/2021 16:16:12 - INFO - __main__ - Step 8229: {'lr': 0.00013706666666666667, 'samples': 263328, 'steps': 514, 'loss/train': 4.709433078765869} -09/20/2021 16:16:13 - INFO - __main__ - Step 8230: {'lr': 0.00013706666666666667, 'samples': 263360, 'steps': 514, 'loss/train': 4.952918529510498} -09/20/2021 16:16:13 - INFO - __main__ - Step 8231: {'lr': 0.00013706666666666667, 'samples': 263392, 'steps': 514, 'loss/train': 4.307535171508789} -09/20/2021 16:16:14 - INFO - __main__ - Step 8232: {'lr': 0.00013706666666666667, 'samples': 263424, 'steps': 514, 'loss/train': 5.1117682456970215} -09/20/2021 16:16:15 - INFO - __main__ - Step 8233: {'lr': 0.00013706666666666667, 'samples': 263456, 'steps': 514, 'loss/train': 5.010421276092529} -09/20/2021 16:16:16 - INFO - __main__ - Step 8234: {'lr': 0.00013706666666666667, 'samples': 263488, 'steps': 514, 'loss/train': 5.52178430557251} -09/20/2021 16:16:16 - INFO - __main__ - Step 8235: {'lr': 0.00013706666666666667, 'samples': 263520, 'steps': 514, 'loss/train': 3.9577882289886475} -09/20/2021 16:16:17 - INFO - __main__ - Step 8236: {'lr': 0.00013706666666666667, 'samples': 263552, 'steps': 514, 'loss/train': 3.125263214111328} -09/20/2021 16:16:18 - INFO - __main__ - Step 8237: {'lr': 0.00013706666666666667, 'samples': 263584, 'steps': 514, 'loss/train': 2.706613302230835} -09/20/2021 16:16:19 - INFO - __main__ - Step 8238: {'lr': 0.00013706666666666667, 'samples': 263616, 'steps': 514, 'loss/train': 5.134960174560547} -09/20/2021 16:16:19 - INFO - __main__ - Step 8239: {'lr': 0.00013706666666666667, 'samples': 263648, 'steps': 514, 'loss/train': 4.883108615875244} -09/20/2021 16:16:21 - INFO - __main__ - Step 8240: {'lr': 0.00013706666666666667, 'samples': 263680, 'steps': 514, 'loss/train': 4.6785149574279785} -09/20/2021 16:16:22 - INFO - __main__ - Step 8241: {'lr': 0.00013733333333333333, 'samples': 263712, 'steps': 515, 'loss/train': 5.253059387207031} -09/20/2021 16:16:22 - INFO - __main__ - Step 8242: {'lr': 0.00013733333333333333, 'samples': 263744, 'steps': 515, 'loss/train': 5.3505730628967285} -09/20/2021 16:16:23 - INFO - __main__ - Step 8243: {'lr': 0.00013733333333333333, 'samples': 263776, 'steps': 515, 'loss/train': 4.234610557556152} -09/20/2021 16:16:24 - INFO - __main__ - Step 8244: {'lr': 0.00013733333333333333, 'samples': 263808, 'steps': 515, 'loss/train': 5.0356268882751465} -09/20/2021 16:16:25 - INFO - __main__ - Step 8245: {'lr': 0.00013733333333333333, 'samples': 263840, 'steps': 515, 'loss/train': 4.406744003295898} -09/20/2021 16:16:25 - INFO - __main__ - Step 8246: {'lr': 0.00013733333333333333, 'samples': 263872, 'steps': 515, 'loss/train': 4.702445983886719} -09/20/2021 16:16:26 - INFO - __main__ - Step 8247: {'lr': 0.00013733333333333333, 'samples': 263904, 'steps': 515, 'loss/train': 5.257935523986816} -09/20/2021 16:16:27 - INFO - __main__ - Step 8248: {'lr': 0.00013733333333333333, 'samples': 263936, 'steps': 515, 'loss/train': 5.411293983459473} -09/20/2021 16:16:28 - INFO - __main__ - Step 8249: {'lr': 0.00013733333333333333, 'samples': 263968, 'steps': 515, 'loss/train': 5.0842461585998535} -09/20/2021 16:16:28 - INFO - __main__ - Step 8250: {'lr': 0.00013733333333333333, 'samples': 264000, 'steps': 515, 'loss/train': 5.0411376953125} -09/20/2021 16:16:29 - INFO - __main__ - Step 8251: {'lr': 0.00013733333333333333, 'samples': 264032, 'steps': 515, 'loss/train': 4.18096923828125} -09/20/2021 16:16:30 - INFO - __main__ - Step 8252: {'lr': 0.00013733333333333333, 'samples': 264064, 'steps': 515, 'loss/train': 4.02484655380249} -09/20/2021 16:16:31 - INFO - __main__ - Step 8253: {'lr': 0.00013733333333333333, 'samples': 264096, 'steps': 515, 'loss/train': 4.4967193603515625} -09/20/2021 16:16:31 - INFO - __main__ - Step 8254: {'lr': 0.00013733333333333333, 'samples': 264128, 'steps': 515, 'loss/train': 4.736390113830566} -09/20/2021 16:16:32 - INFO - __main__ - Step 8255: {'lr': 0.00013733333333333333, 'samples': 264160, 'steps': 515, 'loss/train': 4.536403656005859} -09/20/2021 16:16:33 - INFO - __main__ - Step 8256: {'lr': 0.00013733333333333333, 'samples': 264192, 'steps': 515, 'loss/train': 4.825379371643066} -09/20/2021 16:16:34 - INFO - __main__ - Step 8257: {'lr': 0.00013759999999999998, 'samples': 264224, 'steps': 516, 'loss/train': 4.984072685241699} -09/20/2021 16:16:34 - INFO - __main__ - Step 8258: {'lr': 0.00013759999999999998, 'samples': 264256, 'steps': 516, 'loss/train': 4.578256130218506} -09/20/2021 16:16:35 - INFO - __main__ - Step 8259: {'lr': 0.00013759999999999998, 'samples': 264288, 'steps': 516, 'loss/train': 4.770174503326416} -09/20/2021 16:16:36 - INFO - __main__ - Step 8260: {'lr': 0.00013759999999999998, 'samples': 264320, 'steps': 516, 'loss/train': 4.056243896484375} -09/20/2021 16:16:37 - INFO - __main__ - Step 8261: {'lr': 0.00013759999999999998, 'samples': 264352, 'steps': 516, 'loss/train': 5.3342814445495605} -09/20/2021 16:16:37 - INFO - __main__ - Step 8262: {'lr': 0.00013759999999999998, 'samples': 264384, 'steps': 516, 'loss/train': 5.113504409790039} -09/20/2021 16:16:38 - INFO - __main__ - Step 8263: {'lr': 0.00013759999999999998, 'samples': 264416, 'steps': 516, 'loss/train': 6.053417205810547} -09/20/2021 16:16:39 - INFO - __main__ - Step 8264: {'lr': 0.00013759999999999998, 'samples': 264448, 'steps': 516, 'loss/train': 4.05882453918457} -09/20/2021 16:16:40 - INFO - __main__ - Step 8265: {'lr': 0.00013759999999999998, 'samples': 264480, 'steps': 516, 'loss/train': 5.1277852058410645} -09/20/2021 16:16:40 - INFO - __main__ - Step 8266: {'lr': 0.00013759999999999998, 'samples': 264512, 'steps': 516, 'loss/train': 4.912364959716797} -09/20/2021 16:16:41 - INFO - __main__ - Step 8267: {'lr': 0.00013759999999999998, 'samples': 264544, 'steps': 516, 'loss/train': 4.343206405639648} -09/20/2021 16:16:42 - INFO - __main__ - Step 8268: {'lr': 0.00013759999999999998, 'samples': 264576, 'steps': 516, 'loss/train': 6.089818954467773} -09/20/2021 16:16:43 - INFO - __main__ - Step 8269: {'lr': 0.00013759999999999998, 'samples': 264608, 'steps': 516, 'loss/train': 5.615055561065674} -09/20/2021 16:16:43 - INFO - __main__ - Step 8270: {'lr': 0.00013759999999999998, 'samples': 264640, 'steps': 516, 'loss/train': 4.492799282073975} -09/20/2021 16:16:45 - INFO - __main__ - Step 8271: {'lr': 0.00013759999999999998, 'samples': 264672, 'steps': 516, 'loss/train': 4.057308673858643} -09/20/2021 16:16:45 - INFO - __main__ - Step 8272: {'lr': 0.00013759999999999998, 'samples': 264704, 'steps': 516, 'loss/train': 4.959055423736572} -09/20/2021 16:16:46 - INFO - __main__ - Step 8273: {'lr': 0.00013786666666666667, 'samples': 264736, 'steps': 517, 'loss/train': 4.9857683181762695} -09/20/2021 16:16:47 - INFO - __main__ - Step 8274: {'lr': 0.00013786666666666667, 'samples': 264768, 'steps': 517, 'loss/train': 4.609445095062256} -09/20/2021 16:16:48 - INFO - __main__ - Step 8275: {'lr': 0.00013786666666666667, 'samples': 264800, 'steps': 517, 'loss/train': 5.897220134735107} -09/20/2021 16:16:49 - INFO - __main__ - Step 8276: {'lr': 0.00013786666666666667, 'samples': 264832, 'steps': 517, 'loss/train': 5.925364017486572} -09/20/2021 16:16:49 - INFO - __main__ - Step 8277: {'lr': 0.00013786666666666667, 'samples': 264864, 'steps': 517, 'loss/train': 6.018309593200684} -09/20/2021 16:16:50 - INFO - __main__ - Step 8278: {'lr': 0.00013786666666666667, 'samples': 264896, 'steps': 517, 'loss/train': 5.123812675476074} -09/20/2021 16:16:51 - INFO - __main__ - Step 8279: {'lr': 0.00013786666666666667, 'samples': 264928, 'steps': 517, 'loss/train': 5.170071601867676} -09/20/2021 16:16:52 - INFO - __main__ - Step 8280: {'lr': 0.00013786666666666667, 'samples': 264960, 'steps': 517, 'loss/train': 4.681013584136963} -09/20/2021 16:16:52 - INFO - __main__ - Step 8281: {'lr': 0.00013786666666666667, 'samples': 264992, 'steps': 517, 'loss/train': 4.475762844085693} -09/20/2021 16:16:53 - INFO - __main__ - Step 8282: {'lr': 0.00013786666666666667, 'samples': 265024, 'steps': 517, 'loss/train': 4.7479352951049805} -09/20/2021 16:16:54 - INFO - __main__ - Step 8283: {'lr': 0.00013786666666666667, 'samples': 265056, 'steps': 517, 'loss/train': 4.9596476554870605} -09/20/2021 16:16:55 - INFO - __main__ - Step 8284: {'lr': 0.00013786666666666667, 'samples': 265088, 'steps': 517, 'loss/train': 4.589717388153076} -09/20/2021 16:16:55 - INFO - __main__ - Step 8285: {'lr': 0.00013786666666666667, 'samples': 265120, 'steps': 517, 'loss/train': 5.0972137451171875} -09/20/2021 16:16:56 - INFO - __main__ - Step 8286: {'lr': 0.00013786666666666667, 'samples': 265152, 'steps': 517, 'loss/train': 5.20241641998291} -09/20/2021 16:16:57 - INFO - __main__ - Step 8287: {'lr': 0.00013786666666666667, 'samples': 265184, 'steps': 517, 'loss/train': 4.073169708251953} -09/20/2021 16:16:58 - INFO - __main__ - Step 8288: {'lr': 0.00013786666666666667, 'samples': 265216, 'steps': 517, 'loss/train': 4.22564697265625} -09/20/2021 16:16:58 - INFO - __main__ - Step 8289: {'lr': 0.00013813333333333335, 'samples': 265248, 'steps': 518, 'loss/train': 4.219852447509766} -09/20/2021 16:16:59 - INFO - __main__ - Step 8290: {'lr': 0.00013813333333333335, 'samples': 265280, 'steps': 518, 'loss/train': 4.456119537353516} -09/20/2021 16:17:00 - INFO - __main__ - Step 8291: {'lr': 0.00013813333333333335, 'samples': 265312, 'steps': 518, 'loss/train': 4.891211032867432} -09/20/2021 16:17:01 - INFO - __main__ - Step 8292: {'lr': 0.00013813333333333335, 'samples': 265344, 'steps': 518, 'loss/train': 4.014957904815674} -09/20/2021 16:17:01 - INFO - __main__ - Step 8293: {'lr': 0.00013813333333333335, 'samples': 265376, 'steps': 518, 'loss/train': 4.901701927185059} -09/20/2021 16:17:02 - INFO - __main__ - Step 8294: {'lr': 0.00013813333333333335, 'samples': 265408, 'steps': 518, 'loss/train': 4.666901588439941} -09/20/2021 16:17:03 - INFO - __main__ - Step 8295: {'lr': 0.00013813333333333335, 'samples': 265440, 'steps': 518, 'loss/train': 4.966566562652588} -09/20/2021 16:17:04 - INFO - __main__ - Step 8296: {'lr': 0.00013813333333333335, 'samples': 265472, 'steps': 518, 'loss/train': 4.953579425811768} -09/20/2021 16:17:04 - INFO - __main__ - Step 8297: {'lr': 0.00013813333333333335, 'samples': 265504, 'steps': 518, 'loss/train': 4.560795307159424} -09/20/2021 16:17:05 - INFO - __main__ - Step 8298: {'lr': 0.00013813333333333335, 'samples': 265536, 'steps': 518, 'loss/train': 4.448799133300781} -09/20/2021 16:17:06 - INFO - __main__ - Step 8299: {'lr': 0.00013813333333333335, 'samples': 265568, 'steps': 518, 'loss/train': 5.278107643127441} -09/20/2021 16:17:07 - INFO - __main__ - Step 8300: {'lr': 0.00013813333333333335, 'samples': 265600, 'steps': 518, 'loss/train': 4.8210296630859375} -09/20/2021 16:17:08 - INFO - __main__ - Step 8301: {'lr': 0.00013813333333333335, 'samples': 265632, 'steps': 518, 'loss/train': 5.118541717529297} -09/20/2021 16:17:09 - INFO - __main__ - Step 8302: {'lr': 0.00013813333333333335, 'samples': 265664, 'steps': 518, 'loss/train': 4.803258419036865} -09/20/2021 16:17:09 - INFO - __main__ - Step 8303: {'lr': 0.00013813333333333335, 'samples': 265696, 'steps': 518, 'loss/train': 4.983299255371094} -09/20/2021 16:17:10 - INFO - __main__ - Step 8304: {'lr': 0.00013813333333333335, 'samples': 265728, 'steps': 518, 'loss/train': 5.192386150360107} -09/20/2021 16:17:11 - INFO - __main__ - Step 8305: {'lr': 0.0001384, 'samples': 265760, 'steps': 519, 'loss/train': 5.374884605407715} -09/20/2021 16:17:12 - INFO - __main__ - Step 8306: {'lr': 0.0001384, 'samples': 265792, 'steps': 519, 'loss/train': 5.312557697296143} -09/20/2021 16:17:13 - INFO - __main__ - Step 8307: {'lr': 0.0001384, 'samples': 265824, 'steps': 519, 'loss/train': 4.705141067504883} -09/20/2021 16:17:13 - INFO - __main__ - Step 8308: {'lr': 0.0001384, 'samples': 265856, 'steps': 519, 'loss/train': 4.916872501373291} -09/20/2021 16:17:14 - INFO - __main__ - Step 8309: {'lr': 0.0001384, 'samples': 265888, 'steps': 519, 'loss/train': 4.211173057556152} -09/20/2021 16:17:15 - INFO - __main__ - Step 8310: {'lr': 0.0001384, 'samples': 265920, 'steps': 519, 'loss/train': 5.325112342834473} -09/20/2021 16:17:16 - INFO - __main__ - Step 8311: {'lr': 0.0001384, 'samples': 265952, 'steps': 519, 'loss/train': 4.890938758850098} -09/20/2021 16:17:16 - INFO - __main__ - Step 8312: {'lr': 0.0001384, 'samples': 265984, 'steps': 519, 'loss/train': 5.0255913734436035} -09/20/2021 16:17:17 - INFO - __main__ - Step 8313: {'lr': 0.0001384, 'samples': 266016, 'steps': 519, 'loss/train': 4.245161533355713} -09/20/2021 16:17:18 - INFO - __main__ - Step 8314: {'lr': 0.0001384, 'samples': 266048, 'steps': 519, 'loss/train': 4.666331768035889} -09/20/2021 16:17:19 - INFO - __main__ - Step 8315: {'lr': 0.0001384, 'samples': 266080, 'steps': 519, 'loss/train': 4.758396625518799} -09/20/2021 16:17:19 - INFO - __main__ - Step 8316: {'lr': 0.0001384, 'samples': 266112, 'steps': 519, 'loss/train': 5.0908684730529785} -09/20/2021 16:17:20 - INFO - __main__ - Step 8317: {'lr': 0.0001384, 'samples': 266144, 'steps': 519, 'loss/train': 5.073812961578369} -09/20/2021 16:17:21 - INFO - __main__ - Step 8318: {'lr': 0.0001384, 'samples': 266176, 'steps': 519, 'loss/train': 4.5440874099731445} -09/20/2021 16:17:22 - INFO - __main__ - Step 8319: {'lr': 0.0001384, 'samples': 266208, 'steps': 519, 'loss/train': 4.656091213226318} -09/20/2021 16:17:22 - INFO - __main__ - Step 8320: {'lr': 0.0001384, 'samples': 266240, 'steps': 519, 'loss/train': 3.8859703540802} -09/20/2021 16:17:23 - INFO - __main__ - Step 8321: {'lr': 0.00013866666666666669, 'samples': 266272, 'steps': 520, 'loss/train': 5.288235187530518} -09/20/2021 16:17:24 - INFO - __main__ - Step 8322: {'lr': 0.00013866666666666669, 'samples': 266304, 'steps': 520, 'loss/train': 4.290469646453857} -09/20/2021 16:17:25 - INFO - __main__ - Step 8323: {'lr': 0.00013866666666666669, 'samples': 266336, 'steps': 520, 'loss/train': 3.156390428543091} -09/20/2021 16:17:25 - INFO - __main__ - Step 8324: {'lr': 0.00013866666666666669, 'samples': 266368, 'steps': 520, 'loss/train': 2.3457837104797363} -09/20/2021 16:17:26 - INFO - __main__ - Step 8325: {'lr': 0.00013866666666666669, 'samples': 266400, 'steps': 520, 'loss/train': 4.415004730224609} -09/20/2021 16:17:27 - INFO - __main__ - Step 8326: {'lr': 0.00013866666666666669, 'samples': 266432, 'steps': 520, 'loss/train': 4.674689292907715} -09/20/2021 16:17:28 - INFO - __main__ - Step 8327: {'lr': 0.00013866666666666669, 'samples': 266464, 'steps': 520, 'loss/train': 3.900477647781372} -09/20/2021 16:17:28 - INFO - __main__ - Step 8328: {'lr': 0.00013866666666666669, 'samples': 266496, 'steps': 520, 'loss/train': 5.398026466369629} -09/20/2021 16:17:29 - INFO - __main__ - Step 8329: {'lr': 0.00013866666666666669, 'samples': 266528, 'steps': 520, 'loss/train': 5.222321033477783} -09/20/2021 16:17:30 - INFO - __main__ - Step 8330: {'lr': 0.00013866666666666669, 'samples': 266560, 'steps': 520, 'loss/train': 5.05440616607666} -09/20/2021 16:17:31 - INFO - __main__ - Step 8331: {'lr': 0.00013866666666666669, 'samples': 266592, 'steps': 520, 'loss/train': 4.660726070404053} -09/20/2021 16:17:32 - INFO - __main__ - Step 8332: {'lr': 0.00013866666666666669, 'samples': 266624, 'steps': 520, 'loss/train': 4.476259708404541} -09/20/2021 16:17:33 - INFO - __main__ - Step 8333: {'lr': 0.00013866666666666669, 'samples': 266656, 'steps': 520, 'loss/train': 4.688841342926025} -09/20/2021 16:17:34 - INFO - __main__ - Step 8334: {'lr': 0.00013866666666666669, 'samples': 266688, 'steps': 520, 'loss/train': 4.332649230957031} -09/20/2021 16:17:34 - INFO - __main__ - Step 8335: {'lr': 0.00013866666666666669, 'samples': 266720, 'steps': 520, 'loss/train': 6.4903082847595215} -09/20/2021 16:17:35 - INFO - __main__ - Step 8336: {'lr': 0.00013866666666666669, 'samples': 266752, 'steps': 520, 'loss/train': 4.190954685211182} -09/20/2021 16:17:36 - INFO - __main__ - Step 8337: {'lr': 0.00013893333333333334, 'samples': 266784, 'steps': 521, 'loss/train': 4.290049076080322} -09/20/2021 16:17:37 - INFO - __main__ - Step 8338: {'lr': 0.00013893333333333334, 'samples': 266816, 'steps': 521, 'loss/train': 5.967911720275879} -09/20/2021 16:17:37 - INFO - __main__ - Step 8339: {'lr': 0.00013893333333333334, 'samples': 266848, 'steps': 521, 'loss/train': 4.905579090118408} -09/20/2021 16:17:38 - INFO - __main__ - Step 8340: {'lr': 0.00013893333333333334, 'samples': 266880, 'steps': 521, 'loss/train': 5.288913249969482} -09/20/2021 16:17:39 - INFO - __main__ - Step 8341: {'lr': 0.00013893333333333334, 'samples': 266912, 'steps': 521, 'loss/train': 4.607113838195801} -09/20/2021 16:17:40 - INFO - __main__ - Step 8342: {'lr': 0.00013893333333333334, 'samples': 266944, 'steps': 521, 'loss/train': 4.9455246925354} -09/20/2021 16:17:40 - INFO - __main__ - Step 8343: {'lr': 0.00013893333333333334, 'samples': 266976, 'steps': 521, 'loss/train': 6.5701799392700195} -09/20/2021 16:17:41 - INFO - __main__ - Step 8344: {'lr': 0.00013893333333333334, 'samples': 267008, 'steps': 521, 'loss/train': 6.540893077850342} -09/20/2021 16:17:42 - INFO - __main__ - Step 8345: {'lr': 0.00013893333333333334, 'samples': 267040, 'steps': 521, 'loss/train': 5.804166316986084} -09/20/2021 16:17:43 - INFO - __main__ - Step 8346: {'lr': 0.00013893333333333334, 'samples': 267072, 'steps': 521, 'loss/train': 4.887452602386475} -09/20/2021 16:17:43 - INFO - __main__ - Step 8347: {'lr': 0.00013893333333333334, 'samples': 267104, 'steps': 521, 'loss/train': 5.241595268249512} -09/20/2021 16:17:44 - INFO - __main__ - Step 8348: {'lr': 0.00013893333333333334, 'samples': 267136, 'steps': 521, 'loss/train': 2.508281946182251} -09/20/2021 16:17:45 - INFO - __main__ - Step 8349: {'lr': 0.00013893333333333334, 'samples': 267168, 'steps': 521, 'loss/train': 5.18813943862915} -09/20/2021 16:17:46 - INFO - __main__ - Step 8350: {'lr': 0.00013893333333333334, 'samples': 267200, 'steps': 521, 'loss/train': 4.314988136291504} -09/20/2021 16:17:46 - INFO - __main__ - Step 8351: {'lr': 0.00013893333333333334, 'samples': 267232, 'steps': 521, 'loss/train': 5.664224147796631} -09/20/2021 16:17:47 - INFO - __main__ - Step 8352: {'lr': 0.00013893333333333334, 'samples': 267264, 'steps': 521, 'loss/train': 5.391720294952393} -09/20/2021 16:17:48 - INFO - __main__ - Step 8353: {'lr': 0.0001392, 'samples': 267296, 'steps': 522, 'loss/train': 4.890407085418701} -09/20/2021 16:17:49 - INFO - __main__ - Step 8354: {'lr': 0.0001392, 'samples': 267328, 'steps': 522, 'loss/train': 5.3025336265563965} -09/20/2021 16:17:50 - INFO - __main__ - Step 8355: {'lr': 0.0001392, 'samples': 267360, 'steps': 522, 'loss/train': 4.262956619262695} -09/20/2021 16:17:50 - INFO - __main__ - Step 8356: {'lr': 0.0001392, 'samples': 267392, 'steps': 522, 'loss/train': 4.635143280029297} -09/20/2021 16:17:51 - INFO - __main__ - Step 8357: {'lr': 0.0001392, 'samples': 267424, 'steps': 522, 'loss/train': 4.652395725250244} -09/20/2021 16:17:52 - INFO - __main__ - Step 8358: {'lr': 0.0001392, 'samples': 267456, 'steps': 522, 'loss/train': 4.470128536224365} -09/20/2021 16:17:53 - INFO - __main__ - Step 8359: {'lr': 0.0001392, 'samples': 267488, 'steps': 522, 'loss/train': 4.545723915100098} -09/20/2021 16:17:53 - INFO - __main__ - Step 8360: {'lr': 0.0001392, 'samples': 267520, 'steps': 522, 'loss/train': 4.111733436584473} -09/20/2021 16:17:54 - INFO - __main__ - Step 8361: {'lr': 0.0001392, 'samples': 267552, 'steps': 522, 'loss/train': 4.381044387817383} -09/20/2021 16:17:55 - INFO - __main__ - Step 8362: {'lr': 0.0001392, 'samples': 267584, 'steps': 522, 'loss/train': 4.981093406677246} -09/20/2021 16:17:56 - INFO - __main__ - Step 8363: {'lr': 0.0001392, 'samples': 267616, 'steps': 522, 'loss/train': 4.54620885848999} -09/20/2021 16:17:57 - INFO - __main__ - Step 8364: {'lr': 0.0001392, 'samples': 267648, 'steps': 522, 'loss/train': 3.7017204761505127} -09/20/2021 16:17:58 - INFO - __main__ - Step 8365: {'lr': 0.0001392, 'samples': 267680, 'steps': 522, 'loss/train': 4.979038238525391} -09/20/2021 16:17:58 - INFO - __main__ - Step 8366: {'lr': 0.0001392, 'samples': 267712, 'steps': 522, 'loss/train': 6.225692272186279} -09/20/2021 16:17:59 - INFO - __main__ - Step 8367: {'lr': 0.0001392, 'samples': 267744, 'steps': 522, 'loss/train': 5.034327507019043} -09/20/2021 16:18:00 - INFO - __main__ - Step 8368: {'lr': 0.0001392, 'samples': 267776, 'steps': 522, 'loss/train': 4.709845066070557} -09/20/2021 16:18:01 - INFO - __main__ - Step 8369: {'lr': 0.00013946666666666668, 'samples': 267808, 'steps': 523, 'loss/train': 3.82847261428833} -09/20/2021 16:18:02 - INFO - __main__ - Step 8370: {'lr': 0.00013946666666666668, 'samples': 267840, 'steps': 523, 'loss/train': 4.212127685546875} -09/20/2021 16:18:02 - INFO - __main__ - Step 8371: {'lr': 0.00013946666666666668, 'samples': 267872, 'steps': 523, 'loss/train': 4.7287702560424805} -09/20/2021 16:18:03 - INFO - __main__ - Step 8372: {'lr': 0.00013946666666666668, 'samples': 267904, 'steps': 523, 'loss/train': 5.122190475463867} -09/20/2021 16:18:04 - INFO - __main__ - Step 8373: {'lr': 0.00013946666666666668, 'samples': 267936, 'steps': 523, 'loss/train': 4.421243190765381} -09/20/2021 16:18:05 - INFO - __main__ - Step 8374: {'lr': 0.00013946666666666668, 'samples': 267968, 'steps': 523, 'loss/train': 4.613197326660156} -09/20/2021 16:18:05 - INFO - __main__ - Step 8375: {'lr': 0.00013946666666666668, 'samples': 268000, 'steps': 523, 'loss/train': 4.85960054397583} -09/20/2021 16:18:06 - INFO - __main__ - Step 8376: {'lr': 0.00013946666666666668, 'samples': 268032, 'steps': 523, 'loss/train': 5.121060371398926} -09/20/2021 16:18:07 - INFO - __main__ - Step 8377: {'lr': 0.00013946666666666668, 'samples': 268064, 'steps': 523, 'loss/train': 5.128673076629639} -09/20/2021 16:18:08 - INFO - __main__ - Step 8378: {'lr': 0.00013946666666666668, 'samples': 268096, 'steps': 523, 'loss/train': 3.6870009899139404} -09/20/2021 16:18:08 - INFO - __main__ - Step 8379: {'lr': 0.00013946666666666668, 'samples': 268128, 'steps': 523, 'loss/train': 4.2932024002075195} -09/20/2021 16:18:09 - INFO - __main__ - Step 8380: {'lr': 0.00013946666666666668, 'samples': 268160, 'steps': 523, 'loss/train': 4.9027018547058105} -09/20/2021 16:18:10 - INFO - __main__ - Step 8381: {'lr': 0.00013946666666666668, 'samples': 268192, 'steps': 523, 'loss/train': 5.529719352722168} -09/20/2021 16:18:11 - INFO - __main__ - Step 8382: {'lr': 0.00013946666666666668, 'samples': 268224, 'steps': 523, 'loss/train': 6.040085315704346} -09/20/2021 16:18:11 - INFO - __main__ - Step 8383: {'lr': 0.00013946666666666668, 'samples': 268256, 'steps': 523, 'loss/train': 4.558676719665527} -09/20/2021 16:18:12 - INFO - __main__ - Step 8384: {'lr': 0.00013946666666666668, 'samples': 268288, 'steps': 523, 'loss/train': 4.3400983810424805} -09/20/2021 16:18:13 - INFO - __main__ - Step 8385: {'lr': 0.00013973333333333333, 'samples': 268320, 'steps': 524, 'loss/train': 4.51430606842041} -09/20/2021 16:18:14 - INFO - __main__ - Step 8386: {'lr': 0.00013973333333333333, 'samples': 268352, 'steps': 524, 'loss/train': 5.712860107421875} -09/20/2021 16:18:14 - INFO - __main__ - Step 8387: {'lr': 0.00013973333333333333, 'samples': 268384, 'steps': 524, 'loss/train': 4.628058433532715} -09/20/2021 16:18:15 - INFO - __main__ - Step 8388: {'lr': 0.00013973333333333333, 'samples': 268416, 'steps': 524, 'loss/train': 4.236032962799072} -09/20/2021 16:18:16 - INFO - __main__ - Step 8389: {'lr': 0.00013973333333333333, 'samples': 268448, 'steps': 524, 'loss/train': 5.042016983032227} -09/20/2021 16:18:17 - INFO - __main__ - Step 8390: {'lr': 0.00013973333333333333, 'samples': 268480, 'steps': 524, 'loss/train': 5.376533508300781} -09/20/2021 16:18:17 - INFO - __main__ - Step 8391: {'lr': 0.00013973333333333333, 'samples': 268512, 'steps': 524, 'loss/train': 4.40023946762085} -09/20/2021 16:18:18 - INFO - __main__ - Step 8392: {'lr': 0.00013973333333333333, 'samples': 268544, 'steps': 524, 'loss/train': 4.913669109344482} -09/20/2021 16:18:19 - INFO - __main__ - Step 8393: {'lr': 0.00013973333333333333, 'samples': 268576, 'steps': 524, 'loss/train': 3.212616443634033} -09/20/2021 16:18:20 - INFO - __main__ - Step 8394: {'lr': 0.00013973333333333333, 'samples': 268608, 'steps': 524, 'loss/train': 4.840591907501221} -09/20/2021 16:18:21 - INFO - __main__ - Step 8395: {'lr': 0.00013973333333333333, 'samples': 268640, 'steps': 524, 'loss/train': 4.602542877197266} -09/20/2021 16:18:22 - INFO - __main__ - Step 8396: {'lr': 0.00013973333333333333, 'samples': 268672, 'steps': 524, 'loss/train': 5.404891014099121} -09/20/2021 16:18:23 - INFO - __main__ - Step 8397: {'lr': 0.00013973333333333333, 'samples': 268704, 'steps': 524, 'loss/train': 5.168572425842285} -09/20/2021 16:18:23 - INFO - __main__ - Step 8398: {'lr': 0.00013973333333333333, 'samples': 268736, 'steps': 524, 'loss/train': 4.979480743408203} -09/20/2021 16:18:24 - INFO - __main__ - Step 8399: {'lr': 0.00013973333333333333, 'samples': 268768, 'steps': 524, 'loss/train': 4.517699241638184} -09/20/2021 16:18:25 - INFO - __main__ - Step 8400: {'lr': 0.00013973333333333333, 'samples': 268800, 'steps': 524, 'loss/train': 7.312889575958252} -09/20/2021 16:18:26 - INFO - __main__ - Step 8401: {'lr': 0.00014, 'samples': 268832, 'steps': 525, 'loss/train': 6.211106777191162} -09/20/2021 16:18:26 - INFO - __main__ - Step 8402: {'lr': 0.00014, 'samples': 268864, 'steps': 525, 'loss/train': 6.558599472045898} -09/20/2021 16:18:27 - INFO - __main__ - Step 8403: {'lr': 0.00014, 'samples': 268896, 'steps': 525, 'loss/train': 4.476475715637207} -09/20/2021 16:18:28 - INFO - __main__ - Step 8404: {'lr': 0.00014, 'samples': 268928, 'steps': 525, 'loss/train': 4.617824077606201} -09/20/2021 16:18:29 - INFO - __main__ - Step 8405: {'lr': 0.00014, 'samples': 268960, 'steps': 525, 'loss/train': 4.687784194946289} -09/20/2021 16:18:29 - INFO - __main__ - Step 8406: {'lr': 0.00014, 'samples': 268992, 'steps': 525, 'loss/train': 5.002508640289307} -09/20/2021 16:18:30 - INFO - __main__ - Step 8407: {'lr': 0.00014, 'samples': 269024, 'steps': 525, 'loss/train': 4.727361679077148} -09/20/2021 16:18:31 - INFO - __main__ - Step 8408: {'lr': 0.00014, 'samples': 269056, 'steps': 525, 'loss/train': 5.521719932556152} -09/20/2021 16:18:32 - INFO - __main__ - Step 8409: {'lr': 0.00014, 'samples': 269088, 'steps': 525, 'loss/train': 4.274972915649414} -09/20/2021 16:18:32 - INFO - __main__ - Step 8410: {'lr': 0.00014, 'samples': 269120, 'steps': 525, 'loss/train': 4.561725616455078} -09/20/2021 16:18:33 - INFO - __main__ - Step 8411: {'lr': 0.00014, 'samples': 269152, 'steps': 525, 'loss/train': 4.2398552894592285} -09/20/2021 16:18:34 - INFO - __main__ - Step 8412: {'lr': 0.00014, 'samples': 269184, 'steps': 525, 'loss/train': 4.870556354522705} -09/20/2021 16:18:35 - INFO - __main__ - Step 8413: {'lr': 0.00014, 'samples': 269216, 'steps': 525, 'loss/train': 4.897374153137207} -09/20/2021 16:18:35 - INFO - __main__ - Step 8414: {'lr': 0.00014, 'samples': 269248, 'steps': 525, 'loss/train': 5.216139316558838} -09/20/2021 16:18:36 - INFO - __main__ - Step 8415: {'lr': 0.00014, 'samples': 269280, 'steps': 525, 'loss/train': 4.588832855224609} -09/20/2021 16:18:37 - INFO - __main__ - Step 8416: {'lr': 0.00014, 'samples': 269312, 'steps': 525, 'loss/train': 5.2097601890563965} -09/20/2021 16:18:38 - INFO - __main__ - Step 8417: {'lr': 0.00014026666666666667, 'samples': 269344, 'steps': 526, 'loss/train': 4.810086727142334} -09/20/2021 16:18:39 - INFO - __main__ - Step 8418: {'lr': 0.00014026666666666667, 'samples': 269376, 'steps': 526, 'loss/train': 4.887829303741455} -09/20/2021 16:18:39 - INFO - __main__ - Step 8419: {'lr': 0.00014026666666666667, 'samples': 269408, 'steps': 526, 'loss/train': 5.328725337982178} -09/20/2021 16:18:40 - INFO - __main__ - Step 8420: {'lr': 0.00014026666666666667, 'samples': 269440, 'steps': 526, 'loss/train': 4.29345178604126} -09/20/2021 16:18:41 - INFO - __main__ - Step 8421: {'lr': 0.00014026666666666667, 'samples': 269472, 'steps': 526, 'loss/train': 4.458139419555664} -09/20/2021 16:18:42 - INFO - __main__ - Step 8422: {'lr': 0.00014026666666666667, 'samples': 269504, 'steps': 526, 'loss/train': 4.395535469055176} -09/20/2021 16:18:42 - INFO - __main__ - Step 8423: {'lr': 0.00014026666666666667, 'samples': 269536, 'steps': 526, 'loss/train': 4.4688496589660645} -09/20/2021 16:18:43 - INFO - __main__ - Step 8424: {'lr': 0.00014026666666666667, 'samples': 269568, 'steps': 526, 'loss/train': 2.218346118927002} -09/20/2021 16:18:44 - INFO - __main__ - Step 8425: {'lr': 0.00014026666666666667, 'samples': 269600, 'steps': 526, 'loss/train': 4.615657329559326} -09/20/2021 16:18:45 - INFO - __main__ - Step 8426: {'lr': 0.00014026666666666667, 'samples': 269632, 'steps': 526, 'loss/train': 4.1495137214660645} -09/20/2021 16:18:46 - INFO - __main__ - Step 8427: {'lr': 0.00014026666666666667, 'samples': 269664, 'steps': 526, 'loss/train': 4.761529445648193} -09/20/2021 16:18:47 - INFO - __main__ - Step 8428: {'lr': 0.00014026666666666667, 'samples': 269696, 'steps': 526, 'loss/train': 4.834897041320801} -09/20/2021 16:18:48 - INFO - __main__ - Step 8429: {'lr': 0.00014026666666666667, 'samples': 269728, 'steps': 526, 'loss/train': 4.4865288734436035} -09/20/2021 16:18:48 - INFO - __main__ - Step 8430: {'lr': 0.00014026666666666667, 'samples': 269760, 'steps': 526, 'loss/train': 4.741208553314209} -09/20/2021 16:18:49 - INFO - __main__ - Step 8431: {'lr': 0.00014026666666666667, 'samples': 269792, 'steps': 526, 'loss/train': 4.981827735900879} -09/20/2021 16:18:50 - INFO - __main__ - Step 8432: {'lr': 0.00014026666666666667, 'samples': 269824, 'steps': 526, 'loss/train': 4.242702007293701} -09/20/2021 16:18:51 - INFO - __main__ - Step 8433: {'lr': 0.00014053333333333335, 'samples': 269856, 'steps': 527, 'loss/train': 4.431872367858887} -09/20/2021 16:18:51 - INFO - __main__ - Step 8434: {'lr': 0.00014053333333333335, 'samples': 269888, 'steps': 527, 'loss/train': 5.225579738616943} -09/20/2021 16:18:52 - INFO - __main__ - Step 8435: {'lr': 0.00014053333333333335, 'samples': 269920, 'steps': 527, 'loss/train': 4.319027900695801} -09/20/2021 16:18:53 - INFO - __main__ - Step 8436: {'lr': 0.00014053333333333335, 'samples': 269952, 'steps': 527, 'loss/train': 5.360867023468018} -09/20/2021 16:18:54 - INFO - __main__ - Step 8437: {'lr': 0.00014053333333333335, 'samples': 269984, 'steps': 527, 'loss/train': 6.6829352378845215} -09/20/2021 16:18:54 - INFO - __main__ - Step 8438: {'lr': 0.00014053333333333335, 'samples': 270016, 'steps': 527, 'loss/train': 5.067068099975586} -09/20/2021 16:18:55 - INFO - __main__ - Step 8439: {'lr': 0.00014053333333333335, 'samples': 270048, 'steps': 527, 'loss/train': 5.112198829650879} -09/20/2021 16:18:56 - INFO - __main__ - Step 8440: {'lr': 0.00014053333333333335, 'samples': 270080, 'steps': 527, 'loss/train': 5.003281116485596} -09/20/2021 16:18:57 - INFO - __main__ - Step 8441: {'lr': 0.00014053333333333335, 'samples': 270112, 'steps': 527, 'loss/train': 4.780325412750244} -09/20/2021 16:18:57 - INFO - __main__ - Step 8442: {'lr': 0.00014053333333333335, 'samples': 270144, 'steps': 527, 'loss/train': 4.410913467407227} -09/20/2021 16:18:58 - INFO - __main__ - Step 8443: {'lr': 0.00014053333333333335, 'samples': 270176, 'steps': 527, 'loss/train': 4.662774562835693} -09/20/2021 16:18:59 - INFO - __main__ - Step 8444: {'lr': 0.00014053333333333335, 'samples': 270208, 'steps': 527, 'loss/train': 2.6446776390075684} -09/20/2021 16:19:00 - INFO - __main__ - Step 8445: {'lr': 0.00014053333333333335, 'samples': 270240, 'steps': 527, 'loss/train': 3.001793622970581} -09/20/2021 16:19:00 - INFO - __main__ - Step 8446: {'lr': 0.00014053333333333335, 'samples': 270272, 'steps': 527, 'loss/train': 2.3528270721435547} -09/20/2021 16:19:01 - INFO - __main__ - Step 8447: {'lr': 0.00014053333333333335, 'samples': 270304, 'steps': 527, 'loss/train': 1.7221425771713257} -09/20/2021 16:19:02 - INFO - __main__ - Step 8448: {'lr': 0.00014053333333333335, 'samples': 270336, 'steps': 527, 'loss/train': 2.691870927810669} -09/20/2021 16:19:03 - INFO - __main__ - Step 8449: {'lr': 0.0001408, 'samples': 270368, 'steps': 528, 'loss/train': 5.1194539070129395} -09/20/2021 16:19:04 - INFO - __main__ - Step 8450: {'lr': 0.0001408, 'samples': 270400, 'steps': 528, 'loss/train': 5.151662349700928} -09/20/2021 16:19:04 - INFO - __main__ - Step 8451: {'lr': 0.0001408, 'samples': 270432, 'steps': 528, 'loss/train': 4.285445690155029} -09/20/2021 16:19:05 - INFO - __main__ - Step 8452: {'lr': 0.0001408, 'samples': 270464, 'steps': 528, 'loss/train': 4.695291996002197} -09/20/2021 16:19:06 - INFO - __main__ - Step 8453: {'lr': 0.0001408, 'samples': 270496, 'steps': 528, 'loss/train': 4.549720764160156} -09/20/2021 16:19:07 - INFO - __main__ - Step 8454: {'lr': 0.0001408, 'samples': 270528, 'steps': 528, 'loss/train': 4.826260566711426} -09/20/2021 16:19:07 - INFO - __main__ - Step 8455: {'lr': 0.0001408, 'samples': 270560, 'steps': 528, 'loss/train': 3.580472707748413} -09/20/2021 16:19:08 - INFO - __main__ - Step 8456: {'lr': 0.0001408, 'samples': 270592, 'steps': 528, 'loss/train': 5.061766147613525} -09/20/2021 16:19:09 - INFO - __main__ - Step 8457: {'lr': 0.0001408, 'samples': 270624, 'steps': 528, 'loss/train': 4.534384727478027} -09/20/2021 16:19:10 - INFO - __main__ - Step 8458: {'lr': 0.0001408, 'samples': 270656, 'steps': 528, 'loss/train': 4.6651105880737305} -09/20/2021 16:19:11 - INFO - __main__ - Step 8459: {'lr': 0.0001408, 'samples': 270688, 'steps': 528, 'loss/train': 4.179879188537598} -09/20/2021 16:19:12 - INFO - __main__ - Step 8460: {'lr': 0.0001408, 'samples': 270720, 'steps': 528, 'loss/train': 3.870946168899536} -09/20/2021 16:19:13 - INFO - __main__ - Step 8461: {'lr': 0.0001408, 'samples': 270752, 'steps': 528, 'loss/train': 4.482969284057617} -09/20/2021 16:19:14 - INFO - __main__ - Step 8462: {'lr': 0.0001408, 'samples': 270784, 'steps': 528, 'loss/train': 3.634556293487549} -09/20/2021 16:19:14 - INFO - __main__ - Step 8463: {'lr': 0.0001408, 'samples': 270816, 'steps': 528, 'loss/train': 4.457303524017334} -09/20/2021 16:19:15 - INFO - __main__ - Step 8464: {'lr': 0.0001408, 'samples': 270848, 'steps': 528, 'loss/train': 4.430490493774414} -09/20/2021 16:19:16 - INFO - __main__ - Step 8465: {'lr': 0.0001410666666666667, 'samples': 270880, 'steps': 529, 'loss/train': 4.344137668609619} -09/20/2021 16:19:17 - INFO - __main__ - Step 8466: {'lr': 0.0001410666666666667, 'samples': 270912, 'steps': 529, 'loss/train': 4.634768486022949} -09/20/2021 16:19:17 - INFO - __main__ - Step 8467: {'lr': 0.0001410666666666667, 'samples': 270944, 'steps': 529, 'loss/train': 6.591773986816406} -09/20/2021 16:19:18 - INFO - __main__ - Step 8468: {'lr': 0.0001410666666666667, 'samples': 270976, 'steps': 529, 'loss/train': 6.073085784912109} -09/20/2021 16:19:19 - INFO - __main__ - Step 8469: {'lr': 0.0001410666666666667, 'samples': 271008, 'steps': 529, 'loss/train': 4.5094475746154785} -09/20/2021 16:19:20 - INFO - __main__ - Step 8470: {'lr': 0.0001410666666666667, 'samples': 271040, 'steps': 529, 'loss/train': 4.0693840980529785} -09/20/2021 16:19:20 - INFO - __main__ - Step 8471: {'lr': 0.0001410666666666667, 'samples': 271072, 'steps': 529, 'loss/train': 4.315787315368652} -09/20/2021 16:19:21 - INFO - __main__ - Step 8472: {'lr': 0.0001410666666666667, 'samples': 271104, 'steps': 529, 'loss/train': 4.055881023406982} -09/20/2021 16:19:22 - INFO - __main__ - Step 8473: {'lr': 0.0001410666666666667, 'samples': 271136, 'steps': 529, 'loss/train': 5.20236873626709} -09/20/2021 16:19:23 - INFO - __main__ - Step 8474: {'lr': 0.0001410666666666667, 'samples': 271168, 'steps': 529, 'loss/train': 5.882200717926025} -09/20/2021 16:19:23 - INFO - __main__ - Step 8475: {'lr': 0.0001410666666666667, 'samples': 271200, 'steps': 529, 'loss/train': 4.866821765899658} -09/20/2021 16:19:24 - INFO - __main__ - Step 8476: {'lr': 0.0001410666666666667, 'samples': 271232, 'steps': 529, 'loss/train': 4.8213958740234375} -09/20/2021 16:19:25 - INFO - __main__ - Step 8477: {'lr': 0.0001410666666666667, 'samples': 271264, 'steps': 529, 'loss/train': 4.481968879699707} -09/20/2021 16:19:26 - INFO - __main__ - Step 8478: {'lr': 0.0001410666666666667, 'samples': 271296, 'steps': 529, 'loss/train': 4.896060943603516} -09/20/2021 16:19:26 - INFO - __main__ - Step 8479: {'lr': 0.0001410666666666667, 'samples': 271328, 'steps': 529, 'loss/train': 4.316540241241455} -09/20/2021 16:19:27 - INFO - __main__ - Step 8480: {'lr': 0.0001410666666666667, 'samples': 271360, 'steps': 529, 'loss/train': 5.866024494171143} -09/20/2021 16:19:28 - INFO - __main__ - Step 8481: {'lr': 0.00014133333333333334, 'samples': 271392, 'steps': 530, 'loss/train': 4.475757598876953} -09/20/2021 16:19:29 - INFO - __main__ - Step 8482: {'lr': 0.00014133333333333334, 'samples': 271424, 'steps': 530, 'loss/train': 4.8020429611206055} -09/20/2021 16:19:30 - INFO - __main__ - Step 8483: {'lr': 0.00014133333333333334, 'samples': 271456, 'steps': 530, 'loss/train': 5.957148551940918} -09/20/2021 16:19:30 - INFO - __main__ - Step 8484: {'lr': 0.00014133333333333334, 'samples': 271488, 'steps': 530, 'loss/train': 4.563296794891357} -09/20/2021 16:19:31 - INFO - __main__ - Step 8485: {'lr': 0.00014133333333333334, 'samples': 271520, 'steps': 530, 'loss/train': 4.980384349822998} -09/20/2021 16:19:32 - INFO - __main__ - Step 8486: {'lr': 0.00014133333333333334, 'samples': 271552, 'steps': 530, 'loss/train': 4.45731782913208} -09/20/2021 16:19:33 - INFO - __main__ - Step 8487: {'lr': 0.00014133333333333334, 'samples': 271584, 'steps': 530, 'loss/train': 4.835742473602295} -09/20/2021 16:19:33 - INFO - __main__ - Step 8488: {'lr': 0.00014133333333333334, 'samples': 271616, 'steps': 530, 'loss/train': 5.003682613372803} -09/20/2021 16:19:35 - INFO - __main__ - Step 8489: {'lr': 0.00014133333333333334, 'samples': 271648, 'steps': 530, 'loss/train': 5.779517650604248} -09/20/2021 16:19:35 - INFO - __main__ - Step 8490: {'lr': 0.00014133333333333334, 'samples': 271680, 'steps': 530, 'loss/train': 4.849761962890625} -09/20/2021 16:19:36 - INFO - __main__ - Step 8491: {'lr': 0.00014133333333333334, 'samples': 271712, 'steps': 530, 'loss/train': 4.975593566894531} -09/20/2021 16:19:37 - INFO - __main__ - Step 8492: {'lr': 0.00014133333333333334, 'samples': 271744, 'steps': 530, 'loss/train': 4.844903945922852} -09/20/2021 16:19:38 - INFO - __main__ - Step 8493: {'lr': 0.00014133333333333334, 'samples': 271776, 'steps': 530, 'loss/train': 2.4456827640533447} -09/20/2021 16:19:38 - INFO - __main__ - Step 8494: {'lr': 0.00014133333333333334, 'samples': 271808, 'steps': 530, 'loss/train': 5.389601707458496} -09/20/2021 16:19:39 - INFO - __main__ - Step 8495: {'lr': 0.00014133333333333334, 'samples': 271840, 'steps': 530, 'loss/train': 4.143082618713379} -09/20/2021 16:19:40 - INFO - __main__ - Step 8496: {'lr': 0.00014133333333333334, 'samples': 271872, 'steps': 530, 'loss/train': 4.724514484405518} -09/20/2021 16:19:41 - INFO - __main__ - Step 8497: {'lr': 0.0001416, 'samples': 271904, 'steps': 531, 'loss/train': 4.373640537261963} -09/20/2021 16:19:42 - INFO - __main__ - Step 8498: {'lr': 0.0001416, 'samples': 271936, 'steps': 531, 'loss/train': 2.4951529502868652} -09/20/2021 16:19:42 - INFO - __main__ - Step 8499: {'lr': 0.0001416, 'samples': 271968, 'steps': 531, 'loss/train': 4.4178056716918945} -09/20/2021 16:19:43 - INFO - __main__ - Step 8500: {'lr': 0.0001416, 'samples': 272000, 'steps': 531, 'loss/train': 5.2708306312561035} -09/20/2021 16:19:44 - INFO - __main__ - Step 8501: {'lr': 0.0001416, 'samples': 272032, 'steps': 531, 'loss/train': 4.603973388671875} -09/20/2021 16:19:45 - INFO - __main__ - Step 8502: {'lr': 0.0001416, 'samples': 272064, 'steps': 531, 'loss/train': 4.73927640914917} -09/20/2021 16:19:45 - INFO - __main__ - Step 8503: {'lr': 0.0001416, 'samples': 272096, 'steps': 531, 'loss/train': 5.317549228668213} -09/20/2021 16:19:46 - INFO - __main__ - Step 8504: {'lr': 0.0001416, 'samples': 272128, 'steps': 531, 'loss/train': 5.071071147918701} -09/20/2021 16:19:47 - INFO - __main__ - Step 8505: {'lr': 0.0001416, 'samples': 272160, 'steps': 531, 'loss/train': 4.4710211753845215} -09/20/2021 16:19:48 - INFO - __main__ - Step 8506: {'lr': 0.0001416, 'samples': 272192, 'steps': 531, 'loss/train': 4.881669998168945} -09/20/2021 16:19:48 - INFO - __main__ - Step 8507: {'lr': 0.0001416, 'samples': 272224, 'steps': 531, 'loss/train': 4.970876216888428} -09/20/2021 16:19:49 - INFO - __main__ - Step 8508: {'lr': 0.0001416, 'samples': 272256, 'steps': 531, 'loss/train': 4.787450790405273} -09/20/2021 16:19:50 - INFO - __main__ - Step 8509: {'lr': 0.0001416, 'samples': 272288, 'steps': 531, 'loss/train': 5.245649337768555} -09/20/2021 16:19:51 - INFO - __main__ - Step 8510: {'lr': 0.0001416, 'samples': 272320, 'steps': 531, 'loss/train': 5.1072845458984375} -09/20/2021 16:19:51 - INFO - __main__ - Step 8511: {'lr': 0.0001416, 'samples': 272352, 'steps': 531, 'loss/train': 6.955463886260986} -09/20/2021 16:19:52 - INFO - __main__ - Step 8512: {'lr': 0.0001416, 'samples': 272384, 'steps': 531, 'loss/train': 2.6486716270446777} -09/20/2021 16:19:53 - INFO - __main__ - Step 8513: {'lr': 0.00014186666666666668, 'samples': 272416, 'steps': 532, 'loss/train': 2.1351046562194824} -09/20/2021 16:19:54 - INFO - __main__ - Step 8514: {'lr': 0.00014186666666666668, 'samples': 272448, 'steps': 532, 'loss/train': 5.141280174255371} -09/20/2021 16:19:54 - INFO - __main__ - Step 8515: {'lr': 0.00014186666666666668, 'samples': 272480, 'steps': 532, 'loss/train': 5.738983154296875} -09/20/2021 16:19:55 - INFO - __main__ - Step 8516: {'lr': 0.00014186666666666668, 'samples': 272512, 'steps': 532, 'loss/train': 4.483355522155762} -09/20/2021 16:19:56 - INFO - __main__ - Step 8517: {'lr': 0.00014186666666666668, 'samples': 272544, 'steps': 532, 'loss/train': 4.598844051361084} -09/20/2021 16:19:57 - INFO - __main__ - Step 8518: {'lr': 0.00014186666666666668, 'samples': 272576, 'steps': 532, 'loss/train': 4.772737979888916} -09/20/2021 16:19:57 - INFO - __main__ - Step 8519: {'lr': 0.00014186666666666668, 'samples': 272608, 'steps': 532, 'loss/train': 4.964468955993652} -09/20/2021 16:19:58 - INFO - __main__ - Step 8520: {'lr': 0.00014186666666666668, 'samples': 272640, 'steps': 532, 'loss/train': 4.6673784255981445} -09/20/2021 16:19:59 - INFO - __main__ - Step 8521: {'lr': 0.00014186666666666668, 'samples': 272672, 'steps': 532, 'loss/train': 5.5370564460754395} -09/20/2021 16:20:00 - INFO - __main__ - Step 8522: {'lr': 0.00014186666666666668, 'samples': 272704, 'steps': 532, 'loss/train': 5.115022659301758} -09/20/2021 16:20:01 - INFO - __main__ - Step 8523: {'lr': 0.00014186666666666668, 'samples': 272736, 'steps': 532, 'loss/train': 4.942553997039795} -09/20/2021 16:20:02 - INFO - __main__ - Step 8524: {'lr': 0.00014186666666666668, 'samples': 272768, 'steps': 532, 'loss/train': 5.070718288421631} -09/20/2021 16:20:02 - INFO - __main__ - Step 8525: {'lr': 0.00014186666666666668, 'samples': 272800, 'steps': 532, 'loss/train': 4.235053062438965} -09/20/2021 16:20:03 - INFO - __main__ - Step 8526: {'lr': 0.00014186666666666668, 'samples': 272832, 'steps': 532, 'loss/train': 4.481072902679443} -09/20/2021 16:20:04 - INFO - __main__ - Step 8527: {'lr': 0.00014186666666666668, 'samples': 272864, 'steps': 532, 'loss/train': 5.280544757843018} -09/20/2021 16:20:05 - INFO - __main__ - Step 8528: {'lr': 0.00014186666666666668, 'samples': 272896, 'steps': 532, 'loss/train': 4.870207786560059} -09/20/2021 16:20:06 - INFO - __main__ - Step 8529: {'lr': 0.00014213333333333334, 'samples': 272928, 'steps': 533, 'loss/train': 4.4631781578063965} -09/20/2021 16:20:06 - INFO - __main__ - Step 8530: {'lr': 0.00014213333333333334, 'samples': 272960, 'steps': 533, 'loss/train': 3.7277729511260986} -09/20/2021 16:20:07 - INFO - __main__ - Step 8531: {'lr': 0.00014213333333333334, 'samples': 272992, 'steps': 533, 'loss/train': 4.731350421905518} -09/20/2021 16:20:08 - INFO - __main__ - Step 8532: {'lr': 0.00014213333333333334, 'samples': 273024, 'steps': 533, 'loss/train': 3.8916995525360107} -09/20/2021 16:20:09 - INFO - __main__ - Step 8533: {'lr': 0.00014213333333333334, 'samples': 273056, 'steps': 533, 'loss/train': 5.1738104820251465} -09/20/2021 16:20:09 - INFO - __main__ - Step 8534: {'lr': 0.00014213333333333334, 'samples': 273088, 'steps': 533, 'loss/train': 4.710616111755371} -09/20/2021 16:20:10 - INFO - __main__ - Step 8535: {'lr': 0.00014213333333333334, 'samples': 273120, 'steps': 533, 'loss/train': 5.35020112991333} -09/20/2021 16:20:11 - INFO - __main__ - Step 8536: {'lr': 0.00014213333333333334, 'samples': 273152, 'steps': 533, 'loss/train': 5.015140533447266} -09/20/2021 16:20:12 - INFO - __main__ - Step 8537: {'lr': 0.00014213333333333334, 'samples': 273184, 'steps': 533, 'loss/train': 4.861170291900635} -09/20/2021 16:20:12 - INFO - __main__ - Step 8538: {'lr': 0.00014213333333333334, 'samples': 273216, 'steps': 533, 'loss/train': 4.033350944519043} -09/20/2021 16:20:13 - INFO - __main__ - Step 8539: {'lr': 0.00014213333333333334, 'samples': 273248, 'steps': 533, 'loss/train': 4.4929938316345215} -09/20/2021 16:20:14 - INFO - __main__ - Step 8540: {'lr': 0.00014213333333333334, 'samples': 273280, 'steps': 533, 'loss/train': 4.98721981048584} -09/20/2021 16:20:15 - INFO - __main__ - Step 8541: {'lr': 0.00014213333333333334, 'samples': 273312, 'steps': 533, 'loss/train': 2.093859910964966} -09/20/2021 16:20:15 - INFO - __main__ - Step 8542: {'lr': 0.00014213333333333334, 'samples': 273344, 'steps': 533, 'loss/train': 5.061645030975342} -09/20/2021 16:20:16 - INFO - __main__ - Step 8543: {'lr': 0.00014213333333333334, 'samples': 273376, 'steps': 533, 'loss/train': 4.8342695236206055} -09/20/2021 16:20:17 - INFO - __main__ - Step 8544: {'lr': 0.00014213333333333334, 'samples': 273408, 'steps': 533, 'loss/train': 5.7136640548706055} -09/20/2021 16:20:18 - INFO - __main__ - Step 8545: {'lr': 0.0001424, 'samples': 273440, 'steps': 534, 'loss/train': 5.288957595825195} -09/20/2021 16:20:19 - INFO - __main__ - Step 8546: {'lr': 0.0001424, 'samples': 273472, 'steps': 534, 'loss/train': 4.531991481781006} -09/20/2021 16:20:19 - INFO - __main__ - Step 8547: {'lr': 0.0001424, 'samples': 273504, 'steps': 534, 'loss/train': 4.593311309814453} -09/20/2021 16:20:20 - INFO - __main__ - Step 8548: {'lr': 0.0001424, 'samples': 273536, 'steps': 534, 'loss/train': 4.623538017272949} -09/20/2021 16:20:21 - INFO - __main__ - Step 8549: {'lr': 0.0001424, 'samples': 273568, 'steps': 534, 'loss/train': 7.18848180770874} -09/20/2021 16:20:22 - INFO - __main__ - Step 8550: {'lr': 0.0001424, 'samples': 273600, 'steps': 534, 'loss/train': 4.447059631347656} -09/20/2021 16:20:23 - INFO - __main__ - Step 8551: {'lr': 0.0001424, 'samples': 273632, 'steps': 534, 'loss/train': 4.231389999389648} -09/20/2021 16:20:24 - INFO - __main__ - Step 8552: {'lr': 0.0001424, 'samples': 273664, 'steps': 534, 'loss/train': 4.866613388061523} -09/20/2021 16:20:24 - INFO - __main__ - Step 8553: {'lr': 0.0001424, 'samples': 273696, 'steps': 534, 'loss/train': 4.984864711761475} -09/20/2021 16:20:25 - INFO - __main__ - Step 8554: {'lr': 0.0001424, 'samples': 273728, 'steps': 534, 'loss/train': 4.405724048614502} -09/20/2021 16:20:26 - INFO - __main__ - Step 8555: {'lr': 0.0001424, 'samples': 273760, 'steps': 534, 'loss/train': 4.906392574310303} -09/20/2021 16:20:27 - INFO - __main__ - Step 8556: {'lr': 0.0001424, 'samples': 273792, 'steps': 534, 'loss/train': 4.87828254699707} -09/20/2021 16:20:27 - INFO - __main__ - Step 8557: {'lr': 0.0001424, 'samples': 273824, 'steps': 534, 'loss/train': 4.816371440887451} -09/20/2021 16:20:28 - INFO - __main__ - Step 8558: {'lr': 0.0001424, 'samples': 273856, 'steps': 534, 'loss/train': 4.9596686363220215} -09/20/2021 16:20:29 - INFO - __main__ - Step 8559: {'lr': 0.0001424, 'samples': 273888, 'steps': 534, 'loss/train': 4.693664073944092} -09/20/2021 16:20:30 - INFO - __main__ - Step 8560: {'lr': 0.0001424, 'samples': 273920, 'steps': 534, 'loss/train': 4.529881000518799} -09/20/2021 16:20:30 - INFO - __main__ - Step 8561: {'lr': 0.00014266666666666667, 'samples': 273952, 'steps': 535, 'loss/train': 4.416075229644775} -09/20/2021 16:20:31 - INFO - __main__ - Step 8562: {'lr': 0.00014266666666666667, 'samples': 273984, 'steps': 535, 'loss/train': 5.279847145080566} -09/20/2021 16:20:32 - INFO - __main__ - Step 8563: {'lr': 0.00014266666666666667, 'samples': 274016, 'steps': 535, 'loss/train': 5.096366882324219} -09/20/2021 16:20:33 - INFO - __main__ - Step 8564: {'lr': 0.00014266666666666667, 'samples': 274048, 'steps': 535, 'loss/train': 4.285220623016357} -09/20/2021 16:20:33 - INFO - __main__ - Step 8565: {'lr': 0.00014266666666666667, 'samples': 274080, 'steps': 535, 'loss/train': 4.713510990142822} -09/20/2021 16:20:34 - INFO - __main__ - Step 8566: {'lr': 0.00014266666666666667, 'samples': 274112, 'steps': 535, 'loss/train': 5.755059719085693} -09/20/2021 16:20:35 - INFO - __main__ - Step 8567: {'lr': 0.00014266666666666667, 'samples': 274144, 'steps': 535, 'loss/train': 5.260715007781982} -09/20/2021 16:20:36 - INFO - __main__ - Step 8568: {'lr': 0.00014266666666666667, 'samples': 274176, 'steps': 535, 'loss/train': 4.911330699920654} -09/20/2021 16:20:36 - INFO - __main__ - Step 8569: {'lr': 0.00014266666666666667, 'samples': 274208, 'steps': 535, 'loss/train': 5.1226725578308105} -09/20/2021 16:20:37 - INFO - __main__ - Step 8570: {'lr': 0.00014266666666666667, 'samples': 274240, 'steps': 535, 'loss/train': 5.202953815460205} -09/20/2021 16:20:38 - INFO - __main__ - Step 8571: {'lr': 0.00014266666666666667, 'samples': 274272, 'steps': 535, 'loss/train': 3.9337358474731445} -09/20/2021 16:20:39 - INFO - __main__ - Step 8572: {'lr': 0.00014266666666666667, 'samples': 274304, 'steps': 535, 'loss/train': 4.20900821685791} -09/20/2021 16:20:39 - INFO - __main__ - Step 8573: {'lr': 0.00014266666666666667, 'samples': 274336, 'steps': 535, 'loss/train': 4.451632499694824} -09/20/2021 16:20:40 - INFO - __main__ - Step 8574: {'lr': 0.00014266666666666667, 'samples': 274368, 'steps': 535, 'loss/train': 5.697014808654785} -09/20/2021 16:20:41 - INFO - __main__ - Step 8575: {'lr': 0.00014266666666666667, 'samples': 274400, 'steps': 535, 'loss/train': 4.524219989776611} -09/20/2021 16:20:42 - INFO - __main__ - Step 8576: {'lr': 0.00014266666666666667, 'samples': 274432, 'steps': 535, 'loss/train': 4.259039878845215} -09/20/2021 16:20:43 - INFO - __main__ - Step 8577: {'lr': 0.00014293333333333333, 'samples': 274464, 'steps': 536, 'loss/train': 4.081968307495117} -09/20/2021 16:20:43 - INFO - __main__ - Step 8578: {'lr': 0.00014293333333333333, 'samples': 274496, 'steps': 536, 'loss/train': 4.000454425811768} -09/20/2021 16:20:44 - INFO - __main__ - Step 8579: {'lr': 0.00014293333333333333, 'samples': 274528, 'steps': 536, 'loss/train': 4.850193500518799} -09/20/2021 16:20:45 - INFO - __main__ - Step 8580: {'lr': 0.00014293333333333333, 'samples': 274560, 'steps': 536, 'loss/train': 2.0229198932647705} -09/20/2021 16:20:46 - INFO - __main__ - Step 8581: {'lr': 0.00014293333333333333, 'samples': 274592, 'steps': 536, 'loss/train': 4.882555961608887} -09/20/2021 16:20:47 - INFO - __main__ - Step 8582: {'lr': 0.00014293333333333333, 'samples': 274624, 'steps': 536, 'loss/train': 3.999661684036255} -09/20/2021 16:20:48 - INFO - __main__ - Step 8583: {'lr': 0.00014293333333333333, 'samples': 274656, 'steps': 536, 'loss/train': 4.412973403930664} -09/20/2021 16:20:48 - INFO - __main__ - Step 8584: {'lr': 0.00014293333333333333, 'samples': 274688, 'steps': 536, 'loss/train': 5.112865924835205} -09/20/2021 16:20:49 - INFO - __main__ - Step 8585: {'lr': 0.00014293333333333333, 'samples': 274720, 'steps': 536, 'loss/train': 4.27836275100708} -09/20/2021 16:20:50 - INFO - __main__ - Step 8586: {'lr': 0.00014293333333333333, 'samples': 274752, 'steps': 536, 'loss/train': 4.565448760986328} -09/20/2021 16:20:51 - INFO - __main__ - Step 8587: {'lr': 0.00014293333333333333, 'samples': 274784, 'steps': 536, 'loss/train': 5.256210803985596} -09/20/2021 16:20:51 - INFO - __main__ - Step 8588: {'lr': 0.00014293333333333333, 'samples': 274816, 'steps': 536, 'loss/train': 4.941487789154053} -09/20/2021 16:20:52 - INFO - __main__ - Step 8589: {'lr': 0.00014293333333333333, 'samples': 274848, 'steps': 536, 'loss/train': 3.953704833984375} -09/20/2021 16:20:53 - INFO - __main__ - Step 8590: {'lr': 0.00014293333333333333, 'samples': 274880, 'steps': 536, 'loss/train': 5.258827209472656} -09/20/2021 16:20:54 - INFO - __main__ - Step 8591: {'lr': 0.00014293333333333333, 'samples': 274912, 'steps': 536, 'loss/train': 3.7023508548736572} -09/20/2021 16:20:54 - INFO - __main__ - Step 8592: {'lr': 0.00014293333333333333, 'samples': 274944, 'steps': 536, 'loss/train': 4.461130142211914} -09/20/2021 16:20:55 - INFO - __main__ - Step 8593: {'lr': 0.0001432, 'samples': 274976, 'steps': 537, 'loss/train': 4.7972893714904785} -09/20/2021 16:20:56 - INFO - __main__ - Step 8594: {'lr': 0.0001432, 'samples': 275008, 'steps': 537, 'loss/train': 3.9515013694763184} -09/20/2021 16:20:57 - INFO - __main__ - Step 8595: {'lr': 0.0001432, 'samples': 275040, 'steps': 537, 'loss/train': 4.552280902862549} -09/20/2021 16:20:57 - INFO - __main__ - Step 8596: {'lr': 0.0001432, 'samples': 275072, 'steps': 537, 'loss/train': 4.9941725730896} -09/20/2021 16:20:58 - INFO - __main__ - Step 8597: {'lr': 0.0001432, 'samples': 275104, 'steps': 537, 'loss/train': 4.74262809753418} -09/20/2021 16:20:59 - INFO - __main__ - Step 8598: {'lr': 0.0001432, 'samples': 275136, 'steps': 537, 'loss/train': 4.095609188079834} -09/20/2021 16:21:00 - INFO - __main__ - Step 8599: {'lr': 0.0001432, 'samples': 275168, 'steps': 537, 'loss/train': 3.8844950199127197} -09/20/2021 16:21:00 - INFO - __main__ - Step 8600: {'lr': 0.0001432, 'samples': 275200, 'steps': 537, 'loss/train': 4.925135135650635} -09/20/2021 16:21:01 - INFO - __main__ - Step 8601: {'lr': 0.0001432, 'samples': 275232, 'steps': 537, 'loss/train': 4.959153652191162} -09/20/2021 16:21:02 - INFO - __main__ - Step 8602: {'lr': 0.0001432, 'samples': 275264, 'steps': 537, 'loss/train': 4.275208950042725} -09/20/2021 16:21:03 - INFO - __main__ - Step 8603: {'lr': 0.0001432, 'samples': 275296, 'steps': 537, 'loss/train': 5.101418495178223} -09/20/2021 16:21:03 - INFO - __main__ - Step 8604: {'lr': 0.0001432, 'samples': 275328, 'steps': 537, 'loss/train': 4.333622455596924} -09/20/2021 16:21:04 - INFO - __main__ - Step 8605: {'lr': 0.0001432, 'samples': 275360, 'steps': 537, 'loss/train': 5.2811102867126465} -09/20/2021 16:21:05 - INFO - __main__ - Step 8606: {'lr': 0.0001432, 'samples': 275392, 'steps': 537, 'loss/train': 4.462065696716309} -09/20/2021 16:21:06 - INFO - __main__ - Step 8607: {'lr': 0.0001432, 'samples': 275424, 'steps': 537, 'loss/train': 4.579482078552246} -09/20/2021 16:21:06 - INFO - __main__ - Step 8608: {'lr': 0.0001432, 'samples': 275456, 'steps': 537, 'loss/train': 5.2504072189331055} -09/20/2021 16:21:07 - INFO - __main__ - Step 8609: {'lr': 0.0001434666666666667, 'samples': 275488, 'steps': 538, 'loss/train': 4.722216606140137} -09/20/2021 16:21:08 - INFO - __main__ - Step 8610: {'lr': 0.0001434666666666667, 'samples': 275520, 'steps': 538, 'loss/train': 4.870700359344482} -09/20/2021 16:21:09 - INFO - __main__ - Step 8611: {'lr': 0.0001434666666666667, 'samples': 275552, 'steps': 538, 'loss/train': 4.651228427886963} -09/20/2021 16:21:10 - INFO - __main__ - Step 8612: {'lr': 0.0001434666666666667, 'samples': 275584, 'steps': 538, 'loss/train': 3.8529627323150635} -09/20/2021 16:21:11 - INFO - __main__ - Step 8613: {'lr': 0.0001434666666666667, 'samples': 275616, 'steps': 538, 'loss/train': 3.941534996032715} -09/20/2021 16:21:12 - INFO - __main__ - Step 8614: {'lr': 0.0001434666666666667, 'samples': 275648, 'steps': 538, 'loss/train': 4.526480197906494} -09/20/2021 16:21:12 - INFO - __main__ - Step 8615: {'lr': 0.0001434666666666667, 'samples': 275680, 'steps': 538, 'loss/train': 4.324738502502441} -09/20/2021 16:21:13 - INFO - __main__ - Step 8616: {'lr': 0.0001434666666666667, 'samples': 275712, 'steps': 538, 'loss/train': 4.018342971801758} -09/20/2021 16:21:14 - INFO - __main__ - Step 8617: {'lr': 0.0001434666666666667, 'samples': 275744, 'steps': 538, 'loss/train': 3.9183366298675537} -09/20/2021 16:21:15 - INFO - __main__ - Step 8618: {'lr': 0.0001434666666666667, 'samples': 275776, 'steps': 538, 'loss/train': 5.246248722076416} -09/20/2021 16:21:15 - INFO - __main__ - Step 8619: {'lr': 0.0001434666666666667, 'samples': 275808, 'steps': 538, 'loss/train': 4.163156032562256} -09/20/2021 16:21:16 - INFO - __main__ - Step 8620: {'lr': 0.0001434666666666667, 'samples': 275840, 'steps': 538, 'loss/train': 4.274586200714111} -09/20/2021 16:21:17 - INFO - __main__ - Step 8621: {'lr': 0.0001434666666666667, 'samples': 275872, 'steps': 538, 'loss/train': 4.177013397216797} -09/20/2021 16:21:18 - INFO - __main__ - Step 8622: {'lr': 0.0001434666666666667, 'samples': 275904, 'steps': 538, 'loss/train': 4.882584571838379} -09/20/2021 16:21:18 - INFO - __main__ - Step 8623: {'lr': 0.0001434666666666667, 'samples': 275936, 'steps': 538, 'loss/train': 5.073654651641846} -09/20/2021 16:21:19 - INFO - __main__ - Step 8624: {'lr': 0.0001434666666666667, 'samples': 275968, 'steps': 538, 'loss/train': 5.636946678161621} -09/20/2021 16:21:20 - INFO - __main__ - Step 8625: {'lr': 0.00014373333333333335, 'samples': 276000, 'steps': 539, 'loss/train': 5.315260887145996} -09/20/2021 16:21:21 - INFO - __main__ - Step 8626: {'lr': 0.00014373333333333335, 'samples': 276032, 'steps': 539, 'loss/train': 4.9570512771606445} -09/20/2021 16:21:22 - INFO - __main__ - Step 8627: {'lr': 0.00014373333333333335, 'samples': 276064, 'steps': 539, 'loss/train': 5.678730487823486} -09/20/2021 16:21:22 - INFO - __main__ - Step 8628: {'lr': 0.00014373333333333335, 'samples': 276096, 'steps': 539, 'loss/train': 4.074306011199951} -09/20/2021 16:21:23 - INFO - __main__ - Step 8629: {'lr': 0.00014373333333333335, 'samples': 276128, 'steps': 539, 'loss/train': 4.59503173828125} -09/20/2021 16:21:24 - INFO - __main__ - Step 8630: {'lr': 0.00014373333333333335, 'samples': 276160, 'steps': 539, 'loss/train': 4.587224006652832} -09/20/2021 16:21:25 - INFO - __main__ - Step 8631: {'lr': 0.00014373333333333335, 'samples': 276192, 'steps': 539, 'loss/train': 4.569239139556885} -09/20/2021 16:21:25 - INFO - __main__ - Step 8632: {'lr': 0.00014373333333333335, 'samples': 276224, 'steps': 539, 'loss/train': 4.764120101928711} -09/20/2021 16:21:26 - INFO - __main__ - Step 8633: {'lr': 0.00014373333333333335, 'samples': 276256, 'steps': 539, 'loss/train': 5.105336666107178} -09/20/2021 16:21:27 - INFO - __main__ - Step 8634: {'lr': 0.00014373333333333335, 'samples': 276288, 'steps': 539, 'loss/train': 5.628556728363037} -09/20/2021 16:21:28 - INFO - __main__ - Step 8635: {'lr': 0.00014373333333333335, 'samples': 276320, 'steps': 539, 'loss/train': 4.800227642059326} -09/20/2021 16:21:28 - INFO - __main__ - Step 8636: {'lr': 0.00014373333333333335, 'samples': 276352, 'steps': 539, 'loss/train': 4.6448774337768555} -09/20/2021 16:21:29 - INFO - __main__ - Step 8637: {'lr': 0.00014373333333333335, 'samples': 276384, 'steps': 539, 'loss/train': 5.419508934020996} -09/20/2021 16:21:30 - INFO - __main__ - Step 8638: {'lr': 0.00014373333333333335, 'samples': 276416, 'steps': 539, 'loss/train': 4.404278755187988} -09/20/2021 16:21:31 - INFO - __main__ - Step 8639: {'lr': 0.00014373333333333335, 'samples': 276448, 'steps': 539, 'loss/train': 4.538841724395752} -09/20/2021 16:21:31 - INFO - __main__ - Step 8640: {'lr': 0.00014373333333333335, 'samples': 276480, 'steps': 539, 'loss/train': 4.142750263214111} -09/20/2021 16:21:32 - INFO - __main__ - Step 8641: {'lr': 0.000144, 'samples': 276512, 'steps': 540, 'loss/train': 3.913540840148926} -09/20/2021 16:21:33 - INFO - __main__ - Step 8642: {'lr': 0.000144, 'samples': 276544, 'steps': 540, 'loss/train': 4.475451469421387} -09/20/2021 16:21:34 - INFO - __main__ - Step 8643: {'lr': 0.000144, 'samples': 276576, 'steps': 540, 'loss/train': 4.8917155265808105} -09/20/2021 16:21:35 - INFO - __main__ - Step 8644: {'lr': 0.000144, 'samples': 276608, 'steps': 540, 'loss/train': 4.721489906311035} -09/20/2021 16:21:36 - INFO - __main__ - Step 8645: {'lr': 0.000144, 'samples': 276640, 'steps': 540, 'loss/train': 5.184974670410156} -09/20/2021 16:21:37 - INFO - __main__ - Step 8646: {'lr': 0.000144, 'samples': 276672, 'steps': 540, 'loss/train': 4.928077220916748} -09/20/2021 16:21:38 - INFO - __main__ - Step 8647: {'lr': 0.000144, 'samples': 276704, 'steps': 540, 'loss/train': 4.886809349060059} -09/20/2021 16:21:38 - INFO - __main__ - Step 8648: {'lr': 0.000144, 'samples': 276736, 'steps': 540, 'loss/train': 5.161494731903076} -09/20/2021 16:21:39 - INFO - __main__ - Step 8649: {'lr': 0.000144, 'samples': 276768, 'steps': 540, 'loss/train': 5.169743061065674} -09/20/2021 16:21:40 - INFO - __main__ - Step 8650: {'lr': 0.000144, 'samples': 276800, 'steps': 540, 'loss/train': 4.957679748535156} -09/20/2021 16:21:41 - INFO - __main__ - Step 8651: {'lr': 0.000144, 'samples': 276832, 'steps': 540, 'loss/train': 4.884688854217529} -09/20/2021 16:21:41 - INFO - __main__ - Step 8652: {'lr': 0.000144, 'samples': 276864, 'steps': 540, 'loss/train': 4.670226573944092} -09/20/2021 16:21:42 - INFO - __main__ - Step 8653: {'lr': 0.000144, 'samples': 276896, 'steps': 540, 'loss/train': 4.477506637573242} -09/20/2021 16:21:43 - INFO - __main__ - Step 8654: {'lr': 0.000144, 'samples': 276928, 'steps': 540, 'loss/train': 4.602237224578857} -09/20/2021 16:21:44 - INFO - __main__ - Step 8655: {'lr': 0.000144, 'samples': 276960, 'steps': 540, 'loss/train': 4.268200397491455} -09/20/2021 16:21:44 - INFO - __main__ - Step 8656: {'lr': 0.000144, 'samples': 276992, 'steps': 540, 'loss/train': 3.618330478668213} -09/20/2021 16:21:45 - INFO - __main__ - Step 8657: {'lr': 0.00014426666666666669, 'samples': 277024, 'steps': 541, 'loss/train': 5.313914775848389} -09/20/2021 16:21:46 - INFO - __main__ - Step 8658: {'lr': 0.00014426666666666669, 'samples': 277056, 'steps': 541, 'loss/train': 4.989913463592529} -09/20/2021 16:21:47 - INFO - __main__ - Step 8659: {'lr': 0.00014426666666666669, 'samples': 277088, 'steps': 541, 'loss/train': 4.478893756866455} -09/20/2021 16:21:48 - INFO - __main__ - Step 8660: {'lr': 0.00014426666666666669, 'samples': 277120, 'steps': 541, 'loss/train': 4.249532699584961} -09/20/2021 16:21:48 - INFO - __main__ - Step 8661: {'lr': 0.00014426666666666669, 'samples': 277152, 'steps': 541, 'loss/train': 5.366650104522705} -09/20/2021 16:21:49 - INFO - __main__ - Step 8662: {'lr': 0.00014426666666666669, 'samples': 277184, 'steps': 541, 'loss/train': 4.583704471588135} -09/20/2021 16:21:50 - INFO - __main__ - Step 8663: {'lr': 0.00014426666666666669, 'samples': 277216, 'steps': 541, 'loss/train': 5.435661315917969} -09/20/2021 16:21:51 - INFO - __main__ - Step 8664: {'lr': 0.00014426666666666669, 'samples': 277248, 'steps': 541, 'loss/train': 5.0781097412109375} -09/20/2021 16:21:51 - INFO - __main__ - Step 8665: {'lr': 0.00014426666666666669, 'samples': 277280, 'steps': 541, 'loss/train': 4.924991607666016} -09/20/2021 16:21:52 - INFO - __main__ - Step 8666: {'lr': 0.00014426666666666669, 'samples': 277312, 'steps': 541, 'loss/train': 4.995512962341309} -09/20/2021 16:21:53 - INFO - __main__ - Step 8667: {'lr': 0.00014426666666666669, 'samples': 277344, 'steps': 541, 'loss/train': 4.601343154907227} -09/20/2021 16:21:54 - INFO - __main__ - Step 8668: {'lr': 0.00014426666666666669, 'samples': 277376, 'steps': 541, 'loss/train': 3.765101909637451} -09/20/2021 16:21:54 - INFO - __main__ - Step 8669: {'lr': 0.00014426666666666669, 'samples': 277408, 'steps': 541, 'loss/train': 4.0301432609558105} -09/20/2021 16:21:55 - INFO - __main__ - Step 8670: {'lr': 0.00014426666666666669, 'samples': 277440, 'steps': 541, 'loss/train': 4.930648326873779} -09/20/2021 16:21:56 - INFO - __main__ - Step 8671: {'lr': 0.00014426666666666669, 'samples': 277472, 'steps': 541, 'loss/train': 4.884012222290039} -09/20/2021 16:21:57 - INFO - __main__ - Step 8672: {'lr': 0.00014426666666666669, 'samples': 277504, 'steps': 541, 'loss/train': 4.4512763023376465} -09/20/2021 16:21:57 - INFO - __main__ - Step 8673: {'lr': 0.00014453333333333334, 'samples': 277536, 'steps': 542, 'loss/train': 4.844992160797119} -09/20/2021 16:21:59 - INFO - __main__ - Step 8674: {'lr': 0.00014453333333333334, 'samples': 277568, 'steps': 542, 'loss/train': 4.703901290893555} -09/20/2021 16:21:59 - INFO - __main__ - Step 8675: {'lr': 0.00014453333333333334, 'samples': 277600, 'steps': 542, 'loss/train': 5.452399253845215} -09/20/2021 16:22:00 - INFO - __main__ - Step 8676: {'lr': 0.00014453333333333334, 'samples': 277632, 'steps': 542, 'loss/train': 5.6984148025512695} -09/20/2021 16:22:01 - INFO - __main__ - Step 8677: {'lr': 0.00014453333333333334, 'samples': 277664, 'steps': 542, 'loss/train': 5.054729461669922} -09/20/2021 16:22:02 - INFO - __main__ - Step 8678: {'lr': 0.00014453333333333334, 'samples': 277696, 'steps': 542, 'loss/train': 4.497401237487793} -09/20/2021 16:22:02 - INFO - __main__ - Step 8679: {'lr': 0.00014453333333333334, 'samples': 277728, 'steps': 542, 'loss/train': 4.048349857330322} -09/20/2021 16:22:03 - INFO - __main__ - Step 8680: {'lr': 0.00014453333333333334, 'samples': 277760, 'steps': 542, 'loss/train': 4.979940891265869} -09/20/2021 16:22:04 - INFO - __main__ - Step 8681: {'lr': 0.00014453333333333334, 'samples': 277792, 'steps': 542, 'loss/train': 4.633366107940674} -09/20/2021 16:22:05 - INFO - __main__ - Step 8682: {'lr': 0.00014453333333333334, 'samples': 277824, 'steps': 542, 'loss/train': 4.121127128601074} -09/20/2021 16:22:05 - INFO - __main__ - Step 8683: {'lr': 0.00014453333333333334, 'samples': 277856, 'steps': 542, 'loss/train': 4.77440071105957} -09/20/2021 16:22:06 - INFO - __main__ - Step 8684: {'lr': 0.00014453333333333334, 'samples': 277888, 'steps': 542, 'loss/train': 4.3921284675598145} -09/20/2021 16:22:07 - INFO - __main__ - Step 8685: {'lr': 0.00014453333333333334, 'samples': 277920, 'steps': 542, 'loss/train': 8.812451362609863} -09/20/2021 16:22:08 - INFO - __main__ - Step 8686: {'lr': 0.00014453333333333334, 'samples': 277952, 'steps': 542, 'loss/train': 6.635798454284668} -09/20/2021 16:22:08 - INFO - __main__ - Step 8687: {'lr': 0.00014453333333333334, 'samples': 277984, 'steps': 542, 'loss/train': 4.8322930335998535} -09/20/2021 16:22:09 - INFO - __main__ - Step 8688: {'lr': 0.00014453333333333334, 'samples': 278016, 'steps': 542, 'loss/train': 2.3093204498291016} -09/20/2021 16:22:10 - INFO - __main__ - Step 8689: {'lr': 0.0001448, 'samples': 278048, 'steps': 543, 'loss/train': 2.7384893894195557} -09/20/2021 16:22:11 - INFO - __main__ - Step 8690: {'lr': 0.0001448, 'samples': 278080, 'steps': 543, 'loss/train': 4.872547626495361} -09/20/2021 16:22:12 - INFO - __main__ - Step 8691: {'lr': 0.0001448, 'samples': 278112, 'steps': 543, 'loss/train': 4.407591819763184} -09/20/2021 16:22:12 - INFO - __main__ - Step 8692: {'lr': 0.0001448, 'samples': 278144, 'steps': 543, 'loss/train': 4.5949931144714355} -09/20/2021 16:22:13 - INFO - __main__ - Step 8693: {'lr': 0.0001448, 'samples': 278176, 'steps': 543, 'loss/train': 4.390746116638184} -09/20/2021 16:22:14 - INFO - __main__ - Step 8694: {'lr': 0.0001448, 'samples': 278208, 'steps': 543, 'loss/train': 4.230413436889648} -09/20/2021 16:22:15 - INFO - __main__ - Step 8695: {'lr': 0.0001448, 'samples': 278240, 'steps': 543, 'loss/train': 4.290513515472412} -09/20/2021 16:22:15 - INFO - __main__ - Step 8696: {'lr': 0.0001448, 'samples': 278272, 'steps': 543, 'loss/train': 6.143741607666016} -09/20/2021 16:22:16 - INFO - __main__ - Step 8697: {'lr': 0.0001448, 'samples': 278304, 'steps': 543, 'loss/train': 5.346500396728516} -09/20/2021 16:22:17 - INFO - __main__ - Step 8698: {'lr': 0.0001448, 'samples': 278336, 'steps': 543, 'loss/train': 5.178555965423584} -09/20/2021 16:22:18 - INFO - __main__ - Step 8699: {'lr': 0.0001448, 'samples': 278368, 'steps': 543, 'loss/train': 4.424061298370361} -09/20/2021 16:22:18 - INFO - __main__ - Step 8700: {'lr': 0.0001448, 'samples': 278400, 'steps': 543, 'loss/train': 5.164539813995361} -09/20/2021 16:22:19 - INFO - __main__ - Step 8701: {'lr': 0.0001448, 'samples': 278432, 'steps': 543, 'loss/train': 4.455605983734131} -09/20/2021 16:22:20 - INFO - __main__ - Step 8702: {'lr': 0.0001448, 'samples': 278464, 'steps': 543, 'loss/train': 4.518072605133057} -09/20/2021 16:22:21 - INFO - __main__ - Step 8703: {'lr': 0.0001448, 'samples': 278496, 'steps': 543, 'loss/train': 5.617737293243408} -09/20/2021 16:22:21 - INFO - __main__ - Step 8704: {'lr': 0.0001448, 'samples': 278528, 'steps': 543, 'loss/train': 5.053402900695801} -09/20/2021 16:22:23 - INFO - __main__ - Step 8705: {'lr': 0.00014506666666666668, 'samples': 278560, 'steps': 544, 'loss/train': 3.409853219985962} -09/20/2021 16:22:24 - INFO - __main__ - Step 8706: {'lr': 0.00014506666666666668, 'samples': 278592, 'steps': 544, 'loss/train': 5.815778732299805} -09/20/2021 16:22:24 - INFO - __main__ - Step 8707: {'lr': 0.00014506666666666668, 'samples': 278624, 'steps': 544, 'loss/train': 3.37567138671875} -09/20/2021 16:22:25 - INFO - __main__ - Step 8708: {'lr': 0.00014506666666666668, 'samples': 278656, 'steps': 544, 'loss/train': 3.933689594268799} -09/20/2021 16:22:26 - INFO - __main__ - Step 8709: {'lr': 0.00014506666666666668, 'samples': 278688, 'steps': 544, 'loss/train': 4.727020740509033} -09/20/2021 16:22:27 - INFO - __main__ - Step 8710: {'lr': 0.00014506666666666668, 'samples': 278720, 'steps': 544, 'loss/train': 4.793453693389893} -09/20/2021 16:22:27 - INFO - __main__ - Step 8711: {'lr': 0.00014506666666666668, 'samples': 278752, 'steps': 544, 'loss/train': 3.7516753673553467} -09/20/2021 16:22:28 - INFO - __main__ - Step 8712: {'lr': 0.00014506666666666668, 'samples': 278784, 'steps': 544, 'loss/train': 4.873437404632568} -09/20/2021 16:22:29 - INFO - __main__ - Step 8713: {'lr': 0.00014506666666666668, 'samples': 278816, 'steps': 544, 'loss/train': 3.621032238006592} -09/20/2021 16:22:30 - INFO - __main__ - Step 8714: {'lr': 0.00014506666666666668, 'samples': 278848, 'steps': 544, 'loss/train': 4.249039173126221} -09/20/2021 16:22:30 - INFO - __main__ - Step 8715: {'lr': 0.00014506666666666668, 'samples': 278880, 'steps': 544, 'loss/train': 5.111771106719971} -09/20/2021 16:22:31 - INFO - __main__ - Step 8716: {'lr': 0.00014506666666666668, 'samples': 278912, 'steps': 544, 'loss/train': 5.304750442504883} -09/20/2021 16:22:32 - INFO - __main__ - Step 8717: {'lr': 0.00014506666666666668, 'samples': 278944, 'steps': 544, 'loss/train': 2.3567047119140625} -09/20/2021 16:22:33 - INFO - __main__ - Step 8718: {'lr': 0.00014506666666666668, 'samples': 278976, 'steps': 544, 'loss/train': 3.7575180530548096} -09/20/2021 16:22:33 - INFO - __main__ - Step 8719: {'lr': 0.00014506666666666668, 'samples': 279008, 'steps': 544, 'loss/train': 5.058835983276367} -09/20/2021 16:22:34 - INFO - __main__ - Step 8720: {'lr': 0.00014506666666666668, 'samples': 279040, 'steps': 544, 'loss/train': 4.86111307144165} -09/20/2021 16:22:35 - INFO - __main__ - Step 8721: {'lr': 0.00014533333333333333, 'samples': 279072, 'steps': 545, 'loss/train': 4.22764778137207} -09/20/2021 16:22:36 - INFO - __main__ - Step 8722: {'lr': 0.00014533333333333333, 'samples': 279104, 'steps': 545, 'loss/train': 4.96473503112793} -09/20/2021 16:22:36 - INFO - __main__ - Step 8723: {'lr': 0.00014533333333333333, 'samples': 279136, 'steps': 545, 'loss/train': 4.5572381019592285} -09/20/2021 16:22:37 - INFO - __main__ - Step 8724: {'lr': 0.00014533333333333333, 'samples': 279168, 'steps': 545, 'loss/train': 3.9229743480682373} -09/20/2021 16:22:38 - INFO - __main__ - Step 8725: {'lr': 0.00014533333333333333, 'samples': 279200, 'steps': 545, 'loss/train': 5.306295394897461} -09/20/2021 16:22:39 - INFO - __main__ - Step 8726: {'lr': 0.00014533333333333333, 'samples': 279232, 'steps': 545, 'loss/train': 4.728877067565918} -09/20/2021 16:22:39 - INFO - __main__ - Step 8727: {'lr': 0.00014533333333333333, 'samples': 279264, 'steps': 545, 'loss/train': 5.301026821136475} -09/20/2021 16:22:40 - INFO - __main__ - Step 8728: {'lr': 0.00014533333333333333, 'samples': 279296, 'steps': 545, 'loss/train': 4.049553871154785} -09/20/2021 16:22:41 - INFO - __main__ - Step 8729: {'lr': 0.00014533333333333333, 'samples': 279328, 'steps': 545, 'loss/train': 1.613889455795288} -09/20/2021 16:22:42 - INFO - __main__ - Step 8730: {'lr': 0.00014533333333333333, 'samples': 279360, 'steps': 545, 'loss/train': 4.45424747467041} -09/20/2021 16:22:42 - INFO - __main__ - Step 8731: {'lr': 0.00014533333333333333, 'samples': 279392, 'steps': 545, 'loss/train': 4.8931884765625} -09/20/2021 16:22:43 - INFO - __main__ - Step 8732: {'lr': 0.00014533333333333333, 'samples': 279424, 'steps': 545, 'loss/train': 4.465628147125244} -09/20/2021 16:22:44 - INFO - __main__ - Step 8733: {'lr': 0.00014533333333333333, 'samples': 279456, 'steps': 545, 'loss/train': 2.9808309078216553} -09/20/2021 16:22:45 - INFO - __main__ - Step 8734: {'lr': 0.00014533333333333333, 'samples': 279488, 'steps': 545, 'loss/train': 4.6083245277404785} -09/20/2021 16:22:46 - INFO - __main__ - Step 8735: {'lr': 0.00014533333333333333, 'samples': 279520, 'steps': 545, 'loss/train': 4.299757957458496} -09/20/2021 16:22:47 - INFO - __main__ - Step 8736: {'lr': 0.00014533333333333333, 'samples': 279552, 'steps': 545, 'loss/train': 4.485967636108398} -09/20/2021 16:22:48 - INFO - __main__ - Step 8737: {'lr': 0.00014560000000000002, 'samples': 279584, 'steps': 546, 'loss/train': 4.350548267364502} -09/20/2021 16:22:49 - INFO - __main__ - Step 8738: {'lr': 0.00014560000000000002, 'samples': 279616, 'steps': 546, 'loss/train': 4.2686309814453125} -09/20/2021 16:22:49 - INFO - __main__ - Step 8739: {'lr': 0.00014560000000000002, 'samples': 279648, 'steps': 546, 'loss/train': 4.018514156341553} -09/20/2021 16:22:50 - INFO - __main__ - Step 8740: {'lr': 0.00014560000000000002, 'samples': 279680, 'steps': 546, 'loss/train': 3.938101053237915} -09/20/2021 16:22:51 - INFO - __main__ - Step 8741: {'lr': 0.00014560000000000002, 'samples': 279712, 'steps': 546, 'loss/train': 4.033778667449951} -09/20/2021 16:22:52 - INFO - __main__ - Step 8742: {'lr': 0.00014560000000000002, 'samples': 279744, 'steps': 546, 'loss/train': 3.918553590774536} -09/20/2021 16:22:52 - INFO - __main__ - Step 8743: {'lr': 0.00014560000000000002, 'samples': 279776, 'steps': 546, 'loss/train': 5.182283878326416} -09/20/2021 16:22:53 - INFO - __main__ - Step 8744: {'lr': 0.00014560000000000002, 'samples': 279808, 'steps': 546, 'loss/train': 4.236667156219482} -09/20/2021 16:22:54 - INFO - __main__ - Step 8745: {'lr': 0.00014560000000000002, 'samples': 279840, 'steps': 546, 'loss/train': 4.215882301330566} -09/20/2021 16:22:55 - INFO - __main__ - Step 8746: {'lr': 0.00014560000000000002, 'samples': 279872, 'steps': 546, 'loss/train': 4.644989013671875} -09/20/2021 16:22:55 - INFO - __main__ - Step 8747: {'lr': 0.00014560000000000002, 'samples': 279904, 'steps': 546, 'loss/train': 4.625006675720215} -09/20/2021 16:22:56 - INFO - __main__ - Step 8748: {'lr': 0.00014560000000000002, 'samples': 279936, 'steps': 546, 'loss/train': 5.232881546020508} -09/20/2021 16:22:57 - INFO - __main__ - Step 8749: {'lr': 0.00014560000000000002, 'samples': 279968, 'steps': 546, 'loss/train': 5.010272979736328} -09/20/2021 16:22:58 - INFO - __main__ - Step 8750: {'lr': 0.00014560000000000002, 'samples': 280000, 'steps': 546, 'loss/train': 5.320187091827393} -09/20/2021 16:22:58 - INFO - __main__ - Step 8751: {'lr': 0.00014560000000000002, 'samples': 280032, 'steps': 546, 'loss/train': 4.490715503692627} -09/20/2021 16:22:59 - INFO - __main__ - Step 8752: {'lr': 0.00014560000000000002, 'samples': 280064, 'steps': 546, 'loss/train': 4.959268569946289} -09/20/2021 16:23:00 - INFO - __main__ - Step 8753: {'lr': 0.00014586666666666667, 'samples': 280096, 'steps': 547, 'loss/train': 4.744622707366943} -09/20/2021 16:23:01 - INFO - __main__ - Step 8754: {'lr': 0.00014586666666666667, 'samples': 280128, 'steps': 547, 'loss/train': 4.025424957275391} -09/20/2021 16:23:01 - INFO - __main__ - Step 8755: {'lr': 0.00014586666666666667, 'samples': 280160, 'steps': 547, 'loss/train': 0.9227464199066162} -09/20/2021 16:23:02 - INFO - __main__ - Step 8756: {'lr': 0.00014586666666666667, 'samples': 280192, 'steps': 547, 'loss/train': 4.432146072387695} -09/20/2021 16:23:03 - INFO - __main__ - Step 8757: {'lr': 0.00014586666666666667, 'samples': 280224, 'steps': 547, 'loss/train': 6.753035545349121} -09/20/2021 16:23:04 - INFO - __main__ - Step 8758: {'lr': 0.00014586666666666667, 'samples': 280256, 'steps': 547, 'loss/train': 5.097656726837158} -09/20/2021 16:23:04 - INFO - __main__ - Step 8759: {'lr': 0.00014586666666666667, 'samples': 280288, 'steps': 547, 'loss/train': 3.9400484561920166} -09/20/2021 16:23:05 - INFO - __main__ - Step 8760: {'lr': 0.00014586666666666667, 'samples': 280320, 'steps': 547, 'loss/train': 4.805693626403809} -09/20/2021 16:23:06 - INFO - __main__ - Step 8761: {'lr': 0.00014586666666666667, 'samples': 280352, 'steps': 547, 'loss/train': 1.913260579109192} -09/20/2021 16:23:07 - INFO - __main__ - Step 8762: {'lr': 0.00014586666666666667, 'samples': 280384, 'steps': 547, 'loss/train': 1.7418928146362305} -09/20/2021 16:23:07 - INFO - __main__ - Step 8763: {'lr': 0.00014586666666666667, 'samples': 280416, 'steps': 547, 'loss/train': 5.638460159301758} -09/20/2021 16:23:08 - INFO - __main__ - Step 8764: {'lr': 0.00014586666666666667, 'samples': 280448, 'steps': 547, 'loss/train': 4.563520908355713} -09/20/2021 16:23:09 - INFO - __main__ - Step 8765: {'lr': 0.00014586666666666667, 'samples': 280480, 'steps': 547, 'loss/train': 4.184507369995117} -09/20/2021 16:23:10 - INFO - __main__ - Step 8766: {'lr': 0.00014586666666666667, 'samples': 280512, 'steps': 547, 'loss/train': 5.2215046882629395} -09/20/2021 16:23:11 - INFO - __main__ - Step 8767: {'lr': 0.00014586666666666667, 'samples': 280544, 'steps': 547, 'loss/train': 3.9947142601013184} -09/20/2021 16:23:12 - INFO - __main__ - Step 8768: {'lr': 0.00014586666666666667, 'samples': 280576, 'steps': 547, 'loss/train': 4.2927327156066895} -09/20/2021 16:23:13 - INFO - __main__ - Step 8769: {'lr': 0.00014613333333333335, 'samples': 280608, 'steps': 548, 'loss/train': 4.855863571166992} -09/20/2021 16:23:13 - INFO - __main__ - Step 8770: {'lr': 0.00014613333333333335, 'samples': 280640, 'steps': 548, 'loss/train': 4.503427982330322} -09/20/2021 16:23:14 - INFO - __main__ - Step 8771: {'lr': 0.00014613333333333335, 'samples': 280672, 'steps': 548, 'loss/train': 5.00895357131958} -09/20/2021 16:23:15 - INFO - __main__ - Step 8772: {'lr': 0.00014613333333333335, 'samples': 280704, 'steps': 548, 'loss/train': 4.832058429718018} -09/20/2021 16:23:16 - INFO - __main__ - Step 8773: {'lr': 0.00014613333333333335, 'samples': 280736, 'steps': 548, 'loss/train': 6.1590800285339355} -09/20/2021 16:23:16 - INFO - __main__ - Step 8774: {'lr': 0.00014613333333333335, 'samples': 280768, 'steps': 548, 'loss/train': 5.550589561462402} -09/20/2021 16:23:17 - INFO - __main__ - Step 8775: {'lr': 0.00014613333333333335, 'samples': 280800, 'steps': 548, 'loss/train': 2.1059064865112305} -09/20/2021 16:23:18 - INFO - __main__ - Step 8776: {'lr': 0.00014613333333333335, 'samples': 280832, 'steps': 548, 'loss/train': 4.20202112197876} -09/20/2021 16:23:19 - INFO - __main__ - Step 8777: {'lr': 0.00014613333333333335, 'samples': 280864, 'steps': 548, 'loss/train': 5.022310733795166} -09/20/2021 16:23:19 - INFO - __main__ - Step 8778: {'lr': 0.00014613333333333335, 'samples': 280896, 'steps': 548, 'loss/train': 4.706131458282471} -09/20/2021 16:23:20 - INFO - __main__ - Step 8779: {'lr': 0.00014613333333333335, 'samples': 280928, 'steps': 548, 'loss/train': 4.145749092102051} -09/20/2021 16:23:21 - INFO - __main__ - Step 8780: {'lr': 0.00014613333333333335, 'samples': 280960, 'steps': 548, 'loss/train': 4.388622283935547} -09/20/2021 16:23:22 - INFO - __main__ - Step 8781: {'lr': 0.00014613333333333335, 'samples': 280992, 'steps': 548, 'loss/train': 5.424875259399414} -09/20/2021 16:23:22 - INFO - __main__ - Step 8782: {'lr': 0.00014613333333333335, 'samples': 281024, 'steps': 548, 'loss/train': 5.064518451690674} -09/20/2021 16:23:23 - INFO - __main__ - Step 8783: {'lr': 0.00014613333333333335, 'samples': 281056, 'steps': 548, 'loss/train': 4.788963794708252} -09/20/2021 16:23:24 - INFO - __main__ - Step 8784: {'lr': 0.00014613333333333335, 'samples': 281088, 'steps': 548, 'loss/train': 4.942248821258545} -09/20/2021 16:23:25 - INFO - __main__ - Step 8785: {'lr': 0.0001464, 'samples': 281120, 'steps': 549, 'loss/train': 5.221830368041992} -09/20/2021 16:23:26 - INFO - __main__ - Step 8786: {'lr': 0.0001464, 'samples': 281152, 'steps': 549, 'loss/train': 4.990590572357178} -09/20/2021 16:23:26 - INFO - __main__ - Step 8787: {'lr': 0.0001464, 'samples': 281184, 'steps': 549, 'loss/train': 4.655102252960205} -09/20/2021 16:23:27 - INFO - __main__ - Step 8788: {'lr': 0.0001464, 'samples': 281216, 'steps': 549, 'loss/train': 4.762993812561035} -09/20/2021 16:23:28 - INFO - __main__ - Step 8789: {'lr': 0.0001464, 'samples': 281248, 'steps': 549, 'loss/train': 3.405433177947998} -09/20/2021 16:23:29 - INFO - __main__ - Step 8790: {'lr': 0.0001464, 'samples': 281280, 'steps': 549, 'loss/train': 5.840703010559082} -09/20/2021 16:23:29 - INFO - __main__ - Step 8791: {'lr': 0.0001464, 'samples': 281312, 'steps': 549, 'loss/train': 7.53125524520874} -09/20/2021 16:23:30 - INFO - __main__ - Step 8792: {'lr': 0.0001464, 'samples': 281344, 'steps': 549, 'loss/train': 7.740396022796631} -09/20/2021 16:23:31 - INFO - __main__ - Step 8793: {'lr': 0.0001464, 'samples': 281376, 'steps': 549, 'loss/train': 5.513426780700684} -09/20/2021 16:23:32 - INFO - __main__ - Step 8794: {'lr': 0.0001464, 'samples': 281408, 'steps': 549, 'loss/train': 4.19374418258667} -09/20/2021 16:23:32 - INFO - __main__ - Step 8795: {'lr': 0.0001464, 'samples': 281440, 'steps': 549, 'loss/train': 4.673464298248291} -09/20/2021 16:23:33 - INFO - __main__ - Step 8796: {'lr': 0.0001464, 'samples': 281472, 'steps': 549, 'loss/train': 4.022722244262695} -09/20/2021 16:23:34 - INFO - __main__ - Step 8797: {'lr': 0.0001464, 'samples': 281504, 'steps': 549, 'loss/train': 6.207230091094971} -09/20/2021 16:23:35 - INFO - __main__ - Step 8798: {'lr': 0.0001464, 'samples': 281536, 'steps': 549, 'loss/train': 4.65984582901001} -09/20/2021 16:23:36 - INFO - __main__ - Step 8799: {'lr': 0.0001464, 'samples': 281568, 'steps': 549, 'loss/train': 4.1105570793151855} -09/20/2021 16:23:37 - INFO - __main__ - Step 8800: {'lr': 0.0001464, 'samples': 281600, 'steps': 549, 'loss/train': 4.5115766525268555} -09/20/2021 16:23:38 - INFO - __main__ - Step 8801: {'lr': 0.00014666666666666666, 'samples': 281632, 'steps': 550, 'loss/train': 5.363185882568359} -09/20/2021 16:23:39 - INFO - __main__ - Step 8802: {'lr': 0.00014666666666666666, 'samples': 281664, 'steps': 550, 'loss/train': 4.014005661010742} -09/20/2021 16:23:39 - INFO - __main__ - Step 8803: {'lr': 0.00014666666666666666, 'samples': 281696, 'steps': 550, 'loss/train': 4.117419719696045} -09/20/2021 16:23:40 - INFO - __main__ - Step 8804: {'lr': 0.00014666666666666666, 'samples': 281728, 'steps': 550, 'loss/train': 4.198543548583984} -09/20/2021 16:23:41 - INFO - __main__ - Step 8805: {'lr': 0.00014666666666666666, 'samples': 281760, 'steps': 550, 'loss/train': 6.080329418182373} -09/20/2021 16:23:42 - INFO - __main__ - Step 8806: {'lr': 0.00014666666666666666, 'samples': 281792, 'steps': 550, 'loss/train': 4.844783782958984} -09/20/2021 16:23:42 - INFO - __main__ - Step 8807: {'lr': 0.00014666666666666666, 'samples': 281824, 'steps': 550, 'loss/train': 4.6055908203125} -09/20/2021 16:23:43 - INFO - __main__ - Step 8808: {'lr': 0.00014666666666666666, 'samples': 281856, 'steps': 550, 'loss/train': 3.8873579502105713} -09/20/2021 16:23:44 - INFO - __main__ - Step 8809: {'lr': 0.00014666666666666666, 'samples': 281888, 'steps': 550, 'loss/train': 5.174834251403809} -09/20/2021 16:23:45 - INFO - __main__ - Step 8810: {'lr': 0.00014666666666666666, 'samples': 281920, 'steps': 550, 'loss/train': 2.617835760116577} -09/20/2021 16:23:45 - INFO - __main__ - Step 8811: {'lr': 0.00014666666666666666, 'samples': 281952, 'steps': 550, 'loss/train': 3.423670768737793} -09/20/2021 16:23:46 - INFO - __main__ - Step 8812: {'lr': 0.00014666666666666666, 'samples': 281984, 'steps': 550, 'loss/train': 3.3882298469543457} -09/20/2021 16:23:47 - INFO - __main__ - Step 8813: {'lr': 0.00014666666666666666, 'samples': 282016, 'steps': 550, 'loss/train': 3.1760222911834717} -09/20/2021 16:23:48 - INFO - __main__ - Step 8814: {'lr': 0.00014666666666666666, 'samples': 282048, 'steps': 550, 'loss/train': 4.952771186828613} -09/20/2021 16:23:48 - INFO - __main__ - Step 8815: {'lr': 0.00014666666666666666, 'samples': 282080, 'steps': 550, 'loss/train': 4.921766757965088} -09/20/2021 16:23:49 - INFO - __main__ - Step 8816: {'lr': 0.00014666666666666666, 'samples': 282112, 'steps': 550, 'loss/train': 4.087123394012451} -09/20/2021 16:23:50 - INFO - __main__ - Step 8817: {'lr': 0.00014693333333333335, 'samples': 282144, 'steps': 551, 'loss/train': 4.535655975341797} -09/20/2021 16:23:51 - INFO - __main__ - Step 8818: {'lr': 0.00014693333333333335, 'samples': 282176, 'steps': 551, 'loss/train': 5.110498905181885} -09/20/2021 16:23:52 - INFO - __main__ - Step 8819: {'lr': 0.00014693333333333335, 'samples': 282208, 'steps': 551, 'loss/train': 4.3342180252075195} -09/20/2021 16:23:52 - INFO - __main__ - Step 8820: {'lr': 0.00014693333333333335, 'samples': 282240, 'steps': 551, 'loss/train': 3.931856155395508} -09/20/2021 16:23:53 - INFO - __main__ - Step 8821: {'lr': 0.00014693333333333335, 'samples': 282272, 'steps': 551, 'loss/train': 4.961073398590088} -09/20/2021 16:23:54 - INFO - __main__ - Step 8822: {'lr': 0.00014693333333333335, 'samples': 282304, 'steps': 551, 'loss/train': 4.552909851074219} -09/20/2021 16:23:55 - INFO - __main__ - Step 8823: {'lr': 0.00014693333333333335, 'samples': 282336, 'steps': 551, 'loss/train': 4.625499248504639} -09/20/2021 16:23:55 - INFO - __main__ - Step 8824: {'lr': 0.00014693333333333335, 'samples': 282368, 'steps': 551, 'loss/train': 4.476044654846191} -09/20/2021 16:23:56 - INFO - __main__ - Step 8825: {'lr': 0.00014693333333333335, 'samples': 282400, 'steps': 551, 'loss/train': 5.770176887512207} -09/20/2021 16:23:57 - INFO - __main__ - Step 8826: {'lr': 0.00014693333333333335, 'samples': 282432, 'steps': 551, 'loss/train': 4.686690330505371} -09/20/2021 16:23:58 - INFO - __main__ - Step 8827: {'lr': 0.00014693333333333335, 'samples': 282464, 'steps': 551, 'loss/train': 5.255993843078613} -09/20/2021 16:23:58 - INFO - __main__ - Step 8828: {'lr': 0.00014693333333333335, 'samples': 282496, 'steps': 551, 'loss/train': 4.860708713531494} -09/20/2021 16:23:59 - INFO - __main__ - Step 8829: {'lr': 0.00014693333333333335, 'samples': 282528, 'steps': 551, 'loss/train': 4.331442356109619} -09/20/2021 16:24:00 - INFO - __main__ - Step 8830: {'lr': 0.00014693333333333335, 'samples': 282560, 'steps': 551, 'loss/train': 4.685753345489502} -09/20/2021 16:24:01 - INFO - __main__ - Step 8831: {'lr': 0.00014693333333333335, 'samples': 282592, 'steps': 551, 'loss/train': 4.54278564453125} -09/20/2021 16:24:01 - INFO - __main__ - Step 8832: {'lr': 0.00014693333333333335, 'samples': 282624, 'steps': 551, 'loss/train': 4.477823257446289} -09/20/2021 16:24:02 - INFO - __main__ - Step 8833: {'lr': 0.0001472, 'samples': 282656, 'steps': 552, 'loss/train': 4.645668029785156} -09/20/2021 16:24:03 - INFO - __main__ - Step 8834: {'lr': 0.0001472, 'samples': 282688, 'steps': 552, 'loss/train': 4.39709997177124} -09/20/2021 16:24:04 - INFO - __main__ - Step 8835: {'lr': 0.0001472, 'samples': 282720, 'steps': 552, 'loss/train': 4.833993434906006} -09/20/2021 16:24:05 - INFO - __main__ - Step 8836: {'lr': 0.0001472, 'samples': 282752, 'steps': 552, 'loss/train': 5.109885215759277} -09/20/2021 16:24:06 - INFO - __main__ - Step 8837: {'lr': 0.0001472, 'samples': 282784, 'steps': 552, 'loss/train': 3.816988706588745} -09/20/2021 16:24:07 - INFO - __main__ - Step 8838: {'lr': 0.0001472, 'samples': 282816, 'steps': 552, 'loss/train': 4.912782192230225} -09/20/2021 16:24:07 - INFO - __main__ - Step 8839: {'lr': 0.0001472, 'samples': 282848, 'steps': 552, 'loss/train': 4.789555549621582} -09/20/2021 16:24:08 - INFO - __main__ - Step 8840: {'lr': 0.0001472, 'samples': 282880, 'steps': 552, 'loss/train': 1.7312630414962769} -09/20/2021 16:24:09 - INFO - __main__ - Step 8841: {'lr': 0.0001472, 'samples': 282912, 'steps': 552, 'loss/train': 4.448312759399414} -09/20/2021 16:24:10 - INFO - __main__ - Step 8842: {'lr': 0.0001472, 'samples': 282944, 'steps': 552, 'loss/train': 3.0448451042175293} -09/20/2021 16:24:10 - INFO - __main__ - Step 8843: {'lr': 0.0001472, 'samples': 282976, 'steps': 552, 'loss/train': 4.602610111236572} -09/20/2021 16:24:11 - INFO - __main__ - Step 8844: {'lr': 0.0001472, 'samples': 283008, 'steps': 552, 'loss/train': 5.9692206382751465} -09/20/2021 16:24:12 - INFO - __main__ - Step 8845: {'lr': 0.0001472, 'samples': 283040, 'steps': 552, 'loss/train': 4.496517658233643} -09/20/2021 16:24:13 - INFO - __main__ - Step 8846: {'lr': 0.0001472, 'samples': 283072, 'steps': 552, 'loss/train': 3.8389477729797363} -09/20/2021 16:24:13 - INFO - __main__ - Step 8847: {'lr': 0.0001472, 'samples': 283104, 'steps': 552, 'loss/train': 4.348290920257568} -09/20/2021 16:24:14 - INFO - __main__ - Step 8848: {'lr': 0.0001472, 'samples': 283136, 'steps': 552, 'loss/train': 4.1751837730407715} -09/20/2021 16:24:15 - INFO - __main__ - Step 8849: {'lr': 0.00014746666666666666, 'samples': 283168, 'steps': 553, 'loss/train': 4.692869663238525} -09/20/2021 16:24:16 - INFO - __main__ - Step 8850: {'lr': 0.00014746666666666666, 'samples': 283200, 'steps': 553, 'loss/train': 4.168046474456787} -09/20/2021 16:24:16 - INFO - __main__ - Step 8851: {'lr': 0.00014746666666666666, 'samples': 283232, 'steps': 553, 'loss/train': 4.9569525718688965} -09/20/2021 16:24:17 - INFO - __main__ - Step 8852: {'lr': 0.00014746666666666666, 'samples': 283264, 'steps': 553, 'loss/train': 6.212102890014648} -09/20/2021 16:24:18 - INFO - __main__ - Step 8853: {'lr': 0.00014746666666666666, 'samples': 283296, 'steps': 553, 'loss/train': 6.263455390930176} -09/20/2021 16:24:19 - INFO - __main__ - Step 8854: {'lr': 0.00014746666666666666, 'samples': 283328, 'steps': 553, 'loss/train': 6.279610633850098} -09/20/2021 16:24:19 - INFO - __main__ - Step 8855: {'lr': 0.00014746666666666666, 'samples': 283360, 'steps': 553, 'loss/train': 5.620344161987305} -09/20/2021 16:24:20 - INFO - __main__ - Step 8856: {'lr': 0.00014746666666666666, 'samples': 283392, 'steps': 553, 'loss/train': 5.307162761688232} -09/20/2021 16:24:21 - INFO - __main__ - Step 8857: {'lr': 0.00014746666666666666, 'samples': 283424, 'steps': 553, 'loss/train': 4.348668575286865} -09/20/2021 16:24:22 - INFO - __main__ - Step 8858: {'lr': 0.00014746666666666666, 'samples': 283456, 'steps': 553, 'loss/train': 4.86862325668335} -09/20/2021 16:24:22 - INFO - __main__ - Step 8859: {'lr': 0.00014746666666666666, 'samples': 283488, 'steps': 553, 'loss/train': 4.321255207061768} -09/20/2021 16:24:23 - INFO - __main__ - Step 8860: {'lr': 0.00014746666666666666, 'samples': 283520, 'steps': 553, 'loss/train': 4.1426825523376465} -09/20/2021 16:24:24 - INFO - __main__ - Step 8861: {'lr': 0.00014746666666666666, 'samples': 283552, 'steps': 553, 'loss/train': 4.583425521850586} -09/20/2021 16:24:25 - INFO - __main__ - Step 8862: {'lr': 0.00014746666666666666, 'samples': 283584, 'steps': 553, 'loss/train': 5.07042121887207} -09/20/2021 16:24:25 - INFO - __main__ - Step 8863: {'lr': 0.00014746666666666666, 'samples': 283616, 'steps': 553, 'loss/train': 4.274483680725098} -09/20/2021 16:24:26 - INFO - __main__ - Step 8864: {'lr': 0.00014746666666666666, 'samples': 283648, 'steps': 553, 'loss/train': 4.451789379119873} -09/20/2021 16:24:27 - INFO - __main__ - Step 8865: {'lr': 0.00014773333333333334, 'samples': 283680, 'steps': 554, 'loss/train': 5.020596504211426} -09/20/2021 16:24:28 - INFO - __main__ - Step 8866: {'lr': 0.00014773333333333334, 'samples': 283712, 'steps': 554, 'loss/train': 5.49672269821167} -09/20/2021 16:24:30 - INFO - __main__ - Step 8867: {'lr': 0.00014773333333333334, 'samples': 283744, 'steps': 554, 'loss/train': 3.784571647644043} -09/20/2021 16:24:30 - INFO - __main__ - Step 8868: {'lr': 0.00014773333333333334, 'samples': 283776, 'steps': 554, 'loss/train': 4.398290634155273} -09/20/2021 16:24:31 - INFO - __main__ - Step 8869: {'lr': 0.00014773333333333334, 'samples': 283808, 'steps': 554, 'loss/train': 4.215512275695801} -09/20/2021 16:24:32 - INFO - __main__ - Step 8870: {'lr': 0.00014773333333333334, 'samples': 283840, 'steps': 554, 'loss/train': 4.655342102050781} -09/20/2021 16:24:33 - INFO - __main__ - Step 8871: {'lr': 0.00014773333333333334, 'samples': 283872, 'steps': 554, 'loss/train': 4.943868637084961} -09/20/2021 16:24:33 - INFO - __main__ - Step 8872: {'lr': 0.00014773333333333334, 'samples': 283904, 'steps': 554, 'loss/train': 4.44386625289917} -09/20/2021 16:24:34 - INFO - __main__ - Step 8873: {'lr': 0.00014773333333333334, 'samples': 283936, 'steps': 554, 'loss/train': 4.416555881500244} -09/20/2021 16:24:35 - INFO - __main__ - Step 8874: {'lr': 0.00014773333333333334, 'samples': 283968, 'steps': 554, 'loss/train': 4.6960649490356445} -09/20/2021 16:24:36 - INFO - __main__ - Step 8875: {'lr': 0.00014773333333333334, 'samples': 284000, 'steps': 554, 'loss/train': 5.467188358306885} -09/20/2021 16:24:36 - INFO - __main__ - Step 8876: {'lr': 0.00014773333333333334, 'samples': 284032, 'steps': 554, 'loss/train': 4.913352012634277} -09/20/2021 16:24:37 - INFO - __main__ - Step 8877: {'lr': 0.00014773333333333334, 'samples': 284064, 'steps': 554, 'loss/train': 4.0274577140808105} -09/20/2021 16:24:38 - INFO - __main__ - Step 8878: {'lr': 0.00014773333333333334, 'samples': 284096, 'steps': 554, 'loss/train': 4.249619007110596} -09/20/2021 16:24:39 - INFO - __main__ - Step 8879: {'lr': 0.00014773333333333334, 'samples': 284128, 'steps': 554, 'loss/train': 5.2652997970581055} -09/20/2021 16:24:39 - INFO - __main__ - Step 8880: {'lr': 0.00014773333333333334, 'samples': 284160, 'steps': 554, 'loss/train': 5.727665901184082} -09/20/2021 16:24:40 - INFO - __main__ - Step 8881: {'lr': 0.000148, 'samples': 284192, 'steps': 555, 'loss/train': 5.4051008224487305} -09/20/2021 16:24:41 - INFO - __main__ - Step 8882: {'lr': 0.000148, 'samples': 284224, 'steps': 555, 'loss/train': 4.886484146118164} -09/20/2021 16:24:42 - INFO - __main__ - Step 8883: {'lr': 0.000148, 'samples': 284256, 'steps': 555, 'loss/train': 4.669949531555176} -09/20/2021 16:24:42 - INFO - __main__ - Step 8884: {'lr': 0.000148, 'samples': 284288, 'steps': 555, 'loss/train': 4.782452583312988} -09/20/2021 16:24:43 - INFO - __main__ - Step 8885: {'lr': 0.000148, 'samples': 284320, 'steps': 555, 'loss/train': 5.324540615081787} -09/20/2021 16:24:44 - INFO - __main__ - Step 8886: {'lr': 0.000148, 'samples': 284352, 'steps': 555, 'loss/train': 2.205382823944092} -09/20/2021 16:24:45 - INFO - __main__ - Step 8887: {'lr': 0.000148, 'samples': 284384, 'steps': 555, 'loss/train': 2.4185738563537598} -09/20/2021 16:24:45 - INFO - __main__ - Step 8888: {'lr': 0.000148, 'samples': 284416, 'steps': 555, 'loss/train': 2.711652994155884} -09/20/2021 16:24:46 - INFO - __main__ - Step 8889: {'lr': 0.000148, 'samples': 284448, 'steps': 555, 'loss/train': 2.9867029190063477} -09/20/2021 16:24:47 - INFO - __main__ - Step 8890: {'lr': 0.000148, 'samples': 284480, 'steps': 555, 'loss/train': 3.426304817199707} -09/20/2021 16:24:48 - INFO - __main__ - Step 8891: {'lr': 0.000148, 'samples': 284512, 'steps': 555, 'loss/train': 3.041686773300171} -09/20/2021 16:24:48 - INFO - __main__ - Step 8892: {'lr': 0.000148, 'samples': 284544, 'steps': 555, 'loss/train': 2.35727858543396} -09/20/2021 16:24:49 - INFO - __main__ - Step 8893: {'lr': 0.000148, 'samples': 284576, 'steps': 555, 'loss/train': 5.77281379699707} -09/20/2021 16:24:50 - INFO - __main__ - Step 8894: {'lr': 0.000148, 'samples': 284608, 'steps': 555, 'loss/train': 4.946949005126953} -09/20/2021 16:24:51 - INFO - __main__ - Step 8895: {'lr': 0.000148, 'samples': 284640, 'steps': 555, 'loss/train': 4.691661834716797} -09/20/2021 16:24:51 - INFO - __main__ - Step 8896: {'lr': 0.000148, 'samples': 284672, 'steps': 555, 'loss/train': 4.546394348144531} -09/20/2021 16:24:52 - INFO - __main__ - Step 8897: {'lr': 0.00014826666666666667, 'samples': 284704, 'steps': 556, 'loss/train': 4.069742202758789} -09/20/2021 16:24:54 - INFO - __main__ - Step 8898: {'lr': 0.00014826666666666667, 'samples': 284736, 'steps': 556, 'loss/train': 5.40427303314209} -09/20/2021 16:24:55 - INFO - __main__ - Step 8899: {'lr': 0.00014826666666666667, 'samples': 284768, 'steps': 556, 'loss/train': 5.232038497924805} -09/20/2021 16:24:55 - INFO - __main__ - Step 8900: {'lr': 0.00014826666666666667, 'samples': 284800, 'steps': 556, 'loss/train': 3.7768208980560303} -09/20/2021 16:24:56 - INFO - __main__ - Step 8901: {'lr': 0.00014826666666666667, 'samples': 284832, 'steps': 556, 'loss/train': 4.2652177810668945} -09/20/2021 16:24:57 - INFO - __main__ - Step 8902: {'lr': 0.00014826666666666667, 'samples': 284864, 'steps': 556, 'loss/train': 4.175860404968262} -09/20/2021 16:24:58 - INFO - __main__ - Step 8903: {'lr': 0.00014826666666666667, 'samples': 284896, 'steps': 556, 'loss/train': 5.1209917068481445} -09/20/2021 16:24:58 - INFO - __main__ - Step 8904: {'lr': 0.00014826666666666667, 'samples': 284928, 'steps': 556, 'loss/train': 4.8940277099609375} -09/20/2021 16:24:59 - INFO - __main__ - Step 8905: {'lr': 0.00014826666666666667, 'samples': 284960, 'steps': 556, 'loss/train': 3.2987263202667236} -09/20/2021 16:25:00 - INFO - __main__ - Step 8906: {'lr': 0.00014826666666666667, 'samples': 284992, 'steps': 556, 'loss/train': 4.883591175079346} -09/20/2021 16:25:01 - INFO - __main__ - Step 8907: {'lr': 0.00014826666666666667, 'samples': 285024, 'steps': 556, 'loss/train': 5.637696743011475} -09/20/2021 16:25:01 - INFO - __main__ - Step 8908: {'lr': 0.00014826666666666667, 'samples': 285056, 'steps': 556, 'loss/train': 6.008407115936279} -09/20/2021 16:25:02 - INFO - __main__ - Step 8909: {'lr': 0.00014826666666666667, 'samples': 285088, 'steps': 556, 'loss/train': 4.302331924438477} -09/20/2021 16:25:03 - INFO - __main__ - Step 8910: {'lr': 0.00014826666666666667, 'samples': 285120, 'steps': 556, 'loss/train': 4.287882328033447} -09/20/2021 16:25:04 - INFO - __main__ - Step 8911: {'lr': 0.00014826666666666667, 'samples': 285152, 'steps': 556, 'loss/train': 4.656167984008789} -09/20/2021 16:25:04 - INFO - __main__ - Step 8912: {'lr': 0.00014826666666666667, 'samples': 285184, 'steps': 556, 'loss/train': 4.696371078491211} -09/20/2021 16:25:05 - INFO - __main__ - Step 8913: {'lr': 0.00014853333333333336, 'samples': 285216, 'steps': 557, 'loss/train': 4.042333126068115} -09/20/2021 16:25:06 - INFO - __main__ - Step 8914: {'lr': 0.00014853333333333336, 'samples': 285248, 'steps': 557, 'loss/train': 4.816390514373779} -09/20/2021 16:25:07 - INFO - __main__ - Step 8915: {'lr': 0.00014853333333333336, 'samples': 285280, 'steps': 557, 'loss/train': 4.708370685577393} -09/20/2021 16:25:07 - INFO - __main__ - Step 8916: {'lr': 0.00014853333333333336, 'samples': 285312, 'steps': 557, 'loss/train': 4.239195346832275} -09/20/2021 16:25:08 - INFO - __main__ - Step 8917: {'lr': 0.00014853333333333336, 'samples': 285344, 'steps': 557, 'loss/train': 5.213936805725098} -09/20/2021 16:25:09 - INFO - __main__ - Step 8918: {'lr': 0.00014853333333333336, 'samples': 285376, 'steps': 557, 'loss/train': 4.4443159103393555} -09/20/2021 16:25:10 - INFO - __main__ - Step 8919: {'lr': 0.00014853333333333336, 'samples': 285408, 'steps': 557, 'loss/train': 4.31545352935791} -09/20/2021 16:25:10 - INFO - __main__ - Step 8920: {'lr': 0.00014853333333333336, 'samples': 285440, 'steps': 557, 'loss/train': 4.975985527038574} -09/20/2021 16:25:11 - INFO - __main__ - Step 8921: {'lr': 0.00014853333333333336, 'samples': 285472, 'steps': 557, 'loss/train': 4.830899238586426} -09/20/2021 16:25:12 - INFO - __main__ - Step 8922: {'lr': 0.00014853333333333336, 'samples': 285504, 'steps': 557, 'loss/train': 4.677197456359863} -09/20/2021 16:25:13 - INFO - __main__ - Step 8923: {'lr': 0.00014853333333333336, 'samples': 285536, 'steps': 557, 'loss/train': 4.373424053192139} -09/20/2021 16:25:13 - INFO - __main__ - Step 8924: {'lr': 0.00014853333333333336, 'samples': 285568, 'steps': 557, 'loss/train': 4.019127368927002} -09/20/2021 16:25:14 - INFO - __main__ - Step 8925: {'lr': 0.00014853333333333336, 'samples': 285600, 'steps': 557, 'loss/train': 3.6345536708831787} -09/20/2021 16:25:15 - INFO - __main__ - Step 8926: {'lr': 0.00014853333333333336, 'samples': 285632, 'steps': 557, 'loss/train': 4.736710071563721} -09/20/2021 16:25:16 - INFO - __main__ - Step 8927: {'lr': 0.00014853333333333336, 'samples': 285664, 'steps': 557, 'loss/train': 5.234403133392334} -09/20/2021 16:25:16 - INFO - __main__ - Step 8928: {'lr': 0.00014853333333333336, 'samples': 285696, 'steps': 557, 'loss/train': 5.497607707977295} -09/20/2021 16:25:18 - INFO - __main__ - Step 8929: {'lr': 0.0001488, 'samples': 285728, 'steps': 558, 'loss/train': 5.849778175354004} -09/20/2021 16:25:19 - INFO - __main__ - Step 8930: {'lr': 0.0001488, 'samples': 285760, 'steps': 558, 'loss/train': 4.4334893226623535} -09/20/2021 16:25:20 - INFO - __main__ - Step 8931: {'lr': 0.0001488, 'samples': 285792, 'steps': 558, 'loss/train': 4.480081558227539} -09/20/2021 16:25:20 - INFO - __main__ - Step 8932: {'lr': 0.0001488, 'samples': 285824, 'steps': 558, 'loss/train': 3.770507335662842} -09/20/2021 16:25:21 - INFO - __main__ - Step 8933: {'lr': 0.0001488, 'samples': 285856, 'steps': 558, 'loss/train': 5.101506233215332} -09/20/2021 16:25:22 - INFO - __main__ - Step 8934: {'lr': 0.0001488, 'samples': 285888, 'steps': 558, 'loss/train': 3.9207866191864014} -09/20/2021 16:25:23 - INFO - __main__ - Step 8935: {'lr': 0.0001488, 'samples': 285920, 'steps': 558, 'loss/train': 4.676867961883545} -09/20/2021 16:25:23 - INFO - __main__ - Step 8936: {'lr': 0.0001488, 'samples': 285952, 'steps': 558, 'loss/train': 4.636864185333252} -09/20/2021 16:25:24 - INFO - __main__ - Step 8937: {'lr': 0.0001488, 'samples': 285984, 'steps': 558, 'loss/train': 4.762354850769043} -09/20/2021 16:25:25 - INFO - __main__ - Step 8938: {'lr': 0.0001488, 'samples': 286016, 'steps': 558, 'loss/train': 4.2668681144714355} -09/20/2021 16:25:26 - INFO - __main__ - Step 8939: {'lr': 0.0001488, 'samples': 286048, 'steps': 558, 'loss/train': 3.9255621433258057} -09/20/2021 16:25:26 - INFO - __main__ - Step 8940: {'lr': 0.0001488, 'samples': 286080, 'steps': 558, 'loss/train': 4.25423002243042} -09/20/2021 16:25:27 - INFO - __main__ - Step 8941: {'lr': 0.0001488, 'samples': 286112, 'steps': 558, 'loss/train': 4.022226333618164} -09/20/2021 16:25:28 - INFO - __main__ - Step 8942: {'lr': 0.0001488, 'samples': 286144, 'steps': 558, 'loss/train': 4.323972702026367} -09/20/2021 16:25:29 - INFO - __main__ - Step 8943: {'lr': 0.0001488, 'samples': 286176, 'steps': 558, 'loss/train': 3.9924380779266357} -09/20/2021 16:25:29 - INFO - __main__ - Step 8944: {'lr': 0.0001488, 'samples': 286208, 'steps': 558, 'loss/train': 5.497575759887695} -09/20/2021 16:25:30 - INFO - __main__ - Step 8945: {'lr': 0.00014906666666666667, 'samples': 286240, 'steps': 559, 'loss/train': 3.9447543621063232} -09/20/2021 16:25:31 - INFO - __main__ - Step 8946: {'lr': 0.00014906666666666667, 'samples': 286272, 'steps': 559, 'loss/train': 4.389220237731934} -09/20/2021 16:25:32 - INFO - __main__ - Step 8947: {'lr': 0.00014906666666666667, 'samples': 286304, 'steps': 559, 'loss/train': 4.519771099090576} -09/20/2021 16:25:32 - INFO - __main__ - Step 8948: {'lr': 0.00014906666666666667, 'samples': 286336, 'steps': 559, 'loss/train': 4.0947184562683105} -09/20/2021 16:25:33 - INFO - __main__ - Step 8949: {'lr': 0.00014906666666666667, 'samples': 286368, 'steps': 559, 'loss/train': 4.223812580108643} -09/20/2021 16:25:34 - INFO - __main__ - Step 8950: {'lr': 0.00014906666666666667, 'samples': 286400, 'steps': 559, 'loss/train': 5.695662021636963} -09/20/2021 16:25:35 - INFO - __main__ - Step 8951: {'lr': 0.00014906666666666667, 'samples': 286432, 'steps': 559, 'loss/train': 5.92924690246582} -09/20/2021 16:25:35 - INFO - __main__ - Step 8952: {'lr': 0.00014906666666666667, 'samples': 286464, 'steps': 559, 'loss/train': 6.783718585968018} -09/20/2021 16:25:36 - INFO - __main__ - Step 8953: {'lr': 0.00014906666666666667, 'samples': 286496, 'steps': 559, 'loss/train': 6.956021308898926} -09/20/2021 16:25:37 - INFO - __main__ - Step 8954: {'lr': 0.00014906666666666667, 'samples': 286528, 'steps': 559, 'loss/train': 4.327691078186035} -09/20/2021 16:25:38 - INFO - __main__ - Step 8955: {'lr': 0.00014906666666666667, 'samples': 286560, 'steps': 559, 'loss/train': 4.489360809326172} -09/20/2021 16:25:38 - INFO - __main__ - Step 8956: {'lr': 0.00014906666666666667, 'samples': 286592, 'steps': 559, 'loss/train': 3.7648282051086426} -09/20/2021 16:25:39 - INFO - __main__ - Step 8957: {'lr': 0.00014906666666666667, 'samples': 286624, 'steps': 559, 'loss/train': 4.571831226348877} -09/20/2021 16:25:40 - INFO - __main__ - Step 8958: {'lr': 0.00014906666666666667, 'samples': 286656, 'steps': 559, 'loss/train': 4.535499095916748} -09/20/2021 16:25:41 - INFO - __main__ - Step 8959: {'lr': 0.00014906666666666667, 'samples': 286688, 'steps': 559, 'loss/train': 5.544300079345703} -09/20/2021 16:25:41 - INFO - __main__ - Step 8960: {'lr': 0.00014906666666666667, 'samples': 286720, 'steps': 559, 'loss/train': 4.387077808380127} -09/20/2021 16:25:43 - INFO - __main__ - Step 8961: {'lr': 0.00014933333333333335, 'samples': 286752, 'steps': 560, 'loss/train': 4.593481063842773} -09/20/2021 16:25:44 - INFO - __main__ - Step 8962: {'lr': 0.00014933333333333335, 'samples': 286784, 'steps': 560, 'loss/train': 4.1729607582092285} -09/20/2021 16:25:44 - INFO - __main__ - Step 8963: {'lr': 0.00014933333333333335, 'samples': 286816, 'steps': 560, 'loss/train': 6.710936069488525} -09/20/2021 16:25:45 - INFO - __main__ - Step 8964: {'lr': 0.00014933333333333335, 'samples': 286848, 'steps': 560, 'loss/train': 5.350627422332764} -09/20/2021 16:25:46 - INFO - __main__ - Step 8965: {'lr': 0.00014933333333333335, 'samples': 286880, 'steps': 560, 'loss/train': 5.441590785980225} -09/20/2021 16:25:47 - INFO - __main__ - Step 8966: {'lr': 0.00014933333333333335, 'samples': 286912, 'steps': 560, 'loss/train': 4.498012542724609} -09/20/2021 16:25:47 - INFO - __main__ - Step 8967: {'lr': 0.00014933333333333335, 'samples': 286944, 'steps': 560, 'loss/train': 3.573446273803711} -09/20/2021 16:25:48 - INFO - __main__ - Step 8968: {'lr': 0.00014933333333333335, 'samples': 286976, 'steps': 560, 'loss/train': 4.730489253997803} -09/20/2021 16:25:49 - INFO - __main__ - Step 8969: {'lr': 0.00014933333333333335, 'samples': 287008, 'steps': 560, 'loss/train': 5.011415958404541} -09/20/2021 16:25:50 - INFO - __main__ - Step 8970: {'lr': 0.00014933333333333335, 'samples': 287040, 'steps': 560, 'loss/train': 4.626043319702148} -09/20/2021 16:25:50 - INFO - __main__ - Step 8971: {'lr': 0.00014933333333333335, 'samples': 287072, 'steps': 560, 'loss/train': 4.087464809417725} -09/20/2021 16:25:51 - INFO - __main__ - Step 8972: {'lr': 0.00014933333333333335, 'samples': 287104, 'steps': 560, 'loss/train': 3.6785457134246826} -09/20/2021 16:25:52 - INFO - __main__ - Step 8973: {'lr': 0.00014933333333333335, 'samples': 287136, 'steps': 560, 'loss/train': 6.297886848449707} -09/20/2021 16:25:53 - INFO - __main__ - Step 8974: {'lr': 0.00014933333333333335, 'samples': 287168, 'steps': 560, 'loss/train': 4.428475856781006} -09/20/2021 16:25:53 - INFO - __main__ - Step 8975: {'lr': 0.00014933333333333335, 'samples': 287200, 'steps': 560, 'loss/train': 4.115301132202148} -09/20/2021 16:25:54 - INFO - __main__ - Step 8976: {'lr': 0.00014933333333333335, 'samples': 287232, 'steps': 560, 'loss/train': 4.578052043914795} -09/20/2021 16:25:55 - INFO - __main__ - Step 8977: {'lr': 0.0001496, 'samples': 287264, 'steps': 561, 'loss/train': 4.285655975341797} -09/20/2021 16:25:56 - INFO - __main__ - Step 8978: {'lr': 0.0001496, 'samples': 287296, 'steps': 561, 'loss/train': 5.208923816680908} -09/20/2021 16:25:57 - INFO - __main__ - Step 8979: {'lr': 0.0001496, 'samples': 287328, 'steps': 561, 'loss/train': 5.492185592651367} -09/20/2021 16:25:57 - INFO - __main__ - Step 8980: {'lr': 0.0001496, 'samples': 287360, 'steps': 561, 'loss/train': 5.246953010559082} -09/20/2021 16:25:58 - INFO - __main__ - Step 8981: {'lr': 0.0001496, 'samples': 287392, 'steps': 561, 'loss/train': 5.135563850402832} -09/20/2021 16:25:59 - INFO - __main__ - Step 8982: {'lr': 0.0001496, 'samples': 287424, 'steps': 561, 'loss/train': 4.079859256744385} -09/20/2021 16:26:00 - INFO - __main__ - Step 8983: {'lr': 0.0001496, 'samples': 287456, 'steps': 561, 'loss/train': 5.013972759246826} -09/20/2021 16:26:00 - INFO - __main__ - Step 8984: {'lr': 0.0001496, 'samples': 287488, 'steps': 561, 'loss/train': 4.013101577758789} -09/20/2021 16:26:01 - INFO - __main__ - Step 8985: {'lr': 0.0001496, 'samples': 287520, 'steps': 561, 'loss/train': 5.059783935546875} -09/20/2021 16:26:02 - INFO - __main__ - Step 8986: {'lr': 0.0001496, 'samples': 287552, 'steps': 561, 'loss/train': 4.437124729156494} -09/20/2021 16:26:03 - INFO - __main__ - Step 8987: {'lr': 0.0001496, 'samples': 287584, 'steps': 561, 'loss/train': 4.833842754364014} -09/20/2021 16:26:03 - INFO - __main__ - Step 8988: {'lr': 0.0001496, 'samples': 287616, 'steps': 561, 'loss/train': 4.725543022155762} -09/20/2021 16:26:04 - INFO - __main__ - Step 8989: {'lr': 0.0001496, 'samples': 287648, 'steps': 561, 'loss/train': 5.020447731018066} -09/20/2021 16:26:05 - INFO - __main__ - Step 8990: {'lr': 0.0001496, 'samples': 287680, 'steps': 561, 'loss/train': 4.710484981536865} -09/20/2021 16:26:06 - INFO - __main__ - Step 8991: {'lr': 0.0001496, 'samples': 287712, 'steps': 561, 'loss/train': 5.5542731285095215} -09/20/2021 16:26:07 - INFO - __main__ - Step 8992: {'lr': 0.0001496, 'samples': 287744, 'steps': 561, 'loss/train': 4.557441711425781} -09/20/2021 16:26:08 - INFO - __main__ - Step 8993: {'lr': 0.00014986666666666666, 'samples': 287776, 'steps': 562, 'loss/train': 5.231557369232178} -09/20/2021 16:26:09 - INFO - __main__ - Step 8994: {'lr': 0.00014986666666666666, 'samples': 287808, 'steps': 562, 'loss/train': 5.13483190536499} -09/20/2021 16:26:10 - INFO - __main__ - Step 8995: {'lr': 0.00014986666666666666, 'samples': 287840, 'steps': 562, 'loss/train': 3.793208360671997} -09/20/2021 16:26:11 - INFO - __main__ - Step 8996: {'lr': 0.00014986666666666666, 'samples': 287872, 'steps': 562, 'loss/train': 6.944189071655273} -09/20/2021 16:26:11 - INFO - __main__ - Step 8997: {'lr': 0.00014986666666666666, 'samples': 287904, 'steps': 562, 'loss/train': 3.8661949634552} -09/20/2021 16:26:12 - INFO - __main__ - Step 8998: {'lr': 0.00014986666666666666, 'samples': 287936, 'steps': 562, 'loss/train': 3.83553409576416} -09/20/2021 16:26:13 - INFO - __main__ - Step 8999: {'lr': 0.00014986666666666666, 'samples': 287968, 'steps': 562, 'loss/train': 4.670082092285156} -09/20/2021 16:26:14 - INFO - __main__ - Step 9000: {'lr': 0.00014986666666666666, 'samples': 288000, 'steps': 562, 'loss/train': 4.934453964233398} -09/20/2021 16:26:14 - INFO - __main__ - Step 9001: {'lr': 0.00014986666666666666, 'samples': 288032, 'steps': 562, 'loss/train': 4.896987438201904} -09/20/2021 16:26:15 - INFO - __main__ - Step 9002: {'lr': 0.00014986666666666666, 'samples': 288064, 'steps': 562, 'loss/train': 4.082223415374756} -09/20/2021 16:26:16 - INFO - __main__ - Step 9003: {'lr': 0.00014986666666666666, 'samples': 288096, 'steps': 562, 'loss/train': 4.853804588317871} -09/20/2021 16:26:17 - INFO - __main__ - Step 9004: {'lr': 0.00014986666666666666, 'samples': 288128, 'steps': 562, 'loss/train': 4.5594868659973145} -09/20/2021 16:26:17 - INFO - __main__ - Step 9005: {'lr': 0.00014986666666666666, 'samples': 288160, 'steps': 562, 'loss/train': 6.696537494659424} -09/20/2021 16:26:18 - INFO - __main__ - Step 9006: {'lr': 0.00014986666666666666, 'samples': 288192, 'steps': 562, 'loss/train': 2.9996602535247803} -09/20/2021 16:26:19 - INFO - __main__ - Step 9007: {'lr': 0.00014986666666666666, 'samples': 288224, 'steps': 562, 'loss/train': 4.743773460388184} -09/20/2021 16:26:20 - INFO - __main__ - Step 9008: {'lr': 0.00014986666666666666, 'samples': 288256, 'steps': 562, 'loss/train': 3.9956979751586914} -09/20/2021 16:26:21 - INFO - __main__ - Step 9009: {'lr': 0.00015013333333333334, 'samples': 288288, 'steps': 563, 'loss/train': 5.118213653564453} -09/20/2021 16:26:21 - INFO - __main__ - Step 9010: {'lr': 0.00015013333333333334, 'samples': 288320, 'steps': 563, 'loss/train': 5.013390064239502} -09/20/2021 16:26:22 - INFO - __main__ - Step 9011: {'lr': 0.00015013333333333334, 'samples': 288352, 'steps': 563, 'loss/train': 4.685291767120361} -09/20/2021 16:26:23 - INFO - __main__ - Step 9012: {'lr': 0.00015013333333333334, 'samples': 288384, 'steps': 563, 'loss/train': 5.156056880950928} -09/20/2021 16:26:24 - INFO - __main__ - Step 9013: {'lr': 0.00015013333333333334, 'samples': 288416, 'steps': 563, 'loss/train': 5.4762115478515625} -09/20/2021 16:26:24 - INFO - __main__ - Step 9014: {'lr': 0.00015013333333333334, 'samples': 288448, 'steps': 563, 'loss/train': 5.332608222961426} -09/20/2021 16:26:25 - INFO - __main__ - Step 9015: {'lr': 0.00015013333333333334, 'samples': 288480, 'steps': 563, 'loss/train': 3.915803909301758} -09/20/2021 16:26:26 - INFO - __main__ - Step 9016: {'lr': 0.00015013333333333334, 'samples': 288512, 'steps': 563, 'loss/train': 5.44727087020874} -09/20/2021 16:26:27 - INFO - __main__ - Step 9017: {'lr': 0.00015013333333333334, 'samples': 288544, 'steps': 563, 'loss/train': 4.799777030944824} -09/20/2021 16:26:27 - INFO - __main__ - Step 9018: {'lr': 0.00015013333333333334, 'samples': 288576, 'steps': 563, 'loss/train': 5.1971049308776855} -09/20/2021 16:26:28 - INFO - __main__ - Step 9019: {'lr': 0.00015013333333333334, 'samples': 288608, 'steps': 563, 'loss/train': 5.490307807922363} -09/20/2021 16:26:29 - INFO - __main__ - Step 9020: {'lr': 0.00015013333333333334, 'samples': 288640, 'steps': 563, 'loss/train': 5.452126979827881} -09/20/2021 16:26:30 - INFO - __main__ - Step 9021: {'lr': 0.00015013333333333334, 'samples': 288672, 'steps': 563, 'loss/train': 5.727464199066162} -09/20/2021 16:26:30 - INFO - __main__ - Step 9022: {'lr': 0.00015013333333333334, 'samples': 288704, 'steps': 563, 'loss/train': 5.478640079498291} -09/20/2021 16:26:31 - INFO - __main__ - Step 9023: {'lr': 0.00015013333333333334, 'samples': 288736, 'steps': 563, 'loss/train': 4.819941997528076} -09/20/2021 16:26:32 - INFO - __main__ - Step 9024: {'lr': 0.00015013333333333334, 'samples': 288768, 'steps': 563, 'loss/train': 4.633225917816162} -09/20/2021 16:26:33 - INFO - __main__ - Step 9025: {'lr': 0.0001504, 'samples': 288800, 'steps': 564, 'loss/train': 4.778414726257324} -09/20/2021 16:26:34 - INFO - __main__ - Step 9026: {'lr': 0.0001504, 'samples': 288832, 'steps': 564, 'loss/train': 4.138031482696533} -09/20/2021 16:26:35 - INFO - __main__ - Step 9027: {'lr': 0.0001504, 'samples': 288864, 'steps': 564, 'loss/train': 6.475677490234375} -09/20/2021 16:26:35 - INFO - __main__ - Step 9028: {'lr': 0.0001504, 'samples': 288896, 'steps': 564, 'loss/train': 5.1414995193481445} -09/20/2021 16:26:36 - INFO - __main__ - Step 9029: {'lr': 0.0001504, 'samples': 288928, 'steps': 564, 'loss/train': 4.126130104064941} -09/20/2021 16:26:37 - INFO - __main__ - Step 9030: {'lr': 0.0001504, 'samples': 288960, 'steps': 564, 'loss/train': 5.119898319244385} -09/20/2021 16:26:38 - INFO - __main__ - Step 9031: {'lr': 0.0001504, 'samples': 288992, 'steps': 564, 'loss/train': 4.392092704772949} -09/20/2021 16:26:38 - INFO - __main__ - Step 9032: {'lr': 0.0001504, 'samples': 289024, 'steps': 564, 'loss/train': 4.8486552238464355} -09/20/2021 16:26:39 - INFO - __main__ - Step 9033: {'lr': 0.0001504, 'samples': 289056, 'steps': 564, 'loss/train': 5.083441257476807} -09/20/2021 16:26:40 - INFO - __main__ - Step 9034: {'lr': 0.0001504, 'samples': 289088, 'steps': 564, 'loss/train': 5.019015312194824} -09/20/2021 16:26:41 - INFO - __main__ - Step 9035: {'lr': 0.0001504, 'samples': 289120, 'steps': 564, 'loss/train': 3.794283151626587} -09/20/2021 16:26:41 - INFO - __main__ - Step 9036: {'lr': 0.0001504, 'samples': 289152, 'steps': 564, 'loss/train': 4.66428279876709} -09/20/2021 16:26:42 - INFO - __main__ - Step 9037: {'lr': 0.0001504, 'samples': 289184, 'steps': 564, 'loss/train': 5.002567291259766} -09/20/2021 16:26:43 - INFO - __main__ - Step 9038: {'lr': 0.0001504, 'samples': 289216, 'steps': 564, 'loss/train': 5.276716232299805} -09/20/2021 16:26:44 - INFO - __main__ - Step 9039: {'lr': 0.0001504, 'samples': 289248, 'steps': 564, 'loss/train': 4.460023880004883} -09/20/2021 16:26:44 - INFO - __main__ - Step 9040: {'lr': 0.0001504, 'samples': 289280, 'steps': 564, 'loss/train': 5.1807942390441895} -09/20/2021 16:26:45 - INFO - __main__ - Step 9041: {'lr': 0.00015066666666666668, 'samples': 289312, 'steps': 565, 'loss/train': 4.393383026123047} -09/20/2021 16:26:46 - INFO - __main__ - Step 9042: {'lr': 0.00015066666666666668, 'samples': 289344, 'steps': 565, 'loss/train': 3.578817844390869} -09/20/2021 16:26:47 - INFO - __main__ - Step 9043: {'lr': 0.00015066666666666668, 'samples': 289376, 'steps': 565, 'loss/train': 4.337860584259033} -09/20/2021 16:26:48 - INFO - __main__ - Step 9044: {'lr': 0.00015066666666666668, 'samples': 289408, 'steps': 565, 'loss/train': 4.313659191131592} -09/20/2021 16:26:48 - INFO - __main__ - Step 9045: {'lr': 0.00015066666666666668, 'samples': 289440, 'steps': 565, 'loss/train': 5.4129509925842285} -09/20/2021 16:26:49 - INFO - __main__ - Step 9046: {'lr': 0.00015066666666666668, 'samples': 289472, 'steps': 565, 'loss/train': 4.5570831298828125} -09/20/2021 16:26:50 - INFO - __main__ - Step 9047: {'lr': 0.00015066666666666668, 'samples': 289504, 'steps': 565, 'loss/train': 4.976776123046875} -09/20/2021 16:26:51 - INFO - __main__ - Step 9048: {'lr': 0.00015066666666666668, 'samples': 289536, 'steps': 565, 'loss/train': 5.347739219665527} -09/20/2021 16:26:51 - INFO - __main__ - Step 9049: {'lr': 0.00015066666666666668, 'samples': 289568, 'steps': 565, 'loss/train': 5.389187335968018} -09/20/2021 16:26:52 - INFO - __main__ - Step 9050: {'lr': 0.00015066666666666668, 'samples': 289600, 'steps': 565, 'loss/train': 4.505646705627441} -09/20/2021 16:26:53 - INFO - __main__ - Step 9051: {'lr': 0.00015066666666666668, 'samples': 289632, 'steps': 565, 'loss/train': 7.417154312133789} -09/20/2021 16:26:54 - INFO - __main__ - Step 9052: {'lr': 0.00015066666666666668, 'samples': 289664, 'steps': 565, 'loss/train': 4.368812084197998} -09/20/2021 16:26:54 - INFO - __main__ - Step 9053: {'lr': 0.00015066666666666668, 'samples': 289696, 'steps': 565, 'loss/train': 4.080253601074219} -09/20/2021 16:26:55 - INFO - __main__ - Step 9054: {'lr': 0.00015066666666666668, 'samples': 289728, 'steps': 565, 'loss/train': 4.671489238739014} -09/20/2021 16:26:56 - INFO - __main__ - Step 9055: {'lr': 0.00015066666666666668, 'samples': 289760, 'steps': 565, 'loss/train': 4.6614274978637695} -09/20/2021 16:26:57 - INFO - __main__ - Step 9056: {'lr': 0.00015066666666666668, 'samples': 289792, 'steps': 565, 'loss/train': 4.938296794891357} -09/20/2021 16:26:58 - INFO - __main__ - Step 9057: {'lr': 0.00015093333333333336, 'samples': 289824, 'steps': 566, 'loss/train': 5.771374702453613} -09/20/2021 16:26:59 - INFO - __main__ - Step 9058: {'lr': 0.00015093333333333336, 'samples': 289856, 'steps': 566, 'loss/train': 4.521754264831543} -09/20/2021 16:27:00 - INFO - __main__ - Step 9059: {'lr': 0.00015093333333333336, 'samples': 289888, 'steps': 566, 'loss/train': 4.559384822845459} -09/20/2021 16:27:00 - INFO - __main__ - Step 9060: {'lr': 0.00015093333333333336, 'samples': 289920, 'steps': 566, 'loss/train': 5.448829174041748} -09/20/2021 16:27:01 - INFO - __main__ - Step 9061: {'lr': 0.00015093333333333336, 'samples': 289952, 'steps': 566, 'loss/train': 4.2284674644470215} -09/20/2021 16:27:02 - INFO - __main__ - Step 9062: {'lr': 0.00015093333333333336, 'samples': 289984, 'steps': 566, 'loss/train': 5.894586563110352} -09/20/2021 16:27:03 - INFO - __main__ - Step 9063: {'lr': 0.00015093333333333336, 'samples': 290016, 'steps': 566, 'loss/train': 5.646424770355225} -09/20/2021 16:27:03 - INFO - __main__ - Step 9064: {'lr': 0.00015093333333333336, 'samples': 290048, 'steps': 566, 'loss/train': 5.145243167877197} -09/20/2021 16:27:04 - INFO - __main__ - Step 9065: {'lr': 0.00015093333333333336, 'samples': 290080, 'steps': 566, 'loss/train': 5.023890972137451} -09/20/2021 16:27:05 - INFO - __main__ - Step 9066: {'lr': 0.00015093333333333336, 'samples': 290112, 'steps': 566, 'loss/train': 5.717960834503174} -09/20/2021 16:27:06 - INFO - __main__ - Step 9067: {'lr': 0.00015093333333333336, 'samples': 290144, 'steps': 566, 'loss/train': 4.924016952514648} -09/20/2021 16:27:06 - INFO - __main__ - Step 9068: {'lr': 0.00015093333333333336, 'samples': 290176, 'steps': 566, 'loss/train': 4.879947185516357} -09/20/2021 16:27:07 - INFO - __main__ - Step 9069: {'lr': 0.00015093333333333336, 'samples': 290208, 'steps': 566, 'loss/train': 5.0303802490234375} -09/20/2021 16:27:08 - INFO - __main__ - Step 9070: {'lr': 0.00015093333333333336, 'samples': 290240, 'steps': 566, 'loss/train': 5.590702056884766} -09/20/2021 16:27:09 - INFO - __main__ - Step 9071: {'lr': 0.00015093333333333336, 'samples': 290272, 'steps': 566, 'loss/train': 4.316104888916016} -09/20/2021 16:27:09 - INFO - __main__ - Step 9072: {'lr': 0.00015093333333333336, 'samples': 290304, 'steps': 566, 'loss/train': 4.13482666015625} -09/20/2021 16:27:10 - INFO - __main__ - Step 9073: {'lr': 0.00015120000000000002, 'samples': 290336, 'steps': 567, 'loss/train': 3.196866750717163} -09/20/2021 16:27:11 - INFO - __main__ - Step 9074: {'lr': 0.00015120000000000002, 'samples': 290368, 'steps': 567, 'loss/train': 5.483702182769775} -09/20/2021 16:27:12 - INFO - __main__ - Step 9075: {'lr': 0.00015120000000000002, 'samples': 290400, 'steps': 567, 'loss/train': 4.989425182342529} -09/20/2021 16:27:13 - INFO - __main__ - Step 9076: {'lr': 0.00015120000000000002, 'samples': 290432, 'steps': 567, 'loss/train': 4.796413421630859} -09/20/2021 16:27:13 - INFO - __main__ - Step 9077: {'lr': 0.00015120000000000002, 'samples': 290464, 'steps': 567, 'loss/train': 3.8276450634002686} -09/20/2021 16:27:14 - INFO - __main__ - Step 9078: {'lr': 0.00015120000000000002, 'samples': 290496, 'steps': 567, 'loss/train': 5.409974098205566} -09/20/2021 16:27:15 - INFO - __main__ - Step 9079: {'lr': 0.00015120000000000002, 'samples': 290528, 'steps': 567, 'loss/train': 4.725115776062012} -09/20/2021 16:27:16 - INFO - __main__ - Step 9080: {'lr': 0.00015120000000000002, 'samples': 290560, 'steps': 567, 'loss/train': 3.74096941947937} -09/20/2021 16:27:16 - INFO - __main__ - Step 9081: {'lr': 0.00015120000000000002, 'samples': 290592, 'steps': 567, 'loss/train': 5.248816013336182} -09/20/2021 16:27:17 - INFO - __main__ - Step 9082: {'lr': 0.00015120000000000002, 'samples': 290624, 'steps': 567, 'loss/train': 6.267171382904053} -09/20/2021 16:27:18 - INFO - __main__ - Step 9083: {'lr': 0.00015120000000000002, 'samples': 290656, 'steps': 567, 'loss/train': 4.3265275955200195} -09/20/2021 16:27:19 - INFO - __main__ - Step 9084: {'lr': 0.00015120000000000002, 'samples': 290688, 'steps': 567, 'loss/train': 4.255473613739014} -09/20/2021 16:27:19 - INFO - __main__ - Step 9085: {'lr': 0.00015120000000000002, 'samples': 290720, 'steps': 567, 'loss/train': 3.6437294483184814} -09/20/2021 16:27:21 - INFO - __main__ - Step 9086: {'lr': 0.00015120000000000002, 'samples': 290752, 'steps': 567, 'loss/train': 4.512482643127441} -09/20/2021 16:27:21 - INFO - __main__ - Step 9087: {'lr': 0.00015120000000000002, 'samples': 290784, 'steps': 567, 'loss/train': 4.474266052246094} -09/20/2021 16:27:22 - INFO - __main__ - Step 9088: {'lr': 0.00015120000000000002, 'samples': 290816, 'steps': 567, 'loss/train': 4.921911239624023} -09/20/2021 16:27:23 - INFO - __main__ - Step 9089: {'lr': 0.00015146666666666667, 'samples': 290848, 'steps': 568, 'loss/train': 2.4088618755340576} -09/20/2021 16:27:24 - INFO - __main__ - Step 9090: {'lr': 0.00015146666666666667, 'samples': 290880, 'steps': 568, 'loss/train': 2.6613235473632812} -09/20/2021 16:27:25 - INFO - __main__ - Step 9091: {'lr': 0.00015146666666666667, 'samples': 290912, 'steps': 568, 'loss/train': 2.8152482509613037} -09/20/2021 16:27:25 - INFO - __main__ - Step 9092: {'lr': 0.00015146666666666667, 'samples': 290944, 'steps': 568, 'loss/train': 4.393636226654053} -09/20/2021 16:27:26 - INFO - __main__ - Step 9093: {'lr': 0.00015146666666666667, 'samples': 290976, 'steps': 568, 'loss/train': 4.493373870849609} -09/20/2021 16:27:27 - INFO - __main__ - Step 9094: {'lr': 0.00015146666666666667, 'samples': 291008, 'steps': 568, 'loss/train': 4.625870704650879} -09/20/2021 16:27:28 - INFO - __main__ - Step 9095: {'lr': 0.00015146666666666667, 'samples': 291040, 'steps': 568, 'loss/train': 4.610742568969727} -09/20/2021 16:27:28 - INFO - __main__ - Step 9096: {'lr': 0.00015146666666666667, 'samples': 291072, 'steps': 568, 'loss/train': 5.361894130706787} -09/20/2021 16:27:29 - INFO - __main__ - Step 9097: {'lr': 0.00015146666666666667, 'samples': 291104, 'steps': 568, 'loss/train': 5.100122451782227} -09/20/2021 16:27:30 - INFO - __main__ - Step 9098: {'lr': 0.00015146666666666667, 'samples': 291136, 'steps': 568, 'loss/train': 4.198818206787109} -09/20/2021 16:27:31 - INFO - __main__ - Step 9099: {'lr': 0.00015146666666666667, 'samples': 291168, 'steps': 568, 'loss/train': 5.156449317932129} -09/20/2021 16:27:31 - INFO - __main__ - Step 9100: {'lr': 0.00015146666666666667, 'samples': 291200, 'steps': 568, 'loss/train': 5.231218338012695} -09/20/2021 16:27:32 - INFO - __main__ - Step 9101: {'lr': 0.00015146666666666667, 'samples': 291232, 'steps': 568, 'loss/train': 5.067554473876953} -09/20/2021 16:27:33 - INFO - __main__ - Step 9102: {'lr': 0.00015146666666666667, 'samples': 291264, 'steps': 568, 'loss/train': 4.718170166015625} -09/20/2021 16:27:34 - INFO - __main__ - Step 9103: {'lr': 0.00015146666666666667, 'samples': 291296, 'steps': 568, 'loss/train': 5.413739204406738} -09/20/2021 16:27:34 - INFO - __main__ - Step 9104: {'lr': 0.00015146666666666667, 'samples': 291328, 'steps': 568, 'loss/train': 4.099078178405762} -09/20/2021 16:27:35 - INFO - __main__ - Step 9105: {'lr': 0.00015173333333333335, 'samples': 291360, 'steps': 569, 'loss/train': 4.253979682922363} -09/20/2021 16:27:36 - INFO - __main__ - Step 9106: {'lr': 0.00015173333333333335, 'samples': 291392, 'steps': 569, 'loss/train': 3.0339410305023193} -09/20/2021 16:27:37 - INFO - __main__ - Step 9107: {'lr': 0.00015173333333333335, 'samples': 291424, 'steps': 569, 'loss/train': 4.410273551940918} -09/20/2021 16:27:37 - INFO - __main__ - Step 9108: {'lr': 0.00015173333333333335, 'samples': 291456, 'steps': 569, 'loss/train': 4.4545769691467285} -09/20/2021 16:27:38 - INFO - __main__ - Step 9109: {'lr': 0.00015173333333333335, 'samples': 291488, 'steps': 569, 'loss/train': 5.7941975593566895} -09/20/2021 16:27:39 - INFO - __main__ - Step 9110: {'lr': 0.00015173333333333335, 'samples': 291520, 'steps': 569, 'loss/train': 6.388078689575195} -09/20/2021 16:27:40 - INFO - __main__ - Step 9111: {'lr': 0.00015173333333333335, 'samples': 291552, 'steps': 569, 'loss/train': 4.0374956130981445} -09/20/2021 16:27:40 - INFO - __main__ - Step 9112: {'lr': 0.00015173333333333335, 'samples': 291584, 'steps': 569, 'loss/train': 5.138455867767334} -09/20/2021 16:27:41 - INFO - __main__ - Step 9113: {'lr': 0.00015173333333333335, 'samples': 291616, 'steps': 569, 'loss/train': 4.512075424194336} -09/20/2021 16:27:42 - INFO - __main__ - Step 9114: {'lr': 0.00015173333333333335, 'samples': 291648, 'steps': 569, 'loss/train': 4.2480926513671875} -09/20/2021 16:27:43 - INFO - __main__ - Step 9115: {'lr': 0.00015173333333333335, 'samples': 291680, 'steps': 569, 'loss/train': 4.613826751708984} -09/20/2021 16:27:43 - INFO - __main__ - Step 9116: {'lr': 0.00015173333333333335, 'samples': 291712, 'steps': 569, 'loss/train': 3.918207883834839} -09/20/2021 16:27:45 - INFO - __main__ - Step 9117: {'lr': 0.00015173333333333335, 'samples': 291744, 'steps': 569, 'loss/train': 1.8126277923583984} -09/20/2021 16:27:46 - INFO - __main__ - Step 9118: {'lr': 0.00015173333333333335, 'samples': 291776, 'steps': 569, 'loss/train': 4.817266464233398} -09/20/2021 16:27:47 - INFO - __main__ - Step 9119: {'lr': 0.00015173333333333335, 'samples': 291808, 'steps': 569, 'loss/train': 5.122084140777588} -09/20/2021 16:27:47 - INFO - __main__ - Step 9120: {'lr': 0.00015173333333333335, 'samples': 291840, 'steps': 569, 'loss/train': 5.462210178375244} -09/20/2021 16:27:48 - INFO - __main__ - Step 9121: {'lr': 0.000152, 'samples': 291872, 'steps': 570, 'loss/train': 4.655221462249756} -09/20/2021 16:27:49 - INFO - __main__ - Step 9122: {'lr': 0.000152, 'samples': 291904, 'steps': 570, 'loss/train': 4.2313232421875} -09/20/2021 16:27:50 - INFO - __main__ - Step 9123: {'lr': 0.000152, 'samples': 291936, 'steps': 570, 'loss/train': 4.829582214355469} -09/20/2021 16:27:50 - INFO - __main__ - Step 9124: {'lr': 0.000152, 'samples': 291968, 'steps': 570, 'loss/train': 4.948061943054199} -09/20/2021 16:27:51 - INFO - __main__ - Step 9125: {'lr': 0.000152, 'samples': 292000, 'steps': 570, 'loss/train': 3.469315528869629} -09/20/2021 16:27:52 - INFO - __main__ - Step 9126: {'lr': 0.000152, 'samples': 292032, 'steps': 570, 'loss/train': 4.477141857147217} -09/20/2021 16:27:53 - INFO - __main__ - Step 9127: {'lr': 0.000152, 'samples': 292064, 'steps': 570, 'loss/train': 0.5420833230018616} -09/20/2021 16:27:53 - INFO - __main__ - Step 9128: {'lr': 0.000152, 'samples': 292096, 'steps': 570, 'loss/train': 4.810525894165039} -09/20/2021 16:27:54 - INFO - __main__ - Step 9129: {'lr': 0.000152, 'samples': 292128, 'steps': 570, 'loss/train': 4.455426216125488} -09/20/2021 16:27:55 - INFO - __main__ - Step 9130: {'lr': 0.000152, 'samples': 292160, 'steps': 570, 'loss/train': 4.569716930389404} -09/20/2021 16:27:56 - INFO - __main__ - Step 9131: {'lr': 0.000152, 'samples': 292192, 'steps': 570, 'loss/train': 4.350915908813477} -09/20/2021 16:27:56 - INFO - __main__ - Step 9132: {'lr': 0.000152, 'samples': 292224, 'steps': 570, 'loss/train': 3.450169563293457} -09/20/2021 16:27:57 - INFO - __main__ - Step 9133: {'lr': 0.000152, 'samples': 292256, 'steps': 570, 'loss/train': 5.209268093109131} -09/20/2021 16:27:58 - INFO - __main__ - Step 9134: {'lr': 0.000152, 'samples': 292288, 'steps': 570, 'loss/train': 4.4221110343933105} -09/20/2021 16:27:59 - INFO - __main__ - Step 9135: {'lr': 0.000152, 'samples': 292320, 'steps': 570, 'loss/train': 1.9936856031417847} -09/20/2021 16:27:59 - INFO - __main__ - Step 9136: {'lr': 0.000152, 'samples': 292352, 'steps': 570, 'loss/train': 2.4867706298828125} -09/20/2021 16:28:00 - INFO - __main__ - Step 9137: {'lr': 0.00015226666666666666, 'samples': 292384, 'steps': 571, 'loss/train': 2.042292356491089} -09/20/2021 16:28:01 - INFO - __main__ - Step 9138: {'lr': 0.00015226666666666666, 'samples': 292416, 'steps': 571, 'loss/train': 1.8129947185516357} -09/20/2021 16:28:02 - INFO - __main__ - Step 9139: {'lr': 0.00015226666666666666, 'samples': 292448, 'steps': 571, 'loss/train': 3.263899803161621} -09/20/2021 16:28:03 - INFO - __main__ - Step 9140: {'lr': 0.00015226666666666666, 'samples': 292480, 'steps': 571, 'loss/train': 4.957621097564697} -09/20/2021 16:28:03 - INFO - __main__ - Step 9141: {'lr': 0.00015226666666666666, 'samples': 292512, 'steps': 571, 'loss/train': 4.867433071136475} -09/20/2021 16:28:04 - INFO - __main__ - Step 9142: {'lr': 0.00015226666666666666, 'samples': 292544, 'steps': 571, 'loss/train': 3.694397449493408} -09/20/2021 16:28:05 - INFO - __main__ - Step 9143: {'lr': 0.00015226666666666666, 'samples': 292576, 'steps': 571, 'loss/train': 4.793525695800781} -09/20/2021 16:28:06 - INFO - __main__ - Step 9144: {'lr': 0.00015226666666666666, 'samples': 292608, 'steps': 571, 'loss/train': 4.63333797454834} -09/20/2021 16:28:06 - INFO - __main__ - Step 9145: {'lr': 0.00015226666666666666, 'samples': 292640, 'steps': 571, 'loss/train': 4.639909744262695} -09/20/2021 16:28:07 - INFO - __main__ - Step 9146: {'lr': 0.00015226666666666666, 'samples': 292672, 'steps': 571, 'loss/train': 4.169002056121826} -09/20/2021 16:28:08 - INFO - __main__ - Step 9147: {'lr': 0.00015226666666666666, 'samples': 292704, 'steps': 571, 'loss/train': 5.9874138832092285} -09/20/2021 16:28:09 - INFO - __main__ - Step 9148: {'lr': 0.00015226666666666666, 'samples': 292736, 'steps': 571, 'loss/train': 3.941406011581421} -09/20/2021 16:28:10 - INFO - __main__ - Step 9149: {'lr': 0.00015226666666666666, 'samples': 292768, 'steps': 571, 'loss/train': 3.5811264514923096} -09/20/2021 16:28:11 - INFO - __main__ - Step 9150: {'lr': 0.00015226666666666666, 'samples': 292800, 'steps': 571, 'loss/train': 5.939342498779297} -09/20/2021 16:28:11 - INFO - __main__ - Step 9151: {'lr': 0.00015226666666666666, 'samples': 292832, 'steps': 571, 'loss/train': 3.8020074367523193} -09/20/2021 16:28:12 - INFO - __main__ - Step 9152: {'lr': 0.00015226666666666666, 'samples': 292864, 'steps': 571, 'loss/train': 5.742222785949707} -09/20/2021 16:28:13 - INFO - __main__ - Step 9153: {'lr': 0.00015253333333333335, 'samples': 292896, 'steps': 572, 'loss/train': 4.252342700958252} -09/20/2021 16:28:14 - INFO - __main__ - Step 9154: {'lr': 0.00015253333333333335, 'samples': 292928, 'steps': 572, 'loss/train': 4.815310001373291} -09/20/2021 16:28:15 - INFO - __main__ - Step 9155: {'lr': 0.00015253333333333335, 'samples': 292960, 'steps': 572, 'loss/train': 4.39493465423584} -09/20/2021 16:28:15 - INFO - __main__ - Step 9156: {'lr': 0.00015253333333333335, 'samples': 292992, 'steps': 572, 'loss/train': 4.455371379852295} -09/20/2021 16:28:16 - INFO - __main__ - Step 9157: {'lr': 0.00015253333333333335, 'samples': 293024, 'steps': 572, 'loss/train': 4.37715482711792} -09/20/2021 16:28:17 - INFO - __main__ - Step 9158: {'lr': 0.00015253333333333335, 'samples': 293056, 'steps': 572, 'loss/train': 4.411403179168701} -09/20/2021 16:28:18 - INFO - __main__ - Step 9159: {'lr': 0.00015253333333333335, 'samples': 293088, 'steps': 572, 'loss/train': 4.890551567077637} -09/20/2021 16:28:18 - INFO - __main__ - Step 9160: {'lr': 0.00015253333333333335, 'samples': 293120, 'steps': 572, 'loss/train': 4.9639105796813965} -09/20/2021 16:28:19 - INFO - __main__ - Step 9161: {'lr': 0.00015253333333333335, 'samples': 293152, 'steps': 572, 'loss/train': 4.153687477111816} -09/20/2021 16:28:20 - INFO - __main__ - Step 9162: {'lr': 0.00015253333333333335, 'samples': 293184, 'steps': 572, 'loss/train': 4.8709306716918945} -09/20/2021 16:28:21 - INFO - __main__ - Step 9163: {'lr': 0.00015253333333333335, 'samples': 293216, 'steps': 572, 'loss/train': 4.103753566741943} -09/20/2021 16:28:21 - INFO - __main__ - Step 9164: {'lr': 0.00015253333333333335, 'samples': 293248, 'steps': 572, 'loss/train': 4.809129238128662} -09/20/2021 16:28:22 - INFO - __main__ - Step 9165: {'lr': 0.00015253333333333335, 'samples': 293280, 'steps': 572, 'loss/train': 4.239647388458252} -09/20/2021 16:28:23 - INFO - __main__ - Step 9166: {'lr': 0.00015253333333333335, 'samples': 293312, 'steps': 572, 'loss/train': 4.607442378997803} -09/20/2021 16:28:24 - INFO - __main__ - Step 9167: {'lr': 0.00015253333333333335, 'samples': 293344, 'steps': 572, 'loss/train': 4.353703022003174} -09/20/2021 16:28:24 - INFO - __main__ - Step 9168: {'lr': 0.00015253333333333335, 'samples': 293376, 'steps': 572, 'loss/train': 2.2696990966796875} -09/20/2021 16:28:25 - INFO - __main__ - Step 9169: {'lr': 0.0001528, 'samples': 293408, 'steps': 573, 'loss/train': 4.5082688331604} -09/20/2021 16:28:26 - INFO - __main__ - Step 9170: {'lr': 0.0001528, 'samples': 293440, 'steps': 573, 'loss/train': 5.176546573638916} -09/20/2021 16:28:27 - INFO - __main__ - Step 9171: {'lr': 0.0001528, 'samples': 293472, 'steps': 573, 'loss/train': 5.336066246032715} -09/20/2021 16:28:27 - INFO - __main__ - Step 9172: {'lr': 0.0001528, 'samples': 293504, 'steps': 573, 'loss/train': 5.619908332824707} -09/20/2021 16:28:28 - INFO - __main__ - Step 9173: {'lr': 0.0001528, 'samples': 293536, 'steps': 573, 'loss/train': 4.89764928817749} -09/20/2021 16:28:29 - INFO - __main__ - Step 9174: {'lr': 0.0001528, 'samples': 293568, 'steps': 573, 'loss/train': 5.5867438316345215} -09/20/2021 16:28:30 - INFO - __main__ - Step 9175: {'lr': 0.0001528, 'samples': 293600, 'steps': 573, 'loss/train': 4.507909774780273} -09/20/2021 16:28:30 - INFO - __main__ - Step 9176: {'lr': 0.0001528, 'samples': 293632, 'steps': 573, 'loss/train': 4.134392738342285} -09/20/2021 16:28:31 - INFO - __main__ - Step 9177: {'lr': 0.0001528, 'samples': 293664, 'steps': 573, 'loss/train': 6.599765777587891} -09/20/2021 16:28:32 - INFO - __main__ - Step 9178: {'lr': 0.0001528, 'samples': 293696, 'steps': 573, 'loss/train': 6.74666166305542} -09/20/2021 16:28:33 - INFO - __main__ - Step 9179: {'lr': 0.0001528, 'samples': 293728, 'steps': 573, 'loss/train': 6.66065788269043} -09/20/2021 16:28:33 - INFO - __main__ - Step 9180: {'lr': 0.0001528, 'samples': 293760, 'steps': 573, 'loss/train': 6.599431991577148} -09/20/2021 16:28:34 - INFO - __main__ - Step 9181: {'lr': 0.0001528, 'samples': 293792, 'steps': 573, 'loss/train': 6.607213973999023} -09/20/2021 16:28:35 - INFO - __main__ - Step 9182: {'lr': 0.0001528, 'samples': 293824, 'steps': 573, 'loss/train': 3.484708547592163} -09/20/2021 16:28:36 - INFO - __main__ - Step 9183: {'lr': 0.0001528, 'samples': 293856, 'steps': 573, 'loss/train': 4.7184367179870605} -09/20/2021 16:28:37 - INFO - __main__ - Step 9184: {'lr': 0.0001528, 'samples': 293888, 'steps': 573, 'loss/train': 4.067212104797363} -09/20/2021 16:28:38 - INFO - __main__ - Step 9185: {'lr': 0.00015306666666666666, 'samples': 293920, 'steps': 574, 'loss/train': 4.134633541107178} -09/20/2021 16:28:39 - INFO - __main__ - Step 9186: {'lr': 0.00015306666666666666, 'samples': 293952, 'steps': 574, 'loss/train': 4.161486625671387} -09/20/2021 16:28:39 - INFO - __main__ - Step 9187: {'lr': 0.00015306666666666666, 'samples': 293984, 'steps': 574, 'loss/train': 4.685704231262207} -09/20/2021 16:28:40 - INFO - __main__ - Step 9188: {'lr': 0.00015306666666666666, 'samples': 294016, 'steps': 574, 'loss/train': 4.92158842086792} -09/20/2021 16:28:41 - INFO - __main__ - Step 9189: {'lr': 0.00015306666666666666, 'samples': 294048, 'steps': 574, 'loss/train': 4.299753189086914} -09/20/2021 16:28:42 - INFO - __main__ - Step 9190: {'lr': 0.00015306666666666666, 'samples': 294080, 'steps': 574, 'loss/train': 5.121466636657715} -09/20/2021 16:28:42 - INFO - __main__ - Step 9191: {'lr': 0.00015306666666666666, 'samples': 294112, 'steps': 574, 'loss/train': 4.097507476806641} -09/20/2021 16:28:43 - INFO - __main__ - Step 9192: {'lr': 0.00015306666666666666, 'samples': 294144, 'steps': 574, 'loss/train': 6.7293314933776855} -09/20/2021 16:28:44 - INFO - __main__ - Step 9193: {'lr': 0.00015306666666666666, 'samples': 294176, 'steps': 574, 'loss/train': 6.737128257751465} -09/20/2021 16:28:45 - INFO - __main__ - Step 9194: {'lr': 0.00015306666666666666, 'samples': 294208, 'steps': 574, 'loss/train': 1.220834493637085} -09/20/2021 16:28:45 - INFO - __main__ - Step 9195: {'lr': 0.00015306666666666666, 'samples': 294240, 'steps': 574, 'loss/train': 3.1697943210601807} -09/20/2021 16:28:46 - INFO - __main__ - Step 9196: {'lr': 0.00015306666666666666, 'samples': 294272, 'steps': 574, 'loss/train': 5.042102336883545} -09/20/2021 16:28:47 - INFO - __main__ - Step 9197: {'lr': 0.00015306666666666666, 'samples': 294304, 'steps': 574, 'loss/train': 3.8684051036834717} -09/20/2021 16:28:48 - INFO - __main__ - Step 9198: {'lr': 0.00015306666666666666, 'samples': 294336, 'steps': 574, 'loss/train': 4.410516262054443} -09/20/2021 16:28:48 - INFO - __main__ - Step 9199: {'lr': 0.00015306666666666666, 'samples': 294368, 'steps': 574, 'loss/train': 4.576119899749756} -09/20/2021 16:28:49 - INFO - __main__ - Step 9200: {'lr': 0.00015306666666666666, 'samples': 294400, 'steps': 574, 'loss/train': 4.924912452697754} -09/20/2021 16:28:50 - INFO - __main__ - Step 9201: {'lr': 0.00015333333333333334, 'samples': 294432, 'steps': 575, 'loss/train': 4.483798027038574} -09/20/2021 16:28:51 - INFO - __main__ - Step 9202: {'lr': 0.00015333333333333334, 'samples': 294464, 'steps': 575, 'loss/train': 3.023815155029297} -09/20/2021 16:28:52 - INFO - __main__ - Step 9203: {'lr': 0.00015333333333333334, 'samples': 294496, 'steps': 575, 'loss/train': 4.389077663421631} -09/20/2021 16:28:52 - INFO - __main__ - Step 9204: {'lr': 0.00015333333333333334, 'samples': 294528, 'steps': 575, 'loss/train': 5.070385932922363} -09/20/2021 16:28:53 - INFO - __main__ - Step 9205: {'lr': 0.00015333333333333334, 'samples': 294560, 'steps': 575, 'loss/train': 6.009032726287842} -09/20/2021 16:28:54 - INFO - __main__ - Step 9206: {'lr': 0.00015333333333333334, 'samples': 294592, 'steps': 575, 'loss/train': 4.614181995391846} -09/20/2021 16:28:55 - INFO - __main__ - Step 9207: {'lr': 0.00015333333333333334, 'samples': 294624, 'steps': 575, 'loss/train': 4.343713283538818} -09/20/2021 16:28:55 - INFO - __main__ - Step 9208: {'lr': 0.00015333333333333334, 'samples': 294656, 'steps': 575, 'loss/train': 4.844249248504639} -09/20/2021 16:28:56 - INFO - __main__ - Step 9209: {'lr': 0.00015333333333333334, 'samples': 294688, 'steps': 575, 'loss/train': 6.287209987640381} -09/20/2021 16:28:57 - INFO - __main__ - Step 9210: {'lr': 0.00015333333333333334, 'samples': 294720, 'steps': 575, 'loss/train': 3.841123580932617} -09/20/2021 16:28:58 - INFO - __main__ - Step 9211: {'lr': 0.00015333333333333334, 'samples': 294752, 'steps': 575, 'loss/train': 5.562195301055908} -09/20/2021 16:28:58 - INFO - __main__ - Step 9212: {'lr': 0.00015333333333333334, 'samples': 294784, 'steps': 575, 'loss/train': 2.8425776958465576} -09/20/2021 16:28:59 - INFO - __main__ - Step 9213: {'lr': 0.00015333333333333334, 'samples': 294816, 'steps': 575, 'loss/train': 3.9437084197998047} -09/20/2021 16:29:00 - INFO - __main__ - Step 9214: {'lr': 0.00015333333333333334, 'samples': 294848, 'steps': 575, 'loss/train': 3.641906261444092} -09/20/2021 16:29:01 - INFO - __main__ - Step 9215: {'lr': 0.00015333333333333334, 'samples': 294880, 'steps': 575, 'loss/train': 4.909311771392822} -09/20/2021 16:29:02 - INFO - __main__ - Step 9216: {'lr': 0.00015333333333333334, 'samples': 294912, 'steps': 575, 'loss/train': 5.090423583984375} -09/20/2021 16:29:03 - INFO - __main__ - Step 9217: {'lr': 0.00015360000000000002, 'samples': 294944, 'steps': 576, 'loss/train': 4.029866695404053} -09/20/2021 16:29:04 - INFO - __main__ - Step 9218: {'lr': 0.00015360000000000002, 'samples': 294976, 'steps': 576, 'loss/train': 4.369381904602051} -09/20/2021 16:29:04 - INFO - __main__ - Step 9219: {'lr': 0.00015360000000000002, 'samples': 295008, 'steps': 576, 'loss/train': 3.7883503437042236} -09/20/2021 16:29:05 - INFO - __main__ - Step 9220: {'lr': 0.00015360000000000002, 'samples': 295040, 'steps': 576, 'loss/train': 5.068562984466553} -09/20/2021 16:29:06 - INFO - __main__ - Step 9221: {'lr': 0.00015360000000000002, 'samples': 295072, 'steps': 576, 'loss/train': 4.166048526763916} -09/20/2021 16:29:07 - INFO - __main__ - Step 9222: {'lr': 0.00015360000000000002, 'samples': 295104, 'steps': 576, 'loss/train': 4.669317722320557} -09/20/2021 16:29:07 - INFO - __main__ - Step 9223: {'lr': 0.00015360000000000002, 'samples': 295136, 'steps': 576, 'loss/train': 5.430252552032471} -09/20/2021 16:29:08 - INFO - __main__ - Step 9224: {'lr': 0.00015360000000000002, 'samples': 295168, 'steps': 576, 'loss/train': 6.103929042816162} -09/20/2021 16:29:09 - INFO - __main__ - Step 9225: {'lr': 0.00015360000000000002, 'samples': 295200, 'steps': 576, 'loss/train': 4.654404640197754} -09/20/2021 16:29:10 - INFO - __main__ - Step 9226: {'lr': 0.00015360000000000002, 'samples': 295232, 'steps': 576, 'loss/train': 4.799233436584473} -09/20/2021 16:29:10 - INFO - __main__ - Step 9227: {'lr': 0.00015360000000000002, 'samples': 295264, 'steps': 576, 'loss/train': 4.489307403564453} -09/20/2021 16:29:11 - INFO - __main__ - Step 9228: {'lr': 0.00015360000000000002, 'samples': 295296, 'steps': 576, 'loss/train': 3.162201404571533} -09/20/2021 16:29:12 - INFO - __main__ - Step 9229: {'lr': 0.00015360000000000002, 'samples': 295328, 'steps': 576, 'loss/train': 4.430498123168945} -09/20/2021 16:29:13 - INFO - __main__ - Step 9230: {'lr': 0.00015360000000000002, 'samples': 295360, 'steps': 576, 'loss/train': 4.6192426681518555} -09/20/2021 16:29:13 - INFO - __main__ - Step 9231: {'lr': 0.00015360000000000002, 'samples': 295392, 'steps': 576, 'loss/train': 3.533003330230713} -09/20/2021 16:29:14 - INFO - __main__ - Step 9232: {'lr': 0.00015360000000000002, 'samples': 295424, 'steps': 576, 'loss/train': 4.7056565284729} -09/20/2021 16:29:15 - INFO - __main__ - Step 9233: {'lr': 0.00015386666666666668, 'samples': 295456, 'steps': 577, 'loss/train': 4.194883823394775} -09/20/2021 16:29:16 - INFO - __main__ - Step 9234: {'lr': 0.00015386666666666668, 'samples': 295488, 'steps': 577, 'loss/train': 3.7158546447753906} -09/20/2021 16:29:16 - INFO - __main__ - Step 9235: {'lr': 0.00015386666666666668, 'samples': 295520, 'steps': 577, 'loss/train': 3.474473714828491} -09/20/2021 16:29:17 - INFO - __main__ - Step 9236: {'lr': 0.00015386666666666668, 'samples': 295552, 'steps': 577, 'loss/train': 3.6989805698394775} -09/20/2021 16:29:18 - INFO - __main__ - Step 9237: {'lr': 0.00015386666666666668, 'samples': 295584, 'steps': 577, 'loss/train': 5.583254337310791} -09/20/2021 16:29:19 - INFO - __main__ - Step 9238: {'lr': 0.00015386666666666668, 'samples': 295616, 'steps': 577, 'loss/train': 5.007637977600098} -09/20/2021 16:29:19 - INFO - __main__ - Step 9239: {'lr': 0.00015386666666666668, 'samples': 295648, 'steps': 577, 'loss/train': 6.008291244506836} -09/20/2021 16:29:20 - INFO - __main__ - Step 9240: {'lr': 0.00015386666666666668, 'samples': 295680, 'steps': 577, 'loss/train': 5.221586227416992} -09/20/2021 16:29:21 - INFO - __main__ - Step 9241: {'lr': 0.00015386666666666668, 'samples': 295712, 'steps': 577, 'loss/train': 2.6133992671966553} -09/20/2021 16:29:22 - INFO - __main__ - Step 9242: {'lr': 0.00015386666666666668, 'samples': 295744, 'steps': 577, 'loss/train': 5.44734001159668} -09/20/2021 16:29:22 - INFO - __main__ - Step 9243: {'lr': 0.00015386666666666668, 'samples': 295776, 'steps': 577, 'loss/train': 4.739655494689941} -09/20/2021 16:29:23 - INFO - __main__ - Step 9244: {'lr': 0.00015386666666666668, 'samples': 295808, 'steps': 577, 'loss/train': 4.697142124176025} -09/20/2021 16:29:24 - INFO - __main__ - Step 9245: {'lr': 0.00015386666666666668, 'samples': 295840, 'steps': 577, 'loss/train': 4.279897689819336} -09/20/2021 16:29:25 - INFO - __main__ - Step 9246: {'lr': 0.00015386666666666668, 'samples': 295872, 'steps': 577, 'loss/train': 4.629110813140869} -09/20/2021 16:29:26 - INFO - __main__ - Step 9247: {'lr': 0.00015386666666666668, 'samples': 295904, 'steps': 577, 'loss/train': 5.5491251945495605} -09/20/2021 16:29:27 - INFO - __main__ - Step 9248: {'lr': 0.00015386666666666668, 'samples': 295936, 'steps': 577, 'loss/train': 4.183241844177246} -09/20/2021 16:29:28 - INFO - __main__ - Step 9249: {'lr': 0.00015413333333333336, 'samples': 295968, 'steps': 578, 'loss/train': 4.369015216827393} -09/20/2021 16:29:28 - INFO - __main__ - Step 9250: {'lr': 0.00015413333333333336, 'samples': 296000, 'steps': 578, 'loss/train': 5.050980567932129} -09/20/2021 16:29:29 - INFO - __main__ - Step 9251: {'lr': 0.00015413333333333336, 'samples': 296032, 'steps': 578, 'loss/train': 4.5918288230896} -09/20/2021 16:29:30 - INFO - __main__ - Step 9252: {'lr': 0.00015413333333333336, 'samples': 296064, 'steps': 578, 'loss/train': 5.451636791229248} -09/20/2021 16:29:31 - INFO - __main__ - Step 9253: {'lr': 0.00015413333333333336, 'samples': 296096, 'steps': 578, 'loss/train': 4.058322429656982} -09/20/2021 16:29:31 - INFO - __main__ - Step 9254: {'lr': 0.00015413333333333336, 'samples': 296128, 'steps': 578, 'loss/train': 5.3337812423706055} -09/20/2021 16:29:32 - INFO - __main__ - Step 9255: {'lr': 0.00015413333333333336, 'samples': 296160, 'steps': 578, 'loss/train': 4.391280174255371} -09/20/2021 16:29:33 - INFO - __main__ - Step 9256: {'lr': 0.00015413333333333336, 'samples': 296192, 'steps': 578, 'loss/train': 4.185029029846191} -09/20/2021 16:29:34 - INFO - __main__ - Step 9257: {'lr': 0.00015413333333333336, 'samples': 296224, 'steps': 578, 'loss/train': 5.147022247314453} -09/20/2021 16:29:34 - INFO - __main__ - Step 9258: {'lr': 0.00015413333333333336, 'samples': 296256, 'steps': 578, 'loss/train': 4.492595195770264} -09/20/2021 16:29:35 - INFO - __main__ - Step 9259: {'lr': 0.00015413333333333336, 'samples': 296288, 'steps': 578, 'loss/train': 5.631930351257324} -09/20/2021 16:29:36 - INFO - __main__ - Step 9260: {'lr': 0.00015413333333333336, 'samples': 296320, 'steps': 578, 'loss/train': 4.31976842880249} -09/20/2021 16:29:37 - INFO - __main__ - Step 9261: {'lr': 0.00015413333333333336, 'samples': 296352, 'steps': 578, 'loss/train': 5.573334693908691} -09/20/2021 16:29:37 - INFO - __main__ - Step 9262: {'lr': 0.00015413333333333336, 'samples': 296384, 'steps': 578, 'loss/train': 4.102834701538086} -09/20/2021 16:29:38 - INFO - __main__ - Step 9263: {'lr': 0.00015413333333333336, 'samples': 296416, 'steps': 578, 'loss/train': 3.1637074947357178} -09/20/2021 16:29:39 - INFO - __main__ - Step 9264: {'lr': 0.00015413333333333336, 'samples': 296448, 'steps': 578, 'loss/train': 4.684540748596191} -09/20/2021 16:29:40 - INFO - __main__ - Step 9265: {'lr': 0.0001544, 'samples': 296480, 'steps': 579, 'loss/train': 5.1241326332092285} -09/20/2021 16:29:40 - INFO - __main__ - Step 9266: {'lr': 0.0001544, 'samples': 296512, 'steps': 579, 'loss/train': 5.36445426940918} -09/20/2021 16:29:41 - INFO - __main__ - Step 9267: {'lr': 0.0001544, 'samples': 296544, 'steps': 579, 'loss/train': 4.059236526489258} -09/20/2021 16:29:42 - INFO - __main__ - Step 9268: {'lr': 0.0001544, 'samples': 296576, 'steps': 579, 'loss/train': 5.197988510131836} -09/20/2021 16:29:43 - INFO - __main__ - Step 9269: {'lr': 0.0001544, 'samples': 296608, 'steps': 579, 'loss/train': 5.570725440979004} -09/20/2021 16:29:43 - INFO - __main__ - Step 9270: {'lr': 0.0001544, 'samples': 296640, 'steps': 579, 'loss/train': 4.270401477813721} -09/20/2021 16:29:44 - INFO - __main__ - Step 9271: {'lr': 0.0001544, 'samples': 296672, 'steps': 579, 'loss/train': 4.807579517364502} -09/20/2021 16:29:45 - INFO - __main__ - Step 9272: {'lr': 0.0001544, 'samples': 296704, 'steps': 579, 'loss/train': 4.540106296539307} -09/20/2021 16:29:46 - INFO - __main__ - Step 9273: {'lr': 0.0001544, 'samples': 296736, 'steps': 579, 'loss/train': 4.308215141296387} -09/20/2021 16:29:46 - INFO - __main__ - Step 9274: {'lr': 0.0001544, 'samples': 296768, 'steps': 579, 'loss/train': 3.5511741638183594} -09/20/2021 16:29:47 - INFO - __main__ - Step 9275: {'lr': 0.0001544, 'samples': 296800, 'steps': 579, 'loss/train': 5.033788204193115} -09/20/2021 16:29:48 - INFO - __main__ - Step 9276: {'lr': 0.0001544, 'samples': 296832, 'steps': 579, 'loss/train': 1.7341618537902832} -09/20/2021 16:29:49 - INFO - __main__ - Step 9277: {'lr': 0.0001544, 'samples': 296864, 'steps': 579, 'loss/train': 4.877492427825928} -09/20/2021 16:29:50 - INFO - __main__ - Step 9278: {'lr': 0.0001544, 'samples': 296896, 'steps': 579, 'loss/train': 4.2953200340271} -09/20/2021 16:29:51 - INFO - __main__ - Step 9279: {'lr': 0.0001544, 'samples': 296928, 'steps': 579, 'loss/train': 5.454253196716309} -09/20/2021 16:29:51 - INFO - __main__ - Step 9280: {'lr': 0.0001544, 'samples': 296960, 'steps': 579, 'loss/train': 4.61253023147583} -09/20/2021 16:29:52 - INFO - __main__ - Step 9281: {'lr': 0.00015466666666666667, 'samples': 296992, 'steps': 580, 'loss/train': 5.147242546081543} -09/20/2021 16:29:53 - INFO - __main__ - Step 9282: {'lr': 0.00015466666666666667, 'samples': 297024, 'steps': 580, 'loss/train': 3.8523926734924316} -09/20/2021 16:29:54 - INFO - __main__ - Step 9283: {'lr': 0.00015466666666666667, 'samples': 297056, 'steps': 580, 'loss/train': 4.629055976867676} -09/20/2021 16:29:55 - INFO - __main__ - Step 9284: {'lr': 0.00015466666666666667, 'samples': 297088, 'steps': 580, 'loss/train': 5.702465534210205} -09/20/2021 16:29:55 - INFO - __main__ - Step 9285: {'lr': 0.00015466666666666667, 'samples': 297120, 'steps': 580, 'loss/train': 4.86728572845459} -09/20/2021 16:29:56 - INFO - __main__ - Step 9286: {'lr': 0.00015466666666666667, 'samples': 297152, 'steps': 580, 'loss/train': 4.331594944000244} -09/20/2021 16:29:57 - INFO - __main__ - Step 9287: {'lr': 0.00015466666666666667, 'samples': 297184, 'steps': 580, 'loss/train': 1.9746708869934082} -09/20/2021 16:29:58 - INFO - __main__ - Step 9288: {'lr': 0.00015466666666666667, 'samples': 297216, 'steps': 580, 'loss/train': 5.729973316192627} -09/20/2021 16:29:58 - INFO - __main__ - Step 9289: {'lr': 0.00015466666666666667, 'samples': 297248, 'steps': 580, 'loss/train': 5.214742660522461} -09/20/2021 16:29:59 - INFO - __main__ - Step 9290: {'lr': 0.00015466666666666667, 'samples': 297280, 'steps': 580, 'loss/train': 7.159904956817627} -09/20/2021 16:30:00 - INFO - __main__ - Step 9291: {'lr': 0.00015466666666666667, 'samples': 297312, 'steps': 580, 'loss/train': 3.9143364429473877} -09/20/2021 16:30:01 - INFO - __main__ - Step 9292: {'lr': 0.00015466666666666667, 'samples': 297344, 'steps': 580, 'loss/train': 3.0707685947418213} -09/20/2021 16:30:01 - INFO - __main__ - Step 9293: {'lr': 0.00015466666666666667, 'samples': 297376, 'steps': 580, 'loss/train': 4.783838272094727} -09/20/2021 16:30:02 - INFO - __main__ - Step 9294: {'lr': 0.00015466666666666667, 'samples': 297408, 'steps': 580, 'loss/train': 4.867555141448975} -09/20/2021 16:30:03 - INFO - __main__ - Step 9295: {'lr': 0.00015466666666666667, 'samples': 297440, 'steps': 580, 'loss/train': 4.908377647399902} -09/20/2021 16:30:04 - INFO - __main__ - Step 9296: {'lr': 0.00015466666666666667, 'samples': 297472, 'steps': 580, 'loss/train': 4.554978370666504} -09/20/2021 16:30:05 - INFO - __main__ - Step 9297: {'lr': 0.00015493333333333332, 'samples': 297504, 'steps': 581, 'loss/train': 3.551007032394409} -09/20/2021 16:30:05 - INFO - __main__ - Step 9298: {'lr': 0.00015493333333333332, 'samples': 297536, 'steps': 581, 'loss/train': 4.264064311981201} -09/20/2021 16:30:06 - INFO - __main__ - Step 9299: {'lr': 0.00015493333333333332, 'samples': 297568, 'steps': 581, 'loss/train': 3.9977517127990723} -09/20/2021 16:30:07 - INFO - __main__ - Step 9300: {'lr': 0.00015493333333333332, 'samples': 297600, 'steps': 581, 'loss/train': 5.079782009124756} -09/20/2021 16:30:08 - INFO - __main__ - Step 9301: {'lr': 0.00015493333333333332, 'samples': 297632, 'steps': 581, 'loss/train': 4.240828514099121} -09/20/2021 16:30:08 - INFO - __main__ - Step 9302: {'lr': 0.00015493333333333332, 'samples': 297664, 'steps': 581, 'loss/train': 4.504662990570068} -09/20/2021 16:30:09 - INFO - __main__ - Step 9303: {'lr': 0.00015493333333333332, 'samples': 297696, 'steps': 581, 'loss/train': 5.464138984680176} -09/20/2021 16:30:10 - INFO - __main__ - Step 9304: {'lr': 0.00015493333333333332, 'samples': 297728, 'steps': 581, 'loss/train': 4.700360298156738} -09/20/2021 16:30:11 - INFO - __main__ - Step 9305: {'lr': 0.00015493333333333332, 'samples': 297760, 'steps': 581, 'loss/train': 4.6331024169921875} -09/20/2021 16:30:11 - INFO - __main__ - Step 9306: {'lr': 0.00015493333333333332, 'samples': 297792, 'steps': 581, 'loss/train': 4.653619766235352} -09/20/2021 16:30:12 - INFO - __main__ - Step 9307: {'lr': 0.00015493333333333332, 'samples': 297824, 'steps': 581, 'loss/train': 4.649620532989502} -09/20/2021 16:30:14 - INFO - __main__ - Step 9308: {'lr': 0.00015493333333333332, 'samples': 297856, 'steps': 581, 'loss/train': 4.489755153656006} -09/20/2021 16:30:14 - INFO - __main__ - Step 9309: {'lr': 0.00015493333333333332, 'samples': 297888, 'steps': 581, 'loss/train': 5.15381383895874} -09/20/2021 16:30:15 - INFO - __main__ - Step 9310: {'lr': 0.00015493333333333332, 'samples': 297920, 'steps': 581, 'loss/train': 4.5852131843566895} -09/20/2021 16:30:16 - INFO - __main__ - Step 9311: {'lr': 0.00015493333333333332, 'samples': 297952, 'steps': 581, 'loss/train': 4.611542224884033} -09/20/2021 16:30:17 - INFO - __main__ - Step 9312: {'lr': 0.00015493333333333332, 'samples': 297984, 'steps': 581, 'loss/train': 4.549009323120117} -09/20/2021 16:30:18 - INFO - __main__ - Step 9313: {'lr': 0.0001552, 'samples': 298016, 'steps': 582, 'loss/train': 5.123684406280518} -09/20/2021 16:30:18 - INFO - __main__ - Step 9314: {'lr': 0.0001552, 'samples': 298048, 'steps': 582, 'loss/train': 3.5417897701263428} -09/20/2021 16:30:19 - INFO - __main__ - Step 9315: {'lr': 0.0001552, 'samples': 298080, 'steps': 582, 'loss/train': 4.651724815368652} -09/20/2021 16:30:20 - INFO - __main__ - Step 9316: {'lr': 0.0001552, 'samples': 298112, 'steps': 582, 'loss/train': 3.798348903656006} -09/20/2021 16:30:21 - INFO - __main__ - Step 9317: {'lr': 0.0001552, 'samples': 298144, 'steps': 582, 'loss/train': 5.524624347686768} -09/20/2021 16:30:21 - INFO - __main__ - Step 9318: {'lr': 0.0001552, 'samples': 298176, 'steps': 582, 'loss/train': 4.893937587738037} -09/20/2021 16:30:22 - INFO - __main__ - Step 9319: {'lr': 0.0001552, 'samples': 298208, 'steps': 582, 'loss/train': 4.385846138000488} -09/20/2021 16:30:23 - INFO - __main__ - Step 9320: {'lr': 0.0001552, 'samples': 298240, 'steps': 582, 'loss/train': 4.440754413604736} -09/20/2021 16:30:24 - INFO - __main__ - Step 9321: {'lr': 0.0001552, 'samples': 298272, 'steps': 582, 'loss/train': 4.7507805824279785} -09/20/2021 16:30:24 - INFO - __main__ - Step 9322: {'lr': 0.0001552, 'samples': 298304, 'steps': 582, 'loss/train': 4.768107891082764} -09/20/2021 16:30:25 - INFO - __main__ - Step 9323: {'lr': 0.0001552, 'samples': 298336, 'steps': 582, 'loss/train': 4.293576717376709} -09/20/2021 16:30:26 - INFO - __main__ - Step 9324: {'lr': 0.0001552, 'samples': 298368, 'steps': 582, 'loss/train': 4.822847843170166} -09/20/2021 16:30:27 - INFO - __main__ - Step 9325: {'lr': 0.0001552, 'samples': 298400, 'steps': 582, 'loss/train': 4.939576148986816} -09/20/2021 16:30:27 - INFO - __main__ - Step 9326: {'lr': 0.0001552, 'samples': 298432, 'steps': 582, 'loss/train': 4.320757865905762} -09/20/2021 16:30:28 - INFO - __main__ - Step 9327: {'lr': 0.0001552, 'samples': 298464, 'steps': 582, 'loss/train': 5.051089286804199} -09/20/2021 16:30:29 - INFO - __main__ - Step 9328: {'lr': 0.0001552, 'samples': 298496, 'steps': 582, 'loss/train': 3.4861931800842285} -09/20/2021 16:30:30 - INFO - __main__ - Step 9329: {'lr': 0.00015546666666666666, 'samples': 298528, 'steps': 583, 'loss/train': 3.303741455078125} -09/20/2021 16:30:30 - INFO - __main__ - Step 9330: {'lr': 0.00015546666666666666, 'samples': 298560, 'steps': 583, 'loss/train': 2.8746097087860107} -09/20/2021 16:30:31 - INFO - __main__ - Step 9331: {'lr': 0.00015546666666666666, 'samples': 298592, 'steps': 583, 'loss/train': 3.7083098888397217} -09/20/2021 16:30:32 - INFO - __main__ - Step 9332: {'lr': 0.00015546666666666666, 'samples': 298624, 'steps': 583, 'loss/train': 4.55633020401001} -09/20/2021 16:30:33 - INFO - __main__ - Step 9333: {'lr': 0.00015546666666666666, 'samples': 298656, 'steps': 583, 'loss/train': 2.743323564529419} -09/20/2021 16:30:33 - INFO - __main__ - Step 9334: {'lr': 0.00015546666666666666, 'samples': 298688, 'steps': 583, 'loss/train': 4.010953903198242} -09/20/2021 16:30:34 - INFO - __main__ - Step 9335: {'lr': 0.00015546666666666666, 'samples': 298720, 'steps': 583, 'loss/train': 3.229154348373413} -09/20/2021 16:30:35 - INFO - __main__ - Step 9336: {'lr': 0.00015546666666666666, 'samples': 298752, 'steps': 583, 'loss/train': 2.6470324993133545} -09/20/2021 16:30:36 - INFO - __main__ - Step 9337: {'lr': 0.00015546666666666666, 'samples': 298784, 'steps': 583, 'loss/train': 2.652125597000122} -09/20/2021 16:30:36 - INFO - __main__ - Step 9338: {'lr': 0.00015546666666666666, 'samples': 298816, 'steps': 583, 'loss/train': 3.387387752532959} -09/20/2021 16:30:37 - INFO - __main__ - Step 9339: {'lr': 0.00015546666666666666, 'samples': 298848, 'steps': 583, 'loss/train': 3.545266628265381} -09/20/2021 16:30:38 - INFO - __main__ - Step 9340: {'lr': 0.00015546666666666666, 'samples': 298880, 'steps': 583, 'loss/train': 5.051119327545166} -09/20/2021 16:30:39 - INFO - __main__ - Step 9341: {'lr': 0.00015546666666666666, 'samples': 298912, 'steps': 583, 'loss/train': 3.474015712738037} -09/20/2021 16:30:39 - INFO - __main__ - Step 9342: {'lr': 0.00015546666666666666, 'samples': 298944, 'steps': 583, 'loss/train': 4.610651969909668} -09/20/2021 16:30:40 - INFO - __main__ - Step 9343: {'lr': 0.00015546666666666666, 'samples': 298976, 'steps': 583, 'loss/train': 5.521502494812012} -09/20/2021 16:30:41 - INFO - __main__ - Step 9344: {'lr': 0.00015546666666666666, 'samples': 299008, 'steps': 583, 'loss/train': 4.752877235412598} -09/20/2021 16:30:42 - INFO - __main__ - Step 9345: {'lr': 0.00015573333333333334, 'samples': 299040, 'steps': 584, 'loss/train': 4.739267349243164} -09/20/2021 16:30:44 - INFO - __main__ - Step 9346: {'lr': 0.00015573333333333334, 'samples': 299072, 'steps': 584, 'loss/train': 4.661870002746582} -09/20/2021 16:30:44 - INFO - __main__ - Step 9347: {'lr': 0.00015573333333333334, 'samples': 299104, 'steps': 584, 'loss/train': 4.743530750274658} -09/20/2021 16:30:45 - INFO - __main__ - Step 9348: {'lr': 0.00015573333333333334, 'samples': 299136, 'steps': 584, 'loss/train': 4.177597999572754} -09/20/2021 16:30:46 - INFO - __main__ - Step 9349: {'lr': 0.00015573333333333334, 'samples': 299168, 'steps': 584, 'loss/train': 5.047518730163574} -09/20/2021 16:30:47 - INFO - __main__ - Step 9350: {'lr': 0.00015573333333333334, 'samples': 299200, 'steps': 584, 'loss/train': 4.799640655517578} -09/20/2021 16:30:47 - INFO - __main__ - Step 9351: {'lr': 0.00015573333333333334, 'samples': 299232, 'steps': 584, 'loss/train': 5.383493900299072} -09/20/2021 16:30:48 - INFO - __main__ - Step 9352: {'lr': 0.00015573333333333334, 'samples': 299264, 'steps': 584, 'loss/train': 4.6413750648498535} -09/20/2021 16:30:49 - INFO - __main__ - Step 9353: {'lr': 0.00015573333333333334, 'samples': 299296, 'steps': 584, 'loss/train': 5.221963882446289} -09/20/2021 16:30:50 - INFO - __main__ - Step 9354: {'lr': 0.00015573333333333334, 'samples': 299328, 'steps': 584, 'loss/train': 4.221322059631348} -09/20/2021 16:30:50 - INFO - __main__ - Step 9355: {'lr': 0.00015573333333333334, 'samples': 299360, 'steps': 584, 'loss/train': 4.851840496063232} -09/20/2021 16:30:51 - INFO - __main__ - Step 9356: {'lr': 0.00015573333333333334, 'samples': 299392, 'steps': 584, 'loss/train': 5.000359058380127} -09/20/2021 16:30:52 - INFO - __main__ - Step 9357: {'lr': 0.00015573333333333334, 'samples': 299424, 'steps': 584, 'loss/train': 3.988102436065674} -09/20/2021 16:30:53 - INFO - __main__ - Step 9358: {'lr': 0.00015573333333333334, 'samples': 299456, 'steps': 584, 'loss/train': 6.43444299697876} -09/20/2021 16:30:53 - INFO - __main__ - Step 9359: {'lr': 0.00015573333333333334, 'samples': 299488, 'steps': 584, 'loss/train': 5.187668800354004} -09/20/2021 16:30:54 - INFO - __main__ - Step 9360: {'lr': 0.00015573333333333334, 'samples': 299520, 'steps': 584, 'loss/train': 5.937278747558594} -09/20/2021 16:30:55 - INFO - __main__ - Step 9361: {'lr': 0.00015600000000000002, 'samples': 299552, 'steps': 585, 'loss/train': 5.404601097106934} -09/20/2021 16:30:56 - INFO - __main__ - Step 9362: {'lr': 0.00015600000000000002, 'samples': 299584, 'steps': 585, 'loss/train': 4.4545183181762695} -09/20/2021 16:30:56 - INFO - __main__ - Step 9363: {'lr': 0.00015600000000000002, 'samples': 299616, 'steps': 585, 'loss/train': 4.1494574546813965} -09/20/2021 16:30:57 - INFO - __main__ - Step 9364: {'lr': 0.00015600000000000002, 'samples': 299648, 'steps': 585, 'loss/train': 4.785559177398682} -09/20/2021 16:30:58 - INFO - __main__ - Step 9365: {'lr': 0.00015600000000000002, 'samples': 299680, 'steps': 585, 'loss/train': 4.420159816741943} -09/20/2021 16:30:59 - INFO - __main__ - Step 9366: {'lr': 0.00015600000000000002, 'samples': 299712, 'steps': 585, 'loss/train': 3.8108270168304443} -09/20/2021 16:30:59 - INFO - __main__ - Step 9367: {'lr': 0.00015600000000000002, 'samples': 299744, 'steps': 585, 'loss/train': 4.107551097869873} -09/20/2021 16:31:00 - INFO - __main__ - Step 9368: {'lr': 0.00015600000000000002, 'samples': 299776, 'steps': 585, 'loss/train': 3.9928503036499023} -09/20/2021 16:31:01 - INFO - __main__ - Step 9369: {'lr': 0.00015600000000000002, 'samples': 299808, 'steps': 585, 'loss/train': 4.193702697753906} -09/20/2021 16:31:02 - INFO - __main__ - Step 9370: {'lr': 0.00015600000000000002, 'samples': 299840, 'steps': 585, 'loss/train': 4.131744384765625} -09/20/2021 16:31:02 - INFO - __main__ - Step 9371: {'lr': 0.00015600000000000002, 'samples': 299872, 'steps': 585, 'loss/train': 5.127267360687256} -09/20/2021 16:31:03 - INFO - __main__ - Step 9372: {'lr': 0.00015600000000000002, 'samples': 299904, 'steps': 585, 'loss/train': 4.347264766693115} -09/20/2021 16:31:04 - INFO - __main__ - Step 9373: {'lr': 0.00015600000000000002, 'samples': 299936, 'steps': 585, 'loss/train': 4.405947208404541} -09/20/2021 16:31:05 - INFO - __main__ - Step 9374: {'lr': 0.00015600000000000002, 'samples': 299968, 'steps': 585, 'loss/train': 6.214147090911865} -09/20/2021 16:31:06 - INFO - __main__ - Step 9375: {'lr': 0.00015600000000000002, 'samples': 300000, 'steps': 585, 'loss/train': 4.774648666381836} -09/20/2021 16:31:07 - INFO - __main__ - Step 9376: {'lr': 0.00015600000000000002, 'samples': 300032, 'steps': 585, 'loss/train': 3.486860990524292} -09/20/2021 16:31:08 - INFO - __main__ - Step 9377: {'lr': 0.00015626666666666668, 'samples': 300064, 'steps': 586, 'loss/train': 4.732381820678711} -09/20/2021 16:31:08 - INFO - __main__ - Step 9378: {'lr': 0.00015626666666666668, 'samples': 300096, 'steps': 586, 'loss/train': 5.407897472381592} -09/20/2021 16:31:09 - INFO - __main__ - Step 9379: {'lr': 0.00015626666666666668, 'samples': 300128, 'steps': 586, 'loss/train': 3.60341477394104} -09/20/2021 16:31:10 - INFO - __main__ - Step 9380: {'lr': 0.00015626666666666668, 'samples': 300160, 'steps': 586, 'loss/train': 5.179311752319336} -09/20/2021 16:31:11 - INFO - __main__ - Step 9381: {'lr': 0.00015626666666666668, 'samples': 300192, 'steps': 586, 'loss/train': 4.445324420928955} -09/20/2021 16:31:11 - INFO - __main__ - Step 9382: {'lr': 0.00015626666666666668, 'samples': 300224, 'steps': 586, 'loss/train': 4.376417636871338} -09/20/2021 16:31:12 - INFO - __main__ - Step 9383: {'lr': 0.00015626666666666668, 'samples': 300256, 'steps': 586, 'loss/train': 4.639883041381836} -09/20/2021 16:31:13 - INFO - __main__ - Step 9384: {'lr': 0.00015626666666666668, 'samples': 300288, 'steps': 586, 'loss/train': 4.706721782684326} -09/20/2021 16:31:14 - INFO - __main__ - Step 9385: {'lr': 0.00015626666666666668, 'samples': 300320, 'steps': 586, 'loss/train': 5.533502101898193} -09/20/2021 16:31:14 - INFO - __main__ - Step 9386: {'lr': 0.00015626666666666668, 'samples': 300352, 'steps': 586, 'loss/train': 4.65383768081665} -09/20/2021 16:31:15 - INFO - __main__ - Step 9387: {'lr': 0.00015626666666666668, 'samples': 300384, 'steps': 586, 'loss/train': 5.12178897857666} -09/20/2021 16:31:16 - INFO - __main__ - Step 9388: {'lr': 0.00015626666666666668, 'samples': 300416, 'steps': 586, 'loss/train': 4.038923263549805} -09/20/2021 16:31:17 - INFO - __main__ - Step 9389: {'lr': 0.00015626666666666668, 'samples': 300448, 'steps': 586, 'loss/train': 5.349039554595947} -09/20/2021 16:31:17 - INFO - __main__ - Step 9390: {'lr': 0.00015626666666666668, 'samples': 300480, 'steps': 586, 'loss/train': 4.026980876922607} -09/20/2021 16:31:18 - INFO - __main__ - Step 9391: {'lr': 0.00015626666666666668, 'samples': 300512, 'steps': 586, 'loss/train': 5.758174419403076} -09/20/2021 16:31:19 - INFO - __main__ - Step 9392: {'lr': 0.00015626666666666668, 'samples': 300544, 'steps': 586, 'loss/train': 4.58479642868042} -09/20/2021 16:31:20 - INFO - __main__ - Step 9393: {'lr': 0.00015653333333333333, 'samples': 300576, 'steps': 587, 'loss/train': 4.957027435302734} -09/20/2021 16:31:21 - INFO - __main__ - Step 9394: {'lr': 0.00015653333333333333, 'samples': 300608, 'steps': 587, 'loss/train': 4.100807189941406} -09/20/2021 16:31:21 - INFO - __main__ - Step 9395: {'lr': 0.00015653333333333333, 'samples': 300640, 'steps': 587, 'loss/train': 5.241373538970947} -09/20/2021 16:31:22 - INFO - __main__ - Step 9396: {'lr': 0.00015653333333333333, 'samples': 300672, 'steps': 587, 'loss/train': 4.617614269256592} -09/20/2021 16:31:23 - INFO - __main__ - Step 9397: {'lr': 0.00015653333333333333, 'samples': 300704, 'steps': 587, 'loss/train': 2.9725306034088135} -09/20/2021 16:31:24 - INFO - __main__ - Step 9398: {'lr': 0.00015653333333333333, 'samples': 300736, 'steps': 587, 'loss/train': 4.852626800537109} -09/20/2021 16:31:24 - INFO - __main__ - Step 9399: {'lr': 0.00015653333333333333, 'samples': 300768, 'steps': 587, 'loss/train': 2.302398681640625} -09/20/2021 16:31:25 - INFO - __main__ - Step 9400: {'lr': 0.00015653333333333333, 'samples': 300800, 'steps': 587, 'loss/train': 4.747882843017578} -09/20/2021 16:31:26 - INFO - __main__ - Step 9401: {'lr': 0.00015653333333333333, 'samples': 300832, 'steps': 587, 'loss/train': 5.086187362670898} -09/20/2021 16:31:27 - INFO - __main__ - Step 9402: {'lr': 0.00015653333333333333, 'samples': 300864, 'steps': 587, 'loss/train': 4.631653308868408} -09/20/2021 16:31:27 - INFO - __main__ - Step 9403: {'lr': 0.00015653333333333333, 'samples': 300896, 'steps': 587, 'loss/train': 4.644740104675293} -09/20/2021 16:31:28 - INFO - __main__ - Step 9404: {'lr': 0.00015653333333333333, 'samples': 300928, 'steps': 587, 'loss/train': 5.370577335357666} -09/20/2021 16:31:29 - INFO - __main__ - Step 9405: {'lr': 0.00015653333333333333, 'samples': 300960, 'steps': 587, 'loss/train': 4.056272983551025} -09/20/2021 16:31:30 - INFO - __main__ - Step 9406: {'lr': 0.00015653333333333333, 'samples': 300992, 'steps': 587, 'loss/train': 4.253056526184082} -09/20/2021 16:31:31 - INFO - __main__ - Step 9407: {'lr': 0.00015653333333333333, 'samples': 301024, 'steps': 587, 'loss/train': 4.245187282562256} -09/20/2021 16:31:32 - INFO - __main__ - Step 9408: {'lr': 0.00015653333333333333, 'samples': 301056, 'steps': 587, 'loss/train': 4.4184441566467285} -09/20/2021 16:31:33 - INFO - __main__ - Step 9409: {'lr': 0.00015680000000000002, 'samples': 301088, 'steps': 588, 'loss/train': 5.508489608764648} -09/20/2021 16:31:34 - INFO - __main__ - Step 9410: {'lr': 0.00015680000000000002, 'samples': 301120, 'steps': 588, 'loss/train': 4.729679107666016} -09/20/2021 16:31:34 - INFO - __main__ - Step 9411: {'lr': 0.00015680000000000002, 'samples': 301152, 'steps': 588, 'loss/train': 4.143667697906494} -09/20/2021 16:31:35 - INFO - __main__ - Step 9412: {'lr': 0.00015680000000000002, 'samples': 301184, 'steps': 588, 'loss/train': 3.7640678882598877} -09/20/2021 16:31:36 - INFO - __main__ - Step 9413: {'lr': 0.00015680000000000002, 'samples': 301216, 'steps': 588, 'loss/train': 4.262370586395264} -09/20/2021 16:31:37 - INFO - __main__ - Step 9414: {'lr': 0.00015680000000000002, 'samples': 301248, 'steps': 588, 'loss/train': 5.263091087341309} -09/20/2021 16:31:37 - INFO - __main__ - Step 9415: {'lr': 0.00015680000000000002, 'samples': 301280, 'steps': 588, 'loss/train': 5.162417888641357} -09/20/2021 16:31:38 - INFO - __main__ - Step 9416: {'lr': 0.00015680000000000002, 'samples': 301312, 'steps': 588, 'loss/train': 6.030243873596191} -09/20/2021 16:31:39 - INFO - __main__ - Step 9417: {'lr': 0.00015680000000000002, 'samples': 301344, 'steps': 588, 'loss/train': 2.5720407962799072} -09/20/2021 16:31:40 - INFO - __main__ - Step 9418: {'lr': 0.00015680000000000002, 'samples': 301376, 'steps': 588, 'loss/train': 6.51075553894043} -09/20/2021 16:31:40 - INFO - __main__ - Step 9419: {'lr': 0.00015680000000000002, 'samples': 301408, 'steps': 588, 'loss/train': 4.176728248596191} -09/20/2021 16:31:41 - INFO - __main__ - Step 9420: {'lr': 0.00015680000000000002, 'samples': 301440, 'steps': 588, 'loss/train': 0.6930268406867981} -09/20/2021 16:31:42 - INFO - __main__ - Step 9421: {'lr': 0.00015680000000000002, 'samples': 301472, 'steps': 588, 'loss/train': 4.690462589263916} -09/20/2021 16:31:43 - INFO - __main__ - Step 9422: {'lr': 0.00015680000000000002, 'samples': 301504, 'steps': 588, 'loss/train': 7.383231163024902} -09/20/2021 16:31:43 - INFO - __main__ - Step 9423: {'lr': 0.00015680000000000002, 'samples': 301536, 'steps': 588, 'loss/train': 5.833637714385986} -09/20/2021 16:31:44 - INFO - __main__ - Step 9424: {'lr': 0.00015680000000000002, 'samples': 301568, 'steps': 588, 'loss/train': 4.059863090515137} -09/20/2021 16:31:45 - INFO - __main__ - Step 9425: {'lr': 0.00015706666666666667, 'samples': 301600, 'steps': 589, 'loss/train': 4.335049152374268} -09/20/2021 16:31:46 - INFO - __main__ - Step 9426: {'lr': 0.00015706666666666667, 'samples': 301632, 'steps': 589, 'loss/train': 4.5440850257873535} -09/20/2021 16:31:47 - INFO - __main__ - Step 9427: {'lr': 0.00015706666666666667, 'samples': 301664, 'steps': 589, 'loss/train': 4.949906826019287} -09/20/2021 16:31:47 - INFO - __main__ - Step 9428: {'lr': 0.00015706666666666667, 'samples': 301696, 'steps': 589, 'loss/train': 4.353229999542236} -09/20/2021 16:31:48 - INFO - __main__ - Step 9429: {'lr': 0.00015706666666666667, 'samples': 301728, 'steps': 589, 'loss/train': 4.906029224395752} -09/20/2021 16:31:49 - INFO - __main__ - Step 9430: {'lr': 0.00015706666666666667, 'samples': 301760, 'steps': 589, 'loss/train': 4.796454906463623} -09/20/2021 16:31:50 - INFO - __main__ - Step 9431: {'lr': 0.00015706666666666667, 'samples': 301792, 'steps': 589, 'loss/train': 4.312124729156494} -09/20/2021 16:31:50 - INFO - __main__ - Step 9432: {'lr': 0.00015706666666666667, 'samples': 301824, 'steps': 589, 'loss/train': 6.018484115600586} -09/20/2021 16:31:51 - INFO - __main__ - Step 9433: {'lr': 0.00015706666666666667, 'samples': 301856, 'steps': 589, 'loss/train': 4.3232293128967285} -09/20/2021 16:31:52 - INFO - __main__ - Step 9434: {'lr': 0.00015706666666666667, 'samples': 301888, 'steps': 589, 'loss/train': 3.8351948261260986} -09/20/2021 16:31:53 - INFO - __main__ - Step 9435: {'lr': 0.00015706666666666667, 'samples': 301920, 'steps': 589, 'loss/train': 5.155989170074463} -09/20/2021 16:31:53 - INFO - __main__ - Step 9436: {'lr': 0.00015706666666666667, 'samples': 301952, 'steps': 589, 'loss/train': 5.311859130859375} -09/20/2021 16:31:54 - INFO - __main__ - Step 9437: {'lr': 0.00015706666666666667, 'samples': 301984, 'steps': 589, 'loss/train': 3.4678871631622314} -09/20/2021 16:31:55 - INFO - __main__ - Step 9438: {'lr': 0.00015706666666666667, 'samples': 302016, 'steps': 589, 'loss/train': 3.166214942932129} -09/20/2021 16:31:56 - INFO - __main__ - Step 9439: {'lr': 0.00015706666666666667, 'samples': 302048, 'steps': 589, 'loss/train': 3.423630952835083} -09/20/2021 16:31:56 - INFO - __main__ - Step 9440: {'lr': 0.00015706666666666667, 'samples': 302080, 'steps': 589, 'loss/train': 3.446570873260498} -09/20/2021 16:31:57 - INFO - __main__ - Step 9441: {'lr': 0.00015733333333333333, 'samples': 302112, 'steps': 590, 'loss/train': 2.581336736679077} -09/20/2021 16:31:58 - INFO - __main__ - Step 9442: {'lr': 0.00015733333333333333, 'samples': 302144, 'steps': 590, 'loss/train': 2.084639549255371} -09/20/2021 16:31:59 - INFO - __main__ - Step 9443: {'lr': 0.00015733333333333333, 'samples': 302176, 'steps': 590, 'loss/train': 4.055043697357178} -09/20/2021 16:32:00 - INFO - __main__ - Step 9444: {'lr': 0.00015733333333333333, 'samples': 302208, 'steps': 590, 'loss/train': 4.992487907409668} -09/20/2021 16:32:01 - INFO - __main__ - Step 9445: {'lr': 0.00015733333333333333, 'samples': 302240, 'steps': 590, 'loss/train': 5.40080451965332} -09/20/2021 16:32:02 - INFO - __main__ - Step 9446: {'lr': 0.00015733333333333333, 'samples': 302272, 'steps': 590, 'loss/train': 4.271342754364014} -09/20/2021 16:32:02 - INFO - __main__ - Step 9447: {'lr': 0.00015733333333333333, 'samples': 302304, 'steps': 590, 'loss/train': 4.5489373207092285} -09/20/2021 16:32:03 - INFO - __main__ - Step 9448: {'lr': 0.00015733333333333333, 'samples': 302336, 'steps': 590, 'loss/train': 5.314863681793213} -09/20/2021 16:32:04 - INFO - __main__ - Step 9449: {'lr': 0.00015733333333333333, 'samples': 302368, 'steps': 590, 'loss/train': 3.9880151748657227} -09/20/2021 16:32:05 - INFO - __main__ - Step 9450: {'lr': 0.00015733333333333333, 'samples': 302400, 'steps': 590, 'loss/train': 5.196207046508789} -09/20/2021 16:32:05 - INFO - __main__ - Step 9451: {'lr': 0.00015733333333333333, 'samples': 302432, 'steps': 590, 'loss/train': 5.07686710357666} -09/20/2021 16:32:06 - INFO - __main__ - Step 9452: {'lr': 0.00015733333333333333, 'samples': 302464, 'steps': 590, 'loss/train': 4.3953962326049805} -09/20/2021 16:32:07 - INFO - __main__ - Step 9453: {'lr': 0.00015733333333333333, 'samples': 302496, 'steps': 590, 'loss/train': 5.222629070281982} -09/20/2021 16:32:08 - INFO - __main__ - Step 9454: {'lr': 0.00015733333333333333, 'samples': 302528, 'steps': 590, 'loss/train': 4.708476543426514} -09/20/2021 16:32:08 - INFO - __main__ - Step 9455: {'lr': 0.00015733333333333333, 'samples': 302560, 'steps': 590, 'loss/train': 4.5632452964782715} -09/20/2021 16:32:09 - INFO - __main__ - Step 9456: {'lr': 0.00015733333333333333, 'samples': 302592, 'steps': 590, 'loss/train': 4.02946662902832} -09/20/2021 16:32:10 - INFO - __main__ - Step 9457: {'lr': 0.0001576, 'samples': 302624, 'steps': 591, 'loss/train': 4.036014080047607} -09/20/2021 16:32:11 - INFO - __main__ - Step 9458: {'lr': 0.0001576, 'samples': 302656, 'steps': 591, 'loss/train': 5.17730188369751} -09/20/2021 16:32:11 - INFO - __main__ - Step 9459: {'lr': 0.0001576, 'samples': 302688, 'steps': 591, 'loss/train': 4.791169166564941} -09/20/2021 16:32:12 - INFO - __main__ - Step 9460: {'lr': 0.0001576, 'samples': 302720, 'steps': 591, 'loss/train': 4.826863765716553} -09/20/2021 16:32:13 - INFO - __main__ - Step 9461: {'lr': 0.0001576, 'samples': 302752, 'steps': 591, 'loss/train': 3.5293049812316895} -09/20/2021 16:32:14 - INFO - __main__ - Step 9462: {'lr': 0.0001576, 'samples': 302784, 'steps': 591, 'loss/train': 6.2798380851745605} -09/20/2021 16:32:14 - INFO - __main__ - Step 9463: {'lr': 0.0001576, 'samples': 302816, 'steps': 591, 'loss/train': 6.522195339202881} -09/20/2021 16:32:15 - INFO - __main__ - Step 9464: {'lr': 0.0001576, 'samples': 302848, 'steps': 591, 'loss/train': 5.967350006103516} -09/20/2021 16:32:16 - INFO - __main__ - Step 9465: {'lr': 0.0001576, 'samples': 302880, 'steps': 591, 'loss/train': 5.438601016998291} -09/20/2021 16:32:17 - INFO - __main__ - Step 9466: {'lr': 0.0001576, 'samples': 302912, 'steps': 591, 'loss/train': 4.839938640594482} -09/20/2021 16:32:17 - INFO - __main__ - Step 9467: {'lr': 0.0001576, 'samples': 302944, 'steps': 591, 'loss/train': 4.317349433898926} -09/20/2021 16:32:18 - INFO - __main__ - Step 9468: {'lr': 0.0001576, 'samples': 302976, 'steps': 591, 'loss/train': 4.992597579956055} -09/20/2021 16:32:19 - INFO - __main__ - Step 9469: {'lr': 0.0001576, 'samples': 303008, 'steps': 591, 'loss/train': 5.0302581787109375} -09/20/2021 16:32:20 - INFO - __main__ - Step 9470: {'lr': 0.0001576, 'samples': 303040, 'steps': 591, 'loss/train': 4.399410724639893} -09/20/2021 16:32:20 - INFO - __main__ - Step 9471: {'lr': 0.0001576, 'samples': 303072, 'steps': 591, 'loss/train': 4.484638690948486} -09/20/2021 16:32:21 - INFO - __main__ - Step 9472: {'lr': 0.0001576, 'samples': 303104, 'steps': 591, 'loss/train': 4.636609077453613} -09/20/2021 16:32:23 - INFO - __main__ - Step 9473: {'lr': 0.00015786666666666666, 'samples': 303136, 'steps': 592, 'loss/train': 4.437835693359375} -09/20/2021 16:32:23 - INFO - __main__ - Step 9474: {'lr': 0.00015786666666666666, 'samples': 303168, 'steps': 592, 'loss/train': 4.152968406677246} -09/20/2021 16:32:24 - INFO - __main__ - Step 9475: {'lr': 0.00015786666666666666, 'samples': 303200, 'steps': 592, 'loss/train': 5.195725917816162} -09/20/2021 16:32:25 - INFO - __main__ - Step 9476: {'lr': 0.00015786666666666666, 'samples': 303232, 'steps': 592, 'loss/train': 3.901036500930786} -09/20/2021 16:32:26 - INFO - __main__ - Step 9477: {'lr': 0.00015786666666666666, 'samples': 303264, 'steps': 592, 'loss/train': 4.456173896789551} -09/20/2021 16:32:26 - INFO - __main__ - Step 9478: {'lr': 0.00015786666666666666, 'samples': 303296, 'steps': 592, 'loss/train': 4.291168689727783} -09/20/2021 16:32:27 - INFO - __main__ - Step 9479: {'lr': 0.00015786666666666666, 'samples': 303328, 'steps': 592, 'loss/train': 4.537577152252197} -09/20/2021 16:32:28 - INFO - __main__ - Step 9480: {'lr': 0.00015786666666666666, 'samples': 303360, 'steps': 592, 'loss/train': 4.134299278259277} -09/20/2021 16:32:29 - INFO - __main__ - Step 9481: {'lr': 0.00015786666666666666, 'samples': 303392, 'steps': 592, 'loss/train': 4.486248970031738} -09/20/2021 16:32:29 - INFO - __main__ - Step 9482: {'lr': 0.00015786666666666666, 'samples': 303424, 'steps': 592, 'loss/train': 4.8489861488342285} -09/20/2021 16:32:30 - INFO - __main__ - Step 9483: {'lr': 0.00015786666666666666, 'samples': 303456, 'steps': 592, 'loss/train': 4.9666924476623535} -09/20/2021 16:32:31 - INFO - __main__ - Step 9484: {'lr': 0.00015786666666666666, 'samples': 303488, 'steps': 592, 'loss/train': 3.921708345413208} -09/20/2021 16:32:32 - INFO - __main__ - Step 9485: {'lr': 0.00015786666666666666, 'samples': 303520, 'steps': 592, 'loss/train': 5.16762113571167} -09/20/2021 16:32:32 - INFO - __main__ - Step 9486: {'lr': 0.00015786666666666666, 'samples': 303552, 'steps': 592, 'loss/train': 6.457355499267578} -09/20/2021 16:32:33 - INFO - __main__ - Step 9487: {'lr': 0.00015786666666666666, 'samples': 303584, 'steps': 592, 'loss/train': 6.054868698120117} -09/20/2021 16:32:34 - INFO - __main__ - Step 9488: {'lr': 0.00015786666666666666, 'samples': 303616, 'steps': 592, 'loss/train': 4.681726932525635} -09/20/2021 16:32:35 - INFO - __main__ - Step 9489: {'lr': 0.00015813333333333335, 'samples': 303648, 'steps': 593, 'loss/train': 4.460578441619873} -09/20/2021 16:32:36 - INFO - __main__ - Step 9490: {'lr': 0.00015813333333333335, 'samples': 303680, 'steps': 593, 'loss/train': 6.210025787353516} -09/20/2021 16:32:36 - INFO - __main__ - Step 9491: {'lr': 0.00015813333333333335, 'samples': 303712, 'steps': 593, 'loss/train': 3.2314164638519287} -09/20/2021 16:32:37 - INFO - __main__ - Step 9492: {'lr': 0.00015813333333333335, 'samples': 303744, 'steps': 593, 'loss/train': 5.835082530975342} -09/20/2021 16:32:38 - INFO - __main__ - Step 9493: {'lr': 0.00015813333333333335, 'samples': 303776, 'steps': 593, 'loss/train': 4.726351261138916} -09/20/2021 16:32:39 - INFO - __main__ - Step 9494: {'lr': 0.00015813333333333335, 'samples': 303808, 'steps': 593, 'loss/train': 4.9817070960998535} -09/20/2021 16:32:39 - INFO - __main__ - Step 9495: {'lr': 0.00015813333333333335, 'samples': 303840, 'steps': 593, 'loss/train': 4.669632434844971} -09/20/2021 16:32:40 - INFO - __main__ - Step 9496: {'lr': 0.00015813333333333335, 'samples': 303872, 'steps': 593, 'loss/train': 0.9518687129020691} -09/20/2021 16:32:41 - INFO - __main__ - Step 9497: {'lr': 0.00015813333333333335, 'samples': 303904, 'steps': 593, 'loss/train': 4.978538513183594} -09/20/2021 16:32:42 - INFO - __main__ - Step 9498: {'lr': 0.00015813333333333335, 'samples': 303936, 'steps': 593, 'loss/train': 4.0873613357543945} -09/20/2021 16:32:42 - INFO - __main__ - Step 9499: {'lr': 0.00015813333333333335, 'samples': 303968, 'steps': 593, 'loss/train': 3.913262128829956} -09/20/2021 16:32:43 - INFO - __main__ - Step 9500: {'lr': 0.00015813333333333335, 'samples': 304000, 'steps': 593, 'loss/train': 4.081508159637451} -09/20/2021 16:32:44 - INFO - __main__ - Step 9501: {'lr': 0.00015813333333333335, 'samples': 304032, 'steps': 593, 'loss/train': 4.075128078460693} -09/20/2021 16:32:45 - INFO - __main__ - Step 9502: {'lr': 0.00015813333333333335, 'samples': 304064, 'steps': 593, 'loss/train': 4.741560935974121} -09/20/2021 16:32:45 - INFO - __main__ - Step 9503: {'lr': 0.00015813333333333335, 'samples': 304096, 'steps': 593, 'loss/train': 4.82165002822876} -09/20/2021 16:32:46 - INFO - __main__ - Step 9504: {'lr': 0.00015813333333333335, 'samples': 304128, 'steps': 593, 'loss/train': 5.194748401641846} -09/20/2021 16:32:48 - INFO - __main__ - Step 9505: {'lr': 0.00015840000000000003, 'samples': 304160, 'steps': 594, 'loss/train': 3.8669204711914062} -09/20/2021 16:32:48 - INFO - __main__ - Step 9506: {'lr': 0.00015840000000000003, 'samples': 304192, 'steps': 594, 'loss/train': 4.085922718048096} -09/20/2021 16:32:49 - INFO - __main__ - Step 9507: {'lr': 0.00015840000000000003, 'samples': 304224, 'steps': 594, 'loss/train': 4.718973159790039} -09/20/2021 16:32:50 - INFO - __main__ - Step 9508: {'lr': 0.00015840000000000003, 'samples': 304256, 'steps': 594, 'loss/train': 4.772704124450684} -09/20/2021 16:32:51 - INFO - __main__ - Step 9509: {'lr': 0.00015840000000000003, 'samples': 304288, 'steps': 594, 'loss/train': 4.102306842803955} -09/20/2021 16:32:51 - INFO - __main__ - Step 9510: {'lr': 0.00015840000000000003, 'samples': 304320, 'steps': 594, 'loss/train': 4.695287227630615} -09/20/2021 16:32:52 - INFO - __main__ - Step 9511: {'lr': 0.00015840000000000003, 'samples': 304352, 'steps': 594, 'loss/train': 4.730114459991455} -09/20/2021 16:32:53 - INFO - __main__ - Step 9512: {'lr': 0.00015840000000000003, 'samples': 304384, 'steps': 594, 'loss/train': 4.492393970489502} -09/20/2021 16:32:54 - INFO - __main__ - Step 9513: {'lr': 0.00015840000000000003, 'samples': 304416, 'steps': 594, 'loss/train': 4.4377217292785645} -09/20/2021 16:32:54 - INFO - __main__ - Step 9514: {'lr': 0.00015840000000000003, 'samples': 304448, 'steps': 594, 'loss/train': 4.210892200469971} -09/20/2021 16:32:55 - INFO - __main__ - Step 9515: {'lr': 0.00015840000000000003, 'samples': 304480, 'steps': 594, 'loss/train': 5.030020236968994} -09/20/2021 16:32:56 - INFO - __main__ - Step 9516: {'lr': 0.00015840000000000003, 'samples': 304512, 'steps': 594, 'loss/train': 4.647110462188721} -09/20/2021 16:32:57 - INFO - __main__ - Step 9517: {'lr': 0.00015840000000000003, 'samples': 304544, 'steps': 594, 'loss/train': 4.006067752838135} -09/20/2021 16:32:57 - INFO - __main__ - Step 9518: {'lr': 0.00015840000000000003, 'samples': 304576, 'steps': 594, 'loss/train': 4.256843566894531} -09/20/2021 16:32:58 - INFO - __main__ - Step 9519: {'lr': 0.00015840000000000003, 'samples': 304608, 'steps': 594, 'loss/train': 3.774951219558716} -09/20/2021 16:32:59 - INFO - __main__ - Step 9520: {'lr': 0.00015840000000000003, 'samples': 304640, 'steps': 594, 'loss/train': 4.460005760192871} -09/20/2021 16:33:00 - INFO - __main__ - Step 9521: {'lr': 0.00015866666666666668, 'samples': 304672, 'steps': 595, 'loss/train': 3.656355857849121} -09/20/2021 16:33:00 - INFO - __main__ - Step 9522: {'lr': 0.00015866666666666668, 'samples': 304704, 'steps': 595, 'loss/train': 4.50439977645874} -09/20/2021 16:33:01 - INFO - __main__ - Step 9523: {'lr': 0.00015866666666666668, 'samples': 304736, 'steps': 595, 'loss/train': 6.194570541381836} -09/20/2021 16:33:02 - INFO - __main__ - Step 9524: {'lr': 0.00015866666666666668, 'samples': 304768, 'steps': 595, 'loss/train': 4.88549280166626} -09/20/2021 16:33:03 - INFO - __main__ - Step 9525: {'lr': 0.00015866666666666668, 'samples': 304800, 'steps': 595, 'loss/train': 5.457211494445801} -09/20/2021 16:33:03 - INFO - __main__ - Step 9526: {'lr': 0.00015866666666666668, 'samples': 304832, 'steps': 595, 'loss/train': 4.712647438049316} -09/20/2021 16:33:04 - INFO - __main__ - Step 9527: {'lr': 0.00015866666666666668, 'samples': 304864, 'steps': 595, 'loss/train': 5.409646987915039} -09/20/2021 16:33:05 - INFO - __main__ - Step 9528: {'lr': 0.00015866666666666668, 'samples': 304896, 'steps': 595, 'loss/train': 5.279347896575928} -09/20/2021 16:33:06 - INFO - __main__ - Step 9529: {'lr': 0.00015866666666666668, 'samples': 304928, 'steps': 595, 'loss/train': 3.813539505004883} -09/20/2021 16:33:06 - INFO - __main__ - Step 9530: {'lr': 0.00015866666666666668, 'samples': 304960, 'steps': 595, 'loss/train': 4.315881252288818} -09/20/2021 16:33:07 - INFO - __main__ - Step 9531: {'lr': 0.00015866666666666668, 'samples': 304992, 'steps': 595, 'loss/train': 2.1488988399505615} -09/20/2021 16:33:08 - INFO - __main__ - Step 9532: {'lr': 0.00015866666666666668, 'samples': 305024, 'steps': 595, 'loss/train': 2.012075185775757} -09/20/2021 16:33:09 - INFO - __main__ - Step 9533: {'lr': 0.00015866666666666668, 'samples': 305056, 'steps': 595, 'loss/train': 4.211091995239258} -09/20/2021 16:33:09 - INFO - __main__ - Step 9534: {'lr': 0.00015866666666666668, 'samples': 305088, 'steps': 595, 'loss/train': 5.9193339347839355} -09/20/2021 16:33:11 - INFO - __main__ - Step 9535: {'lr': 0.00015866666666666668, 'samples': 305120, 'steps': 595, 'loss/train': 4.903415679931641} -09/20/2021 16:33:11 - INFO - __main__ - Step 9536: {'lr': 0.00015866666666666668, 'samples': 305152, 'steps': 595, 'loss/train': 6.38132905960083} -09/20/2021 16:33:12 - INFO - __main__ - Step 9537: {'lr': 0.00015893333333333334, 'samples': 305184, 'steps': 596, 'loss/train': 3.992365837097168} -09/20/2021 16:33:13 - INFO - __main__ - Step 9538: {'lr': 0.00015893333333333334, 'samples': 305216, 'steps': 596, 'loss/train': 4.360015869140625} -09/20/2021 16:33:14 - INFO - __main__ - Step 9539: {'lr': 0.00015893333333333334, 'samples': 305248, 'steps': 596, 'loss/train': 4.319106578826904} -09/20/2021 16:33:15 - INFO - __main__ - Step 9540: {'lr': 0.00015893333333333334, 'samples': 305280, 'steps': 596, 'loss/train': 4.328796863555908} -09/20/2021 16:33:15 - INFO - __main__ - Step 9541: {'lr': 0.00015893333333333334, 'samples': 305312, 'steps': 596, 'loss/train': 3.7932729721069336} -09/20/2021 16:33:16 - INFO - __main__ - Step 9542: {'lr': 0.00015893333333333334, 'samples': 305344, 'steps': 596, 'loss/train': 3.9988133907318115} -09/20/2021 16:33:17 - INFO - __main__ - Step 9543: {'lr': 0.00015893333333333334, 'samples': 305376, 'steps': 596, 'loss/train': 5.443305015563965} -09/20/2021 16:33:18 - INFO - __main__ - Step 9544: {'lr': 0.00015893333333333334, 'samples': 305408, 'steps': 596, 'loss/train': 5.34959077835083} -09/20/2021 16:33:18 - INFO - __main__ - Step 9545: {'lr': 0.00015893333333333334, 'samples': 305440, 'steps': 596, 'loss/train': 5.3357086181640625} -09/20/2021 16:33:19 - INFO - __main__ - Step 9546: {'lr': 0.00015893333333333334, 'samples': 305472, 'steps': 596, 'loss/train': 4.679216384887695} -09/20/2021 16:33:20 - INFO - __main__ - Step 9547: {'lr': 0.00015893333333333334, 'samples': 305504, 'steps': 596, 'loss/train': 4.586813926696777} -09/20/2021 16:33:21 - INFO - __main__ - Step 9548: {'lr': 0.00015893333333333334, 'samples': 305536, 'steps': 596, 'loss/train': 5.153166770935059} -09/20/2021 16:33:21 - INFO - __main__ - Step 9549: {'lr': 0.00015893333333333334, 'samples': 305568, 'steps': 596, 'loss/train': 4.949374675750732} -09/20/2021 16:33:22 - INFO - __main__ - Step 9550: {'lr': 0.00015893333333333334, 'samples': 305600, 'steps': 596, 'loss/train': 4.373086929321289} -09/20/2021 16:33:23 - INFO - __main__ - Step 9551: {'lr': 0.00015893333333333334, 'samples': 305632, 'steps': 596, 'loss/train': 5.241957664489746} -09/20/2021 16:33:24 - INFO - __main__ - Step 9552: {'lr': 0.00015893333333333334, 'samples': 305664, 'steps': 596, 'loss/train': 4.857705116271973} -09/20/2021 16:33:24 - INFO - __main__ - Step 9553: {'lr': 0.00015920000000000002, 'samples': 305696, 'steps': 597, 'loss/train': 4.421994686126709} -09/20/2021 16:33:25 - INFO - __main__ - Step 9554: {'lr': 0.00015920000000000002, 'samples': 305728, 'steps': 597, 'loss/train': 4.614131450653076} -09/20/2021 16:33:26 - INFO - __main__ - Step 9555: {'lr': 0.00015920000000000002, 'samples': 305760, 'steps': 597, 'loss/train': 5.9738335609436035} -09/20/2021 16:33:27 - INFO - __main__ - Step 9556: {'lr': 0.00015920000000000002, 'samples': 305792, 'steps': 597, 'loss/train': 4.581900596618652} -09/20/2021 16:33:27 - INFO - __main__ - Step 9557: {'lr': 0.00015920000000000002, 'samples': 305824, 'steps': 597, 'loss/train': 3.656297206878662} -09/20/2021 16:33:28 - INFO - __main__ - Step 9558: {'lr': 0.00015920000000000002, 'samples': 305856, 'steps': 597, 'loss/train': 4.298595428466797} -09/20/2021 16:33:29 - INFO - __main__ - Step 9559: {'lr': 0.00015920000000000002, 'samples': 305888, 'steps': 597, 'loss/train': 4.731559753417969} -09/20/2021 16:33:30 - INFO - __main__ - Step 9560: {'lr': 0.00015920000000000002, 'samples': 305920, 'steps': 597, 'loss/train': 4.032661437988281} -09/20/2021 16:33:30 - INFO - __main__ - Step 9561: {'lr': 0.00015920000000000002, 'samples': 305952, 'steps': 597, 'loss/train': 4.537276268005371} -09/20/2021 16:33:31 - INFO - __main__ - Step 9562: {'lr': 0.00015920000000000002, 'samples': 305984, 'steps': 597, 'loss/train': 4.523667335510254} -09/20/2021 16:33:32 - INFO - __main__ - Step 9563: {'lr': 0.00015920000000000002, 'samples': 306016, 'steps': 597, 'loss/train': 5.317408561706543} -09/20/2021 16:33:33 - INFO - __main__ - Step 9564: {'lr': 0.00015920000000000002, 'samples': 306048, 'steps': 597, 'loss/train': 4.3603668212890625} -09/20/2021 16:33:33 - INFO - __main__ - Step 9565: {'lr': 0.00015920000000000002, 'samples': 306080, 'steps': 597, 'loss/train': 5.131959438323975} -09/20/2021 16:33:35 - INFO - __main__ - Step 9566: {'lr': 0.00015920000000000002, 'samples': 306112, 'steps': 597, 'loss/train': 3.323962926864624} -09/20/2021 16:33:36 - INFO - __main__ - Step 9567: {'lr': 0.00015920000000000002, 'samples': 306144, 'steps': 597, 'loss/train': 5.02057409286499} -09/20/2021 16:33:36 - INFO - __main__ - Step 9568: {'lr': 0.00015920000000000002, 'samples': 306176, 'steps': 597, 'loss/train': 5.491189956665039} -09/20/2021 16:33:37 - INFO - __main__ - Step 9569: {'lr': 0.00015946666666666668, 'samples': 306208, 'steps': 598, 'loss/train': 5.015308380126953} -09/20/2021 16:33:38 - INFO - __main__ - Step 9570: {'lr': 0.00015946666666666668, 'samples': 306240, 'steps': 598, 'loss/train': 4.7790350914001465} -09/20/2021 16:33:39 - INFO - __main__ - Step 9571: {'lr': 0.00015946666666666668, 'samples': 306272, 'steps': 598, 'loss/train': 5.337977409362793} -09/20/2021 16:33:39 - INFO - __main__ - Step 9572: {'lr': 0.00015946666666666668, 'samples': 306304, 'steps': 598, 'loss/train': 5.189072132110596} -09/20/2021 16:33:40 - INFO - __main__ - Step 9573: {'lr': 0.00015946666666666668, 'samples': 306336, 'steps': 598, 'loss/train': 4.504708290100098} -09/20/2021 16:33:41 - INFO - __main__ - Step 9574: {'lr': 0.00015946666666666668, 'samples': 306368, 'steps': 598, 'loss/train': 5.169275760650635} -09/20/2021 16:33:42 - INFO - __main__ - Step 9575: {'lr': 0.00015946666666666668, 'samples': 306400, 'steps': 598, 'loss/train': 4.489861488342285} -09/20/2021 16:33:42 - INFO - __main__ - Step 9576: {'lr': 0.00015946666666666668, 'samples': 306432, 'steps': 598, 'loss/train': 4.075072288513184} -09/20/2021 16:33:43 - INFO - __main__ - Step 9577: {'lr': 0.00015946666666666668, 'samples': 306464, 'steps': 598, 'loss/train': 4.397602081298828} -09/20/2021 16:33:44 - INFO - __main__ - Step 9578: {'lr': 0.00015946666666666668, 'samples': 306496, 'steps': 598, 'loss/train': 5.127641677856445} -09/20/2021 16:33:45 - INFO - __main__ - Step 9579: {'lr': 0.00015946666666666668, 'samples': 306528, 'steps': 598, 'loss/train': 5.705199241638184} -09/20/2021 16:33:45 - INFO - __main__ - Step 9580: {'lr': 0.00015946666666666668, 'samples': 306560, 'steps': 598, 'loss/train': 4.43613862991333} -09/20/2021 16:33:46 - INFO - __main__ - Step 9581: {'lr': 0.00015946666666666668, 'samples': 306592, 'steps': 598, 'loss/train': 4.24114465713501} -09/20/2021 16:33:47 - INFO - __main__ - Step 9582: {'lr': 0.00015946666666666668, 'samples': 306624, 'steps': 598, 'loss/train': 4.247201442718506} -09/20/2021 16:33:48 - INFO - __main__ - Step 9583: {'lr': 0.00015946666666666668, 'samples': 306656, 'steps': 598, 'loss/train': 4.827347755432129} -09/20/2021 16:33:48 - INFO - __main__ - Step 9584: {'lr': 0.00015946666666666668, 'samples': 306688, 'steps': 598, 'loss/train': 4.763698101043701} -09/20/2021 16:33:49 - INFO - __main__ - Step 9585: {'lr': 0.00015973333333333333, 'samples': 306720, 'steps': 599, 'loss/train': 4.888095855712891} -09/20/2021 16:33:50 - INFO - __main__ - Step 9586: {'lr': 0.00015973333333333333, 'samples': 306752, 'steps': 599, 'loss/train': 4.6192731857299805} -09/20/2021 16:33:51 - INFO - __main__ - Step 9587: {'lr': 0.00015973333333333333, 'samples': 306784, 'steps': 599, 'loss/train': 4.516692638397217} -09/20/2021 16:33:52 - INFO - __main__ - Step 9588: {'lr': 0.00015973333333333333, 'samples': 306816, 'steps': 599, 'loss/train': 4.459847927093506} -09/20/2021 16:33:52 - INFO - __main__ - Step 9589: {'lr': 0.00015973333333333333, 'samples': 306848, 'steps': 599, 'loss/train': 4.813413143157959} -09/20/2021 16:33:53 - INFO - __main__ - Step 9590: {'lr': 0.00015973333333333333, 'samples': 306880, 'steps': 599, 'loss/train': 5.365158557891846} -09/20/2021 16:33:54 - INFO - __main__ - Step 9591: {'lr': 0.00015973333333333333, 'samples': 306912, 'steps': 599, 'loss/train': 4.287588119506836} -09/20/2021 16:33:55 - INFO - __main__ - Step 9592: {'lr': 0.00015973333333333333, 'samples': 306944, 'steps': 599, 'loss/train': 4.700772285461426} -09/20/2021 16:33:55 - INFO - __main__ - Step 9593: {'lr': 0.00015973333333333333, 'samples': 306976, 'steps': 599, 'loss/train': 3.7850682735443115} -09/20/2021 16:33:56 - INFO - __main__ - Step 9594: {'lr': 0.00015973333333333333, 'samples': 307008, 'steps': 599, 'loss/train': 5.1419358253479} -09/20/2021 16:33:57 - INFO - __main__ - Step 9595: {'lr': 0.00015973333333333333, 'samples': 307040, 'steps': 599, 'loss/train': 4.06008768081665} -09/20/2021 16:33:58 - INFO - __main__ - Step 9596: {'lr': 0.00015973333333333333, 'samples': 307072, 'steps': 599, 'loss/train': 5.581484317779541} -09/20/2021 16:33:59 - INFO - __main__ - Step 9597: {'lr': 0.00015973333333333333, 'samples': 307104, 'steps': 599, 'loss/train': 4.49293851852417} -09/20/2021 16:34:00 - INFO - __main__ - Step 9598: {'lr': 0.00015973333333333333, 'samples': 307136, 'steps': 599, 'loss/train': 4.376172065734863} -09/20/2021 16:34:00 - INFO - __main__ - Step 9599: {'lr': 0.00015973333333333333, 'samples': 307168, 'steps': 599, 'loss/train': 4.70913028717041} -09/20/2021 16:34:01 - INFO - __main__ - Step 9600: {'lr': 0.00015973333333333333, 'samples': 307200, 'steps': 599, 'loss/train': 4.543754577636719} -09/20/2021 16:34:02 - INFO - __main__ - Step 9601: {'lr': 0.00016, 'samples': 307232, 'steps': 600, 'loss/train': 3.9507696628570557} -09/20/2021 16:34:03 - INFO - __main__ - Step 9602: {'lr': 0.00016, 'samples': 307264, 'steps': 600, 'loss/train': 4.403048992156982} -09/20/2021 16:34:03 - INFO - __main__ - Step 9603: {'lr': 0.00016, 'samples': 307296, 'steps': 600, 'loss/train': 5.195565700531006} -09/20/2021 16:34:04 - INFO - __main__ - Step 9604: {'lr': 0.00016, 'samples': 307328, 'steps': 600, 'loss/train': 4.211541652679443} -09/20/2021 16:34:05 - INFO - __main__ - Step 9605: {'lr': 0.00016, 'samples': 307360, 'steps': 600, 'loss/train': 4.391272068023682} -09/20/2021 16:34:06 - INFO - __main__ - Step 9606: {'lr': 0.00016, 'samples': 307392, 'steps': 600, 'loss/train': 5.069795608520508} -09/20/2021 16:34:06 - INFO - __main__ - Step 9607: {'lr': 0.00016, 'samples': 307424, 'steps': 600, 'loss/train': 4.437841415405273} -09/20/2021 16:34:07 - INFO - __main__ - Step 9608: {'lr': 0.00016, 'samples': 307456, 'steps': 600, 'loss/train': 4.044817924499512} -09/20/2021 16:34:08 - INFO - __main__ - Step 9609: {'lr': 0.00016, 'samples': 307488, 'steps': 600, 'loss/train': 5.0226030349731445} -09/20/2021 16:34:09 - INFO - __main__ - Step 9610: {'lr': 0.00016, 'samples': 307520, 'steps': 600, 'loss/train': 4.166698932647705} -09/20/2021 16:34:09 - INFO - __main__ - Step 9611: {'lr': 0.00016, 'samples': 307552, 'steps': 600, 'loss/train': 4.702640533447266} -09/20/2021 16:34:10 - INFO - __main__ - Step 9612: {'lr': 0.00016, 'samples': 307584, 'steps': 600, 'loss/train': 4.377586841583252} -09/20/2021 16:34:11 - INFO - __main__ - Step 9613: {'lr': 0.00016, 'samples': 307616, 'steps': 600, 'loss/train': 4.874180793762207} -09/20/2021 16:34:12 - INFO - __main__ - Step 9614: {'lr': 0.00016, 'samples': 307648, 'steps': 600, 'loss/train': 3.925393581390381} -09/20/2021 16:34:12 - INFO - __main__ - Step 9615: {'lr': 0.00016, 'samples': 307680, 'steps': 600, 'loss/train': 3.6908669471740723} -09/20/2021 16:34:13 - INFO - __main__ - Step 9616: {'lr': 0.00016, 'samples': 307712, 'steps': 600, 'loss/train': 5.219935417175293} -09/20/2021 16:34:14 - INFO - __main__ - Step 9617: {'lr': 0.00016026666666666667, 'samples': 307744, 'steps': 601, 'loss/train': 4.096340179443359} -09/20/2021 16:34:15 - INFO - __main__ - Step 9618: {'lr': 0.00016026666666666667, 'samples': 307776, 'steps': 601, 'loss/train': 2.7557849884033203} -09/20/2021 16:34:16 - INFO - __main__ - Step 9619: {'lr': 0.00016026666666666667, 'samples': 307808, 'steps': 601, 'loss/train': 4.7109479904174805} -09/20/2021 16:34:16 - INFO - __main__ - Step 9620: {'lr': 0.00016026666666666667, 'samples': 307840, 'steps': 601, 'loss/train': 5.211875915527344} -09/20/2021 16:34:17 - INFO - __main__ - Step 9621: {'lr': 0.00016026666666666667, 'samples': 307872, 'steps': 601, 'loss/train': 3.072206974029541} -09/20/2021 16:34:18 - INFO - __main__ - Step 9622: {'lr': 0.00016026666666666667, 'samples': 307904, 'steps': 601, 'loss/train': 4.186412811279297} -09/20/2021 16:34:19 - INFO - __main__ - Step 9623: {'lr': 0.00016026666666666667, 'samples': 307936, 'steps': 601, 'loss/train': 4.289722919464111} -09/20/2021 16:34:19 - INFO - __main__ - Step 9624: {'lr': 0.00016026666666666667, 'samples': 307968, 'steps': 601, 'loss/train': 3.6811630725860596} -09/20/2021 16:34:20 - INFO - __main__ - Step 9625: {'lr': 0.00016026666666666667, 'samples': 308000, 'steps': 601, 'loss/train': 4.411168098449707} -09/20/2021 16:34:21 - INFO - __main__ - Step 9626: {'lr': 0.00016026666666666667, 'samples': 308032, 'steps': 601, 'loss/train': 4.764659881591797} -09/20/2021 16:34:22 - INFO - __main__ - Step 9627: {'lr': 0.00016026666666666667, 'samples': 308064, 'steps': 601, 'loss/train': 4.564080238342285} -09/20/2021 16:34:22 - INFO - __main__ - Step 9628: {'lr': 0.00016026666666666667, 'samples': 308096, 'steps': 601, 'loss/train': 4.527450084686279} -09/20/2021 16:34:24 - INFO - __main__ - Step 9629: {'lr': 0.00016026666666666667, 'samples': 308128, 'steps': 601, 'loss/train': 4.062946796417236} -09/20/2021 16:34:25 - INFO - __main__ - Step 9630: {'lr': 0.00016026666666666667, 'samples': 308160, 'steps': 601, 'loss/train': 4.82744836807251} -09/20/2021 16:34:25 - INFO - __main__ - Step 9631: {'lr': 0.00016026666666666667, 'samples': 308192, 'steps': 601, 'loss/train': 4.607547760009766} -09/20/2021 16:34:26 - INFO - __main__ - Step 9632: {'lr': 0.00016026666666666667, 'samples': 308224, 'steps': 601, 'loss/train': 3.979283094406128} -09/20/2021 16:34:27 - INFO - __main__ - Step 9633: {'lr': 0.00016053333333333332, 'samples': 308256, 'steps': 602, 'loss/train': 4.254997730255127} -09/20/2021 16:34:28 - INFO - __main__ - Step 9634: {'lr': 0.00016053333333333332, 'samples': 308288, 'steps': 602, 'loss/train': 4.274353504180908} -09/20/2021 16:34:28 - INFO - __main__ - Step 9635: {'lr': 0.00016053333333333332, 'samples': 308320, 'steps': 602, 'loss/train': 4.3507795333862305} -09/20/2021 16:34:29 - INFO - __main__ - Step 9636: {'lr': 0.00016053333333333332, 'samples': 308352, 'steps': 602, 'loss/train': 4.377114772796631} -09/20/2021 16:34:30 - INFO - __main__ - Step 9637: {'lr': 0.00016053333333333332, 'samples': 308384, 'steps': 602, 'loss/train': 4.90697717666626} -09/20/2021 16:34:31 - INFO - __main__ - Step 9638: {'lr': 0.00016053333333333332, 'samples': 308416, 'steps': 602, 'loss/train': 5.224609851837158} -09/20/2021 16:34:31 - INFO - __main__ - Step 9639: {'lr': 0.00016053333333333332, 'samples': 308448, 'steps': 602, 'loss/train': 4.256809711456299} -09/20/2021 16:34:32 - INFO - __main__ - Step 9640: {'lr': 0.00016053333333333332, 'samples': 308480, 'steps': 602, 'loss/train': 6.6805195808410645} -09/20/2021 16:34:33 - INFO - __main__ - Step 9641: {'lr': 0.00016053333333333332, 'samples': 308512, 'steps': 602, 'loss/train': 4.76017951965332} -09/20/2021 16:34:34 - INFO - __main__ - Step 9642: {'lr': 0.00016053333333333332, 'samples': 308544, 'steps': 602, 'loss/train': 4.045232772827148} -09/20/2021 16:34:34 - INFO - __main__ - Step 9643: {'lr': 0.00016053333333333332, 'samples': 308576, 'steps': 602, 'loss/train': 4.670497417449951} -09/20/2021 16:34:35 - INFO - __main__ - Step 9644: {'lr': 0.00016053333333333332, 'samples': 308608, 'steps': 602, 'loss/train': 4.40716028213501} -09/20/2021 16:34:36 - INFO - __main__ - Step 9645: {'lr': 0.00016053333333333332, 'samples': 308640, 'steps': 602, 'loss/train': 4.850952625274658} -09/20/2021 16:34:37 - INFO - __main__ - Step 9646: {'lr': 0.00016053333333333332, 'samples': 308672, 'steps': 602, 'loss/train': 5.725254058837891} -09/20/2021 16:34:37 - INFO - __main__ - Step 9647: {'lr': 0.00016053333333333332, 'samples': 308704, 'steps': 602, 'loss/train': 5.894286155700684} -09/20/2021 16:34:38 - INFO - __main__ - Step 9648: {'lr': 0.00016053333333333332, 'samples': 308736, 'steps': 602, 'loss/train': 5.496121883392334} -09/20/2021 16:34:39 - INFO - __main__ - Step 9649: {'lr': 0.0001608, 'samples': 308768, 'steps': 603, 'loss/train': 4.639679431915283} -09/20/2021 16:34:40 - INFO - __main__ - Step 9650: {'lr': 0.0001608, 'samples': 308800, 'steps': 603, 'loss/train': 4.147747993469238} -09/20/2021 16:34:41 - INFO - __main__ - Step 9651: {'lr': 0.0001608, 'samples': 308832, 'steps': 603, 'loss/train': 4.43212890625} -09/20/2021 16:34:41 - INFO - __main__ - Step 9652: {'lr': 0.0001608, 'samples': 308864, 'steps': 603, 'loss/train': 4.024624824523926} -09/20/2021 16:34:42 - INFO - __main__ - Step 9653: {'lr': 0.0001608, 'samples': 308896, 'steps': 603, 'loss/train': 4.51198148727417} -09/20/2021 16:34:43 - INFO - __main__ - Step 9654: {'lr': 0.0001608, 'samples': 308928, 'steps': 603, 'loss/train': 4.057615756988525} -09/20/2021 16:34:44 - INFO - __main__ - Step 9655: {'lr': 0.0001608, 'samples': 308960, 'steps': 603, 'loss/train': 4.389288425445557} -09/20/2021 16:34:44 - INFO - __main__ - Step 9656: {'lr': 0.0001608, 'samples': 308992, 'steps': 603, 'loss/train': 5.363722801208496} -09/20/2021 16:34:45 - INFO - __main__ - Step 9657: {'lr': 0.0001608, 'samples': 309024, 'steps': 603, 'loss/train': 4.196804046630859} -09/20/2021 16:34:46 - INFO - __main__ - Step 9658: {'lr': 0.0001608, 'samples': 309056, 'steps': 603, 'loss/train': 6.039022922515869} -09/20/2021 16:34:48 - INFO - __main__ - Step 9659: {'lr': 0.0001608, 'samples': 309088, 'steps': 603, 'loss/train': 4.042257308959961} -09/20/2021 16:34:48 - INFO - __main__ - Step 9660: {'lr': 0.0001608, 'samples': 309120, 'steps': 603, 'loss/train': 4.9129319190979} -09/20/2021 16:34:49 - INFO - __main__ - Step 9661: {'lr': 0.0001608, 'samples': 309152, 'steps': 603, 'loss/train': 5.1608662605285645} -09/20/2021 16:34:50 - INFO - __main__ - Step 9662: {'lr': 0.0001608, 'samples': 309184, 'steps': 603, 'loss/train': 5.182137966156006} -09/20/2021 16:34:51 - INFO - __main__ - Step 9663: {'lr': 0.0001608, 'samples': 309216, 'steps': 603, 'loss/train': 4.4384026527404785} -09/20/2021 16:34:51 - INFO - __main__ - Step 9664: {'lr': 0.0001608, 'samples': 309248, 'steps': 603, 'loss/train': 4.7546892166137695} -09/20/2021 16:34:52 - INFO - __main__ - Step 9665: {'lr': 0.0001610666666666667, 'samples': 309280, 'steps': 604, 'loss/train': 3.542492628097534} -09/20/2021 16:34:53 - INFO - __main__ - Step 9666: {'lr': 0.0001610666666666667, 'samples': 309312, 'steps': 604, 'loss/train': 4.082633972167969} -09/20/2021 16:34:54 - INFO - __main__ - Step 9667: {'lr': 0.0001610666666666667, 'samples': 309344, 'steps': 604, 'loss/train': 4.6408281326293945} -09/20/2021 16:34:54 - INFO - __main__ - Step 9668: {'lr': 0.0001610666666666667, 'samples': 309376, 'steps': 604, 'loss/train': 5.262568950653076} -09/20/2021 16:34:55 - INFO - __main__ - Step 9669: {'lr': 0.0001610666666666667, 'samples': 309408, 'steps': 604, 'loss/train': 5.001911163330078} -09/20/2021 16:34:56 - INFO - __main__ - Step 9670: {'lr': 0.0001610666666666667, 'samples': 309440, 'steps': 604, 'loss/train': 4.5392374992370605} -09/20/2021 16:34:57 - INFO - __main__ - Step 9671: {'lr': 0.0001610666666666667, 'samples': 309472, 'steps': 604, 'loss/train': 5.128146648406982} -09/20/2021 16:34:57 - INFO - __main__ - Step 9672: {'lr': 0.0001610666666666667, 'samples': 309504, 'steps': 604, 'loss/train': 4.015884876251221} -09/20/2021 16:34:58 - INFO - __main__ - Step 9673: {'lr': 0.0001610666666666667, 'samples': 309536, 'steps': 604, 'loss/train': 4.420529842376709} -09/20/2021 16:34:59 - INFO - __main__ - Step 9674: {'lr': 0.0001610666666666667, 'samples': 309568, 'steps': 604, 'loss/train': 4.569782257080078} -09/20/2021 16:35:00 - INFO - __main__ - Step 9675: {'lr': 0.0001610666666666667, 'samples': 309600, 'steps': 604, 'loss/train': 2.4926888942718506} -09/20/2021 16:35:00 - INFO - __main__ - Step 9676: {'lr': 0.0001610666666666667, 'samples': 309632, 'steps': 604, 'loss/train': 5.457167148590088} -09/20/2021 16:35:01 - INFO - __main__ - Step 9677: {'lr': 0.0001610666666666667, 'samples': 309664, 'steps': 604, 'loss/train': 4.490167140960693} -09/20/2021 16:35:02 - INFO - __main__ - Step 9678: {'lr': 0.0001610666666666667, 'samples': 309696, 'steps': 604, 'loss/train': 4.577218532562256} -09/20/2021 16:35:03 - INFO - __main__ - Step 9679: {'lr': 0.0001610666666666667, 'samples': 309728, 'steps': 604, 'loss/train': 3.015275001525879} -09/20/2021 16:35:03 - INFO - __main__ - Step 9680: {'lr': 0.0001610666666666667, 'samples': 309760, 'steps': 604, 'loss/train': 4.181816577911377} -09/20/2021 16:35:04 - INFO - __main__ - Step 9681: {'lr': 0.00016133333333333334, 'samples': 309792, 'steps': 605, 'loss/train': 4.110971450805664} -09/20/2021 16:35:05 - INFO - __main__ - Step 9682: {'lr': 0.00016133333333333334, 'samples': 309824, 'steps': 605, 'loss/train': 4.258848667144775} -09/20/2021 16:35:06 - INFO - __main__ - Step 9683: {'lr': 0.00016133333333333334, 'samples': 309856, 'steps': 605, 'loss/train': 4.38545560836792} -09/20/2021 16:35:07 - INFO - __main__ - Step 9684: {'lr': 0.00016133333333333334, 'samples': 309888, 'steps': 605, 'loss/train': 4.50836706161499} -09/20/2021 16:35:07 - INFO - __main__ - Step 9685: {'lr': 0.00016133333333333334, 'samples': 309920, 'steps': 605, 'loss/train': 4.840784072875977} -09/20/2021 16:35:08 - INFO - __main__ - Step 9686: {'lr': 0.00016133333333333334, 'samples': 309952, 'steps': 605, 'loss/train': 4.739279747009277} -09/20/2021 16:35:09 - INFO - __main__ - Step 9687: {'lr': 0.00016133333333333334, 'samples': 309984, 'steps': 605, 'loss/train': 4.335422515869141} -09/20/2021 16:35:10 - INFO - __main__ - Step 9688: {'lr': 0.00016133333333333334, 'samples': 310016, 'steps': 605, 'loss/train': 4.026561260223389} -09/20/2021 16:35:11 - INFO - __main__ - Step 9689: {'lr': 0.00016133333333333334, 'samples': 310048, 'steps': 605, 'loss/train': 4.781574726104736} -09/20/2021 16:35:12 - INFO - __main__ - Step 9690: {'lr': 0.00016133333333333334, 'samples': 310080, 'steps': 605, 'loss/train': 5.408544063568115} -09/20/2021 16:35:12 - INFO - __main__ - Step 9691: {'lr': 0.00016133333333333334, 'samples': 310112, 'steps': 605, 'loss/train': 4.456814289093018} -09/20/2021 16:35:13 - INFO - __main__ - Step 9692: {'lr': 0.00016133333333333334, 'samples': 310144, 'steps': 605, 'loss/train': 5.026973724365234} -09/20/2021 16:35:14 - INFO - __main__ - Step 9693: {'lr': 0.00016133333333333334, 'samples': 310176, 'steps': 605, 'loss/train': 5.753762722015381} -09/20/2021 16:35:15 - INFO - __main__ - Step 9694: {'lr': 0.00016133333333333334, 'samples': 310208, 'steps': 605, 'loss/train': 5.080402374267578} -09/20/2021 16:35:15 - INFO - __main__ - Step 9695: {'lr': 0.00016133333333333334, 'samples': 310240, 'steps': 605, 'loss/train': 3.824071168899536} -09/20/2021 16:35:16 - INFO - __main__ - Step 9696: {'lr': 0.00016133333333333334, 'samples': 310272, 'steps': 605, 'loss/train': 5.063183784484863} -09/20/2021 16:35:17 - INFO - __main__ - Step 9697: {'lr': 0.00016160000000000002, 'samples': 310304, 'steps': 606, 'loss/train': 4.416193008422852} -09/20/2021 16:35:18 - INFO - __main__ - Step 9698: {'lr': 0.00016160000000000002, 'samples': 310336, 'steps': 606, 'loss/train': 4.975937366485596} -09/20/2021 16:35:19 - INFO - __main__ - Step 9699: {'lr': 0.00016160000000000002, 'samples': 310368, 'steps': 606, 'loss/train': 4.837840557098389} -09/20/2021 16:35:19 - INFO - __main__ - Step 9700: {'lr': 0.00016160000000000002, 'samples': 310400, 'steps': 606, 'loss/train': 4.549968719482422} -09/20/2021 16:35:20 - INFO - __main__ - Step 9701: {'lr': 0.00016160000000000002, 'samples': 310432, 'steps': 606, 'loss/train': 4.922073841094971} -09/20/2021 16:35:21 - INFO - __main__ - Step 9702: {'lr': 0.00016160000000000002, 'samples': 310464, 'steps': 606, 'loss/train': 5.380263805389404} -09/20/2021 16:35:22 - INFO - __main__ - Step 9703: {'lr': 0.00016160000000000002, 'samples': 310496, 'steps': 606, 'loss/train': 4.00075101852417} -09/20/2021 16:35:22 - INFO - __main__ - Step 9704: {'lr': 0.00016160000000000002, 'samples': 310528, 'steps': 606, 'loss/train': 4.410190582275391} -09/20/2021 16:35:23 - INFO - __main__ - Step 9705: {'lr': 0.00016160000000000002, 'samples': 310560, 'steps': 606, 'loss/train': 3.5316925048828125} -09/20/2021 16:35:24 - INFO - __main__ - Step 9706: {'lr': 0.00016160000000000002, 'samples': 310592, 'steps': 606, 'loss/train': 4.644876480102539} -09/20/2021 16:35:25 - INFO - __main__ - Step 9707: {'lr': 0.00016160000000000002, 'samples': 310624, 'steps': 606, 'loss/train': 3.7080249786376953} -09/20/2021 16:35:25 - INFO - __main__ - Step 9708: {'lr': 0.00016160000000000002, 'samples': 310656, 'steps': 606, 'loss/train': 4.238968372344971} -09/20/2021 16:35:26 - INFO - __main__ - Step 9709: {'lr': 0.00016160000000000002, 'samples': 310688, 'steps': 606, 'loss/train': 4.1198649406433105} -09/20/2021 16:35:27 - INFO - __main__ - Step 9710: {'lr': 0.00016160000000000002, 'samples': 310720, 'steps': 606, 'loss/train': 2.1519532203674316} -09/20/2021 16:35:28 - INFO - __main__ - Step 9711: {'lr': 0.00016160000000000002, 'samples': 310752, 'steps': 606, 'loss/train': 3.675130605697632} -09/20/2021 16:35:28 - INFO - __main__ - Step 9712: {'lr': 0.00016160000000000002, 'samples': 310784, 'steps': 606, 'loss/train': 4.5883588790893555} -09/20/2021 16:35:29 - INFO - __main__ - Step 9713: {'lr': 0.00016186666666666668, 'samples': 310816, 'steps': 607, 'loss/train': 5.753523349761963} -09/20/2021 16:35:30 - INFO - __main__ - Step 9714: {'lr': 0.00016186666666666668, 'samples': 310848, 'steps': 607, 'loss/train': 4.493867874145508} -09/20/2021 16:35:31 - INFO - __main__ - Step 9715: {'lr': 0.00016186666666666668, 'samples': 310880, 'steps': 607, 'loss/train': 4.055542469024658} -09/20/2021 16:35:31 - INFO - __main__ - Step 9716: {'lr': 0.00016186666666666668, 'samples': 310912, 'steps': 607, 'loss/train': 4.825367450714111} -09/20/2021 16:35:32 - INFO - __main__ - Step 9717: {'lr': 0.00016186666666666668, 'samples': 310944, 'steps': 607, 'loss/train': 5.585977077484131} -09/20/2021 16:35:33 - INFO - __main__ - Step 9718: {'lr': 0.00016186666666666668, 'samples': 310976, 'steps': 607, 'loss/train': 4.293691635131836} -09/20/2021 16:35:34 - INFO - __main__ - Step 9719: {'lr': 0.00016186666666666668, 'samples': 311008, 'steps': 607, 'loss/train': 4.562497138977051} -09/20/2021 16:35:34 - INFO - __main__ - Step 9720: {'lr': 0.00016186666666666668, 'samples': 311040, 'steps': 607, 'loss/train': 5.501621246337891} -09/20/2021 16:35:36 - INFO - __main__ - Step 9721: {'lr': 0.00016186666666666668, 'samples': 311072, 'steps': 607, 'loss/train': 4.313990116119385} -09/20/2021 16:35:36 - INFO - __main__ - Step 9722: {'lr': 0.00016186666666666668, 'samples': 311104, 'steps': 607, 'loss/train': 3.8123795986175537} -09/20/2021 16:35:37 - INFO - __main__ - Step 9723: {'lr': 0.00016186666666666668, 'samples': 311136, 'steps': 607, 'loss/train': 4.8015007972717285} -09/20/2021 16:35:38 - INFO - __main__ - Step 9724: {'lr': 0.00016186666666666668, 'samples': 311168, 'steps': 607, 'loss/train': 5.834838390350342} -09/20/2021 16:35:39 - INFO - __main__ - Step 9725: {'lr': 0.00016186666666666668, 'samples': 311200, 'steps': 607, 'loss/train': 4.8145670890808105} -09/20/2021 16:35:39 - INFO - __main__ - Step 9726: {'lr': 0.00016186666666666668, 'samples': 311232, 'steps': 607, 'loss/train': 5.261593341827393} -09/20/2021 16:35:40 - INFO - __main__ - Step 9727: {'lr': 0.00016186666666666668, 'samples': 311264, 'steps': 607, 'loss/train': 2.6796462535858154} -09/20/2021 16:35:41 - INFO - __main__ - Step 9728: {'lr': 0.00016186666666666668, 'samples': 311296, 'steps': 607, 'loss/train': 4.617274761199951} -09/20/2021 16:35:42 - INFO - __main__ - Step 9729: {'lr': 0.00016213333333333334, 'samples': 311328, 'steps': 608, 'loss/train': 4.361098766326904} -09/20/2021 16:35:43 - INFO - __main__ - Step 9730: {'lr': 0.00016213333333333334, 'samples': 311360, 'steps': 608, 'loss/train': 4.387691020965576} -09/20/2021 16:35:43 - INFO - __main__ - Step 9731: {'lr': 0.00016213333333333334, 'samples': 311392, 'steps': 608, 'loss/train': 4.4458818435668945} -09/20/2021 16:35:44 - INFO - __main__ - Step 9732: {'lr': 0.00016213333333333334, 'samples': 311424, 'steps': 608, 'loss/train': 2.653278350830078} -09/20/2021 16:35:45 - INFO - __main__ - Step 9733: {'lr': 0.00016213333333333334, 'samples': 311456, 'steps': 608, 'loss/train': 4.820837497711182} -09/20/2021 16:35:46 - INFO - __main__ - Step 9734: {'lr': 0.00016213333333333334, 'samples': 311488, 'steps': 608, 'loss/train': 5.544128894805908} -09/20/2021 16:35:46 - INFO - __main__ - Step 9735: {'lr': 0.00016213333333333334, 'samples': 311520, 'steps': 608, 'loss/train': 4.848658561706543} -09/20/2021 16:35:47 - INFO - __main__ - Step 9736: {'lr': 0.00016213333333333334, 'samples': 311552, 'steps': 608, 'loss/train': 4.470303058624268} -09/20/2021 16:35:48 - INFO - __main__ - Step 9737: {'lr': 0.00016213333333333334, 'samples': 311584, 'steps': 608, 'loss/train': 5.484256744384766} -09/20/2021 16:35:49 - INFO - __main__ - Step 9738: {'lr': 0.00016213333333333334, 'samples': 311616, 'steps': 608, 'loss/train': 3.6735737323760986} -09/20/2021 16:35:49 - INFO - __main__ - Step 9739: {'lr': 0.00016213333333333334, 'samples': 311648, 'steps': 608, 'loss/train': 4.75417423248291} -09/20/2021 16:35:50 - INFO - __main__ - Step 9740: {'lr': 0.00016213333333333334, 'samples': 311680, 'steps': 608, 'loss/train': 4.418270111083984} -09/20/2021 16:35:51 - INFO - __main__ - Step 9741: {'lr': 0.00016213333333333334, 'samples': 311712, 'steps': 608, 'loss/train': 4.584242820739746} -09/20/2021 16:35:52 - INFO - __main__ - Step 9742: {'lr': 0.00016213333333333334, 'samples': 311744, 'steps': 608, 'loss/train': 4.355024814605713} -09/20/2021 16:35:52 - INFO - __main__ - Step 9743: {'lr': 0.00016213333333333334, 'samples': 311776, 'steps': 608, 'loss/train': 5.220989227294922} -09/20/2021 16:35:53 - INFO - __main__ - Step 9744: {'lr': 0.00016213333333333334, 'samples': 311808, 'steps': 608, 'loss/train': 4.094355583190918} -09/20/2021 16:35:54 - INFO - __main__ - Step 9745: {'lr': 0.00016240000000000002, 'samples': 311840, 'steps': 609, 'loss/train': 4.236801624298096} -09/20/2021 16:35:55 - INFO - __main__ - Step 9746: {'lr': 0.00016240000000000002, 'samples': 311872, 'steps': 609, 'loss/train': 4.557821750640869} -09/20/2021 16:35:55 - INFO - __main__ - Step 9747: {'lr': 0.00016240000000000002, 'samples': 311904, 'steps': 609, 'loss/train': 3.809638500213623} -09/20/2021 16:35:56 - INFO - __main__ - Step 9748: {'lr': 0.00016240000000000002, 'samples': 311936, 'steps': 609, 'loss/train': 4.7410173416137695} -09/20/2021 16:35:57 - INFO - __main__ - Step 9749: {'lr': 0.00016240000000000002, 'samples': 311968, 'steps': 609, 'loss/train': 4.699602127075195} -09/20/2021 16:35:58 - INFO - __main__ - Step 9750: {'lr': 0.00016240000000000002, 'samples': 312000, 'steps': 609, 'loss/train': 4.738755226135254} -09/20/2021 16:35:58 - INFO - __main__ - Step 9751: {'lr': 0.00016240000000000002, 'samples': 312032, 'steps': 609, 'loss/train': 4.424738883972168} -09/20/2021 16:36:00 - INFO - __main__ - Step 9752: {'lr': 0.00016240000000000002, 'samples': 312064, 'steps': 609, 'loss/train': 5.190267562866211} -09/20/2021 16:36:00 - INFO - __main__ - Step 9753: {'lr': 0.00016240000000000002, 'samples': 312096, 'steps': 609, 'loss/train': 4.448258876800537} -09/20/2021 16:36:01 - INFO - __main__ - Step 9754: {'lr': 0.00016240000000000002, 'samples': 312128, 'steps': 609, 'loss/train': 4.373721599578857} -09/20/2021 16:36:02 - INFO - __main__ - Step 9755: {'lr': 0.00016240000000000002, 'samples': 312160, 'steps': 609, 'loss/train': 4.02048397064209} -09/20/2021 16:36:03 - INFO - __main__ - Step 9756: {'lr': 0.00016240000000000002, 'samples': 312192, 'steps': 609, 'loss/train': 4.055936336517334} -09/20/2021 16:36:03 - INFO - __main__ - Step 9757: {'lr': 0.00016240000000000002, 'samples': 312224, 'steps': 609, 'loss/train': 5.8501386642456055} -09/20/2021 16:36:04 - INFO - __main__ - Step 9758: {'lr': 0.00016240000000000002, 'samples': 312256, 'steps': 609, 'loss/train': 5.259927272796631} -09/20/2021 16:36:05 - INFO - __main__ - Step 9759: {'lr': 0.00016240000000000002, 'samples': 312288, 'steps': 609, 'loss/train': 4.516717433929443} -09/20/2021 16:36:06 - INFO - __main__ - Step 9760: {'lr': 0.00016240000000000002, 'samples': 312320, 'steps': 609, 'loss/train': 5.392034530639648} -09/20/2021 16:36:07 - INFO - __main__ - Step 9761: {'lr': 0.00016266666666666667, 'samples': 312352, 'steps': 610, 'loss/train': 4.637871742248535} -09/20/2021 16:36:07 - INFO - __main__ - Step 9762: {'lr': 0.00016266666666666667, 'samples': 312384, 'steps': 610, 'loss/train': 4.72062349319458} -09/20/2021 16:36:08 - INFO - __main__ - Step 9763: {'lr': 0.00016266666666666667, 'samples': 312416, 'steps': 610, 'loss/train': 4.0808515548706055} -09/20/2021 16:36:09 - INFO - __main__ - Step 9764: {'lr': 0.00016266666666666667, 'samples': 312448, 'steps': 610, 'loss/train': 4.344486236572266} -09/20/2021 16:36:10 - INFO - __main__ - Step 9765: {'lr': 0.00016266666666666667, 'samples': 312480, 'steps': 610, 'loss/train': 4.59877872467041} -09/20/2021 16:36:10 - INFO - __main__ - Step 9766: {'lr': 0.00016266666666666667, 'samples': 312512, 'steps': 610, 'loss/train': 5.065079689025879} -09/20/2021 16:36:11 - INFO - __main__ - Step 9767: {'lr': 0.00016266666666666667, 'samples': 312544, 'steps': 610, 'loss/train': 4.058957576751709} -09/20/2021 16:36:12 - INFO - __main__ - Step 9768: {'lr': 0.00016266666666666667, 'samples': 312576, 'steps': 610, 'loss/train': 4.722684860229492} -09/20/2021 16:36:13 - INFO - __main__ - Step 9769: {'lr': 0.00016266666666666667, 'samples': 312608, 'steps': 610, 'loss/train': 7.074296951293945} -09/20/2021 16:36:13 - INFO - __main__ - Step 9770: {'lr': 0.00016266666666666667, 'samples': 312640, 'steps': 610, 'loss/train': 4.173902988433838} -09/20/2021 16:36:14 - INFO - __main__ - Step 9771: {'lr': 0.00016266666666666667, 'samples': 312672, 'steps': 610, 'loss/train': 5.33219575881958} -09/20/2021 16:36:15 - INFO - __main__ - Step 9772: {'lr': 0.00016266666666666667, 'samples': 312704, 'steps': 610, 'loss/train': 5.139655590057373} -09/20/2021 16:36:16 - INFO - __main__ - Step 9773: {'lr': 0.00016266666666666667, 'samples': 312736, 'steps': 610, 'loss/train': 4.645700454711914} -09/20/2021 16:36:16 - INFO - __main__ - Step 9774: {'lr': 0.00016266666666666667, 'samples': 312768, 'steps': 610, 'loss/train': 3.839165449142456} -09/20/2021 16:36:17 - INFO - __main__ - Step 9775: {'lr': 0.00016266666666666667, 'samples': 312800, 'steps': 610, 'loss/train': 3.2212047576904297} -09/20/2021 16:36:18 - INFO - __main__ - Step 9776: {'lr': 0.00016266666666666667, 'samples': 312832, 'steps': 610, 'loss/train': 5.29836893081665} -09/20/2021 16:36:19 - INFO - __main__ - Step 9777: {'lr': 0.00016293333333333333, 'samples': 312864, 'steps': 611, 'loss/train': 3.8047122955322266} -09/20/2021 16:36:20 - INFO - __main__ - Step 9778: {'lr': 0.00016293333333333333, 'samples': 312896, 'steps': 611, 'loss/train': 4.054251194000244} -09/20/2021 16:36:20 - INFO - __main__ - Step 9779: {'lr': 0.00016293333333333333, 'samples': 312928, 'steps': 611, 'loss/train': 4.476972579956055} -09/20/2021 16:36:21 - INFO - __main__ - Step 9780: {'lr': 0.00016293333333333333, 'samples': 312960, 'steps': 611, 'loss/train': 4.08460807800293} -09/20/2021 16:36:22 - INFO - __main__ - Step 9781: {'lr': 0.00016293333333333333, 'samples': 312992, 'steps': 611, 'loss/train': 5.163658142089844} -09/20/2021 16:36:23 - INFO - __main__ - Step 9782: {'lr': 0.00016293333333333333, 'samples': 313024, 'steps': 611, 'loss/train': 4.270273208618164} -09/20/2021 16:36:24 - INFO - __main__ - Step 9783: {'lr': 0.00016293333333333333, 'samples': 313056, 'steps': 611, 'loss/train': 4.743257999420166} -09/20/2021 16:36:25 - INFO - __main__ - Step 9784: {'lr': 0.00016293333333333333, 'samples': 313088, 'steps': 611, 'loss/train': 3.784451723098755} -09/20/2021 16:36:25 - INFO - __main__ - Step 9785: {'lr': 0.00016293333333333333, 'samples': 313120, 'steps': 611, 'loss/train': 4.531570911407471} -09/20/2021 16:36:26 - INFO - __main__ - Step 9786: {'lr': 0.00016293333333333333, 'samples': 313152, 'steps': 611, 'loss/train': 4.3366169929504395} -09/20/2021 16:36:27 - INFO - __main__ - Step 9787: {'lr': 0.00016293333333333333, 'samples': 313184, 'steps': 611, 'loss/train': 4.3117265701293945} -09/20/2021 16:36:28 - INFO - __main__ - Step 9788: {'lr': 0.00016293333333333333, 'samples': 313216, 'steps': 611, 'loss/train': 4.412666320800781} -09/20/2021 16:36:28 - INFO - __main__ - Step 9789: {'lr': 0.00016293333333333333, 'samples': 313248, 'steps': 611, 'loss/train': 4.928809642791748} -09/20/2021 16:36:29 - INFO - __main__ - Step 9790: {'lr': 0.00016293333333333333, 'samples': 313280, 'steps': 611, 'loss/train': 3.9364864826202393} -09/20/2021 16:36:30 - INFO - __main__ - Step 9791: {'lr': 0.00016293333333333333, 'samples': 313312, 'steps': 611, 'loss/train': 4.524498462677002} -09/20/2021 16:36:31 - INFO - __main__ - Step 9792: {'lr': 0.00016293333333333333, 'samples': 313344, 'steps': 611, 'loss/train': 2.322685480117798} -09/20/2021 16:36:32 - INFO - __main__ - Step 9793: {'lr': 0.0001632, 'samples': 313376, 'steps': 612, 'loss/train': 2.1780240535736084} -09/20/2021 16:36:32 - INFO - __main__ - Step 9794: {'lr': 0.0001632, 'samples': 313408, 'steps': 612, 'loss/train': 2.1718738079071045} -09/20/2021 16:36:33 - INFO - __main__ - Step 9795: {'lr': 0.0001632, 'samples': 313440, 'steps': 612, 'loss/train': 2.153731346130371} -09/20/2021 16:36:34 - INFO - __main__ - Step 9796: {'lr': 0.0001632, 'samples': 313472, 'steps': 612, 'loss/train': 2.2028939723968506} -09/20/2021 16:36:35 - INFO - __main__ - Step 9797: {'lr': 0.0001632, 'samples': 313504, 'steps': 612, 'loss/train': 3.4043350219726562} -09/20/2021 16:36:35 - INFO - __main__ - Step 9798: {'lr': 0.0001632, 'samples': 313536, 'steps': 612, 'loss/train': 4.362309455871582} -09/20/2021 16:36:36 - INFO - __main__ - Step 9799: {'lr': 0.0001632, 'samples': 313568, 'steps': 612, 'loss/train': 4.248364448547363} -09/20/2021 16:36:37 - INFO - __main__ - Step 9800: {'lr': 0.0001632, 'samples': 313600, 'steps': 612, 'loss/train': 5.033612251281738} -09/20/2021 16:36:38 - INFO - __main__ - Step 9801: {'lr': 0.0001632, 'samples': 313632, 'steps': 612, 'loss/train': 4.365025043487549} -09/20/2021 16:36:38 - INFO - __main__ - Step 9802: {'lr': 0.0001632, 'samples': 313664, 'steps': 612, 'loss/train': 5.882238388061523} -09/20/2021 16:36:39 - INFO - __main__ - Step 9803: {'lr': 0.0001632, 'samples': 313696, 'steps': 612, 'loss/train': 3.8963422775268555} -09/20/2021 16:36:40 - INFO - __main__ - Step 9804: {'lr': 0.0001632, 'samples': 313728, 'steps': 612, 'loss/train': 4.540084362030029} -09/20/2021 16:36:41 - INFO - __main__ - Step 9805: {'lr': 0.0001632, 'samples': 313760, 'steps': 612, 'loss/train': 4.305485248565674} -09/20/2021 16:36:41 - INFO - __main__ - Step 9806: {'lr': 0.0001632, 'samples': 313792, 'steps': 612, 'loss/train': 5.304643630981445} -09/20/2021 16:36:42 - INFO - __main__ - Step 9807: {'lr': 0.0001632, 'samples': 313824, 'steps': 612, 'loss/train': 5.067833423614502} -09/20/2021 16:36:43 - INFO - __main__ - Step 9808: {'lr': 0.0001632, 'samples': 313856, 'steps': 612, 'loss/train': 3.6405184268951416} -09/20/2021 16:36:44 - INFO - __main__ - Step 9809: {'lr': 0.0001634666666666667, 'samples': 313888, 'steps': 613, 'loss/train': 4.925570011138916} -09/20/2021 16:36:44 - INFO - __main__ - Step 9810: {'lr': 0.0001634666666666667, 'samples': 313920, 'steps': 613, 'loss/train': 4.4336442947387695} -09/20/2021 16:36:45 - INFO - __main__ - Step 9811: {'lr': 0.0001634666666666667, 'samples': 313952, 'steps': 613, 'loss/train': 0.7005857825279236} -09/20/2021 16:36:46 - INFO - __main__ - Step 9812: {'lr': 0.0001634666666666667, 'samples': 313984, 'steps': 613, 'loss/train': 3.7650063037872314} -09/20/2021 16:36:47 - INFO - __main__ - Step 9813: {'lr': 0.0001634666666666667, 'samples': 314016, 'steps': 613, 'loss/train': 1.8231596946716309} -09/20/2021 16:36:47 - INFO - __main__ - Step 9814: {'lr': 0.0001634666666666667, 'samples': 314048, 'steps': 613, 'loss/train': 1.8718318939208984} -09/20/2021 16:36:48 - INFO - __main__ - Step 9815: {'lr': 0.0001634666666666667, 'samples': 314080, 'steps': 613, 'loss/train': 4.381525993347168} -09/20/2021 16:36:49 - INFO - __main__ - Step 9816: {'lr': 0.0001634666666666667, 'samples': 314112, 'steps': 613, 'loss/train': 1.9095650911331177} -09/20/2021 16:36:50 - INFO - __main__ - Step 9817: {'lr': 0.0001634666666666667, 'samples': 314144, 'steps': 613, 'loss/train': 4.958460807800293} -09/20/2021 16:36:51 - INFO - __main__ - Step 9818: {'lr': 0.0001634666666666667, 'samples': 314176, 'steps': 613, 'loss/train': 3.9796242713928223} -09/20/2021 16:36:52 - INFO - __main__ - Step 9819: {'lr': 0.0001634666666666667, 'samples': 314208, 'steps': 613, 'loss/train': 5.393336296081543} -09/20/2021 16:36:53 - INFO - __main__ - Step 9820: {'lr': 0.0001634666666666667, 'samples': 314240, 'steps': 613, 'loss/train': 4.429617404937744} -09/20/2021 16:36:53 - INFO - __main__ - Step 9821: {'lr': 0.0001634666666666667, 'samples': 314272, 'steps': 613, 'loss/train': 5.136372089385986} -09/20/2021 16:36:54 - INFO - __main__ - Step 9822: {'lr': 0.0001634666666666667, 'samples': 314304, 'steps': 613, 'loss/train': 2.227245807647705} -09/20/2021 16:36:55 - INFO - __main__ - Step 9823: {'lr': 0.0001634666666666667, 'samples': 314336, 'steps': 613, 'loss/train': 4.519093990325928} -09/20/2021 16:36:56 - INFO - __main__ - Step 9824: {'lr': 0.0001634666666666667, 'samples': 314368, 'steps': 613, 'loss/train': 4.553619384765625} -09/20/2021 16:36:56 - INFO - __main__ - Step 9825: {'lr': 0.00016373333333333335, 'samples': 314400, 'steps': 614, 'loss/train': 6.068646430969238} -09/20/2021 16:36:57 - INFO - __main__ - Step 9826: {'lr': 0.00016373333333333335, 'samples': 314432, 'steps': 614, 'loss/train': 6.126561164855957} -09/20/2021 16:36:58 - INFO - __main__ - Step 9827: {'lr': 0.00016373333333333335, 'samples': 314464, 'steps': 614, 'loss/train': 6.10523796081543} -09/20/2021 16:36:59 - INFO - __main__ - Step 9828: {'lr': 0.00016373333333333335, 'samples': 314496, 'steps': 614, 'loss/train': 6.094305992126465} -09/20/2021 16:36:59 - INFO - __main__ - Step 9829: {'lr': 0.00016373333333333335, 'samples': 314528, 'steps': 614, 'loss/train': 6.055574417114258} -09/20/2021 16:37:00 - INFO - __main__ - Step 9830: {'lr': 0.00016373333333333335, 'samples': 314560, 'steps': 614, 'loss/train': 4.337197780609131} -09/20/2021 16:37:01 - INFO - __main__ - Step 9831: {'lr': 0.00016373333333333335, 'samples': 314592, 'steps': 614, 'loss/train': 4.92045259475708} -09/20/2021 16:37:02 - INFO - __main__ - Step 9832: {'lr': 0.00016373333333333335, 'samples': 314624, 'steps': 614, 'loss/train': 2.6809396743774414} -09/20/2021 16:37:02 - INFO - __main__ - Step 9833: {'lr': 0.00016373333333333335, 'samples': 314656, 'steps': 614, 'loss/train': 5.306612014770508} -09/20/2021 16:37:03 - INFO - __main__ - Step 9834: {'lr': 0.00016373333333333335, 'samples': 314688, 'steps': 614, 'loss/train': 4.305194854736328} -09/20/2021 16:37:04 - INFO - __main__ - Step 9835: {'lr': 0.00016373333333333335, 'samples': 314720, 'steps': 614, 'loss/train': 4.197080612182617} -09/20/2021 16:37:05 - INFO - __main__ - Step 9836: {'lr': 0.00016373333333333335, 'samples': 314752, 'steps': 614, 'loss/train': 4.519383430480957} -09/20/2021 16:37:05 - INFO - __main__ - Step 9837: {'lr': 0.00016373333333333335, 'samples': 314784, 'steps': 614, 'loss/train': 5.012083053588867} -09/20/2021 16:37:06 - INFO - __main__ - Step 9838: {'lr': 0.00016373333333333335, 'samples': 314816, 'steps': 614, 'loss/train': 3.7952427864074707} -09/20/2021 16:37:07 - INFO - __main__ - Step 9839: {'lr': 0.00016373333333333335, 'samples': 314848, 'steps': 614, 'loss/train': 4.277667999267578} -09/20/2021 16:37:08 - INFO - __main__ - Step 9840: {'lr': 0.00016373333333333335, 'samples': 314880, 'steps': 614, 'loss/train': 4.675837993621826} -09/20/2021 16:37:09 - INFO - __main__ - Step 9841: {'lr': 0.000164, 'samples': 314912, 'steps': 615, 'loss/train': 4.497228145599365} -09/20/2021 16:37:09 - INFO - __main__ - Step 9842: {'lr': 0.000164, 'samples': 314944, 'steps': 615, 'loss/train': 5.378067493438721} -09/20/2021 16:37:10 - INFO - __main__ - Step 9843: {'lr': 0.000164, 'samples': 314976, 'steps': 615, 'loss/train': 4.903467655181885} -09/20/2021 16:37:11 - INFO - __main__ - Step 9844: {'lr': 0.000164, 'samples': 315008, 'steps': 615, 'loss/train': 6.299510478973389} -09/20/2021 16:37:12 - INFO - __main__ - Step 9845: {'lr': 0.000164, 'samples': 315040, 'steps': 615, 'loss/train': 5.013274669647217} -09/20/2021 16:37:12 - INFO - __main__ - Step 9846: {'lr': 0.000164, 'samples': 315072, 'steps': 615, 'loss/train': 5.553119659423828} -09/20/2021 16:37:13 - INFO - __main__ - Step 9847: {'lr': 0.000164, 'samples': 315104, 'steps': 615, 'loss/train': 4.793457508087158} -09/20/2021 16:37:14 - INFO - __main__ - Step 9848: {'lr': 0.000164, 'samples': 315136, 'steps': 615, 'loss/train': 4.289231777191162} -09/20/2021 16:37:15 - INFO - __main__ - Step 9849: {'lr': 0.000164, 'samples': 315168, 'steps': 615, 'loss/train': 3.438723564147949} -09/20/2021 16:37:15 - INFO - __main__ - Step 9850: {'lr': 0.000164, 'samples': 315200, 'steps': 615, 'loss/train': 4.252922534942627} -09/20/2021 16:37:17 - INFO - __main__ - Step 9851: {'lr': 0.000164, 'samples': 315232, 'steps': 615, 'loss/train': 4.426669120788574} -09/20/2021 16:37:17 - INFO - __main__ - Step 9852: {'lr': 0.000164, 'samples': 315264, 'steps': 615, 'loss/train': 5.002359867095947} -09/20/2021 16:37:18 - INFO - __main__ - Step 9853: {'lr': 0.000164, 'samples': 315296, 'steps': 615, 'loss/train': 3.6628384590148926} -09/20/2021 16:37:19 - INFO - __main__ - Step 9854: {'lr': 0.000164, 'samples': 315328, 'steps': 615, 'loss/train': 4.230682849884033} -09/20/2021 16:37:20 - INFO - __main__ - Step 9855: {'lr': 0.000164, 'samples': 315360, 'steps': 615, 'loss/train': 4.990752696990967} -09/20/2021 16:37:20 - INFO - __main__ - Step 9856: {'lr': 0.000164, 'samples': 315392, 'steps': 615, 'loss/train': 4.337410926818848} -09/20/2021 16:37:21 - INFO - __main__ - Step 9857: {'lr': 0.00016426666666666668, 'samples': 315424, 'steps': 616, 'loss/train': 4.701552867889404} -09/20/2021 16:37:22 - INFO - __main__ - Step 9858: {'lr': 0.00016426666666666668, 'samples': 315456, 'steps': 616, 'loss/train': 5.257281303405762} -09/20/2021 16:37:23 - INFO - __main__ - Step 9859: {'lr': 0.00016426666666666668, 'samples': 315488, 'steps': 616, 'loss/train': 5.297808647155762} -09/20/2021 16:37:24 - INFO - __main__ - Step 9860: {'lr': 0.00016426666666666668, 'samples': 315520, 'steps': 616, 'loss/train': 4.387063980102539} -09/20/2021 16:37:24 - INFO - __main__ - Step 9861: {'lr': 0.00016426666666666668, 'samples': 315552, 'steps': 616, 'loss/train': 4.685846328735352} -09/20/2021 16:37:25 - INFO - __main__ - Step 9862: {'lr': 0.00016426666666666668, 'samples': 315584, 'steps': 616, 'loss/train': 3.711359977722168} -09/20/2021 16:37:26 - INFO - __main__ - Step 9863: {'lr': 0.00016426666666666668, 'samples': 315616, 'steps': 616, 'loss/train': 3.7540032863616943} -09/20/2021 16:37:27 - INFO - __main__ - Step 9864: {'lr': 0.00016426666666666668, 'samples': 315648, 'steps': 616, 'loss/train': 3.7398600578308105} -09/20/2021 16:37:27 - INFO - __main__ - Step 9865: {'lr': 0.00016426666666666668, 'samples': 315680, 'steps': 616, 'loss/train': 4.277065277099609} -09/20/2021 16:37:28 - INFO - __main__ - Step 9866: {'lr': 0.00016426666666666668, 'samples': 315712, 'steps': 616, 'loss/train': 4.1644368171691895} -09/20/2021 16:37:29 - INFO - __main__ - Step 9867: {'lr': 0.00016426666666666668, 'samples': 315744, 'steps': 616, 'loss/train': 4.213189125061035} -09/20/2021 16:37:30 - INFO - __main__ - Step 9868: {'lr': 0.00016426666666666668, 'samples': 315776, 'steps': 616, 'loss/train': 4.664443016052246} -09/20/2021 16:37:30 - INFO - __main__ - Step 9869: {'lr': 0.00016426666666666668, 'samples': 315808, 'steps': 616, 'loss/train': 5.0180206298828125} -09/20/2021 16:37:31 - INFO - __main__ - Step 9870: {'lr': 0.00016426666666666668, 'samples': 315840, 'steps': 616, 'loss/train': 5.212804317474365} -09/20/2021 16:37:32 - INFO - __main__ - Step 9871: {'lr': 0.00016426666666666668, 'samples': 315872, 'steps': 616, 'loss/train': 4.014776229858398} -09/20/2021 16:37:33 - INFO - __main__ - Step 9872: {'lr': 0.00016426666666666668, 'samples': 315904, 'steps': 616, 'loss/train': 4.982839584350586} -09/20/2021 16:37:33 - INFO - __main__ - Step 9873: {'lr': 0.00016453333333333334, 'samples': 315936, 'steps': 617, 'loss/train': 4.96757698059082} -09/20/2021 16:37:34 - INFO - __main__ - Step 9874: {'lr': 0.00016453333333333334, 'samples': 315968, 'steps': 617, 'loss/train': 4.682194709777832} -09/20/2021 16:37:35 - INFO - __main__ - Step 9875: {'lr': 0.00016453333333333334, 'samples': 316000, 'steps': 617, 'loss/train': 5.116051197052002} -09/20/2021 16:37:36 - INFO - __main__ - Step 9876: {'lr': 0.00016453333333333334, 'samples': 316032, 'steps': 617, 'loss/train': 5.204657077789307} -09/20/2021 16:37:36 - INFO - __main__ - Step 9877: {'lr': 0.00016453333333333334, 'samples': 316064, 'steps': 617, 'loss/train': 4.661558628082275} -09/20/2021 16:37:37 - INFO - __main__ - Step 9878: {'lr': 0.00016453333333333334, 'samples': 316096, 'steps': 617, 'loss/train': 3.3978922367095947} -09/20/2021 16:37:38 - INFO - __main__ - Step 9879: {'lr': 0.00016453333333333334, 'samples': 316128, 'steps': 617, 'loss/train': 4.075404644012451} -09/20/2021 16:37:39 - INFO - __main__ - Step 9880: {'lr': 0.00016453333333333334, 'samples': 316160, 'steps': 617, 'loss/train': 4.320647716522217} -09/20/2021 16:37:39 - INFO - __main__ - Step 9881: {'lr': 0.00016453333333333334, 'samples': 316192, 'steps': 617, 'loss/train': 3.876685857772827} -09/20/2021 16:37:41 - INFO - __main__ - Step 9882: {'lr': 0.00016453333333333334, 'samples': 316224, 'steps': 617, 'loss/train': 4.772461891174316} -09/20/2021 16:37:41 - INFO - __main__ - Step 9883: {'lr': 0.00016453333333333334, 'samples': 316256, 'steps': 617, 'loss/train': 4.617743968963623} -09/20/2021 16:37:42 - INFO - __main__ - Step 9884: {'lr': 0.00016453333333333334, 'samples': 316288, 'steps': 617, 'loss/train': 4.749412536621094} -09/20/2021 16:37:43 - INFO - __main__ - Step 9885: {'lr': 0.00016453333333333334, 'samples': 316320, 'steps': 617, 'loss/train': 4.594456195831299} -09/20/2021 16:37:44 - INFO - __main__ - Step 9886: {'lr': 0.00016453333333333334, 'samples': 316352, 'steps': 617, 'loss/train': 3.1255602836608887} -09/20/2021 16:37:44 - INFO - __main__ - Step 9887: {'lr': 0.00016453333333333334, 'samples': 316384, 'steps': 617, 'loss/train': 5.8346452713012695} -09/20/2021 16:37:45 - INFO - __main__ - Step 9888: {'lr': 0.00016453333333333334, 'samples': 316416, 'steps': 617, 'loss/train': 5.208081245422363} -09/20/2021 16:37:46 - INFO - __main__ - Step 9889: {'lr': 0.0001648, 'samples': 316448, 'steps': 618, 'loss/train': 4.464643955230713} -09/20/2021 16:37:47 - INFO - __main__ - Step 9890: {'lr': 0.0001648, 'samples': 316480, 'steps': 618, 'loss/train': 3.726407527923584} -09/20/2021 16:37:48 - INFO - __main__ - Step 9891: {'lr': 0.0001648, 'samples': 316512, 'steps': 618, 'loss/train': 3.9166011810302734} -09/20/2021 16:37:48 - INFO - __main__ - Step 9892: {'lr': 0.0001648, 'samples': 316544, 'steps': 618, 'loss/train': 4.948554992675781} -09/20/2021 16:37:49 - INFO - __main__ - Step 9893: {'lr': 0.0001648, 'samples': 316576, 'steps': 618, 'loss/train': 4.335039138793945} -09/20/2021 16:37:50 - INFO - __main__ - Step 9894: {'lr': 0.0001648, 'samples': 316608, 'steps': 618, 'loss/train': 4.561501502990723} -09/20/2021 16:37:51 - INFO - __main__ - Step 9895: {'lr': 0.0001648, 'samples': 316640, 'steps': 618, 'loss/train': 4.491294860839844} -09/20/2021 16:37:51 - INFO - __main__ - Step 9896: {'lr': 0.0001648, 'samples': 316672, 'steps': 618, 'loss/train': 4.165192127227783} -09/20/2021 16:37:52 - INFO - __main__ - Step 9897: {'lr': 0.0001648, 'samples': 316704, 'steps': 618, 'loss/train': 4.303755760192871} -09/20/2021 16:37:53 - INFO - __main__ - Step 9898: {'lr': 0.0001648, 'samples': 316736, 'steps': 618, 'loss/train': 4.7060956954956055} -09/20/2021 16:37:54 - INFO - __main__ - Step 9899: {'lr': 0.0001648, 'samples': 316768, 'steps': 618, 'loss/train': 5.315939426422119} -09/20/2021 16:37:54 - INFO - __main__ - Step 9900: {'lr': 0.0001648, 'samples': 316800, 'steps': 618, 'loss/train': 5.3126020431518555} -09/20/2021 16:37:55 - INFO - __main__ - Step 9901: {'lr': 0.0001648, 'samples': 316832, 'steps': 618, 'loss/train': 4.451057434082031} -09/20/2021 16:37:56 - INFO - __main__ - Step 9902: {'lr': 0.0001648, 'samples': 316864, 'steps': 618, 'loss/train': 4.556003093719482} -09/20/2021 16:37:57 - INFO - __main__ - Step 9903: {'lr': 0.0001648, 'samples': 316896, 'steps': 618, 'loss/train': 4.666886806488037} -09/20/2021 16:37:57 - INFO - __main__ - Step 9904: {'lr': 0.0001648, 'samples': 316928, 'steps': 618, 'loss/train': 5.078549861907959} -09/20/2021 16:37:58 - INFO - __main__ - Step 9905: {'lr': 0.00016506666666666668, 'samples': 316960, 'steps': 619, 'loss/train': 4.563286781311035} -09/20/2021 16:37:59 - INFO - __main__ - Step 9906: {'lr': 0.00016506666666666668, 'samples': 316992, 'steps': 619, 'loss/train': 4.067861557006836} -09/20/2021 16:38:00 - INFO - __main__ - Step 9907: {'lr': 0.00016506666666666668, 'samples': 317024, 'steps': 619, 'loss/train': 4.369053363800049} -09/20/2021 16:38:00 - INFO - __main__ - Step 9908: {'lr': 0.00016506666666666668, 'samples': 317056, 'steps': 619, 'loss/train': 4.189558029174805} -09/20/2021 16:38:01 - INFO - __main__ - Step 9909: {'lr': 0.00016506666666666668, 'samples': 317088, 'steps': 619, 'loss/train': 4.9861650466918945} -09/20/2021 16:38:02 - INFO - __main__ - Step 9910: {'lr': 0.00016506666666666668, 'samples': 317120, 'steps': 619, 'loss/train': 4.781071662902832} -09/20/2021 16:38:03 - INFO - __main__ - Step 9911: {'lr': 0.00016506666666666668, 'samples': 317152, 'steps': 619, 'loss/train': 5.126859188079834} -09/20/2021 16:38:03 - INFO - __main__ - Step 9912: {'lr': 0.00016506666666666668, 'samples': 317184, 'steps': 619, 'loss/train': 6.213266849517822} -09/20/2021 16:38:05 - INFO - __main__ - Step 9913: {'lr': 0.00016506666666666668, 'samples': 317216, 'steps': 619, 'loss/train': 3.957573652267456} -09/20/2021 16:38:05 - INFO - __main__ - Step 9914: {'lr': 0.00016506666666666668, 'samples': 317248, 'steps': 619, 'loss/train': 5.334415912628174} -09/20/2021 16:38:06 - INFO - __main__ - Step 9915: {'lr': 0.00016506666666666668, 'samples': 317280, 'steps': 619, 'loss/train': 4.1190361976623535} -09/20/2021 16:38:07 - INFO - __main__ - Step 9916: {'lr': 0.00016506666666666668, 'samples': 317312, 'steps': 619, 'loss/train': 4.295323371887207} -09/20/2021 16:38:08 - INFO - __main__ - Step 9917: {'lr': 0.00016506666666666668, 'samples': 317344, 'steps': 619, 'loss/train': 4.039501667022705} -09/20/2021 16:38:08 - INFO - __main__ - Step 9918: {'lr': 0.00016506666666666668, 'samples': 317376, 'steps': 619, 'loss/train': 4.740423679351807} -09/20/2021 16:38:09 - INFO - __main__ - Step 9919: {'lr': 0.00016506666666666668, 'samples': 317408, 'steps': 619, 'loss/train': 5.911229610443115} -09/20/2021 16:38:10 - INFO - __main__ - Step 9920: {'lr': 0.00016506666666666668, 'samples': 317440, 'steps': 619, 'loss/train': 3.542302370071411} -09/20/2021 16:38:11 - INFO - __main__ - Step 9921: {'lr': 0.00016533333333333333, 'samples': 317472, 'steps': 620, 'loss/train': 3.71580171585083} -09/20/2021 16:38:12 - INFO - __main__ - Step 9922: {'lr': 0.00016533333333333333, 'samples': 317504, 'steps': 620, 'loss/train': 2.96911358833313} -09/20/2021 16:38:12 - INFO - __main__ - Step 9923: {'lr': 0.00016533333333333333, 'samples': 317536, 'steps': 620, 'loss/train': 4.277663707733154} -09/20/2021 16:38:13 - INFO - __main__ - Step 9924: {'lr': 0.00016533333333333333, 'samples': 317568, 'steps': 620, 'loss/train': 4.324569225311279} -09/20/2021 16:38:14 - INFO - __main__ - Step 9925: {'lr': 0.00016533333333333333, 'samples': 317600, 'steps': 620, 'loss/train': 4.7258124351501465} -09/20/2021 16:38:15 - INFO - __main__ - Step 9926: {'lr': 0.00016533333333333333, 'samples': 317632, 'steps': 620, 'loss/train': 4.070698261260986} -09/20/2021 16:38:15 - INFO - __main__ - Step 9927: {'lr': 0.00016533333333333333, 'samples': 317664, 'steps': 620, 'loss/train': 4.860753536224365} -09/20/2021 16:38:16 - INFO - __main__ - Step 9928: {'lr': 0.00016533333333333333, 'samples': 317696, 'steps': 620, 'loss/train': 4.030584335327148} -09/20/2021 16:38:17 - INFO - __main__ - Step 9929: {'lr': 0.00016533333333333333, 'samples': 317728, 'steps': 620, 'loss/train': 5.064307689666748} -09/20/2021 16:38:18 - INFO - __main__ - Step 9930: {'lr': 0.00016533333333333333, 'samples': 317760, 'steps': 620, 'loss/train': 4.248151779174805} -09/20/2021 16:38:18 - INFO - __main__ - Step 9931: {'lr': 0.00016533333333333333, 'samples': 317792, 'steps': 620, 'loss/train': 4.1362528800964355} -09/20/2021 16:38:19 - INFO - __main__ - Step 9932: {'lr': 0.00016533333333333333, 'samples': 317824, 'steps': 620, 'loss/train': 4.864956855773926} -09/20/2021 16:38:20 - INFO - __main__ - Step 9933: {'lr': 0.00016533333333333333, 'samples': 317856, 'steps': 620, 'loss/train': 5.555662155151367} -09/20/2021 16:38:21 - INFO - __main__ - Step 9934: {'lr': 0.00016533333333333333, 'samples': 317888, 'steps': 620, 'loss/train': 3.8116989135742188} -09/20/2021 16:38:21 - INFO - __main__ - Step 9935: {'lr': 0.00016533333333333333, 'samples': 317920, 'steps': 620, 'loss/train': 4.067811965942383} -09/20/2021 16:38:22 - INFO - __main__ - Step 9936: {'lr': 0.00016533333333333333, 'samples': 317952, 'steps': 620, 'loss/train': 4.933427333831787} -09/20/2021 16:38:23 - INFO - __main__ - Step 9937: {'lr': 0.0001656, 'samples': 317984, 'steps': 621, 'loss/train': 2.139923095703125} -09/20/2021 16:38:24 - INFO - __main__ - Step 9938: {'lr': 0.0001656, 'samples': 318016, 'steps': 621, 'loss/train': 4.19163703918457} -09/20/2021 16:38:24 - INFO - __main__ - Step 9939: {'lr': 0.0001656, 'samples': 318048, 'steps': 621, 'loss/train': 5.124873161315918} -09/20/2021 16:38:25 - INFO - __main__ - Step 9940: {'lr': 0.0001656, 'samples': 318080, 'steps': 621, 'loss/train': 4.478711128234863} -09/20/2021 16:38:26 - INFO - __main__ - Step 9941: {'lr': 0.0001656, 'samples': 318112, 'steps': 621, 'loss/train': 4.080122470855713} -09/20/2021 16:38:27 - INFO - __main__ - Step 9942: {'lr': 0.0001656, 'samples': 318144, 'steps': 621, 'loss/train': 4.969167709350586} -09/20/2021 16:38:27 - INFO - __main__ - Step 9943: {'lr': 0.0001656, 'samples': 318176, 'steps': 621, 'loss/train': 2.0103862285614014} -09/20/2021 16:38:28 - INFO - __main__ - Step 9944: {'lr': 0.0001656, 'samples': 318208, 'steps': 621, 'loss/train': 4.230654716491699} -09/20/2021 16:38:30 - INFO - __main__ - Step 9945: {'lr': 0.0001656, 'samples': 318240, 'steps': 621, 'loss/train': 4.4746575355529785} -09/20/2021 16:38:30 - INFO - __main__ - Step 9946: {'lr': 0.0001656, 'samples': 318272, 'steps': 621, 'loss/train': 4.297385215759277} -09/20/2021 16:38:31 - INFO - __main__ - Step 9947: {'lr': 0.0001656, 'samples': 318304, 'steps': 621, 'loss/train': 4.480856895446777} -09/20/2021 16:38:32 - INFO - __main__ - Step 9948: {'lr': 0.0001656, 'samples': 318336, 'steps': 621, 'loss/train': 4.756280899047852} -09/20/2021 16:38:33 - INFO - __main__ - Step 9949: {'lr': 0.0001656, 'samples': 318368, 'steps': 621, 'loss/train': 5.116272449493408} -09/20/2021 16:38:33 - INFO - __main__ - Step 9950: {'lr': 0.0001656, 'samples': 318400, 'steps': 621, 'loss/train': 2.587991952896118} -09/20/2021 16:38:34 - INFO - __main__ - Step 9951: {'lr': 0.0001656, 'samples': 318432, 'steps': 621, 'loss/train': 2.0892398357391357} -09/20/2021 16:38:35 - INFO - __main__ - Step 9952: {'lr': 0.0001656, 'samples': 318464, 'steps': 621, 'loss/train': 2.0207128524780273} -09/20/2021 16:38:36 - INFO - __main__ - Step 9953: {'lr': 0.00016586666666666667, 'samples': 318496, 'steps': 622, 'loss/train': 2.023092746734619} -09/20/2021 16:38:37 - INFO - __main__ - Step 9954: {'lr': 0.00016586666666666667, 'samples': 318528, 'steps': 622, 'loss/train': 4.394523620605469} -09/20/2021 16:38:37 - INFO - __main__ - Step 9955: {'lr': 0.00016586666666666667, 'samples': 318560, 'steps': 622, 'loss/train': 4.267662525177002} -09/20/2021 16:38:38 - INFO - __main__ - Step 9956: {'lr': 0.00016586666666666667, 'samples': 318592, 'steps': 622, 'loss/train': 4.279473781585693} -09/20/2021 16:38:39 - INFO - __main__ - Step 9957: {'lr': 0.00016586666666666667, 'samples': 318624, 'steps': 622, 'loss/train': 4.884124279022217} -09/20/2021 16:38:40 - INFO - __main__ - Step 9958: {'lr': 0.00016586666666666667, 'samples': 318656, 'steps': 622, 'loss/train': 4.430159091949463} -09/20/2021 16:38:40 - INFO - __main__ - Step 9959: {'lr': 0.00016586666666666667, 'samples': 318688, 'steps': 622, 'loss/train': 4.6137518882751465} -09/20/2021 16:38:41 - INFO - __main__ - Step 9960: {'lr': 0.00016586666666666667, 'samples': 318720, 'steps': 622, 'loss/train': 5.559455871582031} -09/20/2021 16:38:42 - INFO - __main__ - Step 9961: {'lr': 0.00016586666666666667, 'samples': 318752, 'steps': 622, 'loss/train': 4.3239874839782715} -09/20/2021 16:38:43 - INFO - __main__ - Step 9962: {'lr': 0.00016586666666666667, 'samples': 318784, 'steps': 622, 'loss/train': 4.887001991271973} -09/20/2021 16:38:43 - INFO - __main__ - Step 9963: {'lr': 0.00016586666666666667, 'samples': 318816, 'steps': 622, 'loss/train': 4.348359107971191} -09/20/2021 16:38:44 - INFO - __main__ - Step 9964: {'lr': 0.00016586666666666667, 'samples': 318848, 'steps': 622, 'loss/train': 4.8384833335876465} -09/20/2021 16:38:45 - INFO - __main__ - Step 9965: {'lr': 0.00016586666666666667, 'samples': 318880, 'steps': 622, 'loss/train': 4.803791046142578} -09/20/2021 16:38:46 - INFO - __main__ - Step 9966: {'lr': 0.00016586666666666667, 'samples': 318912, 'steps': 622, 'loss/train': 4.071444511413574} -09/20/2021 16:38:46 - INFO - __main__ - Step 9967: {'lr': 0.00016586666666666667, 'samples': 318944, 'steps': 622, 'loss/train': 3.529374837875366} -09/20/2021 16:38:47 - INFO - __main__ - Step 9968: {'lr': 0.00016586666666666667, 'samples': 318976, 'steps': 622, 'loss/train': 3.873953104019165} -09/20/2021 16:38:48 - INFO - __main__ - Step 9969: {'lr': 0.00016613333333333335, 'samples': 319008, 'steps': 623, 'loss/train': 4.754478454589844} -09/20/2021 16:38:49 - INFO - __main__ - Step 9970: {'lr': 0.00016613333333333335, 'samples': 319040, 'steps': 623, 'loss/train': 5.206114292144775} -09/20/2021 16:38:49 - INFO - __main__ - Step 9971: {'lr': 0.00016613333333333335, 'samples': 319072, 'steps': 623, 'loss/train': 5.615658283233643} -09/20/2021 16:38:50 - INFO - __main__ - Step 9972: {'lr': 0.00016613333333333335, 'samples': 319104, 'steps': 623, 'loss/train': 4.095446586608887} -09/20/2021 16:38:51 - INFO - __main__ - Step 9973: {'lr': 0.00016613333333333335, 'samples': 319136, 'steps': 623, 'loss/train': 4.6655402183532715} -09/20/2021 16:38:52 - INFO - __main__ - Step 9974: {'lr': 0.00016613333333333335, 'samples': 319168, 'steps': 623, 'loss/train': 4.113213539123535} -09/20/2021 16:38:53 - INFO - __main__ - Step 9975: {'lr': 0.00016613333333333335, 'samples': 319200, 'steps': 623, 'loss/train': 4.361632823944092} -09/20/2021 16:38:54 - INFO - __main__ - Step 9976: {'lr': 0.00016613333333333335, 'samples': 319232, 'steps': 623, 'loss/train': 4.770135879516602} -09/20/2021 16:38:55 - INFO - __main__ - Step 9977: {'lr': 0.00016613333333333335, 'samples': 319264, 'steps': 623, 'loss/train': 4.492886543273926} -09/20/2021 16:38:56 - INFO - __main__ - Step 9978: {'lr': 0.00016613333333333335, 'samples': 319296, 'steps': 623, 'loss/train': 4.6739935874938965} -09/20/2021 16:38:56 - INFO - __main__ - Step 9979: {'lr': 0.00016613333333333335, 'samples': 319328, 'steps': 623, 'loss/train': 4.291842937469482} -09/20/2021 16:38:57 - INFO - __main__ - Step 9980: {'lr': 0.00016613333333333335, 'samples': 319360, 'steps': 623, 'loss/train': 4.677893161773682} -09/20/2021 16:38:58 - INFO - __main__ - Step 9981: {'lr': 0.00016613333333333335, 'samples': 319392, 'steps': 623, 'loss/train': 4.234683990478516} -09/20/2021 16:38:59 - INFO - __main__ - Step 9982: {'lr': 0.00016613333333333335, 'samples': 319424, 'steps': 623, 'loss/train': 4.338271617889404} -09/20/2021 16:38:59 - INFO - __main__ - Step 9983: {'lr': 0.00016613333333333335, 'samples': 319456, 'steps': 623, 'loss/train': 5.178600311279297} -09/20/2021 16:39:00 - INFO - __main__ - Step 9984: {'lr': 0.00016613333333333335, 'samples': 319488, 'steps': 623, 'loss/train': 4.621699810028076} -09/20/2021 16:39:01 - INFO - __main__ - Step 9985: {'lr': 0.0001664, 'samples': 319520, 'steps': 624, 'loss/train': 4.5192975997924805} -09/20/2021 16:39:02 - INFO - __main__ - Step 9986: {'lr': 0.0001664, 'samples': 319552, 'steps': 624, 'loss/train': 4.483843803405762} -09/20/2021 16:39:03 - INFO - __main__ - Step 9987: {'lr': 0.0001664, 'samples': 319584, 'steps': 624, 'loss/train': 3.290112257003784} -09/20/2021 16:39:03 - INFO - __main__ - Step 9988: {'lr': 0.0001664, 'samples': 319616, 'steps': 624, 'loss/train': 4.268388748168945} -09/20/2021 16:39:04 - INFO - __main__ - Step 9989: {'lr': 0.0001664, 'samples': 319648, 'steps': 624, 'loss/train': 4.235447406768799} -09/20/2021 16:39:05 - INFO - __main__ - Step 9990: {'lr': 0.0001664, 'samples': 319680, 'steps': 624, 'loss/train': 4.066195964813232} -09/20/2021 16:39:06 - INFO - __main__ - Step 9991: {'lr': 0.0001664, 'samples': 319712, 'steps': 624, 'loss/train': 4.539148330688477} -09/20/2021 16:39:06 - INFO - __main__ - Step 9992: {'lr': 0.0001664, 'samples': 319744, 'steps': 624, 'loss/train': 6.999685287475586} -09/20/2021 16:39:07 - INFO - __main__ - Step 9993: {'lr': 0.0001664, 'samples': 319776, 'steps': 624, 'loss/train': 3.9571149349212646} -09/20/2021 16:39:08 - INFO - __main__ - Step 9994: {'lr': 0.0001664, 'samples': 319808, 'steps': 624, 'loss/train': 4.730258941650391} -09/20/2021 16:39:09 - INFO - __main__ - Step 9995: {'lr': 0.0001664, 'samples': 319840, 'steps': 624, 'loss/train': 4.2211432456970215} -09/20/2021 16:39:09 - INFO - __main__ - Step 9996: {'lr': 0.0001664, 'samples': 319872, 'steps': 624, 'loss/train': 3.744978189468384} -09/20/2021 16:39:10 - INFO - __main__ - Step 9997: {'lr': 0.0001664, 'samples': 319904, 'steps': 624, 'loss/train': 3.6730151176452637} -09/20/2021 16:39:11 - INFO - __main__ - Step 9998: {'lr': 0.0001664, 'samples': 319936, 'steps': 624, 'loss/train': 5.430405139923096} -09/20/2021 16:39:12 - INFO - __main__ - Step 9999: {'lr': 0.0001664, 'samples': 319968, 'steps': 624, 'loss/train': 3.8263773918151855} -09/20/2021 16:39:12 - INFO - __main__ - Step 10000: {'lr': 0.0001664, 'samples': 320000, 'steps': 624, 'loss/train': 4.452033996582031} -09/20/2021 16:39:13 - INFO - __main__ - Step 10001: {'lr': 0.0001666666666666667, 'samples': 320032, 'steps': 625, 'loss/train': 4.145682334899902} -09/20/2021 16:39:14 - INFO - __main__ - Step 10002: {'lr': 0.0001666666666666667, 'samples': 320064, 'steps': 625, 'loss/train': 5.382946014404297} -09/20/2021 16:39:15 - INFO - __main__ - Step 10003: {'lr': 0.0001666666666666667, 'samples': 320096, 'steps': 625, 'loss/train': 3.6951398849487305} -09/20/2021 16:39:15 - INFO - __main__ - Step 10004: {'lr': 0.0001666666666666667, 'samples': 320128, 'steps': 625, 'loss/train': 4.640779972076416} -09/20/2021 16:39:16 - INFO - __main__ - Step 10005: {'lr': 0.0001666666666666667, 'samples': 320160, 'steps': 625, 'loss/train': 4.50354528427124} -09/20/2021 16:39:18 - INFO - __main__ - Step 10006: {'lr': 0.0001666666666666667, 'samples': 320192, 'steps': 625, 'loss/train': 3.8940389156341553} -09/20/2021 16:39:18 - INFO - __main__ - Step 10007: {'lr': 0.0001666666666666667, 'samples': 320224, 'steps': 625, 'loss/train': 4.099694728851318} -09/20/2021 16:39:19 - INFO - __main__ - Step 10008: {'lr': 0.0001666666666666667, 'samples': 320256, 'steps': 625, 'loss/train': 4.464291572570801} -09/20/2021 16:39:20 - INFO - __main__ - Step 10009: {'lr': 0.0001666666666666667, 'samples': 320288, 'steps': 625, 'loss/train': 4.17569637298584} -09/20/2021 16:39:21 - INFO - __main__ - Step 10010: {'lr': 0.0001666666666666667, 'samples': 320320, 'steps': 625, 'loss/train': 4.964399814605713} -09/20/2021 16:39:21 - INFO - __main__ - Step 10011: {'lr': 0.0001666666666666667, 'samples': 320352, 'steps': 625, 'loss/train': 3.8497726917266846} -09/20/2021 16:39:22 - INFO - __main__ - Step 10012: {'lr': 0.0001666666666666667, 'samples': 320384, 'steps': 625, 'loss/train': 3.8907060623168945} -09/20/2021 16:39:23 - INFO - __main__ - Step 10013: {'lr': 0.0001666666666666667, 'samples': 320416, 'steps': 625, 'loss/train': 1.6876345872879028} -09/20/2021 16:39:24 - INFO - __main__ - Step 10014: {'lr': 0.0001666666666666667, 'samples': 320448, 'steps': 625, 'loss/train': 4.92135763168335} -09/20/2021 16:39:24 - INFO - __main__ - Step 10015: {'lr': 0.0001666666666666667, 'samples': 320480, 'steps': 625, 'loss/train': 3.9993014335632324} -09/20/2021 16:39:25 - INFO - __main__ - Step 10016: {'lr': 0.0001666666666666667, 'samples': 320512, 'steps': 625, 'loss/train': 4.140524864196777} -09/20/2021 16:39:26 - INFO - __main__ - Step 10017: {'lr': 0.00016693333333333334, 'samples': 320544, 'steps': 626, 'loss/train': 4.3780293464660645} -09/20/2021 16:39:27 - INFO - __main__ - Step 10018: {'lr': 0.00016693333333333334, 'samples': 320576, 'steps': 626, 'loss/train': 4.754703998565674} -09/20/2021 16:39:27 - INFO - __main__ - Step 10019: {'lr': 0.00016693333333333334, 'samples': 320608, 'steps': 626, 'loss/train': 4.896443843841553} -09/20/2021 16:39:28 - INFO - __main__ - Step 10020: {'lr': 0.00016693333333333334, 'samples': 320640, 'steps': 626, 'loss/train': 5.925414085388184} -09/20/2021 16:39:29 - INFO - __main__ - Step 10021: {'lr': 0.00016693333333333334, 'samples': 320672, 'steps': 626, 'loss/train': 4.329660892486572} -09/20/2021 16:39:30 - INFO - __main__ - Step 10022: {'lr': 0.00016693333333333334, 'samples': 320704, 'steps': 626, 'loss/train': 4.227713108062744} -09/20/2021 16:39:30 - INFO - __main__ - Step 10023: {'lr': 0.00016693333333333334, 'samples': 320736, 'steps': 626, 'loss/train': 3.5983402729034424} -09/20/2021 16:39:31 - INFO - __main__ - Step 10024: {'lr': 0.00016693333333333334, 'samples': 320768, 'steps': 626, 'loss/train': 4.574532985687256} -09/20/2021 16:39:32 - INFO - __main__ - Step 10025: {'lr': 0.00016693333333333334, 'samples': 320800, 'steps': 626, 'loss/train': 5.175206661224365} -09/20/2021 16:39:33 - INFO - __main__ - Step 10026: {'lr': 0.00016693333333333334, 'samples': 320832, 'steps': 626, 'loss/train': 4.390997886657715} -09/20/2021 16:39:33 - INFO - __main__ - Step 10027: {'lr': 0.00016693333333333334, 'samples': 320864, 'steps': 626, 'loss/train': 5.334691524505615} -09/20/2021 16:39:34 - INFO - __main__ - Step 10028: {'lr': 0.00016693333333333334, 'samples': 320896, 'steps': 626, 'loss/train': 4.2418532371521} -09/20/2021 16:39:35 - INFO - __main__ - Step 10029: {'lr': 0.00016693333333333334, 'samples': 320928, 'steps': 626, 'loss/train': 4.868732929229736} -09/20/2021 16:39:36 - INFO - __main__ - Step 10030: {'lr': 0.00016693333333333334, 'samples': 320960, 'steps': 626, 'loss/train': 5.224145412445068} -09/20/2021 16:39:36 - INFO - __main__ - Step 10031: {'lr': 0.00016693333333333334, 'samples': 320992, 'steps': 626, 'loss/train': 4.094022750854492} -09/20/2021 16:39:37 - INFO - __main__ - Step 10032: {'lr': 0.00016693333333333334, 'samples': 321024, 'steps': 626, 'loss/train': 5.469539165496826} -09/20/2021 16:39:38 - INFO - __main__ - Step 10033: {'lr': 0.0001672, 'samples': 321056, 'steps': 627, 'loss/train': 4.69596529006958} -09/20/2021 16:39:39 - INFO - __main__ - Step 10034: {'lr': 0.0001672, 'samples': 321088, 'steps': 627, 'loss/train': 4.846343517303467} -09/20/2021 16:39:40 - INFO - __main__ - Step 10035: {'lr': 0.0001672, 'samples': 321120, 'steps': 627, 'loss/train': 5.337927341461182} -09/20/2021 16:39:40 - INFO - __main__ - Step 10036: {'lr': 0.0001672, 'samples': 321152, 'steps': 627, 'loss/train': 4.335759162902832} -09/20/2021 16:39:42 - INFO - __main__ - Step 10037: {'lr': 0.0001672, 'samples': 321184, 'steps': 627, 'loss/train': 2.576620101928711} -09/20/2021 16:39:42 - INFO - __main__ - Step 10038: {'lr': 0.0001672, 'samples': 321216, 'steps': 627, 'loss/train': 4.2095489501953125} -09/20/2021 16:39:43 - INFO - __main__ - Step 10039: {'lr': 0.0001672, 'samples': 321248, 'steps': 627, 'loss/train': 4.371804714202881} -09/20/2021 16:39:44 - INFO - __main__ - Step 10040: {'lr': 0.0001672, 'samples': 321280, 'steps': 627, 'loss/train': 4.661613464355469} -09/20/2021 16:39:45 - INFO - __main__ - Step 10041: {'lr': 0.0001672, 'samples': 321312, 'steps': 627, 'loss/train': 4.524106502532959} -09/20/2021 16:39:45 - INFO - __main__ - Step 10042: {'lr': 0.0001672, 'samples': 321344, 'steps': 627, 'loss/train': 4.9365010261535645} -09/20/2021 16:39:46 - INFO - __main__ - Step 10043: {'lr': 0.0001672, 'samples': 321376, 'steps': 627, 'loss/train': 4.287324905395508} -09/20/2021 16:39:47 - INFO - __main__ - Step 10044: {'lr': 0.0001672, 'samples': 321408, 'steps': 627, 'loss/train': 4.707668781280518} -09/20/2021 16:39:48 - INFO - __main__ - Step 10045: {'lr': 0.0001672, 'samples': 321440, 'steps': 627, 'loss/train': 3.8196945190429688} -09/20/2021 16:39:48 - INFO - __main__ - Step 10046: {'lr': 0.0001672, 'samples': 321472, 'steps': 627, 'loss/train': 4.914789199829102} -09/20/2021 16:39:49 - INFO - __main__ - Step 10047: {'lr': 0.0001672, 'samples': 321504, 'steps': 627, 'loss/train': 4.907291412353516} -09/20/2021 16:39:50 - INFO - __main__ - Step 10048: {'lr': 0.0001672, 'samples': 321536, 'steps': 627, 'loss/train': 4.682919979095459} -09/20/2021 16:39:51 - INFO - __main__ - Step 10049: {'lr': 0.00016746666666666668, 'samples': 321568, 'steps': 628, 'loss/train': 3.006054639816284} -09/20/2021 16:39:51 - INFO - __main__ - Step 10050: {'lr': 0.00016746666666666668, 'samples': 321600, 'steps': 628, 'loss/train': 4.326083183288574} -09/20/2021 16:39:52 - INFO - __main__ - Step 10051: {'lr': 0.00016746666666666668, 'samples': 321632, 'steps': 628, 'loss/train': 4.384821891784668} -09/20/2021 16:39:53 - INFO - __main__ - Step 10052: {'lr': 0.00016746666666666668, 'samples': 321664, 'steps': 628, 'loss/train': 4.766671180725098} -09/20/2021 16:39:54 - INFO - __main__ - Step 10053: {'lr': 0.00016746666666666668, 'samples': 321696, 'steps': 628, 'loss/train': 4.519527435302734} -09/20/2021 16:39:54 - INFO - __main__ - Step 10054: {'lr': 0.00016746666666666668, 'samples': 321728, 'steps': 628, 'loss/train': 4.83016300201416} -09/20/2021 16:39:55 - INFO - __main__ - Step 10055: {'lr': 0.00016746666666666668, 'samples': 321760, 'steps': 628, 'loss/train': 4.970489501953125} -09/20/2021 16:39:56 - INFO - __main__ - Step 10056: {'lr': 0.00016746666666666668, 'samples': 321792, 'steps': 628, 'loss/train': 3.9484803676605225} -09/20/2021 16:39:57 - INFO - __main__ - Step 10057: {'lr': 0.00016746666666666668, 'samples': 321824, 'steps': 628, 'loss/train': 4.636166572570801} -09/20/2021 16:39:57 - INFO - __main__ - Step 10058: {'lr': 0.00016746666666666668, 'samples': 321856, 'steps': 628, 'loss/train': 5.658662796020508} -09/20/2021 16:39:58 - INFO - __main__ - Step 10059: {'lr': 0.00016746666666666668, 'samples': 321888, 'steps': 628, 'loss/train': 4.863079071044922} -09/20/2021 16:39:59 - INFO - __main__ - Step 10060: {'lr': 0.00016746666666666668, 'samples': 321920, 'steps': 628, 'loss/train': 4.268015384674072} -09/20/2021 16:40:00 - INFO - __main__ - Step 10061: {'lr': 0.00016746666666666668, 'samples': 321952, 'steps': 628, 'loss/train': 4.824823379516602} -09/20/2021 16:40:00 - INFO - __main__ - Step 10062: {'lr': 0.00016746666666666668, 'samples': 321984, 'steps': 628, 'loss/train': 3.6257007122039795} -09/20/2021 16:40:01 - INFO - __main__ - Step 10063: {'lr': 0.00016746666666666668, 'samples': 322016, 'steps': 628, 'loss/train': 4.237334728240967} -09/20/2021 16:40:02 - INFO - __main__ - Step 10064: {'lr': 0.00016746666666666668, 'samples': 322048, 'steps': 628, 'loss/train': 5.1184892654418945} -09/20/2021 16:40:03 - INFO - __main__ - Step 10065: {'lr': 0.00016773333333333334, 'samples': 322080, 'steps': 629, 'loss/train': 4.683593273162842} -09/20/2021 16:40:04 - INFO - __main__ - Step 10066: {'lr': 0.00016773333333333334, 'samples': 322112, 'steps': 629, 'loss/train': 4.373114585876465} -09/20/2021 16:40:05 - INFO - __main__ - Step 10067: {'lr': 0.00016773333333333334, 'samples': 322144, 'steps': 629, 'loss/train': 3.981144905090332} -09/20/2021 16:40:06 - INFO - __main__ - Step 10068: {'lr': 0.00016773333333333334, 'samples': 322176, 'steps': 629, 'loss/train': 3.417849063873291} -09/20/2021 16:40:06 - INFO - __main__ - Step 10069: {'lr': 0.00016773333333333334, 'samples': 322208, 'steps': 629, 'loss/train': 5.673725128173828} -09/20/2021 16:40:07 - INFO - __main__ - Step 10070: {'lr': 0.00016773333333333334, 'samples': 322240, 'steps': 629, 'loss/train': 5.212696075439453} -09/20/2021 16:40:08 - INFO - __main__ - Step 10071: {'lr': 0.00016773333333333334, 'samples': 322272, 'steps': 629, 'loss/train': 4.196231365203857} -09/20/2021 16:40:09 - INFO - __main__ - Step 10072: {'lr': 0.00016773333333333334, 'samples': 322304, 'steps': 629, 'loss/train': 3.8064074516296387} -09/20/2021 16:40:09 - INFO - __main__ - Step 10073: {'lr': 0.00016773333333333334, 'samples': 322336, 'steps': 629, 'loss/train': 4.607867240905762} -09/20/2021 16:40:10 - INFO - __main__ - Step 10074: {'lr': 0.00016773333333333334, 'samples': 322368, 'steps': 629, 'loss/train': 4.3464179039001465} -09/20/2021 16:40:11 - INFO - __main__ - Step 10075: {'lr': 0.00016773333333333334, 'samples': 322400, 'steps': 629, 'loss/train': 4.562891483306885} -09/20/2021 16:40:12 - INFO - __main__ - Step 10076: {'lr': 0.00016773333333333334, 'samples': 322432, 'steps': 629, 'loss/train': 5.8349127769470215} -09/20/2021 16:40:12 - INFO - __main__ - Step 10077: {'lr': 0.00016773333333333334, 'samples': 322464, 'steps': 629, 'loss/train': 2.9461145401000977} -09/20/2021 16:40:13 - INFO - __main__ - Step 10078: {'lr': 0.00016773333333333334, 'samples': 322496, 'steps': 629, 'loss/train': 5.010960102081299} -09/20/2021 16:40:14 - INFO - __main__ - Step 10079: {'lr': 0.00016773333333333334, 'samples': 322528, 'steps': 629, 'loss/train': 4.110593795776367} -09/20/2021 16:40:15 - INFO - __main__ - Step 10080: {'lr': 0.00016773333333333334, 'samples': 322560, 'steps': 629, 'loss/train': 4.560376167297363} -09/20/2021 16:40:15 - INFO - __main__ - Step 10081: {'lr': 0.000168, 'samples': 322592, 'steps': 630, 'loss/train': 4.7551188468933105} -09/20/2021 16:40:16 - INFO - __main__ - Step 10082: {'lr': 0.000168, 'samples': 322624, 'steps': 630, 'loss/train': 5.126014709472656} -09/20/2021 16:40:17 - INFO - __main__ - Step 10083: {'lr': 0.000168, 'samples': 322656, 'steps': 630, 'loss/train': 4.728687286376953} -09/20/2021 16:40:18 - INFO - __main__ - Step 10084: {'lr': 0.000168, 'samples': 322688, 'steps': 630, 'loss/train': 4.3882646560668945} -09/20/2021 16:40:18 - INFO - __main__ - Step 10085: {'lr': 0.000168, 'samples': 322720, 'steps': 630, 'loss/train': 2.8703861236572266} -09/20/2021 16:40:19 - INFO - __main__ - Step 10086: {'lr': 0.000168, 'samples': 322752, 'steps': 630, 'loss/train': 4.87047004699707} -09/20/2021 16:40:20 - INFO - __main__ - Step 10087: {'lr': 0.000168, 'samples': 322784, 'steps': 630, 'loss/train': 4.6341471672058105} -09/20/2021 16:40:21 - INFO - __main__ - Step 10088: {'lr': 0.000168, 'samples': 322816, 'steps': 630, 'loss/train': 4.1588826179504395} -09/20/2021 16:40:21 - INFO - __main__ - Step 10089: {'lr': 0.000168, 'samples': 322848, 'steps': 630, 'loss/train': 4.020715713500977} -09/20/2021 16:40:22 - INFO - __main__ - Step 10090: {'lr': 0.000168, 'samples': 322880, 'steps': 630, 'loss/train': 4.350329399108887} -09/20/2021 16:40:23 - INFO - __main__ - Step 10091: {'lr': 0.000168, 'samples': 322912, 'steps': 630, 'loss/train': 3.754815101623535} -09/20/2021 16:40:24 - INFO - __main__ - Step 10092: {'lr': 0.000168, 'samples': 322944, 'steps': 630, 'loss/train': 3.1252334117889404} -09/20/2021 16:40:24 - INFO - __main__ - Step 10093: {'lr': 0.000168, 'samples': 322976, 'steps': 630, 'loss/train': 5.503917217254639} -09/20/2021 16:40:25 - INFO - __main__ - Step 10094: {'lr': 0.000168, 'samples': 323008, 'steps': 630, 'loss/train': 4.8853759765625} -09/20/2021 16:40:26 - INFO - __main__ - Step 10095: {'lr': 0.000168, 'samples': 323040, 'steps': 630, 'loss/train': 5.319187164306641} -09/20/2021 16:40:27 - INFO - __main__ - Step 10096: {'lr': 0.000168, 'samples': 323072, 'steps': 630, 'loss/train': 3.7378273010253906} -09/20/2021 16:40:28 - INFO - __main__ - Step 10097: {'lr': 0.00016826666666666667, 'samples': 323104, 'steps': 631, 'loss/train': 5.041411399841309} -09/20/2021 16:40:28 - INFO - __main__ - Step 10098: {'lr': 0.00016826666666666667, 'samples': 323136, 'steps': 631, 'loss/train': 4.09431266784668} -09/20/2021 16:40:30 - INFO - __main__ - Step 10099: {'lr': 0.00016826666666666667, 'samples': 323168, 'steps': 631, 'loss/train': 7.055292129516602} -09/20/2021 16:40:30 - INFO - __main__ - Step 10100: {'lr': 0.00016826666666666667, 'samples': 323200, 'steps': 631, 'loss/train': 6.484431743621826} -09/20/2021 16:40:31 - INFO - __main__ - Step 10101: {'lr': 0.00016826666666666667, 'samples': 323232, 'steps': 631, 'loss/train': 3.7160346508026123} -09/20/2021 16:40:32 - INFO - __main__ - Step 10102: {'lr': 0.00016826666666666667, 'samples': 323264, 'steps': 631, 'loss/train': 2.5366759300231934} -09/20/2021 16:40:33 - INFO - __main__ - Step 10103: {'lr': 0.00016826666666666667, 'samples': 323296, 'steps': 631, 'loss/train': 4.256667613983154} -09/20/2021 16:40:33 - INFO - __main__ - Step 10104: {'lr': 0.00016826666666666667, 'samples': 323328, 'steps': 631, 'loss/train': 5.184509754180908} -09/20/2021 16:40:34 - INFO - __main__ - Step 10105: {'lr': 0.00016826666666666667, 'samples': 323360, 'steps': 631, 'loss/train': 4.487205982208252} -09/20/2021 16:40:35 - INFO - __main__ - Step 10106: {'lr': 0.00016826666666666667, 'samples': 323392, 'steps': 631, 'loss/train': 3.6262052059173584} -09/20/2021 16:40:36 - INFO - __main__ - Step 10107: {'lr': 0.00016826666666666667, 'samples': 323424, 'steps': 631, 'loss/train': 4.370908260345459} -09/20/2021 16:40:36 - INFO - __main__ - Step 10108: {'lr': 0.00016826666666666667, 'samples': 323456, 'steps': 631, 'loss/train': 4.214153289794922} -09/20/2021 16:40:37 - INFO - __main__ - Step 10109: {'lr': 0.00016826666666666667, 'samples': 323488, 'steps': 631, 'loss/train': 4.85012674331665} -09/20/2021 16:40:38 - INFO - __main__ - Step 10110: {'lr': 0.00016826666666666667, 'samples': 323520, 'steps': 631, 'loss/train': 4.668302059173584} -09/20/2021 16:40:39 - INFO - __main__ - Step 10111: {'lr': 0.00016826666666666667, 'samples': 323552, 'steps': 631, 'loss/train': 4.9391560554504395} -09/20/2021 16:40:39 - INFO - __main__ - Step 10112: {'lr': 0.00016826666666666667, 'samples': 323584, 'steps': 631, 'loss/train': 5.498301029205322} -09/20/2021 16:40:40 - INFO - __main__ - Step 10113: {'lr': 0.00016853333333333336, 'samples': 323616, 'steps': 632, 'loss/train': 5.391256332397461} -09/20/2021 16:40:41 - INFO - __main__ - Step 10114: {'lr': 0.00016853333333333336, 'samples': 323648, 'steps': 632, 'loss/train': 4.440759658813477} -09/20/2021 16:40:42 - INFO - __main__ - Step 10115: {'lr': 0.00016853333333333336, 'samples': 323680, 'steps': 632, 'loss/train': 4.486217975616455} -09/20/2021 16:40:43 - INFO - __main__ - Step 10116: {'lr': 0.00016853333333333336, 'samples': 323712, 'steps': 632, 'loss/train': 5.106453895568848} -09/20/2021 16:40:43 - INFO - __main__ - Step 10117: {'lr': 0.00016853333333333336, 'samples': 323744, 'steps': 632, 'loss/train': 4.771122932434082} -09/20/2021 16:40:44 - INFO - __main__ - Step 10118: {'lr': 0.00016853333333333336, 'samples': 323776, 'steps': 632, 'loss/train': 4.690314292907715} -09/20/2021 16:40:45 - INFO - __main__ - Step 10119: {'lr': 0.00016853333333333336, 'samples': 323808, 'steps': 632, 'loss/train': 5.230865001678467} -09/20/2021 16:40:46 - INFO - __main__ - Step 10120: {'lr': 0.00016853333333333336, 'samples': 323840, 'steps': 632, 'loss/train': 5.055270671844482} -09/20/2021 16:40:46 - INFO - __main__ - Step 10121: {'lr': 0.00016853333333333336, 'samples': 323872, 'steps': 632, 'loss/train': 4.226318836212158} -09/20/2021 16:40:47 - INFO - __main__ - Step 10122: {'lr': 0.00016853333333333336, 'samples': 323904, 'steps': 632, 'loss/train': 4.01892614364624} -09/20/2021 16:40:48 - INFO - __main__ - Step 10123: {'lr': 0.00016853333333333336, 'samples': 323936, 'steps': 632, 'loss/train': 4.437810897827148} -09/20/2021 16:40:49 - INFO - __main__ - Step 10124: {'lr': 0.00016853333333333336, 'samples': 323968, 'steps': 632, 'loss/train': 6.1741623878479} -09/20/2021 16:40:49 - INFO - __main__ - Step 10125: {'lr': 0.00016853333333333336, 'samples': 324000, 'steps': 632, 'loss/train': 5.0777506828308105} -09/20/2021 16:40:50 - INFO - __main__ - Step 10126: {'lr': 0.00016853333333333336, 'samples': 324032, 'steps': 632, 'loss/train': 4.678248882293701} -09/20/2021 16:40:51 - INFO - __main__ - Step 10127: {'lr': 0.00016853333333333336, 'samples': 324064, 'steps': 632, 'loss/train': 4.080193996429443} -09/20/2021 16:40:52 - INFO - __main__ - Step 10128: {'lr': 0.00016853333333333336, 'samples': 324096, 'steps': 632, 'loss/train': 4.633996486663818} -09/20/2021 16:40:52 - INFO - __main__ - Step 10129: {'lr': 0.0001688, 'samples': 324128, 'steps': 633, 'loss/train': 4.41294527053833} -09/20/2021 16:40:54 - INFO - __main__ - Step 10130: {'lr': 0.0001688, 'samples': 324160, 'steps': 633, 'loss/train': 4.0488457679748535} -09/20/2021 16:40:54 - INFO - __main__ - Step 10131: {'lr': 0.0001688, 'samples': 324192, 'steps': 633, 'loss/train': 3.9045345783233643} -09/20/2021 16:40:55 - INFO - __main__ - Step 10132: {'lr': 0.0001688, 'samples': 324224, 'steps': 633, 'loss/train': 4.2445292472839355} -09/20/2021 16:40:56 - INFO - __main__ - Step 10133: {'lr': 0.0001688, 'samples': 324256, 'steps': 633, 'loss/train': 4.356705188751221} -09/20/2021 16:40:57 - INFO - __main__ - Step 10134: {'lr': 0.0001688, 'samples': 324288, 'steps': 633, 'loss/train': 4.452414035797119} -09/20/2021 16:40:57 - INFO - __main__ - Step 10135: {'lr': 0.0001688, 'samples': 324320, 'steps': 633, 'loss/train': 4.1927032470703125} -09/20/2021 16:40:58 - INFO - __main__ - Step 10136: {'lr': 0.0001688, 'samples': 324352, 'steps': 633, 'loss/train': 4.734131336212158} -09/20/2021 16:40:59 - INFO - __main__ - Step 10137: {'lr': 0.0001688, 'samples': 324384, 'steps': 633, 'loss/train': 4.280320644378662} -09/20/2021 16:41:00 - INFO - __main__ - Step 10138: {'lr': 0.0001688, 'samples': 324416, 'steps': 633, 'loss/train': 4.4610676765441895} -09/20/2021 16:41:00 - INFO - __main__ - Step 10139: {'lr': 0.0001688, 'samples': 324448, 'steps': 633, 'loss/train': 4.963132381439209} -09/20/2021 16:41:01 - INFO - __main__ - Step 10140: {'lr': 0.0001688, 'samples': 324480, 'steps': 633, 'loss/train': 1.644898772239685} -09/20/2021 16:41:02 - INFO - __main__ - Step 10141: {'lr': 0.0001688, 'samples': 324512, 'steps': 633, 'loss/train': 4.933330059051514} -09/20/2021 16:41:03 - INFO - __main__ - Step 10142: {'lr': 0.0001688, 'samples': 324544, 'steps': 633, 'loss/train': 4.475231170654297} -09/20/2021 16:41:03 - INFO - __main__ - Step 10143: {'lr': 0.0001688, 'samples': 324576, 'steps': 633, 'loss/train': 3.8442585468292236} -09/20/2021 16:41:04 - INFO - __main__ - Step 10144: {'lr': 0.0001688, 'samples': 324608, 'steps': 633, 'loss/train': 3.7989189624786377} -09/20/2021 16:41:05 - INFO - __main__ - Step 10145: {'lr': 0.0001690666666666667, 'samples': 324640, 'steps': 634, 'loss/train': 4.484861850738525} -09/20/2021 16:41:06 - INFO - __main__ - Step 10146: {'lr': 0.0001690666666666667, 'samples': 324672, 'steps': 634, 'loss/train': 3.8718130588531494} -09/20/2021 16:41:07 - INFO - __main__ - Step 10147: {'lr': 0.0001690666666666667, 'samples': 324704, 'steps': 634, 'loss/train': 4.28097677230835} -09/20/2021 16:41:07 - INFO - __main__ - Step 10148: {'lr': 0.0001690666666666667, 'samples': 324736, 'steps': 634, 'loss/train': 5.152368068695068} -09/20/2021 16:41:08 - INFO - __main__ - Step 10149: {'lr': 0.0001690666666666667, 'samples': 324768, 'steps': 634, 'loss/train': 5.981654644012451} -09/20/2021 16:41:09 - INFO - __main__ - Step 10150: {'lr': 0.0001690666666666667, 'samples': 324800, 'steps': 634, 'loss/train': 3.6422619819641113} -09/20/2021 16:41:10 - INFO - __main__ - Step 10151: {'lr': 0.0001690666666666667, 'samples': 324832, 'steps': 634, 'loss/train': 4.85672664642334} -09/20/2021 16:41:10 - INFO - __main__ - Step 10152: {'lr': 0.0001690666666666667, 'samples': 324864, 'steps': 634, 'loss/train': 7.223397254943848} -09/20/2021 16:41:11 - INFO - __main__ - Step 10153: {'lr': 0.0001690666666666667, 'samples': 324896, 'steps': 634, 'loss/train': 3.8990097045898438} -09/20/2021 16:41:12 - INFO - __main__ - Step 10154: {'lr': 0.0001690666666666667, 'samples': 324928, 'steps': 634, 'loss/train': 4.058773994445801} -09/20/2021 16:41:13 - INFO - __main__ - Step 10155: {'lr': 0.0001690666666666667, 'samples': 324960, 'steps': 634, 'loss/train': 4.482312202453613} -09/20/2021 16:41:13 - INFO - __main__ - Step 10156: {'lr': 0.0001690666666666667, 'samples': 324992, 'steps': 634, 'loss/train': 3.5350069999694824} -09/20/2021 16:41:14 - INFO - __main__ - Step 10157: {'lr': 0.0001690666666666667, 'samples': 325024, 'steps': 634, 'loss/train': 5.632074356079102} -09/20/2021 16:41:15 - INFO - __main__ - Step 10158: {'lr': 0.0001690666666666667, 'samples': 325056, 'steps': 634, 'loss/train': 4.4295501708984375} -09/20/2021 16:41:16 - INFO - __main__ - Step 10159: {'lr': 0.0001690666666666667, 'samples': 325088, 'steps': 634, 'loss/train': 4.193883895874023} -09/20/2021 16:41:16 - INFO - __main__ - Step 10160: {'lr': 0.0001690666666666667, 'samples': 325120, 'steps': 634, 'loss/train': 4.367762088775635} -09/20/2021 16:41:17 - INFO - __main__ - Step 10161: {'lr': 0.00016933333333333335, 'samples': 325152, 'steps': 635, 'loss/train': 5.117253303527832} -09/20/2021 16:41:18 - INFO - __main__ - Step 10162: {'lr': 0.00016933333333333335, 'samples': 325184, 'steps': 635, 'loss/train': 4.740849494934082} -09/20/2021 16:41:19 - INFO - __main__ - Step 10163: {'lr': 0.00016933333333333335, 'samples': 325216, 'steps': 635, 'loss/train': 3.60903263092041} -09/20/2021 16:41:20 - INFO - __main__ - Step 10164: {'lr': 0.00016933333333333335, 'samples': 325248, 'steps': 635, 'loss/train': 4.07126522064209} -09/20/2021 16:41:21 - INFO - __main__ - Step 10165: {'lr': 0.00016933333333333335, 'samples': 325280, 'steps': 635, 'loss/train': 5.0553202629089355} -09/20/2021 16:41:21 - INFO - __main__ - Step 10166: {'lr': 0.00016933333333333335, 'samples': 325312, 'steps': 635, 'loss/train': 5.186087608337402} -09/20/2021 16:41:22 - INFO - __main__ - Step 10167: {'lr': 0.00016933333333333335, 'samples': 325344, 'steps': 635, 'loss/train': 4.155294895172119} -09/20/2021 16:41:23 - INFO - __main__ - Step 10168: {'lr': 0.00016933333333333335, 'samples': 325376, 'steps': 635, 'loss/train': 5.120288848876953} -09/20/2021 16:41:24 - INFO - __main__ - Step 10169: {'lr': 0.00016933333333333335, 'samples': 325408, 'steps': 635, 'loss/train': 4.5129008293151855} -09/20/2021 16:41:24 - INFO - __main__ - Step 10170: {'lr': 0.00016933333333333335, 'samples': 325440, 'steps': 635, 'loss/train': 4.383552074432373} -09/20/2021 16:41:25 - INFO - __main__ - Step 10171: {'lr': 0.00016933333333333335, 'samples': 325472, 'steps': 635, 'loss/train': 4.633635520935059} -09/20/2021 16:41:26 - INFO - __main__ - Step 10172: {'lr': 0.00016933333333333335, 'samples': 325504, 'steps': 635, 'loss/train': 4.104255676269531} -09/20/2021 16:41:27 - INFO - __main__ - Step 10173: {'lr': 0.00016933333333333335, 'samples': 325536, 'steps': 635, 'loss/train': 5.021966457366943} -09/20/2021 16:41:27 - INFO - __main__ - Step 10174: {'lr': 0.00016933333333333335, 'samples': 325568, 'steps': 635, 'loss/train': 4.274361610412598} -09/20/2021 16:41:28 - INFO - __main__ - Step 10175: {'lr': 0.00016933333333333335, 'samples': 325600, 'steps': 635, 'loss/train': 4.291200160980225} -09/20/2021 16:41:29 - INFO - __main__ - Step 10176: {'lr': 0.00016933333333333335, 'samples': 325632, 'steps': 635, 'loss/train': 4.351728916168213} -09/20/2021 16:41:30 - INFO - __main__ - Step 10177: {'lr': 0.0001696, 'samples': 325664, 'steps': 636, 'loss/train': 3.899359703063965} -09/20/2021 16:41:31 - INFO - __main__ - Step 10178: {'lr': 0.0001696, 'samples': 325696, 'steps': 636, 'loss/train': 4.362307071685791} -09/20/2021 16:41:31 - INFO - __main__ - Step 10179: {'lr': 0.0001696, 'samples': 325728, 'steps': 636, 'loss/train': 4.634158611297607} -09/20/2021 16:41:32 - INFO - __main__ - Step 10180: {'lr': 0.0001696, 'samples': 325760, 'steps': 636, 'loss/train': 4.752762794494629} -09/20/2021 16:41:33 - INFO - __main__ - Step 10181: {'lr': 0.0001696, 'samples': 325792, 'steps': 636, 'loss/train': 4.571507453918457} -09/20/2021 16:41:34 - INFO - __main__ - Step 10182: {'lr': 0.0001696, 'samples': 325824, 'steps': 636, 'loss/train': 3.961545944213867} -09/20/2021 16:41:34 - INFO - __main__ - Step 10183: {'lr': 0.0001696, 'samples': 325856, 'steps': 636, 'loss/train': 4.350127220153809} -09/20/2021 16:41:35 - INFO - __main__ - Step 10184: {'lr': 0.0001696, 'samples': 325888, 'steps': 636, 'loss/train': 4.387403964996338} -09/20/2021 16:41:36 - INFO - __main__ - Step 10185: {'lr': 0.0001696, 'samples': 325920, 'steps': 636, 'loss/train': 4.82633113861084} -09/20/2021 16:41:37 - INFO - __main__ - Step 10186: {'lr': 0.0001696, 'samples': 325952, 'steps': 636, 'loss/train': 4.640994071960449} -09/20/2021 16:41:37 - INFO - __main__ - Step 10187: {'lr': 0.0001696, 'samples': 325984, 'steps': 636, 'loss/train': 4.3254265785217285} -09/20/2021 16:41:38 - INFO - __main__ - Step 10188: {'lr': 0.0001696, 'samples': 326016, 'steps': 636, 'loss/train': 4.265139102935791} -09/20/2021 16:41:39 - INFO - __main__ - Step 10189: {'lr': 0.0001696, 'samples': 326048, 'steps': 636, 'loss/train': 4.278520584106445} -09/20/2021 16:41:40 - INFO - __main__ - Step 10190: {'lr': 0.0001696, 'samples': 326080, 'steps': 636, 'loss/train': 4.240435600280762} -09/20/2021 16:41:40 - INFO - __main__ - Step 10191: {'lr': 0.0001696, 'samples': 326112, 'steps': 636, 'loss/train': 5.357181549072266} -09/20/2021 16:41:41 - INFO - __main__ - Step 10192: {'lr': 0.0001696, 'samples': 326144, 'steps': 636, 'loss/train': 2.7763404846191406} -09/20/2021 16:41:43 - INFO - __main__ - Step 10193: {'lr': 0.00016986666666666668, 'samples': 326176, 'steps': 637, 'loss/train': 4.193379878997803} -09/20/2021 16:41:43 - INFO - __main__ - Step 10194: {'lr': 0.00016986666666666668, 'samples': 326208, 'steps': 637, 'loss/train': 5.0548624992370605} -09/20/2021 16:41:44 - INFO - __main__ - Step 10195: {'lr': 0.00016986666666666668, 'samples': 326240, 'steps': 637, 'loss/train': 5.034738063812256} -09/20/2021 16:41:45 - INFO - __main__ - Step 10196: {'lr': 0.00016986666666666668, 'samples': 326272, 'steps': 637, 'loss/train': 3.8144233226776123} -09/20/2021 16:41:46 - INFO - __main__ - Step 10197: {'lr': 0.00016986666666666668, 'samples': 326304, 'steps': 637, 'loss/train': 5.289655685424805} -09/20/2021 16:41:46 - INFO - __main__ - Step 10198: {'lr': 0.00016986666666666668, 'samples': 326336, 'steps': 637, 'loss/train': 4.266887187957764} -09/20/2021 16:41:47 - INFO - __main__ - Step 10199: {'lr': 0.00016986666666666668, 'samples': 326368, 'steps': 637, 'loss/train': 4.219175338745117} -09/20/2021 16:41:48 - INFO - __main__ - Step 10200: {'lr': 0.00016986666666666668, 'samples': 326400, 'steps': 637, 'loss/train': 4.069677829742432} -09/20/2021 16:41:49 - INFO - __main__ - Step 10201: {'lr': 0.00016986666666666668, 'samples': 326432, 'steps': 637, 'loss/train': 3.827530860900879} -09/20/2021 16:41:49 - INFO - __main__ - Step 10202: {'lr': 0.00016986666666666668, 'samples': 326464, 'steps': 637, 'loss/train': 4.153782367706299} -09/20/2021 16:41:50 - INFO - __main__ - Step 10203: {'lr': 0.00016986666666666668, 'samples': 326496, 'steps': 637, 'loss/train': 4.322978496551514} -09/20/2021 16:41:51 - INFO - __main__ - Step 10204: {'lr': 0.00016986666666666668, 'samples': 326528, 'steps': 637, 'loss/train': 4.863372325897217} -09/20/2021 16:41:52 - INFO - __main__ - Step 10205: {'lr': 0.00016986666666666668, 'samples': 326560, 'steps': 637, 'loss/train': 3.6398494243621826} -09/20/2021 16:41:52 - INFO - __main__ - Step 10206: {'lr': 0.00016986666666666668, 'samples': 326592, 'steps': 637, 'loss/train': 4.963572025299072} -09/20/2021 16:41:53 - INFO - __main__ - Step 10207: {'lr': 0.00016986666666666668, 'samples': 326624, 'steps': 637, 'loss/train': 6.64964485168457} -09/20/2021 16:41:54 - INFO - __main__ - Step 10208: {'lr': 0.00016986666666666668, 'samples': 326656, 'steps': 637, 'loss/train': 4.774106025695801} -09/20/2021 16:41:55 - INFO - __main__ - Step 10209: {'lr': 0.00017013333333333334, 'samples': 326688, 'steps': 638, 'loss/train': 4.791684627532959} -09/20/2021 16:41:55 - INFO - __main__ - Step 10210: {'lr': 0.00017013333333333334, 'samples': 326720, 'steps': 638, 'loss/train': 4.430123805999756} -09/20/2021 16:41:56 - INFO - __main__ - Step 10211: {'lr': 0.00017013333333333334, 'samples': 326752, 'steps': 638, 'loss/train': 4.338196754455566} -09/20/2021 16:41:57 - INFO - __main__ - Step 10212: {'lr': 0.00017013333333333334, 'samples': 326784, 'steps': 638, 'loss/train': 4.121429920196533} -09/20/2021 16:41:58 - INFO - __main__ - Step 10213: {'lr': 0.00017013333333333334, 'samples': 326816, 'steps': 638, 'loss/train': 4.110612392425537} -09/20/2021 16:41:58 - INFO - __main__ - Step 10214: {'lr': 0.00017013333333333334, 'samples': 326848, 'steps': 638, 'loss/train': 3.927441358566284} -09/20/2021 16:41:59 - INFO - __main__ - Step 10215: {'lr': 0.00017013333333333334, 'samples': 326880, 'steps': 638, 'loss/train': 4.292637348175049} -09/20/2021 16:42:00 - INFO - __main__ - Step 10216: {'lr': 0.00017013333333333334, 'samples': 326912, 'steps': 638, 'loss/train': 3.782259464263916} -09/20/2021 16:42:01 - INFO - __main__ - Step 10217: {'lr': 0.00017013333333333334, 'samples': 326944, 'steps': 638, 'loss/train': 4.097708702087402} -09/20/2021 16:42:01 - INFO - __main__ - Step 10218: {'lr': 0.00017013333333333334, 'samples': 326976, 'steps': 638, 'loss/train': 4.811102390289307} -09/20/2021 16:42:02 - INFO - __main__ - Step 10219: {'lr': 0.00017013333333333334, 'samples': 327008, 'steps': 638, 'loss/train': 4.355464458465576} -09/20/2021 16:42:03 - INFO - __main__ - Step 10220: {'lr': 0.00017013333333333334, 'samples': 327040, 'steps': 638, 'loss/train': 3.828673839569092} -09/20/2021 16:42:04 - INFO - __main__ - Step 10221: {'lr': 0.00017013333333333334, 'samples': 327072, 'steps': 638, 'loss/train': 3.8134469985961914} -09/20/2021 16:42:04 - INFO - __main__ - Step 10222: {'lr': 0.00017013333333333334, 'samples': 327104, 'steps': 638, 'loss/train': 5.007174491882324} -09/20/2021 16:42:06 - INFO - __main__ - Step 10223: {'lr': 0.00017013333333333334, 'samples': 327136, 'steps': 638, 'loss/train': 4.224386215209961} -09/20/2021 16:42:06 - INFO - __main__ - Step 10224: {'lr': 0.00017013333333333334, 'samples': 327168, 'steps': 638, 'loss/train': 4.520863056182861} -09/20/2021 16:42:07 - INFO - __main__ - Step 10225: {'lr': 0.0001704, 'samples': 327200, 'steps': 639, 'loss/train': 4.209879398345947} -09/20/2021 16:42:08 - INFO - __main__ - Step 10226: {'lr': 0.0001704, 'samples': 327232, 'steps': 639, 'loss/train': 4.9684224128723145} -09/20/2021 16:42:09 - INFO - __main__ - Step 10227: {'lr': 0.0001704, 'samples': 327264, 'steps': 639, 'loss/train': 3.4777462482452393} -09/20/2021 16:42:10 - INFO - __main__ - Step 10228: {'lr': 0.0001704, 'samples': 327296, 'steps': 639, 'loss/train': 4.644818305969238} -09/20/2021 16:42:10 - INFO - __main__ - Step 10229: {'lr': 0.0001704, 'samples': 327328, 'steps': 639, 'loss/train': 5.077436447143555} -09/20/2021 16:42:11 - INFO - __main__ - Step 10230: {'lr': 0.0001704, 'samples': 327360, 'steps': 639, 'loss/train': 3.966174364089966} -09/20/2021 16:42:12 - INFO - __main__ - Step 10231: {'lr': 0.0001704, 'samples': 327392, 'steps': 639, 'loss/train': 4.156737804412842} -09/20/2021 16:42:13 - INFO - __main__ - Step 10232: {'lr': 0.0001704, 'samples': 327424, 'steps': 639, 'loss/train': 6.2366743087768555} -09/20/2021 16:42:13 - INFO - __main__ - Step 10233: {'lr': 0.0001704, 'samples': 327456, 'steps': 639, 'loss/train': 4.648721218109131} -09/20/2021 16:42:14 - INFO - __main__ - Step 10234: {'lr': 0.0001704, 'samples': 327488, 'steps': 639, 'loss/train': 3.6964516639709473} -09/20/2021 16:42:15 - INFO - __main__ - Step 10235: {'lr': 0.0001704, 'samples': 327520, 'steps': 639, 'loss/train': 5.46309757232666} -09/20/2021 16:42:16 - INFO - __main__ - Step 10236: {'lr': 0.0001704, 'samples': 327552, 'steps': 639, 'loss/train': 4.471590995788574} -09/20/2021 16:42:16 - INFO - __main__ - Step 10237: {'lr': 0.0001704, 'samples': 327584, 'steps': 639, 'loss/train': 3.8247034549713135} -09/20/2021 16:42:17 - INFO - __main__ - Step 10238: {'lr': 0.0001704, 'samples': 327616, 'steps': 639, 'loss/train': 3.760958433151245} -09/20/2021 16:42:18 - INFO - __main__ - Step 10239: {'lr': 0.0001704, 'samples': 327648, 'steps': 639, 'loss/train': 4.7422776222229} -09/20/2021 16:42:19 - INFO - __main__ - Step 10240: {'lr': 0.0001704, 'samples': 327680, 'steps': 639, 'loss/train': 5.647744178771973} -09/20/2021 16:42:19 - INFO - __main__ - Step 10241: {'lr': 0.00017066666666666668, 'samples': 327712, 'steps': 640, 'loss/train': 5.135714054107666} -09/20/2021 16:42:20 - INFO - __main__ - Step 10242: {'lr': 0.00017066666666666668, 'samples': 327744, 'steps': 640, 'loss/train': 4.378232002258301} -09/20/2021 16:42:21 - INFO - __main__ - Step 10243: {'lr': 0.00017066666666666668, 'samples': 327776, 'steps': 640, 'loss/train': 4.48250675201416} -09/20/2021 16:42:22 - INFO - __main__ - Step 10244: {'lr': 0.00017066666666666668, 'samples': 327808, 'steps': 640, 'loss/train': 5.479816913604736} -09/20/2021 16:42:22 - INFO - __main__ - Step 10245: {'lr': 0.00017066666666666668, 'samples': 327840, 'steps': 640, 'loss/train': 3.547147035598755} -09/20/2021 16:42:23 - INFO - __main__ - Step 10246: {'lr': 0.00017066666666666668, 'samples': 327872, 'steps': 640, 'loss/train': 5.292395114898682} -09/20/2021 16:42:24 - INFO - __main__ - Step 10247: {'lr': 0.00017066666666666668, 'samples': 327904, 'steps': 640, 'loss/train': 4.7165751457214355} -09/20/2021 16:42:25 - INFO - __main__ - Step 10248: {'lr': 0.00017066666666666668, 'samples': 327936, 'steps': 640, 'loss/train': 4.647023677825928} -09/20/2021 16:42:25 - INFO - __main__ - Step 10249: {'lr': 0.00017066666666666668, 'samples': 327968, 'steps': 640, 'loss/train': 4.114291191101074} -09/20/2021 16:42:26 - INFO - __main__ - Step 10250: {'lr': 0.00017066666666666668, 'samples': 328000, 'steps': 640, 'loss/train': 5.4768195152282715} -09/20/2021 16:42:27 - INFO - __main__ - Step 10251: {'lr': 0.00017066666666666668, 'samples': 328032, 'steps': 640, 'loss/train': 4.616696357727051} -09/20/2021 16:42:28 - INFO - __main__ - Step 10252: {'lr': 0.00017066666666666668, 'samples': 328064, 'steps': 640, 'loss/train': 3.6432180404663086} -09/20/2021 16:42:29 - INFO - __main__ - Step 10253: {'lr': 0.00017066666666666668, 'samples': 328096, 'steps': 640, 'loss/train': 6.006295680999756} -09/20/2021 16:42:30 - INFO - __main__ - Step 10254: {'lr': 0.00017066666666666668, 'samples': 328128, 'steps': 640, 'loss/train': 4.889559268951416} -09/20/2021 16:42:30 - INFO - __main__ - Step 10255: {'lr': 0.00017066666666666668, 'samples': 328160, 'steps': 640, 'loss/train': 3.888500928878784} -09/20/2021 16:42:31 - INFO - __main__ - Step 10256: {'lr': 0.00017066666666666668, 'samples': 328192, 'steps': 640, 'loss/train': 4.954118251800537} -09/20/2021 16:42:32 - INFO - __main__ - Step 10257: {'lr': 0.00017093333333333333, 'samples': 328224, 'steps': 641, 'loss/train': 4.457268238067627} -09/20/2021 16:42:33 - INFO - __main__ - Step 10258: {'lr': 0.00017093333333333333, 'samples': 328256, 'steps': 641, 'loss/train': 3.8657166957855225} -09/20/2021 16:42:34 - INFO - __main__ - Step 10259: {'lr': 0.00017093333333333333, 'samples': 328288, 'steps': 641, 'loss/train': 5.54072904586792} -09/20/2021 16:42:34 - INFO - __main__ - Step 10260: {'lr': 0.00017093333333333333, 'samples': 328320, 'steps': 641, 'loss/train': 4.013070106506348} -09/20/2021 16:42:35 - INFO - __main__ - Step 10261: {'lr': 0.00017093333333333333, 'samples': 328352, 'steps': 641, 'loss/train': 4.2534074783325195} -09/20/2021 16:42:36 - INFO - __main__ - Step 10262: {'lr': 0.00017093333333333333, 'samples': 328384, 'steps': 641, 'loss/train': 3.6029841899871826} -09/20/2021 16:42:37 - INFO - __main__ - Step 10263: {'lr': 0.00017093333333333333, 'samples': 328416, 'steps': 641, 'loss/train': 4.092920780181885} -09/20/2021 16:42:37 - INFO - __main__ - Step 10264: {'lr': 0.00017093333333333333, 'samples': 328448, 'steps': 641, 'loss/train': 5.8225226402282715} -09/20/2021 16:42:38 - INFO - __main__ - Step 10265: {'lr': 0.00017093333333333333, 'samples': 328480, 'steps': 641, 'loss/train': 2.895137310028076} -09/20/2021 16:42:39 - INFO - __main__ - Step 10266: {'lr': 0.00017093333333333333, 'samples': 328512, 'steps': 641, 'loss/train': 4.816889762878418} -09/20/2021 16:42:40 - INFO - __main__ - Step 10267: {'lr': 0.00017093333333333333, 'samples': 328544, 'steps': 641, 'loss/train': 3.9469687938690186} -09/20/2021 16:42:40 - INFO - __main__ - Step 10268: {'lr': 0.00017093333333333333, 'samples': 328576, 'steps': 641, 'loss/train': 6.439028263092041} -09/20/2021 16:42:41 - INFO - __main__ - Step 10269: {'lr': 0.00017093333333333333, 'samples': 328608, 'steps': 641, 'loss/train': 2.5736029148101807} -09/20/2021 16:42:42 - INFO - __main__ - Step 10270: {'lr': 0.00017093333333333333, 'samples': 328640, 'steps': 641, 'loss/train': 2.3606302738189697} -09/20/2021 16:42:43 - INFO - __main__ - Step 10271: {'lr': 0.00017093333333333333, 'samples': 328672, 'steps': 641, 'loss/train': 2.1015658378601074} -09/20/2021 16:42:43 - INFO - __main__ - Step 10272: {'lr': 0.00017093333333333333, 'samples': 328704, 'steps': 641, 'loss/train': 3.7926366329193115} -09/20/2021 16:42:44 - INFO - __main__ - Step 10273: {'lr': 0.00017120000000000001, 'samples': 328736, 'steps': 642, 'loss/train': 3.428029775619507} -09/20/2021 16:42:45 - INFO - __main__ - Step 10274: {'lr': 0.00017120000000000001, 'samples': 328768, 'steps': 642, 'loss/train': 5.630785942077637} -09/20/2021 16:42:46 - INFO - __main__ - Step 10275: {'lr': 0.00017120000000000001, 'samples': 328800, 'steps': 642, 'loss/train': 3.817152261734009} -09/20/2021 16:42:47 - INFO - __main__ - Step 10276: {'lr': 0.00017120000000000001, 'samples': 328832, 'steps': 642, 'loss/train': 4.309672832489014} -09/20/2021 16:42:47 - INFO - __main__ - Step 10277: {'lr': 0.00017120000000000001, 'samples': 328864, 'steps': 642, 'loss/train': 4.711504936218262} -09/20/2021 16:42:48 - INFO - __main__ - Step 10278: {'lr': 0.00017120000000000001, 'samples': 328896, 'steps': 642, 'loss/train': 3.8922691345214844} -09/20/2021 16:42:49 - INFO - __main__ - Step 10279: {'lr': 0.00017120000000000001, 'samples': 328928, 'steps': 642, 'loss/train': 5.308880805969238} -09/20/2021 16:42:50 - INFO - __main__ - Step 10280: {'lr': 0.00017120000000000001, 'samples': 328960, 'steps': 642, 'loss/train': 5.043359756469727} -09/20/2021 16:42:50 - INFO - __main__ - Step 10281: {'lr': 0.00017120000000000001, 'samples': 328992, 'steps': 642, 'loss/train': 4.367264270782471} -09/20/2021 16:42:51 - INFO - __main__ - Step 10282: {'lr': 0.00017120000000000001, 'samples': 329024, 'steps': 642, 'loss/train': 4.22314977645874} -09/20/2021 16:42:52 - INFO - __main__ - Step 10283: {'lr': 0.00017120000000000001, 'samples': 329056, 'steps': 642, 'loss/train': 4.051526069641113} -09/20/2021 16:42:53 - INFO - __main__ - Step 10284: {'lr': 0.00017120000000000001, 'samples': 329088, 'steps': 642, 'loss/train': 4.220839977264404} -09/20/2021 16:42:54 - INFO - __main__ - Step 10285: {'lr': 0.00017120000000000001, 'samples': 329120, 'steps': 642, 'loss/train': 3.9744350910186768} -09/20/2021 16:42:55 - INFO - __main__ - Step 10286: {'lr': 0.00017120000000000001, 'samples': 329152, 'steps': 642, 'loss/train': 3.9779810905456543} -09/20/2021 16:42:55 - INFO - __main__ - Step 10287: {'lr': 0.00017120000000000001, 'samples': 329184, 'steps': 642, 'loss/train': 4.525704860687256} -09/20/2021 16:42:56 - INFO - __main__ - Step 10288: {'lr': 0.00017120000000000001, 'samples': 329216, 'steps': 642, 'loss/train': 4.464062213897705} -09/20/2021 16:42:57 - INFO - __main__ - Step 10289: {'lr': 0.00017146666666666667, 'samples': 329248, 'steps': 643, 'loss/train': 2.125096321105957} -09/20/2021 16:42:58 - INFO - __main__ - Step 10290: {'lr': 0.00017146666666666667, 'samples': 329280, 'steps': 643, 'loss/train': 1.8107576370239258} -09/20/2021 16:42:59 - INFO - __main__ - Step 10291: {'lr': 0.00017146666666666667, 'samples': 329312, 'steps': 643, 'loss/train': 2.6197423934936523} -09/20/2021 16:42:59 - INFO - __main__ - Step 10292: {'lr': 0.00017146666666666667, 'samples': 329344, 'steps': 643, 'loss/train': 2.478606939315796} -09/20/2021 16:43:00 - INFO - __main__ - Step 10293: {'lr': 0.00017146666666666667, 'samples': 329376, 'steps': 643, 'loss/train': 2.3630449771881104} -09/20/2021 16:43:01 - INFO - __main__ - Step 10294: {'lr': 0.00017146666666666667, 'samples': 329408, 'steps': 643, 'loss/train': 4.308208465576172} -09/20/2021 16:43:02 - INFO - __main__ - Step 10295: {'lr': 0.00017146666666666667, 'samples': 329440, 'steps': 643, 'loss/train': 4.6891913414001465} -09/20/2021 16:43:02 - INFO - __main__ - Step 10296: {'lr': 0.00017146666666666667, 'samples': 329472, 'steps': 643, 'loss/train': 5.076071739196777} -09/20/2021 16:43:03 - INFO - __main__ - Step 10297: {'lr': 0.00017146666666666667, 'samples': 329504, 'steps': 643, 'loss/train': 2.319042444229126} -09/20/2021 16:43:04 - INFO - __main__ - Step 10298: {'lr': 0.00017146666666666667, 'samples': 329536, 'steps': 643, 'loss/train': 3.9524385929107666} -09/20/2021 16:43:05 - INFO - __main__ - Step 10299: {'lr': 0.00017146666666666667, 'samples': 329568, 'steps': 643, 'loss/train': 4.699763774871826} -09/20/2021 16:43:05 - INFO - __main__ - Step 10300: {'lr': 0.00017146666666666667, 'samples': 329600, 'steps': 643, 'loss/train': 4.1698126792907715} -09/20/2021 16:43:06 - INFO - __main__ - Step 10301: {'lr': 0.00017146666666666667, 'samples': 329632, 'steps': 643, 'loss/train': 1.4614582061767578} -09/20/2021 16:43:07 - INFO - __main__ - Step 10302: {'lr': 0.00017146666666666667, 'samples': 329664, 'steps': 643, 'loss/train': 4.242882251739502} -09/20/2021 16:43:08 - INFO - __main__ - Step 10303: {'lr': 0.00017146666666666667, 'samples': 329696, 'steps': 643, 'loss/train': 3.9285008907318115} -09/20/2021 16:43:08 - INFO - __main__ - Step 10304: {'lr': 0.00017146666666666667, 'samples': 329728, 'steps': 643, 'loss/train': 4.857725620269775} -09/20/2021 16:43:09 - INFO - __main__ - Step 10305: {'lr': 0.00017173333333333335, 'samples': 329760, 'steps': 644, 'loss/train': 4.756720066070557} -09/20/2021 16:43:10 - INFO - __main__ - Step 10306: {'lr': 0.00017173333333333335, 'samples': 329792, 'steps': 644, 'loss/train': 4.699141502380371} -09/20/2021 16:43:11 - INFO - __main__ - Step 10307: {'lr': 0.00017173333333333335, 'samples': 329824, 'steps': 644, 'loss/train': 4.534216403961182} -09/20/2021 16:43:11 - INFO - __main__ - Step 10308: {'lr': 0.00017173333333333335, 'samples': 329856, 'steps': 644, 'loss/train': 4.205583572387695} -09/20/2021 16:43:12 - INFO - __main__ - Step 10309: {'lr': 0.00017173333333333335, 'samples': 329888, 'steps': 644, 'loss/train': 3.994755506515503} -09/20/2021 16:43:13 - INFO - __main__ - Step 10310: {'lr': 0.00017173333333333335, 'samples': 329920, 'steps': 644, 'loss/train': 3.819843053817749} -09/20/2021 16:43:14 - INFO - __main__ - Step 10311: {'lr': 0.00017173333333333335, 'samples': 329952, 'steps': 644, 'loss/train': 4.687933921813965} -09/20/2021 16:43:14 - INFO - __main__ - Step 10312: {'lr': 0.00017173333333333335, 'samples': 329984, 'steps': 644, 'loss/train': 4.093545436859131} -09/20/2021 16:43:15 - INFO - __main__ - Step 10313: {'lr': 0.00017173333333333335, 'samples': 330016, 'steps': 644, 'loss/train': 3.858779191970825} -09/20/2021 16:43:17 - INFO - __main__ - Step 10314: {'lr': 0.00017173333333333335, 'samples': 330048, 'steps': 644, 'loss/train': 4.685606002807617} -09/20/2021 16:43:18 - INFO - __main__ - Step 10315: {'lr': 0.00017173333333333335, 'samples': 330080, 'steps': 644, 'loss/train': 3.906996965408325} -09/20/2021 16:43:19 - INFO - __main__ - Step 10316: {'lr': 0.00017173333333333335, 'samples': 330112, 'steps': 644, 'loss/train': 4.294662952423096} -09/20/2021 16:43:19 - INFO - __main__ - Step 10317: {'lr': 0.00017173333333333335, 'samples': 330144, 'steps': 644, 'loss/train': 4.518238544464111} -09/20/2021 16:43:20 - INFO - __main__ - Step 10318: {'lr': 0.00017173333333333335, 'samples': 330176, 'steps': 644, 'loss/train': 4.552175045013428} -09/20/2021 16:43:21 - INFO - __main__ - Step 10319: {'lr': 0.00017173333333333335, 'samples': 330208, 'steps': 644, 'loss/train': 4.349515914916992} -09/20/2021 16:43:22 - INFO - __main__ - Step 10320: {'lr': 0.00017173333333333335, 'samples': 330240, 'steps': 644, 'loss/train': 4.911230087280273} -09/20/2021 16:43:22 - INFO - __main__ - Step 10321: {'lr': 0.000172, 'samples': 330272, 'steps': 645, 'loss/train': 4.657660484313965} -09/20/2021 16:43:23 - INFO - __main__ - Step 10322: {'lr': 0.000172, 'samples': 330304, 'steps': 645, 'loss/train': 5.079786777496338} -09/20/2021 16:43:24 - INFO - __main__ - Step 10323: {'lr': 0.000172, 'samples': 330336, 'steps': 645, 'loss/train': 4.6907639503479} -09/20/2021 16:43:25 - INFO - __main__ - Step 10324: {'lr': 0.000172, 'samples': 330368, 'steps': 645, 'loss/train': 4.318727970123291} -09/20/2021 16:43:25 - INFO - __main__ - Step 10325: {'lr': 0.000172, 'samples': 330400, 'steps': 645, 'loss/train': 4.3311357498168945} -09/20/2021 16:43:26 - INFO - __main__ - Step 10326: {'lr': 0.000172, 'samples': 330432, 'steps': 645, 'loss/train': 5.801637172698975} -09/20/2021 16:43:27 - INFO - __main__ - Step 10327: {'lr': 0.000172, 'samples': 330464, 'steps': 645, 'loss/train': 5.11436653137207} -09/20/2021 16:43:28 - INFO - __main__ - Step 10328: {'lr': 0.000172, 'samples': 330496, 'steps': 645, 'loss/train': 3.877318859100342} -09/20/2021 16:43:28 - INFO - __main__ - Step 10329: {'lr': 0.000172, 'samples': 330528, 'steps': 645, 'loss/train': 5.035760402679443} -09/20/2021 16:43:29 - INFO - __main__ - Step 10330: {'lr': 0.000172, 'samples': 330560, 'steps': 645, 'loss/train': 4.210616111755371} -09/20/2021 16:43:30 - INFO - __main__ - Step 10331: {'lr': 0.000172, 'samples': 330592, 'steps': 645, 'loss/train': 4.122326850891113} -09/20/2021 16:43:31 - INFO - __main__ - Step 10332: {'lr': 0.000172, 'samples': 330624, 'steps': 645, 'loss/train': 3.6649363040924072} -09/20/2021 16:43:31 - INFO - __main__ - Step 10333: {'lr': 0.000172, 'samples': 330656, 'steps': 645, 'loss/train': 2.0545170307159424} -09/20/2021 16:43:32 - INFO - __main__ - Step 10334: {'lr': 0.000172, 'samples': 330688, 'steps': 645, 'loss/train': 4.623583793640137} -09/20/2021 16:43:33 - INFO - __main__ - Step 10335: {'lr': 0.000172, 'samples': 330720, 'steps': 645, 'loss/train': 4.537016868591309} -09/20/2021 16:43:34 - INFO - __main__ - Step 10336: {'lr': 0.000172, 'samples': 330752, 'steps': 645, 'loss/train': 4.550151348114014} -09/20/2021 16:43:35 - INFO - __main__ - Step 10337: {'lr': 0.00017226666666666666, 'samples': 330784, 'steps': 646, 'loss/train': 4.153733730316162} -09/20/2021 16:43:35 - INFO - __main__ - Step 10338: {'lr': 0.00017226666666666666, 'samples': 330816, 'steps': 646, 'loss/train': 4.607836723327637} -09/20/2021 16:43:36 - INFO - __main__ - Step 10339: {'lr': 0.00017226666666666666, 'samples': 330848, 'steps': 646, 'loss/train': 4.404702663421631} -09/20/2021 16:43:37 - INFO - __main__ - Step 10340: {'lr': 0.00017226666666666666, 'samples': 330880, 'steps': 646, 'loss/train': 5.756114959716797} -09/20/2021 16:43:38 - INFO - __main__ - Step 10341: {'lr': 0.00017226666666666666, 'samples': 330912, 'steps': 646, 'loss/train': 4.373592853546143} -09/20/2021 16:43:38 - INFO - __main__ - Step 10342: {'lr': 0.00017226666666666666, 'samples': 330944, 'steps': 646, 'loss/train': 2.149991035461426} -09/20/2021 16:43:39 - INFO - __main__ - Step 10343: {'lr': 0.00017226666666666666, 'samples': 330976, 'steps': 646, 'loss/train': 2.046450614929199} -09/20/2021 16:43:40 - INFO - __main__ - Step 10344: {'lr': 0.00017226666666666666, 'samples': 331008, 'steps': 646, 'loss/train': 1.5463552474975586} -09/20/2021 16:43:41 - INFO - __main__ - Step 10345: {'lr': 0.00017226666666666666, 'samples': 331040, 'steps': 646, 'loss/train': 2.61098575592041} -09/20/2021 16:43:42 - INFO - __main__ - Step 10346: {'lr': 0.00017226666666666666, 'samples': 331072, 'steps': 646, 'loss/train': 3.444389820098877} -09/20/2021 16:43:43 - INFO - __main__ - Step 10347: {'lr': 0.00017226666666666666, 'samples': 331104, 'steps': 646, 'loss/train': 4.9770355224609375} -09/20/2021 16:43:44 - INFO - __main__ - Step 10348: {'lr': 0.00017226666666666666, 'samples': 331136, 'steps': 646, 'loss/train': 3.8860950469970703} -09/20/2021 16:43:44 - INFO - __main__ - Step 10349: {'lr': 0.00017226666666666666, 'samples': 331168, 'steps': 646, 'loss/train': 4.0530900955200195} -09/20/2021 16:43:45 - INFO - __main__ - Step 10350: {'lr': 0.00017226666666666666, 'samples': 331200, 'steps': 646, 'loss/train': 4.32453727722168} -09/20/2021 16:43:46 - INFO - __main__ - Step 10351: {'lr': 0.00017226666666666666, 'samples': 331232, 'steps': 646, 'loss/train': 4.872138977050781} -09/20/2021 16:43:47 - INFO - __main__ - Step 10352: {'lr': 0.00017226666666666666, 'samples': 331264, 'steps': 646, 'loss/train': 4.824289321899414} -09/20/2021 16:43:47 - INFO - __main__ - Step 10353: {'lr': 0.00017253333333333334, 'samples': 331296, 'steps': 647, 'loss/train': 1.8280929327011108} -09/20/2021 16:43:48 - INFO - __main__ - Step 10354: {'lr': 0.00017253333333333334, 'samples': 331328, 'steps': 647, 'loss/train': 4.689761161804199} -09/20/2021 16:43:49 - INFO - __main__ - Step 10355: {'lr': 0.00017253333333333334, 'samples': 331360, 'steps': 647, 'loss/train': 7.646622657775879} -09/20/2021 16:43:50 - INFO - __main__ - Step 10356: {'lr': 0.00017253333333333334, 'samples': 331392, 'steps': 647, 'loss/train': 4.265886306762695} -09/20/2021 16:43:50 - INFO - __main__ - Step 10357: {'lr': 0.00017253333333333334, 'samples': 331424, 'steps': 647, 'loss/train': 1.9728529453277588} -09/20/2021 16:43:51 - INFO - __main__ - Step 10358: {'lr': 0.00017253333333333334, 'samples': 331456, 'steps': 647, 'loss/train': 3.863361120223999} -09/20/2021 16:43:52 - INFO - __main__ - Step 10359: {'lr': 0.00017253333333333334, 'samples': 331488, 'steps': 647, 'loss/train': 5.687500476837158} -09/20/2021 16:43:53 - INFO - __main__ - Step 10360: {'lr': 0.00017253333333333334, 'samples': 331520, 'steps': 647, 'loss/train': 4.600867748260498} -09/20/2021 16:43:53 - INFO - __main__ - Step 10361: {'lr': 0.00017253333333333334, 'samples': 331552, 'steps': 647, 'loss/train': 4.148759841918945} -09/20/2021 16:43:54 - INFO - __main__ - Step 10362: {'lr': 0.00017253333333333334, 'samples': 331584, 'steps': 647, 'loss/train': 4.857623100280762} -09/20/2021 16:43:55 - INFO - __main__ - Step 10363: {'lr': 0.00017253333333333334, 'samples': 331616, 'steps': 647, 'loss/train': 4.524783134460449} -09/20/2021 16:43:56 - INFO - __main__ - Step 10364: {'lr': 0.00017253333333333334, 'samples': 331648, 'steps': 647, 'loss/train': 3.717499256134033} -09/20/2021 16:43:56 - INFO - __main__ - Step 10365: {'lr': 0.00017253333333333334, 'samples': 331680, 'steps': 647, 'loss/train': 4.638562202453613} -09/20/2021 16:43:57 - INFO - __main__ - Step 10366: {'lr': 0.00017253333333333334, 'samples': 331712, 'steps': 647, 'loss/train': 4.121563911437988} -09/20/2021 16:43:58 - INFO - __main__ - Step 10367: {'lr': 0.00017253333333333334, 'samples': 331744, 'steps': 647, 'loss/train': 4.2702765464782715} -09/20/2021 16:43:59 - INFO - __main__ - Step 10368: {'lr': 0.00017253333333333334, 'samples': 331776, 'steps': 647, 'loss/train': 4.527890205383301} -09/20/2021 16:44:00 - INFO - __main__ - Step 10369: {'lr': 0.0001728, 'samples': 331808, 'steps': 648, 'loss/train': 4.912214756011963} -09/20/2021 16:44:00 - INFO - __main__ - Step 10370: {'lr': 0.0001728, 'samples': 331840, 'steps': 648, 'loss/train': 4.948783874511719} -09/20/2021 16:44:01 - INFO - __main__ - Step 10371: {'lr': 0.0001728, 'samples': 331872, 'steps': 648, 'loss/train': 4.18960428237915} -09/20/2021 16:44:02 - INFO - __main__ - Step 10372: {'lr': 0.0001728, 'samples': 331904, 'steps': 648, 'loss/train': 3.639456033706665} -09/20/2021 16:44:03 - INFO - __main__ - Step 10373: {'lr': 0.0001728, 'samples': 331936, 'steps': 648, 'loss/train': 4.509542465209961} -09/20/2021 16:44:03 - INFO - __main__ - Step 10374: {'lr': 0.0001728, 'samples': 331968, 'steps': 648, 'loss/train': 5.281994819641113} -09/20/2021 16:44:04 - INFO - __main__ - Step 10375: {'lr': 0.0001728, 'samples': 332000, 'steps': 648, 'loss/train': 1.5887742042541504} -09/20/2021 16:44:05 - INFO - __main__ - Step 10376: {'lr': 0.0001728, 'samples': 332032, 'steps': 648, 'loss/train': 1.8525807857513428} -09/20/2021 16:44:06 - INFO - __main__ - Step 10377: {'lr': 0.0001728, 'samples': 332064, 'steps': 648, 'loss/train': 1.6078674793243408} -09/20/2021 16:44:07 - INFO - __main__ - Step 10378: {'lr': 0.0001728, 'samples': 332096, 'steps': 648, 'loss/train': 4.159146308898926} -09/20/2021 16:44:08 - INFO - __main__ - Step 10379: {'lr': 0.0001728, 'samples': 332128, 'steps': 648, 'loss/train': 4.213747978210449} -09/20/2021 16:44:08 - INFO - __main__ - Step 10380: {'lr': 0.0001728, 'samples': 332160, 'steps': 648, 'loss/train': 4.612967014312744} -09/20/2021 16:44:09 - INFO - __main__ - Step 10381: {'lr': 0.0001728, 'samples': 332192, 'steps': 648, 'loss/train': 4.102993488311768} -09/20/2021 16:44:10 - INFO - __main__ - Step 10382: {'lr': 0.0001728, 'samples': 332224, 'steps': 648, 'loss/train': 3.13688588142395} -09/20/2021 16:44:11 - INFO - __main__ - Step 10383: {'lr': 0.0001728, 'samples': 332256, 'steps': 648, 'loss/train': 3.9649484157562256} -09/20/2021 16:44:11 - INFO - __main__ - Step 10384: {'lr': 0.0001728, 'samples': 332288, 'steps': 648, 'loss/train': 4.070309638977051} -09/20/2021 16:44:12 - INFO - __main__ - Step 10385: {'lr': 0.00017306666666666665, 'samples': 332320, 'steps': 649, 'loss/train': 3.58358097076416} -09/20/2021 16:44:13 - INFO - __main__ - Step 10386: {'lr': 0.00017306666666666665, 'samples': 332352, 'steps': 649, 'loss/train': 5.5092387199401855} -09/20/2021 16:44:14 - INFO - __main__ - Step 10387: {'lr': 0.00017306666666666665, 'samples': 332384, 'steps': 649, 'loss/train': 4.17742395401001} -09/20/2021 16:44:14 - INFO - __main__ - Step 10388: {'lr': 0.00017306666666666665, 'samples': 332416, 'steps': 649, 'loss/train': 4.089846134185791} -09/20/2021 16:44:15 - INFO - __main__ - Step 10389: {'lr': 0.00017306666666666665, 'samples': 332448, 'steps': 649, 'loss/train': 4.385047912597656} -09/20/2021 16:44:16 - INFO - __main__ - Step 10390: {'lr': 0.00017306666666666665, 'samples': 332480, 'steps': 649, 'loss/train': 4.476358413696289} -09/20/2021 16:44:17 - INFO - __main__ - Step 10391: {'lr': 0.00017306666666666665, 'samples': 332512, 'steps': 649, 'loss/train': 4.444438457489014} -09/20/2021 16:44:17 - INFO - __main__ - Step 10392: {'lr': 0.00017306666666666665, 'samples': 332544, 'steps': 649, 'loss/train': 4.374939918518066} -09/20/2021 16:44:18 - INFO - __main__ - Step 10393: {'lr': 0.00017306666666666665, 'samples': 332576, 'steps': 649, 'loss/train': 3.8072900772094727} -09/20/2021 16:44:19 - INFO - __main__ - Step 10394: {'lr': 0.00017306666666666665, 'samples': 332608, 'steps': 649, 'loss/train': 4.616887092590332} -09/20/2021 16:44:20 - INFO - __main__ - Step 10395: {'lr': 0.00017306666666666665, 'samples': 332640, 'steps': 649, 'loss/train': 4.012620449066162} -09/20/2021 16:44:20 - INFO - __main__ - Step 10396: {'lr': 0.00017306666666666665, 'samples': 332672, 'steps': 649, 'loss/train': 4.2349629402160645} -09/20/2021 16:44:21 - INFO - __main__ - Step 10397: {'lr': 0.00017306666666666665, 'samples': 332704, 'steps': 649, 'loss/train': 4.427550315856934} -09/20/2021 16:44:22 - INFO - __main__ - Step 10398: {'lr': 0.00017306666666666665, 'samples': 332736, 'steps': 649, 'loss/train': 4.367433071136475} -09/20/2021 16:44:23 - INFO - __main__ - Step 10399: {'lr': 0.00017306666666666665, 'samples': 332768, 'steps': 649, 'loss/train': 3.7011420726776123} -09/20/2021 16:44:23 - INFO - __main__ - Step 10400: {'lr': 0.00017306666666666665, 'samples': 332800, 'steps': 649, 'loss/train': 3.4467477798461914} -09/20/2021 16:44:24 - INFO - __main__ - Step 10401: {'lr': 0.00017333333333333334, 'samples': 332832, 'steps': 650, 'loss/train': 3.931945562362671} -09/20/2021 16:44:25 - INFO - __main__ - Step 10402: {'lr': 0.00017333333333333334, 'samples': 332864, 'steps': 650, 'loss/train': 4.350550174713135} -09/20/2021 16:44:26 - INFO - __main__ - Step 10403: {'lr': 0.00017333333333333334, 'samples': 332896, 'steps': 650, 'loss/train': 4.223275184631348} -09/20/2021 16:44:27 - INFO - __main__ - Step 10404: {'lr': 0.00017333333333333334, 'samples': 332928, 'steps': 650, 'loss/train': 4.425329208374023} -09/20/2021 16:44:27 - INFO - __main__ - Step 10405: {'lr': 0.00017333333333333334, 'samples': 332960, 'steps': 650, 'loss/train': 5.0525383949279785} -09/20/2021 16:44:28 - INFO - __main__ - Step 10406: {'lr': 0.00017333333333333334, 'samples': 332992, 'steps': 650, 'loss/train': 4.824010848999023} -09/20/2021 16:44:30 - INFO - __main__ - Step 10407: {'lr': 0.00017333333333333334, 'samples': 333024, 'steps': 650, 'loss/train': 3.9068477153778076} -09/20/2021 16:44:30 - INFO - __main__ - Step 10408: {'lr': 0.00017333333333333334, 'samples': 333056, 'steps': 650, 'loss/train': 4.732909679412842} -09/20/2021 16:44:31 - INFO - __main__ - Step 10409: {'lr': 0.00017333333333333334, 'samples': 333088, 'steps': 650, 'loss/train': 4.296350479125977} -09/20/2021 16:44:32 - INFO - __main__ - Step 10410: {'lr': 0.00017333333333333334, 'samples': 333120, 'steps': 650, 'loss/train': 3.87902569770813} -09/20/2021 16:44:33 - INFO - __main__ - Step 10411: {'lr': 0.00017333333333333334, 'samples': 333152, 'steps': 650, 'loss/train': 3.204880475997925} -09/20/2021 16:44:33 - INFO - __main__ - Step 10412: {'lr': 0.00017333333333333334, 'samples': 333184, 'steps': 650, 'loss/train': 3.583420753479004} -09/20/2021 16:44:34 - INFO - __main__ - Step 10413: {'lr': 0.00017333333333333334, 'samples': 333216, 'steps': 650, 'loss/train': 3.6669552326202393} -09/20/2021 16:44:35 - INFO - __main__ - Step 10414: {'lr': 0.00017333333333333334, 'samples': 333248, 'steps': 650, 'loss/train': 3.874253034591675} -09/20/2021 16:44:36 - INFO - __main__ - Step 10415: {'lr': 0.00017333333333333334, 'samples': 333280, 'steps': 650, 'loss/train': 4.249661445617676} -09/20/2021 16:44:36 - INFO - __main__ - Step 10416: {'lr': 0.00017333333333333334, 'samples': 333312, 'steps': 650, 'loss/train': 4.814536094665527} -09/20/2021 16:44:37 - INFO - __main__ - Step 10417: {'lr': 0.00017360000000000002, 'samples': 333344, 'steps': 651, 'loss/train': 4.843518257141113} -09/20/2021 16:44:38 - INFO - __main__ - Step 10418: {'lr': 0.00017360000000000002, 'samples': 333376, 'steps': 651, 'loss/train': 4.731437683105469} -09/20/2021 16:44:39 - INFO - __main__ - Step 10419: {'lr': 0.00017360000000000002, 'samples': 333408, 'steps': 651, 'loss/train': 4.0346879959106445} -09/20/2021 16:44:40 - INFO - __main__ - Step 10420: {'lr': 0.00017360000000000002, 'samples': 333440, 'steps': 651, 'loss/train': 5.136067867279053} -09/20/2021 16:44:40 - INFO - __main__ - Step 10421: {'lr': 0.00017360000000000002, 'samples': 333472, 'steps': 651, 'loss/train': 4.477573394775391} -09/20/2021 16:44:41 - INFO - __main__ - Step 10422: {'lr': 0.00017360000000000002, 'samples': 333504, 'steps': 651, 'loss/train': 3.839618682861328} -09/20/2021 16:44:42 - INFO - __main__ - Step 10423: {'lr': 0.00017360000000000002, 'samples': 333536, 'steps': 651, 'loss/train': 4.8891730308532715} -09/20/2021 16:44:43 - INFO - __main__ - Step 10424: {'lr': 0.00017360000000000002, 'samples': 333568, 'steps': 651, 'loss/train': 3.9976415634155273} -09/20/2021 16:44:43 - INFO - __main__ - Step 10425: {'lr': 0.00017360000000000002, 'samples': 333600, 'steps': 651, 'loss/train': 4.496819019317627} -09/20/2021 16:44:44 - INFO - __main__ - Step 10426: {'lr': 0.00017360000000000002, 'samples': 333632, 'steps': 651, 'loss/train': 4.1490559577941895} -09/20/2021 16:44:45 - INFO - __main__ - Step 10427: {'lr': 0.00017360000000000002, 'samples': 333664, 'steps': 651, 'loss/train': 4.562625885009766} -09/20/2021 16:44:46 - INFO - __main__ - Step 10428: {'lr': 0.00017360000000000002, 'samples': 333696, 'steps': 651, 'loss/train': 3.3006370067596436} -09/20/2021 16:44:46 - INFO - __main__ - Step 10429: {'lr': 0.00017360000000000002, 'samples': 333728, 'steps': 651, 'loss/train': 3.749722719192505} -09/20/2021 16:44:47 - INFO - __main__ - Step 10430: {'lr': 0.00017360000000000002, 'samples': 333760, 'steps': 651, 'loss/train': 2.551849842071533} -09/20/2021 16:44:48 - INFO - __main__ - Step 10431: {'lr': 0.00017360000000000002, 'samples': 333792, 'steps': 651, 'loss/train': 3.237619638442993} -09/20/2021 16:44:49 - INFO - __main__ - Step 10432: {'lr': 0.00017360000000000002, 'samples': 333824, 'steps': 651, 'loss/train': 2.8688511848449707} -09/20/2021 16:44:50 - INFO - __main__ - Step 10433: {'lr': 0.00017386666666666667, 'samples': 333856, 'steps': 652, 'loss/train': 2.5316078662872314} -09/20/2021 16:44:50 - INFO - __main__ - Step 10434: {'lr': 0.00017386666666666667, 'samples': 333888, 'steps': 652, 'loss/train': 2.4708638191223145} -09/20/2021 16:44:51 - INFO - __main__ - Step 10435: {'lr': 0.00017386666666666667, 'samples': 333920, 'steps': 652, 'loss/train': 3.3576042652130127} -09/20/2021 16:44:52 - INFO - __main__ - Step 10436: {'lr': 0.00017386666666666667, 'samples': 333952, 'steps': 652, 'loss/train': 3.3401033878326416} -09/20/2021 16:44:53 - INFO - __main__ - Step 10437: {'lr': 0.00017386666666666667, 'samples': 333984, 'steps': 652, 'loss/train': 4.633533477783203} -09/20/2021 16:44:53 - INFO - __main__ - Step 10438: {'lr': 0.00017386666666666667, 'samples': 334016, 'steps': 652, 'loss/train': 3.7966158390045166} -09/20/2021 16:44:54 - INFO - __main__ - Step 10439: {'lr': 0.00017386666666666667, 'samples': 334048, 'steps': 652, 'loss/train': 4.101380348205566} -09/20/2021 16:44:55 - INFO - __main__ - Step 10440: {'lr': 0.00017386666666666667, 'samples': 334080, 'steps': 652, 'loss/train': 4.144776821136475} -09/20/2021 16:44:56 - INFO - __main__ - Step 10441: {'lr': 0.00017386666666666667, 'samples': 334112, 'steps': 652, 'loss/train': 3.7234394550323486} -09/20/2021 16:44:56 - INFO - __main__ - Step 10442: {'lr': 0.00017386666666666667, 'samples': 334144, 'steps': 652, 'loss/train': 5.273244380950928} -09/20/2021 16:44:57 - INFO - __main__ - Step 10443: {'lr': 0.00017386666666666667, 'samples': 334176, 'steps': 652, 'loss/train': 4.476210117340088} -09/20/2021 16:44:59 - INFO - __main__ - Step 10444: {'lr': 0.00017386666666666667, 'samples': 334208, 'steps': 652, 'loss/train': 5.1448540687561035} -09/20/2021 16:44:59 - INFO - __main__ - Step 10445: {'lr': 0.00017386666666666667, 'samples': 334240, 'steps': 652, 'loss/train': 4.174772262573242} -09/20/2021 16:45:00 - INFO - __main__ - Step 10446: {'lr': 0.00017386666666666667, 'samples': 334272, 'steps': 652, 'loss/train': 3.471750020980835} -09/20/2021 16:45:01 - INFO - __main__ - Step 10447: {'lr': 0.00017386666666666667, 'samples': 334304, 'steps': 652, 'loss/train': 3.5306053161621094} -09/20/2021 16:45:02 - INFO - __main__ - Step 10448: {'lr': 0.00017386666666666667, 'samples': 334336, 'steps': 652, 'loss/train': 3.4984934329986572} -09/20/2021 16:45:02 - INFO - __main__ - Step 10449: {'lr': 0.00017413333333333336, 'samples': 334368, 'steps': 653, 'loss/train': 3.200810194015503} -09/20/2021 16:45:03 - INFO - __main__ - Step 10450: {'lr': 0.00017413333333333336, 'samples': 334400, 'steps': 653, 'loss/train': 3.17862868309021} -09/20/2021 16:45:04 - INFO - __main__ - Step 10451: {'lr': 0.00017413333333333336, 'samples': 334432, 'steps': 653, 'loss/train': 3.8877358436584473} -09/20/2021 16:45:05 - INFO - __main__ - Step 10452: {'lr': 0.00017413333333333336, 'samples': 334464, 'steps': 653, 'loss/train': 3.85070538520813} -09/20/2021 16:45:05 - INFO - __main__ - Step 10453: {'lr': 0.00017413333333333336, 'samples': 334496, 'steps': 653, 'loss/train': 4.229180812835693} -09/20/2021 16:45:06 - INFO - __main__ - Step 10454: {'lr': 0.00017413333333333336, 'samples': 334528, 'steps': 653, 'loss/train': 1.76949942111969} -09/20/2021 16:45:07 - INFO - __main__ - Step 10455: {'lr': 0.00017413333333333336, 'samples': 334560, 'steps': 653, 'loss/train': 4.331706523895264} -09/20/2021 16:45:08 - INFO - __main__ - Step 10456: {'lr': 0.00017413333333333336, 'samples': 334592, 'steps': 653, 'loss/train': 4.608278274536133} -09/20/2021 16:45:08 - INFO - __main__ - Step 10457: {'lr': 0.00017413333333333336, 'samples': 334624, 'steps': 653, 'loss/train': 4.196272850036621} -09/20/2021 16:45:09 - INFO - __main__ - Step 10458: {'lr': 0.00017413333333333336, 'samples': 334656, 'steps': 653, 'loss/train': 3.556488513946533} -09/20/2021 16:45:10 - INFO - __main__ - Step 10459: {'lr': 0.00017413333333333336, 'samples': 334688, 'steps': 653, 'loss/train': 5.22199010848999} -09/20/2021 16:45:11 - INFO - __main__ - Step 10460: {'lr': 0.00017413333333333336, 'samples': 334720, 'steps': 653, 'loss/train': 3.886258363723755} -09/20/2021 16:45:11 - INFO - __main__ - Step 10461: {'lr': 0.00017413333333333336, 'samples': 334752, 'steps': 653, 'loss/train': 4.462453365325928} -09/20/2021 16:45:12 - INFO - __main__ - Step 10462: {'lr': 0.00017413333333333336, 'samples': 334784, 'steps': 653, 'loss/train': 4.6969733238220215} -09/20/2021 16:45:13 - INFO - __main__ - Step 10463: {'lr': 0.00017413333333333336, 'samples': 334816, 'steps': 653, 'loss/train': 5.758875846862793} -09/20/2021 16:45:14 - INFO - __main__ - Step 10464: {'lr': 0.00017413333333333336, 'samples': 334848, 'steps': 653, 'loss/train': 4.4018073081970215} -09/20/2021 16:45:15 - INFO - __main__ - Step 10465: {'lr': 0.0001744, 'samples': 334880, 'steps': 654, 'loss/train': 4.06862735748291} -09/20/2021 16:45:15 - INFO - __main__ - Step 10466: {'lr': 0.0001744, 'samples': 334912, 'steps': 654, 'loss/train': 4.587326526641846} -09/20/2021 16:45:16 - INFO - __main__ - Step 10467: {'lr': 0.0001744, 'samples': 334944, 'steps': 654, 'loss/train': 3.7565062046051025} -09/20/2021 16:45:17 - INFO - __main__ - Step 10468: {'lr': 0.0001744, 'samples': 334976, 'steps': 654, 'loss/train': 4.170257091522217} -09/20/2021 16:45:18 - INFO - __main__ - Step 10469: {'lr': 0.0001744, 'samples': 335008, 'steps': 654, 'loss/train': 4.592902183532715} -09/20/2021 16:45:18 - INFO - __main__ - Step 10470: {'lr': 0.0001744, 'samples': 335040, 'steps': 654, 'loss/train': 3.981398820877075} -09/20/2021 16:45:19 - INFO - __main__ - Step 10471: {'lr': 0.0001744, 'samples': 335072, 'steps': 654, 'loss/train': 4.205925464630127} -09/20/2021 16:45:20 - INFO - __main__ - Step 10472: {'lr': 0.0001744, 'samples': 335104, 'steps': 654, 'loss/train': 1.733882188796997} -09/20/2021 16:45:21 - INFO - __main__ - Step 10473: {'lr': 0.0001744, 'samples': 335136, 'steps': 654, 'loss/train': 2.835134983062744} -09/20/2021 16:45:21 - INFO - __main__ - Step 10474: {'lr': 0.0001744, 'samples': 335168, 'steps': 654, 'loss/train': 4.66607666015625} -09/20/2021 16:45:22 - INFO - __main__ - Step 10475: {'lr': 0.0001744, 'samples': 335200, 'steps': 654, 'loss/train': 4.220746994018555} -09/20/2021 16:45:23 - INFO - __main__ - Step 10476: {'lr': 0.0001744, 'samples': 335232, 'steps': 654, 'loss/train': 3.9580228328704834} -09/20/2021 16:45:24 - INFO - __main__ - Step 10477: {'lr': 0.0001744, 'samples': 335264, 'steps': 654, 'loss/train': 4.393165588378906} -09/20/2021 16:45:24 - INFO - __main__ - Step 10478: {'lr': 0.0001744, 'samples': 335296, 'steps': 654, 'loss/train': 5.021004676818848} -09/20/2021 16:45:26 - INFO - __main__ - Step 10479: {'lr': 0.0001744, 'samples': 335328, 'steps': 654, 'loss/train': 4.752250671386719} -09/20/2021 16:45:26 - INFO - __main__ - Step 10480: {'lr': 0.0001744, 'samples': 335360, 'steps': 654, 'loss/train': 4.631201267242432} -09/20/2021 16:45:27 - INFO - __main__ - Step 10481: {'lr': 0.00017466666666666667, 'samples': 335392, 'steps': 655, 'loss/train': 5.145892143249512} -09/20/2021 16:45:28 - INFO - __main__ - Step 10482: {'lr': 0.00017466666666666667, 'samples': 335424, 'steps': 655, 'loss/train': 3.1500754356384277} -09/20/2021 16:45:29 - INFO - __main__ - Step 10483: {'lr': 0.00017466666666666667, 'samples': 335456, 'steps': 655, 'loss/train': 4.143188953399658} -09/20/2021 16:45:29 - INFO - __main__ - Step 10484: {'lr': 0.00017466666666666667, 'samples': 335488, 'steps': 655, 'loss/train': 4.317288875579834} -09/20/2021 16:45:30 - INFO - __main__ - Step 10485: {'lr': 0.00017466666666666667, 'samples': 335520, 'steps': 655, 'loss/train': 4.124907493591309} -09/20/2021 16:45:31 - INFO - __main__ - Step 10486: {'lr': 0.00017466666666666667, 'samples': 335552, 'steps': 655, 'loss/train': 4.157785892486572} -09/20/2021 16:45:32 - INFO - __main__ - Step 10487: {'lr': 0.00017466666666666667, 'samples': 335584, 'steps': 655, 'loss/train': 4.123380184173584} -09/20/2021 16:45:32 - INFO - __main__ - Step 10488: {'lr': 0.00017466666666666667, 'samples': 335616, 'steps': 655, 'loss/train': 4.309909343719482} -09/20/2021 16:45:33 - INFO - __main__ - Step 10489: {'lr': 0.00017466666666666667, 'samples': 335648, 'steps': 655, 'loss/train': 4.756484508514404} -09/20/2021 16:45:34 - INFO - __main__ - Step 10490: {'lr': 0.00017466666666666667, 'samples': 335680, 'steps': 655, 'loss/train': 4.205253601074219} -09/20/2021 16:45:35 - INFO - __main__ - Step 10491: {'lr': 0.00017466666666666667, 'samples': 335712, 'steps': 655, 'loss/train': 4.662364482879639} -09/20/2021 16:45:35 - INFO - __main__ - Step 10492: {'lr': 0.00017466666666666667, 'samples': 335744, 'steps': 655, 'loss/train': 4.192196846008301} -09/20/2021 16:45:36 - INFO - __main__ - Step 10493: {'lr': 0.00017466666666666667, 'samples': 335776, 'steps': 655, 'loss/train': 5.002904415130615} -09/20/2021 16:45:37 - INFO - __main__ - Step 10494: {'lr': 0.00017466666666666667, 'samples': 335808, 'steps': 655, 'loss/train': 3.6190638542175293} -09/20/2021 16:45:38 - INFO - __main__ - Step 10495: {'lr': 0.00017466666666666667, 'samples': 335840, 'steps': 655, 'loss/train': 3.2611045837402344} -09/20/2021 16:45:38 - INFO - __main__ - Step 10496: {'lr': 0.00017466666666666667, 'samples': 335872, 'steps': 655, 'loss/train': 4.123140335083008} -09/20/2021 16:45:39 - INFO - __main__ - Step 10497: {'lr': 0.00017493333333333335, 'samples': 335904, 'steps': 656, 'loss/train': 4.822150707244873} -09/20/2021 16:45:40 - INFO - __main__ - Step 10498: {'lr': 0.00017493333333333335, 'samples': 335936, 'steps': 656, 'loss/train': 4.47462797164917} -09/20/2021 16:45:41 - INFO - __main__ - Step 10499: {'lr': 0.00017493333333333335, 'samples': 335968, 'steps': 656, 'loss/train': 4.5355401039123535} -09/20/2021 16:45:42 - INFO - __main__ - Step 10500: {'lr': 0.00017493333333333335, 'samples': 336000, 'steps': 656, 'loss/train': 5.219723224639893} -09/20/2021 16:45:42 - INFO - __main__ - Step 10501: {'lr': 0.00017493333333333335, 'samples': 336032, 'steps': 656, 'loss/train': 3.958045482635498} -09/20/2021 16:45:43 - INFO - __main__ - Step 10502: {'lr': 0.00017493333333333335, 'samples': 336064, 'steps': 656, 'loss/train': 5.255721569061279} -09/20/2021 16:45:44 - INFO - __main__ - Step 10503: {'lr': 0.00017493333333333335, 'samples': 336096, 'steps': 656, 'loss/train': 4.835816383361816} -09/20/2021 16:45:45 - INFO - __main__ - Step 10504: {'lr': 0.00017493333333333335, 'samples': 336128, 'steps': 656, 'loss/train': 4.746545314788818} -09/20/2021 16:45:45 - INFO - __main__ - Step 10505: {'lr': 0.00017493333333333335, 'samples': 336160, 'steps': 656, 'loss/train': 5.436575412750244} -09/20/2021 16:45:46 - INFO - __main__ - Step 10506: {'lr': 0.00017493333333333335, 'samples': 336192, 'steps': 656, 'loss/train': 2.5664405822753906} -09/20/2021 16:45:47 - INFO - __main__ - Step 10507: {'lr': 0.00017493333333333335, 'samples': 336224, 'steps': 656, 'loss/train': 4.746216773986816} -09/20/2021 16:45:48 - INFO - __main__ - Step 10508: {'lr': 0.00017493333333333335, 'samples': 336256, 'steps': 656, 'loss/train': 3.6324071884155273} -09/20/2021 16:45:48 - INFO - __main__ - Step 10509: {'lr': 0.00017493333333333335, 'samples': 336288, 'steps': 656, 'loss/train': 2.8237874507904053} -09/20/2021 16:45:50 - INFO - __main__ - Step 10510: {'lr': 0.00017493333333333335, 'samples': 336320, 'steps': 656, 'loss/train': 4.26629638671875} -09/20/2021 16:45:50 - INFO - __main__ - Step 10511: {'lr': 0.00017493333333333335, 'samples': 336352, 'steps': 656, 'loss/train': 4.155777454376221} -09/20/2021 16:45:51 - INFO - __main__ - Step 10512: {'lr': 0.00017493333333333335, 'samples': 336384, 'steps': 656, 'loss/train': 4.213776588439941} -09/20/2021 16:45:52 - INFO - __main__ - Step 10513: {'lr': 0.0001752, 'samples': 336416, 'steps': 657, 'loss/train': 3.5282981395721436} -09/20/2021 16:45:53 - INFO - __main__ - Step 10514: {'lr': 0.0001752, 'samples': 336448, 'steps': 657, 'loss/train': 4.021828651428223} -09/20/2021 16:45:53 - INFO - __main__ - Step 10515: {'lr': 0.0001752, 'samples': 336480, 'steps': 657, 'loss/train': 4.154494285583496} -09/20/2021 16:45:54 - INFO - __main__ - Step 10516: {'lr': 0.0001752, 'samples': 336512, 'steps': 657, 'loss/train': 4.317999839782715} -09/20/2021 16:45:55 - INFO - __main__ - Step 10517: {'lr': 0.0001752, 'samples': 336544, 'steps': 657, 'loss/train': 4.21370267868042} -09/20/2021 16:45:56 - INFO - __main__ - Step 10518: {'lr': 0.0001752, 'samples': 336576, 'steps': 657, 'loss/train': 4.496139049530029} -09/20/2021 16:45:56 - INFO - __main__ - Step 10519: {'lr': 0.0001752, 'samples': 336608, 'steps': 657, 'loss/train': 4.516943454742432} -09/20/2021 16:45:57 - INFO - __main__ - Step 10520: {'lr': 0.0001752, 'samples': 336640, 'steps': 657, 'loss/train': 4.533854007720947} -09/20/2021 16:45:58 - INFO - __main__ - Step 10521: {'lr': 0.0001752, 'samples': 336672, 'steps': 657, 'loss/train': 5.059892177581787} -09/20/2021 16:45:59 - INFO - __main__ - Step 10522: {'lr': 0.0001752, 'samples': 336704, 'steps': 657, 'loss/train': 4.117922782897949} -09/20/2021 16:45:59 - INFO - __main__ - Step 10523: {'lr': 0.0001752, 'samples': 336736, 'steps': 657, 'loss/train': 5.1873393058776855} -09/20/2021 16:46:00 - INFO - __main__ - Step 10524: {'lr': 0.0001752, 'samples': 336768, 'steps': 657, 'loss/train': 4.89213228225708} -09/20/2021 16:46:01 - INFO - __main__ - Step 10525: {'lr': 0.0001752, 'samples': 336800, 'steps': 657, 'loss/train': 4.34438419342041} -09/20/2021 16:46:02 - INFO - __main__ - Step 10526: {'lr': 0.0001752, 'samples': 336832, 'steps': 657, 'loss/train': 5.210491180419922} -09/20/2021 16:46:02 - INFO - __main__ - Step 10527: {'lr': 0.0001752, 'samples': 336864, 'steps': 657, 'loss/train': 4.407757759094238} -09/20/2021 16:46:03 - INFO - __main__ - Step 10528: {'lr': 0.0001752, 'samples': 336896, 'steps': 657, 'loss/train': 4.112328052520752} -09/20/2021 16:46:04 - INFO - __main__ - Step 10529: {'lr': 0.00017546666666666666, 'samples': 336928, 'steps': 658, 'loss/train': 3.908726453781128} -09/20/2021 16:46:05 - INFO - __main__ - Step 10530: {'lr': 0.00017546666666666666, 'samples': 336960, 'steps': 658, 'loss/train': 3.9822046756744385} -09/20/2021 16:46:06 - INFO - __main__ - Step 10531: {'lr': 0.00017546666666666666, 'samples': 336992, 'steps': 658, 'loss/train': 3.512779951095581} -09/20/2021 16:46:06 - INFO - __main__ - Step 10532: {'lr': 0.00017546666666666666, 'samples': 337024, 'steps': 658, 'loss/train': 4.613461971282959} -09/20/2021 16:46:07 - INFO - __main__ - Step 10533: {'lr': 0.00017546666666666666, 'samples': 337056, 'steps': 658, 'loss/train': 5.091205596923828} -09/20/2021 16:46:08 - INFO - __main__ - Step 10534: {'lr': 0.00017546666666666666, 'samples': 337088, 'steps': 658, 'loss/train': 3.9120938777923584} -09/20/2021 16:46:09 - INFO - __main__ - Step 10535: {'lr': 0.00017546666666666666, 'samples': 337120, 'steps': 658, 'loss/train': 4.443889617919922} -09/20/2021 16:46:09 - INFO - __main__ - Step 10536: {'lr': 0.00017546666666666666, 'samples': 337152, 'steps': 658, 'loss/train': 3.631579875946045} -09/20/2021 16:46:10 - INFO - __main__ - Step 10537: {'lr': 0.00017546666666666666, 'samples': 337184, 'steps': 658, 'loss/train': 3.763453722000122} -09/20/2021 16:46:11 - INFO - __main__ - Step 10538: {'lr': 0.00017546666666666666, 'samples': 337216, 'steps': 658, 'loss/train': 4.200841903686523} -09/20/2021 16:46:12 - INFO - __main__ - Step 10539: {'lr': 0.00017546666666666666, 'samples': 337248, 'steps': 658, 'loss/train': 3.7716732025146484} -09/20/2021 16:46:12 - INFO - __main__ - Step 10540: {'lr': 0.00017546666666666666, 'samples': 337280, 'steps': 658, 'loss/train': 5.237102031707764} -09/20/2021 16:46:14 - INFO - __main__ - Step 10541: {'lr': 0.00017546666666666666, 'samples': 337312, 'steps': 658, 'loss/train': 3.965346574783325} -09/20/2021 16:46:14 - INFO - __main__ - Step 10542: {'lr': 0.00017546666666666666, 'samples': 337344, 'steps': 658, 'loss/train': 5.106149196624756} -09/20/2021 16:46:15 - INFO - __main__ - Step 10543: {'lr': 0.00017546666666666666, 'samples': 337376, 'steps': 658, 'loss/train': 4.112148761749268} -09/20/2021 16:46:16 - INFO - __main__ - Step 10544: {'lr': 0.00017546666666666666, 'samples': 337408, 'steps': 658, 'loss/train': 4.10458517074585} -09/20/2021 16:46:17 - INFO - __main__ - Step 10545: {'lr': 0.00017573333333333334, 'samples': 337440, 'steps': 659, 'loss/train': 3.841639757156372} -09/20/2021 16:46:18 - INFO - __main__ - Step 10546: {'lr': 0.00017573333333333334, 'samples': 337472, 'steps': 659, 'loss/train': 3.8164875507354736} -09/20/2021 16:46:18 - INFO - __main__ - Step 10547: {'lr': 0.00017573333333333334, 'samples': 337504, 'steps': 659, 'loss/train': 4.730325698852539} -09/20/2021 16:46:19 - INFO - __main__ - Step 10548: {'lr': 0.00017573333333333334, 'samples': 337536, 'steps': 659, 'loss/train': 3.693905830383301} -09/20/2021 16:46:20 - INFO - __main__ - Step 10549: {'lr': 0.00017573333333333334, 'samples': 337568, 'steps': 659, 'loss/train': 5.250576019287109} -09/20/2021 16:46:21 - INFO - __main__ - Step 10550: {'lr': 0.00017573333333333334, 'samples': 337600, 'steps': 659, 'loss/train': 4.0963521003723145} -09/20/2021 16:46:21 - INFO - __main__ - Step 10551: {'lr': 0.00017573333333333334, 'samples': 337632, 'steps': 659, 'loss/train': 3.9524307250976562} -09/20/2021 16:46:22 - INFO - __main__ - Step 10552: {'lr': 0.00017573333333333334, 'samples': 337664, 'steps': 659, 'loss/train': 2.516395330429077} -09/20/2021 16:46:23 - INFO - __main__ - Step 10553: {'lr': 0.00017573333333333334, 'samples': 337696, 'steps': 659, 'loss/train': 4.560606479644775} -09/20/2021 16:46:24 - INFO - __main__ - Step 10554: {'lr': 0.00017573333333333334, 'samples': 337728, 'steps': 659, 'loss/train': 4.20713996887207} -09/20/2021 16:46:24 - INFO - __main__ - Step 10555: {'lr': 0.00017573333333333334, 'samples': 337760, 'steps': 659, 'loss/train': 4.136289596557617} -09/20/2021 16:46:25 - INFO - __main__ - Step 10556: {'lr': 0.00017573333333333334, 'samples': 337792, 'steps': 659, 'loss/train': 4.656594276428223} -09/20/2021 16:46:26 - INFO - __main__ - Step 10557: {'lr': 0.00017573333333333334, 'samples': 337824, 'steps': 659, 'loss/train': 5.09838342666626} -09/20/2021 16:46:27 - INFO - __main__ - Step 10558: {'lr': 0.00017573333333333334, 'samples': 337856, 'steps': 659, 'loss/train': 4.649855136871338} -09/20/2021 16:46:27 - INFO - __main__ - Step 10559: {'lr': 0.00017573333333333334, 'samples': 337888, 'steps': 659, 'loss/train': 4.47335147857666} -09/20/2021 16:46:28 - INFO - __main__ - Step 10560: {'lr': 0.00017573333333333334, 'samples': 337920, 'steps': 659, 'loss/train': 4.702092170715332} -09/20/2021 16:46:29 - INFO - __main__ - Step 10561: {'lr': 0.00017600000000000002, 'samples': 337952, 'steps': 660, 'loss/train': 2.6573009490966797} -09/20/2021 16:46:30 - INFO - __main__ - Step 10562: {'lr': 0.00017600000000000002, 'samples': 337984, 'steps': 660, 'loss/train': 3.7946598529815674} -09/20/2021 16:46:30 - INFO - __main__ - Step 10563: {'lr': 0.00017600000000000002, 'samples': 338016, 'steps': 660, 'loss/train': 3.2716586589813232} -09/20/2021 16:46:31 - INFO - __main__ - Step 10564: {'lr': 0.00017600000000000002, 'samples': 338048, 'steps': 660, 'loss/train': 4.035428047180176} -09/20/2021 16:46:32 - INFO - __main__ - Step 10565: {'lr': 0.00017600000000000002, 'samples': 338080, 'steps': 660, 'loss/train': 4.527972221374512} -09/20/2021 16:46:33 - INFO - __main__ - Step 10566: {'lr': 0.00017600000000000002, 'samples': 338112, 'steps': 660, 'loss/train': 5.2505035400390625} -09/20/2021 16:46:33 - INFO - __main__ - Step 10567: {'lr': 0.00017600000000000002, 'samples': 338144, 'steps': 660, 'loss/train': 4.6715006828308105} -09/20/2021 16:46:34 - INFO - __main__ - Step 10568: {'lr': 0.00017600000000000002, 'samples': 338176, 'steps': 660, 'loss/train': 4.635469913482666} -09/20/2021 16:46:35 - INFO - __main__ - Step 10569: {'lr': 0.00017600000000000002, 'samples': 338208, 'steps': 660, 'loss/train': 4.01348876953125} -09/20/2021 16:46:36 - INFO - __main__ - Step 10570: {'lr': 0.00017600000000000002, 'samples': 338240, 'steps': 660, 'loss/train': 3.550518274307251} -09/20/2021 16:46:36 - INFO - __main__ - Step 10571: {'lr': 0.00017600000000000002, 'samples': 338272, 'steps': 660, 'loss/train': 4.385488510131836} -09/20/2021 16:46:37 - INFO - __main__ - Step 10572: {'lr': 0.00017600000000000002, 'samples': 338304, 'steps': 660, 'loss/train': 4.37652587890625} -09/20/2021 16:46:39 - INFO - __main__ - Step 10573: {'lr': 0.00017600000000000002, 'samples': 338336, 'steps': 660, 'loss/train': 3.7670764923095703} -09/20/2021 16:46:40 - INFO - __main__ - Step 10574: {'lr': 0.00017600000000000002, 'samples': 338368, 'steps': 660, 'loss/train': 5.1238250732421875} -09/20/2021 16:46:40 - INFO - __main__ - Step 10575: {'lr': 0.00017600000000000002, 'samples': 338400, 'steps': 660, 'loss/train': 4.534255027770996} -09/20/2021 16:46:41 - INFO - __main__ - Step 10576: {'lr': 0.00017600000000000002, 'samples': 338432, 'steps': 660, 'loss/train': 4.195713043212891} -09/20/2021 16:46:42 - INFO - __main__ - Step 10577: {'lr': 0.00017626666666666668, 'samples': 338464, 'steps': 661, 'loss/train': 1.6003830432891846} -09/20/2021 16:46:43 - INFO - __main__ - Step 10578: {'lr': 0.00017626666666666668, 'samples': 338496, 'steps': 661, 'loss/train': 4.163867950439453} -09/20/2021 16:46:43 - INFO - __main__ - Step 10579: {'lr': 0.00017626666666666668, 'samples': 338528, 'steps': 661, 'loss/train': 4.227255344390869} -09/20/2021 16:46:44 - INFO - __main__ - Step 10580: {'lr': 0.00017626666666666668, 'samples': 338560, 'steps': 661, 'loss/train': 4.240952968597412} -09/20/2021 16:46:45 - INFO - __main__ - Step 10581: {'lr': 0.00017626666666666668, 'samples': 338592, 'steps': 661, 'loss/train': 5.047826766967773} -09/20/2021 16:46:46 - INFO - __main__ - Step 10582: {'lr': 0.00017626666666666668, 'samples': 338624, 'steps': 661, 'loss/train': 3.849630832672119} -09/20/2021 16:46:46 - INFO - __main__ - Step 10583: {'lr': 0.00017626666666666668, 'samples': 338656, 'steps': 661, 'loss/train': 4.612513065338135} -09/20/2021 16:46:47 - INFO - __main__ - Step 10584: {'lr': 0.00017626666666666668, 'samples': 338688, 'steps': 661, 'loss/train': 4.957599639892578} -09/20/2021 16:46:48 - INFO - __main__ - Step 10585: {'lr': 0.00017626666666666668, 'samples': 338720, 'steps': 661, 'loss/train': 4.231832981109619} -09/20/2021 16:46:49 - INFO - __main__ - Step 10586: {'lr': 0.00017626666666666668, 'samples': 338752, 'steps': 661, 'loss/train': 3.7865495681762695} -09/20/2021 16:46:49 - INFO - __main__ - Step 10587: {'lr': 0.00017626666666666668, 'samples': 338784, 'steps': 661, 'loss/train': 3.785512685775757} -09/20/2021 16:46:50 - INFO - __main__ - Step 10588: {'lr': 0.00017626666666666668, 'samples': 338816, 'steps': 661, 'loss/train': 5.207725524902344} -09/20/2021 16:46:51 - INFO - __main__ - Step 10589: {'lr': 0.00017626666666666668, 'samples': 338848, 'steps': 661, 'loss/train': 4.386537075042725} -09/20/2021 16:46:52 - INFO - __main__ - Step 10590: {'lr': 0.00017626666666666668, 'samples': 338880, 'steps': 661, 'loss/train': 5.085824966430664} -09/20/2021 16:46:52 - INFO - __main__ - Step 10591: {'lr': 0.00017626666666666668, 'samples': 338912, 'steps': 661, 'loss/train': 2.811375856399536} -09/20/2021 16:46:53 - INFO - __main__ - Step 10592: {'lr': 0.00017626666666666668, 'samples': 338944, 'steps': 661, 'loss/train': 4.656874179840088} -09/20/2021 16:46:54 - INFO - __main__ - Step 10593: {'lr': 0.00017653333333333336, 'samples': 338976, 'steps': 662, 'loss/train': 4.7326765060424805} -09/20/2021 16:46:55 - INFO - __main__ - Step 10594: {'lr': 0.00017653333333333336, 'samples': 339008, 'steps': 662, 'loss/train': 3.758397102355957} -09/20/2021 16:46:56 - INFO - __main__ - Step 10595: {'lr': 0.00017653333333333336, 'samples': 339040, 'steps': 662, 'loss/train': 4.516158580780029} -09/20/2021 16:46:56 - INFO - __main__ - Step 10596: {'lr': 0.00017653333333333336, 'samples': 339072, 'steps': 662, 'loss/train': 5.448105812072754} -09/20/2021 16:46:57 - INFO - __main__ - Step 10597: {'lr': 0.00017653333333333336, 'samples': 339104, 'steps': 662, 'loss/train': 2.9724812507629395} -09/20/2021 16:46:58 - INFO - __main__ - Step 10598: {'lr': 0.00017653333333333336, 'samples': 339136, 'steps': 662, 'loss/train': 4.093414306640625} -09/20/2021 16:46:59 - INFO - __main__ - Step 10599: {'lr': 0.00017653333333333336, 'samples': 339168, 'steps': 662, 'loss/train': 3.6789703369140625} -09/20/2021 16:46:59 - INFO - __main__ - Step 10600: {'lr': 0.00017653333333333336, 'samples': 339200, 'steps': 662, 'loss/train': 3.0114479064941406} -09/20/2021 16:47:00 - INFO - __main__ - Step 10601: {'lr': 0.00017653333333333336, 'samples': 339232, 'steps': 662, 'loss/train': 2.2637314796447754} -09/20/2021 16:47:01 - INFO - __main__ - Step 10602: {'lr': 0.00017653333333333336, 'samples': 339264, 'steps': 662, 'loss/train': 3.1178090572357178} -09/20/2021 16:47:02 - INFO - __main__ - Step 10603: {'lr': 0.00017653333333333336, 'samples': 339296, 'steps': 662, 'loss/train': 3.164950132369995} -09/20/2021 16:47:02 - INFO - __main__ - Step 10604: {'lr': 0.00017653333333333336, 'samples': 339328, 'steps': 662, 'loss/train': 2.1081135272979736} -09/20/2021 16:47:03 - INFO - __main__ - Step 10605: {'lr': 0.00017653333333333336, 'samples': 339360, 'steps': 662, 'loss/train': 2.3756847381591797} -09/20/2021 16:47:04 - INFO - __main__ - Step 10606: {'lr': 0.00017653333333333336, 'samples': 339392, 'steps': 662, 'loss/train': 3.2015321254730225} -09/20/2021 16:47:05 - INFO - __main__ - Step 10607: {'lr': 0.00017653333333333336, 'samples': 339424, 'steps': 662, 'loss/train': 3.287447929382324} -09/20/2021 16:47:05 - INFO - __main__ - Step 10608: {'lr': 0.00017653333333333336, 'samples': 339456, 'steps': 662, 'loss/train': 4.676942825317383} -09/20/2021 16:47:07 - INFO - __main__ - Step 10609: {'lr': 0.00017680000000000001, 'samples': 339488, 'steps': 663, 'loss/train': 5.036538600921631} -09/20/2021 16:47:08 - INFO - __main__ - Step 10610: {'lr': 0.00017680000000000001, 'samples': 339520, 'steps': 663, 'loss/train': 0.6468448042869568} -09/20/2021 16:47:09 - INFO - __main__ - Step 10611: {'lr': 0.00017680000000000001, 'samples': 339552, 'steps': 663, 'loss/train': 3.7737691402435303} -09/20/2021 16:47:10 - INFO - __main__ - Step 10612: {'lr': 0.00017680000000000001, 'samples': 339584, 'steps': 663, 'loss/train': 5.1616129875183105} -09/20/2021 16:47:10 - INFO - __main__ - Step 10613: {'lr': 0.00017680000000000001, 'samples': 339616, 'steps': 663, 'loss/train': 5.013461589813232} -09/20/2021 16:47:11 - INFO - __main__ - Step 10614: {'lr': 0.00017680000000000001, 'samples': 339648, 'steps': 663, 'loss/train': 3.7651147842407227} -09/20/2021 16:47:12 - INFO - __main__ - Step 10615: {'lr': 0.00017680000000000001, 'samples': 339680, 'steps': 663, 'loss/train': 4.682193279266357} -09/20/2021 16:47:13 - INFO - __main__ - Step 10616: {'lr': 0.00017680000000000001, 'samples': 339712, 'steps': 663, 'loss/train': 4.644949436187744} -09/20/2021 16:47:13 - INFO - __main__ - Step 10617: {'lr': 0.00017680000000000001, 'samples': 339744, 'steps': 663, 'loss/train': 4.519559383392334} -09/20/2021 16:47:14 - INFO - __main__ - Step 10618: {'lr': 0.00017680000000000001, 'samples': 339776, 'steps': 663, 'loss/train': 4.979047775268555} -09/20/2021 16:47:15 - INFO - __main__ - Step 10619: {'lr': 0.00017680000000000001, 'samples': 339808, 'steps': 663, 'loss/train': 4.987420082092285} -09/20/2021 16:47:16 - INFO - __main__ - Step 10620: {'lr': 0.00017680000000000001, 'samples': 339840, 'steps': 663, 'loss/train': 4.72322416305542} -09/20/2021 16:47:16 - INFO - __main__ - Step 10621: {'lr': 0.00017680000000000001, 'samples': 339872, 'steps': 663, 'loss/train': 4.322843551635742} -09/20/2021 16:47:17 - INFO - __main__ - Step 10622: {'lr': 0.00017680000000000001, 'samples': 339904, 'steps': 663, 'loss/train': 4.596656799316406} -09/20/2021 16:47:18 - INFO - __main__ - Step 10623: {'lr': 0.00017680000000000001, 'samples': 339936, 'steps': 663, 'loss/train': 3.909156322479248} -09/20/2021 16:47:19 - INFO - __main__ - Step 10624: {'lr': 0.00017680000000000001, 'samples': 339968, 'steps': 663, 'loss/train': 4.44904088973999} -09/20/2021 16:47:19 - INFO - __main__ - Step 10625: {'lr': 0.00017706666666666667, 'samples': 340000, 'steps': 664, 'loss/train': 3.684051990509033} -09/20/2021 16:47:20 - INFO - __main__ - Step 10626: {'lr': 0.00017706666666666667, 'samples': 340032, 'steps': 664, 'loss/train': 3.957301378250122} -09/20/2021 16:47:21 - INFO - __main__ - Step 10627: {'lr': 0.00017706666666666667, 'samples': 340064, 'steps': 664, 'loss/train': 6.277539253234863} -09/20/2021 16:47:22 - INFO - __main__ - Step 10628: {'lr': 0.00017706666666666667, 'samples': 340096, 'steps': 664, 'loss/train': 4.858173370361328} -09/20/2021 16:47:22 - INFO - __main__ - Step 10629: {'lr': 0.00017706666666666667, 'samples': 340128, 'steps': 664, 'loss/train': 4.154018878936768} -09/20/2021 16:47:23 - INFO - __main__ - Step 10630: {'lr': 0.00017706666666666667, 'samples': 340160, 'steps': 664, 'loss/train': 4.905262470245361} -09/20/2021 16:47:24 - INFO - __main__ - Step 10631: {'lr': 0.00017706666666666667, 'samples': 340192, 'steps': 664, 'loss/train': 4.597325325012207} -09/20/2021 16:47:25 - INFO - __main__ - Step 10632: {'lr': 0.00017706666666666667, 'samples': 340224, 'steps': 664, 'loss/train': 4.800408363342285} -09/20/2021 16:47:25 - INFO - __main__ - Step 10633: {'lr': 0.00017706666666666667, 'samples': 340256, 'steps': 664, 'loss/train': 4.7302751541137695} -09/20/2021 16:47:26 - INFO - __main__ - Step 10634: {'lr': 0.00017706666666666667, 'samples': 340288, 'steps': 664, 'loss/train': 4.204488277435303} -09/20/2021 16:47:27 - INFO - __main__ - Step 10635: {'lr': 0.00017706666666666667, 'samples': 340320, 'steps': 664, 'loss/train': 3.857795238494873} -09/20/2021 16:47:28 - INFO - __main__ - Step 10636: {'lr': 0.00017706666666666667, 'samples': 340352, 'steps': 664, 'loss/train': 4.472656726837158} -09/20/2021 16:47:28 - INFO - __main__ - Step 10637: {'lr': 0.00017706666666666667, 'samples': 340384, 'steps': 664, 'loss/train': 4.424192905426025} -09/20/2021 16:47:29 - INFO - __main__ - Step 10638: {'lr': 0.00017706666666666667, 'samples': 340416, 'steps': 664, 'loss/train': 4.7312517166137695} -09/20/2021 16:47:30 - INFO - __main__ - Step 10639: {'lr': 0.00017706666666666667, 'samples': 340448, 'steps': 664, 'loss/train': 4.603412628173828} -09/20/2021 16:47:32 - INFO - __main__ - Step 10640: {'lr': 0.00017706666666666667, 'samples': 340480, 'steps': 664, 'loss/train': 4.125955104827881} -09/20/2021 16:47:33 - INFO - __main__ - Step 10641: {'lr': 0.00017733333333333335, 'samples': 340512, 'steps': 665, 'loss/train': 3.8551459312438965} -09/20/2021 16:47:33 - INFO - __main__ - Step 10642: {'lr': 0.00017733333333333335, 'samples': 340544, 'steps': 665, 'loss/train': 4.55058479309082} -09/20/2021 16:47:34 - INFO - __main__ - Step 10643: {'lr': 0.00017733333333333335, 'samples': 340576, 'steps': 665, 'loss/train': 2.9411518573760986} -09/20/2021 16:47:35 - INFO - __main__ - Step 10644: {'lr': 0.00017733333333333335, 'samples': 340608, 'steps': 665, 'loss/train': 1.4697762727737427} -09/20/2021 16:47:36 - INFO - __main__ - Step 10645: {'lr': 0.00017733333333333335, 'samples': 340640, 'steps': 665, 'loss/train': 2.461376190185547} -09/20/2021 16:47:36 - INFO - __main__ - Step 10646: {'lr': 0.00017733333333333335, 'samples': 340672, 'steps': 665, 'loss/train': 1.67366623878479} -09/20/2021 16:47:37 - INFO - __main__ - Step 10647: {'lr': 0.00017733333333333335, 'samples': 340704, 'steps': 665, 'loss/train': 2.757333993911743} -09/20/2021 16:47:38 - INFO - __main__ - Step 10648: {'lr': 0.00017733333333333335, 'samples': 340736, 'steps': 665, 'loss/train': 2.759618043899536} -09/20/2021 16:47:39 - INFO - __main__ - Step 10649: {'lr': 0.00017733333333333335, 'samples': 340768, 'steps': 665, 'loss/train': 2.068049430847168} -09/20/2021 16:47:39 - INFO - __main__ - Step 10650: {'lr': 0.00017733333333333335, 'samples': 340800, 'steps': 665, 'loss/train': 1.8240978717803955} -09/20/2021 16:47:40 - INFO - __main__ - Step 10651: {'lr': 0.00017733333333333335, 'samples': 340832, 'steps': 665, 'loss/train': 4.325057506561279} -09/20/2021 16:47:41 - INFO - __main__ - Step 10652: {'lr': 0.00017733333333333335, 'samples': 340864, 'steps': 665, 'loss/train': 4.3684892654418945} -09/20/2021 16:47:42 - INFO - __main__ - Step 10653: {'lr': 0.00017733333333333335, 'samples': 340896, 'steps': 665, 'loss/train': 4.658807277679443} -09/20/2021 16:47:42 - INFO - __main__ - Step 10654: {'lr': 0.00017733333333333335, 'samples': 340928, 'steps': 665, 'loss/train': 3.961214065551758} -09/20/2021 16:47:43 - INFO - __main__ - Step 10655: {'lr': 0.00017733333333333335, 'samples': 340960, 'steps': 665, 'loss/train': 3.626439332962036} -09/20/2021 16:47:44 - INFO - __main__ - Step 10656: {'lr': 0.00017733333333333335, 'samples': 340992, 'steps': 665, 'loss/train': 5.105169296264648} -09/20/2021 16:47:45 - INFO - __main__ - Step 10657: {'lr': 0.0001776, 'samples': 341024, 'steps': 666, 'loss/train': 3.9763731956481934} -09/20/2021 16:47:46 - INFO - __main__ - Step 10658: {'lr': 0.0001776, 'samples': 341056, 'steps': 666, 'loss/train': 4.854033946990967} -09/20/2021 16:47:46 - INFO - __main__ - Step 10659: {'lr': 0.0001776, 'samples': 341088, 'steps': 666, 'loss/train': 4.4841837882995605} -09/20/2021 16:47:47 - INFO - __main__ - Step 10660: {'lr': 0.0001776, 'samples': 341120, 'steps': 666, 'loss/train': 3.8724448680877686} -09/20/2021 16:47:48 - INFO - __main__ - Step 10661: {'lr': 0.0001776, 'samples': 341152, 'steps': 666, 'loss/train': 4.755134582519531} -09/20/2021 16:47:49 - INFO - __main__ - Step 10662: {'lr': 0.0001776, 'samples': 341184, 'steps': 666, 'loss/train': 5.1055474281311035} -09/20/2021 16:47:49 - INFO - __main__ - Step 10663: {'lr': 0.0001776, 'samples': 341216, 'steps': 666, 'loss/train': 5.4810943603515625} -09/20/2021 16:47:50 - INFO - __main__ - Step 10664: {'lr': 0.0001776, 'samples': 341248, 'steps': 666, 'loss/train': 4.2847113609313965} -09/20/2021 16:47:51 - INFO - __main__ - Step 10665: {'lr': 0.0001776, 'samples': 341280, 'steps': 666, 'loss/train': 4.31807804107666} -09/20/2021 16:47:52 - INFO - __main__ - Step 10666: {'lr': 0.0001776, 'samples': 341312, 'steps': 666, 'loss/train': 4.4716691970825195} -09/20/2021 16:47:52 - INFO - __main__ - Step 10667: {'lr': 0.0001776, 'samples': 341344, 'steps': 666, 'loss/train': 4.893887042999268} -09/20/2021 16:47:53 - INFO - __main__ - Step 10668: {'lr': 0.0001776, 'samples': 341376, 'steps': 666, 'loss/train': 3.7287540435791016} -09/20/2021 16:47:54 - INFO - __main__ - Step 10669: {'lr': 0.0001776, 'samples': 341408, 'steps': 666, 'loss/train': 4.350986003875732} -09/20/2021 16:47:55 - INFO - __main__ - Step 10670: {'lr': 0.0001776, 'samples': 341440, 'steps': 666, 'loss/train': 4.2984137535095215} -09/20/2021 16:47:56 - INFO - __main__ - Step 10671: {'lr': 0.0001776, 'samples': 341472, 'steps': 666, 'loss/train': 4.830106258392334} -09/20/2021 16:47:57 - INFO - __main__ - Step 10672: {'lr': 0.0001776, 'samples': 341504, 'steps': 666, 'loss/train': 4.524476528167725} -09/20/2021 16:47:57 - INFO - __main__ - Step 10673: {'lr': 0.00017786666666666666, 'samples': 341536, 'steps': 667, 'loss/train': 5.519395351409912} -09/20/2021 16:47:58 - INFO - __main__ - Step 10674: {'lr': 0.00017786666666666666, 'samples': 341568, 'steps': 667, 'loss/train': 5.098978042602539} -09/20/2021 16:47:59 - INFO - __main__ - Step 10675: {'lr': 0.00017786666666666666, 'samples': 341600, 'steps': 667, 'loss/train': 4.399795055389404} -09/20/2021 16:48:00 - INFO - __main__ - Step 10676: {'lr': 0.00017786666666666666, 'samples': 341632, 'steps': 667, 'loss/train': 4.711519718170166} -09/20/2021 16:48:00 - INFO - __main__ - Step 10677: {'lr': 0.00017786666666666666, 'samples': 341664, 'steps': 667, 'loss/train': 5.2777228355407715} -09/20/2021 16:48:01 - INFO - __main__ - Step 10678: {'lr': 0.00017786666666666666, 'samples': 341696, 'steps': 667, 'loss/train': 1.7861714363098145} -09/20/2021 16:48:02 - INFO - __main__ - Step 10679: {'lr': 0.00017786666666666666, 'samples': 341728, 'steps': 667, 'loss/train': 4.368166446685791} -09/20/2021 16:48:03 - INFO - __main__ - Step 10680: {'lr': 0.00017786666666666666, 'samples': 341760, 'steps': 667, 'loss/train': 2.02959942817688} -09/20/2021 16:48:03 - INFO - __main__ - Step 10681: {'lr': 0.00017786666666666666, 'samples': 341792, 'steps': 667, 'loss/train': 4.995675563812256} -09/20/2021 16:48:04 - INFO - __main__ - Step 10682: {'lr': 0.00017786666666666666, 'samples': 341824, 'steps': 667, 'loss/train': 3.9678759574890137} -09/20/2021 16:48:05 - INFO - __main__ - Step 10683: {'lr': 0.00017786666666666666, 'samples': 341856, 'steps': 667, 'loss/train': 4.2527384757995605} -09/20/2021 16:48:06 - INFO - __main__ - Step 10684: {'lr': 0.00017786666666666666, 'samples': 341888, 'steps': 667, 'loss/train': 4.263549327850342} -09/20/2021 16:48:06 - INFO - __main__ - Step 10685: {'lr': 0.00017786666666666666, 'samples': 341920, 'steps': 667, 'loss/train': 4.27578592300415} -09/20/2021 16:48:07 - INFO - __main__ - Step 10686: {'lr': 0.00017786666666666666, 'samples': 341952, 'steps': 667, 'loss/train': 1.9687731266021729} -09/20/2021 16:48:08 - INFO - __main__ - Step 10687: {'lr': 0.00017786666666666666, 'samples': 341984, 'steps': 667, 'loss/train': 4.108392238616943} -09/20/2021 16:48:09 - INFO - __main__ - Step 10688: {'lr': 0.00017786666666666666, 'samples': 342016, 'steps': 667, 'loss/train': 5.244431972503662} -09/20/2021 16:48:10 - INFO - __main__ - Step 10689: {'lr': 0.00017813333333333334, 'samples': 342048, 'steps': 668, 'loss/train': 2.684945821762085} -09/20/2021 16:48:10 - INFO - __main__ - Step 10690: {'lr': 0.00017813333333333334, 'samples': 342080, 'steps': 668, 'loss/train': 3.8359713554382324} -09/20/2021 16:48:11 - INFO - __main__ - Step 10691: {'lr': 0.00017813333333333334, 'samples': 342112, 'steps': 668, 'loss/train': 5.025691032409668} -09/20/2021 16:48:12 - INFO - __main__ - Step 10692: {'lr': 0.00017813333333333334, 'samples': 342144, 'steps': 668, 'loss/train': 4.135557651519775} -09/20/2021 16:48:13 - INFO - __main__ - Step 10693: {'lr': 0.00017813333333333334, 'samples': 342176, 'steps': 668, 'loss/train': 5.731607437133789} -09/20/2021 16:48:13 - INFO - __main__ - Step 10694: {'lr': 0.00017813333333333334, 'samples': 342208, 'steps': 668, 'loss/train': 3.7299599647521973} -09/20/2021 16:48:14 - INFO - __main__ - Step 10695: {'lr': 0.00017813333333333334, 'samples': 342240, 'steps': 668, 'loss/train': 4.304282188415527} -09/20/2021 16:48:15 - INFO - __main__ - Step 10696: {'lr': 0.00017813333333333334, 'samples': 342272, 'steps': 668, 'loss/train': 3.9876298904418945} -09/20/2021 16:48:16 - INFO - __main__ - Step 10697: {'lr': 0.00017813333333333334, 'samples': 342304, 'steps': 668, 'loss/train': 5.31649923324585} -09/20/2021 16:48:16 - INFO - __main__ - Step 10698: {'lr': 0.00017813333333333334, 'samples': 342336, 'steps': 668, 'loss/train': 4.673520565032959} -09/20/2021 16:48:17 - INFO - __main__ - Step 10699: {'lr': 0.00017813333333333334, 'samples': 342368, 'steps': 668, 'loss/train': 6.493608474731445} -09/20/2021 16:48:18 - INFO - __main__ - Step 10700: {'lr': 0.00017813333333333334, 'samples': 342400, 'steps': 668, 'loss/train': 4.8535542488098145} -09/20/2021 16:48:19 - INFO - __main__ - Step 10701: {'lr': 0.00017813333333333334, 'samples': 342432, 'steps': 668, 'loss/train': 5.311326503753662} -09/20/2021 16:48:20 - INFO - __main__ - Step 10702: {'lr': 0.00017813333333333334, 'samples': 342464, 'steps': 668, 'loss/train': 1.9289757013320923} -09/20/2021 16:48:21 - INFO - __main__ - Step 10703: {'lr': 0.00017813333333333334, 'samples': 342496, 'steps': 668, 'loss/train': 1.6343697309494019} -09/20/2021 16:48:21 - INFO - __main__ - Step 10704: {'lr': 0.00017813333333333334, 'samples': 342528, 'steps': 668, 'loss/train': 2.2295804023742676} -09/20/2021 16:48:22 - INFO - __main__ - Step 10705: {'lr': 0.0001784, 'samples': 342560, 'steps': 669, 'loss/train': 2.014453649520874} -09/20/2021 16:48:23 - INFO - __main__ - Step 10706: {'lr': 0.0001784, 'samples': 342592, 'steps': 669, 'loss/train': 4.611207485198975} -09/20/2021 16:48:24 - INFO - __main__ - Step 10707: {'lr': 0.0001784, 'samples': 342624, 'steps': 669, 'loss/train': 3.7285571098327637} -09/20/2021 16:48:25 - INFO - __main__ - Step 10708: {'lr': 0.0001784, 'samples': 342656, 'steps': 669, 'loss/train': 4.438520908355713} -09/20/2021 16:48:25 - INFO - __main__ - Step 10709: {'lr': 0.0001784, 'samples': 342688, 'steps': 669, 'loss/train': 4.339228630065918} -09/20/2021 16:48:26 - INFO - __main__ - Step 10710: {'lr': 0.0001784, 'samples': 342720, 'steps': 669, 'loss/train': 6.189252853393555} -09/20/2021 16:48:27 - INFO - __main__ - Step 10711: {'lr': 0.0001784, 'samples': 342752, 'steps': 669, 'loss/train': 6.331375598907471} -09/20/2021 16:48:28 - INFO - __main__ - Step 10712: {'lr': 0.0001784, 'samples': 342784, 'steps': 669, 'loss/train': 4.886335849761963} -09/20/2021 16:48:28 - INFO - __main__ - Step 10713: {'lr': 0.0001784, 'samples': 342816, 'steps': 669, 'loss/train': 2.7683751583099365} -09/20/2021 16:48:29 - INFO - __main__ - Step 10714: {'lr': 0.0001784, 'samples': 342848, 'steps': 669, 'loss/train': 2.275996208190918} -09/20/2021 16:48:30 - INFO - __main__ - Step 10715: {'lr': 0.0001784, 'samples': 342880, 'steps': 669, 'loss/train': 2.490644931793213} -09/20/2021 16:48:31 - INFO - __main__ - Step 10716: {'lr': 0.0001784, 'samples': 342912, 'steps': 669, 'loss/train': 2.294316053390503} -09/20/2021 16:48:31 - INFO - __main__ - Step 10717: {'lr': 0.0001784, 'samples': 342944, 'steps': 669, 'loss/train': 5.478721618652344} -09/20/2021 16:48:32 - INFO - __main__ - Step 10718: {'lr': 0.0001784, 'samples': 342976, 'steps': 669, 'loss/train': 4.265659332275391} -09/20/2021 16:48:33 - INFO - __main__ - Step 10719: {'lr': 0.0001784, 'samples': 343008, 'steps': 669, 'loss/train': 3.5493500232696533} -09/20/2021 16:48:34 - INFO - __main__ - Step 10720: {'lr': 0.0001784, 'samples': 343040, 'steps': 669, 'loss/train': 4.549510955810547} -09/20/2021 16:48:34 - INFO - __main__ - Step 10721: {'lr': 0.00017866666666666668, 'samples': 343072, 'steps': 670, 'loss/train': 3.8756613731384277} -09/20/2021 16:48:35 - INFO - __main__ - Step 10722: {'lr': 0.00017866666666666668, 'samples': 343104, 'steps': 670, 'loss/train': 4.3531904220581055} -09/20/2021 16:48:36 - INFO - __main__ - Step 10723: {'lr': 0.00017866666666666668, 'samples': 343136, 'steps': 670, 'loss/train': 4.434488296508789} -09/20/2021 16:48:37 - INFO - __main__ - Step 10724: {'lr': 0.00017866666666666668, 'samples': 343168, 'steps': 670, 'loss/train': 4.940755844116211} -09/20/2021 16:48:37 - INFO - __main__ - Step 10725: {'lr': 0.00017866666666666668, 'samples': 343200, 'steps': 670, 'loss/train': 4.361424446105957} -09/20/2021 16:48:38 - INFO - __main__ - Step 10726: {'lr': 0.00017866666666666668, 'samples': 343232, 'steps': 670, 'loss/train': 4.421128273010254} -09/20/2021 16:48:39 - INFO - __main__ - Step 10727: {'lr': 0.00017866666666666668, 'samples': 343264, 'steps': 670, 'loss/train': 4.689929962158203} -09/20/2021 16:48:40 - INFO - __main__ - Step 10728: {'lr': 0.00017866666666666668, 'samples': 343296, 'steps': 670, 'loss/train': 3.892058849334717} -09/20/2021 16:48:41 - INFO - __main__ - Step 10729: {'lr': 0.00017866666666666668, 'samples': 343328, 'steps': 670, 'loss/train': 4.531875133514404} -09/20/2021 16:48:41 - INFO - __main__ - Step 10730: {'lr': 0.00017866666666666668, 'samples': 343360, 'steps': 670, 'loss/train': 4.147751808166504} -09/20/2021 16:48:43 - INFO - __main__ - Step 10731: {'lr': 0.00017866666666666668, 'samples': 343392, 'steps': 670, 'loss/train': 4.482996463775635} -09/20/2021 16:48:43 - INFO - __main__ - Step 10732: {'lr': 0.00017866666666666668, 'samples': 343424, 'steps': 670, 'loss/train': 3.843937873840332} -09/20/2021 16:48:44 - INFO - __main__ - Step 10733: {'lr': 0.00017866666666666668, 'samples': 343456, 'steps': 670, 'loss/train': 5.453270435333252} -09/20/2021 16:48:45 - INFO - __main__ - Step 10734: {'lr': 0.00017866666666666668, 'samples': 343488, 'steps': 670, 'loss/train': 3.7883505821228027} -09/20/2021 16:48:46 - INFO - __main__ - Step 10735: {'lr': 0.00017866666666666668, 'samples': 343520, 'steps': 670, 'loss/train': 5.648000240325928} -09/20/2021 16:48:46 - INFO - __main__ - Step 10736: {'lr': 0.00017866666666666668, 'samples': 343552, 'steps': 670, 'loss/train': 4.3765740394592285} -09/20/2021 16:48:47 - INFO - __main__ - Step 10737: {'lr': 0.00017893333333333336, 'samples': 343584, 'steps': 671, 'loss/train': 3.987105131149292} -09/20/2021 16:48:48 - INFO - __main__ - Step 10738: {'lr': 0.00017893333333333336, 'samples': 343616, 'steps': 671, 'loss/train': 4.46692419052124} -09/20/2021 16:48:49 - INFO - __main__ - Step 10739: {'lr': 0.00017893333333333336, 'samples': 343648, 'steps': 671, 'loss/train': 4.051703929901123} -09/20/2021 16:48:49 - INFO - __main__ - Step 10740: {'lr': 0.00017893333333333336, 'samples': 343680, 'steps': 671, 'loss/train': 4.518496513366699} -09/20/2021 16:48:50 - INFO - __main__ - Step 10741: {'lr': 0.00017893333333333336, 'samples': 343712, 'steps': 671, 'loss/train': 4.3723344802856445} -09/20/2021 16:48:51 - INFO - __main__ - Step 10742: {'lr': 0.00017893333333333336, 'samples': 343744, 'steps': 671, 'loss/train': 4.908609390258789} -09/20/2021 16:48:52 - INFO - __main__ - Step 10743: {'lr': 0.00017893333333333336, 'samples': 343776, 'steps': 671, 'loss/train': 4.486223220825195} -09/20/2021 16:48:52 - INFO - __main__ - Step 10744: {'lr': 0.00017893333333333336, 'samples': 343808, 'steps': 671, 'loss/train': 4.798036098480225} -09/20/2021 16:48:53 - INFO - __main__ - Step 10745: {'lr': 0.00017893333333333336, 'samples': 343840, 'steps': 671, 'loss/train': 5.486306190490723} -09/20/2021 16:48:54 - INFO - __main__ - Step 10746: {'lr': 0.00017893333333333336, 'samples': 343872, 'steps': 671, 'loss/train': 3.9221906661987305} -09/20/2021 16:48:55 - INFO - __main__ - Step 10747: {'lr': 0.00017893333333333336, 'samples': 343904, 'steps': 671, 'loss/train': 5.363776683807373} -09/20/2021 16:48:55 - INFO - __main__ - Step 10748: {'lr': 0.00017893333333333336, 'samples': 343936, 'steps': 671, 'loss/train': 1.85971999168396} -09/20/2021 16:48:56 - INFO - __main__ - Step 10749: {'lr': 0.00017893333333333336, 'samples': 343968, 'steps': 671, 'loss/train': 4.240412712097168} -09/20/2021 16:48:57 - INFO - __main__ - Step 10750: {'lr': 0.00017893333333333336, 'samples': 344000, 'steps': 671, 'loss/train': 4.572696208953857} -09/20/2021 16:48:58 - INFO - __main__ - Step 10751: {'lr': 0.00017893333333333336, 'samples': 344032, 'steps': 671, 'loss/train': 3.329005479812622} -09/20/2021 16:48:58 - INFO - __main__ - Step 10752: {'lr': 0.00017893333333333336, 'samples': 344064, 'steps': 671, 'loss/train': 4.161521911621094} -09/20/2021 16:48:59 - INFO - __main__ - Step 10753: {'lr': 0.00017920000000000002, 'samples': 344096, 'steps': 672, 'loss/train': 4.593267917633057} -09/20/2021 16:49:00 - INFO - __main__ - Step 10754: {'lr': 0.00017920000000000002, 'samples': 344128, 'steps': 672, 'loss/train': 4.17971658706665} -09/20/2021 16:49:01 - INFO - __main__ - Step 10755: {'lr': 0.00017920000000000002, 'samples': 344160, 'steps': 672, 'loss/train': 4.229859352111816} -09/20/2021 16:49:02 - INFO - __main__ - Step 10756: {'lr': 0.00017920000000000002, 'samples': 344192, 'steps': 672, 'loss/train': 5.148030757904053} -09/20/2021 16:49:02 - INFO - __main__ - Step 10757: {'lr': 0.00017920000000000002, 'samples': 344224, 'steps': 672, 'loss/train': 4.569922924041748} -09/20/2021 16:49:03 - INFO - __main__ - Step 10758: {'lr': 0.00017920000000000002, 'samples': 344256, 'steps': 672, 'loss/train': 3.051478624343872} -09/20/2021 16:49:04 - INFO - __main__ - Step 10759: {'lr': 0.00017920000000000002, 'samples': 344288, 'steps': 672, 'loss/train': 4.139029502868652} -09/20/2021 16:49:05 - INFO - __main__ - Step 10760: {'lr': 0.00017920000000000002, 'samples': 344320, 'steps': 672, 'loss/train': 4.607849597930908} -09/20/2021 16:49:05 - INFO - __main__ - Step 10761: {'lr': 0.00017920000000000002, 'samples': 344352, 'steps': 672, 'loss/train': 4.645808696746826} -09/20/2021 16:49:06 - INFO - __main__ - Step 10762: {'lr': 0.00017920000000000002, 'samples': 344384, 'steps': 672, 'loss/train': 4.766033172607422} -09/20/2021 16:49:07 - INFO - __main__ - Step 10763: {'lr': 0.00017920000000000002, 'samples': 344416, 'steps': 672, 'loss/train': 5.498807907104492} -09/20/2021 16:49:08 - INFO - __main__ - Step 10764: {'lr': 0.00017920000000000002, 'samples': 344448, 'steps': 672, 'loss/train': 4.590956687927246} -09/20/2021 16:49:09 - INFO - __main__ - Step 10765: {'lr': 0.00017920000000000002, 'samples': 344480, 'steps': 672, 'loss/train': 4.787577152252197} -09/20/2021 16:49:10 - INFO - __main__ - Step 10766: {'lr': 0.00017920000000000002, 'samples': 344512, 'steps': 672, 'loss/train': 5.168051242828369} -09/20/2021 16:49:10 - INFO - __main__ - Step 10767: {'lr': 0.00017920000000000002, 'samples': 344544, 'steps': 672, 'loss/train': 3.67746901512146} -09/20/2021 16:49:11 - INFO - __main__ - Step 10768: {'lr': 0.00017920000000000002, 'samples': 344576, 'steps': 672, 'loss/train': 1.8517704010009766} -09/20/2021 16:49:12 - INFO - __main__ - Step 10769: {'lr': 0.00017946666666666667, 'samples': 344608, 'steps': 673, 'loss/train': 4.062729835510254} -09/20/2021 16:49:13 - INFO - __main__ - Step 10770: {'lr': 0.00017946666666666667, 'samples': 344640, 'steps': 673, 'loss/train': 5.8320722579956055} -09/20/2021 16:49:14 - INFO - __main__ - Step 10771: {'lr': 0.00017946666666666667, 'samples': 344672, 'steps': 673, 'loss/train': 4.7228827476501465} -09/20/2021 16:49:14 - INFO - __main__ - Step 10772: {'lr': 0.00017946666666666667, 'samples': 344704, 'steps': 673, 'loss/train': 4.504336357116699} -09/20/2021 16:49:15 - INFO - __main__ - Step 10773: {'lr': 0.00017946666666666667, 'samples': 344736, 'steps': 673, 'loss/train': 4.527651309967041} -09/20/2021 16:49:16 - INFO - __main__ - Step 10774: {'lr': 0.00017946666666666667, 'samples': 344768, 'steps': 673, 'loss/train': 4.299437999725342} -09/20/2021 16:49:17 - INFO - __main__ - Step 10775: {'lr': 0.00017946666666666667, 'samples': 344800, 'steps': 673, 'loss/train': 4.521568775177002} -09/20/2021 16:49:17 - INFO - __main__ - Step 10776: {'lr': 0.00017946666666666667, 'samples': 344832, 'steps': 673, 'loss/train': 4.510168075561523} -09/20/2021 16:49:18 - INFO - __main__ - Step 10777: {'lr': 0.00017946666666666667, 'samples': 344864, 'steps': 673, 'loss/train': 4.114369869232178} -09/20/2021 16:49:19 - INFO - __main__ - Step 10778: {'lr': 0.00017946666666666667, 'samples': 344896, 'steps': 673, 'loss/train': 3.9431521892547607} -09/20/2021 16:49:20 - INFO - __main__ - Step 10779: {'lr': 0.00017946666666666667, 'samples': 344928, 'steps': 673, 'loss/train': 5.499642372131348} -09/20/2021 16:49:20 - INFO - __main__ - Step 10780: {'lr': 0.00017946666666666667, 'samples': 344960, 'steps': 673, 'loss/train': 4.581426620483398} -09/20/2021 16:49:21 - INFO - __main__ - Step 10781: {'lr': 0.00017946666666666667, 'samples': 344992, 'steps': 673, 'loss/train': 2.6850109100341797} -09/20/2021 16:49:22 - INFO - __main__ - Step 10782: {'lr': 0.00017946666666666667, 'samples': 345024, 'steps': 673, 'loss/train': 3.1432406902313232} -09/20/2021 16:49:23 - INFO - __main__ - Step 10783: {'lr': 0.00017946666666666667, 'samples': 345056, 'steps': 673, 'loss/train': 4.172867774963379} -09/20/2021 16:49:23 - INFO - __main__ - Step 10784: {'lr': 0.00017946666666666667, 'samples': 345088, 'steps': 673, 'loss/train': 3.1248974800109863} -09/20/2021 16:49:24 - INFO - __main__ - Step 10785: {'lr': 0.00017973333333333333, 'samples': 345120, 'steps': 674, 'loss/train': 4.215472221374512} -09/20/2021 16:49:25 - INFO - __main__ - Step 10786: {'lr': 0.00017973333333333333, 'samples': 345152, 'steps': 674, 'loss/train': 3.8090524673461914} -09/20/2021 16:49:26 - INFO - __main__ - Step 10787: {'lr': 0.00017973333333333333, 'samples': 345184, 'steps': 674, 'loss/train': 3.9335246086120605} -09/20/2021 16:49:26 - INFO - __main__ - Step 10788: {'lr': 0.00017973333333333333, 'samples': 345216, 'steps': 674, 'loss/train': 4.720710754394531} -09/20/2021 16:49:27 - INFO - __main__ - Step 10789: {'lr': 0.00017973333333333333, 'samples': 345248, 'steps': 674, 'loss/train': 4.371865272521973} -09/20/2021 16:49:28 - INFO - __main__ - Step 10790: {'lr': 0.00017973333333333333, 'samples': 345280, 'steps': 674, 'loss/train': 3.625518560409546} -09/20/2021 16:49:29 - INFO - __main__ - Step 10791: {'lr': 0.00017973333333333333, 'samples': 345312, 'steps': 674, 'loss/train': 4.4254045486450195} -09/20/2021 16:49:29 - INFO - __main__ - Step 10792: {'lr': 0.00017973333333333333, 'samples': 345344, 'steps': 674, 'loss/train': 4.5244574546813965} -09/20/2021 16:49:30 - INFO - __main__ - Step 10793: {'lr': 0.00017973333333333333, 'samples': 345376, 'steps': 674, 'loss/train': 4.5296478271484375} -09/20/2021 16:49:31 - INFO - __main__ - Step 10794: {'lr': 0.00017973333333333333, 'samples': 345408, 'steps': 674, 'loss/train': 4.368458271026611} -09/20/2021 16:49:32 - INFO - __main__ - Step 10795: {'lr': 0.00017973333333333333, 'samples': 345440, 'steps': 674, 'loss/train': 3.820333242416382} -09/20/2021 16:49:33 - INFO - __main__ - Step 10796: {'lr': 0.00017973333333333333, 'samples': 345472, 'steps': 674, 'loss/train': 4.056308269500732} -09/20/2021 16:49:34 - INFO - __main__ - Step 10797: {'lr': 0.00017973333333333333, 'samples': 345504, 'steps': 674, 'loss/train': 4.77293586730957} -09/20/2021 16:49:34 - INFO - __main__ - Step 10798: {'lr': 0.00017973333333333333, 'samples': 345536, 'steps': 674, 'loss/train': 4.621386528015137} -09/20/2021 16:49:35 - INFO - __main__ - Step 10799: {'lr': 0.00017973333333333333, 'samples': 345568, 'steps': 674, 'loss/train': 4.878896236419678} -09/20/2021 16:49:36 - INFO - __main__ - Step 10800: {'lr': 0.00017973333333333333, 'samples': 345600, 'steps': 674, 'loss/train': 0.9288025498390198} -09/20/2021 16:49:37 - INFO - __main__ - Step 10801: {'lr': 0.00018, 'samples': 345632, 'steps': 675, 'loss/train': 5.343786716461182} -09/20/2021 16:49:38 - INFO - __main__ - Step 10802: {'lr': 0.00018, 'samples': 345664, 'steps': 675, 'loss/train': 5.951689720153809} -09/20/2021 16:49:38 - INFO - __main__ - Step 10803: {'lr': 0.00018, 'samples': 345696, 'steps': 675, 'loss/train': 4.3148112297058105} -09/20/2021 16:49:39 - INFO - __main__ - Step 10804: {'lr': 0.00018, 'samples': 345728, 'steps': 675, 'loss/train': 4.28952693939209} -09/20/2021 16:49:40 - INFO - __main__ - Step 10805: {'lr': 0.00018, 'samples': 345760, 'steps': 675, 'loss/train': 4.552250385284424} -09/20/2021 16:49:41 - INFO - __main__ - Step 10806: {'lr': 0.00018, 'samples': 345792, 'steps': 675, 'loss/train': 5.300316333770752} -09/20/2021 16:49:41 - INFO - __main__ - Step 10807: {'lr': 0.00018, 'samples': 345824, 'steps': 675, 'loss/train': 5.222606658935547} -09/20/2021 16:49:42 - INFO - __main__ - Step 10808: {'lr': 0.00018, 'samples': 345856, 'steps': 675, 'loss/train': 4.6053667068481445} -09/20/2021 16:49:43 - INFO - __main__ - Step 10809: {'lr': 0.00018, 'samples': 345888, 'steps': 675, 'loss/train': 2.4873170852661133} -09/20/2021 16:49:44 - INFO - __main__ - Step 10810: {'lr': 0.00018, 'samples': 345920, 'steps': 675, 'loss/train': 4.987094879150391} -09/20/2021 16:49:44 - INFO - __main__ - Step 10811: {'lr': 0.00018, 'samples': 345952, 'steps': 675, 'loss/train': 4.007360458374023} -09/20/2021 16:49:45 - INFO - __main__ - Step 10812: {'lr': 0.00018, 'samples': 345984, 'steps': 675, 'loss/train': 4.409208297729492} -09/20/2021 16:49:46 - INFO - __main__ - Step 10813: {'lr': 0.00018, 'samples': 346016, 'steps': 675, 'loss/train': 3.1742796897888184} -09/20/2021 16:49:47 - INFO - __main__ - Step 10814: {'lr': 0.00018, 'samples': 346048, 'steps': 675, 'loss/train': 5.124698162078857} -09/20/2021 16:49:47 - INFO - __main__ - Step 10815: {'lr': 0.00018, 'samples': 346080, 'steps': 675, 'loss/train': 3.65160870552063} -09/20/2021 16:49:48 - INFO - __main__ - Step 10816: {'lr': 0.00018, 'samples': 346112, 'steps': 675, 'loss/train': 4.388720989227295} -09/20/2021 16:49:49 - INFO - __main__ - Step 10817: {'lr': 0.00018026666666666667, 'samples': 346144, 'steps': 676, 'loss/train': 4.2657790184021} -09/20/2021 16:49:50 - INFO - __main__ - Step 10818: {'lr': 0.00018026666666666667, 'samples': 346176, 'steps': 676, 'loss/train': 4.551428318023682} -09/20/2021 16:49:51 - INFO - __main__ - Step 10819: {'lr': 0.00018026666666666667, 'samples': 346208, 'steps': 676, 'loss/train': 4.757599830627441} -09/20/2021 16:49:51 - INFO - __main__ - Step 10820: {'lr': 0.00018026666666666667, 'samples': 346240, 'steps': 676, 'loss/train': 4.970279216766357} -09/20/2021 16:49:52 - INFO - __main__ - Step 10821: {'lr': 0.00018026666666666667, 'samples': 346272, 'steps': 676, 'loss/train': 5.479583740234375} -09/20/2021 16:49:53 - INFO - __main__ - Step 10822: {'lr': 0.00018026666666666667, 'samples': 346304, 'steps': 676, 'loss/train': 4.663471698760986} -09/20/2021 16:49:54 - INFO - __main__ - Step 10823: {'lr': 0.00018026666666666667, 'samples': 346336, 'steps': 676, 'loss/train': 4.390904426574707} -09/20/2021 16:49:54 - INFO - __main__ - Step 10824: {'lr': 0.00018026666666666667, 'samples': 346368, 'steps': 676, 'loss/train': 3.751655340194702} -09/20/2021 16:49:55 - INFO - __main__ - Step 10825: {'lr': 0.00018026666666666667, 'samples': 346400, 'steps': 676, 'loss/train': 3.885845422744751} -09/20/2021 16:49:56 - INFO - __main__ - Step 10826: {'lr': 0.00018026666666666667, 'samples': 346432, 'steps': 676, 'loss/train': 3.396193504333496} -09/20/2021 16:49:57 - INFO - __main__ - Step 10827: {'lr': 0.00018026666666666667, 'samples': 346464, 'steps': 676, 'loss/train': 4.326448917388916} -09/20/2021 16:49:58 - INFO - __main__ - Step 10828: {'lr': 0.00018026666666666667, 'samples': 346496, 'steps': 676, 'loss/train': 4.479605197906494} -09/20/2021 16:49:59 - INFO - __main__ - Step 10829: {'lr': 0.00018026666666666667, 'samples': 346528, 'steps': 676, 'loss/train': 2.1313090324401855} -09/20/2021 16:50:00 - INFO - __main__ - Step 10830: {'lr': 0.00018026666666666667, 'samples': 346560, 'steps': 676, 'loss/train': 1.9714666604995728} -09/20/2021 16:50:00 - INFO - __main__ - Step 10831: {'lr': 0.00018026666666666667, 'samples': 346592, 'steps': 676, 'loss/train': 3.1971898078918457} -09/20/2021 16:50:01 - INFO - __main__ - Step 10832: {'lr': 0.00018026666666666667, 'samples': 346624, 'steps': 676, 'loss/train': 1.7801471948623657} -09/20/2021 16:50:02 - INFO - __main__ - Step 10833: {'lr': 0.00018053333333333332, 'samples': 346656, 'steps': 677, 'loss/train': 3.2879486083984375} -09/20/2021 16:50:03 - INFO - __main__ - Step 10834: {'lr': 0.00018053333333333332, 'samples': 346688, 'steps': 677, 'loss/train': 4.495823860168457} -09/20/2021 16:50:03 - INFO - __main__ - Step 10835: {'lr': 0.00018053333333333332, 'samples': 346720, 'steps': 677, 'loss/train': 3.936948776245117} -09/20/2021 16:50:04 - INFO - __main__ - Step 10836: {'lr': 0.00018053333333333332, 'samples': 346752, 'steps': 677, 'loss/train': 4.55739164352417} -09/20/2021 16:50:05 - INFO - __main__ - Step 10837: {'lr': 0.00018053333333333332, 'samples': 346784, 'steps': 677, 'loss/train': 4.224781036376953} -09/20/2021 16:50:06 - INFO - __main__ - Step 10838: {'lr': 0.00018053333333333332, 'samples': 346816, 'steps': 677, 'loss/train': 4.115950584411621} -09/20/2021 16:50:06 - INFO - __main__ - Step 10839: {'lr': 0.00018053333333333332, 'samples': 346848, 'steps': 677, 'loss/train': 5.200076580047607} -09/20/2021 16:50:07 - INFO - __main__ - Step 10840: {'lr': 0.00018053333333333332, 'samples': 346880, 'steps': 677, 'loss/train': 3.757497549057007} -09/20/2021 16:50:08 - INFO - __main__ - Step 10841: {'lr': 0.00018053333333333332, 'samples': 346912, 'steps': 677, 'loss/train': 4.946522235870361} -09/20/2021 16:50:09 - INFO - __main__ - Step 10842: {'lr': 0.00018053333333333332, 'samples': 346944, 'steps': 677, 'loss/train': 4.499200820922852} -09/20/2021 16:50:09 - INFO - __main__ - Step 10843: {'lr': 0.00018053333333333332, 'samples': 346976, 'steps': 677, 'loss/train': 5.57647180557251} -09/20/2021 16:50:10 - INFO - __main__ - Step 10844: {'lr': 0.00018053333333333332, 'samples': 347008, 'steps': 677, 'loss/train': 4.396167278289795} -09/20/2021 16:50:11 - INFO - __main__ - Step 10845: {'lr': 0.00018053333333333332, 'samples': 347040, 'steps': 677, 'loss/train': 3.937542200088501} -09/20/2021 16:50:12 - INFO - __main__ - Step 10846: {'lr': 0.00018053333333333332, 'samples': 347072, 'steps': 677, 'loss/train': 4.304494380950928} -09/20/2021 16:50:12 - INFO - __main__ - Step 10847: {'lr': 0.00018053333333333332, 'samples': 347104, 'steps': 677, 'loss/train': 4.57253360748291} -09/20/2021 16:50:13 - INFO - __main__ - Step 10848: {'lr': 0.00018053333333333332, 'samples': 347136, 'steps': 677, 'loss/train': 4.2254958152771} -09/20/2021 16:50:14 - INFO - __main__ - Step 10849: {'lr': 0.0001808, 'samples': 347168, 'steps': 678, 'loss/train': 4.078309059143066} -09/20/2021 16:50:15 - INFO - __main__ - Step 10850: {'lr': 0.0001808, 'samples': 347200, 'steps': 678, 'loss/train': 4.06155252456665} -09/20/2021 16:50:16 - INFO - __main__ - Step 10851: {'lr': 0.0001808, 'samples': 347232, 'steps': 678, 'loss/train': 4.410572528839111} -09/20/2021 16:50:16 - INFO - __main__ - Step 10852: {'lr': 0.0001808, 'samples': 347264, 'steps': 678, 'loss/train': 4.492618083953857} -09/20/2021 16:50:17 - INFO - __main__ - Step 10853: {'lr': 0.0001808, 'samples': 347296, 'steps': 678, 'loss/train': 4.373283386230469} -09/20/2021 16:50:18 - INFO - __main__ - Step 10854: {'lr': 0.0001808, 'samples': 347328, 'steps': 678, 'loss/train': 3.835913896560669} -09/20/2021 16:50:19 - INFO - __main__ - Step 10855: {'lr': 0.0001808, 'samples': 347360, 'steps': 678, 'loss/train': 4.406978130340576} -09/20/2021 16:50:19 - INFO - __main__ - Step 10856: {'lr': 0.0001808, 'samples': 347392, 'steps': 678, 'loss/train': 4.546807765960693} -09/20/2021 16:50:20 - INFO - __main__ - Step 10857: {'lr': 0.0001808, 'samples': 347424, 'steps': 678, 'loss/train': 4.819818019866943} -09/20/2021 16:50:21 - INFO - __main__ - Step 10858: {'lr': 0.0001808, 'samples': 347456, 'steps': 678, 'loss/train': 4.9457221031188965} -09/20/2021 16:50:22 - INFO - __main__ - Step 10859: {'lr': 0.0001808, 'samples': 347488, 'steps': 678, 'loss/train': 4.1789751052856445} -09/20/2021 16:50:23 - INFO - __main__ - Step 10860: {'lr': 0.0001808, 'samples': 347520, 'steps': 678, 'loss/train': 4.812355995178223} -09/20/2021 16:50:24 - INFO - __main__ - Step 10861: {'lr': 0.0001808, 'samples': 347552, 'steps': 678, 'loss/train': 4.901540756225586} -09/20/2021 16:50:24 - INFO - __main__ - Step 10862: {'lr': 0.0001808, 'samples': 347584, 'steps': 678, 'loss/train': 4.10862398147583} -09/20/2021 16:50:25 - INFO - __main__ - Step 10863: {'lr': 0.0001808, 'samples': 347616, 'steps': 678, 'loss/train': 4.154789447784424} -09/20/2021 16:50:26 - INFO - __main__ - Step 10864: {'lr': 0.0001808, 'samples': 347648, 'steps': 678, 'loss/train': 4.61421012878418} -09/20/2021 16:50:27 - INFO - __main__ - Step 10865: {'lr': 0.00018106666666666669, 'samples': 347680, 'steps': 679, 'loss/train': 3.9017038345336914} -09/20/2021 16:50:27 - INFO - __main__ - Step 10866: {'lr': 0.00018106666666666669, 'samples': 347712, 'steps': 679, 'loss/train': 6.321042537689209} -09/20/2021 16:50:28 - INFO - __main__ - Step 10867: {'lr': 0.00018106666666666669, 'samples': 347744, 'steps': 679, 'loss/train': 4.522170543670654} -09/20/2021 16:50:29 - INFO - __main__ - Step 10868: {'lr': 0.00018106666666666669, 'samples': 347776, 'steps': 679, 'loss/train': 5.460057735443115} -09/20/2021 16:50:30 - INFO - __main__ - Step 10869: {'lr': 0.00018106666666666669, 'samples': 347808, 'steps': 679, 'loss/train': 4.177525997161865} -09/20/2021 16:50:30 - INFO - __main__ - Step 10870: {'lr': 0.00018106666666666669, 'samples': 347840, 'steps': 679, 'loss/train': 4.154599189758301} -09/20/2021 16:50:31 - INFO - __main__ - Step 10871: {'lr': 0.00018106666666666669, 'samples': 347872, 'steps': 679, 'loss/train': 4.227782726287842} -09/20/2021 16:50:32 - INFO - __main__ - Step 10872: {'lr': 0.00018106666666666669, 'samples': 347904, 'steps': 679, 'loss/train': 5.592429161071777} -09/20/2021 16:50:33 - INFO - __main__ - Step 10873: {'lr': 0.00018106666666666669, 'samples': 347936, 'steps': 679, 'loss/train': 5.180152893066406} -09/20/2021 16:50:33 - INFO - __main__ - Step 10874: {'lr': 0.00018106666666666669, 'samples': 347968, 'steps': 679, 'loss/train': 4.332795143127441} -09/20/2021 16:50:34 - INFO - __main__ - Step 10875: {'lr': 0.00018106666666666669, 'samples': 348000, 'steps': 679, 'loss/train': 4.487744331359863} -09/20/2021 16:50:35 - INFO - __main__ - Step 10876: {'lr': 0.00018106666666666669, 'samples': 348032, 'steps': 679, 'loss/train': 2.768172264099121} -09/20/2021 16:50:36 - INFO - __main__ - Step 10877: {'lr': 0.00018106666666666669, 'samples': 348064, 'steps': 679, 'loss/train': 3.669783592224121} -09/20/2021 16:50:36 - INFO - __main__ - Step 10878: {'lr': 0.00018106666666666669, 'samples': 348096, 'steps': 679, 'loss/train': 4.936586380004883} -09/20/2021 16:50:37 - INFO - __main__ - Step 10879: {'lr': 0.00018106666666666669, 'samples': 348128, 'steps': 679, 'loss/train': 4.509798049926758} -09/20/2021 16:50:38 - INFO - __main__ - Step 10880: {'lr': 0.00018106666666666669, 'samples': 348160, 'steps': 679, 'loss/train': 4.673344135284424} -09/20/2021 16:50:39 - INFO - __main__ - Step 10881: {'lr': 0.00018133333333333334, 'samples': 348192, 'steps': 680, 'loss/train': 3.5670881271362305} -09/20/2021 16:50:40 - INFO - __main__ - Step 10882: {'lr': 0.00018133333333333334, 'samples': 348224, 'steps': 680, 'loss/train': 4.719455242156982} -09/20/2021 16:50:40 - INFO - __main__ - Step 10883: {'lr': 0.00018133333333333334, 'samples': 348256, 'steps': 680, 'loss/train': 5.548771381378174} -09/20/2021 16:50:41 - INFO - __main__ - Step 10884: {'lr': 0.00018133333333333334, 'samples': 348288, 'steps': 680, 'loss/train': 3.539553642272949} -09/20/2021 16:50:42 - INFO - __main__ - Step 10885: {'lr': 0.00018133333333333334, 'samples': 348320, 'steps': 680, 'loss/train': 4.153834819793701} -09/20/2021 16:50:43 - INFO - __main__ - Step 10886: {'lr': 0.00018133333333333334, 'samples': 348352, 'steps': 680, 'loss/train': 4.6659955978393555} -09/20/2021 16:50:43 - INFO - __main__ - Step 10887: {'lr': 0.00018133333333333334, 'samples': 348384, 'steps': 680, 'loss/train': 3.3369412422180176} -09/20/2021 16:50:45 - INFO - __main__ - Step 10888: {'lr': 0.00018133333333333334, 'samples': 348416, 'steps': 680, 'loss/train': 3.901648759841919} -09/20/2021 16:50:46 - INFO - __main__ - Step 10889: {'lr': 0.00018133333333333334, 'samples': 348448, 'steps': 680, 'loss/train': 4.508498668670654} -09/20/2021 16:50:47 - INFO - __main__ - Step 10890: {'lr': 0.00018133333333333334, 'samples': 348480, 'steps': 680, 'loss/train': 3.970496416091919} -09/20/2021 16:50:47 - INFO - __main__ - Step 10891: {'lr': 0.00018133333333333334, 'samples': 348512, 'steps': 680, 'loss/train': 4.792495250701904} -09/20/2021 16:50:48 - INFO - __main__ - Step 10892: {'lr': 0.00018133333333333334, 'samples': 348544, 'steps': 680, 'loss/train': 4.655270576477051} -09/20/2021 16:50:49 - INFO - __main__ - Step 10893: {'lr': 0.00018133333333333334, 'samples': 348576, 'steps': 680, 'loss/train': 4.816337585449219} -09/20/2021 16:50:50 - INFO - __main__ - Step 10894: {'lr': 0.00018133333333333334, 'samples': 348608, 'steps': 680, 'loss/train': 4.5707502365112305} -09/20/2021 16:50:50 - INFO - __main__ - Step 10895: {'lr': 0.00018133333333333334, 'samples': 348640, 'steps': 680, 'loss/train': 6.5377197265625} -09/20/2021 16:50:51 - INFO - __main__ - Step 10896: {'lr': 0.00018133333333333334, 'samples': 348672, 'steps': 680, 'loss/train': 4.276993274688721} -09/20/2021 16:50:52 - INFO - __main__ - Step 10897: {'lr': 0.00018160000000000002, 'samples': 348704, 'steps': 681, 'loss/train': 3.785681962966919} -09/20/2021 16:50:53 - INFO - __main__ - Step 10898: {'lr': 0.00018160000000000002, 'samples': 348736, 'steps': 681, 'loss/train': 3.8120126724243164} -09/20/2021 16:50:53 - INFO - __main__ - Step 10899: {'lr': 0.00018160000000000002, 'samples': 348768, 'steps': 681, 'loss/train': 3.7183544635772705} -09/20/2021 16:50:54 - INFO - __main__ - Step 10900: {'lr': 0.00018160000000000002, 'samples': 348800, 'steps': 681, 'loss/train': 4.181933879852295} -09/20/2021 16:50:55 - INFO - __main__ - Step 10901: {'lr': 0.00018160000000000002, 'samples': 348832, 'steps': 681, 'loss/train': 5.262768745422363} -09/20/2021 16:50:56 - INFO - __main__ - Step 10902: {'lr': 0.00018160000000000002, 'samples': 348864, 'steps': 681, 'loss/train': 5.535642147064209} -09/20/2021 16:50:56 - INFO - __main__ - Step 10903: {'lr': 0.00018160000000000002, 'samples': 348896, 'steps': 681, 'loss/train': 5.083432197570801} -09/20/2021 16:50:57 - INFO - __main__ - Step 10904: {'lr': 0.00018160000000000002, 'samples': 348928, 'steps': 681, 'loss/train': 5.368762493133545} -09/20/2021 16:50:58 - INFO - __main__ - Step 10905: {'lr': 0.00018160000000000002, 'samples': 348960, 'steps': 681, 'loss/train': 6.206662178039551} -09/20/2021 16:50:59 - INFO - __main__ - Step 10906: {'lr': 0.00018160000000000002, 'samples': 348992, 'steps': 681, 'loss/train': 6.496585845947266} -09/20/2021 16:50:59 - INFO - __main__ - Step 10907: {'lr': 0.00018160000000000002, 'samples': 349024, 'steps': 681, 'loss/train': 6.745029449462891} -09/20/2021 16:51:00 - INFO - __main__ - Step 10908: {'lr': 0.00018160000000000002, 'samples': 349056, 'steps': 681, 'loss/train': 4.9629034996032715} -09/20/2021 16:51:01 - INFO - __main__ - Step 10909: {'lr': 0.00018160000000000002, 'samples': 349088, 'steps': 681, 'loss/train': 4.6873064041137695} -09/20/2021 16:51:02 - INFO - __main__ - Step 10910: {'lr': 0.00018160000000000002, 'samples': 349120, 'steps': 681, 'loss/train': 2.305853843688965} -09/20/2021 16:51:02 - INFO - __main__ - Step 10911: {'lr': 0.00018160000000000002, 'samples': 349152, 'steps': 681, 'loss/train': 4.7584123611450195} -09/20/2021 16:51:03 - INFO - __main__ - Step 10912: {'lr': 0.00018160000000000002, 'samples': 349184, 'steps': 681, 'loss/train': 4.91589879989624} -09/20/2021 16:51:04 - INFO - __main__ - Step 10913: {'lr': 0.00018186666666666668, 'samples': 349216, 'steps': 682, 'loss/train': 4.978450298309326} -09/20/2021 16:51:05 - INFO - __main__ - Step 10914: {'lr': 0.00018186666666666668, 'samples': 349248, 'steps': 682, 'loss/train': 4.795481204986572} -09/20/2021 16:51:06 - INFO - __main__ - Step 10915: {'lr': 0.00018186666666666668, 'samples': 349280, 'steps': 682, 'loss/train': 4.294610023498535} -09/20/2021 16:51:06 - INFO - __main__ - Step 10916: {'lr': 0.00018186666666666668, 'samples': 349312, 'steps': 682, 'loss/train': 4.292045593261719} -09/20/2021 16:51:07 - INFO - __main__ - Step 10917: {'lr': 0.00018186666666666668, 'samples': 349344, 'steps': 682, 'loss/train': 4.268395900726318} -09/20/2021 16:51:08 - INFO - __main__ - Step 10918: {'lr': 0.00018186666666666668, 'samples': 349376, 'steps': 682, 'loss/train': 5.00375509262085} -09/20/2021 16:51:09 - INFO - __main__ - Step 10919: {'lr': 0.00018186666666666668, 'samples': 349408, 'steps': 682, 'loss/train': 4.163473129272461} -09/20/2021 16:51:10 - INFO - __main__ - Step 10920: {'lr': 0.00018186666666666668, 'samples': 349440, 'steps': 682, 'loss/train': 4.0250163078308105} -09/20/2021 16:51:11 - INFO - __main__ - Step 10921: {'lr': 0.00018186666666666668, 'samples': 349472, 'steps': 682, 'loss/train': 4.26948881149292} -09/20/2021 16:51:11 - INFO - __main__ - Step 10922: {'lr': 0.00018186666666666668, 'samples': 349504, 'steps': 682, 'loss/train': 3.8392648696899414} -09/20/2021 16:51:12 - INFO - __main__ - Step 10923: {'lr': 0.00018186666666666668, 'samples': 349536, 'steps': 682, 'loss/train': 5.307719707489014} -09/20/2021 16:51:13 - INFO - __main__ - Step 10924: {'lr': 0.00018186666666666668, 'samples': 349568, 'steps': 682, 'loss/train': 4.232734203338623} -09/20/2021 16:51:14 - INFO - __main__ - Step 10925: {'lr': 0.00018186666666666668, 'samples': 349600, 'steps': 682, 'loss/train': 5.158954620361328} -09/20/2021 16:51:14 - INFO - __main__ - Step 10926: {'lr': 0.00018186666666666668, 'samples': 349632, 'steps': 682, 'loss/train': 6.3218560218811035} -09/20/2021 16:51:15 - INFO - __main__ - Step 10927: {'lr': 0.00018186666666666668, 'samples': 349664, 'steps': 682, 'loss/train': 4.577366352081299} -09/20/2021 16:51:16 - INFO - __main__ - Step 10928: {'lr': 0.00018186666666666668, 'samples': 349696, 'steps': 682, 'loss/train': 5.467546463012695} -09/20/2021 16:51:17 - INFO - __main__ - Step 10929: {'lr': 0.00018213333333333333, 'samples': 349728, 'steps': 683, 'loss/train': 4.83486795425415} -09/20/2021 16:51:17 - INFO - __main__ - Step 10930: {'lr': 0.00018213333333333333, 'samples': 349760, 'steps': 683, 'loss/train': 4.444235801696777} -09/20/2021 16:51:18 - INFO - __main__ - Step 10931: {'lr': 0.00018213333333333333, 'samples': 349792, 'steps': 683, 'loss/train': 4.001070976257324} -09/20/2021 16:51:19 - INFO - __main__ - Step 10932: {'lr': 0.00018213333333333333, 'samples': 349824, 'steps': 683, 'loss/train': 5.106433391571045} -09/20/2021 16:51:20 - INFO - __main__ - Step 10933: {'lr': 0.00018213333333333333, 'samples': 349856, 'steps': 683, 'loss/train': 3.8872931003570557} -09/20/2021 16:51:20 - INFO - __main__ - Step 10934: {'lr': 0.00018213333333333333, 'samples': 349888, 'steps': 683, 'loss/train': 4.442902088165283} -09/20/2021 16:51:21 - INFO - __main__ - Step 10935: {'lr': 0.00018213333333333333, 'samples': 349920, 'steps': 683, 'loss/train': 5.6085381507873535} -09/20/2021 16:51:22 - INFO - __main__ - Step 10936: {'lr': 0.00018213333333333333, 'samples': 349952, 'steps': 683, 'loss/train': 4.5260396003723145} -09/20/2021 16:51:23 - INFO - __main__ - Step 10937: {'lr': 0.00018213333333333333, 'samples': 349984, 'steps': 683, 'loss/train': 4.893665313720703} -09/20/2021 16:51:23 - INFO - __main__ - Step 10938: {'lr': 0.00018213333333333333, 'samples': 350016, 'steps': 683, 'loss/train': 4.2945556640625} -09/20/2021 16:51:24 - INFO - __main__ - Step 10939: {'lr': 0.00018213333333333333, 'samples': 350048, 'steps': 683, 'loss/train': 4.326089859008789} -09/20/2021 16:51:25 - INFO - __main__ - Step 10940: {'lr': 0.00018213333333333333, 'samples': 350080, 'steps': 683, 'loss/train': 4.088235855102539} -09/20/2021 16:51:26 - INFO - __main__ - Step 10941: {'lr': 0.00018213333333333333, 'samples': 350112, 'steps': 683, 'loss/train': 4.376861572265625} -09/20/2021 16:51:26 - INFO - __main__ - Step 10942: {'lr': 0.00018213333333333333, 'samples': 350144, 'steps': 683, 'loss/train': 4.209083080291748} -09/20/2021 16:51:27 - INFO - __main__ - Step 10943: {'lr': 0.00018213333333333333, 'samples': 350176, 'steps': 683, 'loss/train': 4.742677211761475} -09/20/2021 16:51:28 - INFO - __main__ - Step 10944: {'lr': 0.00018213333333333333, 'samples': 350208, 'steps': 683, 'loss/train': 4.201920509338379} -09/20/2021 16:51:29 - INFO - __main__ - Step 10945: {'lr': 0.00018240000000000002, 'samples': 350240, 'steps': 684, 'loss/train': 4.945565700531006} -09/20/2021 16:51:30 - INFO - __main__ - Step 10946: {'lr': 0.00018240000000000002, 'samples': 350272, 'steps': 684, 'loss/train': 4.528669834136963} -09/20/2021 16:51:30 - INFO - __main__ - Step 10947: {'lr': 0.00018240000000000002, 'samples': 350304, 'steps': 684, 'loss/train': 4.693422317504883} -09/20/2021 16:51:31 - INFO - __main__ - Step 10948: {'lr': 0.00018240000000000002, 'samples': 350336, 'steps': 684, 'loss/train': 3.980787992477417} -09/20/2021 16:51:32 - INFO - __main__ - Step 10949: {'lr': 0.00018240000000000002, 'samples': 350368, 'steps': 684, 'loss/train': 4.399478912353516} -09/20/2021 16:51:33 - INFO - __main__ - Step 10950: {'lr': 0.00018240000000000002, 'samples': 350400, 'steps': 684, 'loss/train': 4.598125457763672} -09/20/2021 16:51:34 - INFO - __main__ - Step 10951: {'lr': 0.00018240000000000002, 'samples': 350432, 'steps': 684, 'loss/train': 4.714125156402588} -09/20/2021 16:51:35 - INFO - __main__ - Step 10952: {'lr': 0.00018240000000000002, 'samples': 350464, 'steps': 684, 'loss/train': 4.3820343017578125} -09/20/2021 16:51:35 - INFO - __main__ - Step 10953: {'lr': 0.00018240000000000002, 'samples': 350496, 'steps': 684, 'loss/train': 4.4825568199157715} -09/20/2021 16:51:36 - INFO - __main__ - Step 10954: {'lr': 0.00018240000000000002, 'samples': 350528, 'steps': 684, 'loss/train': 3.525393009185791} -09/20/2021 16:51:37 - INFO - __main__ - Step 10955: {'lr': 0.00018240000000000002, 'samples': 350560, 'steps': 684, 'loss/train': 5.935513496398926} -09/20/2021 16:51:38 - INFO - __main__ - Step 10956: {'lr': 0.00018240000000000002, 'samples': 350592, 'steps': 684, 'loss/train': 6.040468692779541} -09/20/2021 16:51:38 - INFO - __main__ - Step 10957: {'lr': 0.00018240000000000002, 'samples': 350624, 'steps': 684, 'loss/train': 4.799202919006348} -09/20/2021 16:51:39 - INFO - __main__ - Step 10958: {'lr': 0.00018240000000000002, 'samples': 350656, 'steps': 684, 'loss/train': 3.9262781143188477} -09/20/2021 16:51:40 - INFO - __main__ - Step 10959: {'lr': 0.00018240000000000002, 'samples': 350688, 'steps': 684, 'loss/train': 4.049635410308838} -09/20/2021 16:51:41 - INFO - __main__ - Step 10960: {'lr': 0.00018240000000000002, 'samples': 350720, 'steps': 684, 'loss/train': 5.052242279052734} -09/20/2021 16:51:41 - INFO - __main__ - Step 10961: {'lr': 0.00018266666666666667, 'samples': 350752, 'steps': 685, 'loss/train': 4.823923587799072} -09/20/2021 16:51:42 - INFO - __main__ - Step 10962: {'lr': 0.00018266666666666667, 'samples': 350784, 'steps': 685, 'loss/train': 3.960401773452759} -09/20/2021 16:51:43 - INFO - __main__ - Step 10963: {'lr': 0.00018266666666666667, 'samples': 350816, 'steps': 685, 'loss/train': 3.832875967025757} -09/20/2021 16:51:44 - INFO - __main__ - Step 10964: {'lr': 0.00018266666666666667, 'samples': 350848, 'steps': 685, 'loss/train': 4.647024154663086} -09/20/2021 16:51:44 - INFO - __main__ - Step 10965: {'lr': 0.00018266666666666667, 'samples': 350880, 'steps': 685, 'loss/train': 3.7124550342559814} -09/20/2021 16:51:45 - INFO - __main__ - Step 10966: {'lr': 0.00018266666666666667, 'samples': 350912, 'steps': 685, 'loss/train': 1.6957253217697144} -09/20/2021 16:51:46 - INFO - __main__ - Step 10967: {'lr': 0.00018266666666666667, 'samples': 350944, 'steps': 685, 'loss/train': 2.8206377029418945} -09/20/2021 16:51:47 - INFO - __main__ - Step 10968: {'lr': 0.00018266666666666667, 'samples': 350976, 'steps': 685, 'loss/train': 3.987022876739502} -09/20/2021 16:51:47 - INFO - __main__ - Step 10969: {'lr': 0.00018266666666666667, 'samples': 351008, 'steps': 685, 'loss/train': 4.234043121337891} -09/20/2021 16:51:48 - INFO - __main__ - Step 10970: {'lr': 0.00018266666666666667, 'samples': 351040, 'steps': 685, 'loss/train': 4.303547382354736} -09/20/2021 16:51:49 - INFO - __main__ - Step 10971: {'lr': 0.00018266666666666667, 'samples': 351072, 'steps': 685, 'loss/train': 4.144259452819824} -09/20/2021 16:51:50 - INFO - __main__ - Step 10972: {'lr': 0.00018266666666666667, 'samples': 351104, 'steps': 685, 'loss/train': 4.0468831062316895} -09/20/2021 16:51:50 - INFO - __main__ - Step 10973: {'lr': 0.00018266666666666667, 'samples': 351136, 'steps': 685, 'loss/train': 4.880460739135742} -09/20/2021 16:51:51 - INFO - __main__ - Step 10974: {'lr': 0.00018266666666666667, 'samples': 351168, 'steps': 685, 'loss/train': 3.8500068187713623} -09/20/2021 16:51:52 - INFO - __main__ - Step 10975: {'lr': 0.00018266666666666667, 'samples': 351200, 'steps': 685, 'loss/train': 4.263260364532471} -09/20/2021 16:51:53 - INFO - __main__ - Step 10976: {'lr': 0.00018266666666666667, 'samples': 351232, 'steps': 685, 'loss/train': 4.140552520751953} -09/20/2021 16:51:54 - INFO - __main__ - Step 10977: {'lr': 0.00018293333333333333, 'samples': 351264, 'steps': 686, 'loss/train': 5.571901798248291} -09/20/2021 16:51:54 - INFO - __main__ - Step 10978: {'lr': 0.00018293333333333333, 'samples': 351296, 'steps': 686, 'loss/train': 3.7569050788879395} -09/20/2021 16:51:55 - INFO - __main__ - Step 10979: {'lr': 0.00018293333333333333, 'samples': 351328, 'steps': 686, 'loss/train': 4.977989673614502} -09/20/2021 16:51:57 - INFO - __main__ - Step 10980: {'lr': 0.00018293333333333333, 'samples': 351360, 'steps': 686, 'loss/train': 4.639523983001709} -09/20/2021 16:51:58 - INFO - __main__ - Step 10981: {'lr': 0.00018293333333333333, 'samples': 351392, 'steps': 686, 'loss/train': 3.4360716342926025} -09/20/2021 16:51:58 - INFO - __main__ - Step 10982: {'lr': 0.00018293333333333333, 'samples': 351424, 'steps': 686, 'loss/train': 4.721436023712158} -09/20/2021 16:51:59 - INFO - __main__ - Step 10983: {'lr': 0.00018293333333333333, 'samples': 351456, 'steps': 686, 'loss/train': 4.382144927978516} -09/20/2021 16:52:00 - INFO - __main__ - Step 10984: {'lr': 0.00018293333333333333, 'samples': 351488, 'steps': 686, 'loss/train': 6.199126243591309} -09/20/2021 16:52:01 - INFO - __main__ - Step 10985: {'lr': 0.00018293333333333333, 'samples': 351520, 'steps': 686, 'loss/train': 3.907444477081299} -09/20/2021 16:52:01 - INFO - __main__ - Step 10986: {'lr': 0.00018293333333333333, 'samples': 351552, 'steps': 686, 'loss/train': 3.6923558712005615} -09/20/2021 16:52:02 - INFO - __main__ - Step 10987: {'lr': 0.00018293333333333333, 'samples': 351584, 'steps': 686, 'loss/train': 5.08538818359375} -09/20/2021 16:52:03 - INFO - __main__ - Step 10988: {'lr': 0.00018293333333333333, 'samples': 351616, 'steps': 686, 'loss/train': 4.551494598388672} -09/20/2021 16:52:04 - INFO - __main__ - Step 10989: {'lr': 0.00018293333333333333, 'samples': 351648, 'steps': 686, 'loss/train': 5.866156578063965} -09/20/2021 16:52:04 - INFO - __main__ - Step 10990: {'lr': 0.00018293333333333333, 'samples': 351680, 'steps': 686, 'loss/train': 4.437488079071045} -09/20/2021 16:52:05 - INFO - __main__ - Step 10991: {'lr': 0.00018293333333333333, 'samples': 351712, 'steps': 686, 'loss/train': 5.075619220733643} -09/20/2021 16:52:06 - INFO - __main__ - Step 10992: {'lr': 0.00018293333333333333, 'samples': 351744, 'steps': 686, 'loss/train': 4.399689674377441} -09/20/2021 16:52:07 - INFO - __main__ - Step 10993: {'lr': 0.0001832, 'samples': 351776, 'steps': 687, 'loss/train': 4.341544151306152} -09/20/2021 16:52:07 - INFO - __main__ - Step 10994: {'lr': 0.0001832, 'samples': 351808, 'steps': 687, 'loss/train': 4.583425521850586} -09/20/2021 16:52:08 - INFO - __main__ - Step 10995: {'lr': 0.0001832, 'samples': 351840, 'steps': 687, 'loss/train': 4.826277732849121} -09/20/2021 16:52:09 - INFO - __main__ - Step 10996: {'lr': 0.0001832, 'samples': 351872, 'steps': 687, 'loss/train': 4.326051712036133} -09/20/2021 16:52:10 - INFO - __main__ - Step 10997: {'lr': 0.0001832, 'samples': 351904, 'steps': 687, 'loss/train': 2.1512558460235596} -09/20/2021 16:52:10 - INFO - __main__ - Step 10998: {'lr': 0.0001832, 'samples': 351936, 'steps': 687, 'loss/train': 4.432768821716309} -09/20/2021 16:52:11 - INFO - __main__ - Step 10999: {'lr': 0.0001832, 'samples': 351968, 'steps': 687, 'loss/train': 4.305235862731934} -09/20/2021 16:52:12 - INFO - __main__ - Step 11000: {'lr': 0.0001832, 'samples': 352000, 'steps': 687, 'loss/train': 6.895567893981934} -09/20/2021 16:52:13 - INFO - __main__ - Step 11001: {'lr': 0.0001832, 'samples': 352032, 'steps': 687, 'loss/train': 4.081051826477051} -09/20/2021 16:52:13 - INFO - __main__ - Step 11002: {'lr': 0.0001832, 'samples': 352064, 'steps': 687, 'loss/train': 4.22404146194458} -09/20/2021 16:52:14 - INFO - __main__ - Step 11003: {'lr': 0.0001832, 'samples': 352096, 'steps': 687, 'loss/train': 3.48587703704834} -09/20/2021 16:52:15 - INFO - __main__ - Step 11004: {'lr': 0.0001832, 'samples': 352128, 'steps': 687, 'loss/train': 6.440478324890137} -09/20/2021 16:52:16 - INFO - __main__ - Step 11005: {'lr': 0.0001832, 'samples': 352160, 'steps': 687, 'loss/train': 3.751420021057129} -09/20/2021 16:52:16 - INFO - __main__ - Step 11006: {'lr': 0.0001832, 'samples': 352192, 'steps': 687, 'loss/train': 4.319115161895752} -09/20/2021 16:52:17 - INFO - __main__ - Step 11007: {'lr': 0.0001832, 'samples': 352224, 'steps': 687, 'loss/train': 4.425450325012207} -09/20/2021 16:52:18 - INFO - __main__ - Step 11008: {'lr': 0.0001832, 'samples': 352256, 'steps': 687, 'loss/train': 4.122127532958984} -09/20/2021 16:52:19 - INFO - __main__ - Step 11009: {'lr': 0.00018346666666666666, 'samples': 352288, 'steps': 688, 'loss/train': 3.747483968734741} -09/20/2021 16:52:20 - INFO - __main__ - Step 11010: {'lr': 0.00018346666666666666, 'samples': 352320, 'steps': 688, 'loss/train': 3.9915356636047363} -09/20/2021 16:52:21 - INFO - __main__ - Step 11011: {'lr': 0.00018346666666666666, 'samples': 352352, 'steps': 688, 'loss/train': 4.477544784545898} -09/20/2021 16:52:22 - INFO - __main__ - Step 11012: {'lr': 0.00018346666666666666, 'samples': 352384, 'steps': 688, 'loss/train': 4.324519157409668} -09/20/2021 16:52:23 - INFO - __main__ - Step 11013: {'lr': 0.00018346666666666666, 'samples': 352416, 'steps': 688, 'loss/train': 4.519750118255615} -09/20/2021 16:52:23 - INFO - __main__ - Step 11014: {'lr': 0.00018346666666666666, 'samples': 352448, 'steps': 688, 'loss/train': 4.700618743896484} -09/20/2021 16:52:24 - INFO - __main__ - Step 11015: {'lr': 0.00018346666666666666, 'samples': 352480, 'steps': 688, 'loss/train': 5.808730125427246} -09/20/2021 16:52:25 - INFO - __main__ - Step 11016: {'lr': 0.00018346666666666666, 'samples': 352512, 'steps': 688, 'loss/train': 4.961874961853027} -09/20/2021 16:52:26 - INFO - __main__ - Step 11017: {'lr': 0.00018346666666666666, 'samples': 352544, 'steps': 688, 'loss/train': 4.300730228424072} -09/20/2021 16:52:26 - INFO - __main__ - Step 11018: {'lr': 0.00018346666666666666, 'samples': 352576, 'steps': 688, 'loss/train': 5.114593029022217} -09/20/2021 16:52:27 - INFO - __main__ - Step 11019: {'lr': 0.00018346666666666666, 'samples': 352608, 'steps': 688, 'loss/train': 3.0324127674102783} -09/20/2021 16:52:28 - INFO - __main__ - Step 11020: {'lr': 0.00018346666666666666, 'samples': 352640, 'steps': 688, 'loss/train': 2.1365363597869873} -09/20/2021 16:52:29 - INFO - __main__ - Step 11021: {'lr': 0.00018346666666666666, 'samples': 352672, 'steps': 688, 'loss/train': 1.9687604904174805} -09/20/2021 16:52:29 - INFO - __main__ - Step 11022: {'lr': 0.00018346666666666666, 'samples': 352704, 'steps': 688, 'loss/train': 2.504607915878296} -09/20/2021 16:52:30 - INFO - __main__ - Step 11023: {'lr': 0.00018346666666666666, 'samples': 352736, 'steps': 688, 'loss/train': 2.0464136600494385} -09/20/2021 16:52:31 - INFO - __main__ - Step 11024: {'lr': 0.00018346666666666666, 'samples': 352768, 'steps': 688, 'loss/train': 4.679162979125977} -09/20/2021 16:52:32 - INFO - __main__ - Step 11025: {'lr': 0.00018373333333333335, 'samples': 352800, 'steps': 689, 'loss/train': 3.9775900840759277} -09/20/2021 16:52:33 - INFO - __main__ - Step 11026: {'lr': 0.00018373333333333335, 'samples': 352832, 'steps': 689, 'loss/train': 4.520700931549072} -09/20/2021 16:52:33 - INFO - __main__ - Step 11027: {'lr': 0.00018373333333333335, 'samples': 352864, 'steps': 689, 'loss/train': 4.246415138244629} -09/20/2021 16:52:34 - INFO - __main__ - Step 11028: {'lr': 0.00018373333333333335, 'samples': 352896, 'steps': 689, 'loss/train': 4.306687831878662} -09/20/2021 16:52:35 - INFO - __main__ - Step 11029: {'lr': 0.00018373333333333335, 'samples': 352928, 'steps': 689, 'loss/train': 3.941751718521118} -09/20/2021 16:52:36 - INFO - __main__ - Step 11030: {'lr': 0.00018373333333333335, 'samples': 352960, 'steps': 689, 'loss/train': 4.303613662719727} -09/20/2021 16:52:36 - INFO - __main__ - Step 11031: {'lr': 0.00018373333333333335, 'samples': 352992, 'steps': 689, 'loss/train': 4.209549903869629} -09/20/2021 16:52:37 - INFO - __main__ - Step 11032: {'lr': 0.00018373333333333335, 'samples': 353024, 'steps': 689, 'loss/train': 3.66066312789917} -09/20/2021 16:52:38 - INFO - __main__ - Step 11033: {'lr': 0.00018373333333333335, 'samples': 353056, 'steps': 689, 'loss/train': 4.390666484832764} -09/20/2021 16:52:39 - INFO - __main__ - Step 11034: {'lr': 0.00018373333333333335, 'samples': 353088, 'steps': 689, 'loss/train': 3.6366019248962402} -09/20/2021 16:52:39 - INFO - __main__ - Step 11035: {'lr': 0.00018373333333333335, 'samples': 353120, 'steps': 689, 'loss/train': 4.066492557525635} -09/20/2021 16:52:40 - INFO - __main__ - Step 11036: {'lr': 0.00018373333333333335, 'samples': 353152, 'steps': 689, 'loss/train': 4.508783340454102} -09/20/2021 16:52:41 - INFO - __main__ - Step 11037: {'lr': 0.00018373333333333335, 'samples': 353184, 'steps': 689, 'loss/train': 3.6137115955352783} -09/20/2021 16:52:42 - INFO - __main__ - Step 11038: {'lr': 0.00018373333333333335, 'samples': 353216, 'steps': 689, 'loss/train': 4.494476795196533} -09/20/2021 16:52:42 - INFO - __main__ - Step 11039: {'lr': 0.00018373333333333335, 'samples': 353248, 'steps': 689, 'loss/train': 4.684318542480469} -09/20/2021 16:52:43 - INFO - __main__ - Step 11040: {'lr': 0.00018373333333333335, 'samples': 353280, 'steps': 689, 'loss/train': 4.334941864013672} -09/20/2021 16:52:45 - INFO - __main__ - Step 11041: {'lr': 0.00018400000000000003, 'samples': 353312, 'steps': 690, 'loss/train': 3.669055223464966} -09/20/2021 16:52:45 - INFO - __main__ - Step 11042: {'lr': 0.00018400000000000003, 'samples': 353344, 'steps': 690, 'loss/train': 1.7705193758010864} -09/20/2021 16:52:46 - INFO - __main__ - Step 11043: {'lr': 0.00018400000000000003, 'samples': 353376, 'steps': 690, 'loss/train': 4.207993984222412} -09/20/2021 16:52:47 - INFO - __main__ - Step 11044: {'lr': 0.00018400000000000003, 'samples': 353408, 'steps': 690, 'loss/train': 5.288417339324951} -09/20/2021 16:52:48 - INFO - __main__ - Step 11045: {'lr': 0.00018400000000000003, 'samples': 353440, 'steps': 690, 'loss/train': 5.042601108551025} -09/20/2021 16:52:48 - INFO - __main__ - Step 11046: {'lr': 0.00018400000000000003, 'samples': 353472, 'steps': 690, 'loss/train': 4.6073150634765625} -09/20/2021 16:52:49 - INFO - __main__ - Step 11047: {'lr': 0.00018400000000000003, 'samples': 353504, 'steps': 690, 'loss/train': 3.767268657684326} -09/20/2021 16:52:50 - INFO - __main__ - Step 11048: {'lr': 0.00018400000000000003, 'samples': 353536, 'steps': 690, 'loss/train': 4.105034351348877} -09/20/2021 16:52:51 - INFO - __main__ - Step 11049: {'lr': 0.00018400000000000003, 'samples': 353568, 'steps': 690, 'loss/train': 4.210188865661621} -09/20/2021 16:52:51 - INFO - __main__ - Step 11050: {'lr': 0.00018400000000000003, 'samples': 353600, 'steps': 690, 'loss/train': 4.482959747314453} -09/20/2021 16:52:52 - INFO - __main__ - Step 11051: {'lr': 0.00018400000000000003, 'samples': 353632, 'steps': 690, 'loss/train': 4.031498432159424} -09/20/2021 16:52:53 - INFO - __main__ - Step 11052: {'lr': 0.00018400000000000003, 'samples': 353664, 'steps': 690, 'loss/train': 4.039671421051025} -09/20/2021 16:52:54 - INFO - __main__ - Step 11053: {'lr': 0.00018400000000000003, 'samples': 353696, 'steps': 690, 'loss/train': 3.8835794925689697} -09/20/2021 16:52:54 - INFO - __main__ - Step 11054: {'lr': 0.00018400000000000003, 'samples': 353728, 'steps': 690, 'loss/train': 3.645784378051758} -09/20/2021 16:52:55 - INFO - __main__ - Step 11055: {'lr': 0.00018400000000000003, 'samples': 353760, 'steps': 690, 'loss/train': 4.090284824371338} -09/20/2021 16:52:56 - INFO - __main__ - Step 11056: {'lr': 0.00018400000000000003, 'samples': 353792, 'steps': 690, 'loss/train': 4.755816459655762} -09/20/2021 16:52:57 - INFO - __main__ - Step 11057: {'lr': 0.00018426666666666668, 'samples': 353824, 'steps': 691, 'loss/train': 3.9969844818115234} -09/20/2021 16:52:58 - INFO - __main__ - Step 11058: {'lr': 0.00018426666666666668, 'samples': 353856, 'steps': 691, 'loss/train': 5.2442121505737305} -09/20/2021 16:52:58 - INFO - __main__ - Step 11059: {'lr': 0.00018426666666666668, 'samples': 353888, 'steps': 691, 'loss/train': 3.796799421310425} -09/20/2021 16:52:59 - INFO - __main__ - Step 11060: {'lr': 0.00018426666666666668, 'samples': 353920, 'steps': 691, 'loss/train': 4.76046895980835} -09/20/2021 16:53:00 - INFO - __main__ - Step 11061: {'lr': 0.00018426666666666668, 'samples': 353952, 'steps': 691, 'loss/train': 6.054234981536865} -09/20/2021 16:53:01 - INFO - __main__ - Step 11062: {'lr': 0.00018426666666666668, 'samples': 353984, 'steps': 691, 'loss/train': 4.254875183105469} -09/20/2021 16:53:01 - INFO - __main__ - Step 11063: {'lr': 0.00018426666666666668, 'samples': 354016, 'steps': 691, 'loss/train': 5.293246269226074} -09/20/2021 16:53:02 - INFO - __main__ - Step 11064: {'lr': 0.00018426666666666668, 'samples': 354048, 'steps': 691, 'loss/train': 5.131263256072998} -09/20/2021 16:53:03 - INFO - __main__ - Step 11065: {'lr': 0.00018426666666666668, 'samples': 354080, 'steps': 691, 'loss/train': 4.050186634063721} -09/20/2021 16:53:04 - INFO - __main__ - Step 11066: {'lr': 0.00018426666666666668, 'samples': 354112, 'steps': 691, 'loss/train': 4.142632961273193} -09/20/2021 16:53:04 - INFO - __main__ - Step 11067: {'lr': 0.00018426666666666668, 'samples': 354144, 'steps': 691, 'loss/train': 5.675346851348877} -09/20/2021 16:53:05 - INFO - __main__ - Step 11068: {'lr': 0.00018426666666666668, 'samples': 354176, 'steps': 691, 'loss/train': 4.173637390136719} -09/20/2021 16:53:06 - INFO - __main__ - Step 11069: {'lr': 0.00018426666666666668, 'samples': 354208, 'steps': 691, 'loss/train': 4.366824150085449} -09/20/2021 16:53:07 - INFO - __main__ - Step 11070: {'lr': 0.00018426666666666668, 'samples': 354240, 'steps': 691, 'loss/train': 3.9301023483276367} -09/20/2021 16:53:07 - INFO - __main__ - Step 11071: {'lr': 0.00018426666666666668, 'samples': 354272, 'steps': 691, 'loss/train': 3.2871170043945312} -09/20/2021 16:53:09 - INFO - __main__ - Step 11072: {'lr': 0.00018426666666666668, 'samples': 354304, 'steps': 691, 'loss/train': 3.8174023628234863} -09/20/2021 16:53:09 - INFO - __main__ - Step 11073: {'lr': 0.00018453333333333334, 'samples': 354336, 'steps': 692, 'loss/train': 4.517948627471924} -09/20/2021 16:53:10 - INFO - __main__ - Step 11074: {'lr': 0.00018453333333333334, 'samples': 354368, 'steps': 692, 'loss/train': 4.215946674346924} -09/20/2021 16:53:11 - INFO - __main__ - Step 11075: {'lr': 0.00018453333333333334, 'samples': 354400, 'steps': 692, 'loss/train': 4.587474822998047} -09/20/2021 16:53:12 - INFO - __main__ - Step 11076: {'lr': 0.00018453333333333334, 'samples': 354432, 'steps': 692, 'loss/train': 4.004622936248779} -09/20/2021 16:53:12 - INFO - __main__ - Step 11077: {'lr': 0.00018453333333333334, 'samples': 354464, 'steps': 692, 'loss/train': 4.080695152282715} -09/20/2021 16:53:13 - INFO - __main__ - Step 11078: {'lr': 0.00018453333333333334, 'samples': 354496, 'steps': 692, 'loss/train': 4.271389961242676} -09/20/2021 16:53:14 - INFO - __main__ - Step 11079: {'lr': 0.00018453333333333334, 'samples': 354528, 'steps': 692, 'loss/train': 4.404866695404053} -09/20/2021 16:53:15 - INFO - __main__ - Step 11080: {'lr': 0.00018453333333333334, 'samples': 354560, 'steps': 692, 'loss/train': 3.884547472000122} -09/20/2021 16:53:15 - INFO - __main__ - Step 11081: {'lr': 0.00018453333333333334, 'samples': 354592, 'steps': 692, 'loss/train': 4.217467784881592} -09/20/2021 16:53:16 - INFO - __main__ - Step 11082: {'lr': 0.00018453333333333334, 'samples': 354624, 'steps': 692, 'loss/train': 4.033894062042236} -09/20/2021 16:53:17 - INFO - __main__ - Step 11083: {'lr': 0.00018453333333333334, 'samples': 354656, 'steps': 692, 'loss/train': 5.154455661773682} -09/20/2021 16:53:18 - INFO - __main__ - Step 11084: {'lr': 0.00018453333333333334, 'samples': 354688, 'steps': 692, 'loss/train': 5.70654821395874} -09/20/2021 16:53:18 - INFO - __main__ - Step 11085: {'lr': 0.00018453333333333334, 'samples': 354720, 'steps': 692, 'loss/train': 3.6775689125061035} -09/20/2021 16:53:19 - INFO - __main__ - Step 11086: {'lr': 0.00018453333333333334, 'samples': 354752, 'steps': 692, 'loss/train': 3.1009864807128906} -09/20/2021 16:53:20 - INFO - __main__ - Step 11087: {'lr': 0.00018453333333333334, 'samples': 354784, 'steps': 692, 'loss/train': 4.694949626922607} -09/20/2021 16:53:21 - INFO - __main__ - Step 11088: {'lr': 0.00018453333333333334, 'samples': 354816, 'steps': 692, 'loss/train': 4.22764253616333} -09/20/2021 16:53:22 - INFO - __main__ - Step 11089: {'lr': 0.00018480000000000002, 'samples': 354848, 'steps': 693, 'loss/train': 4.381032466888428} -09/20/2021 16:53:22 - INFO - __main__ - Step 11090: {'lr': 0.00018480000000000002, 'samples': 354880, 'steps': 693, 'loss/train': 3.896592617034912} -09/20/2021 16:53:23 - INFO - __main__ - Step 11091: {'lr': 0.00018480000000000002, 'samples': 354912, 'steps': 693, 'loss/train': 4.3562541007995605} -09/20/2021 16:53:24 - INFO - __main__ - Step 11092: {'lr': 0.00018480000000000002, 'samples': 354944, 'steps': 693, 'loss/train': 3.5842092037200928} -09/20/2021 16:53:25 - INFO - __main__ - Step 11093: {'lr': 0.00018480000000000002, 'samples': 354976, 'steps': 693, 'loss/train': 4.400552749633789} -09/20/2021 16:53:25 - INFO - __main__ - Step 11094: {'lr': 0.00018480000000000002, 'samples': 355008, 'steps': 693, 'loss/train': 3.3354146480560303} -09/20/2021 16:53:26 - INFO - __main__ - Step 11095: {'lr': 0.00018480000000000002, 'samples': 355040, 'steps': 693, 'loss/train': 4.288604259490967} -09/20/2021 16:53:27 - INFO - __main__ - Step 11096: {'lr': 0.00018480000000000002, 'samples': 355072, 'steps': 693, 'loss/train': 3.821202278137207} -09/20/2021 16:53:28 - INFO - __main__ - Step 11097: {'lr': 0.00018480000000000002, 'samples': 355104, 'steps': 693, 'loss/train': 4.344983100891113} -09/20/2021 16:53:28 - INFO - __main__ - Step 11098: {'lr': 0.00018480000000000002, 'samples': 355136, 'steps': 693, 'loss/train': 4.405046463012695} -09/20/2021 16:53:29 - INFO - __main__ - Step 11099: {'lr': 0.00018480000000000002, 'samples': 355168, 'steps': 693, 'loss/train': 4.2018537521362305} -09/20/2021 16:53:30 - INFO - __main__ - Step 11100: {'lr': 0.00018480000000000002, 'samples': 355200, 'steps': 693, 'loss/train': 4.649186134338379} -09/20/2021 16:53:31 - INFO - __main__ - Step 11101: {'lr': 0.00018480000000000002, 'samples': 355232, 'steps': 693, 'loss/train': 4.685657024383545} -09/20/2021 16:53:31 - INFO - __main__ - Step 11102: {'lr': 0.00018480000000000002, 'samples': 355264, 'steps': 693, 'loss/train': 4.981956958770752} -09/20/2021 16:53:33 - INFO - __main__ - Step 11103: {'lr': 0.00018480000000000002, 'samples': 355296, 'steps': 693, 'loss/train': 3.5302557945251465} -09/20/2021 16:53:34 - INFO - __main__ - Step 11104: {'lr': 0.00018480000000000002, 'samples': 355328, 'steps': 693, 'loss/train': 4.690622806549072} -09/20/2021 16:53:34 - INFO - __main__ - Step 11105: {'lr': 0.00018506666666666667, 'samples': 355360, 'steps': 694, 'loss/train': 3.8106255531311035} -09/20/2021 16:53:35 - INFO - __main__ - Step 11106: {'lr': 0.00018506666666666667, 'samples': 355392, 'steps': 694, 'loss/train': 5.434937953948975} -09/20/2021 16:53:36 - INFO - __main__ - Step 11107: {'lr': 0.00018506666666666667, 'samples': 355424, 'steps': 694, 'loss/train': 4.8858819007873535} -09/20/2021 16:53:37 - INFO - __main__ - Step 11108: {'lr': 0.00018506666666666667, 'samples': 355456, 'steps': 694, 'loss/train': 4.18435525894165} -09/20/2021 16:53:37 - INFO - __main__ - Step 11109: {'lr': 0.00018506666666666667, 'samples': 355488, 'steps': 694, 'loss/train': 4.657719612121582} -09/20/2021 16:53:38 - INFO - __main__ - Step 11110: {'lr': 0.00018506666666666667, 'samples': 355520, 'steps': 694, 'loss/train': 4.385720252990723} -09/20/2021 16:53:39 - INFO - __main__ - Step 11111: {'lr': 0.00018506666666666667, 'samples': 355552, 'steps': 694, 'loss/train': 4.421297550201416} -09/20/2021 16:53:40 - INFO - __main__ - Step 11112: {'lr': 0.00018506666666666667, 'samples': 355584, 'steps': 694, 'loss/train': 3.1455276012420654} -09/20/2021 16:53:40 - INFO - __main__ - Step 11113: {'lr': 0.00018506666666666667, 'samples': 355616, 'steps': 694, 'loss/train': 5.0130391120910645} -09/20/2021 16:53:41 - INFO - __main__ - Step 11114: {'lr': 0.00018506666666666667, 'samples': 355648, 'steps': 694, 'loss/train': 4.369174957275391} -09/20/2021 16:53:42 - INFO - __main__ - Step 11115: {'lr': 0.00018506666666666667, 'samples': 355680, 'steps': 694, 'loss/train': 4.728602409362793} -09/20/2021 16:53:43 - INFO - __main__ - Step 11116: {'lr': 0.00018506666666666667, 'samples': 355712, 'steps': 694, 'loss/train': 4.7167067527771} -09/20/2021 16:53:43 - INFO - __main__ - Step 11117: {'lr': 0.00018506666666666667, 'samples': 355744, 'steps': 694, 'loss/train': 3.8309078216552734} -09/20/2021 16:53:44 - INFO - __main__ - Step 11118: {'lr': 0.00018506666666666667, 'samples': 355776, 'steps': 694, 'loss/train': 3.695772171020508} -09/20/2021 16:53:45 - INFO - __main__ - Step 11119: {'lr': 0.00018506666666666667, 'samples': 355808, 'steps': 694, 'loss/train': 4.957359313964844} -09/20/2021 16:53:46 - INFO - __main__ - Step 11120: {'lr': 0.00018506666666666667, 'samples': 355840, 'steps': 694, 'loss/train': 4.271944046020508} -09/20/2021 16:53:47 - INFO - __main__ - Step 11121: {'lr': 0.00018533333333333333, 'samples': 355872, 'steps': 695, 'loss/train': 3.726823568344116} -09/20/2021 16:53:47 - INFO - __main__ - Step 11122: {'lr': 0.00018533333333333333, 'samples': 355904, 'steps': 695, 'loss/train': 3.763686418533325} -09/20/2021 16:53:48 - INFO - __main__ - Step 11123: {'lr': 0.00018533333333333333, 'samples': 355936, 'steps': 695, 'loss/train': 5.186069011688232} -09/20/2021 16:53:49 - INFO - __main__ - Step 11124: {'lr': 0.00018533333333333333, 'samples': 355968, 'steps': 695, 'loss/train': 6.505827903747559} -09/20/2021 16:53:50 - INFO - __main__ - Step 11125: {'lr': 0.00018533333333333333, 'samples': 356000, 'steps': 695, 'loss/train': 6.444966793060303} -09/20/2021 16:53:50 - INFO - __main__ - Step 11126: {'lr': 0.00018533333333333333, 'samples': 356032, 'steps': 695, 'loss/train': 6.394215106964111} -09/20/2021 16:53:51 - INFO - __main__ - Step 11127: {'lr': 0.00018533333333333333, 'samples': 356064, 'steps': 695, 'loss/train': 6.454896926879883} -09/20/2021 16:53:52 - INFO - __main__ - Step 11128: {'lr': 0.00018533333333333333, 'samples': 356096, 'steps': 695, 'loss/train': 6.314675807952881} -09/20/2021 16:53:53 - INFO - __main__ - Step 11129: {'lr': 0.00018533333333333333, 'samples': 356128, 'steps': 695, 'loss/train': 6.351470470428467} -09/20/2021 16:53:53 - INFO - __main__ - Step 11130: {'lr': 0.00018533333333333333, 'samples': 356160, 'steps': 695, 'loss/train': 6.386819839477539} -09/20/2021 16:53:54 - INFO - __main__ - Step 11131: {'lr': 0.00018533333333333333, 'samples': 356192, 'steps': 695, 'loss/train': 3.8766872882843018} -09/20/2021 16:53:55 - INFO - __main__ - Step 11132: {'lr': 0.00018533333333333333, 'samples': 356224, 'steps': 695, 'loss/train': 3.57576847076416} -09/20/2021 16:53:56 - INFO - __main__ - Step 11133: {'lr': 0.00018533333333333333, 'samples': 356256, 'steps': 695, 'loss/train': 3.8976686000823975} -09/20/2021 16:53:56 - INFO - __main__ - Step 11134: {'lr': 0.00018533333333333333, 'samples': 356288, 'steps': 695, 'loss/train': 5.1983466148376465} -09/20/2021 16:53:57 - INFO - __main__ - Step 11135: {'lr': 0.00018533333333333333, 'samples': 356320, 'steps': 695, 'loss/train': 4.612381458282471} -09/20/2021 16:53:58 - INFO - __main__ - Step 11136: {'lr': 0.00018533333333333333, 'samples': 356352, 'steps': 695, 'loss/train': 3.8592610359191895} -09/20/2021 16:53:59 - INFO - __main__ - Step 11137: {'lr': 0.0001856, 'samples': 356384, 'steps': 696, 'loss/train': 4.747340679168701} -09/20/2021 16:54:00 - INFO - __main__ - Step 11138: {'lr': 0.0001856, 'samples': 356416, 'steps': 696, 'loss/train': 4.4111857414245605} -09/20/2021 16:54:01 - INFO - __main__ - Step 11139: {'lr': 0.0001856, 'samples': 356448, 'steps': 696, 'loss/train': 4.407690525054932} -09/20/2021 16:54:02 - INFO - __main__ - Step 11140: {'lr': 0.0001856, 'samples': 356480, 'steps': 696, 'loss/train': 4.9667768478393555} -09/20/2021 16:54:02 - INFO - __main__ - Step 11141: {'lr': 0.0001856, 'samples': 356512, 'steps': 696, 'loss/train': 4.339874267578125} -09/20/2021 16:54:03 - INFO - __main__ - Step 11142: {'lr': 0.0001856, 'samples': 356544, 'steps': 696, 'loss/train': 4.4979753494262695} -09/20/2021 16:54:04 - INFO - __main__ - Step 11143: {'lr': 0.0001856, 'samples': 356576, 'steps': 696, 'loss/train': 4.692720890045166} -09/20/2021 16:54:05 - INFO - __main__ - Step 11144: {'lr': 0.0001856, 'samples': 356608, 'steps': 696, 'loss/train': 4.4097795486450195} -09/20/2021 16:54:05 - INFO - __main__ - Step 11145: {'lr': 0.0001856, 'samples': 356640, 'steps': 696, 'loss/train': 3.4418938159942627} -09/20/2021 16:54:06 - INFO - __main__ - Step 11146: {'lr': 0.0001856, 'samples': 356672, 'steps': 696, 'loss/train': 1.56178879737854} -09/20/2021 16:54:07 - INFO - __main__ - Step 11147: {'lr': 0.0001856, 'samples': 356704, 'steps': 696, 'loss/train': 1.8475399017333984} -09/20/2021 16:54:08 - INFO - __main__ - Step 11148: {'lr': 0.0001856, 'samples': 356736, 'steps': 696, 'loss/train': 2.3864939212799072} -09/20/2021 16:54:08 - INFO - __main__ - Step 11149: {'lr': 0.0001856, 'samples': 356768, 'steps': 696, 'loss/train': 1.9581598043441772} -09/20/2021 16:54:09 - INFO - __main__ - Step 11150: {'lr': 0.0001856, 'samples': 356800, 'steps': 696, 'loss/train': 4.162323474884033} -09/20/2021 16:54:10 - INFO - __main__ - Step 11151: {'lr': 0.0001856, 'samples': 356832, 'steps': 696, 'loss/train': 4.698967933654785} -09/20/2021 16:54:11 - INFO - __main__ - Step 11152: {'lr': 0.0001856, 'samples': 356864, 'steps': 696, 'loss/train': 3.350768804550171} -09/20/2021 16:54:12 - INFO - __main__ - Step 11153: {'lr': 0.00018586666666666667, 'samples': 356896, 'steps': 697, 'loss/train': 4.152111053466797} -09/20/2021 16:54:12 - INFO - __main__ - Step 11154: {'lr': 0.00018586666666666667, 'samples': 356928, 'steps': 697, 'loss/train': 4.01918363571167} -09/20/2021 16:54:13 - INFO - __main__ - Step 11155: {'lr': 0.00018586666666666667, 'samples': 356960, 'steps': 697, 'loss/train': 4.865062713623047} -09/20/2021 16:54:14 - INFO - __main__ - Step 11156: {'lr': 0.00018586666666666667, 'samples': 356992, 'steps': 697, 'loss/train': 4.536833763122559} -09/20/2021 16:54:15 - INFO - __main__ - Step 11157: {'lr': 0.00018586666666666667, 'samples': 357024, 'steps': 697, 'loss/train': 4.242519855499268} -09/20/2021 16:54:15 - INFO - __main__ - Step 11158: {'lr': 0.00018586666666666667, 'samples': 357056, 'steps': 697, 'loss/train': 4.188387870788574} -09/20/2021 16:54:16 - INFO - __main__ - Step 11159: {'lr': 0.00018586666666666667, 'samples': 357088, 'steps': 697, 'loss/train': 4.3400421142578125} -09/20/2021 16:54:17 - INFO - __main__ - Step 11160: {'lr': 0.00018586666666666667, 'samples': 357120, 'steps': 697, 'loss/train': 4.090182304382324} -09/20/2021 16:54:18 - INFO - __main__ - Step 11161: {'lr': 0.00018586666666666667, 'samples': 357152, 'steps': 697, 'loss/train': 4.153143882751465} -09/20/2021 16:54:18 - INFO - __main__ - Step 11162: {'lr': 0.00018586666666666667, 'samples': 357184, 'steps': 697, 'loss/train': 4.86424446105957} -09/20/2021 16:54:19 - INFO - __main__ - Step 11163: {'lr': 0.00018586666666666667, 'samples': 357216, 'steps': 697, 'loss/train': 3.793015956878662} -09/20/2021 16:54:20 - INFO - __main__ - Step 11164: {'lr': 0.00018586666666666667, 'samples': 357248, 'steps': 697, 'loss/train': 4.481766700744629} -09/20/2021 16:54:21 - INFO - __main__ - Step 11165: {'lr': 0.00018586666666666667, 'samples': 357280, 'steps': 697, 'loss/train': 4.239414215087891} -09/20/2021 16:54:21 - INFO - __main__ - Step 11166: {'lr': 0.00018586666666666667, 'samples': 357312, 'steps': 697, 'loss/train': 3.7954211235046387} -09/20/2021 16:54:22 - INFO - __main__ - Step 11167: {'lr': 0.00018586666666666667, 'samples': 357344, 'steps': 697, 'loss/train': 3.7166614532470703} -09/20/2021 16:54:23 - INFO - __main__ - Step 11168: {'lr': 0.00018586666666666667, 'samples': 357376, 'steps': 697, 'loss/train': 4.851043701171875} -09/20/2021 16:54:24 - INFO - __main__ - Step 11169: {'lr': 0.00018613333333333335, 'samples': 357408, 'steps': 698, 'loss/train': 4.504152774810791} -09/20/2021 16:54:25 - INFO - __main__ - Step 11170: {'lr': 0.00018613333333333335, 'samples': 357440, 'steps': 698, 'loss/train': 4.295408725738525} -09/20/2021 16:54:26 - INFO - __main__ - Step 11171: {'lr': 0.00018613333333333335, 'samples': 357472, 'steps': 698, 'loss/train': 4.351712226867676} -09/20/2021 16:54:26 - INFO - __main__ - Step 11172: {'lr': 0.00018613333333333335, 'samples': 357504, 'steps': 698, 'loss/train': 3.8900246620178223} -09/20/2021 16:54:27 - INFO - __main__ - Step 11173: {'lr': 0.00018613333333333335, 'samples': 357536, 'steps': 698, 'loss/train': 4.967743873596191} -09/20/2021 16:54:28 - INFO - __main__ - Step 11174: {'lr': 0.00018613333333333335, 'samples': 357568, 'steps': 698, 'loss/train': 4.661613941192627} -09/20/2021 16:54:29 - INFO - __main__ - Step 11175: {'lr': 0.00018613333333333335, 'samples': 357600, 'steps': 698, 'loss/train': 4.036383628845215} -09/20/2021 16:54:29 - INFO - __main__ - Step 11176: {'lr': 0.00018613333333333335, 'samples': 357632, 'steps': 698, 'loss/train': 5.0867414474487305} -09/20/2021 16:54:30 - INFO - __main__ - Step 11177: {'lr': 0.00018613333333333335, 'samples': 357664, 'steps': 698, 'loss/train': 3.7445616722106934} -09/20/2021 16:54:31 - INFO - __main__ - Step 11178: {'lr': 0.00018613333333333335, 'samples': 357696, 'steps': 698, 'loss/train': 6.350292205810547} -09/20/2021 16:54:32 - INFO - __main__ - Step 11179: {'lr': 0.00018613333333333335, 'samples': 357728, 'steps': 698, 'loss/train': 4.229259014129639} -09/20/2021 16:54:32 - INFO - __main__ - Step 11180: {'lr': 0.00018613333333333335, 'samples': 357760, 'steps': 698, 'loss/train': 4.461276054382324} -09/20/2021 16:54:33 - INFO - __main__ - Step 11181: {'lr': 0.00018613333333333335, 'samples': 357792, 'steps': 698, 'loss/train': 4.635037899017334} -09/20/2021 16:54:34 - INFO - __main__ - Step 11182: {'lr': 0.00018613333333333335, 'samples': 357824, 'steps': 698, 'loss/train': 5.262924671173096} -09/20/2021 16:54:35 - INFO - __main__ - Step 11183: {'lr': 0.00018613333333333335, 'samples': 357856, 'steps': 698, 'loss/train': 4.7763872146606445} -09/20/2021 16:54:35 - INFO - __main__ - Step 11184: {'lr': 0.00018613333333333335, 'samples': 357888, 'steps': 698, 'loss/train': 4.910128593444824} -09/20/2021 16:54:36 - INFO - __main__ - Step 11185: {'lr': 0.00018640000000000003, 'samples': 357920, 'steps': 699, 'loss/train': 3.914794921875} -09/20/2021 16:54:37 - INFO - __main__ - Step 11186: {'lr': 0.00018640000000000003, 'samples': 357952, 'steps': 699, 'loss/train': 5.223903656005859} -09/20/2021 16:54:38 - INFO - __main__ - Step 11187: {'lr': 0.00018640000000000003, 'samples': 357984, 'steps': 699, 'loss/train': 4.142485618591309} -09/20/2021 16:54:39 - INFO - __main__ - Step 11188: {'lr': 0.00018640000000000003, 'samples': 358016, 'steps': 699, 'loss/train': 3.9239044189453125} -09/20/2021 16:54:39 - INFO - __main__ - Step 11189: {'lr': 0.00018640000000000003, 'samples': 358048, 'steps': 699, 'loss/train': 4.02017879486084} -09/20/2021 16:54:40 - INFO - __main__ - Step 11190: {'lr': 0.00018640000000000003, 'samples': 358080, 'steps': 699, 'loss/train': 4.204233646392822} -09/20/2021 16:54:41 - INFO - __main__ - Step 11191: {'lr': 0.00018640000000000003, 'samples': 358112, 'steps': 699, 'loss/train': 4.1760573387146} -09/20/2021 16:54:42 - INFO - __main__ - Step 11192: {'lr': 0.00018640000000000003, 'samples': 358144, 'steps': 699, 'loss/train': 5.020533561706543} -09/20/2021 16:54:42 - INFO - __main__ - Step 11193: {'lr': 0.00018640000000000003, 'samples': 358176, 'steps': 699, 'loss/train': 4.437668323516846} -09/20/2021 16:54:43 - INFO - __main__ - Step 11194: {'lr': 0.00018640000000000003, 'samples': 358208, 'steps': 699, 'loss/train': 4.864872932434082} -09/20/2021 16:54:44 - INFO - __main__ - Step 11195: {'lr': 0.00018640000000000003, 'samples': 358240, 'steps': 699, 'loss/train': 4.154875755310059} -09/20/2021 16:54:45 - INFO - __main__ - Step 11196: {'lr': 0.00018640000000000003, 'samples': 358272, 'steps': 699, 'loss/train': 4.413610935211182} -09/20/2021 16:54:45 - INFO - __main__ - Step 11197: {'lr': 0.00018640000000000003, 'samples': 358304, 'steps': 699, 'loss/train': 5.381319999694824} -09/20/2021 16:54:46 - INFO - __main__ - Step 11198: {'lr': 0.00018640000000000003, 'samples': 358336, 'steps': 699, 'loss/train': 4.251371383666992} -09/20/2021 16:54:47 - INFO - __main__ - Step 11199: {'lr': 0.00018640000000000003, 'samples': 358368, 'steps': 699, 'loss/train': 4.620230197906494} -09/20/2021 16:54:48 - INFO - __main__ - Step 11200: {'lr': 0.00018640000000000003, 'samples': 358400, 'steps': 699, 'loss/train': 3.5671017169952393} -09/20/2021 16:54:49 - INFO - __main__ - Step 11201: {'lr': 0.0001866666666666667, 'samples': 358432, 'steps': 700, 'loss/train': 4.402175426483154} -09/20/2021 16:54:50 - INFO - __main__ - Step 11202: {'lr': 0.0001866666666666667, 'samples': 358464, 'steps': 700, 'loss/train': 4.810846328735352} -09/20/2021 16:54:51 - INFO - __main__ - Step 11203: {'lr': 0.0001866666666666667, 'samples': 358496, 'steps': 700, 'loss/train': 5.162858486175537} -09/20/2021 16:54:51 - INFO - __main__ - Step 11204: {'lr': 0.0001866666666666667, 'samples': 358528, 'steps': 700, 'loss/train': 4.968283653259277} -09/20/2021 16:54:52 - INFO - __main__ - Step 11205: {'lr': 0.0001866666666666667, 'samples': 358560, 'steps': 700, 'loss/train': 4.882223129272461} -09/20/2021 16:54:53 - INFO - __main__ - Step 11206: {'lr': 0.0001866666666666667, 'samples': 358592, 'steps': 700, 'loss/train': 3.3363494873046875} -09/20/2021 16:54:54 - INFO - __main__ - Step 11207: {'lr': 0.0001866666666666667, 'samples': 358624, 'steps': 700, 'loss/train': 4.689452171325684} -09/20/2021 16:54:54 - INFO - __main__ - Step 11208: {'lr': 0.0001866666666666667, 'samples': 358656, 'steps': 700, 'loss/train': 5.666888236999512} -09/20/2021 16:54:55 - INFO - __main__ - Step 11209: {'lr': 0.0001866666666666667, 'samples': 358688, 'steps': 700, 'loss/train': 5.183023452758789} -09/20/2021 16:54:56 - INFO - __main__ - Step 11210: {'lr': 0.0001866666666666667, 'samples': 358720, 'steps': 700, 'loss/train': 4.676233768463135} -09/20/2021 16:54:57 - INFO - __main__ - Step 11211: {'lr': 0.0001866666666666667, 'samples': 358752, 'steps': 700, 'loss/train': 4.729020595550537} -09/20/2021 16:54:57 - INFO - __main__ - Step 11212: {'lr': 0.0001866666666666667, 'samples': 358784, 'steps': 700, 'loss/train': 5.372630596160889} -09/20/2021 16:54:58 - INFO - __main__ - Step 11213: {'lr': 0.0001866666666666667, 'samples': 358816, 'steps': 700, 'loss/train': 3.680453062057495} -09/20/2021 16:54:59 - INFO - __main__ - Step 11214: {'lr': 0.0001866666666666667, 'samples': 358848, 'steps': 700, 'loss/train': 4.716707706451416} -09/20/2021 16:55:00 - INFO - __main__ - Step 11215: {'lr': 0.0001866666666666667, 'samples': 358880, 'steps': 700, 'loss/train': 3.6488142013549805} -09/20/2021 16:55:00 - INFO - __main__ - Step 11216: {'lr': 0.0001866666666666667, 'samples': 358912, 'steps': 700, 'loss/train': 4.737509250640869} -09/20/2021 16:55:01 - INFO - __main__ - Step 11217: {'lr': 0.00018693333333333334, 'samples': 358944, 'steps': 701, 'loss/train': 4.178997039794922} -09/20/2021 16:55:02 - INFO - __main__ - Step 11218: {'lr': 0.00018693333333333334, 'samples': 358976, 'steps': 701, 'loss/train': 4.247750759124756} -09/20/2021 16:55:03 - INFO - __main__ - Step 11219: {'lr': 0.00018693333333333334, 'samples': 359008, 'steps': 701, 'loss/train': 4.386443614959717} -09/20/2021 16:55:03 - INFO - __main__ - Step 11220: {'lr': 0.00018693333333333334, 'samples': 359040, 'steps': 701, 'loss/train': 3.8221054077148438} -09/20/2021 16:55:04 - INFO - __main__ - Step 11221: {'lr': 0.00018693333333333334, 'samples': 359072, 'steps': 701, 'loss/train': 3.956859827041626} -09/20/2021 16:55:05 - INFO - __main__ - Step 11222: {'lr': 0.00018693333333333334, 'samples': 359104, 'steps': 701, 'loss/train': 4.892744541168213} -09/20/2021 16:55:06 - INFO - __main__ - Step 11223: {'lr': 0.00018693333333333334, 'samples': 359136, 'steps': 701, 'loss/train': 5.478114604949951} -09/20/2021 16:55:06 - INFO - __main__ - Step 11224: {'lr': 0.00018693333333333334, 'samples': 359168, 'steps': 701, 'loss/train': 4.553344249725342} -09/20/2021 16:55:07 - INFO - __main__ - Step 11225: {'lr': 0.00018693333333333334, 'samples': 359200, 'steps': 701, 'loss/train': 4.425262928009033} -09/20/2021 16:55:08 - INFO - __main__ - Step 11226: {'lr': 0.00018693333333333334, 'samples': 359232, 'steps': 701, 'loss/train': 3.871757984161377} -09/20/2021 16:55:09 - INFO - __main__ - Step 11227: {'lr': 0.00018693333333333334, 'samples': 359264, 'steps': 701, 'loss/train': 4.957165241241455} -09/20/2021 16:55:09 - INFO - __main__ - Step 11228: {'lr': 0.00018693333333333334, 'samples': 359296, 'steps': 701, 'loss/train': 4.110820770263672} -09/20/2021 16:55:10 - INFO - __main__ - Step 11229: {'lr': 0.00018693333333333334, 'samples': 359328, 'steps': 701, 'loss/train': 3.913707733154297} -09/20/2021 16:55:11 - INFO - __main__ - Step 11230: {'lr': 0.00018693333333333334, 'samples': 359360, 'steps': 701, 'loss/train': 4.044948101043701} -09/20/2021 16:55:12 - INFO - __main__ - Step 11231: {'lr': 0.00018693333333333334, 'samples': 359392, 'steps': 701, 'loss/train': 4.482124328613281} -09/20/2021 16:55:13 - INFO - __main__ - Step 11232: {'lr': 0.00018693333333333334, 'samples': 359424, 'steps': 701, 'loss/train': 4.220638275146484} -09/20/2021 16:55:14 - INFO - __main__ - Step 11233: {'lr': 0.00018720000000000002, 'samples': 359456, 'steps': 702, 'loss/train': 3.7509195804595947} -09/20/2021 16:55:15 - INFO - __main__ - Step 11234: {'lr': 0.00018720000000000002, 'samples': 359488, 'steps': 702, 'loss/train': 4.898077964782715} -09/20/2021 16:55:16 - INFO - __main__ - Step 11235: {'lr': 0.00018720000000000002, 'samples': 359520, 'steps': 702, 'loss/train': 4.916294574737549} -09/20/2021 16:55:16 - INFO - __main__ - Step 11236: {'lr': 0.00018720000000000002, 'samples': 359552, 'steps': 702, 'loss/train': 5.00370454788208} -09/20/2021 16:55:17 - INFO - __main__ - Step 11237: {'lr': 0.00018720000000000002, 'samples': 359584, 'steps': 702, 'loss/train': 3.426565647125244} -09/20/2021 16:55:18 - INFO - __main__ - Step 11238: {'lr': 0.00018720000000000002, 'samples': 359616, 'steps': 702, 'loss/train': 4.299834251403809} -09/20/2021 16:55:19 - INFO - __main__ - Step 11239: {'lr': 0.00018720000000000002, 'samples': 359648, 'steps': 702, 'loss/train': 4.065923690795898} -09/20/2021 16:55:19 - INFO - __main__ - Step 11240: {'lr': 0.00018720000000000002, 'samples': 359680, 'steps': 702, 'loss/train': 4.529930591583252} -09/20/2021 16:55:20 - INFO - __main__ - Step 11241: {'lr': 0.00018720000000000002, 'samples': 359712, 'steps': 702, 'loss/train': 5.500468730926514} -09/20/2021 16:55:21 - INFO - __main__ - Step 11242: {'lr': 0.00018720000000000002, 'samples': 359744, 'steps': 702, 'loss/train': 4.399942874908447} -09/20/2021 16:55:22 - INFO - __main__ - Step 11243: {'lr': 0.00018720000000000002, 'samples': 359776, 'steps': 702, 'loss/train': 2.6953389644622803} -09/20/2021 16:55:22 - INFO - __main__ - Step 11244: {'lr': 0.00018720000000000002, 'samples': 359808, 'steps': 702, 'loss/train': 4.031644821166992} -09/20/2021 16:55:23 - INFO - __main__ - Step 11245: {'lr': 0.00018720000000000002, 'samples': 359840, 'steps': 702, 'loss/train': 4.12111234664917} -09/20/2021 16:55:24 - INFO - __main__ - Step 11246: {'lr': 0.00018720000000000002, 'samples': 359872, 'steps': 702, 'loss/train': 3.821059226989746} -09/20/2021 16:55:25 - INFO - __main__ - Step 11247: {'lr': 0.00018720000000000002, 'samples': 359904, 'steps': 702, 'loss/train': 5.253561019897461} -09/20/2021 16:55:25 - INFO - __main__ - Step 11248: {'lr': 0.00018720000000000002, 'samples': 359936, 'steps': 702, 'loss/train': 6.1584792137146} -09/20/2021 16:55:26 - INFO - __main__ - Step 11249: {'lr': 0.00018746666666666668, 'samples': 359968, 'steps': 703, 'loss/train': 4.241442680358887} -09/20/2021 16:55:27 - INFO - __main__ - Step 11250: {'lr': 0.00018746666666666668, 'samples': 360000, 'steps': 703, 'loss/train': 1.7130695581436157} -09/20/2021 16:55:28 - INFO - __main__ - Step 11251: {'lr': 0.00018746666666666668, 'samples': 360032, 'steps': 703, 'loss/train': 4.17717981338501} -09/20/2021 16:55:28 - INFO - __main__ - Step 11252: {'lr': 0.00018746666666666668, 'samples': 360064, 'steps': 703, 'loss/train': 5.075399398803711} -09/20/2021 16:55:29 - INFO - __main__ - Step 11253: {'lr': 0.00018746666666666668, 'samples': 360096, 'steps': 703, 'loss/train': 4.644542694091797} -09/20/2021 16:55:30 - INFO - __main__ - Step 11254: {'lr': 0.00018746666666666668, 'samples': 360128, 'steps': 703, 'loss/train': 4.356349945068359} -09/20/2021 16:55:31 - INFO - __main__ - Step 11255: {'lr': 0.00018746666666666668, 'samples': 360160, 'steps': 703, 'loss/train': 3.6007421016693115} -09/20/2021 16:55:31 - INFO - __main__ - Step 11256: {'lr': 0.00018746666666666668, 'samples': 360192, 'steps': 703, 'loss/train': 4.674230098724365} -09/20/2021 16:55:32 - INFO - __main__ - Step 11257: {'lr': 0.00018746666666666668, 'samples': 360224, 'steps': 703, 'loss/train': 4.5777788162231445} -09/20/2021 16:55:33 - INFO - __main__ - Step 11258: {'lr': 0.00018746666666666668, 'samples': 360256, 'steps': 703, 'loss/train': 3.4343621730804443} -09/20/2021 16:55:34 - INFO - __main__ - Step 11259: {'lr': 0.00018746666666666668, 'samples': 360288, 'steps': 703, 'loss/train': 3.8184077739715576} -09/20/2021 16:55:34 - INFO - __main__ - Step 11260: {'lr': 0.00018746666666666668, 'samples': 360320, 'steps': 703, 'loss/train': 5.181297779083252} -09/20/2021 16:55:36 - INFO - __main__ - Step 11261: {'lr': 0.00018746666666666668, 'samples': 360352, 'steps': 703, 'loss/train': 4.774933815002441} -09/20/2021 16:55:36 - INFO - __main__ - Step 11262: {'lr': 0.00018746666666666668, 'samples': 360384, 'steps': 703, 'loss/train': 4.559683322906494} -09/20/2021 16:55:37 - INFO - __main__ - Step 11263: {'lr': 0.00018746666666666668, 'samples': 360416, 'steps': 703, 'loss/train': 4.521308422088623} -09/20/2021 16:55:38 - INFO - __main__ - Step 11264: {'lr': 0.00018746666666666668, 'samples': 360448, 'steps': 703, 'loss/train': 4.954966068267822} -09/20/2021 16:55:39 - INFO - __main__ - Step 11265: {'lr': 0.00018773333333333333, 'samples': 360480, 'steps': 704, 'loss/train': 4.3107805252075195} -09/20/2021 16:55:40 - INFO - __main__ - Step 11266: {'lr': 0.00018773333333333333, 'samples': 360512, 'steps': 704, 'loss/train': 3.940261125564575} -09/20/2021 16:55:40 - INFO - __main__ - Step 11267: {'lr': 0.00018773333333333333, 'samples': 360544, 'steps': 704, 'loss/train': 4.705063343048096} -09/20/2021 16:55:41 - INFO - __main__ - Step 11268: {'lr': 0.00018773333333333333, 'samples': 360576, 'steps': 704, 'loss/train': 3.94248366355896} -09/20/2021 16:55:42 - INFO - __main__ - Step 11269: {'lr': 0.00018773333333333333, 'samples': 360608, 'steps': 704, 'loss/train': 4.353455543518066} -09/20/2021 16:55:43 - INFO - __main__ - Step 11270: {'lr': 0.00018773333333333333, 'samples': 360640, 'steps': 704, 'loss/train': 4.0122575759887695} -09/20/2021 16:55:43 - INFO - __main__ - Step 11271: {'lr': 0.00018773333333333333, 'samples': 360672, 'steps': 704, 'loss/train': 4.896043300628662} -09/20/2021 16:55:44 - INFO - __main__ - Step 11272: {'lr': 0.00018773333333333333, 'samples': 360704, 'steps': 704, 'loss/train': 3.8302409648895264} -09/20/2021 16:55:45 - INFO - __main__ - Step 11273: {'lr': 0.00018773333333333333, 'samples': 360736, 'steps': 704, 'loss/train': 5.080112457275391} -09/20/2021 16:55:46 - INFO - __main__ - Step 11274: {'lr': 0.00018773333333333333, 'samples': 360768, 'steps': 704, 'loss/train': 3.7759273052215576} -09/20/2021 16:55:46 - INFO - __main__ - Step 11275: {'lr': 0.00018773333333333333, 'samples': 360800, 'steps': 704, 'loss/train': 4.365203857421875} -09/20/2021 16:55:47 - INFO - __main__ - Step 11276: {'lr': 0.00018773333333333333, 'samples': 360832, 'steps': 704, 'loss/train': 4.234359264373779} -09/20/2021 16:55:48 - INFO - __main__ - Step 11277: {'lr': 0.00018773333333333333, 'samples': 360864, 'steps': 704, 'loss/train': 4.20524263381958} -09/20/2021 16:55:49 - INFO - __main__ - Step 11278: {'lr': 0.00018773333333333333, 'samples': 360896, 'steps': 704, 'loss/train': 5.713846206665039} -09/20/2021 16:55:49 - INFO - __main__ - Step 11279: {'lr': 0.00018773333333333333, 'samples': 360928, 'steps': 704, 'loss/train': 4.463252544403076} -09/20/2021 16:55:50 - INFO - __main__ - Step 11280: {'lr': 0.00018773333333333333, 'samples': 360960, 'steps': 704, 'loss/train': 3.7781288623809814} -09/20/2021 16:55:51 - INFO - __main__ - Step 11281: {'lr': 0.000188, 'samples': 360992, 'steps': 705, 'loss/train': 3.063176155090332} -09/20/2021 16:55:52 - INFO - __main__ - Step 11282: {'lr': 0.000188, 'samples': 361024, 'steps': 705, 'loss/train': 4.302892208099365} -09/20/2021 16:55:52 - INFO - __main__ - Step 11283: {'lr': 0.000188, 'samples': 361056, 'steps': 705, 'loss/train': 4.109063148498535} -09/20/2021 16:55:53 - INFO - __main__ - Step 11284: {'lr': 0.000188, 'samples': 361088, 'steps': 705, 'loss/train': 4.181624889373779} -09/20/2021 16:55:54 - INFO - __main__ - Step 11285: {'lr': 0.000188, 'samples': 361120, 'steps': 705, 'loss/train': 4.520687580108643} -09/20/2021 16:55:55 - INFO - __main__ - Step 11286: {'lr': 0.000188, 'samples': 361152, 'steps': 705, 'loss/train': 5.230519771575928} -09/20/2021 16:55:55 - INFO - __main__ - Step 11287: {'lr': 0.000188, 'samples': 361184, 'steps': 705, 'loss/train': 4.247565269470215} -09/20/2021 16:55:56 - INFO - __main__ - Step 11288: {'lr': 0.000188, 'samples': 361216, 'steps': 705, 'loss/train': 4.886206150054932} -09/20/2021 16:55:57 - INFO - __main__ - Step 11289: {'lr': 0.000188, 'samples': 361248, 'steps': 705, 'loss/train': 3.8253068923950195} -09/20/2021 16:55:58 - INFO - __main__ - Step 11290: {'lr': 0.000188, 'samples': 361280, 'steps': 705, 'loss/train': 4.5138702392578125} -09/20/2021 16:55:58 - INFO - __main__ - Step 11291: {'lr': 0.000188, 'samples': 361312, 'steps': 705, 'loss/train': 4.2194342613220215} -09/20/2021 16:56:00 - INFO - __main__ - Step 11292: {'lr': 0.000188, 'samples': 361344, 'steps': 705, 'loss/train': 4.756901264190674} -09/20/2021 16:56:01 - INFO - __main__ - Step 11293: {'lr': 0.000188, 'samples': 361376, 'steps': 705, 'loss/train': 4.368873596191406} -09/20/2021 16:56:02 - INFO - __main__ - Step 11294: {'lr': 0.000188, 'samples': 361408, 'steps': 705, 'loss/train': 4.845852375030518} -09/20/2021 16:56:03 - INFO - __main__ - Step 11295: {'lr': 0.000188, 'samples': 361440, 'steps': 705, 'loss/train': 3.8857359886169434} -09/20/2021 16:56:03 - INFO - __main__ - Step 11296: {'lr': 0.000188, 'samples': 361472, 'steps': 705, 'loss/train': 5.027984142303467} -09/20/2021 16:56:04 - INFO - __main__ - Step 11297: {'lr': 0.00018826666666666667, 'samples': 361504, 'steps': 706, 'loss/train': 3.9419186115264893} -09/20/2021 16:56:05 - INFO - __main__ - Step 11298: {'lr': 0.00018826666666666667, 'samples': 361536, 'steps': 706, 'loss/train': 2.494464635848999} -09/20/2021 16:56:06 - INFO - __main__ - Step 11299: {'lr': 0.00018826666666666667, 'samples': 361568, 'steps': 706, 'loss/train': 4.787599563598633} -09/20/2021 16:56:06 - INFO - __main__ - Step 11300: {'lr': 0.00018826666666666667, 'samples': 361600, 'steps': 706, 'loss/train': 4.072394847869873} -09/20/2021 16:56:07 - INFO - __main__ - Step 11301: {'lr': 0.00018826666666666667, 'samples': 361632, 'steps': 706, 'loss/train': 4.063255786895752} -09/20/2021 16:56:08 - INFO - __main__ - Step 11302: {'lr': 0.00018826666666666667, 'samples': 361664, 'steps': 706, 'loss/train': 3.6792666912078857} -09/20/2021 16:56:09 - INFO - __main__ - Step 11303: {'lr': 0.00018826666666666667, 'samples': 361696, 'steps': 706, 'loss/train': 4.370833873748779} -09/20/2021 16:56:09 - INFO - __main__ - Step 11304: {'lr': 0.00018826666666666667, 'samples': 361728, 'steps': 706, 'loss/train': 4.34027099609375} -09/20/2021 16:56:10 - INFO - __main__ - Step 11305: {'lr': 0.00018826666666666667, 'samples': 361760, 'steps': 706, 'loss/train': 4.203998565673828} -09/20/2021 16:56:11 - INFO - __main__ - Step 11306: {'lr': 0.00018826666666666667, 'samples': 361792, 'steps': 706, 'loss/train': 3.47554874420166} -09/20/2021 16:56:12 - INFO - __main__ - Step 11307: {'lr': 0.00018826666666666667, 'samples': 361824, 'steps': 706, 'loss/train': 6.068390369415283} -09/20/2021 16:56:12 - INFO - __main__ - Step 11308: {'lr': 0.00018826666666666667, 'samples': 361856, 'steps': 706, 'loss/train': 5.708106994628906} -09/20/2021 16:56:13 - INFO - __main__ - Step 11309: {'lr': 0.00018826666666666667, 'samples': 361888, 'steps': 706, 'loss/train': 5.858125686645508} -09/20/2021 16:56:14 - INFO - __main__ - Step 11310: {'lr': 0.00018826666666666667, 'samples': 361920, 'steps': 706, 'loss/train': 6.039351463317871} -09/20/2021 16:56:15 - INFO - __main__ - Step 11311: {'lr': 0.00018826666666666667, 'samples': 361952, 'steps': 706, 'loss/train': 3.5465095043182373} -09/20/2021 16:56:15 - INFO - __main__ - Step 11312: {'lr': 0.00018826666666666667, 'samples': 361984, 'steps': 706, 'loss/train': 4.552252292633057} -09/20/2021 16:56:16 - INFO - __main__ - Step 11313: {'lr': 0.00018853333333333333, 'samples': 362016, 'steps': 707, 'loss/train': 3.977241277694702} -09/20/2021 16:56:17 - INFO - __main__ - Step 11314: {'lr': 0.00018853333333333333, 'samples': 362048, 'steps': 707, 'loss/train': 3.516533851623535} -09/20/2021 16:56:18 - INFO - __main__ - Step 11315: {'lr': 0.00018853333333333333, 'samples': 362080, 'steps': 707, 'loss/train': 3.6668694019317627} -09/20/2021 16:56:19 - INFO - __main__ - Step 11316: {'lr': 0.00018853333333333333, 'samples': 362112, 'steps': 707, 'loss/train': 4.337321758270264} -09/20/2021 16:56:19 - INFO - __main__ - Step 11317: {'lr': 0.00018853333333333333, 'samples': 362144, 'steps': 707, 'loss/train': 4.351069927215576} -09/20/2021 16:56:20 - INFO - __main__ - Step 11318: {'lr': 0.00018853333333333333, 'samples': 362176, 'steps': 707, 'loss/train': 5.383344650268555} -09/20/2021 16:56:21 - INFO - __main__ - Step 11319: {'lr': 0.00018853333333333333, 'samples': 362208, 'steps': 707, 'loss/train': 4.267788410186768} -09/20/2021 16:56:22 - INFO - __main__ - Step 11320: {'lr': 0.00018853333333333333, 'samples': 362240, 'steps': 707, 'loss/train': 4.245926380157471} -09/20/2021 16:56:22 - INFO - __main__ - Step 11321: {'lr': 0.00018853333333333333, 'samples': 362272, 'steps': 707, 'loss/train': 4.429569721221924} -09/20/2021 16:56:23 - INFO - __main__ - Step 11322: {'lr': 0.00018853333333333333, 'samples': 362304, 'steps': 707, 'loss/train': 4.420252799987793} -09/20/2021 16:56:24 - INFO - __main__ - Step 11323: {'lr': 0.00018853333333333333, 'samples': 362336, 'steps': 707, 'loss/train': 4.424712181091309} -09/20/2021 16:56:25 - INFO - __main__ - Step 11324: {'lr': 0.00018853333333333333, 'samples': 362368, 'steps': 707, 'loss/train': 3.7041819095611572} -09/20/2021 16:56:26 - INFO - __main__ - Step 11325: {'lr': 0.00018853333333333333, 'samples': 362400, 'steps': 707, 'loss/train': 4.122419834136963} -09/20/2021 16:56:27 - INFO - __main__ - Step 11326: {'lr': 0.00018853333333333333, 'samples': 362432, 'steps': 707, 'loss/train': 4.736020565032959} -09/20/2021 16:56:27 - INFO - __main__ - Step 11327: {'lr': 0.00018853333333333333, 'samples': 362464, 'steps': 707, 'loss/train': 6.196974754333496} -09/20/2021 16:56:28 - INFO - __main__ - Step 11328: {'lr': 0.00018853333333333333, 'samples': 362496, 'steps': 707, 'loss/train': 3.947544813156128} -09/20/2021 16:56:29 - INFO - __main__ - Step 11329: {'lr': 0.0001888, 'samples': 362528, 'steps': 708, 'loss/train': 4.865401744842529} -09/20/2021 16:56:30 - INFO - __main__ - Step 11330: {'lr': 0.0001888, 'samples': 362560, 'steps': 708, 'loss/train': 5.296445846557617} -09/20/2021 16:56:31 - INFO - __main__ - Step 11331: {'lr': 0.0001888, 'samples': 362592, 'steps': 708, 'loss/train': 4.286447525024414} -09/20/2021 16:56:31 - INFO - __main__ - Step 11332: {'lr': 0.0001888, 'samples': 362624, 'steps': 708, 'loss/train': 4.2951884269714355} -09/20/2021 16:56:32 - INFO - __main__ - Step 11333: {'lr': 0.0001888, 'samples': 362656, 'steps': 708, 'loss/train': 4.250777721405029} -09/20/2021 16:56:33 - INFO - __main__ - Step 11334: {'lr': 0.0001888, 'samples': 362688, 'steps': 708, 'loss/train': 2.7746336460113525} -09/20/2021 16:56:34 - INFO - __main__ - Step 11335: {'lr': 0.0001888, 'samples': 362720, 'steps': 708, 'loss/train': 5.939903259277344} -09/20/2021 16:56:34 - INFO - __main__ - Step 11336: {'lr': 0.0001888, 'samples': 362752, 'steps': 708, 'loss/train': 4.659902572631836} -09/20/2021 16:56:35 - INFO - __main__ - Step 11337: {'lr': 0.0001888, 'samples': 362784, 'steps': 708, 'loss/train': 4.162271022796631} -09/20/2021 16:56:36 - INFO - __main__ - Step 11338: {'lr': 0.0001888, 'samples': 362816, 'steps': 708, 'loss/train': 5.158646106719971} -09/20/2021 16:56:37 - INFO - __main__ - Step 11339: {'lr': 0.0001888, 'samples': 362848, 'steps': 708, 'loss/train': 5.65268611907959} -09/20/2021 16:56:37 - INFO - __main__ - Step 11340: {'lr': 0.0001888, 'samples': 362880, 'steps': 708, 'loss/train': 5.09292459487915} -09/20/2021 16:56:38 - INFO - __main__ - Step 11341: {'lr': 0.0001888, 'samples': 362912, 'steps': 708, 'loss/train': 4.98360538482666} -09/20/2021 16:56:39 - INFO - __main__ - Step 11342: {'lr': 0.0001888, 'samples': 362944, 'steps': 708, 'loss/train': 5.707160472869873} -09/20/2021 16:56:40 - INFO - __main__ - Step 11343: {'lr': 0.0001888, 'samples': 362976, 'steps': 708, 'loss/train': 4.085366725921631} -09/20/2021 16:56:40 - INFO - __main__ - Step 11344: {'lr': 0.0001888, 'samples': 363008, 'steps': 708, 'loss/train': 4.381335735321045} -09/20/2021 16:56:41 - INFO - __main__ - Step 11345: {'lr': 0.0001890666666666667, 'samples': 363040, 'steps': 709, 'loss/train': 4.768544673919678} -09/20/2021 16:56:42 - INFO - __main__ - Step 11346: {'lr': 0.0001890666666666667, 'samples': 363072, 'steps': 709, 'loss/train': 5.079098701477051} -09/20/2021 16:56:43 - INFO - __main__ - Step 11347: {'lr': 0.0001890666666666667, 'samples': 363104, 'steps': 709, 'loss/train': 4.256768703460693} -09/20/2021 16:56:44 - INFO - __main__ - Step 11348: {'lr': 0.0001890666666666667, 'samples': 363136, 'steps': 709, 'loss/train': 3.0486104488372803} -09/20/2021 16:56:44 - INFO - __main__ - Step 11349: {'lr': 0.0001890666666666667, 'samples': 363168, 'steps': 709, 'loss/train': 4.646679878234863} -09/20/2021 16:56:45 - INFO - __main__ - Step 11350: {'lr': 0.0001890666666666667, 'samples': 363200, 'steps': 709, 'loss/train': 4.20842170715332} -09/20/2021 16:56:46 - INFO - __main__ - Step 11351: {'lr': 0.0001890666666666667, 'samples': 363232, 'steps': 709, 'loss/train': 4.06257963180542} -09/20/2021 16:56:47 - INFO - __main__ - Step 11352: {'lr': 0.0001890666666666667, 'samples': 363264, 'steps': 709, 'loss/train': 4.70460319519043} -09/20/2021 16:56:47 - INFO - __main__ - Step 11353: {'lr': 0.0001890666666666667, 'samples': 363296, 'steps': 709, 'loss/train': 4.538336277008057} -09/20/2021 16:56:48 - INFO - __main__ - Step 11354: {'lr': 0.0001890666666666667, 'samples': 363328, 'steps': 709, 'loss/train': 4.150511264801025} -09/20/2021 16:56:49 - INFO - __main__ - Step 11355: {'lr': 0.0001890666666666667, 'samples': 363360, 'steps': 709, 'loss/train': 4.522943496704102} -09/20/2021 16:56:50 - INFO - __main__ - Step 11356: {'lr': 0.0001890666666666667, 'samples': 363392, 'steps': 709, 'loss/train': 4.761258602142334} -09/20/2021 16:56:50 - INFO - __main__ - Step 11357: {'lr': 0.0001890666666666667, 'samples': 363424, 'steps': 709, 'loss/train': 3.4818108081817627} -09/20/2021 16:56:52 - INFO - __main__ - Step 11358: {'lr': 0.0001890666666666667, 'samples': 363456, 'steps': 709, 'loss/train': 3.819248914718628} -09/20/2021 16:56:53 - INFO - __main__ - Step 11359: {'lr': 0.0001890666666666667, 'samples': 363488, 'steps': 709, 'loss/train': 4.468949794769287} -09/20/2021 16:56:53 - INFO - __main__ - Step 11360: {'lr': 0.0001890666666666667, 'samples': 363520, 'steps': 709, 'loss/train': 6.447366237640381} -09/20/2021 16:56:54 - INFO - __main__ - Step 11361: {'lr': 0.00018933333333333335, 'samples': 363552, 'steps': 710, 'loss/train': 3.506798505783081} -09/20/2021 16:56:55 - INFO - __main__ - Step 11362: {'lr': 0.00018933333333333335, 'samples': 363584, 'steps': 710, 'loss/train': 5.256617069244385} -09/20/2021 16:56:56 - INFO - __main__ - Step 11363: {'lr': 0.00018933333333333335, 'samples': 363616, 'steps': 710, 'loss/train': 4.029258728027344} -09/20/2021 16:56:56 - INFO - __main__ - Step 11364: {'lr': 0.00018933333333333335, 'samples': 363648, 'steps': 710, 'loss/train': 5.157622337341309} -09/20/2021 16:56:57 - INFO - __main__ - Step 11365: {'lr': 0.00018933333333333335, 'samples': 363680, 'steps': 710, 'loss/train': 3.589038372039795} -09/20/2021 16:56:58 - INFO - __main__ - Step 11366: {'lr': 0.00018933333333333335, 'samples': 363712, 'steps': 710, 'loss/train': 4.196320056915283} -09/20/2021 16:56:59 - INFO - __main__ - Step 11367: {'lr': 0.00018933333333333335, 'samples': 363744, 'steps': 710, 'loss/train': 3.6198034286499023} -09/20/2021 16:56:59 - INFO - __main__ - Step 11368: {'lr': 0.00018933333333333335, 'samples': 363776, 'steps': 710, 'loss/train': 2.4029483795166016} -09/20/2021 16:57:00 - INFO - __main__ - Step 11369: {'lr': 0.00018933333333333335, 'samples': 363808, 'steps': 710, 'loss/train': 2.147031784057617} -09/20/2021 16:57:01 - INFO - __main__ - Step 11370: {'lr': 0.00018933333333333335, 'samples': 363840, 'steps': 710, 'loss/train': 1.9885307550430298} -09/20/2021 16:57:02 - INFO - __main__ - Step 11371: {'lr': 0.00018933333333333335, 'samples': 363872, 'steps': 710, 'loss/train': 3.857713460922241} -09/20/2021 16:57:02 - INFO - __main__ - Step 11372: {'lr': 0.00018933333333333335, 'samples': 363904, 'steps': 710, 'loss/train': 3.859879493713379} -09/20/2021 16:57:03 - INFO - __main__ - Step 11373: {'lr': 0.00018933333333333335, 'samples': 363936, 'steps': 710, 'loss/train': 4.6203532218933105} -09/20/2021 16:57:04 - INFO - __main__ - Step 11374: {'lr': 0.00018933333333333335, 'samples': 363968, 'steps': 710, 'loss/train': 5.367814064025879} -09/20/2021 16:57:05 - INFO - __main__ - Step 11375: {'lr': 0.00018933333333333335, 'samples': 364000, 'steps': 710, 'loss/train': 4.756133556365967} -09/20/2021 16:57:05 - INFO - __main__ - Step 11376: {'lr': 0.00018933333333333335, 'samples': 364032, 'steps': 710, 'loss/train': 3.831815242767334} -09/20/2021 16:57:06 - INFO - __main__ - Step 11377: {'lr': 0.0001896, 'samples': 364064, 'steps': 711, 'loss/train': 5.272395610809326} -09/20/2021 16:57:07 - INFO - __main__ - Step 11378: {'lr': 0.0001896, 'samples': 364096, 'steps': 711, 'loss/train': 5.033905982971191} -09/20/2021 16:57:08 - INFO - __main__ - Step 11379: {'lr': 0.0001896, 'samples': 364128, 'steps': 711, 'loss/train': 5.028512954711914} -09/20/2021 16:57:09 - INFO - __main__ - Step 11380: {'lr': 0.0001896, 'samples': 364160, 'steps': 711, 'loss/train': 3.90885066986084} -09/20/2021 16:57:09 - INFO - __main__ - Step 11381: {'lr': 0.0001896, 'samples': 364192, 'steps': 711, 'loss/train': 3.9242429733276367} -09/20/2021 16:57:10 - INFO - __main__ - Step 11382: {'lr': 0.0001896, 'samples': 364224, 'steps': 711, 'loss/train': 4.4532470703125} -09/20/2021 16:57:11 - INFO - __main__ - Step 11383: {'lr': 0.0001896, 'samples': 364256, 'steps': 711, 'loss/train': 4.245319366455078} -09/20/2021 16:57:12 - INFO - __main__ - Step 11384: {'lr': 0.0001896, 'samples': 364288, 'steps': 711, 'loss/train': 4.881449222564697} -09/20/2021 16:57:12 - INFO - __main__ - Step 11385: {'lr': 0.0001896, 'samples': 364320, 'steps': 711, 'loss/train': 4.418461322784424} -09/20/2021 16:57:13 - INFO - __main__ - Step 11386: {'lr': 0.0001896, 'samples': 364352, 'steps': 711, 'loss/train': 4.027853488922119} -09/20/2021 16:57:14 - INFO - __main__ - Step 11387: {'lr': 0.0001896, 'samples': 364384, 'steps': 711, 'loss/train': 4.3585405349731445} -09/20/2021 16:57:15 - INFO - __main__ - Step 11388: {'lr': 0.0001896, 'samples': 364416, 'steps': 711, 'loss/train': 5.787886619567871} -09/20/2021 16:57:15 - INFO - __main__ - Step 11389: {'lr': 0.0001896, 'samples': 364448, 'steps': 711, 'loss/train': 4.708009719848633} -09/20/2021 16:57:17 - INFO - __main__ - Step 11390: {'lr': 0.0001896, 'samples': 364480, 'steps': 711, 'loss/train': 4.807241916656494} -09/20/2021 16:57:17 - INFO - __main__ - Step 11391: {'lr': 0.0001896, 'samples': 364512, 'steps': 711, 'loss/train': 3.97341251373291} -09/20/2021 16:57:18 - INFO - __main__ - Step 11392: {'lr': 0.0001896, 'samples': 364544, 'steps': 711, 'loss/train': 3.755002975463867} -09/20/2021 16:57:19 - INFO - __main__ - Step 11393: {'lr': 0.00018986666666666668, 'samples': 364576, 'steps': 712, 'loss/train': 4.420286178588867} -09/20/2021 16:57:20 - INFO - __main__ - Step 11394: {'lr': 0.00018986666666666668, 'samples': 364608, 'steps': 712, 'loss/train': 4.503334045410156} -09/20/2021 16:57:21 - INFO - __main__ - Step 11395: {'lr': 0.00018986666666666668, 'samples': 364640, 'steps': 712, 'loss/train': 3.6907436847686768} -09/20/2021 16:57:21 - INFO - __main__ - Step 11396: {'lr': 0.00018986666666666668, 'samples': 364672, 'steps': 712, 'loss/train': 3.4020752906799316} -09/20/2021 16:57:22 - INFO - __main__ - Step 11397: {'lr': 0.00018986666666666668, 'samples': 364704, 'steps': 712, 'loss/train': 4.016862869262695} -09/20/2021 16:57:23 - INFO - __main__ - Step 11398: {'lr': 0.00018986666666666668, 'samples': 364736, 'steps': 712, 'loss/train': 4.117268085479736} -09/20/2021 16:57:24 - INFO - __main__ - Step 11399: {'lr': 0.00018986666666666668, 'samples': 364768, 'steps': 712, 'loss/train': 4.191667556762695} -09/20/2021 16:57:24 - INFO - __main__ - Step 11400: {'lr': 0.00018986666666666668, 'samples': 364800, 'steps': 712, 'loss/train': 4.613410949707031} -09/20/2021 16:57:25 - INFO - __main__ - Step 11401: {'lr': 0.00018986666666666668, 'samples': 364832, 'steps': 712, 'loss/train': 3.632192850112915} -09/20/2021 16:57:26 - INFO - __main__ - Step 11402: {'lr': 0.00018986666666666668, 'samples': 364864, 'steps': 712, 'loss/train': 4.924283027648926} -09/20/2021 16:57:27 - INFO - __main__ - Step 11403: {'lr': 0.00018986666666666668, 'samples': 364896, 'steps': 712, 'loss/train': 4.206644535064697} -09/20/2021 16:57:27 - INFO - __main__ - Step 11404: {'lr': 0.00018986666666666668, 'samples': 364928, 'steps': 712, 'loss/train': 4.711085319519043} -09/20/2021 16:57:28 - INFO - __main__ - Step 11405: {'lr': 0.00018986666666666668, 'samples': 364960, 'steps': 712, 'loss/train': 5.414877891540527} -09/20/2021 16:57:29 - INFO - __main__ - Step 11406: {'lr': 0.00018986666666666668, 'samples': 364992, 'steps': 712, 'loss/train': 4.2944560050964355} -09/20/2021 16:57:30 - INFO - __main__ - Step 11407: {'lr': 0.00018986666666666668, 'samples': 365024, 'steps': 712, 'loss/train': 2.6154961585998535} -09/20/2021 16:57:30 - INFO - __main__ - Step 11408: {'lr': 0.00018986666666666668, 'samples': 365056, 'steps': 712, 'loss/train': 4.642685413360596} -09/20/2021 16:57:31 - INFO - __main__ - Step 11409: {'lr': 0.00019013333333333334, 'samples': 365088, 'steps': 713, 'loss/train': 3.868739128112793} -09/20/2021 16:57:32 - INFO - __main__ - Step 11410: {'lr': 0.00019013333333333334, 'samples': 365120, 'steps': 713, 'loss/train': 3.4501867294311523} -09/20/2021 16:57:33 - INFO - __main__ - Step 11411: {'lr': 0.00019013333333333334, 'samples': 365152, 'steps': 713, 'loss/train': 4.521446228027344} -09/20/2021 16:57:33 - INFO - __main__ - Step 11412: {'lr': 0.00019013333333333334, 'samples': 365184, 'steps': 713, 'loss/train': 3.835965871810913} -09/20/2021 16:57:34 - INFO - __main__ - Step 11413: {'lr': 0.00019013333333333334, 'samples': 365216, 'steps': 713, 'loss/train': 4.025625228881836} -09/20/2021 16:57:35 - INFO - __main__ - Step 11414: {'lr': 0.00019013333333333334, 'samples': 365248, 'steps': 713, 'loss/train': 4.013362884521484} -09/20/2021 16:57:36 - INFO - __main__ - Step 11415: {'lr': 0.00019013333333333334, 'samples': 365280, 'steps': 713, 'loss/train': 4.717960357666016} -09/20/2021 16:57:36 - INFO - __main__ - Step 11416: {'lr': 0.00019013333333333334, 'samples': 365312, 'steps': 713, 'loss/train': 4.005649089813232} -09/20/2021 16:57:37 - INFO - __main__ - Step 11417: {'lr': 0.00019013333333333334, 'samples': 365344, 'steps': 713, 'loss/train': 4.132259368896484} -09/20/2021 16:57:38 - INFO - __main__ - Step 11418: {'lr': 0.00019013333333333334, 'samples': 365376, 'steps': 713, 'loss/train': 4.341554164886475} -09/20/2021 16:57:39 - INFO - __main__ - Step 11419: {'lr': 0.00019013333333333334, 'samples': 365408, 'steps': 713, 'loss/train': 5.190452575683594} -09/20/2021 16:57:39 - INFO - __main__ - Step 11420: {'lr': 0.00019013333333333334, 'samples': 365440, 'steps': 713, 'loss/train': 4.584140777587891} -09/20/2021 16:57:41 - INFO - __main__ - Step 11421: {'lr': 0.00019013333333333334, 'samples': 365472, 'steps': 713, 'loss/train': 3.7954766750335693} -09/20/2021 16:57:41 - INFO - __main__ - Step 11422: {'lr': 0.00019013333333333334, 'samples': 365504, 'steps': 713, 'loss/train': 4.518103122711182} -09/20/2021 16:57:42 - INFO - __main__ - Step 11423: {'lr': 0.00019013333333333334, 'samples': 365536, 'steps': 713, 'loss/train': 4.32830810546875} -09/20/2021 16:57:43 - INFO - __main__ - Step 11424: {'lr': 0.00019013333333333334, 'samples': 365568, 'steps': 713, 'loss/train': 4.239782810211182} -09/20/2021 16:57:44 - INFO - __main__ - Step 11425: {'lr': 0.0001904, 'samples': 365600, 'steps': 714, 'loss/train': 4.119216442108154} -09/20/2021 16:57:45 - INFO - __main__ - Step 11426: {'lr': 0.0001904, 'samples': 365632, 'steps': 714, 'loss/train': 4.0674848556518555} -09/20/2021 16:57:45 - INFO - __main__ - Step 11427: {'lr': 0.0001904, 'samples': 365664, 'steps': 714, 'loss/train': 5.2251667976379395} -09/20/2021 16:57:46 - INFO - __main__ - Step 11428: {'lr': 0.0001904, 'samples': 365696, 'steps': 714, 'loss/train': 4.483108043670654} -09/20/2021 16:57:47 - INFO - __main__ - Step 11429: {'lr': 0.0001904, 'samples': 365728, 'steps': 714, 'loss/train': 3.8332459926605225} -09/20/2021 16:57:48 - INFO - __main__ - Step 11430: {'lr': 0.0001904, 'samples': 365760, 'steps': 714, 'loss/train': 4.397947788238525} -09/20/2021 16:57:48 - INFO - __main__ - Step 11431: {'lr': 0.0001904, 'samples': 365792, 'steps': 714, 'loss/train': 5.234524250030518} -09/20/2021 16:57:49 - INFO - __main__ - Step 11432: {'lr': 0.0001904, 'samples': 365824, 'steps': 714, 'loss/train': 4.111537456512451} -09/20/2021 16:57:50 - INFO - __main__ - Step 11433: {'lr': 0.0001904, 'samples': 365856, 'steps': 714, 'loss/train': 4.136196136474609} -09/20/2021 16:57:51 - INFO - __main__ - Step 11434: {'lr': 0.0001904, 'samples': 365888, 'steps': 714, 'loss/train': 3.5573816299438477} -09/20/2021 16:57:51 - INFO - __main__ - Step 11435: {'lr': 0.0001904, 'samples': 365920, 'steps': 714, 'loss/train': 4.529546737670898} -09/20/2021 16:57:52 - INFO - __main__ - Step 11436: {'lr': 0.0001904, 'samples': 365952, 'steps': 714, 'loss/train': 3.8329567909240723} -09/20/2021 16:57:53 - INFO - __main__ - Step 11437: {'lr': 0.0001904, 'samples': 365984, 'steps': 714, 'loss/train': 3.098876476287842} -09/20/2021 16:57:54 - INFO - __main__ - Step 11438: {'lr': 0.0001904, 'samples': 366016, 'steps': 714, 'loss/train': 4.762154579162598} -09/20/2021 16:57:54 - INFO - __main__ - Step 11439: {'lr': 0.0001904, 'samples': 366048, 'steps': 714, 'loss/train': 3.998145818710327} -09/20/2021 16:57:55 - INFO - __main__ - Step 11440: {'lr': 0.0001904, 'samples': 366080, 'steps': 714, 'loss/train': 4.708771705627441} -09/20/2021 16:57:56 - INFO - __main__ - Step 11441: {'lr': 0.00019066666666666668, 'samples': 366112, 'steps': 715, 'loss/train': 2.990645170211792} -09/20/2021 16:57:57 - INFO - __main__ - Step 11442: {'lr': 0.00019066666666666668, 'samples': 366144, 'steps': 715, 'loss/train': 4.176728248596191} -09/20/2021 16:57:57 - INFO - __main__ - Step 11443: {'lr': 0.00019066666666666668, 'samples': 366176, 'steps': 715, 'loss/train': 3.6194019317626953} -09/20/2021 16:57:58 - INFO - __main__ - Step 11444: {'lr': 0.00019066666666666668, 'samples': 366208, 'steps': 715, 'loss/train': 4.2096452713012695} -09/20/2021 16:57:59 - INFO - __main__ - Step 11445: {'lr': 0.00019066666666666668, 'samples': 366240, 'steps': 715, 'loss/train': 4.8414716720581055} -09/20/2021 16:58:00 - INFO - __main__ - Step 11446: {'lr': 0.00019066666666666668, 'samples': 366272, 'steps': 715, 'loss/train': 3.7709567546844482} -09/20/2021 16:58:00 - INFO - __main__ - Step 11447: {'lr': 0.00019066666666666668, 'samples': 366304, 'steps': 715, 'loss/train': 3.9579787254333496} -09/20/2021 16:58:01 - INFO - __main__ - Step 11448: {'lr': 0.00019066666666666668, 'samples': 366336, 'steps': 715, 'loss/train': 3.9143779277801514} -09/20/2021 16:58:02 - INFO - __main__ - Step 11449: {'lr': 0.00019066666666666668, 'samples': 366368, 'steps': 715, 'loss/train': 4.072429180145264} -09/20/2021 16:58:03 - INFO - __main__ - Step 11450: {'lr': 0.00019066666666666668, 'samples': 366400, 'steps': 715, 'loss/train': 3.9620554447174072} -09/20/2021 16:58:04 - INFO - __main__ - Step 11451: {'lr': 0.00019066666666666668, 'samples': 366432, 'steps': 715, 'loss/train': 4.175148010253906} -09/20/2021 16:58:05 - INFO - __main__ - Step 11452: {'lr': 0.00019066666666666668, 'samples': 366464, 'steps': 715, 'loss/train': 3.8677992820739746} -09/20/2021 16:58:06 - INFO - __main__ - Step 11453: {'lr': 0.00019066666666666668, 'samples': 366496, 'steps': 715, 'loss/train': 3.605058193206787} -09/20/2021 16:58:06 - INFO - __main__ - Step 11454: {'lr': 0.00019066666666666668, 'samples': 366528, 'steps': 715, 'loss/train': 3.055131435394287} -09/20/2021 16:58:07 - INFO - __main__ - Step 11455: {'lr': 0.00019066666666666668, 'samples': 366560, 'steps': 715, 'loss/train': 3.511500120162964} -09/20/2021 16:58:08 - INFO - __main__ - Step 11456: {'lr': 0.00019066666666666668, 'samples': 366592, 'steps': 715, 'loss/train': 3.6793322563171387} -09/20/2021 16:58:09 - INFO - __main__ - Step 11457: {'lr': 0.00019093333333333333, 'samples': 366624, 'steps': 716, 'loss/train': 4.827730655670166} -09/20/2021 16:58:09 - INFO - __main__ - Step 11458: {'lr': 0.00019093333333333333, 'samples': 366656, 'steps': 716, 'loss/train': 5.0676188468933105} -09/20/2021 16:58:10 - INFO - __main__ - Step 11459: {'lr': 0.00019093333333333333, 'samples': 366688, 'steps': 716, 'loss/train': 4.910806179046631} -09/20/2021 16:58:11 - INFO - __main__ - Step 11460: {'lr': 0.00019093333333333333, 'samples': 366720, 'steps': 716, 'loss/train': 4.007219314575195} -09/20/2021 16:58:12 - INFO - __main__ - Step 11461: {'lr': 0.00019093333333333333, 'samples': 366752, 'steps': 716, 'loss/train': 2.440037488937378} -09/20/2021 16:58:12 - INFO - __main__ - Step 11462: {'lr': 0.00019093333333333333, 'samples': 366784, 'steps': 716, 'loss/train': 4.232992649078369} -09/20/2021 16:58:13 - INFO - __main__ - Step 11463: {'lr': 0.00019093333333333333, 'samples': 366816, 'steps': 716, 'loss/train': 5.1013617515563965} -09/20/2021 16:58:14 - INFO - __main__ - Step 11464: {'lr': 0.00019093333333333333, 'samples': 366848, 'steps': 716, 'loss/train': 4.061690330505371} -09/20/2021 16:58:15 - INFO - __main__ - Step 11465: {'lr': 0.00019093333333333333, 'samples': 366880, 'steps': 716, 'loss/train': 4.910429000854492} -09/20/2021 16:58:15 - INFO - __main__ - Step 11466: {'lr': 0.00019093333333333333, 'samples': 366912, 'steps': 716, 'loss/train': 4.47970724105835} -09/20/2021 16:58:16 - INFO - __main__ - Step 11467: {'lr': 0.00019093333333333333, 'samples': 366944, 'steps': 716, 'loss/train': 4.174505233764648} -09/20/2021 16:58:17 - INFO - __main__ - Step 11468: {'lr': 0.00019093333333333333, 'samples': 366976, 'steps': 716, 'loss/train': 3.921023368835449} -09/20/2021 16:58:18 - INFO - __main__ - Step 11469: {'lr': 0.00019093333333333333, 'samples': 367008, 'steps': 716, 'loss/train': 3.5560765266418457} -09/20/2021 16:58:18 - INFO - __main__ - Step 11470: {'lr': 0.00019093333333333333, 'samples': 367040, 'steps': 716, 'loss/train': 4.02338981628418} -09/20/2021 16:58:19 - INFO - __main__ - Step 11471: {'lr': 0.00019093333333333333, 'samples': 367072, 'steps': 716, 'loss/train': 4.462831974029541} -09/20/2021 16:58:20 - INFO - __main__ - Step 11472: {'lr': 0.00019093333333333333, 'samples': 367104, 'steps': 716, 'loss/train': 5.065093994140625} -09/20/2021 16:58:21 - INFO - __main__ - Step 11473: {'lr': 0.0001912, 'samples': 367136, 'steps': 717, 'loss/train': 4.0625901222229} -09/20/2021 16:58:22 - INFO - __main__ - Step 11474: {'lr': 0.0001912, 'samples': 367168, 'steps': 717, 'loss/train': 4.625840663909912} -09/20/2021 16:58:22 - INFO - __main__ - Step 11475: {'lr': 0.0001912, 'samples': 367200, 'steps': 717, 'loss/train': 4.47227668762207} -09/20/2021 16:58:23 - INFO - __main__ - Step 11476: {'lr': 0.0001912, 'samples': 367232, 'steps': 717, 'loss/train': 1.9806731939315796} -09/20/2021 16:58:24 - INFO - __main__ - Step 11477: {'lr': 0.0001912, 'samples': 367264, 'steps': 717, 'loss/train': 2.2685277462005615} -09/20/2021 16:58:25 - INFO - __main__ - Step 11478: {'lr': 0.0001912, 'samples': 367296, 'steps': 717, 'loss/train': 1.6681139469146729} -09/20/2021 16:58:25 - INFO - __main__ - Step 11479: {'lr': 0.0001912, 'samples': 367328, 'steps': 717, 'loss/train': 1.4769670963287354} -09/20/2021 16:58:26 - INFO - __main__ - Step 11480: {'lr': 0.0001912, 'samples': 367360, 'steps': 717, 'loss/train': 3.5457701683044434} -09/20/2021 16:58:27 - INFO - __main__ - Step 11481: {'lr': 0.0001912, 'samples': 367392, 'steps': 717, 'loss/train': 4.3803181648254395} -09/20/2021 16:58:28 - INFO - __main__ - Step 11482: {'lr': 0.0001912, 'samples': 367424, 'steps': 717, 'loss/train': 4.356213569641113} -09/20/2021 16:58:29 - INFO - __main__ - Step 11483: {'lr': 0.0001912, 'samples': 367456, 'steps': 717, 'loss/train': 4.263067722320557} -09/20/2021 16:58:30 - INFO - __main__ - Step 11484: {'lr': 0.0001912, 'samples': 367488, 'steps': 717, 'loss/train': 5.172021865844727} -09/20/2021 16:58:30 - INFO - __main__ - Step 11485: {'lr': 0.0001912, 'samples': 367520, 'steps': 717, 'loss/train': 4.625100612640381} -09/20/2021 16:58:31 - INFO - __main__ - Step 11486: {'lr': 0.0001912, 'samples': 367552, 'steps': 717, 'loss/train': 3.69657039642334} -09/20/2021 16:58:32 - INFO - __main__ - Step 11487: {'lr': 0.0001912, 'samples': 367584, 'steps': 717, 'loss/train': 4.743928909301758} -09/20/2021 16:58:33 - INFO - __main__ - Step 11488: {'lr': 0.0001912, 'samples': 367616, 'steps': 717, 'loss/train': 4.7550859451293945} -09/20/2021 16:58:33 - INFO - __main__ - Step 11489: {'lr': 0.0001914666666666667, 'samples': 367648, 'steps': 718, 'loss/train': 5.380167484283447} -09/20/2021 16:58:34 - INFO - __main__ - Step 11490: {'lr': 0.0001914666666666667, 'samples': 367680, 'steps': 718, 'loss/train': 6.29706335067749} -09/20/2021 16:58:35 - INFO - __main__ - Step 11491: {'lr': 0.0001914666666666667, 'samples': 367712, 'steps': 718, 'loss/train': 3.730938673019409} -09/20/2021 16:58:36 - INFO - __main__ - Step 11492: {'lr': 0.0001914666666666667, 'samples': 367744, 'steps': 718, 'loss/train': 4.291188716888428} -09/20/2021 16:58:36 - INFO - __main__ - Step 11493: {'lr': 0.0001914666666666667, 'samples': 367776, 'steps': 718, 'loss/train': 4.388660430908203} -09/20/2021 16:58:37 - INFO - __main__ - Step 11494: {'lr': 0.0001914666666666667, 'samples': 367808, 'steps': 718, 'loss/train': 4.075806140899658} -09/20/2021 16:58:38 - INFO - __main__ - Step 11495: {'lr': 0.0001914666666666667, 'samples': 367840, 'steps': 718, 'loss/train': 4.185011386871338} -09/20/2021 16:58:39 - INFO - __main__ - Step 11496: {'lr': 0.0001914666666666667, 'samples': 367872, 'steps': 718, 'loss/train': 4.654881477355957} -09/20/2021 16:58:39 - INFO - __main__ - Step 11497: {'lr': 0.0001914666666666667, 'samples': 367904, 'steps': 718, 'loss/train': 3.6921935081481934} -09/20/2021 16:58:40 - INFO - __main__ - Step 11498: {'lr': 0.0001914666666666667, 'samples': 367936, 'steps': 718, 'loss/train': 4.338461399078369} -09/20/2021 16:58:41 - INFO - __main__ - Step 11499: {'lr': 0.0001914666666666667, 'samples': 367968, 'steps': 718, 'loss/train': 4.534453868865967} -09/20/2021 16:58:42 - INFO - __main__ - Step 11500: {'lr': 0.0001914666666666667, 'samples': 368000, 'steps': 718, 'loss/train': 2.649858236312866} -09/20/2021 16:58:42 - INFO - __main__ - Step 11501: {'lr': 0.0001914666666666667, 'samples': 368032, 'steps': 718, 'loss/train': 2.9665868282318115} -09/20/2021 16:58:43 - INFO - __main__ - Step 11502: {'lr': 0.0001914666666666667, 'samples': 368064, 'steps': 718, 'loss/train': 4.924558639526367} -09/20/2021 16:58:44 - INFO - __main__ - Step 11503: {'lr': 0.0001914666666666667, 'samples': 368096, 'steps': 718, 'loss/train': 3.8682312965393066} -09/20/2021 16:58:45 - INFO - __main__ - Step 11504: {'lr': 0.0001914666666666667, 'samples': 368128, 'steps': 718, 'loss/train': 6.1389594078063965} -09/20/2021 16:58:46 - INFO - __main__ - Step 11505: {'lr': 0.00019173333333333335, 'samples': 368160, 'steps': 719, 'loss/train': 4.439541339874268} -09/20/2021 16:58:46 - INFO - __main__ - Step 11506: {'lr': 0.00019173333333333335, 'samples': 368192, 'steps': 719, 'loss/train': 3.712735891342163} -09/20/2021 16:58:47 - INFO - __main__ - Step 11507: {'lr': 0.00019173333333333335, 'samples': 368224, 'steps': 719, 'loss/train': 3.945032835006714} -09/20/2021 16:58:48 - INFO - __main__ - Step 11508: {'lr': 0.00019173333333333335, 'samples': 368256, 'steps': 719, 'loss/train': 3.530611515045166} -09/20/2021 16:58:49 - INFO - __main__ - Step 11509: {'lr': 0.00019173333333333335, 'samples': 368288, 'steps': 719, 'loss/train': 4.226783752441406} -09/20/2021 16:58:49 - INFO - __main__ - Step 11510: {'lr': 0.00019173333333333335, 'samples': 368320, 'steps': 719, 'loss/train': 3.80674147605896} -09/20/2021 16:58:50 - INFO - __main__ - Step 11511: {'lr': 0.00019173333333333335, 'samples': 368352, 'steps': 719, 'loss/train': 4.211850166320801} -09/20/2021 16:58:51 - INFO - __main__ - Step 11512: {'lr': 0.00019173333333333335, 'samples': 368384, 'steps': 719, 'loss/train': 5.478085041046143} -09/20/2021 16:58:52 - INFO - __main__ - Step 11513: {'lr': 0.00019173333333333335, 'samples': 368416, 'steps': 719, 'loss/train': 4.281390190124512} -09/20/2021 16:58:52 - INFO - __main__ - Step 11514: {'lr': 0.00019173333333333335, 'samples': 368448, 'steps': 719, 'loss/train': 3.8896944522857666} -09/20/2021 16:58:54 - INFO - __main__ - Step 11515: {'lr': 0.00019173333333333335, 'samples': 368480, 'steps': 719, 'loss/train': 3.629985809326172} -09/20/2021 16:58:54 - INFO - __main__ - Step 11516: {'lr': 0.00019173333333333335, 'samples': 368512, 'steps': 719, 'loss/train': 1.8166279792785645} -09/20/2021 16:58:55 - INFO - __main__ - Step 11517: {'lr': 0.00019173333333333335, 'samples': 368544, 'steps': 719, 'loss/train': 3.893765687942505} -09/20/2021 16:58:56 - INFO - __main__ - Step 11518: {'lr': 0.00019173333333333335, 'samples': 368576, 'steps': 719, 'loss/train': 2.6783230304718018} -09/20/2021 16:58:57 - INFO - __main__ - Step 11519: {'lr': 0.00019173333333333335, 'samples': 368608, 'steps': 719, 'loss/train': 2.674971580505371} -09/20/2021 16:58:57 - INFO - __main__ - Step 11520: {'lr': 0.00019173333333333335, 'samples': 368640, 'steps': 719, 'loss/train': 4.307343006134033} -09/20/2021 16:58:58 - INFO - __main__ - Step 11521: {'lr': 0.000192, 'samples': 368672, 'steps': 720, 'loss/train': 4.921509742736816} -09/20/2021 16:58:59 - INFO - __main__ - Step 11522: {'lr': 0.000192, 'samples': 368704, 'steps': 720, 'loss/train': 4.449673652648926} -09/20/2021 16:59:00 - INFO - __main__ - Step 11523: {'lr': 0.000192, 'samples': 368736, 'steps': 720, 'loss/train': 4.45920467376709} -09/20/2021 16:59:01 - INFO - __main__ - Step 11524: {'lr': 0.000192, 'samples': 368768, 'steps': 720, 'loss/train': 3.4776580333709717} -09/20/2021 16:59:01 - INFO - __main__ - Step 11525: {'lr': 0.000192, 'samples': 368800, 'steps': 720, 'loss/train': 4.535389423370361} -09/20/2021 16:59:02 - INFO - __main__ - Step 11526: {'lr': 0.000192, 'samples': 368832, 'steps': 720, 'loss/train': 3.63179349899292} -09/20/2021 16:59:03 - INFO - __main__ - Step 11527: {'lr': 0.000192, 'samples': 368864, 'steps': 720, 'loss/train': 4.207215785980225} -09/20/2021 16:59:04 - INFO - __main__ - Step 11528: {'lr': 0.000192, 'samples': 368896, 'steps': 720, 'loss/train': 4.265780448913574} -09/20/2021 16:59:04 - INFO - __main__ - Step 11529: {'lr': 0.000192, 'samples': 368928, 'steps': 720, 'loss/train': 6.045478343963623} -09/20/2021 16:59:05 - INFO - __main__ - Step 11530: {'lr': 0.000192, 'samples': 368960, 'steps': 720, 'loss/train': 3.8983311653137207} -09/20/2021 16:59:06 - INFO - __main__ - Step 11531: {'lr': 0.000192, 'samples': 368992, 'steps': 720, 'loss/train': 4.722861289978027} -09/20/2021 16:59:07 - INFO - __main__ - Step 11532: {'lr': 0.000192, 'samples': 369024, 'steps': 720, 'loss/train': 4.673845291137695} -09/20/2021 16:59:07 - INFO - __main__ - Step 11533: {'lr': 0.000192, 'samples': 369056, 'steps': 720, 'loss/train': 4.527168273925781} -09/20/2021 16:59:08 - INFO - __main__ - Step 11534: {'lr': 0.000192, 'samples': 369088, 'steps': 720, 'loss/train': 3.964552402496338} -09/20/2021 16:59:09 - INFO - __main__ - Step 11535: {'lr': 0.000192, 'samples': 369120, 'steps': 720, 'loss/train': 4.002773761749268} -09/20/2021 16:59:10 - INFO - __main__ - Step 11536: {'lr': 0.000192, 'samples': 369152, 'steps': 720, 'loss/train': 4.354621410369873} -09/20/2021 16:59:10 - INFO - __main__ - Step 11537: {'lr': 0.0001922666666666667, 'samples': 369184, 'steps': 721, 'loss/train': 3.3656084537506104} -09/20/2021 16:59:11 - INFO - __main__ - Step 11538: {'lr': 0.0001922666666666667, 'samples': 369216, 'steps': 721, 'loss/train': 3.695998430252075} -09/20/2021 16:59:12 - INFO - __main__ - Step 11539: {'lr': 0.0001922666666666667, 'samples': 369248, 'steps': 721, 'loss/train': 4.496081829071045} -09/20/2021 16:59:13 - INFO - __main__ - Step 11540: {'lr': 0.0001922666666666667, 'samples': 369280, 'steps': 721, 'loss/train': 2.802415370941162} -09/20/2021 16:59:13 - INFO - __main__ - Step 11541: {'lr': 0.0001922666666666667, 'samples': 369312, 'steps': 721, 'loss/train': 3.905702590942383} -09/20/2021 16:59:14 - INFO - __main__ - Step 11542: {'lr': 0.0001922666666666667, 'samples': 369344, 'steps': 721, 'loss/train': 4.67728853225708} -09/20/2021 16:59:15 - INFO - __main__ - Step 11543: {'lr': 0.0001922666666666667, 'samples': 369376, 'steps': 721, 'loss/train': 3.9668312072753906} -09/20/2021 16:59:16 - INFO - __main__ - Step 11544: {'lr': 0.0001922666666666667, 'samples': 369408, 'steps': 721, 'loss/train': 3.6794636249542236} -09/20/2021 16:59:16 - INFO - __main__ - Step 11545: {'lr': 0.0001922666666666667, 'samples': 369440, 'steps': 721, 'loss/train': 4.4867095947265625} -09/20/2021 16:59:18 - INFO - __main__ - Step 11546: {'lr': 0.0001922666666666667, 'samples': 369472, 'steps': 721, 'loss/train': 3.3748085498809814} -09/20/2021 16:59:19 - INFO - __main__ - Step 11547: {'lr': 0.0001922666666666667, 'samples': 369504, 'steps': 721, 'loss/train': 3.979947566986084} -09/20/2021 16:59:19 - INFO - __main__ - Step 11548: {'lr': 0.0001922666666666667, 'samples': 369536, 'steps': 721, 'loss/train': 4.1921281814575195} -09/20/2021 16:59:20 - INFO - __main__ - Step 11549: {'lr': 0.0001922666666666667, 'samples': 369568, 'steps': 721, 'loss/train': 4.415772438049316} -09/20/2021 16:59:21 - INFO - __main__ - Step 11550: {'lr': 0.0001922666666666667, 'samples': 369600, 'steps': 721, 'loss/train': 4.366771221160889} -09/20/2021 16:59:22 - INFO - __main__ - Step 11551: {'lr': 0.0001922666666666667, 'samples': 369632, 'steps': 721, 'loss/train': 3.9557483196258545} -09/20/2021 16:59:22 - INFO - __main__ - Step 11552: {'lr': 0.0001922666666666667, 'samples': 369664, 'steps': 721, 'loss/train': 0.6577157378196716} -09/20/2021 16:59:23 - INFO - __main__ - Step 11553: {'lr': 0.00019253333333333334, 'samples': 369696, 'steps': 722, 'loss/train': 3.3172836303710938} -09/20/2021 16:59:24 - INFO - __main__ - Step 11554: {'lr': 0.00019253333333333334, 'samples': 369728, 'steps': 722, 'loss/train': 5.402655124664307} -09/20/2021 16:59:25 - INFO - __main__ - Step 11555: {'lr': 0.00019253333333333334, 'samples': 369760, 'steps': 722, 'loss/train': 3.3610589504241943} -09/20/2021 16:59:26 - INFO - __main__ - Step 11556: {'lr': 0.00019253333333333334, 'samples': 369792, 'steps': 722, 'loss/train': 4.135231018066406} -09/20/2021 16:59:26 - INFO - __main__ - Step 11557: {'lr': 0.00019253333333333334, 'samples': 369824, 'steps': 722, 'loss/train': 3.9134461879730225} -09/20/2021 16:59:27 - INFO - __main__ - Step 11558: {'lr': 0.00019253333333333334, 'samples': 369856, 'steps': 722, 'loss/train': 3.9666006565093994} -09/20/2021 16:59:28 - INFO - __main__ - Step 11559: {'lr': 0.00019253333333333334, 'samples': 369888, 'steps': 722, 'loss/train': 3.891845464706421} -09/20/2021 16:59:29 - INFO - __main__ - Step 11560: {'lr': 0.00019253333333333334, 'samples': 369920, 'steps': 722, 'loss/train': 1.6340231895446777} -09/20/2021 16:59:29 - INFO - __main__ - Step 11561: {'lr': 0.00019253333333333334, 'samples': 369952, 'steps': 722, 'loss/train': 1.8093341588974} -09/20/2021 16:59:30 - INFO - __main__ - Step 11562: {'lr': 0.00019253333333333334, 'samples': 369984, 'steps': 722, 'loss/train': 1.2153829336166382} -09/20/2021 16:59:31 - INFO - __main__ - Step 11563: {'lr': 0.00019253333333333334, 'samples': 370016, 'steps': 722, 'loss/train': 1.6763412952423096} -09/20/2021 16:59:32 - INFO - __main__ - Step 11564: {'lr': 0.00019253333333333334, 'samples': 370048, 'steps': 722, 'loss/train': 1.756174921989441} -09/20/2021 16:59:32 - INFO - __main__ - Step 11565: {'lr': 0.00019253333333333334, 'samples': 370080, 'steps': 722, 'loss/train': 5.6889119148254395} -09/20/2021 16:59:33 - INFO - __main__ - Step 11566: {'lr': 0.00019253333333333334, 'samples': 370112, 'steps': 722, 'loss/train': 3.8688318729400635} -09/20/2021 16:59:34 - INFO - __main__ - Step 11567: {'lr': 0.00019253333333333334, 'samples': 370144, 'steps': 722, 'loss/train': 3.8760905265808105} -09/20/2021 16:59:35 - INFO - __main__ - Step 11568: {'lr': 0.00019253333333333334, 'samples': 370176, 'steps': 722, 'loss/train': 3.8000051975250244} -09/20/2021 16:59:36 - INFO - __main__ - Step 11569: {'lr': 0.0001928, 'samples': 370208, 'steps': 723, 'loss/train': 5.7274298667907715} -09/20/2021 16:59:36 - INFO - __main__ - Step 11570: {'lr': 0.0001928, 'samples': 370240, 'steps': 723, 'loss/train': 4.23362398147583} -09/20/2021 16:59:37 - INFO - __main__ - Step 11571: {'lr': 0.0001928, 'samples': 370272, 'steps': 723, 'loss/train': 4.130541801452637} -09/20/2021 16:59:38 - INFO - __main__ - Step 11572: {'lr': 0.0001928, 'samples': 370304, 'steps': 723, 'loss/train': 3.7442190647125244} -09/20/2021 16:59:39 - INFO - __main__ - Step 11573: {'lr': 0.0001928, 'samples': 370336, 'steps': 723, 'loss/train': 4.40748405456543} -09/20/2021 16:59:39 - INFO - __main__ - Step 11574: {'lr': 0.0001928, 'samples': 370368, 'steps': 723, 'loss/train': 3.7384583950042725} -09/20/2021 16:59:40 - INFO - __main__ - Step 11575: {'lr': 0.0001928, 'samples': 370400, 'steps': 723, 'loss/train': 4.617203235626221} -09/20/2021 16:59:41 - INFO - __main__ - Step 11576: {'lr': 0.0001928, 'samples': 370432, 'steps': 723, 'loss/train': 3.5671072006225586} -09/20/2021 16:59:42 - INFO - __main__ - Step 11577: {'lr': 0.0001928, 'samples': 370464, 'steps': 723, 'loss/train': 3.9210822582244873} -09/20/2021 16:59:43 - INFO - __main__ - Step 11578: {'lr': 0.0001928, 'samples': 370496, 'steps': 723, 'loss/train': 4.137799263000488} -09/20/2021 16:59:44 - INFO - __main__ - Step 11579: {'lr': 0.0001928, 'samples': 370528, 'steps': 723, 'loss/train': 4.390698432922363} -09/20/2021 16:59:44 - INFO - __main__ - Step 11580: {'lr': 0.0001928, 'samples': 370560, 'steps': 723, 'loss/train': 4.4094953536987305} -09/20/2021 16:59:45 - INFO - __main__ - Step 11581: {'lr': 0.0001928, 'samples': 370592, 'steps': 723, 'loss/train': 4.351115703582764} -09/20/2021 16:59:46 - INFO - __main__ - Step 11582: {'lr': 0.0001928, 'samples': 370624, 'steps': 723, 'loss/train': 4.428478717803955} -09/20/2021 16:59:47 - INFO - __main__ - Step 11583: {'lr': 0.0001928, 'samples': 370656, 'steps': 723, 'loss/train': 2.9880857467651367} -09/20/2021 16:59:47 - INFO - __main__ - Step 11584: {'lr': 0.0001928, 'samples': 370688, 'steps': 723, 'loss/train': 3.3523783683776855} -09/20/2021 16:59:48 - INFO - __main__ - Step 11585: {'lr': 0.00019306666666666668, 'samples': 370720, 'steps': 724, 'loss/train': 3.5161564350128174} -09/20/2021 16:59:49 - INFO - __main__ - Step 11586: {'lr': 0.00019306666666666668, 'samples': 370752, 'steps': 724, 'loss/train': 4.774931907653809} -09/20/2021 16:59:50 - INFO - __main__ - Step 11587: {'lr': 0.00019306666666666668, 'samples': 370784, 'steps': 724, 'loss/train': 3.9034972190856934} -09/20/2021 16:59:50 - INFO - __main__ - Step 11588: {'lr': 0.00019306666666666668, 'samples': 370816, 'steps': 724, 'loss/train': 3.975566864013672} -09/20/2021 16:59:51 - INFO - __main__ - Step 11589: {'lr': 0.00019306666666666668, 'samples': 370848, 'steps': 724, 'loss/train': 3.8549246788024902} -09/20/2021 16:59:52 - INFO - __main__ - Step 11590: {'lr': 0.00019306666666666668, 'samples': 370880, 'steps': 724, 'loss/train': 3.426060199737549} -09/20/2021 16:59:53 - INFO - __main__ - Step 11591: {'lr': 0.00019306666666666668, 'samples': 370912, 'steps': 724, 'loss/train': 4.217355728149414} -09/20/2021 16:59:53 - INFO - __main__ - Step 11592: {'lr': 0.00019306666666666668, 'samples': 370944, 'steps': 724, 'loss/train': 4.511091709136963} -09/20/2021 16:59:54 - INFO - __main__ - Step 11593: {'lr': 0.00019306666666666668, 'samples': 370976, 'steps': 724, 'loss/train': 3.418491840362549} -09/20/2021 16:59:55 - INFO - __main__ - Step 11594: {'lr': 0.00019306666666666668, 'samples': 371008, 'steps': 724, 'loss/train': 4.191498756408691} -09/20/2021 16:59:56 - INFO - __main__ - Step 11595: {'lr': 0.00019306666666666668, 'samples': 371040, 'steps': 724, 'loss/train': 3.908031940460205} -09/20/2021 16:59:56 - INFO - __main__ - Step 11596: {'lr': 0.00019306666666666668, 'samples': 371072, 'steps': 724, 'loss/train': 3.934798002243042} -09/20/2021 16:59:57 - INFO - __main__ - Step 11597: {'lr': 0.00019306666666666668, 'samples': 371104, 'steps': 724, 'loss/train': 3.998523235321045} -09/20/2021 16:59:58 - INFO - __main__ - Step 11598: {'lr': 0.00019306666666666668, 'samples': 371136, 'steps': 724, 'loss/train': 4.056915760040283} -09/20/2021 16:59:59 - INFO - __main__ - Step 11599: {'lr': 0.00019306666666666668, 'samples': 371168, 'steps': 724, 'loss/train': 3.68571400642395} -09/20/2021 16:59:59 - INFO - __main__ - Step 11600: {'lr': 0.00019306666666666668, 'samples': 371200, 'steps': 724, 'loss/train': 4.161243915557861} -09/20/2021 17:00:00 - INFO - __main__ - Step 11601: {'lr': 0.00019333333333333333, 'samples': 371232, 'steps': 725, 'loss/train': 3.756256103515625} -09/20/2021 17:00:01 - INFO - __main__ - Step 11602: {'lr': 0.00019333333333333333, 'samples': 371264, 'steps': 725, 'loss/train': 4.706082344055176} -09/20/2021 17:00:02 - INFO - __main__ - Step 11603: {'lr': 0.00019333333333333333, 'samples': 371296, 'steps': 725, 'loss/train': 4.768709659576416} -09/20/2021 17:00:03 - INFO - __main__ - Step 11604: {'lr': 0.00019333333333333333, 'samples': 371328, 'steps': 725, 'loss/train': 4.946216583251953} -09/20/2021 17:00:03 - INFO - __main__ - Step 11605: {'lr': 0.00019333333333333333, 'samples': 371360, 'steps': 725, 'loss/train': 4.825407028198242} -09/20/2021 17:00:04 - INFO - __main__ - Step 11606: {'lr': 0.00019333333333333333, 'samples': 371392, 'steps': 725, 'loss/train': 4.133427619934082} -09/20/2021 17:00:05 - INFO - __main__ - Step 11607: {'lr': 0.00019333333333333333, 'samples': 371424, 'steps': 725, 'loss/train': 4.937673091888428} -09/20/2021 17:00:06 - INFO - __main__ - Step 11608: {'lr': 0.00019333333333333333, 'samples': 371456, 'steps': 725, 'loss/train': 4.818731307983398} -09/20/2021 17:00:06 - INFO - __main__ - Step 11609: {'lr': 0.00019333333333333333, 'samples': 371488, 'steps': 725, 'loss/train': 4.575329303741455} -09/20/2021 17:00:08 - INFO - __main__ - Step 11610: {'lr': 0.00019333333333333333, 'samples': 371520, 'steps': 725, 'loss/train': 3.9524288177490234} -09/20/2021 17:00:09 - INFO - __main__ - Step 11611: {'lr': 0.00019333333333333333, 'samples': 371552, 'steps': 725, 'loss/train': 4.338316917419434} -09/20/2021 17:00:10 - INFO - __main__ - Step 11612: {'lr': 0.00019333333333333333, 'samples': 371584, 'steps': 725, 'loss/train': 5.506185054779053} -09/20/2021 17:00:11 - INFO - __main__ - Step 11613: {'lr': 0.00019333333333333333, 'samples': 371616, 'steps': 725, 'loss/train': 4.25693416595459} -09/20/2021 17:00:11 - INFO - __main__ - Step 11614: {'lr': 0.00019333333333333333, 'samples': 371648, 'steps': 725, 'loss/train': 3.693342447280884} -09/20/2021 17:00:12 - INFO - __main__ - Step 11615: {'lr': 0.00019333333333333333, 'samples': 371680, 'steps': 725, 'loss/train': 4.207719326019287} -09/20/2021 17:00:13 - INFO - __main__ - Step 11616: {'lr': 0.00019333333333333333, 'samples': 371712, 'steps': 725, 'loss/train': 5.2491559982299805} -09/20/2021 17:00:14 - INFO - __main__ - Step 11617: {'lr': 0.00019360000000000002, 'samples': 371744, 'steps': 726, 'loss/train': 4.057404518127441} -09/20/2021 17:00:15 - INFO - __main__ - Step 11618: {'lr': 0.00019360000000000002, 'samples': 371776, 'steps': 726, 'loss/train': 4.3739333152771} -09/20/2021 17:00:15 - INFO - __main__ - Step 11619: {'lr': 0.00019360000000000002, 'samples': 371808, 'steps': 726, 'loss/train': 4.399534225463867} -09/20/2021 17:00:16 - INFO - __main__ - Step 11620: {'lr': 0.00019360000000000002, 'samples': 371840, 'steps': 726, 'loss/train': 4.095560550689697} -09/20/2021 17:00:17 - INFO - __main__ - Step 11621: {'lr': 0.00019360000000000002, 'samples': 371872, 'steps': 726, 'loss/train': 4.083966255187988} -09/20/2021 17:00:18 - INFO - __main__ - Step 11622: {'lr': 0.00019360000000000002, 'samples': 371904, 'steps': 726, 'loss/train': 2.234757661819458} -09/20/2021 17:00:18 - INFO - __main__ - Step 11623: {'lr': 0.00019360000000000002, 'samples': 371936, 'steps': 726, 'loss/train': 2.104790449142456} -09/20/2021 17:00:19 - INFO - __main__ - Step 11624: {'lr': 0.00019360000000000002, 'samples': 371968, 'steps': 726, 'loss/train': 1.8833708763122559} -09/20/2021 17:00:20 - INFO - __main__ - Step 11625: {'lr': 0.00019360000000000002, 'samples': 372000, 'steps': 726, 'loss/train': 1.5726672410964966} -09/20/2021 17:00:21 - INFO - __main__ - Step 11626: {'lr': 0.00019360000000000002, 'samples': 372032, 'steps': 726, 'loss/train': 1.5812722444534302} -09/20/2021 17:00:21 - INFO - __main__ - Step 11627: {'lr': 0.00019360000000000002, 'samples': 372064, 'steps': 726, 'loss/train': 2.0464236736297607} -09/20/2021 17:00:22 - INFO - __main__ - Step 11628: {'lr': 0.00019360000000000002, 'samples': 372096, 'steps': 726, 'loss/train': 5.616390705108643} -09/20/2021 17:00:23 - INFO - __main__ - Step 11629: {'lr': 0.00019360000000000002, 'samples': 372128, 'steps': 726, 'loss/train': 5.568938732147217} -09/20/2021 17:00:24 - INFO - __main__ - Step 11630: {'lr': 0.00019360000000000002, 'samples': 372160, 'steps': 726, 'loss/train': 4.909403324127197} -09/20/2021 17:00:24 - INFO - __main__ - Step 11631: {'lr': 0.00019360000000000002, 'samples': 372192, 'steps': 726, 'loss/train': 4.767960071563721} -09/20/2021 17:00:25 - INFO - __main__ - Step 11632: {'lr': 0.00019360000000000002, 'samples': 372224, 'steps': 726, 'loss/train': 4.150895118713379} -09/20/2021 17:00:26 - INFO - __main__ - Step 11633: {'lr': 0.0001938666666666667, 'samples': 372256, 'steps': 727, 'loss/train': 5.315032958984375} -09/20/2021 17:00:27 - INFO - __main__ - Step 11634: {'lr': 0.0001938666666666667, 'samples': 372288, 'steps': 727, 'loss/train': 5.075873374938965} -09/20/2021 17:00:27 - INFO - __main__ - Step 11635: {'lr': 0.0001938666666666667, 'samples': 372320, 'steps': 727, 'loss/train': 4.148561000823975} -09/20/2021 17:00:28 - INFO - __main__ - Step 11636: {'lr': 0.0001938666666666667, 'samples': 372352, 'steps': 727, 'loss/train': 4.556490898132324} -09/20/2021 17:00:29 - INFO - __main__ - Step 11637: {'lr': 0.0001938666666666667, 'samples': 372384, 'steps': 727, 'loss/train': 4.472095012664795} -09/20/2021 17:00:30 - INFO - __main__ - Step 11638: {'lr': 0.0001938666666666667, 'samples': 372416, 'steps': 727, 'loss/train': 4.530478000640869} -09/20/2021 17:00:30 - INFO - __main__ - Step 11639: {'lr': 0.0001938666666666667, 'samples': 372448, 'steps': 727, 'loss/train': 4.470946788787842} -09/20/2021 17:00:32 - INFO - __main__ - Step 11640: {'lr': 0.0001938666666666667, 'samples': 372480, 'steps': 727, 'loss/train': 4.016918182373047} -09/20/2021 17:00:32 - INFO - __main__ - Step 11641: {'lr': 0.0001938666666666667, 'samples': 372512, 'steps': 727, 'loss/train': 4.143375396728516} -09/20/2021 17:00:33 - INFO - __main__ - Step 11642: {'lr': 0.0001938666666666667, 'samples': 372544, 'steps': 727, 'loss/train': 4.212098598480225} -09/20/2021 17:00:34 - INFO - __main__ - Step 11643: {'lr': 0.0001938666666666667, 'samples': 372576, 'steps': 727, 'loss/train': 3.5449025630950928} -09/20/2021 17:00:35 - INFO - __main__ - Step 11644: {'lr': 0.0001938666666666667, 'samples': 372608, 'steps': 727, 'loss/train': 4.101510524749756} -09/20/2021 17:00:35 - INFO - __main__ - Step 11645: {'lr': 0.0001938666666666667, 'samples': 372640, 'steps': 727, 'loss/train': 3.7158493995666504} -09/20/2021 17:00:36 - INFO - __main__ - Step 11646: {'lr': 0.0001938666666666667, 'samples': 372672, 'steps': 727, 'loss/train': 4.5659098625183105} -09/20/2021 17:00:37 - INFO - __main__ - Step 11647: {'lr': 0.0001938666666666667, 'samples': 372704, 'steps': 727, 'loss/train': 3.6636669635772705} -09/20/2021 17:00:38 - INFO - __main__ - Step 11648: {'lr': 0.0001938666666666667, 'samples': 372736, 'steps': 727, 'loss/train': 4.65106201171875} -09/20/2021 17:00:39 - INFO - __main__ - Step 11649: {'lr': 0.00019413333333333335, 'samples': 372768, 'steps': 728, 'loss/train': 4.516819000244141} -09/20/2021 17:00:39 - INFO - __main__ - Step 11650: {'lr': 0.00019413333333333335, 'samples': 372800, 'steps': 728, 'loss/train': 3.8061599731445312} -09/20/2021 17:00:40 - INFO - __main__ - Step 11651: {'lr': 0.00019413333333333335, 'samples': 372832, 'steps': 728, 'loss/train': 4.4543561935424805} -09/20/2021 17:00:41 - INFO - __main__ - Step 11652: {'lr': 0.00019413333333333335, 'samples': 372864, 'steps': 728, 'loss/train': 3.990290641784668} -09/20/2021 17:00:42 - INFO - __main__ - Step 11653: {'lr': 0.00019413333333333335, 'samples': 372896, 'steps': 728, 'loss/train': 1.618713140487671} -09/20/2021 17:00:42 - INFO - __main__ - Step 11654: {'lr': 0.00019413333333333335, 'samples': 372928, 'steps': 728, 'loss/train': 4.309081554412842} -09/20/2021 17:00:43 - INFO - __main__ - Step 11655: {'lr': 0.00019413333333333335, 'samples': 372960, 'steps': 728, 'loss/train': 4.803846836090088} -09/20/2021 17:00:44 - INFO - __main__ - Step 11656: {'lr': 0.00019413333333333335, 'samples': 372992, 'steps': 728, 'loss/train': 3.725611448287964} -09/20/2021 17:00:45 - INFO - __main__ - Step 11657: {'lr': 0.00019413333333333335, 'samples': 373024, 'steps': 728, 'loss/train': 5.100845813751221} -09/20/2021 17:00:45 - INFO - __main__ - Step 11658: {'lr': 0.00019413333333333335, 'samples': 373056, 'steps': 728, 'loss/train': 4.088827610015869} -09/20/2021 17:00:46 - INFO - __main__ - Step 11659: {'lr': 0.00019413333333333335, 'samples': 373088, 'steps': 728, 'loss/train': 4.673882484436035} -09/20/2021 17:00:47 - INFO - __main__ - Step 11660: {'lr': 0.00019413333333333335, 'samples': 373120, 'steps': 728, 'loss/train': 4.610615253448486} -09/20/2021 17:00:48 - INFO - __main__ - Step 11661: {'lr': 0.00019413333333333335, 'samples': 373152, 'steps': 728, 'loss/train': 4.063808917999268} -09/20/2021 17:00:48 - INFO - __main__ - Step 11662: {'lr': 0.00019413333333333335, 'samples': 373184, 'steps': 728, 'loss/train': 3.5869948863983154} -09/20/2021 17:00:49 - INFO - __main__ - Step 11663: {'lr': 0.00019413333333333335, 'samples': 373216, 'steps': 728, 'loss/train': 2.1554787158966064} -09/20/2021 17:00:50 - INFO - __main__ - Step 11664: {'lr': 0.00019413333333333335, 'samples': 373248, 'steps': 728, 'loss/train': 3.903325080871582} -09/20/2021 17:00:51 - INFO - __main__ - Step 11665: {'lr': 0.0001944, 'samples': 373280, 'steps': 729, 'loss/train': 4.0537567138671875} -09/20/2021 17:00:51 - INFO - __main__ - Step 11666: {'lr': 0.0001944, 'samples': 373312, 'steps': 729, 'loss/train': 3.1634085178375244} -09/20/2021 17:00:52 - INFO - __main__ - Step 11667: {'lr': 0.0001944, 'samples': 373344, 'steps': 729, 'loss/train': 3.3970024585723877} -09/20/2021 17:00:53 - INFO - __main__ - Step 11668: {'lr': 0.0001944, 'samples': 373376, 'steps': 729, 'loss/train': 4.202138900756836} -09/20/2021 17:00:54 - INFO - __main__ - Step 11669: {'lr': 0.0001944, 'samples': 373408, 'steps': 729, 'loss/train': 3.3836262226104736} -09/20/2021 17:00:54 - INFO - __main__ - Step 11670: {'lr': 0.0001944, 'samples': 373440, 'steps': 729, 'loss/train': 3.9261772632598877} -09/20/2021 17:00:56 - INFO - __main__ - Step 11671: {'lr': 0.0001944, 'samples': 373472, 'steps': 729, 'loss/train': 3.7698066234588623} -09/20/2021 17:00:57 - INFO - __main__ - Step 11672: {'lr': 0.0001944, 'samples': 373504, 'steps': 729, 'loss/train': 5.404001712799072} -09/20/2021 17:00:57 - INFO - __main__ - Step 11673: {'lr': 0.0001944, 'samples': 373536, 'steps': 729, 'loss/train': 3.6836345195770264} -09/20/2021 17:00:58 - INFO - __main__ - Step 11674: {'lr': 0.0001944, 'samples': 373568, 'steps': 729, 'loss/train': 4.112332820892334} -09/20/2021 17:00:59 - INFO - __main__ - Step 11675: {'lr': 0.0001944, 'samples': 373600, 'steps': 729, 'loss/train': 4.438096523284912} -09/20/2021 17:01:00 - INFO - __main__ - Step 11676: {'lr': 0.0001944, 'samples': 373632, 'steps': 729, 'loss/train': 4.410788536071777} -09/20/2021 17:01:00 - INFO - __main__ - Step 11677: {'lr': 0.0001944, 'samples': 373664, 'steps': 729, 'loss/train': 4.796372413635254} -09/20/2021 17:01:01 - INFO - __main__ - Step 11678: {'lr': 0.0001944, 'samples': 373696, 'steps': 729, 'loss/train': 5.089422225952148} -09/20/2021 17:01:02 - INFO - __main__ - Step 11679: {'lr': 0.0001944, 'samples': 373728, 'steps': 729, 'loss/train': 4.910828590393066} -09/20/2021 17:01:03 - INFO - __main__ - Step 11680: {'lr': 0.0001944, 'samples': 373760, 'steps': 729, 'loss/train': 6.190402984619141} -09/20/2021 17:01:04 - INFO - __main__ - Step 11681: {'lr': 0.0001946666666666667, 'samples': 373792, 'steps': 730, 'loss/train': 4.648487567901611} -09/20/2021 17:01:04 - INFO - __main__ - Step 11682: {'lr': 0.0001946666666666667, 'samples': 373824, 'steps': 730, 'loss/train': 4.807085990905762} -09/20/2021 17:01:05 - INFO - __main__ - Step 11683: {'lr': 0.0001946666666666667, 'samples': 373856, 'steps': 730, 'loss/train': 4.7142510414123535} -09/20/2021 17:01:06 - INFO - __main__ - Step 11684: {'lr': 0.0001946666666666667, 'samples': 373888, 'steps': 730, 'loss/train': 4.497241973876953} -09/20/2021 17:01:07 - INFO - __main__ - Step 11685: {'lr': 0.0001946666666666667, 'samples': 373920, 'steps': 730, 'loss/train': 4.027170181274414} -09/20/2021 17:01:07 - INFO - __main__ - Step 11686: {'lr': 0.0001946666666666667, 'samples': 373952, 'steps': 730, 'loss/train': 4.200966835021973} -09/20/2021 17:01:08 - INFO - __main__ - Step 11687: {'lr': 0.0001946666666666667, 'samples': 373984, 'steps': 730, 'loss/train': 4.350976943969727} -09/20/2021 17:01:09 - INFO - __main__ - Step 11688: {'lr': 0.0001946666666666667, 'samples': 374016, 'steps': 730, 'loss/train': 4.730406284332275} -09/20/2021 17:01:10 - INFO - __main__ - Step 11689: {'lr': 0.0001946666666666667, 'samples': 374048, 'steps': 730, 'loss/train': 3.7654848098754883} -09/20/2021 17:01:10 - INFO - __main__ - Step 11690: {'lr': 0.0001946666666666667, 'samples': 374080, 'steps': 730, 'loss/train': 4.794814109802246} -09/20/2021 17:01:11 - INFO - __main__ - Step 11691: {'lr': 0.0001946666666666667, 'samples': 374112, 'steps': 730, 'loss/train': 4.329626083374023} -09/20/2021 17:01:12 - INFO - __main__ - Step 11692: {'lr': 0.0001946666666666667, 'samples': 374144, 'steps': 730, 'loss/train': 4.372623920440674} -09/20/2021 17:01:13 - INFO - __main__ - Step 11693: {'lr': 0.0001946666666666667, 'samples': 374176, 'steps': 730, 'loss/train': 4.783247947692871} -09/20/2021 17:01:13 - INFO - __main__ - Step 11694: {'lr': 0.0001946666666666667, 'samples': 374208, 'steps': 730, 'loss/train': 4.171695232391357} -09/20/2021 17:01:14 - INFO - __main__ - Step 11695: {'lr': 0.0001946666666666667, 'samples': 374240, 'steps': 730, 'loss/train': 4.599578857421875} -09/20/2021 17:01:15 - INFO - __main__ - Step 11696: {'lr': 0.0001946666666666667, 'samples': 374272, 'steps': 730, 'loss/train': 3.773597240447998} -09/20/2021 17:01:16 - INFO - __main__ - Step 11697: {'lr': 0.00019493333333333335, 'samples': 374304, 'steps': 731, 'loss/train': 4.311148166656494} -09/20/2021 17:01:16 - INFO - __main__ - Step 11698: {'lr': 0.00019493333333333335, 'samples': 374336, 'steps': 731, 'loss/train': 1.4184638261795044} -09/20/2021 17:01:17 - INFO - __main__ - Step 11699: {'lr': 0.00019493333333333335, 'samples': 374368, 'steps': 731, 'loss/train': 3.659001111984253} -09/20/2021 17:01:18 - INFO - __main__ - Step 11700: {'lr': 0.00019493333333333335, 'samples': 374400, 'steps': 731, 'loss/train': 4.547111988067627} -09/20/2021 17:01:19 - INFO - __main__ - Step 11701: {'lr': 0.00019493333333333335, 'samples': 374432, 'steps': 731, 'loss/train': 4.821411609649658} -09/20/2021 17:01:19 - INFO - __main__ - Step 11702: {'lr': 0.00019493333333333335, 'samples': 374464, 'steps': 731, 'loss/train': 5.0941996574401855} -09/20/2021 17:01:20 - INFO - __main__ - Step 11703: {'lr': 0.00019493333333333335, 'samples': 374496, 'steps': 731, 'loss/train': 4.852538108825684} -09/20/2021 17:01:21 - INFO - __main__ - Step 11704: {'lr': 0.00019493333333333335, 'samples': 374528, 'steps': 731, 'loss/train': 4.436147689819336} -09/20/2021 17:01:22 - INFO - __main__ - Step 11705: {'lr': 0.00019493333333333335, 'samples': 374560, 'steps': 731, 'loss/train': 5.140277862548828} -09/20/2021 17:01:23 - INFO - __main__ - Step 11706: {'lr': 0.00019493333333333335, 'samples': 374592, 'steps': 731, 'loss/train': 4.552582740783691} -09/20/2021 17:01:24 - INFO - __main__ - Step 11707: {'lr': 0.00019493333333333335, 'samples': 374624, 'steps': 731, 'loss/train': 4.749457359313965} -09/20/2021 17:01:24 - INFO - __main__ - Step 11708: {'lr': 0.00019493333333333335, 'samples': 374656, 'steps': 731, 'loss/train': 3.709418535232544} -09/20/2021 17:01:25 - INFO - __main__ - Step 11709: {'lr': 0.00019493333333333335, 'samples': 374688, 'steps': 731, 'loss/train': 4.831096649169922} -09/20/2021 17:01:26 - INFO - __main__ - Step 11710: {'lr': 0.00019493333333333335, 'samples': 374720, 'steps': 731, 'loss/train': 4.773156642913818} -09/20/2021 17:01:27 - INFO - __main__ - Step 11711: {'lr': 0.00019493333333333335, 'samples': 374752, 'steps': 731, 'loss/train': 3.8256897926330566} -09/20/2021 17:01:27 - INFO - __main__ - Step 11712: {'lr': 0.00019493333333333335, 'samples': 374784, 'steps': 731, 'loss/train': 4.33562707901001} -09/20/2021 17:01:28 - INFO - __main__ - Step 11713: {'lr': 0.0001952, 'samples': 374816, 'steps': 732, 'loss/train': 4.030192852020264} -09/20/2021 17:01:29 - INFO - __main__ - Step 11714: {'lr': 0.0001952, 'samples': 374848, 'steps': 732, 'loss/train': 4.20522403717041} -09/20/2021 17:01:30 - INFO - __main__ - Step 11715: {'lr': 0.0001952, 'samples': 374880, 'steps': 732, 'loss/train': 3.3330438137054443} -09/20/2021 17:01:31 - INFO - __main__ - Step 11716: {'lr': 0.0001952, 'samples': 374912, 'steps': 732, 'loss/train': 3.730198621749878} -09/20/2021 17:01:31 - INFO - __main__ - Step 11717: {'lr': 0.0001952, 'samples': 374944, 'steps': 732, 'loss/train': 3.8407063484191895} -09/20/2021 17:01:32 - INFO - __main__ - Step 11718: {'lr': 0.0001952, 'samples': 374976, 'steps': 732, 'loss/train': 4.396849632263184} -09/20/2021 17:01:33 - INFO - __main__ - Step 11719: {'lr': 0.0001952, 'samples': 375008, 'steps': 732, 'loss/train': 3.7463643550872803} -09/20/2021 17:01:34 - INFO - __main__ - Step 11720: {'lr': 0.0001952, 'samples': 375040, 'steps': 732, 'loss/train': 4.303954124450684} -09/20/2021 17:01:34 - INFO - __main__ - Step 11721: {'lr': 0.0001952, 'samples': 375072, 'steps': 732, 'loss/train': 3.677579879760742} -09/20/2021 17:01:35 - INFO - __main__ - Step 11722: {'lr': 0.0001952, 'samples': 375104, 'steps': 732, 'loss/train': 3.7885875701904297} -09/20/2021 17:01:36 - INFO - __main__ - Step 11723: {'lr': 0.0001952, 'samples': 375136, 'steps': 732, 'loss/train': 4.9531660079956055} -09/20/2021 17:01:37 - INFO - __main__ - Step 11724: {'lr': 0.0001952, 'samples': 375168, 'steps': 732, 'loss/train': 3.9768617153167725} -09/20/2021 17:01:37 - INFO - __main__ - Step 11725: {'lr': 0.0001952, 'samples': 375200, 'steps': 732, 'loss/train': 4.722806453704834} -09/20/2021 17:01:38 - INFO - __main__ - Step 11726: {'lr': 0.0001952, 'samples': 375232, 'steps': 732, 'loss/train': 3.8975255489349365} -09/20/2021 17:01:39 - INFO - __main__ - Step 11727: {'lr': 0.0001952, 'samples': 375264, 'steps': 732, 'loss/train': 5.794040203094482} -09/20/2021 17:01:40 - INFO - __main__ - Step 11728: {'lr': 0.0001952, 'samples': 375296, 'steps': 732, 'loss/train': 4.470818042755127} -09/20/2021 17:01:40 - INFO - __main__ - Step 11729: {'lr': 0.00019546666666666668, 'samples': 375328, 'steps': 733, 'loss/train': 3.5539419651031494} -09/20/2021 17:01:41 - INFO - __main__ - Step 11730: {'lr': 0.00019546666666666668, 'samples': 375360, 'steps': 733, 'loss/train': 5.0248589515686035} -09/20/2021 17:01:42 - INFO - __main__ - Step 11731: {'lr': 0.00019546666666666668, 'samples': 375392, 'steps': 733, 'loss/train': 3.1908209323883057} -09/20/2021 17:01:43 - INFO - __main__ - Step 11732: {'lr': 0.00019546666666666668, 'samples': 375424, 'steps': 733, 'loss/train': 4.9890618324279785} -09/20/2021 17:01:43 - INFO - __main__ - Step 11733: {'lr': 0.00019546666666666668, 'samples': 375456, 'steps': 733, 'loss/train': 4.253530025482178} -09/20/2021 17:01:45 - INFO - __main__ - Step 11734: {'lr': 0.00019546666666666668, 'samples': 375488, 'steps': 733, 'loss/train': 3.149568796157837} -09/20/2021 17:01:46 - INFO - __main__ - Step 11735: {'lr': 0.00019546666666666668, 'samples': 375520, 'steps': 733, 'loss/train': 4.265167713165283} -09/20/2021 17:01:46 - INFO - __main__ - Step 11736: {'lr': 0.00019546666666666668, 'samples': 375552, 'steps': 733, 'loss/train': 4.684190273284912} -09/20/2021 17:01:47 - INFO - __main__ - Step 11737: {'lr': 0.00019546666666666668, 'samples': 375584, 'steps': 733, 'loss/train': 4.706450939178467} -09/20/2021 17:01:48 - INFO - __main__ - Step 11738: {'lr': 0.00019546666666666668, 'samples': 375616, 'steps': 733, 'loss/train': 3.8432457447052} -09/20/2021 17:01:49 - INFO - __main__ - Step 11739: {'lr': 0.00019546666666666668, 'samples': 375648, 'steps': 733, 'loss/train': 4.598721981048584} -09/20/2021 17:01:49 - INFO - __main__ - Step 11740: {'lr': 0.00019546666666666668, 'samples': 375680, 'steps': 733, 'loss/train': 5.826290130615234} -09/20/2021 17:01:50 - INFO - __main__ - Step 11741: {'lr': 0.00019546666666666668, 'samples': 375712, 'steps': 733, 'loss/train': 4.844797134399414} -09/20/2021 17:01:51 - INFO - __main__ - Step 11742: {'lr': 0.00019546666666666668, 'samples': 375744, 'steps': 733, 'loss/train': 4.636508941650391} -09/20/2021 17:01:52 - INFO - __main__ - Step 11743: {'lr': 0.00019546666666666668, 'samples': 375776, 'steps': 733, 'loss/train': 4.93566370010376} -09/20/2021 17:01:52 - INFO - __main__ - Step 11744: {'lr': 0.00019546666666666668, 'samples': 375808, 'steps': 733, 'loss/train': 5.245081424713135} -09/20/2021 17:01:53 - INFO - __main__ - Step 11745: {'lr': 0.00019573333333333334, 'samples': 375840, 'steps': 734, 'loss/train': 3.41845440864563} -09/20/2021 17:01:54 - INFO - __main__ - Step 11746: {'lr': 0.00019573333333333334, 'samples': 375872, 'steps': 734, 'loss/train': 4.580541610717773} -09/20/2021 17:01:55 - INFO - __main__ - Step 11747: {'lr': 0.00019573333333333334, 'samples': 375904, 'steps': 734, 'loss/train': 3.5195393562316895} -09/20/2021 17:01:55 - INFO - __main__ - Step 11748: {'lr': 0.00019573333333333334, 'samples': 375936, 'steps': 734, 'loss/train': 4.638061046600342} -09/20/2021 17:01:56 - INFO - __main__ - Step 11749: {'lr': 0.00019573333333333334, 'samples': 375968, 'steps': 734, 'loss/train': 3.6606428623199463} -09/20/2021 17:01:57 - INFO - __main__ - Step 11750: {'lr': 0.00019573333333333334, 'samples': 376000, 'steps': 734, 'loss/train': 4.072280406951904} -09/20/2021 17:01:58 - INFO - __main__ - Step 11751: {'lr': 0.00019573333333333334, 'samples': 376032, 'steps': 734, 'loss/train': 4.0281476974487305} -09/20/2021 17:01:58 - INFO - __main__ - Step 11752: {'lr': 0.00019573333333333334, 'samples': 376064, 'steps': 734, 'loss/train': 4.242978096008301} -09/20/2021 17:01:59 - INFO - __main__ - Step 11753: {'lr': 0.00019573333333333334, 'samples': 376096, 'steps': 734, 'loss/train': 3.882052183151245} -09/20/2021 17:02:00 - INFO - __main__ - Step 11754: {'lr': 0.00019573333333333334, 'samples': 376128, 'steps': 734, 'loss/train': 4.318511486053467} -09/20/2021 17:02:01 - INFO - __main__ - Step 11755: {'lr': 0.00019573333333333334, 'samples': 376160, 'steps': 734, 'loss/train': 4.069665908813477} -09/20/2021 17:02:01 - INFO - __main__ - Step 11756: {'lr': 0.00019573333333333334, 'samples': 376192, 'steps': 734, 'loss/train': 3.612659454345703} -09/20/2021 17:02:02 - INFO - __main__ - Step 11757: {'lr': 0.00019573333333333334, 'samples': 376224, 'steps': 734, 'loss/train': 3.6692850589752197} -09/20/2021 17:02:03 - INFO - __main__ - Step 11758: {'lr': 0.00019573333333333334, 'samples': 376256, 'steps': 734, 'loss/train': 4.283987522125244} -09/20/2021 17:02:04 - INFO - __main__ - Step 11759: {'lr': 0.00019573333333333334, 'samples': 376288, 'steps': 734, 'loss/train': 4.0267014503479} -09/20/2021 17:02:04 - INFO - __main__ - Step 11760: {'lr': 0.00019573333333333334, 'samples': 376320, 'steps': 734, 'loss/train': 4.529381275177002} -09/20/2021 17:02:05 - INFO - __main__ - Step 11761: {'lr': 0.000196, 'samples': 376352, 'steps': 735, 'loss/train': 4.0372633934021} -09/20/2021 17:02:06 - INFO - __main__ - Step 11762: {'lr': 0.000196, 'samples': 376384, 'steps': 735, 'loss/train': 4.004928112030029} -09/20/2021 17:02:07 - INFO - __main__ - Step 11763: {'lr': 0.000196, 'samples': 376416, 'steps': 735, 'loss/train': 4.1445465087890625} -09/20/2021 17:02:08 - INFO - __main__ - Step 11764: {'lr': 0.000196, 'samples': 376448, 'steps': 735, 'loss/train': 4.489441871643066} -09/20/2021 17:02:09 - INFO - __main__ - Step 11765: {'lr': 0.000196, 'samples': 376480, 'steps': 735, 'loss/train': 3.5651233196258545} -09/20/2021 17:02:10 - INFO - __main__ - Step 11766: {'lr': 0.000196, 'samples': 376512, 'steps': 735, 'loss/train': 4.086383819580078} -09/20/2021 17:02:11 - INFO - __main__ - Step 11767: {'lr': 0.000196, 'samples': 376544, 'steps': 735, 'loss/train': 4.5371856689453125} -09/20/2021 17:02:12 - INFO - __main__ - Step 11768: {'lr': 0.000196, 'samples': 376576, 'steps': 735, 'loss/train': 3.942786455154419} -09/20/2021 17:02:12 - INFO - __main__ - Step 11769: {'lr': 0.000196, 'samples': 376608, 'steps': 735, 'loss/train': 3.8236353397369385} -09/20/2021 17:02:13 - INFO - __main__ - Step 11770: {'lr': 0.000196, 'samples': 376640, 'steps': 735, 'loss/train': 3.7678143978118896} -09/20/2021 17:02:14 - INFO - __main__ - Step 11771: {'lr': 0.000196, 'samples': 376672, 'steps': 735, 'loss/train': 4.775472164154053} -09/20/2021 17:02:15 - INFO - __main__ - Step 11772: {'lr': 0.000196, 'samples': 376704, 'steps': 735, 'loss/train': 4.08729887008667} -09/20/2021 17:02:15 - INFO - __main__ - Step 11773: {'lr': 0.000196, 'samples': 376736, 'steps': 735, 'loss/train': 3.9493918418884277} -09/20/2021 17:02:16 - INFO - __main__ - Step 11774: {'lr': 0.000196, 'samples': 376768, 'steps': 735, 'loss/train': 4.25882625579834} -09/20/2021 17:02:17 - INFO - __main__ - Step 11775: {'lr': 0.000196, 'samples': 376800, 'steps': 735, 'loss/train': 4.245980262756348} -09/20/2021 17:02:18 - INFO - __main__ - Step 11776: {'lr': 0.000196, 'samples': 376832, 'steps': 735, 'loss/train': 5.220357418060303} -09/20/2021 17:02:18 - INFO - __main__ - Step 11777: {'lr': 0.00019626666666666668, 'samples': 376864, 'steps': 736, 'loss/train': 3.941560745239258} -09/20/2021 17:02:19 - INFO - __main__ - Step 11778: {'lr': 0.00019626666666666668, 'samples': 376896, 'steps': 736, 'loss/train': 4.740715503692627} -09/20/2021 17:02:20 - INFO - __main__ - Step 11779: {'lr': 0.00019626666666666668, 'samples': 376928, 'steps': 736, 'loss/train': 3.7795169353485107} -09/20/2021 17:02:21 - INFO - __main__ - Step 11780: {'lr': 0.00019626666666666668, 'samples': 376960, 'steps': 736, 'loss/train': 2.8823792934417725} -09/20/2021 17:02:21 - INFO - __main__ - Step 11781: {'lr': 0.00019626666666666668, 'samples': 376992, 'steps': 736, 'loss/train': 3.9867875576019287} -09/20/2021 17:02:22 - INFO - __main__ - Step 11782: {'lr': 0.00019626666666666668, 'samples': 377024, 'steps': 736, 'loss/train': 4.150247573852539} -09/20/2021 17:02:23 - INFO - __main__ - Step 11783: {'lr': 0.00019626666666666668, 'samples': 377056, 'steps': 736, 'loss/train': 3.409292221069336} -09/20/2021 17:02:24 - INFO - __main__ - Step 11784: {'lr': 0.00019626666666666668, 'samples': 377088, 'steps': 736, 'loss/train': 3.6874938011169434} -09/20/2021 17:02:24 - INFO - __main__ - Step 11785: {'lr': 0.00019626666666666668, 'samples': 377120, 'steps': 736, 'loss/train': 3.960829496383667} -09/20/2021 17:02:25 - INFO - __main__ - Step 11786: {'lr': 0.00019626666666666668, 'samples': 377152, 'steps': 736, 'loss/train': 3.921562671661377} -09/20/2021 17:02:26 - INFO - __main__ - Step 11787: {'lr': 0.00019626666666666668, 'samples': 377184, 'steps': 736, 'loss/train': 4.05981969833374} -09/20/2021 17:02:27 - INFO - __main__ - Step 11788: {'lr': 0.00019626666666666668, 'samples': 377216, 'steps': 736, 'loss/train': 4.031872749328613} -09/20/2021 17:02:27 - INFO - __main__ - Step 11789: {'lr': 0.00019626666666666668, 'samples': 377248, 'steps': 736, 'loss/train': 3.908841133117676} -09/20/2021 17:02:28 - INFO - __main__ - Step 11790: {'lr': 0.00019626666666666668, 'samples': 377280, 'steps': 736, 'loss/train': 3.9103567600250244} -09/20/2021 17:02:29 - INFO - __main__ - Step 11791: {'lr': 0.00019626666666666668, 'samples': 377312, 'steps': 736, 'loss/train': 3.8771984577178955} -09/20/2021 17:02:30 - INFO - __main__ - Step 11792: {'lr': 0.00019626666666666668, 'samples': 377344, 'steps': 736, 'loss/train': 3.8596534729003906} -09/20/2021 17:02:31 - INFO - __main__ - Step 11793: {'lr': 0.00019653333333333336, 'samples': 377376, 'steps': 737, 'loss/train': 2.819859743118286} -09/20/2021 17:02:31 - INFO - __main__ - Step 11794: {'lr': 0.00019653333333333336, 'samples': 377408, 'steps': 737, 'loss/train': 2.8426451683044434} -09/20/2021 17:02:32 - INFO - __main__ - Step 11795: {'lr': 0.00019653333333333336, 'samples': 377440, 'steps': 737, 'loss/train': 4.302460193634033} -09/20/2021 17:02:33 - INFO - __main__ - Step 11796: {'lr': 0.00019653333333333336, 'samples': 377472, 'steps': 737, 'loss/train': 4.4379377365112305} -09/20/2021 17:02:34 - INFO - __main__ - Step 11797: {'lr': 0.00019653333333333336, 'samples': 377504, 'steps': 737, 'loss/train': 4.047879695892334} -09/20/2021 17:02:34 - INFO - __main__ - Step 11798: {'lr': 0.00019653333333333336, 'samples': 377536, 'steps': 737, 'loss/train': 4.465521812438965} -09/20/2021 17:02:35 - INFO - __main__ - Step 11799: {'lr': 0.00019653333333333336, 'samples': 377568, 'steps': 737, 'loss/train': 1.5613511800765991} -09/20/2021 17:02:36 - INFO - __main__ - Step 11800: {'lr': 0.00019653333333333336, 'samples': 377600, 'steps': 737, 'loss/train': 3.9738261699676514} -09/20/2021 17:02:37 - INFO - __main__ - Step 11801: {'lr': 0.00019653333333333336, 'samples': 377632, 'steps': 737, 'loss/train': 4.2836222648620605} -09/20/2021 17:02:37 - INFO - __main__ - Step 11802: {'lr': 0.00019653333333333336, 'samples': 377664, 'steps': 737, 'loss/train': 3.989962339401245} -09/20/2021 17:02:38 - INFO - __main__ - Step 11803: {'lr': 0.00019653333333333336, 'samples': 377696, 'steps': 737, 'loss/train': 4.912397861480713} -09/20/2021 17:02:39 - INFO - __main__ - Step 11804: {'lr': 0.00019653333333333336, 'samples': 377728, 'steps': 737, 'loss/train': 4.558909893035889} -09/20/2021 17:02:40 - INFO - __main__ - Step 11805: {'lr': 0.00019653333333333336, 'samples': 377760, 'steps': 737, 'loss/train': 4.820745944976807} -09/20/2021 17:02:41 - INFO - __main__ - Step 11806: {'lr': 0.00019653333333333336, 'samples': 377792, 'steps': 737, 'loss/train': 4.365828037261963} -09/20/2021 17:02:42 - INFO - __main__ - Step 11807: {'lr': 0.00019653333333333336, 'samples': 377824, 'steps': 737, 'loss/train': 3.525636911392212} -09/20/2021 17:02:42 - INFO - __main__ - Step 11808: {'lr': 0.00019653333333333336, 'samples': 377856, 'steps': 737, 'loss/train': 3.8802807331085205} -09/20/2021 17:02:43 - INFO - __main__ - Step 11809: {'lr': 0.0001968, 'samples': 377888, 'steps': 738, 'loss/train': 4.302486896514893} -09/20/2021 17:02:44 - INFO - __main__ - Step 11810: {'lr': 0.0001968, 'samples': 377920, 'steps': 738, 'loss/train': 5.095248699188232} -09/20/2021 17:02:45 - INFO - __main__ - Step 11811: {'lr': 0.0001968, 'samples': 377952, 'steps': 738, 'loss/train': 4.530704498291016} -09/20/2021 17:02:46 - INFO - __main__ - Step 11812: {'lr': 0.0001968, 'samples': 377984, 'steps': 738, 'loss/train': 3.6608428955078125} -09/20/2021 17:02:46 - INFO - __main__ - Step 11813: {'lr': 0.0001968, 'samples': 378016, 'steps': 738, 'loss/train': 4.474209308624268} -09/20/2021 17:02:47 - INFO - __main__ - Step 11814: {'lr': 0.0001968, 'samples': 378048, 'steps': 738, 'loss/train': 3.548940658569336} -09/20/2021 17:02:48 - INFO - __main__ - Step 11815: {'lr': 0.0001968, 'samples': 378080, 'steps': 738, 'loss/train': 3.6247689723968506} -09/20/2021 17:02:49 - INFO - __main__ - Step 11816: {'lr': 0.0001968, 'samples': 378112, 'steps': 738, 'loss/train': 3.9500741958618164} -09/20/2021 17:02:49 - INFO - __main__ - Step 11817: {'lr': 0.0001968, 'samples': 378144, 'steps': 738, 'loss/train': 3.856729030609131} -09/20/2021 17:02:50 - INFO - __main__ - Step 11818: {'lr': 0.0001968, 'samples': 378176, 'steps': 738, 'loss/train': 3.6835129261016846} -09/20/2021 17:02:51 - INFO - __main__ - Step 11819: {'lr': 0.0001968, 'samples': 378208, 'steps': 738, 'loss/train': 4.377021312713623} -09/20/2021 17:02:52 - INFO - __main__ - Step 11820: {'lr': 0.0001968, 'samples': 378240, 'steps': 738, 'loss/train': 3.7778494358062744} -09/20/2021 17:02:52 - INFO - __main__ - Step 11821: {'lr': 0.0001968, 'samples': 378272, 'steps': 738, 'loss/train': 4.6799116134643555} -09/20/2021 17:02:53 - INFO - __main__ - Step 11822: {'lr': 0.0001968, 'samples': 378304, 'steps': 738, 'loss/train': 1.9589061737060547} -09/20/2021 17:02:54 - INFO - __main__ - Step 11823: {'lr': 0.0001968, 'samples': 378336, 'steps': 738, 'loss/train': 2.10194993019104} -09/20/2021 17:02:55 - INFO - __main__ - Step 11824: {'lr': 0.0001968, 'samples': 378368, 'steps': 738, 'loss/train': 1.557639241218567} -09/20/2021 17:02:55 - INFO - __main__ - Step 11825: {'lr': 0.00019706666666666667, 'samples': 378400, 'steps': 739, 'loss/train': 4.486191749572754} -09/20/2021 17:02:56 - INFO - __main__ - Step 11826: {'lr': 0.00019706666666666667, 'samples': 378432, 'steps': 739, 'loss/train': 4.268476486206055} -09/20/2021 17:02:57 - INFO - __main__ - Step 11827: {'lr': 0.00019706666666666667, 'samples': 378464, 'steps': 739, 'loss/train': 4.22487211227417} -09/20/2021 17:02:58 - INFO - __main__ - Step 11828: {'lr': 0.00019706666666666667, 'samples': 378496, 'steps': 739, 'loss/train': 5.392628192901611} -09/20/2021 17:02:58 - INFO - __main__ - Step 11829: {'lr': 0.00019706666666666667, 'samples': 378528, 'steps': 739, 'loss/train': 3.365154981613159} -09/20/2021 17:02:59 - INFO - __main__ - Step 11830: {'lr': 0.00019706666666666667, 'samples': 378560, 'steps': 739, 'loss/train': 3.9949705600738525} -09/20/2021 17:03:00 - INFO - __main__ - Step 11831: {'lr': 0.00019706666666666667, 'samples': 378592, 'steps': 739, 'loss/train': 4.5972137451171875} -09/20/2021 17:03:01 - INFO - __main__ - Step 11832: {'lr': 0.00019706666666666667, 'samples': 378624, 'steps': 739, 'loss/train': 4.150126934051514} -09/20/2021 17:03:01 - INFO - __main__ - Step 11833: {'lr': 0.00019706666666666667, 'samples': 378656, 'steps': 739, 'loss/train': 0.8361316323280334} -09/20/2021 17:03:02 - INFO - __main__ - Step 11834: {'lr': 0.00019706666666666667, 'samples': 378688, 'steps': 739, 'loss/train': 4.460747718811035} -09/20/2021 17:03:03 - INFO - __main__ - Step 11835: {'lr': 0.00019706666666666667, 'samples': 378720, 'steps': 739, 'loss/train': 3.235687255859375} -09/20/2021 17:03:05 - INFO - __main__ - Step 11836: {'lr': 0.00019706666666666667, 'samples': 378752, 'steps': 739, 'loss/train': 3.9481849670410156} -09/20/2021 17:03:05 - INFO - __main__ - Step 11837: {'lr': 0.00019706666666666667, 'samples': 378784, 'steps': 739, 'loss/train': 4.079824447631836} -09/20/2021 17:03:06 - INFO - __main__ - Step 11838: {'lr': 0.00019706666666666667, 'samples': 378816, 'steps': 739, 'loss/train': 2.8021068572998047} -09/20/2021 17:03:07 - INFO - __main__ - Step 11839: {'lr': 0.00019706666666666667, 'samples': 378848, 'steps': 739, 'loss/train': 2.674231767654419} -09/20/2021 17:03:08 - INFO - __main__ - Step 11840: {'lr': 0.00019706666666666667, 'samples': 378880, 'steps': 739, 'loss/train': 2.482109546661377} -09/20/2021 17:03:08 - INFO - __main__ - Step 11841: {'lr': 0.00019733333333333335, 'samples': 378912, 'steps': 740, 'loss/train': 1.723211646080017} -09/20/2021 17:03:09 - INFO - __main__ - Step 11842: {'lr': 0.00019733333333333335, 'samples': 378944, 'steps': 740, 'loss/train': 2.4874274730682373} -09/20/2021 17:03:10 - INFO - __main__ - Step 11843: {'lr': 0.00019733333333333335, 'samples': 378976, 'steps': 740, 'loss/train': 1.0436928272247314} -09/20/2021 17:03:11 - INFO - __main__ - Step 11844: {'lr': 0.00019733333333333335, 'samples': 379008, 'steps': 740, 'loss/train': 2.591494560241699} -09/20/2021 17:03:11 - INFO - __main__ - Step 11845: {'lr': 0.00019733333333333335, 'samples': 379040, 'steps': 740, 'loss/train': 4.847860813140869} -09/20/2021 17:03:12 - INFO - __main__ - Step 11846: {'lr': 0.00019733333333333335, 'samples': 379072, 'steps': 740, 'loss/train': 5.011690616607666} -09/20/2021 17:03:13 - INFO - __main__ - Step 11847: {'lr': 0.00019733333333333335, 'samples': 379104, 'steps': 740, 'loss/train': 3.3491389751434326} -09/20/2021 17:03:14 - INFO - __main__ - Step 11848: {'lr': 0.00019733333333333335, 'samples': 379136, 'steps': 740, 'loss/train': 5.249492645263672} -09/20/2021 17:03:14 - INFO - __main__ - Step 11849: {'lr': 0.00019733333333333335, 'samples': 379168, 'steps': 740, 'loss/train': 5.749432563781738} -09/20/2021 17:03:15 - INFO - __main__ - Step 11850: {'lr': 0.00019733333333333335, 'samples': 379200, 'steps': 740, 'loss/train': 4.3545403480529785} -09/20/2021 17:03:16 - INFO - __main__ - Step 11851: {'lr': 0.00019733333333333335, 'samples': 379232, 'steps': 740, 'loss/train': 3.191882610321045} -09/20/2021 17:03:17 - INFO - __main__ - Step 11852: {'lr': 0.00019733333333333335, 'samples': 379264, 'steps': 740, 'loss/train': 4.225701808929443} -09/20/2021 17:03:17 - INFO - __main__ - Step 11853: {'lr': 0.00019733333333333335, 'samples': 379296, 'steps': 740, 'loss/train': 4.337653636932373} -09/20/2021 17:03:18 - INFO - __main__ - Step 11854: {'lr': 0.00019733333333333335, 'samples': 379328, 'steps': 740, 'loss/train': 4.092485427856445} -09/20/2021 17:03:19 - INFO - __main__ - Step 11855: {'lr': 0.00019733333333333335, 'samples': 379360, 'steps': 740, 'loss/train': 4.5521931648254395} -09/20/2021 17:03:20 - INFO - __main__ - Step 11856: {'lr': 0.00019733333333333335, 'samples': 379392, 'steps': 740, 'loss/train': 5.222597599029541} -09/20/2021 17:03:21 - INFO - __main__ - Step 11857: {'lr': 0.0001976, 'samples': 379424, 'steps': 741, 'loss/train': 4.627943992614746} -09/20/2021 17:03:21 - INFO - __main__ - Step 11858: {'lr': 0.0001976, 'samples': 379456, 'steps': 741, 'loss/train': 2.8977484703063965} -09/20/2021 17:03:22 - INFO - __main__ - Step 11859: {'lr': 0.0001976, 'samples': 379488, 'steps': 741, 'loss/train': 3.997919797897339} -09/20/2021 17:03:23 - INFO - __main__ - Step 11860: {'lr': 0.0001976, 'samples': 379520, 'steps': 741, 'loss/train': 1.5554769039154053} -09/20/2021 17:03:24 - INFO - __main__ - Step 11861: {'lr': 0.0001976, 'samples': 379552, 'steps': 741, 'loss/train': 2.003678321838379} -09/20/2021 17:03:24 - INFO - __main__ - Step 11862: {'lr': 0.0001976, 'samples': 379584, 'steps': 741, 'loss/train': 1.8320118188858032} -09/20/2021 17:03:25 - INFO - __main__ - Step 11863: {'lr': 0.0001976, 'samples': 379616, 'steps': 741, 'loss/train': 4.353635787963867} -09/20/2021 17:03:26 - INFO - __main__ - Step 11864: {'lr': 0.0001976, 'samples': 379648, 'steps': 741, 'loss/train': 3.8564367294311523} -09/20/2021 17:03:27 - INFO - __main__ - Step 11865: {'lr': 0.0001976, 'samples': 379680, 'steps': 741, 'loss/train': 4.323762893676758} -09/20/2021 17:03:28 - INFO - __main__ - Step 11866: {'lr': 0.0001976, 'samples': 379712, 'steps': 741, 'loss/train': 4.445949077606201} -09/20/2021 17:03:29 - INFO - __main__ - Step 11867: {'lr': 0.0001976, 'samples': 379744, 'steps': 741, 'loss/train': 4.5774006843566895} -09/20/2021 17:03:29 - INFO - __main__ - Step 11868: {'lr': 0.0001976, 'samples': 379776, 'steps': 741, 'loss/train': 4.928679466247559} -09/20/2021 17:03:30 - INFO - __main__ - Step 11869: {'lr': 0.0001976, 'samples': 379808, 'steps': 741, 'loss/train': 4.166357040405273} -09/20/2021 17:03:31 - INFO - __main__ - Step 11870: {'lr': 0.0001976, 'samples': 379840, 'steps': 741, 'loss/train': 4.706254482269287} -09/20/2021 17:03:32 - INFO - __main__ - Step 11871: {'lr': 0.0001976, 'samples': 379872, 'steps': 741, 'loss/train': 3.8281867504119873} -09/20/2021 17:03:32 - INFO - __main__ - Step 11872: {'lr': 0.0001976, 'samples': 379904, 'steps': 741, 'loss/train': 4.048415184020996} -09/20/2021 17:03:33 - INFO - __main__ - Step 11873: {'lr': 0.00019786666666666666, 'samples': 379936, 'steps': 742, 'loss/train': 5.5098490715026855} -09/20/2021 17:03:34 - INFO - __main__ - Step 11874: {'lr': 0.00019786666666666666, 'samples': 379968, 'steps': 742, 'loss/train': 3.953788995742798} -09/20/2021 17:03:35 - INFO - __main__ - Step 11875: {'lr': 0.00019786666666666666, 'samples': 380000, 'steps': 742, 'loss/train': 4.192965030670166} -09/20/2021 17:03:36 - INFO - __main__ - Step 11876: {'lr': 0.00019786666666666666, 'samples': 380032, 'steps': 742, 'loss/train': 4.0119099617004395} -09/20/2021 17:03:36 - INFO - __main__ - Step 11877: {'lr': 0.00019786666666666666, 'samples': 380064, 'steps': 742, 'loss/train': 4.6484270095825195} -09/20/2021 17:03:37 - INFO - __main__ - Step 11878: {'lr': 0.00019786666666666666, 'samples': 380096, 'steps': 742, 'loss/train': 1.8581477403640747} -09/20/2021 17:03:38 - INFO - __main__ - Step 11879: {'lr': 0.00019786666666666666, 'samples': 380128, 'steps': 742, 'loss/train': 5.109684467315674} -09/20/2021 17:03:39 - INFO - __main__ - Step 11880: {'lr': 0.00019786666666666666, 'samples': 380160, 'steps': 742, 'loss/train': 3.895092010498047} -09/20/2021 17:03:39 - INFO - __main__ - Step 11881: {'lr': 0.00019786666666666666, 'samples': 380192, 'steps': 742, 'loss/train': 4.577934741973877} -09/20/2021 17:03:40 - INFO - __main__ - Step 11882: {'lr': 0.00019786666666666666, 'samples': 380224, 'steps': 742, 'loss/train': 3.898754596710205} -09/20/2021 17:03:41 - INFO - __main__ - Step 11883: {'lr': 0.00019786666666666666, 'samples': 380256, 'steps': 742, 'loss/train': 4.461440563201904} -09/20/2021 17:03:42 - INFO - __main__ - Step 11884: {'lr': 0.00019786666666666666, 'samples': 380288, 'steps': 742, 'loss/train': 4.406505107879639} -09/20/2021 17:03:42 - INFO - __main__ - Step 11885: {'lr': 0.00019786666666666666, 'samples': 380320, 'steps': 742, 'loss/train': 3.3831193447113037} -09/20/2021 17:03:43 - INFO - __main__ - Step 11886: {'lr': 0.00019786666666666666, 'samples': 380352, 'steps': 742, 'loss/train': 3.9448840618133545} -09/20/2021 17:03:44 - INFO - __main__ - Step 11887: {'lr': 0.00019786666666666666, 'samples': 380384, 'steps': 742, 'loss/train': 2.2740962505340576} -09/20/2021 17:03:45 - INFO - __main__ - Step 11888: {'lr': 0.00019786666666666666, 'samples': 380416, 'steps': 742, 'loss/train': 4.810256481170654} -09/20/2021 17:03:46 - INFO - __main__ - Step 11889: {'lr': 0.00019813333333333334, 'samples': 380448, 'steps': 743, 'loss/train': 4.929937362670898} -09/20/2021 17:03:46 - INFO - __main__ - Step 11890: {'lr': 0.00019813333333333334, 'samples': 380480, 'steps': 743, 'loss/train': 4.320367336273193} -09/20/2021 17:03:47 - INFO - __main__ - Step 11891: {'lr': 0.00019813333333333334, 'samples': 380512, 'steps': 743, 'loss/train': 4.484714031219482} -09/20/2021 17:03:48 - INFO - __main__ - Step 11892: {'lr': 0.00019813333333333334, 'samples': 380544, 'steps': 743, 'loss/train': 4.8792901039123535} -09/20/2021 17:03:49 - INFO - __main__ - Step 11893: {'lr': 0.00019813333333333334, 'samples': 380576, 'steps': 743, 'loss/train': 3.9861762523651123} -09/20/2021 17:03:49 - INFO - __main__ - Step 11894: {'lr': 0.00019813333333333334, 'samples': 380608, 'steps': 743, 'loss/train': 4.613754749298096} -09/20/2021 17:03:50 - INFO - __main__ - Step 11895: {'lr': 0.00019813333333333334, 'samples': 380640, 'steps': 743, 'loss/train': 4.815604209899902} -09/20/2021 17:03:51 - INFO - __main__ - Step 11896: {'lr': 0.00019813333333333334, 'samples': 380672, 'steps': 743, 'loss/train': 4.895282745361328} -09/20/2021 17:03:52 - INFO - __main__ - Step 11897: {'lr': 0.00019813333333333334, 'samples': 380704, 'steps': 743, 'loss/train': 5.364243030548096} -09/20/2021 17:03:52 - INFO - __main__ - Step 11898: {'lr': 0.00019813333333333334, 'samples': 380736, 'steps': 743, 'loss/train': 5.985115051269531} -09/20/2021 17:03:54 - INFO - __main__ - Step 11899: {'lr': 0.00019813333333333334, 'samples': 380768, 'steps': 743, 'loss/train': 4.60617733001709} -09/20/2021 17:03:54 - INFO - __main__ - Step 11900: {'lr': 0.00019813333333333334, 'samples': 380800, 'steps': 743, 'loss/train': 3.61511492729187} -09/20/2021 17:03:55 - INFO - __main__ - Step 11901: {'lr': 0.00019813333333333334, 'samples': 380832, 'steps': 743, 'loss/train': 3.6948983669281006} -09/20/2021 17:03:56 - INFO - __main__ - Step 11902: {'lr': 0.00019813333333333334, 'samples': 380864, 'steps': 743, 'loss/train': 4.71351957321167} -09/20/2021 17:03:57 - INFO - __main__ - Step 11903: {'lr': 0.00019813333333333334, 'samples': 380896, 'steps': 743, 'loss/train': 5.2181501388549805} -09/20/2021 17:03:57 - INFO - __main__ - Step 11904: {'lr': 0.00019813333333333334, 'samples': 380928, 'steps': 743, 'loss/train': 3.682382583618164} -09/20/2021 17:03:58 - INFO - __main__ - Step 11905: {'lr': 0.0001984, 'samples': 380960, 'steps': 744, 'loss/train': 3.717707395553589} -09/20/2021 17:03:59 - INFO - __main__ - Step 11906: {'lr': 0.0001984, 'samples': 380992, 'steps': 744, 'loss/train': 3.9694488048553467} -09/20/2021 17:04:00 - INFO - __main__ - Step 11907: {'lr': 0.0001984, 'samples': 381024, 'steps': 744, 'loss/train': 3.7228291034698486} -09/20/2021 17:04:00 - INFO - __main__ - Step 11908: {'lr': 0.0001984, 'samples': 381056, 'steps': 744, 'loss/train': 3.607461452484131} -09/20/2021 17:04:01 - INFO - __main__ - Step 11909: {'lr': 0.0001984, 'samples': 381088, 'steps': 744, 'loss/train': 4.049388885498047} -09/20/2021 17:04:02 - INFO - __main__ - Step 11910: {'lr': 0.0001984, 'samples': 381120, 'steps': 744, 'loss/train': 3.3194098472595215} -09/20/2021 17:04:03 - INFO - __main__ - Step 11911: {'lr': 0.0001984, 'samples': 381152, 'steps': 744, 'loss/train': 3.3029541969299316} -09/20/2021 17:04:03 - INFO - __main__ - Step 11912: {'lr': 0.0001984, 'samples': 381184, 'steps': 744, 'loss/train': 3.1786932945251465} -09/20/2021 17:04:04 - INFO - __main__ - Step 11913: {'lr': 0.0001984, 'samples': 381216, 'steps': 744, 'loss/train': 3.750298261642456} -09/20/2021 17:04:05 - INFO - __main__ - Step 11914: {'lr': 0.0001984, 'samples': 381248, 'steps': 744, 'loss/train': 4.589051246643066} -09/20/2021 17:04:06 - INFO - __main__ - Step 11915: {'lr': 0.0001984, 'samples': 381280, 'steps': 744, 'loss/train': 4.476637363433838} -09/20/2021 17:04:06 - INFO - __main__ - Step 11916: {'lr': 0.0001984, 'samples': 381312, 'steps': 744, 'loss/train': 5.605377197265625} -09/20/2021 17:04:07 - INFO - __main__ - Step 11917: {'lr': 0.0001984, 'samples': 381344, 'steps': 744, 'loss/train': 4.412690162658691} -09/20/2021 17:04:08 - INFO - __main__ - Step 11918: {'lr': 0.0001984, 'samples': 381376, 'steps': 744, 'loss/train': 4.158065319061279} -09/20/2021 17:04:09 - INFO - __main__ - Step 11919: {'lr': 0.0001984, 'samples': 381408, 'steps': 744, 'loss/train': 4.477025508880615} -09/20/2021 17:04:09 - INFO - __main__ - Step 11920: {'lr': 0.0001984, 'samples': 381440, 'steps': 744, 'loss/train': 4.0302958488464355} -09/20/2021 17:04:10 - INFO - __main__ - Step 11921: {'lr': 0.00019866666666666668, 'samples': 381472, 'steps': 745, 'loss/train': 4.355391025543213} -09/20/2021 17:04:11 - INFO - __main__ - Step 11922: {'lr': 0.00019866666666666668, 'samples': 381504, 'steps': 745, 'loss/train': 4.68942403793335} -09/20/2021 17:04:12 - INFO - __main__ - Step 11923: {'lr': 0.00019866666666666668, 'samples': 381536, 'steps': 745, 'loss/train': 4.557911396026611} -09/20/2021 17:04:13 - INFO - __main__ - Step 11924: {'lr': 0.00019866666666666668, 'samples': 381568, 'steps': 745, 'loss/train': 3.720231294631958} -09/20/2021 17:04:13 - INFO - __main__ - Step 11925: {'lr': 0.00019866666666666668, 'samples': 381600, 'steps': 745, 'loss/train': 1.9360549449920654} -09/20/2021 17:04:14 - INFO - __main__ - Step 11926: {'lr': 0.00019866666666666668, 'samples': 381632, 'steps': 745, 'loss/train': 3.219974994659424} -09/20/2021 17:04:15 - INFO - __main__ - Step 11927: {'lr': 0.00019866666666666668, 'samples': 381664, 'steps': 745, 'loss/train': 4.813169956207275} -09/20/2021 17:04:16 - INFO - __main__ - Step 11928: {'lr': 0.00019866666666666668, 'samples': 381696, 'steps': 745, 'loss/train': 4.00286865234375} -09/20/2021 17:04:16 - INFO - __main__ - Step 11929: {'lr': 0.00019866666666666668, 'samples': 381728, 'steps': 745, 'loss/train': 4.982514381408691} -09/20/2021 17:04:18 - INFO - __main__ - Step 11930: {'lr': 0.00019866666666666668, 'samples': 381760, 'steps': 745, 'loss/train': 3.594360828399658} -09/20/2021 17:04:19 - INFO - __main__ - Step 11931: {'lr': 0.00019866666666666668, 'samples': 381792, 'steps': 745, 'loss/train': 3.28899884223938} -09/20/2021 17:04:20 - INFO - __main__ - Step 11932: {'lr': 0.00019866666666666668, 'samples': 381824, 'steps': 745, 'loss/train': 1.7273290157318115} -09/20/2021 17:04:20 - INFO - __main__ - Step 11933: {'lr': 0.00019866666666666668, 'samples': 381856, 'steps': 745, 'loss/train': 4.753590106964111} -09/20/2021 17:04:21 - INFO - __main__ - Step 11934: {'lr': 0.00019866666666666668, 'samples': 381888, 'steps': 745, 'loss/train': 6.022994041442871} -09/20/2021 17:04:22 - INFO - __main__ - Step 11935: {'lr': 0.00019866666666666668, 'samples': 381920, 'steps': 745, 'loss/train': 4.038693904876709} -09/20/2021 17:04:23 - INFO - __main__ - Step 11936: {'lr': 0.00019866666666666668, 'samples': 381952, 'steps': 745, 'loss/train': 3.6065123081207275} -09/20/2021 17:04:24 - INFO - __main__ - Step 11937: {'lr': 0.00019893333333333336, 'samples': 381984, 'steps': 746, 'loss/train': 4.3067097663879395} -09/20/2021 17:04:24 - INFO - __main__ - Step 11938: {'lr': 0.00019893333333333336, 'samples': 382016, 'steps': 746, 'loss/train': 5.09160041809082} -09/20/2021 17:04:25 - INFO - __main__ - Step 11939: {'lr': 0.00019893333333333336, 'samples': 382048, 'steps': 746, 'loss/train': 4.125298500061035} -09/20/2021 17:04:26 - INFO - __main__ - Step 11940: {'lr': 0.00019893333333333336, 'samples': 382080, 'steps': 746, 'loss/train': 3.424041748046875} -09/20/2021 17:04:27 - INFO - __main__ - Step 11941: {'lr': 0.00019893333333333336, 'samples': 382112, 'steps': 746, 'loss/train': 4.000033855438232} -09/20/2021 17:04:27 - INFO - __main__ - Step 11942: {'lr': 0.00019893333333333336, 'samples': 382144, 'steps': 746, 'loss/train': 4.258089065551758} -09/20/2021 17:04:28 - INFO - __main__ - Step 11943: {'lr': 0.00019893333333333336, 'samples': 382176, 'steps': 746, 'loss/train': 4.206252574920654} -09/20/2021 17:04:29 - INFO - __main__ - Step 11944: {'lr': 0.00019893333333333336, 'samples': 382208, 'steps': 746, 'loss/train': 3.7653751373291016} -09/20/2021 17:04:30 - INFO - __main__ - Step 11945: {'lr': 0.00019893333333333336, 'samples': 382240, 'steps': 746, 'loss/train': 4.1949639320373535} -09/20/2021 17:04:30 - INFO - __main__ - Step 11946: {'lr': 0.00019893333333333336, 'samples': 382272, 'steps': 746, 'loss/train': 4.329367637634277} -09/20/2021 17:04:31 - INFO - __main__ - Step 11947: {'lr': 0.00019893333333333336, 'samples': 382304, 'steps': 746, 'loss/train': 3.8943252563476562} -09/20/2021 17:04:32 - INFO - __main__ - Step 11948: {'lr': 0.00019893333333333336, 'samples': 382336, 'steps': 746, 'loss/train': 3.9801926612854004} -09/20/2021 17:04:33 - INFO - __main__ - Step 11949: {'lr': 0.00019893333333333336, 'samples': 382368, 'steps': 746, 'loss/train': 4.430422782897949} -09/20/2021 17:04:33 - INFO - __main__ - Step 11950: {'lr': 0.00019893333333333336, 'samples': 382400, 'steps': 746, 'loss/train': 3.613955020904541} -09/20/2021 17:04:34 - INFO - __main__ - Step 11951: {'lr': 0.00019893333333333336, 'samples': 382432, 'steps': 746, 'loss/train': 3.758925199508667} -09/20/2021 17:04:35 - INFO - __main__ - Step 11952: {'lr': 0.00019893333333333336, 'samples': 382464, 'steps': 746, 'loss/train': 4.4654951095581055} -09/20/2021 17:04:36 - INFO - __main__ - Step 11953: {'lr': 0.00019920000000000002, 'samples': 382496, 'steps': 747, 'loss/train': 3.9129176139831543} -09/20/2021 17:04:36 - INFO - __main__ - Step 11954: {'lr': 0.00019920000000000002, 'samples': 382528, 'steps': 747, 'loss/train': 4.024085521697998} -09/20/2021 17:04:37 - INFO - __main__ - Step 11955: {'lr': 0.00019920000000000002, 'samples': 382560, 'steps': 747, 'loss/train': 4.16132116317749} -09/20/2021 17:04:38 - INFO - __main__ - Step 11956: {'lr': 0.00019920000000000002, 'samples': 382592, 'steps': 747, 'loss/train': 4.11227560043335} -09/20/2021 17:04:39 - INFO - __main__ - Step 11957: {'lr': 0.00019920000000000002, 'samples': 382624, 'steps': 747, 'loss/train': 4.837817192077637} -09/20/2021 17:04:39 - INFO - __main__ - Step 11958: {'lr': 0.00019920000000000002, 'samples': 382656, 'steps': 747, 'loss/train': 4.704043388366699} -09/20/2021 17:04:40 - INFO - __main__ - Step 11959: {'lr': 0.00019920000000000002, 'samples': 382688, 'steps': 747, 'loss/train': 3.1310877799987793} -09/20/2021 17:04:41 - INFO - __main__ - Step 11960: {'lr': 0.00019920000000000002, 'samples': 382720, 'steps': 747, 'loss/train': 4.126892566680908} -09/20/2021 17:04:42 - INFO - __main__ - Step 11961: {'lr': 0.00019920000000000002, 'samples': 382752, 'steps': 747, 'loss/train': 5.1739630699157715} -09/20/2021 17:04:42 - INFO - __main__ - Step 11962: {'lr': 0.00019920000000000002, 'samples': 382784, 'steps': 747, 'loss/train': 4.790637016296387} -09/20/2021 17:04:44 - INFO - __main__ - Step 11963: {'lr': 0.00019920000000000002, 'samples': 382816, 'steps': 747, 'loss/train': 5.317304611206055} -09/20/2021 17:04:44 - INFO - __main__ - Step 11964: {'lr': 0.00019920000000000002, 'samples': 382848, 'steps': 747, 'loss/train': 4.818669319152832} -09/20/2021 17:04:45 - INFO - __main__ - Step 11965: {'lr': 0.00019920000000000002, 'samples': 382880, 'steps': 747, 'loss/train': 4.502408504486084} -09/20/2021 17:04:46 - INFO - __main__ - Step 11966: {'lr': 0.00019920000000000002, 'samples': 382912, 'steps': 747, 'loss/train': 4.541146278381348} -09/20/2021 17:04:47 - INFO - __main__ - Step 11967: {'lr': 0.00019920000000000002, 'samples': 382944, 'steps': 747, 'loss/train': 4.191047191619873} -09/20/2021 17:04:47 - INFO - __main__ - Step 11968: {'lr': 0.00019920000000000002, 'samples': 382976, 'steps': 747, 'loss/train': 4.031525611877441} -09/20/2021 17:04:48 - INFO - __main__ - Step 11969: {'lr': 0.00019946666666666667, 'samples': 383008, 'steps': 748, 'loss/train': 5.530219554901123} -09/20/2021 17:04:49 - INFO - __main__ - Step 11970: {'lr': 0.00019946666666666667, 'samples': 383040, 'steps': 748, 'loss/train': 4.882314682006836} -09/20/2021 17:04:50 - INFO - __main__ - Step 11971: {'lr': 0.00019946666666666667, 'samples': 383072, 'steps': 748, 'loss/train': 5.371760368347168} -09/20/2021 17:04:51 - INFO - __main__ - Step 11972: {'lr': 0.00019946666666666667, 'samples': 383104, 'steps': 748, 'loss/train': 3.4476399421691895} -09/20/2021 17:04:51 - INFO - __main__ - Step 11973: {'lr': 0.00019946666666666667, 'samples': 383136, 'steps': 748, 'loss/train': 3.8118622303009033} -09/20/2021 17:04:52 - INFO - __main__ - Step 11974: {'lr': 0.00019946666666666667, 'samples': 383168, 'steps': 748, 'loss/train': 4.031299591064453} -09/20/2021 17:04:53 - INFO - __main__ - Step 11975: {'lr': 0.00019946666666666667, 'samples': 383200, 'steps': 748, 'loss/train': 4.39909029006958} -09/20/2021 17:04:54 - INFO - __main__ - Step 11976: {'lr': 0.00019946666666666667, 'samples': 383232, 'steps': 748, 'loss/train': 4.195781707763672} -09/20/2021 17:04:54 - INFO - __main__ - Step 11977: {'lr': 0.00019946666666666667, 'samples': 383264, 'steps': 748, 'loss/train': 4.346925258636475} -09/20/2021 17:04:55 - INFO - __main__ - Step 11978: {'lr': 0.00019946666666666667, 'samples': 383296, 'steps': 748, 'loss/train': 5.001943111419678} -09/20/2021 17:04:56 - INFO - __main__ - Step 11979: {'lr': 0.00019946666666666667, 'samples': 383328, 'steps': 748, 'loss/train': 4.374213218688965} -09/20/2021 17:04:57 - INFO - __main__ - Step 11980: {'lr': 0.00019946666666666667, 'samples': 383360, 'steps': 748, 'loss/train': 4.161057472229004} -09/20/2021 17:04:57 - INFO - __main__ - Step 11981: {'lr': 0.00019946666666666667, 'samples': 383392, 'steps': 748, 'loss/train': 5.585141658782959} -09/20/2021 17:04:58 - INFO - __main__ - Step 11982: {'lr': 0.00019946666666666667, 'samples': 383424, 'steps': 748, 'loss/train': 3.850217819213867} -09/20/2021 17:04:59 - INFO - __main__ - Step 11983: {'lr': 0.00019946666666666667, 'samples': 383456, 'steps': 748, 'loss/train': 4.209871292114258} -09/20/2021 17:05:00 - INFO - __main__ - Step 11984: {'lr': 0.00019946666666666667, 'samples': 383488, 'steps': 748, 'loss/train': 3.5597317218780518} -09/20/2021 17:05:01 - INFO - __main__ - Step 11985: {'lr': 0.00019973333333333335, 'samples': 383520, 'steps': 749, 'loss/train': 3.7490644454956055} -09/20/2021 17:05:01 - INFO - __main__ - Step 11986: {'lr': 0.00019973333333333335, 'samples': 383552, 'steps': 749, 'loss/train': 3.7068748474121094} -09/20/2021 17:05:02 - INFO - __main__ - Step 11987: {'lr': 0.00019973333333333335, 'samples': 383584, 'steps': 749, 'loss/train': 5.2362895011901855} -09/20/2021 17:05:03 - INFO - __main__ - Step 11988: {'lr': 0.00019973333333333335, 'samples': 383616, 'steps': 749, 'loss/train': 3.578795909881592} -09/20/2021 17:05:04 - INFO - __main__ - Step 11989: {'lr': 0.00019973333333333335, 'samples': 383648, 'steps': 749, 'loss/train': 1.96052885055542} -09/20/2021 17:05:04 - INFO - __main__ - Step 11990: {'lr': 0.00019973333333333335, 'samples': 383680, 'steps': 749, 'loss/train': 4.329614639282227} -09/20/2021 17:05:05 - INFO - __main__ - Step 11991: {'lr': 0.00019973333333333335, 'samples': 383712, 'steps': 749, 'loss/train': 4.646417617797852} -09/20/2021 17:05:06 - INFO - __main__ - Step 11992: {'lr': 0.00019973333333333335, 'samples': 383744, 'steps': 749, 'loss/train': 3.7440013885498047} -09/20/2021 17:05:07 - INFO - __main__ - Step 11993: {'lr': 0.00019973333333333335, 'samples': 383776, 'steps': 749, 'loss/train': 4.543776988983154} -09/20/2021 17:05:08 - INFO - __main__ - Step 11994: {'lr': 0.00019973333333333335, 'samples': 383808, 'steps': 749, 'loss/train': 3.262502431869507} -09/20/2021 17:05:09 - INFO - __main__ - Step 11995: {'lr': 0.00019973333333333335, 'samples': 383840, 'steps': 749, 'loss/train': 5.679580211639404} -09/20/2021 17:05:09 - INFO - __main__ - Step 11996: {'lr': 0.00019973333333333335, 'samples': 383872, 'steps': 749, 'loss/train': 5.572450637817383} -09/20/2021 17:05:10 - INFO - __main__ - Step 11997: {'lr': 0.00019973333333333335, 'samples': 383904, 'steps': 749, 'loss/train': 4.174254894256592} -09/20/2021 17:05:11 - INFO - __main__ - Step 11998: {'lr': 0.00019973333333333335, 'samples': 383936, 'steps': 749, 'loss/train': 4.424700736999512} -09/20/2021 17:05:12 - INFO - __main__ - Step 11999: {'lr': 0.00019973333333333335, 'samples': 383968, 'steps': 749, 'loss/train': 3.8349244594573975} -09/20/2021 17:05:12 - INFO - __main__ - Step 12000: {'lr': 0.00019973333333333335, 'samples': 384000, 'steps': 749, 'loss/train': 4.389839172363281} -09/20/2021 17:05:13 - INFO - __main__ - Step 12001: {'lr': 0.0002, 'samples': 384032, 'steps': 750, 'loss/train': 3.2333154678344727} -09/20/2021 17:05:14 - INFO - __main__ - Step 12002: {'lr': 0.0002, 'samples': 384064, 'steps': 750, 'loss/train': 3.0033774375915527} -09/20/2021 17:05:15 - INFO - __main__ - Step 12003: {'lr': 0.0002, 'samples': 384096, 'steps': 750, 'loss/train': 4.204689025878906} -09/20/2021 17:05:15 - INFO - __main__ - Step 12004: {'lr': 0.0002, 'samples': 384128, 'steps': 750, 'loss/train': 4.748714923858643} -09/20/2021 17:05:16 - INFO - __main__ - Step 12005: {'lr': 0.0002, 'samples': 384160, 'steps': 750, 'loss/train': 3.937242269515991} -09/20/2021 17:05:17 - INFO - __main__ - Step 12006: {'lr': 0.0002, 'samples': 384192, 'steps': 750, 'loss/train': 4.37944221496582} -09/20/2021 17:05:18 - INFO - __main__ - Step 12007: {'lr': 0.0002, 'samples': 384224, 'steps': 750, 'loss/train': 4.710547924041748} -09/20/2021 17:05:18 - INFO - __main__ - Step 12008: {'lr': 0.0002, 'samples': 384256, 'steps': 750, 'loss/train': 4.258482933044434} -09/20/2021 17:05:19 - INFO - __main__ - Step 12009: {'lr': 0.0002, 'samples': 384288, 'steps': 750, 'loss/train': 4.368632793426514} -09/20/2021 17:05:20 - INFO - __main__ - Step 12010: {'lr': 0.0002, 'samples': 384320, 'steps': 750, 'loss/train': 4.112923622131348} -09/20/2021 17:05:21 - INFO - __main__ - Step 12011: {'lr': 0.0002, 'samples': 384352, 'steps': 750, 'loss/train': 5.498526573181152} -09/20/2021 17:05:21 - INFO - __main__ - Step 12012: {'lr': 0.0002, 'samples': 384384, 'steps': 750, 'loss/train': 3.6506187915802} -09/20/2021 17:05:22 - INFO - __main__ - Step 12013: {'lr': 0.0002, 'samples': 384416, 'steps': 750, 'loss/train': 4.435041427612305} -09/20/2021 17:05:23 - INFO - __main__ - Step 12014: {'lr': 0.0002, 'samples': 384448, 'steps': 750, 'loss/train': 4.941650867462158} -09/20/2021 17:05:24 - INFO - __main__ - Step 12015: {'lr': 0.0002, 'samples': 384480, 'steps': 750, 'loss/train': 3.5150623321533203} -09/20/2021 17:05:24 - INFO - __main__ - Step 12016: {'lr': 0.0002, 'samples': 384512, 'steps': 750, 'loss/train': 3.9261834621429443} -09/20/2021 17:05:25 - INFO - __main__ - Step 12017: {'lr': 0.00019999999979655023, 'samples': 384544, 'steps': 751, 'loss/train': 3.0738556385040283} -09/20/2021 17:05:26 - INFO - __main__ - Step 12018: {'lr': 0.00019999999979655023, 'samples': 384576, 'steps': 751, 'loss/train': 4.324124336242676} -09/20/2021 17:05:27 - INFO - __main__ - Step 12019: {'lr': 0.00019999999979655023, 'samples': 384608, 'steps': 751, 'loss/train': 4.239738464355469} -09/20/2021 17:05:28 - INFO - __main__ - Step 12020: {'lr': 0.00019999999979655023, 'samples': 384640, 'steps': 751, 'loss/train': 1.0130341053009033} -09/20/2021 17:05:28 - INFO - __main__ - Step 12021: {'lr': 0.00019999999979655023, 'samples': 384672, 'steps': 751, 'loss/train': 3.7819433212280273} -09/20/2021 17:05:29 - INFO - __main__ - Step 12022: {'lr': 0.00019999999979655023, 'samples': 384704, 'steps': 751, 'loss/train': 4.152037143707275} -09/20/2021 17:05:30 - INFO - __main__ - Step 12023: {'lr': 0.00019999999979655023, 'samples': 384736, 'steps': 751, 'loss/train': 4.051098346710205} -09/20/2021 17:05:31 - INFO - __main__ - Step 12024: {'lr': 0.00019999999979655023, 'samples': 384768, 'steps': 751, 'loss/train': 3.760239839553833} -09/20/2021 17:05:32 - INFO - __main__ - Step 12025: {'lr': 0.00019999999979655023, 'samples': 384800, 'steps': 751, 'loss/train': 4.4767889976501465} -09/20/2021 17:05:33 - INFO - __main__ - Step 12026: {'lr': 0.00019999999979655023, 'samples': 384832, 'steps': 751, 'loss/train': 4.415917873382568} -09/20/2021 17:05:33 - INFO - __main__ - Step 12027: {'lr': 0.00019999999979655023, 'samples': 384864, 'steps': 751, 'loss/train': 3.7082624435424805} -09/20/2021 17:05:34 - INFO - __main__ - Step 12028: {'lr': 0.00019999999979655023, 'samples': 384896, 'steps': 751, 'loss/train': 4.077666282653809} -09/20/2021 17:05:35 - INFO - __main__ - Step 12029: {'lr': 0.00019999999979655023, 'samples': 384928, 'steps': 751, 'loss/train': 3.4516828060150146} -09/20/2021 17:05:36 - INFO - __main__ - Step 12030: {'lr': 0.00019999999979655023, 'samples': 384960, 'steps': 751, 'loss/train': 4.886565208435059} -09/20/2021 17:05:36 - INFO - __main__ - Step 12031: {'lr': 0.00019999999979655023, 'samples': 384992, 'steps': 751, 'loss/train': 4.10750150680542} -09/20/2021 17:05:37 - INFO - __main__ - Step 12032: {'lr': 0.00019999999979655023, 'samples': 385024, 'steps': 751, 'loss/train': 4.458929061889648} -09/20/2021 17:05:38 - INFO - __main__ - Step 12033: {'lr': 0.00019999999918620079, 'samples': 385056, 'steps': 752, 'loss/train': 5.152259826660156} -09/20/2021 17:05:39 - INFO - __main__ - Step 12034: {'lr': 0.00019999999918620079, 'samples': 385088, 'steps': 752, 'loss/train': 4.007497310638428} -09/20/2021 17:05:40 - INFO - __main__ - Step 12035: {'lr': 0.00019999999918620079, 'samples': 385120, 'steps': 752, 'loss/train': 4.285330772399902} -09/20/2021 17:05:40 - INFO - __main__ - Step 12036: {'lr': 0.00019999999918620079, 'samples': 385152, 'steps': 752, 'loss/train': 4.964091777801514} -09/20/2021 17:05:41 - INFO - __main__ - Step 12037: {'lr': 0.00019999999918620079, 'samples': 385184, 'steps': 752, 'loss/train': 3.4545960426330566} -09/20/2021 17:05:42 - INFO - __main__ - Step 12038: {'lr': 0.00019999999918620079, 'samples': 385216, 'steps': 752, 'loss/train': 5.251169204711914} -09/20/2021 17:05:43 - INFO - __main__ - Step 12039: {'lr': 0.00019999999918620079, 'samples': 385248, 'steps': 752, 'loss/train': 3.995227336883545} -09/20/2021 17:05:43 - INFO - __main__ - Step 12040: {'lr': 0.00019999999918620079, 'samples': 385280, 'steps': 752, 'loss/train': 3.9511547088623047} -09/20/2021 17:05:44 - INFO - __main__ - Step 12041: {'lr': 0.00019999999918620079, 'samples': 385312, 'steps': 752, 'loss/train': 3.7958688735961914} -09/20/2021 17:05:45 - INFO - __main__ - Step 12042: {'lr': 0.00019999999918620079, 'samples': 385344, 'steps': 752, 'loss/train': 3.4194986820220947} -09/20/2021 17:05:46 - INFO - __main__ - Step 12043: {'lr': 0.00019999999918620079, 'samples': 385376, 'steps': 752, 'loss/train': 3.342839241027832} -09/20/2021 17:05:46 - INFO - __main__ - Step 12044: {'lr': 0.00019999999918620079, 'samples': 385408, 'steps': 752, 'loss/train': 4.537059783935547} -09/20/2021 17:05:47 - INFO - __main__ - Step 12045: {'lr': 0.00019999999918620079, 'samples': 385440, 'steps': 752, 'loss/train': 4.223266124725342} -09/20/2021 17:05:48 - INFO - __main__ - Step 12046: {'lr': 0.00019999999918620079, 'samples': 385472, 'steps': 752, 'loss/train': 3.9052329063415527} -09/20/2021 17:05:49 - INFO - __main__ - Step 12047: {'lr': 0.00019999999918620079, 'samples': 385504, 'steps': 752, 'loss/train': 3.972745180130005} -09/20/2021 17:05:49 - INFO - __main__ - Step 12048: {'lr': 0.00019999999918620079, 'samples': 385536, 'steps': 752, 'loss/train': 5.262760162353516} -09/20/2021 17:05:50 - INFO - __main__ - Step 12049: {'lr': 0.00019999999816895176, 'samples': 385568, 'steps': 753, 'loss/train': 4.353421688079834} -09/20/2021 17:05:51 - INFO - __main__ - Step 12050: {'lr': 0.00019999999816895176, 'samples': 385600, 'steps': 753, 'loss/train': 5.102088928222656} -09/20/2021 17:05:52 - INFO - __main__ - Step 12051: {'lr': 0.00019999999816895176, 'samples': 385632, 'steps': 753, 'loss/train': 5.789854049682617} -09/20/2021 17:05:52 - INFO - __main__ - Step 12052: {'lr': 0.00019999999816895176, 'samples': 385664, 'steps': 753, 'loss/train': 5.147348880767822} -09/20/2021 17:05:53 - INFO - __main__ - Step 12053: {'lr': 0.00019999999816895176, 'samples': 385696, 'steps': 753, 'loss/train': 5.154332637786865} -09/20/2021 17:05:54 - INFO - __main__ - Step 12054: {'lr': 0.00019999999816895176, 'samples': 385728, 'steps': 753, 'loss/train': 4.3058576583862305} -09/20/2021 17:05:55 - INFO - __main__ - Step 12055: {'lr': 0.00019999999816895176, 'samples': 385760, 'steps': 753, 'loss/train': 1.6745333671569824} -09/20/2021 17:05:56 - INFO - __main__ - Step 12056: {'lr': 0.00019999999816895176, 'samples': 385792, 'steps': 753, 'loss/train': 3.8141181468963623} -09/20/2021 17:05:57 - INFO - __main__ - Step 12057: {'lr': 0.00019999999816895176, 'samples': 385824, 'steps': 753, 'loss/train': 4.2482829093933105} -09/20/2021 17:05:58 - INFO - __main__ - Step 12058: {'lr': 0.00019999999816895176, 'samples': 385856, 'steps': 753, 'loss/train': 4.097041606903076} -09/20/2021 17:05:58 - INFO - __main__ - Step 12059: {'lr': 0.00019999999816895176, 'samples': 385888, 'steps': 753, 'loss/train': 4.046865940093994} -09/20/2021 17:05:59 - INFO - __main__ - Step 12060: {'lr': 0.00019999999816895176, 'samples': 385920, 'steps': 753, 'loss/train': 4.760095596313477} -09/20/2021 17:06:00 - INFO - __main__ - Step 12061: {'lr': 0.00019999999816895176, 'samples': 385952, 'steps': 753, 'loss/train': 3.7986559867858887} -09/20/2021 17:06:01 - INFO - __main__ - Step 12062: {'lr': 0.00019999999816895176, 'samples': 385984, 'steps': 753, 'loss/train': 4.1349005699157715} -09/20/2021 17:06:01 - INFO - __main__ - Step 12063: {'lr': 0.00019999999816895176, 'samples': 386016, 'steps': 753, 'loss/train': 4.219527721405029} -09/20/2021 17:06:02 - INFO - __main__ - Step 12064: {'lr': 0.00019999999816895176, 'samples': 386048, 'steps': 753, 'loss/train': 1.4039772748947144} -09/20/2021 17:06:03 - INFO - __main__ - Step 12065: {'lr': 0.00019999999674480314, 'samples': 386080, 'steps': 754, 'loss/train': 3.383570432662964} -09/20/2021 17:06:04 - INFO - __main__ - Step 12066: {'lr': 0.00019999999674480314, 'samples': 386112, 'steps': 754, 'loss/train': 3.5908126831054688} -09/20/2021 17:06:05 - INFO - __main__ - Step 12067: {'lr': 0.00019999999674480314, 'samples': 386144, 'steps': 754, 'loss/train': 4.598433017730713} -09/20/2021 17:06:05 - INFO - __main__ - Step 12068: {'lr': 0.00019999999674480314, 'samples': 386176, 'steps': 754, 'loss/train': 2.8180038928985596} -09/20/2021 17:06:06 - INFO - __main__ - Step 12069: {'lr': 0.00019999999674480314, 'samples': 386208, 'steps': 754, 'loss/train': 3.78873348236084} -09/20/2021 17:06:07 - INFO - __main__ - Step 12070: {'lr': 0.00019999999674480314, 'samples': 386240, 'steps': 754, 'loss/train': 3.844318389892578} -09/20/2021 17:06:08 - INFO - __main__ - Step 12071: {'lr': 0.00019999999674480314, 'samples': 386272, 'steps': 754, 'loss/train': 4.464303493499756} -09/20/2021 17:06:08 - INFO - __main__ - Step 12072: {'lr': 0.00019999999674480314, 'samples': 386304, 'steps': 754, 'loss/train': 4.854004859924316} -09/20/2021 17:06:09 - INFO - __main__ - Step 12073: {'lr': 0.00019999999674480314, 'samples': 386336, 'steps': 754, 'loss/train': 4.227140426635742} -09/20/2021 17:06:10 - INFO - __main__ - Step 12074: {'lr': 0.00019999999674480314, 'samples': 386368, 'steps': 754, 'loss/train': 4.332799434661865} -09/20/2021 17:06:11 - INFO - __main__ - Step 12075: {'lr': 0.00019999999674480314, 'samples': 386400, 'steps': 754, 'loss/train': 4.050940036773682} -09/20/2021 17:06:11 - INFO - __main__ - Step 12076: {'lr': 0.00019999999674480314, 'samples': 386432, 'steps': 754, 'loss/train': 0.621217668056488} -09/20/2021 17:06:12 - INFO - __main__ - Step 12077: {'lr': 0.00019999999674480314, 'samples': 386464, 'steps': 754, 'loss/train': 4.443437576293945} -09/20/2021 17:06:13 - INFO - __main__ - Step 12078: {'lr': 0.00019999999674480314, 'samples': 386496, 'steps': 754, 'loss/train': 3.1143665313720703} -09/20/2021 17:06:14 - INFO - __main__ - Step 12079: {'lr': 0.00019999999674480314, 'samples': 386528, 'steps': 754, 'loss/train': 4.161482334136963} -09/20/2021 17:06:14 - INFO - __main__ - Step 12080: {'lr': 0.00019999999674480314, 'samples': 386560, 'steps': 754, 'loss/train': 4.73284387588501} -09/20/2021 17:06:15 - INFO - __main__ - Step 12081: {'lr': 0.0001999999949137549, 'samples': 386592, 'steps': 755, 'loss/train': 4.524543762207031} -09/20/2021 17:06:16 - INFO - __main__ - Step 12082: {'lr': 0.0001999999949137549, 'samples': 386624, 'steps': 755, 'loss/train': 5.261424541473389} -09/20/2021 17:06:17 - INFO - __main__ - Step 12083: {'lr': 0.0001999999949137549, 'samples': 386656, 'steps': 755, 'loss/train': 3.308443069458008} -09/20/2021 17:06:17 - INFO - __main__ - Step 12084: {'lr': 0.0001999999949137549, 'samples': 386688, 'steps': 755, 'loss/train': 3.499561309814453} -09/20/2021 17:06:18 - INFO - __main__ - Step 12085: {'lr': 0.0001999999949137549, 'samples': 386720, 'steps': 755, 'loss/train': 3.495293617248535} -09/20/2021 17:06:19 - INFO - __main__ - Step 12086: {'lr': 0.0001999999949137549, 'samples': 386752, 'steps': 755, 'loss/train': 3.560781955718994} -09/20/2021 17:06:20 - INFO - __main__ - Step 12087: {'lr': 0.0001999999949137549, 'samples': 386784, 'steps': 755, 'loss/train': 6.646931171417236} -09/20/2021 17:06:21 - INFO - __main__ - Step 12088: {'lr': 0.0001999999949137549, 'samples': 386816, 'steps': 755, 'loss/train': 4.988211631774902} -09/20/2021 17:06:22 - INFO - __main__ - Step 12089: {'lr': 0.0001999999949137549, 'samples': 386848, 'steps': 755, 'loss/train': 3.7496769428253174} -09/20/2021 17:06:22 - INFO - __main__ - Step 12090: {'lr': 0.0001999999949137549, 'samples': 386880, 'steps': 755, 'loss/train': 1.4888962507247925} -09/20/2021 17:06:23 - INFO - __main__ - Step 12091: {'lr': 0.0001999999949137549, 'samples': 386912, 'steps': 755, 'loss/train': 3.773043155670166} -09/20/2021 17:06:24 - INFO - __main__ - Step 12092: {'lr': 0.0001999999949137549, 'samples': 386944, 'steps': 755, 'loss/train': 4.467594146728516} -09/20/2021 17:06:25 - INFO - __main__ - Step 12093: {'lr': 0.0001999999949137549, 'samples': 386976, 'steps': 755, 'loss/train': 4.134634971618652} -09/20/2021 17:06:25 - INFO - __main__ - Step 12094: {'lr': 0.0001999999949137549, 'samples': 387008, 'steps': 755, 'loss/train': 4.258672714233398} -09/20/2021 17:06:26 - INFO - __main__ - Step 12095: {'lr': 0.0001999999949137549, 'samples': 387040, 'steps': 755, 'loss/train': 4.495542049407959} -09/20/2021 17:06:27 - INFO - __main__ - Step 12096: {'lr': 0.0001999999949137549, 'samples': 387072, 'steps': 755, 'loss/train': 4.295207500457764} -09/20/2021 17:06:28 - INFO - __main__ - Step 12097: {'lr': 0.00019999999267580708, 'samples': 387104, 'steps': 756, 'loss/train': 4.06731653213501} -09/20/2021 17:06:29 - INFO - __main__ - Step 12098: {'lr': 0.00019999999267580708, 'samples': 387136, 'steps': 756, 'loss/train': 4.721609592437744} -09/20/2021 17:06:29 - INFO - __main__ - Step 12099: {'lr': 0.00019999999267580708, 'samples': 387168, 'steps': 756, 'loss/train': 2.4782702922821045} -09/20/2021 17:06:30 - INFO - __main__ - Step 12100: {'lr': 0.00019999999267580708, 'samples': 387200, 'steps': 756, 'loss/train': 4.199681282043457} -09/20/2021 17:06:31 - INFO - __main__ - Step 12101: {'lr': 0.00019999999267580708, 'samples': 387232, 'steps': 756, 'loss/train': 4.812793731689453} -09/20/2021 17:06:32 - INFO - __main__ - Step 12102: {'lr': 0.00019999999267580708, 'samples': 387264, 'steps': 756, 'loss/train': 3.657884359359741} -09/20/2021 17:06:32 - INFO - __main__ - Step 12103: {'lr': 0.00019999999267580708, 'samples': 387296, 'steps': 756, 'loss/train': 3.663384199142456} -09/20/2021 17:06:33 - INFO - __main__ - Step 12104: {'lr': 0.00019999999267580708, 'samples': 387328, 'steps': 756, 'loss/train': 1.528950810432434} -09/20/2021 17:06:34 - INFO - __main__ - Step 12105: {'lr': 0.00019999999267580708, 'samples': 387360, 'steps': 756, 'loss/train': 3.7912161350250244} -09/20/2021 17:06:35 - INFO - __main__ - Step 12106: {'lr': 0.00019999999267580708, 'samples': 387392, 'steps': 756, 'loss/train': 3.942172050476074} -09/20/2021 17:06:35 - INFO - __main__ - Step 12107: {'lr': 0.00019999999267580708, 'samples': 387424, 'steps': 756, 'loss/train': 4.524375915527344} -09/20/2021 17:06:36 - INFO - __main__ - Step 12108: {'lr': 0.00019999999267580708, 'samples': 387456, 'steps': 756, 'loss/train': 2.013338565826416} -09/20/2021 17:06:37 - INFO - __main__ - Step 12109: {'lr': 0.00019999999267580708, 'samples': 387488, 'steps': 756, 'loss/train': 3.6356003284454346} -09/20/2021 17:06:38 - INFO - __main__ - Step 12110: {'lr': 0.00019999999267580708, 'samples': 387520, 'steps': 756, 'loss/train': 4.109992504119873} -09/20/2021 17:06:38 - INFO - __main__ - Step 12111: {'lr': 0.00019999999267580708, 'samples': 387552, 'steps': 756, 'loss/train': 4.0031232833862305} -09/20/2021 17:06:39 - INFO - __main__ - Step 12112: {'lr': 0.00019999999267580708, 'samples': 387584, 'steps': 756, 'loss/train': 3.3798575401306152} -09/20/2021 17:06:40 - INFO - __main__ - Step 12113: {'lr': 0.0001999999900309597, 'samples': 387616, 'steps': 757, 'loss/train': 3.892023801803589} -09/20/2021 17:06:41 - INFO - __main__ - Step 12114: {'lr': 0.0001999999900309597, 'samples': 387648, 'steps': 757, 'loss/train': 5.354602336883545} -09/20/2021 17:06:41 - INFO - __main__ - Step 12115: {'lr': 0.0001999999900309597, 'samples': 387680, 'steps': 757, 'loss/train': 4.496068477630615} -09/20/2021 17:06:42 - INFO - __main__ - Step 12116: {'lr': 0.0001999999900309597, 'samples': 387712, 'steps': 757, 'loss/train': 4.083879470825195} -09/20/2021 17:06:43 - INFO - __main__ - Step 12117: {'lr': 0.0001999999900309597, 'samples': 387744, 'steps': 757, 'loss/train': 3.981842041015625} -09/20/2021 17:06:45 - INFO - __main__ - Step 12118: {'lr': 0.0001999999900309597, 'samples': 387776, 'steps': 757, 'loss/train': 3.904597043991089} -09/20/2021 17:06:45 - INFO - __main__ - Step 12119: {'lr': 0.0001999999900309597, 'samples': 387808, 'steps': 757, 'loss/train': 3.998875856399536} -09/20/2021 17:06:46 - INFO - __main__ - Step 12120: {'lr': 0.0001999999900309597, 'samples': 387840, 'steps': 757, 'loss/train': 5.098544597625732} -09/20/2021 17:06:47 - INFO - __main__ - Step 12121: {'lr': 0.0001999999900309597, 'samples': 387872, 'steps': 757, 'loss/train': 5.036008358001709} -09/20/2021 17:06:48 - INFO - __main__ - Step 12122: {'lr': 0.0001999999900309597, 'samples': 387904, 'steps': 757, 'loss/train': 4.123961448669434} -09/20/2021 17:06:48 - INFO - __main__ - Step 12123: {'lr': 0.0001999999900309597, 'samples': 387936, 'steps': 757, 'loss/train': 3.0836522579193115} -09/20/2021 17:06:49 - INFO - __main__ - Step 12124: {'lr': 0.0001999999900309597, 'samples': 387968, 'steps': 757, 'loss/train': 6.38083553314209} -09/20/2021 17:06:50 - INFO - __main__ - Step 12125: {'lr': 0.0001999999900309597, 'samples': 388000, 'steps': 757, 'loss/train': 4.759220600128174} -09/20/2021 17:06:51 - INFO - __main__ - Step 12126: {'lr': 0.0001999999900309597, 'samples': 388032, 'steps': 757, 'loss/train': 5.716927528381348} -09/20/2021 17:06:51 - INFO - __main__ - Step 12127: {'lr': 0.0001999999900309597, 'samples': 388064, 'steps': 757, 'loss/train': 5.483917713165283} -09/20/2021 17:06:52 - INFO - __main__ - Step 12128: {'lr': 0.0001999999900309597, 'samples': 388096, 'steps': 757, 'loss/train': 5.500570774078369} -09/20/2021 17:06:53 - INFO - __main__ - Step 12129: {'lr': 0.0001999999869792127, 'samples': 388128, 'steps': 758, 'loss/train': 4.17835807800293} -09/20/2021 17:06:54 - INFO - __main__ - Step 12130: {'lr': 0.0001999999869792127, 'samples': 388160, 'steps': 758, 'loss/train': 4.221107482910156} -09/20/2021 17:06:55 - INFO - __main__ - Step 12131: {'lr': 0.0001999999869792127, 'samples': 388192, 'steps': 758, 'loss/train': 4.342262268066406} -09/20/2021 17:06:55 - INFO - __main__ - Step 12132: {'lr': 0.0001999999869792127, 'samples': 388224, 'steps': 758, 'loss/train': 4.239351272583008} -09/20/2021 17:06:56 - INFO - __main__ - Step 12133: {'lr': 0.0001999999869792127, 'samples': 388256, 'steps': 758, 'loss/train': 2.2366085052490234} -09/20/2021 17:06:57 - INFO - __main__ - Step 12134: {'lr': 0.0001999999869792127, 'samples': 388288, 'steps': 758, 'loss/train': 2.2451601028442383} -09/20/2021 17:06:58 - INFO - __main__ - Step 12135: {'lr': 0.0001999999869792127, 'samples': 388320, 'steps': 758, 'loss/train': 2.1314284801483154} -09/20/2021 17:06:58 - INFO - __main__ - Step 12136: {'lr': 0.0001999999869792127, 'samples': 388352, 'steps': 758, 'loss/train': 1.7731308937072754} -09/20/2021 17:06:59 - INFO - __main__ - Step 12137: {'lr': 0.0001999999869792127, 'samples': 388384, 'steps': 758, 'loss/train': 2.0285956859588623} -09/20/2021 17:07:00 - INFO - __main__ - Step 12138: {'lr': 0.0001999999869792127, 'samples': 388416, 'steps': 758, 'loss/train': 2.2335574626922607} -09/20/2021 17:07:01 - INFO - __main__ - Step 12139: {'lr': 0.0001999999869792127, 'samples': 388448, 'steps': 758, 'loss/train': 4.522639274597168} -09/20/2021 17:07:01 - INFO - __main__ - Step 12140: {'lr': 0.0001999999869792127, 'samples': 388480, 'steps': 758, 'loss/train': 3.8825578689575195} -09/20/2021 17:07:02 - INFO - __main__ - Step 12141: {'lr': 0.0001999999869792127, 'samples': 388512, 'steps': 758, 'loss/train': 2.914163112640381} -09/20/2021 17:07:03 - INFO - __main__ - Step 12142: {'lr': 0.0001999999869792127, 'samples': 388544, 'steps': 758, 'loss/train': 1.7983306646347046} -09/20/2021 17:07:04 - INFO - __main__ - Step 12143: {'lr': 0.0001999999869792127, 'samples': 388576, 'steps': 758, 'loss/train': 2.122246265411377} -09/20/2021 17:07:04 - INFO - __main__ - Step 12144: {'lr': 0.0001999999869792127, 'samples': 388608, 'steps': 758, 'loss/train': 1.7908732891082764} -09/20/2021 17:07:05 - INFO - __main__ - Step 12145: {'lr': 0.0001999999835205662, 'samples': 388640, 'steps': 759, 'loss/train': 2.008037805557251} -09/20/2021 17:07:06 - INFO - __main__ - Step 12146: {'lr': 0.0001999999835205662, 'samples': 388672, 'steps': 759, 'loss/train': 4.763937473297119} -09/20/2021 17:07:07 - INFO - __main__ - Step 12147: {'lr': 0.0001999999835205662, 'samples': 388704, 'steps': 759, 'loss/train': 3.5210366249084473} -09/20/2021 17:07:07 - INFO - __main__ - Step 12148: {'lr': 0.0001999999835205662, 'samples': 388736, 'steps': 759, 'loss/train': 4.214256286621094} -09/20/2021 17:07:08 - INFO - __main__ - Step 12149: {'lr': 0.0001999999835205662, 'samples': 388768, 'steps': 759, 'loss/train': 3.8057401180267334} -09/20/2021 17:07:10 - INFO - __main__ - Step 12150: {'lr': 0.0001999999835205662, 'samples': 388800, 'steps': 759, 'loss/train': 3.163248300552368} -09/20/2021 17:07:10 - INFO - __main__ - Step 12151: {'lr': 0.0001999999835205662, 'samples': 388832, 'steps': 759, 'loss/train': 4.6302409172058105} -09/20/2021 17:07:11 - INFO - __main__ - Step 12152: {'lr': 0.0001999999835205662, 'samples': 388864, 'steps': 759, 'loss/train': 3.4830198287963867} -09/20/2021 17:07:12 - INFO - __main__ - Step 12153: {'lr': 0.0001999999835205662, 'samples': 388896, 'steps': 759, 'loss/train': 3.961688995361328} -09/20/2021 17:07:13 - INFO - __main__ - Step 12154: {'lr': 0.0001999999835205662, 'samples': 388928, 'steps': 759, 'loss/train': 3.896239995956421} -09/20/2021 17:07:13 - INFO - __main__ - Step 12155: {'lr': 0.0001999999835205662, 'samples': 388960, 'steps': 759, 'loss/train': 4.043107032775879} -09/20/2021 17:07:14 - INFO - __main__ - Step 12156: {'lr': 0.0001999999835205662, 'samples': 388992, 'steps': 759, 'loss/train': 3.931487560272217} -09/20/2021 17:07:15 - INFO - __main__ - Step 12157: {'lr': 0.0001999999835205662, 'samples': 389024, 'steps': 759, 'loss/train': 4.427278995513916} -09/20/2021 17:07:16 - INFO - __main__ - Step 12158: {'lr': 0.0001999999835205662, 'samples': 389056, 'steps': 759, 'loss/train': 4.341189861297607} -09/20/2021 17:07:16 - INFO - __main__ - Step 12159: {'lr': 0.0001999999835205662, 'samples': 389088, 'steps': 759, 'loss/train': 2.1089882850646973} -09/20/2021 17:07:17 - INFO - __main__ - Step 12160: {'lr': 0.0001999999835205662, 'samples': 389120, 'steps': 759, 'loss/train': 1.959175705909729} -09/20/2021 17:07:18 - INFO - __main__ - Step 12161: {'lr': 0.00019999997965502008, 'samples': 389152, 'steps': 760, 'loss/train': 2.5656495094299316} -09/20/2021 17:07:19 - INFO - __main__ - Step 12162: {'lr': 0.00019999997965502008, 'samples': 389184, 'steps': 760, 'loss/train': 4.785862922668457} -09/20/2021 17:07:19 - INFO - __main__ - Step 12163: {'lr': 0.00019999997965502008, 'samples': 389216, 'steps': 760, 'loss/train': 4.8756422996521} -09/20/2021 17:07:20 - INFO - __main__ - Step 12164: {'lr': 0.00019999997965502008, 'samples': 389248, 'steps': 760, 'loss/train': 5.033164978027344} -09/20/2021 17:07:21 - INFO - __main__ - Step 12165: {'lr': 0.00019999997965502008, 'samples': 389280, 'steps': 760, 'loss/train': 5.326353073120117} -09/20/2021 17:07:22 - INFO - __main__ - Step 12166: {'lr': 0.00019999997965502008, 'samples': 389312, 'steps': 760, 'loss/train': 5.66620397567749} -09/20/2021 17:07:22 - INFO - __main__ - Step 12167: {'lr': 0.00019999997965502008, 'samples': 389344, 'steps': 760, 'loss/train': 5.365381240844727} -09/20/2021 17:07:23 - INFO - __main__ - Step 12168: {'lr': 0.00019999997965502008, 'samples': 389376, 'steps': 760, 'loss/train': 3.575033187866211} -09/20/2021 17:07:24 - INFO - __main__ - Step 12169: {'lr': 0.00019999997965502008, 'samples': 389408, 'steps': 760, 'loss/train': 3.39231538772583} -09/20/2021 17:07:25 - INFO - __main__ - Step 12170: {'lr': 0.00019999997965502008, 'samples': 389440, 'steps': 760, 'loss/train': 4.219022274017334} -09/20/2021 17:07:25 - INFO - __main__ - Step 12171: {'lr': 0.00019999997965502008, 'samples': 389472, 'steps': 760, 'loss/train': 3.6414177417755127} -09/20/2021 17:07:26 - INFO - __main__ - Step 12172: {'lr': 0.00019999997965502008, 'samples': 389504, 'steps': 760, 'loss/train': 1.6037719249725342} -09/20/2021 17:07:27 - INFO - __main__ - Step 12173: {'lr': 0.00019999997965502008, 'samples': 389536, 'steps': 760, 'loss/train': 4.58066987991333} -09/20/2021 17:07:28 - INFO - __main__ - Step 12174: {'lr': 0.00019999997965502008, 'samples': 389568, 'steps': 760, 'loss/train': 5.016931056976318} -09/20/2021 17:07:28 - INFO - __main__ - Step 12175: {'lr': 0.00019999997965502008, 'samples': 389600, 'steps': 760, 'loss/train': 4.566237926483154} -09/20/2021 17:07:29 - INFO - __main__ - Step 12176: {'lr': 0.00019999997965502008, 'samples': 389632, 'steps': 760, 'loss/train': 5.381662368774414} -09/20/2021 17:07:30 - INFO - __main__ - Step 12177: {'lr': 0.00019999997538257448, 'samples': 389664, 'steps': 761, 'loss/train': 4.015583038330078} -09/20/2021 17:07:31 - INFO - __main__ - Step 12178: {'lr': 0.00019999997538257448, 'samples': 389696, 'steps': 761, 'loss/train': 4.922349452972412} -09/20/2021 17:07:32 - INFO - __main__ - Step 12179: {'lr': 0.00019999997538257448, 'samples': 389728, 'steps': 761, 'loss/train': 4.84450626373291} -09/20/2021 17:07:32 - INFO - __main__ - Step 12180: {'lr': 0.00019999997538257448, 'samples': 389760, 'steps': 761, 'loss/train': 4.32974910736084} -09/20/2021 17:07:34 - INFO - __main__ - Step 12181: {'lr': 0.00019999997538257448, 'samples': 389792, 'steps': 761, 'loss/train': 3.500697374343872} -09/20/2021 17:07:34 - INFO - __main__ - Step 12182: {'lr': 0.00019999997538257448, 'samples': 389824, 'steps': 761, 'loss/train': 4.222060203552246} -09/20/2021 17:07:35 - INFO - __main__ - Step 12183: {'lr': 0.00019999997538257448, 'samples': 389856, 'steps': 761, 'loss/train': 3.786580801010132} -09/20/2021 17:07:36 - INFO - __main__ - Step 12184: {'lr': 0.00019999997538257448, 'samples': 389888, 'steps': 761, 'loss/train': 3.6768667697906494} -09/20/2021 17:07:37 - INFO - __main__ - Step 12185: {'lr': 0.00019999997538257448, 'samples': 389920, 'steps': 761, 'loss/train': 4.868452072143555} -09/20/2021 17:07:37 - INFO - __main__ - Step 12186: {'lr': 0.00019999997538257448, 'samples': 389952, 'steps': 761, 'loss/train': 4.948462009429932} -09/20/2021 17:07:38 - INFO - __main__ - Step 12187: {'lr': 0.00019999997538257448, 'samples': 389984, 'steps': 761, 'loss/train': 4.539658069610596} -09/20/2021 17:07:39 - INFO - __main__ - Step 12188: {'lr': 0.00019999997538257448, 'samples': 390016, 'steps': 761, 'loss/train': 4.584507942199707} -09/20/2021 17:07:40 - INFO - __main__ - Step 12189: {'lr': 0.00019999997538257448, 'samples': 390048, 'steps': 761, 'loss/train': 4.156439304351807} -09/20/2021 17:07:40 - INFO - __main__ - Step 12190: {'lr': 0.00019999997538257448, 'samples': 390080, 'steps': 761, 'loss/train': 3.7633345127105713} -09/20/2021 17:07:41 - INFO - __main__ - Step 12191: {'lr': 0.00019999997538257448, 'samples': 390112, 'steps': 761, 'loss/train': 3.866628408432007} -09/20/2021 17:07:42 - INFO - __main__ - Step 12192: {'lr': 0.00019999997538257448, 'samples': 390144, 'steps': 761, 'loss/train': 4.026522636413574} -09/20/2021 17:07:43 - INFO - __main__ - Step 12193: {'lr': 0.00019999997070322938, 'samples': 390176, 'steps': 762, 'loss/train': 4.0276408195495605} -09/20/2021 17:07:43 - INFO - __main__ - Step 12194: {'lr': 0.00019999997070322938, 'samples': 390208, 'steps': 762, 'loss/train': 5.282375335693359} -09/20/2021 17:07:44 - INFO - __main__ - Step 12195: {'lr': 0.00019999997070322938, 'samples': 390240, 'steps': 762, 'loss/train': 4.428626537322998} -09/20/2021 17:07:45 - INFO - __main__ - Step 12196: {'lr': 0.00019999997070322938, 'samples': 390272, 'steps': 762, 'loss/train': 5.073704242706299} -09/20/2021 17:07:46 - INFO - __main__ - Step 12197: {'lr': 0.00019999997070322938, 'samples': 390304, 'steps': 762, 'loss/train': 4.705785751342773} -09/20/2021 17:07:46 - INFO - __main__ - Step 12198: {'lr': 0.00019999997070322938, 'samples': 390336, 'steps': 762, 'loss/train': 3.97867751121521} -09/20/2021 17:07:47 - INFO - __main__ - Step 12199: {'lr': 0.00019999997070322938, 'samples': 390368, 'steps': 762, 'loss/train': 3.911116123199463} -09/20/2021 17:07:48 - INFO - __main__ - Step 12200: {'lr': 0.00019999997070322938, 'samples': 390400, 'steps': 762, 'loss/train': 3.9222936630249023} -09/20/2021 17:07:49 - INFO - __main__ - Step 12201: {'lr': 0.00019999997070322938, 'samples': 390432, 'steps': 762, 'loss/train': 5.107321262359619} -09/20/2021 17:07:49 - INFO - __main__ - Step 12202: {'lr': 0.00019999997070322938, 'samples': 390464, 'steps': 762, 'loss/train': 2.7881863117218018} -09/20/2021 17:07:50 - INFO - __main__ - Step 12203: {'lr': 0.00019999997070322938, 'samples': 390496, 'steps': 762, 'loss/train': 4.339743137359619} -09/20/2021 17:07:51 - INFO - __main__ - Step 12204: {'lr': 0.00019999997070322938, 'samples': 390528, 'steps': 762, 'loss/train': 6.489375591278076} -09/20/2021 17:07:52 - INFO - __main__ - Step 12205: {'lr': 0.00019999997070322938, 'samples': 390560, 'steps': 762, 'loss/train': 3.428774833679199} -09/20/2021 17:07:52 - INFO - __main__ - Step 12206: {'lr': 0.00019999997070322938, 'samples': 390592, 'steps': 762, 'loss/train': 4.027410507202148} -09/20/2021 17:07:53 - INFO - __main__ - Step 12207: {'lr': 0.00019999997070322938, 'samples': 390624, 'steps': 762, 'loss/train': 5.017829895019531} -09/20/2021 17:07:54 - INFO - __main__ - Step 12208: {'lr': 0.00019999997070322938, 'samples': 390656, 'steps': 762, 'loss/train': 4.42488956451416} -09/20/2021 17:07:55 - INFO - __main__ - Step 12209: {'lr': 0.00019999996561698478, 'samples': 390688, 'steps': 763, 'loss/train': 5.008026599884033} -09/20/2021 17:07:56 - INFO - __main__ - Step 12210: {'lr': 0.00019999996561698478, 'samples': 390720, 'steps': 763, 'loss/train': 3.898630142211914} -09/20/2021 17:07:56 - INFO - __main__ - Step 12211: {'lr': 0.00019999996561698478, 'samples': 390752, 'steps': 763, 'loss/train': 4.825348377227783} -09/20/2021 17:07:57 - INFO - __main__ - Step 12212: {'lr': 0.00019999996561698478, 'samples': 390784, 'steps': 763, 'loss/train': 4.220505237579346} -09/20/2021 17:07:59 - INFO - __main__ - Step 12213: {'lr': 0.00019999996561698478, 'samples': 390816, 'steps': 763, 'loss/train': 3.9681687355041504} -09/20/2021 17:08:00 - INFO - __main__ - Step 12214: {'lr': 0.00019999996561698478, 'samples': 390848, 'steps': 763, 'loss/train': 4.4612555503845215} -09/20/2021 17:08:00 - INFO - __main__ - Step 12215: {'lr': 0.00019999996561698478, 'samples': 390880, 'steps': 763, 'loss/train': 3.4798824787139893} -09/20/2021 17:08:01 - INFO - __main__ - Step 12216: {'lr': 0.00019999996561698478, 'samples': 390912, 'steps': 763, 'loss/train': 4.168976306915283} -09/20/2021 17:08:02 - INFO - __main__ - Step 12217: {'lr': 0.00019999996561698478, 'samples': 390944, 'steps': 763, 'loss/train': 4.567706108093262} -09/20/2021 17:08:03 - INFO - __main__ - Step 12218: {'lr': 0.00019999996561698478, 'samples': 390976, 'steps': 763, 'loss/train': 4.550930023193359} -09/20/2021 17:08:03 - INFO - __main__ - Step 12219: {'lr': 0.00019999996561698478, 'samples': 391008, 'steps': 763, 'loss/train': 4.42177677154541} -09/20/2021 17:08:04 - INFO - __main__ - Step 12220: {'lr': 0.00019999996561698478, 'samples': 391040, 'steps': 763, 'loss/train': 3.292257070541382} -09/20/2021 17:08:05 - INFO - __main__ - Step 12221: {'lr': 0.00019999996561698478, 'samples': 391072, 'steps': 763, 'loss/train': 2.055551290512085} -09/20/2021 17:08:06 - INFO - __main__ - Step 12222: {'lr': 0.00019999996561698478, 'samples': 391104, 'steps': 763, 'loss/train': 1.6538761854171753} -09/20/2021 17:08:06 - INFO - __main__ - Step 12223: {'lr': 0.00019999996561698478, 'samples': 391136, 'steps': 763, 'loss/train': 1.7216583490371704} -09/20/2021 17:08:07 - INFO - __main__ - Step 12224: {'lr': 0.00019999996561698478, 'samples': 391168, 'steps': 763, 'loss/train': 1.842831015586853} -09/20/2021 17:08:08 - INFO - __main__ - Step 12225: {'lr': 0.00019999996012384067, 'samples': 391200, 'steps': 764, 'loss/train': 4.232878684997559} -09/20/2021 17:08:09 - INFO - __main__ - Step 12226: {'lr': 0.00019999996012384067, 'samples': 391232, 'steps': 764, 'loss/train': 4.484635829925537} -09/20/2021 17:08:09 - INFO - __main__ - Step 12227: {'lr': 0.00019999996012384067, 'samples': 391264, 'steps': 764, 'loss/train': 4.682472229003906} -09/20/2021 17:08:10 - INFO - __main__ - Step 12228: {'lr': 0.00019999996012384067, 'samples': 391296, 'steps': 764, 'loss/train': 3.6418111324310303} -09/20/2021 17:08:11 - INFO - __main__ - Step 12229: {'lr': 0.00019999996012384067, 'samples': 391328, 'steps': 764, 'loss/train': 4.769120216369629} -09/20/2021 17:08:12 - INFO - __main__ - Step 12230: {'lr': 0.00019999996012384067, 'samples': 391360, 'steps': 764, 'loss/train': 4.1741414070129395} -09/20/2021 17:08:12 - INFO - __main__ - Step 12231: {'lr': 0.00019999996012384067, 'samples': 391392, 'steps': 764, 'loss/train': 3.936643123626709} -09/20/2021 17:08:13 - INFO - __main__ - Step 12232: {'lr': 0.00019999996012384067, 'samples': 391424, 'steps': 764, 'loss/train': 3.422889471054077} -09/20/2021 17:08:14 - INFO - __main__ - Step 12233: {'lr': 0.00019999996012384067, 'samples': 391456, 'steps': 764, 'loss/train': 4.748690605163574} -09/20/2021 17:08:15 - INFO - __main__ - Step 12234: {'lr': 0.00019999996012384067, 'samples': 391488, 'steps': 764, 'loss/train': 6.146028995513916} -09/20/2021 17:08:15 - INFO - __main__ - Step 12235: {'lr': 0.00019999996012384067, 'samples': 391520, 'steps': 764, 'loss/train': 3.3782191276550293} -09/20/2021 17:08:16 - INFO - __main__ - Step 12236: {'lr': 0.00019999996012384067, 'samples': 391552, 'steps': 764, 'loss/train': 4.198638916015625} -09/20/2021 17:08:17 - INFO - __main__ - Step 12237: {'lr': 0.00019999996012384067, 'samples': 391584, 'steps': 764, 'loss/train': 3.6401760578155518} -09/20/2021 17:08:18 - INFO - __main__ - Step 12238: {'lr': 0.00019999996012384067, 'samples': 391616, 'steps': 764, 'loss/train': 4.019444942474365} -09/20/2021 17:08:18 - INFO - __main__ - Step 12239: {'lr': 0.00019999996012384067, 'samples': 391648, 'steps': 764, 'loss/train': 4.330134868621826} -09/20/2021 17:08:19 - INFO - __main__ - Step 12240: {'lr': 0.00019999996012384067, 'samples': 391680, 'steps': 764, 'loss/train': 4.323318004608154} -09/20/2021 17:08:20 - INFO - __main__ - Step 12241: {'lr': 0.00019999995422379714, 'samples': 391712, 'steps': 765, 'loss/train': 4.1942138671875} -09/20/2021 17:08:21 - INFO - __main__ - Step 12242: {'lr': 0.00019999995422379714, 'samples': 391744, 'steps': 765, 'loss/train': 3.458674669265747} -09/20/2021 17:08:22 - INFO - __main__ - Step 12243: {'lr': 0.00019999995422379714, 'samples': 391776, 'steps': 765, 'loss/train': 3.3991405963897705} -09/20/2021 17:08:22 - INFO - __main__ - Step 12244: {'lr': 0.00019999995422379714, 'samples': 391808, 'steps': 765, 'loss/train': 2.9480764865875244} -09/20/2021 17:08:23 - INFO - __main__ - Step 12245: {'lr': 0.00019999995422379714, 'samples': 391840, 'steps': 765, 'loss/train': 3.6136605739593506} -09/20/2021 17:08:24 - INFO - __main__ - Step 12246: {'lr': 0.00019999995422379714, 'samples': 391872, 'steps': 765, 'loss/train': 2.7796566486358643} -09/20/2021 17:08:25 - INFO - __main__ - Step 12247: {'lr': 0.00019999995422379714, 'samples': 391904, 'steps': 765, 'loss/train': 3.3841235637664795} -09/20/2021 17:08:25 - INFO - __main__ - Step 12248: {'lr': 0.00019999995422379714, 'samples': 391936, 'steps': 765, 'loss/train': 3.597039222717285} -09/20/2021 17:08:26 - INFO - __main__ - Step 12249: {'lr': 0.00019999995422379714, 'samples': 391968, 'steps': 765, 'loss/train': 4.051209926605225} -09/20/2021 17:08:27 - INFO - __main__ - Step 12250: {'lr': 0.00019999995422379714, 'samples': 392000, 'steps': 765, 'loss/train': 3.2436294555664062} -09/20/2021 17:08:28 - INFO - __main__ - Step 12251: {'lr': 0.00019999995422379714, 'samples': 392032, 'steps': 765, 'loss/train': 5.391672134399414} -09/20/2021 17:08:29 - INFO - __main__ - Step 12252: {'lr': 0.00019999995422379714, 'samples': 392064, 'steps': 765, 'loss/train': 3.9561495780944824} -09/20/2021 17:08:30 - INFO - __main__ - Step 12253: {'lr': 0.00019999995422379714, 'samples': 392096, 'steps': 765, 'loss/train': 3.0631089210510254} -09/20/2021 17:08:30 - INFO - __main__ - Step 12254: {'lr': 0.00019999995422379714, 'samples': 392128, 'steps': 765, 'loss/train': 3.662282943725586} -09/20/2021 17:08:31 - INFO - __main__ - Step 12255: {'lr': 0.00019999995422379714, 'samples': 392160, 'steps': 765, 'loss/train': 4.546079635620117} -09/20/2021 17:08:32 - INFO - __main__ - Step 12256: {'lr': 0.00019999995422379714, 'samples': 392192, 'steps': 765, 'loss/train': 4.105401992797852} -09/20/2021 17:08:33 - INFO - __main__ - Step 12257: {'lr': 0.0001999999479168542, 'samples': 392224, 'steps': 766, 'loss/train': 4.338230609893799} -09/20/2021 17:08:34 - INFO - __main__ - Step 12258: {'lr': 0.0001999999479168542, 'samples': 392256, 'steps': 766, 'loss/train': 4.079263687133789} -09/20/2021 17:08:34 - INFO - __main__ - Step 12259: {'lr': 0.0001999999479168542, 'samples': 392288, 'steps': 766, 'loss/train': 5.370180130004883} -09/20/2021 17:08:35 - INFO - __main__ - Step 12260: {'lr': 0.0001999999479168542, 'samples': 392320, 'steps': 766, 'loss/train': 3.051816701889038} -09/20/2021 17:08:36 - INFO - __main__ - Step 12261: {'lr': 0.0001999999479168542, 'samples': 392352, 'steps': 766, 'loss/train': 2.7354037761688232} -09/20/2021 17:08:37 - INFO - __main__ - Step 12262: {'lr': 0.0001999999479168542, 'samples': 392384, 'steps': 766, 'loss/train': 3.612619638442993} -09/20/2021 17:08:37 - INFO - __main__ - Step 12263: {'lr': 0.0001999999479168542, 'samples': 392416, 'steps': 766, 'loss/train': 2.777956485748291} -09/20/2021 17:08:38 - INFO - __main__ - Step 12264: {'lr': 0.0001999999479168542, 'samples': 392448, 'steps': 766, 'loss/train': 4.471179485321045} -09/20/2021 17:08:39 - INFO - __main__ - Step 12265: {'lr': 0.0001999999479168542, 'samples': 392480, 'steps': 766, 'loss/train': 4.81753396987915} -09/20/2021 17:08:40 - INFO - __main__ - Step 12266: {'lr': 0.0001999999479168542, 'samples': 392512, 'steps': 766, 'loss/train': 4.013160228729248} -09/20/2021 17:08:40 - INFO - __main__ - Step 12267: {'lr': 0.0001999999479168542, 'samples': 392544, 'steps': 766, 'loss/train': 5.059514045715332} -09/20/2021 17:08:41 - INFO - __main__ - Step 12268: {'lr': 0.0001999999479168542, 'samples': 392576, 'steps': 766, 'loss/train': 3.887845993041992} -09/20/2021 17:08:42 - INFO - __main__ - Step 12269: {'lr': 0.0001999999479168542, 'samples': 392608, 'steps': 766, 'loss/train': 4.416459083557129} -09/20/2021 17:08:43 - INFO - __main__ - Step 12270: {'lr': 0.0001999999479168542, 'samples': 392640, 'steps': 766, 'loss/train': 4.562020778656006} -09/20/2021 17:08:43 - INFO - __main__ - Step 12271: {'lr': 0.0001999999479168542, 'samples': 392672, 'steps': 766, 'loss/train': 4.0310750007629395} -09/20/2021 17:08:44 - INFO - __main__ - Step 12272: {'lr': 0.0001999999479168542, 'samples': 392704, 'steps': 766, 'loss/train': 4.007359027862549} -09/20/2021 17:08:45 - INFO - __main__ - Step 12273: {'lr': 0.00019999994120301184, 'samples': 392736, 'steps': 767, 'loss/train': 3.9121592044830322} -09/20/2021 17:08:46 - INFO - __main__ - Step 12274: {'lr': 0.00019999994120301184, 'samples': 392768, 'steps': 767, 'loss/train': 3.791978597640991} -09/20/2021 17:08:46 - INFO - __main__ - Step 12275: {'lr': 0.00019999994120301184, 'samples': 392800, 'steps': 767, 'loss/train': 4.532599925994873} -09/20/2021 17:08:47 - INFO - __main__ - Step 12276: {'lr': 0.00019999994120301184, 'samples': 392832, 'steps': 767, 'loss/train': 4.120996475219727} -09/20/2021 17:08:48 - INFO - __main__ - Step 12277: {'lr': 0.00019999994120301184, 'samples': 392864, 'steps': 767, 'loss/train': 4.196682929992676} -09/20/2021 17:08:49 - INFO - __main__ - Step 12278: {'lr': 0.00019999994120301184, 'samples': 392896, 'steps': 767, 'loss/train': 5.547607898712158} -09/20/2021 17:08:49 - INFO - __main__ - Step 12279: {'lr': 0.00019999994120301184, 'samples': 392928, 'steps': 767, 'loss/train': 4.54831600189209} -09/20/2021 17:08:50 - INFO - __main__ - Step 12280: {'lr': 0.00019999994120301184, 'samples': 392960, 'steps': 767, 'loss/train': 4.366966247558594} -09/20/2021 17:08:51 - INFO - __main__ - Step 12281: {'lr': 0.00019999994120301184, 'samples': 392992, 'steps': 767, 'loss/train': 4.256752014160156} -09/20/2021 17:08:53 - INFO - __main__ - Step 12282: {'lr': 0.00019999994120301184, 'samples': 393024, 'steps': 767, 'loss/train': 4.298328876495361} -09/20/2021 17:08:54 - INFO - __main__ - Step 12283: {'lr': 0.00019999994120301184, 'samples': 393056, 'steps': 767, 'loss/train': 4.62615966796875} -09/20/2021 17:08:54 - INFO - __main__ - Step 12284: {'lr': 0.00019999994120301184, 'samples': 393088, 'steps': 767, 'loss/train': 3.5392725467681885} -09/20/2021 17:08:55 - INFO - __main__ - Step 12285: {'lr': 0.00019999994120301184, 'samples': 393120, 'steps': 767, 'loss/train': 3.413342237472534} -09/20/2021 17:08:56 - INFO - __main__ - Step 12286: {'lr': 0.00019999994120301184, 'samples': 393152, 'steps': 767, 'loss/train': 4.104616641998291} -09/20/2021 17:08:57 - INFO - __main__ - Step 12287: {'lr': 0.00019999994120301184, 'samples': 393184, 'steps': 767, 'loss/train': 4.466394901275635} -09/20/2021 17:08:57 - INFO - __main__ - Step 12288: {'lr': 0.00019999994120301184, 'samples': 393216, 'steps': 767, 'loss/train': 3.759936571121216} -09/20/2021 17:08:58 - INFO - __main__ - Step 12289: {'lr': 0.0001999999340822701, 'samples': 393248, 'steps': 768, 'loss/train': 4.461043357849121} -09/20/2021 17:08:59 - INFO - __main__ - Step 12290: {'lr': 0.0001999999340822701, 'samples': 393280, 'steps': 768, 'loss/train': 4.110288143157959} -09/20/2021 17:09:00 - INFO - __main__ - Step 12291: {'lr': 0.0001999999340822701, 'samples': 393312, 'steps': 768, 'loss/train': 4.592430591583252} -09/20/2021 17:09:00 - INFO - __main__ - Step 12292: {'lr': 0.0001999999340822701, 'samples': 393344, 'steps': 768, 'loss/train': 3.224564552307129} -09/20/2021 17:09:01 - INFO - __main__ - Step 12293: {'lr': 0.0001999999340822701, 'samples': 393376, 'steps': 768, 'loss/train': 4.577212333679199} -09/20/2021 17:09:02 - INFO - __main__ - Step 12294: {'lr': 0.0001999999340822701, 'samples': 393408, 'steps': 768, 'loss/train': 3.8113224506378174} -09/20/2021 17:09:03 - INFO - __main__ - Step 12295: {'lr': 0.0001999999340822701, 'samples': 393440, 'steps': 768, 'loss/train': 4.273420333862305} -09/20/2021 17:09:03 - INFO - __main__ - Step 12296: {'lr': 0.0001999999340822701, 'samples': 393472, 'steps': 768, 'loss/train': 6.613803386688232} -09/20/2021 17:09:04 - INFO - __main__ - Step 12297: {'lr': 0.0001999999340822701, 'samples': 393504, 'steps': 768, 'loss/train': 4.034237861633301} -09/20/2021 17:09:05 - INFO - __main__ - Step 12298: {'lr': 0.0001999999340822701, 'samples': 393536, 'steps': 768, 'loss/train': 3.815969944000244} -09/20/2021 17:09:06 - INFO - __main__ - Step 12299: {'lr': 0.0001999999340822701, 'samples': 393568, 'steps': 768, 'loss/train': 3.4761569499969482} -09/20/2021 17:09:06 - INFO - __main__ - Step 12300: {'lr': 0.0001999999340822701, 'samples': 393600, 'steps': 768, 'loss/train': 3.8842554092407227} -09/20/2021 17:09:07 - INFO - __main__ - Step 12301: {'lr': 0.0001999999340822701, 'samples': 393632, 'steps': 768, 'loss/train': 5.767016410827637} -09/20/2021 17:09:08 - INFO - __main__ - Step 12302: {'lr': 0.0001999999340822701, 'samples': 393664, 'steps': 768, 'loss/train': 3.84420108795166} -09/20/2021 17:09:09 - INFO - __main__ - Step 12303: {'lr': 0.0001999999340822701, 'samples': 393696, 'steps': 768, 'loss/train': 3.514521360397339} -09/20/2021 17:09:09 - INFO - __main__ - Step 12304: {'lr': 0.0001999999340822701, 'samples': 393728, 'steps': 768, 'loss/train': 4.211025238037109} -09/20/2021 17:09:10 - INFO - __main__ - Step 12305: {'lr': 0.00019999992655462902, 'samples': 393760, 'steps': 769, 'loss/train': 3.904637098312378} -09/20/2021 17:09:11 - INFO - __main__ - Step 12306: {'lr': 0.00019999992655462902, 'samples': 393792, 'steps': 769, 'loss/train': 3.751598596572876} -09/20/2021 17:09:12 - INFO - __main__ - Step 12307: {'lr': 0.00019999992655462902, 'samples': 393824, 'steps': 769, 'loss/train': 3.9087541103363037} -09/20/2021 17:09:13 - INFO - __main__ - Step 12308: {'lr': 0.00019999992655462902, 'samples': 393856, 'steps': 769, 'loss/train': 3.6843984127044678} -09/20/2021 17:09:13 - INFO - __main__ - Step 12309: {'lr': 0.00019999992655462902, 'samples': 393888, 'steps': 769, 'loss/train': 4.346258163452148} -09/20/2021 17:09:14 - INFO - __main__ - Step 12310: {'lr': 0.00019999992655462902, 'samples': 393920, 'steps': 769, 'loss/train': 4.924984455108643} -09/20/2021 17:09:15 - INFO - __main__ - Step 12311: {'lr': 0.00019999992655462902, 'samples': 393952, 'steps': 769, 'loss/train': 5.810447692871094} -09/20/2021 17:09:16 - INFO - __main__ - Step 12312: {'lr': 0.00019999992655462902, 'samples': 393984, 'steps': 769, 'loss/train': 5.866605281829834} -09/20/2021 17:09:17 - INFO - __main__ - Step 12313: {'lr': 0.00019999992655462902, 'samples': 394016, 'steps': 769, 'loss/train': 4.311620235443115} -09/20/2021 17:09:18 - INFO - __main__ - Step 12314: {'lr': 0.00019999992655462902, 'samples': 394048, 'steps': 769, 'loss/train': 3.4732046127319336} -09/20/2021 17:09:18 - INFO - __main__ - Step 12315: {'lr': 0.00019999992655462902, 'samples': 394080, 'steps': 769, 'loss/train': 4.164444446563721} -09/20/2021 17:09:19 - INFO - __main__ - Step 12316: {'lr': 0.00019999992655462902, 'samples': 394112, 'steps': 769, 'loss/train': 4.8977556228637695} -09/20/2021 17:09:20 - INFO - __main__ - Step 12317: {'lr': 0.00019999992655462902, 'samples': 394144, 'steps': 769, 'loss/train': 3.885106325149536} -09/20/2021 17:09:21 - INFO - __main__ - Step 12318: {'lr': 0.00019999992655462902, 'samples': 394176, 'steps': 769, 'loss/train': 3.863269329071045} -09/20/2021 17:09:21 - INFO - __main__ - Step 12319: {'lr': 0.00019999992655462902, 'samples': 394208, 'steps': 769, 'loss/train': 4.123183250427246} -09/20/2021 17:09:22 - INFO - __main__ - Step 12320: {'lr': 0.00019999992655462902, 'samples': 394240, 'steps': 769, 'loss/train': 3.6206836700439453} -09/20/2021 17:09:23 - INFO - __main__ - Step 12321: {'lr': 0.00019999991862008865, 'samples': 394272, 'steps': 770, 'loss/train': 4.356002330780029} -09/20/2021 17:09:24 - INFO - __main__ - Step 12322: {'lr': 0.00019999991862008865, 'samples': 394304, 'steps': 770, 'loss/train': 3.9444963932037354} -09/20/2021 17:09:25 - INFO - __main__ - Step 12323: {'lr': 0.00019999991862008865, 'samples': 394336, 'steps': 770, 'loss/train': 3.858494758605957} -09/20/2021 17:09:25 - INFO - __main__ - Step 12324: {'lr': 0.00019999991862008865, 'samples': 394368, 'steps': 770, 'loss/train': 5.981497764587402} -09/20/2021 17:09:26 - INFO - __main__ - Step 12325: {'lr': 0.00019999991862008865, 'samples': 394400, 'steps': 770, 'loss/train': 5.127865314483643} -09/20/2021 17:09:27 - INFO - __main__ - Step 12326: {'lr': 0.00019999991862008865, 'samples': 394432, 'steps': 770, 'loss/train': 3.0095102787017822} -09/20/2021 17:09:28 - INFO - __main__ - Step 12327: {'lr': 0.00019999991862008865, 'samples': 394464, 'steps': 770, 'loss/train': 4.276915073394775} -09/20/2021 17:09:28 - INFO - __main__ - Step 12328: {'lr': 0.00019999991862008865, 'samples': 394496, 'steps': 770, 'loss/train': 4.281311988830566} -09/20/2021 17:09:29 - INFO - __main__ - Step 12329: {'lr': 0.00019999991862008865, 'samples': 394528, 'steps': 770, 'loss/train': 3.8747265338897705} -09/20/2021 17:09:30 - INFO - __main__ - Step 12330: {'lr': 0.00019999991862008865, 'samples': 394560, 'steps': 770, 'loss/train': 4.293976306915283} -09/20/2021 17:09:31 - INFO - __main__ - Step 12331: {'lr': 0.00019999991862008865, 'samples': 394592, 'steps': 770, 'loss/train': 4.042078495025635} -09/20/2021 17:09:31 - INFO - __main__ - Step 12332: {'lr': 0.00019999991862008865, 'samples': 394624, 'steps': 770, 'loss/train': 3.8597850799560547} -09/20/2021 17:09:32 - INFO - __main__ - Step 12333: {'lr': 0.00019999991862008865, 'samples': 394656, 'steps': 770, 'loss/train': 4.153085708618164} -09/20/2021 17:09:33 - INFO - __main__ - Step 12334: {'lr': 0.00019999991862008865, 'samples': 394688, 'steps': 770, 'loss/train': 4.2161712646484375} -09/20/2021 17:09:34 - INFO - __main__ - Step 12335: {'lr': 0.00019999991862008865, 'samples': 394720, 'steps': 770, 'loss/train': 3.233314275741577} -09/20/2021 17:09:34 - INFO - __main__ - Step 12336: {'lr': 0.00019999991862008865, 'samples': 394752, 'steps': 770, 'loss/train': 4.124072074890137} -09/20/2021 17:09:35 - INFO - __main__ - Step 12337: {'lr': 0.000199999910278649, 'samples': 394784, 'steps': 771, 'loss/train': 4.018508434295654} -09/20/2021 17:09:36 - INFO - __main__ - Step 12338: {'lr': 0.000199999910278649, 'samples': 394816, 'steps': 771, 'loss/train': 5.219825267791748} -09/20/2021 17:09:37 - INFO - __main__ - Step 12339: {'lr': 0.000199999910278649, 'samples': 394848, 'steps': 771, 'loss/train': 5.268248081207275} -09/20/2021 17:09:37 - INFO - __main__ - Step 12340: {'lr': 0.000199999910278649, 'samples': 394880, 'steps': 771, 'loss/train': 5.402420997619629} -09/20/2021 17:09:38 - INFO - __main__ - Step 12341: {'lr': 0.000199999910278649, 'samples': 394912, 'steps': 771, 'loss/train': 4.120033264160156} -09/20/2021 17:09:39 - INFO - __main__ - Step 12342: {'lr': 0.000199999910278649, 'samples': 394944, 'steps': 771, 'loss/train': 3.5353355407714844} -09/20/2021 17:09:40 - INFO - __main__ - Step 12343: {'lr': 0.000199999910278649, 'samples': 394976, 'steps': 771, 'loss/train': 4.040249347686768} -09/20/2021 17:09:41 - INFO - __main__ - Step 12344: {'lr': 0.000199999910278649, 'samples': 395008, 'steps': 771, 'loss/train': 3.7202255725860596} -09/20/2021 17:09:42 - INFO - __main__ - Step 12345: {'lr': 0.000199999910278649, 'samples': 395040, 'steps': 771, 'loss/train': 4.466850757598877} -09/20/2021 17:09:43 - INFO - __main__ - Step 12346: {'lr': 0.000199999910278649, 'samples': 395072, 'steps': 771, 'loss/train': 3.347456932067871} -09/20/2021 17:09:43 - INFO - __main__ - Step 12347: {'lr': 0.000199999910278649, 'samples': 395104, 'steps': 771, 'loss/train': 4.889294624328613} -09/20/2021 17:09:44 - INFO - __main__ - Step 12348: {'lr': 0.000199999910278649, 'samples': 395136, 'steps': 771, 'loss/train': 3.7153334617614746} -09/20/2021 17:09:45 - INFO - __main__ - Step 12349: {'lr': 0.000199999910278649, 'samples': 395168, 'steps': 771, 'loss/train': 4.220584869384766} -09/20/2021 17:09:46 - INFO - __main__ - Step 12350: {'lr': 0.000199999910278649, 'samples': 395200, 'steps': 771, 'loss/train': 3.9809322357177734} -09/20/2021 17:09:46 - INFO - __main__ - Step 12351: {'lr': 0.000199999910278649, 'samples': 395232, 'steps': 771, 'loss/train': 2.4033803939819336} -09/20/2021 17:09:47 - INFO - __main__ - Step 12352: {'lr': 0.000199999910278649, 'samples': 395264, 'steps': 771, 'loss/train': 3.4780352115631104} -09/20/2021 17:09:48 - INFO - __main__ - Step 12353: {'lr': 0.00019999990153031006, 'samples': 395296, 'steps': 772, 'loss/train': 4.575767517089844} -09/20/2021 17:09:49 - INFO - __main__ - Step 12354: {'lr': 0.00019999990153031006, 'samples': 395328, 'steps': 772, 'loss/train': 3.899152994155884} -09/20/2021 17:09:49 - INFO - __main__ - Step 12355: {'lr': 0.00019999990153031006, 'samples': 395360, 'steps': 772, 'loss/train': 4.716325283050537} -09/20/2021 17:09:50 - INFO - __main__ - Step 12356: {'lr': 0.00019999990153031006, 'samples': 395392, 'steps': 772, 'loss/train': 4.98757266998291} -09/20/2021 17:09:51 - INFO - __main__ - Step 12357: {'lr': 0.00019999990153031006, 'samples': 395424, 'steps': 772, 'loss/train': 3.6340582370758057} -09/20/2021 17:09:52 - INFO - __main__ - Step 12358: {'lr': 0.00019999990153031006, 'samples': 395456, 'steps': 772, 'loss/train': 4.589465141296387} -09/20/2021 17:09:52 - INFO - __main__ - Step 12359: {'lr': 0.00019999990153031006, 'samples': 395488, 'steps': 772, 'loss/train': 3.850231170654297} -09/20/2021 17:09:53 - INFO - __main__ - Step 12360: {'lr': 0.00019999990153031006, 'samples': 395520, 'steps': 772, 'loss/train': 3.550326108932495} -09/20/2021 17:09:54 - INFO - __main__ - Step 12361: {'lr': 0.00019999990153031006, 'samples': 395552, 'steps': 772, 'loss/train': 3.600987672805786} -09/20/2021 17:09:55 - INFO - __main__ - Step 12362: {'lr': 0.00019999990153031006, 'samples': 395584, 'steps': 772, 'loss/train': 4.98643159866333} -09/20/2021 17:09:55 - INFO - __main__ - Step 12363: {'lr': 0.00019999990153031006, 'samples': 395616, 'steps': 772, 'loss/train': 4.363832473754883} -09/20/2021 17:09:56 - INFO - __main__ - Step 12364: {'lr': 0.00019999990153031006, 'samples': 395648, 'steps': 772, 'loss/train': 4.3903326988220215} -09/20/2021 17:09:57 - INFO - __main__ - Step 12365: {'lr': 0.00019999990153031006, 'samples': 395680, 'steps': 772, 'loss/train': 4.111991882324219} -09/20/2021 17:09:58 - INFO - __main__ - Step 12366: {'lr': 0.00019999990153031006, 'samples': 395712, 'steps': 772, 'loss/train': 1.8272473812103271} -09/20/2021 17:09:58 - INFO - __main__ - Step 12367: {'lr': 0.00019999990153031006, 'samples': 395744, 'steps': 772, 'loss/train': 3.8680624961853027} -09/20/2021 17:09:59 - INFO - __main__ - Step 12368: {'lr': 0.00019999990153031006, 'samples': 395776, 'steps': 772, 'loss/train': 3.843754529953003} -09/20/2021 17:10:00 - INFO - __main__ - Step 12369: {'lr': 0.00019999989237507192, 'samples': 395808, 'steps': 773, 'loss/train': 3.7917065620422363} -09/20/2021 17:10:01 - INFO - __main__ - Step 12370: {'lr': 0.00019999989237507192, 'samples': 395840, 'steps': 773, 'loss/train': 4.117677211761475} -09/20/2021 17:10:02 - INFO - __main__ - Step 12371: {'lr': 0.00019999989237507192, 'samples': 395872, 'steps': 773, 'loss/train': 4.70542049407959} -09/20/2021 17:10:02 - INFO - __main__ - Step 12372: {'lr': 0.00019999989237507192, 'samples': 395904, 'steps': 773, 'loss/train': 4.616593360900879} -09/20/2021 17:10:03 - INFO - __main__ - Step 12373: {'lr': 0.00019999989237507192, 'samples': 395936, 'steps': 773, 'loss/train': 3.6243505477905273} -09/20/2021 17:10:04 - INFO - __main__ - Step 12374: {'lr': 0.00019999989237507192, 'samples': 395968, 'steps': 773, 'loss/train': 4.966310501098633} -09/20/2021 17:10:05 - INFO - __main__ - Step 12375: {'lr': 0.00019999989237507192, 'samples': 396000, 'steps': 773, 'loss/train': 4.62357759475708} -09/20/2021 17:10:06 - INFO - __main__ - Step 12376: {'lr': 0.00019999989237507192, 'samples': 396032, 'steps': 773, 'loss/train': 4.157111167907715} -09/20/2021 17:10:07 - INFO - __main__ - Step 12377: {'lr': 0.00019999989237507192, 'samples': 396064, 'steps': 773, 'loss/train': 3.0851011276245117} -09/20/2021 17:10:08 - INFO - __main__ - Step 12378: {'lr': 0.00019999989237507192, 'samples': 396096, 'steps': 773, 'loss/train': 5.013740539550781} -09/20/2021 17:10:08 - INFO - __main__ - Step 12379: {'lr': 0.00019999989237507192, 'samples': 396128, 'steps': 773, 'loss/train': 4.123917579650879} -09/20/2021 17:10:09 - INFO - __main__ - Step 12380: {'lr': 0.00019999989237507192, 'samples': 396160, 'steps': 773, 'loss/train': 4.1576313972473145} -09/20/2021 17:10:10 - INFO - __main__ - Step 12381: {'lr': 0.00019999989237507192, 'samples': 396192, 'steps': 773, 'loss/train': 4.322395324707031} -09/20/2021 17:10:11 - INFO - __main__ - Step 12382: {'lr': 0.00019999989237507192, 'samples': 396224, 'steps': 773, 'loss/train': 4.336226463317871} -09/20/2021 17:10:11 - INFO - __main__ - Step 12383: {'lr': 0.00019999989237507192, 'samples': 396256, 'steps': 773, 'loss/train': 4.37727165222168} -09/20/2021 17:10:12 - INFO - __main__ - Step 12384: {'lr': 0.00019999989237507192, 'samples': 396288, 'steps': 773, 'loss/train': 4.296212673187256} -09/20/2021 17:10:13 - INFO - __main__ - Step 12385: {'lr': 0.00019999988281293465, 'samples': 396320, 'steps': 774, 'loss/train': 1.8855059146881104} -09/20/2021 17:10:14 - INFO - __main__ - Step 12386: {'lr': 0.00019999988281293465, 'samples': 396352, 'steps': 774, 'loss/train': 1.7086971998214722} -09/20/2021 17:10:15 - INFO - __main__ - Step 12387: {'lr': 0.00019999988281293465, 'samples': 396384, 'steps': 774, 'loss/train': 2.5403692722320557} -09/20/2021 17:10:15 - INFO - __main__ - Step 12388: {'lr': 0.00019999988281293465, 'samples': 396416, 'steps': 774, 'loss/train': 1.9902734756469727} -09/20/2021 17:10:16 - INFO - __main__ - Step 12389: {'lr': 0.00019999988281293465, 'samples': 396448, 'steps': 774, 'loss/train': 1.6805638074874878} -09/20/2021 17:10:17 - INFO - __main__ - Step 12390: {'lr': 0.00019999988281293465, 'samples': 396480, 'steps': 774, 'loss/train': 2.8664488792419434} -09/20/2021 17:10:18 - INFO - __main__ - Step 12391: {'lr': 0.00019999988281293465, 'samples': 396512, 'steps': 774, 'loss/train': 4.588239669799805} -09/20/2021 17:10:18 - INFO - __main__ - Step 12392: {'lr': 0.00019999988281293465, 'samples': 396544, 'steps': 774, 'loss/train': 5.024819850921631} -09/20/2021 17:10:19 - INFO - __main__ - Step 12393: {'lr': 0.00019999988281293465, 'samples': 396576, 'steps': 774, 'loss/train': 3.4635086059570312} -09/20/2021 17:10:20 - INFO - __main__ - Step 12394: {'lr': 0.00019999988281293465, 'samples': 396608, 'steps': 774, 'loss/train': 4.057562351226807} -09/20/2021 17:10:21 - INFO - __main__ - Step 12395: {'lr': 0.00019999988281293465, 'samples': 396640, 'steps': 774, 'loss/train': 5.093348026275635} -09/20/2021 17:10:21 - INFO - __main__ - Step 12396: {'lr': 0.00019999988281293465, 'samples': 396672, 'steps': 774, 'loss/train': 4.068996906280518} -09/20/2021 17:10:22 - INFO - __main__ - Step 12397: {'lr': 0.00019999988281293465, 'samples': 396704, 'steps': 774, 'loss/train': 4.616059303283691} -09/20/2021 17:10:23 - INFO - __main__ - Step 12398: {'lr': 0.00019999988281293465, 'samples': 396736, 'steps': 774, 'loss/train': 4.704593181610107} -09/20/2021 17:10:24 - INFO - __main__ - Step 12399: {'lr': 0.00019999988281293465, 'samples': 396768, 'steps': 774, 'loss/train': 3.5763211250305176} -09/20/2021 17:10:24 - INFO - __main__ - Step 12400: {'lr': 0.00019999988281293465, 'samples': 396800, 'steps': 774, 'loss/train': 3.7995498180389404} -09/20/2021 17:10:25 - INFO - __main__ - Step 12401: {'lr': 0.0001999998728438982, 'samples': 396832, 'steps': 775, 'loss/train': 4.417167663574219} -09/20/2021 17:10:26 - INFO - __main__ - Step 12402: {'lr': 0.0001999998728438982, 'samples': 396864, 'steps': 775, 'loss/train': 1.8919185400009155} -09/20/2021 17:10:27 - INFO - __main__ - Step 12403: {'lr': 0.0001999998728438982, 'samples': 396896, 'steps': 775, 'loss/train': 4.531605243682861} -09/20/2021 17:10:27 - INFO - __main__ - Step 12404: {'lr': 0.0001999998728438982, 'samples': 396928, 'steps': 775, 'loss/train': 3.5157783031463623} -09/20/2021 17:10:28 - INFO - __main__ - Step 12405: {'lr': 0.0001999998728438982, 'samples': 396960, 'steps': 775, 'loss/train': 4.163156509399414} -09/20/2021 17:10:29 - INFO - __main__ - Step 12406: {'lr': 0.0001999998728438982, 'samples': 396992, 'steps': 775, 'loss/train': 7.5266594886779785} -09/20/2021 17:10:30 - INFO - __main__ - Step 12407: {'lr': 0.0001999998728438982, 'samples': 397024, 'steps': 775, 'loss/train': 7.456000328063965} -09/20/2021 17:10:30 - INFO - __main__ - Step 12408: {'lr': 0.0001999998728438982, 'samples': 397056, 'steps': 775, 'loss/train': 7.6443190574646} -09/20/2021 17:10:31 - INFO - __main__ - Step 12409: {'lr': 0.0001999998728438982, 'samples': 397088, 'steps': 775, 'loss/train': 7.916903972625732} -09/20/2021 17:10:32 - INFO - __main__ - Step 12410: {'lr': 0.0001999998728438982, 'samples': 397120, 'steps': 775, 'loss/train': 7.767866611480713} -09/20/2021 17:10:33 - INFO - __main__ - Step 12411: {'lr': 0.0001999998728438982, 'samples': 397152, 'steps': 775, 'loss/train': 7.961058139801025} -09/20/2021 17:10:34 - INFO - __main__ - Step 12412: {'lr': 0.0001999998728438982, 'samples': 397184, 'steps': 775, 'loss/train': 7.745315074920654} -09/20/2021 17:10:35 - INFO - __main__ - Step 12413: {'lr': 0.0001999998728438982, 'samples': 397216, 'steps': 775, 'loss/train': 3.9530811309814453} -09/20/2021 17:10:36 - INFO - __main__ - Step 12414: {'lr': 0.0001999998728438982, 'samples': 397248, 'steps': 775, 'loss/train': 4.373902320861816} -09/20/2021 17:10:36 - INFO - __main__ - Step 12415: {'lr': 0.0001999998728438982, 'samples': 397280, 'steps': 775, 'loss/train': 4.892560958862305} -09/20/2021 17:10:37 - INFO - __main__ - Step 12416: {'lr': 0.0001999998728438982, 'samples': 397312, 'steps': 775, 'loss/train': 3.8305063247680664} -09/20/2021 17:10:38 - INFO - __main__ - Step 12417: {'lr': 0.00019999986246796268, 'samples': 397344, 'steps': 776, 'loss/train': 3.8633055686950684} -09/20/2021 17:10:39 - INFO - __main__ - Step 12418: {'lr': 0.00019999986246796268, 'samples': 397376, 'steps': 776, 'loss/train': 4.053723335266113} -09/20/2021 17:10:39 - INFO - __main__ - Step 12419: {'lr': 0.00019999986246796268, 'samples': 397408, 'steps': 776, 'loss/train': 4.572997570037842} -09/20/2021 17:10:40 - INFO - __main__ - Step 12420: {'lr': 0.00019999986246796268, 'samples': 397440, 'steps': 776, 'loss/train': 3.9654738903045654} -09/20/2021 17:10:41 - INFO - __main__ - Step 12421: {'lr': 0.00019999986246796268, 'samples': 397472, 'steps': 776, 'loss/train': 5.650434494018555} -09/20/2021 17:10:42 - INFO - __main__ - Step 12422: {'lr': 0.00019999986246796268, 'samples': 397504, 'steps': 776, 'loss/train': 4.691856384277344} -09/20/2021 17:10:42 - INFO - __main__ - Step 12423: {'lr': 0.00019999986246796268, 'samples': 397536, 'steps': 776, 'loss/train': 5.784316539764404} -09/20/2021 17:10:43 - INFO - __main__ - Step 12424: {'lr': 0.00019999986246796268, 'samples': 397568, 'steps': 776, 'loss/train': 6.230695724487305} -09/20/2021 17:10:44 - INFO - __main__ - Step 12425: {'lr': 0.00019999986246796268, 'samples': 397600, 'steps': 776, 'loss/train': 3.4735918045043945} -09/20/2021 17:10:45 - INFO - __main__ - Step 12426: {'lr': 0.00019999986246796268, 'samples': 397632, 'steps': 776, 'loss/train': 3.865678310394287} -09/20/2021 17:10:45 - INFO - __main__ - Step 12427: {'lr': 0.00019999986246796268, 'samples': 397664, 'steps': 776, 'loss/train': 4.4492692947387695} -09/20/2021 17:10:46 - INFO - __main__ - Step 12428: {'lr': 0.00019999986246796268, 'samples': 397696, 'steps': 776, 'loss/train': 4.60496711730957} -09/20/2021 17:10:47 - INFO - __main__ - Step 12429: {'lr': 0.00019999986246796268, 'samples': 397728, 'steps': 776, 'loss/train': 4.770112991333008} -09/20/2021 17:10:48 - INFO - __main__ - Step 12430: {'lr': 0.00019999986246796268, 'samples': 397760, 'steps': 776, 'loss/train': 2.7853963375091553} -09/20/2021 17:10:48 - INFO - __main__ - Step 12431: {'lr': 0.00019999986246796268, 'samples': 397792, 'steps': 776, 'loss/train': 3.5190494060516357} -09/20/2021 17:10:49 - INFO - __main__ - Step 12432: {'lr': 0.00019999986246796268, 'samples': 397824, 'steps': 776, 'loss/train': 5.7602033615112305} -09/20/2021 17:10:50 - INFO - __main__ - Step 12433: {'lr': 0.00019999985168512812, 'samples': 397856, 'steps': 777, 'loss/train': 4.844461917877197} -09/20/2021 17:10:51 - INFO - __main__ - Step 12434: {'lr': 0.00019999985168512812, 'samples': 397888, 'steps': 777, 'loss/train': 3.8548412322998047} -09/20/2021 17:10:52 - INFO - __main__ - Step 12435: {'lr': 0.00019999985168512812, 'samples': 397920, 'steps': 777, 'loss/train': 3.708918571472168} -09/20/2021 17:10:52 - INFO - __main__ - Step 12436: {'lr': 0.00019999985168512812, 'samples': 397952, 'steps': 777, 'loss/train': 3.9711294174194336} -09/20/2021 17:10:53 - INFO - __main__ - Step 12437: {'lr': 0.00019999985168512812, 'samples': 397984, 'steps': 777, 'loss/train': 3.575546979904175} -09/20/2021 17:10:54 - INFO - __main__ - Step 12438: {'lr': 0.00019999985168512812, 'samples': 398016, 'steps': 777, 'loss/train': 4.591453552246094} -09/20/2021 17:10:55 - INFO - __main__ - Step 12439: {'lr': 0.00019999985168512812, 'samples': 398048, 'steps': 777, 'loss/train': 4.166141033172607} -09/20/2021 17:10:55 - INFO - __main__ - Step 12440: {'lr': 0.00019999985168512812, 'samples': 398080, 'steps': 777, 'loss/train': 4.459445476531982} -09/20/2021 17:10:56 - INFO - __main__ - Step 12441: {'lr': 0.00019999985168512812, 'samples': 398112, 'steps': 777, 'loss/train': 3.2287583351135254} -09/20/2021 17:10:57 - INFO - __main__ - Step 12442: {'lr': 0.00019999985168512812, 'samples': 398144, 'steps': 777, 'loss/train': 4.543874263763428} -09/20/2021 17:10:58 - INFO - __main__ - Step 12443: {'lr': 0.00019999985168512812, 'samples': 398176, 'steps': 777, 'loss/train': 3.9808201789855957} -09/20/2021 17:10:59 - INFO - __main__ - Step 12444: {'lr': 0.00019999985168512812, 'samples': 398208, 'steps': 777, 'loss/train': 4.814727783203125} -09/20/2021 17:11:00 - INFO - __main__ - Step 12445: {'lr': 0.00019999985168512812, 'samples': 398240, 'steps': 777, 'loss/train': 4.7378973960876465} -09/20/2021 17:11:00 - INFO - __main__ - Step 12446: {'lr': 0.00019999985168512812, 'samples': 398272, 'steps': 777, 'loss/train': 4.142251014709473} -09/20/2021 17:11:01 - INFO - __main__ - Step 12447: {'lr': 0.00019999985168512812, 'samples': 398304, 'steps': 777, 'loss/train': 3.4558870792388916} -09/20/2021 17:11:02 - INFO - __main__ - Step 12448: {'lr': 0.00019999985168512812, 'samples': 398336, 'steps': 777, 'loss/train': 4.3525519371032715} -09/20/2021 17:11:03 - INFO - __main__ - Step 12449: {'lr': 0.0001999998404953945, 'samples': 398368, 'steps': 778, 'loss/train': 5.039895057678223} -09/20/2021 17:11:03 - INFO - __main__ - Step 12450: {'lr': 0.0001999998404953945, 'samples': 398400, 'steps': 778, 'loss/train': 4.242005348205566} -09/20/2021 17:11:04 - INFO - __main__ - Step 12451: {'lr': 0.0001999998404953945, 'samples': 398432, 'steps': 778, 'loss/train': 4.1170244216918945} -09/20/2021 17:11:05 - INFO - __main__ - Step 12452: {'lr': 0.0001999998404953945, 'samples': 398464, 'steps': 778, 'loss/train': 4.178322792053223} -09/20/2021 17:11:06 - INFO - __main__ - Step 12453: {'lr': 0.0001999998404953945, 'samples': 398496, 'steps': 778, 'loss/train': 4.229297637939453} -09/20/2021 17:11:06 - INFO - __main__ - Step 12454: {'lr': 0.0001999998404953945, 'samples': 398528, 'steps': 778, 'loss/train': 6.017697811126709} -09/20/2021 17:11:07 - INFO - __main__ - Step 12455: {'lr': 0.0001999998404953945, 'samples': 398560, 'steps': 778, 'loss/train': 2.3180294036865234} -09/20/2021 17:11:08 - INFO - __main__ - Step 12456: {'lr': 0.0001999998404953945, 'samples': 398592, 'steps': 778, 'loss/train': 4.447969913482666} -09/20/2021 17:11:09 - INFO - __main__ - Step 12457: {'lr': 0.0001999998404953945, 'samples': 398624, 'steps': 778, 'loss/train': 3.53229022026062} -09/20/2021 17:11:09 - INFO - __main__ - Step 12458: {'lr': 0.0001999998404953945, 'samples': 398656, 'steps': 778, 'loss/train': 5.893205642700195} -09/20/2021 17:11:10 - INFO - __main__ - Step 12459: {'lr': 0.0001999998404953945, 'samples': 398688, 'steps': 778, 'loss/train': 3.301703453063965} -09/20/2021 17:11:11 - INFO - __main__ - Step 12460: {'lr': 0.0001999998404953945, 'samples': 398720, 'steps': 778, 'loss/train': 5.9010396003723145} -09/20/2021 17:11:12 - INFO - __main__ - Step 12461: {'lr': 0.0001999998404953945, 'samples': 398752, 'steps': 778, 'loss/train': 4.475660800933838} -09/20/2021 17:11:12 - INFO - __main__ - Step 12462: {'lr': 0.0001999998404953945, 'samples': 398784, 'steps': 778, 'loss/train': 4.354066848754883} -09/20/2021 17:11:13 - INFO - __main__ - Step 12463: {'lr': 0.0001999998404953945, 'samples': 398816, 'steps': 778, 'loss/train': 4.545957088470459} -09/20/2021 17:11:14 - INFO - __main__ - Step 12464: {'lr': 0.0001999998404953945, 'samples': 398848, 'steps': 778, 'loss/train': 4.612016201019287} -09/20/2021 17:11:15 - INFO - __main__ - Step 12465: {'lr': 0.00019999982889876196, 'samples': 398880, 'steps': 779, 'loss/train': 1.476585865020752} -09/20/2021 17:11:16 - INFO - __main__ - Step 12466: {'lr': 0.00019999982889876196, 'samples': 398912, 'steps': 779, 'loss/train': 4.3016815185546875} -09/20/2021 17:11:16 - INFO - __main__ - Step 12467: {'lr': 0.00019999982889876196, 'samples': 398944, 'steps': 779, 'loss/train': 4.20620059967041} -09/20/2021 17:11:17 - INFO - __main__ - Step 12468: {'lr': 0.00019999982889876196, 'samples': 398976, 'steps': 779, 'loss/train': 3.873750686645508} -09/20/2021 17:11:18 - INFO - __main__ - Step 12469: {'lr': 0.00019999982889876196, 'samples': 399008, 'steps': 779, 'loss/train': 5.034087657928467} -09/20/2021 17:11:19 - INFO - __main__ - Step 12470: {'lr': 0.00019999982889876196, 'samples': 399040, 'steps': 779, 'loss/train': 6.064895153045654} -09/20/2021 17:11:19 - INFO - __main__ - Step 12471: {'lr': 0.00019999982889876196, 'samples': 399072, 'steps': 779, 'loss/train': 3.512817621231079} -09/20/2021 17:11:20 - INFO - __main__ - Step 12472: {'lr': 0.00019999982889876196, 'samples': 399104, 'steps': 779, 'loss/train': 4.853234767913818} -09/20/2021 17:11:21 - INFO - __main__ - Step 12473: {'lr': 0.00019999982889876196, 'samples': 399136, 'steps': 779, 'loss/train': 4.0532660484313965} -09/20/2021 17:11:22 - INFO - __main__ - Step 12474: {'lr': 0.00019999982889876196, 'samples': 399168, 'steps': 779, 'loss/train': 4.944900035858154} -09/20/2021 17:11:23 - INFO - __main__ - Step 12475: {'lr': 0.00019999982889876196, 'samples': 399200, 'steps': 779, 'loss/train': 3.69585919380188} -09/20/2021 17:11:24 - INFO - __main__ - Step 12476: {'lr': 0.00019999982889876196, 'samples': 399232, 'steps': 779, 'loss/train': 3.393625497817993} -09/20/2021 17:11:24 - INFO - __main__ - Step 12477: {'lr': 0.00019999982889876196, 'samples': 399264, 'steps': 779, 'loss/train': 4.582082748413086} -09/20/2021 17:11:25 - INFO - __main__ - Step 12478: {'lr': 0.00019999982889876196, 'samples': 399296, 'steps': 779, 'loss/train': 3.7071924209594727} -09/20/2021 17:11:26 - INFO - __main__ - Step 12479: {'lr': 0.00019999982889876196, 'samples': 399328, 'steps': 779, 'loss/train': 1.9558879137039185} -09/20/2021 17:11:27 - INFO - __main__ - Step 12480: {'lr': 0.00019999982889876196, 'samples': 399360, 'steps': 779, 'loss/train': 3.613272190093994} -09/20/2021 17:11:28 - INFO - __main__ - Step 12481: {'lr': 0.0001999998168952305, 'samples': 399392, 'steps': 780, 'loss/train': 3.3990423679351807} -09/20/2021 17:11:28 - INFO - __main__ - Step 12482: {'lr': 0.0001999998168952305, 'samples': 399424, 'steps': 780, 'loss/train': 1.6097850799560547} -09/20/2021 17:11:29 - INFO - __main__ - Step 12483: {'lr': 0.0001999998168952305, 'samples': 399456, 'steps': 780, 'loss/train': 4.99755334854126} -09/20/2021 17:11:30 - INFO - __main__ - Step 12484: {'lr': 0.0001999998168952305, 'samples': 399488, 'steps': 780, 'loss/train': 2.5760724544525146} -09/20/2021 17:11:31 - INFO - __main__ - Step 12485: {'lr': 0.0001999998168952305, 'samples': 399520, 'steps': 780, 'loss/train': 2.4054150581359863} -09/20/2021 17:11:31 - INFO - __main__ - Step 12486: {'lr': 0.0001999998168952305, 'samples': 399552, 'steps': 780, 'loss/train': 2.96732759475708} -09/20/2021 17:11:32 - INFO - __main__ - Step 12487: {'lr': 0.0001999998168952305, 'samples': 399584, 'steps': 780, 'loss/train': 2.0477259159088135} -09/20/2021 17:11:33 - INFO - __main__ - Step 12488: {'lr': 0.0001999998168952305, 'samples': 399616, 'steps': 780, 'loss/train': 4.295543193817139} -09/20/2021 17:11:34 - INFO - __main__ - Step 12489: {'lr': 0.0001999998168952305, 'samples': 399648, 'steps': 780, 'loss/train': 4.289397239685059} -09/20/2021 17:11:34 - INFO - __main__ - Step 12490: {'lr': 0.0001999998168952305, 'samples': 399680, 'steps': 780, 'loss/train': 4.557643890380859} -09/20/2021 17:11:35 - INFO - __main__ - Step 12491: {'lr': 0.0001999998168952305, 'samples': 399712, 'steps': 780, 'loss/train': 4.141021251678467} -09/20/2021 17:11:36 - INFO - __main__ - Step 12492: {'lr': 0.0001999998168952305, 'samples': 399744, 'steps': 780, 'loss/train': 2.594330072402954} -09/20/2021 17:11:37 - INFO - __main__ - Step 12493: {'lr': 0.0001999998168952305, 'samples': 399776, 'steps': 780, 'loss/train': 4.67825984954834} -09/20/2021 17:11:37 - INFO - __main__ - Step 12494: {'lr': 0.0001999998168952305, 'samples': 399808, 'steps': 780, 'loss/train': 3.867528200149536} -09/20/2021 17:11:38 - INFO - __main__ - Step 12495: {'lr': 0.0001999998168952305, 'samples': 399840, 'steps': 780, 'loss/train': 4.23036003112793} -09/20/2021 17:11:39 - INFO - __main__ - Step 12496: {'lr': 0.0001999998168952305, 'samples': 399872, 'steps': 780, 'loss/train': 3.647655963897705} -09/20/2021 17:11:40 - INFO - __main__ - Step 12497: {'lr': 0.00019999980448480017, 'samples': 399904, 'steps': 781, 'loss/train': 4.232278823852539} -09/20/2021 17:11:40 - INFO - __main__ - Step 12498: {'lr': 0.00019999980448480017, 'samples': 399936, 'steps': 781, 'loss/train': 4.187654972076416} -09/20/2021 17:11:41 - INFO - __main__ - Step 12499: {'lr': 0.00019999980448480017, 'samples': 399968, 'steps': 781, 'loss/train': 4.18241024017334} -09/20/2021 17:11:42 - INFO - __main__ - Step 12500: {'lr': 0.00019999980448480017, 'samples': 400000, 'steps': 781, 'loss/train': 3.227794885635376} -09/20/2021 17:11:43 - INFO - __main__ - Step 12501: {'lr': 0.00019999980448480017, 'samples': 400032, 'steps': 781, 'loss/train': 6.365987777709961} -09/20/2021 17:11:43 - INFO - __main__ - Step 12502: {'lr': 0.00019999980448480017, 'samples': 400064, 'steps': 781, 'loss/train': 3.8193295001983643} -09/20/2021 17:11:44 - INFO - __main__ - Step 12503: {'lr': 0.00019999980448480017, 'samples': 400096, 'steps': 781, 'loss/train': 4.6545820236206055} -09/20/2021 17:11:45 - INFO - __main__ - Step 12504: {'lr': 0.00019999980448480017, 'samples': 400128, 'steps': 781, 'loss/train': 4.832113265991211} -09/20/2021 17:11:47 - INFO - __main__ - Step 12505: {'lr': 0.00019999980448480017, 'samples': 400160, 'steps': 781, 'loss/train': 4.312698841094971} -09/20/2021 17:11:47 - INFO - __main__ - Step 12506: {'lr': 0.00019999980448480017, 'samples': 400192, 'steps': 781, 'loss/train': 4.380430698394775} -09/20/2021 17:11:48 - INFO - __main__ - Step 12507: {'lr': 0.00019999980448480017, 'samples': 400224, 'steps': 781, 'loss/train': 4.484389305114746} -09/20/2021 17:11:49 - INFO - __main__ - Step 12508: {'lr': 0.00019999980448480017, 'samples': 400256, 'steps': 781, 'loss/train': 4.292314052581787} -09/20/2021 17:11:50 - INFO - __main__ - Step 12509: {'lr': 0.00019999980448480017, 'samples': 400288, 'steps': 781, 'loss/train': 4.013033390045166} -09/20/2021 17:11:50 - INFO - __main__ - Step 12510: {'lr': 0.00019999980448480017, 'samples': 400320, 'steps': 781, 'loss/train': 4.366974830627441} -09/20/2021 17:11:51 - INFO - __main__ - Step 12511: {'lr': 0.00019999980448480017, 'samples': 400352, 'steps': 781, 'loss/train': 3.0371222496032715} -09/20/2021 17:11:52 - INFO - __main__ - Step 12512: {'lr': 0.00019999980448480017, 'samples': 400384, 'steps': 781, 'loss/train': 4.870616436004639} -09/20/2021 17:11:53 - INFO - __main__ - Step 12513: {'lr': 0.000199999791667471, 'samples': 400416, 'steps': 782, 'loss/train': 4.517858028411865} -09/20/2021 17:11:53 - INFO - __main__ - Step 12514: {'lr': 0.000199999791667471, 'samples': 400448, 'steps': 782, 'loss/train': 3.4926321506500244} -09/20/2021 17:11:54 - INFO - __main__ - Step 12515: {'lr': 0.000199999791667471, 'samples': 400480, 'steps': 782, 'loss/train': 4.464543342590332} -09/20/2021 17:11:55 - INFO - __main__ - Step 12516: {'lr': 0.000199999791667471, 'samples': 400512, 'steps': 782, 'loss/train': 3.8404715061187744} -09/20/2021 17:11:56 - INFO - __main__ - Step 12517: {'lr': 0.000199999791667471, 'samples': 400544, 'steps': 782, 'loss/train': 4.462917327880859} -09/20/2021 17:11:56 - INFO - __main__ - Step 12518: {'lr': 0.000199999791667471, 'samples': 400576, 'steps': 782, 'loss/train': 5.079316139221191} -09/20/2021 17:11:57 - INFO - __main__ - Step 12519: {'lr': 0.000199999791667471, 'samples': 400608, 'steps': 782, 'loss/train': 4.107273578643799} -09/20/2021 17:11:58 - INFO - __main__ - Step 12520: {'lr': 0.000199999791667471, 'samples': 400640, 'steps': 782, 'loss/train': 3.7966461181640625} -09/20/2021 17:11:59 - INFO - __main__ - Step 12521: {'lr': 0.000199999791667471, 'samples': 400672, 'steps': 782, 'loss/train': 4.180296897888184} -09/20/2021 17:11:59 - INFO - __main__ - Step 12522: {'lr': 0.000199999791667471, 'samples': 400704, 'steps': 782, 'loss/train': 5.585046768188477} -09/20/2021 17:12:00 - INFO - __main__ - Step 12523: {'lr': 0.000199999791667471, 'samples': 400736, 'steps': 782, 'loss/train': 3.0026628971099854} -09/20/2021 17:12:01 - INFO - __main__ - Step 12524: {'lr': 0.000199999791667471, 'samples': 400768, 'steps': 782, 'loss/train': 2.958404779434204} -09/20/2021 17:12:02 - INFO - __main__ - Step 12525: {'lr': 0.000199999791667471, 'samples': 400800, 'steps': 782, 'loss/train': 3.628953456878662} -09/20/2021 17:12:02 - INFO - __main__ - Step 12526: {'lr': 0.000199999791667471, 'samples': 400832, 'steps': 782, 'loss/train': 3.06929349899292} -09/20/2021 17:12:03 - INFO - __main__ - Step 12527: {'lr': 0.000199999791667471, 'samples': 400864, 'steps': 782, 'loss/train': 2.7729175090789795} -09/20/2021 17:12:04 - INFO - __main__ - Step 12528: {'lr': 0.000199999791667471, 'samples': 400896, 'steps': 782, 'loss/train': 2.8837223052978516} -09/20/2021 17:12:05 - INFO - __main__ - Step 12529: {'lr': 0.0001999997784432431, 'samples': 400928, 'steps': 783, 'loss/train': 4.16561222076416} -09/20/2021 17:12:06 - INFO - __main__ - Step 12530: {'lr': 0.0001999997784432431, 'samples': 400960, 'steps': 783, 'loss/train': 6.649641990661621} -09/20/2021 17:12:06 - INFO - __main__ - Step 12531: {'lr': 0.0001999997784432431, 'samples': 400992, 'steps': 783, 'loss/train': 3.7060797214508057} -09/20/2021 17:12:07 - INFO - __main__ - Step 12532: {'lr': 0.0001999997784432431, 'samples': 401024, 'steps': 783, 'loss/train': 5.209306716918945} -09/20/2021 17:12:08 - INFO - __main__ - Step 12533: {'lr': 0.0001999997784432431, 'samples': 401056, 'steps': 783, 'loss/train': 4.859217643737793} -09/20/2021 17:12:09 - INFO - __main__ - Step 12534: {'lr': 0.0001999997784432431, 'samples': 401088, 'steps': 783, 'loss/train': 3.7735066413879395} -09/20/2021 17:12:09 - INFO - __main__ - Step 12535: {'lr': 0.0001999997784432431, 'samples': 401120, 'steps': 783, 'loss/train': 3.2816052436828613} -09/20/2021 17:12:11 - INFO - __main__ - Step 12536: {'lr': 0.0001999997784432431, 'samples': 401152, 'steps': 783, 'loss/train': 3.7305409908294678} -09/20/2021 17:12:11 - INFO - __main__ - Step 12537: {'lr': 0.0001999997784432431, 'samples': 401184, 'steps': 783, 'loss/train': 4.449097156524658} -09/20/2021 17:12:12 - INFO - __main__ - Step 12538: {'lr': 0.0001999997784432431, 'samples': 401216, 'steps': 783, 'loss/train': 3.7767834663391113} -09/20/2021 17:12:13 - INFO - __main__ - Step 12539: {'lr': 0.0001999997784432431, 'samples': 401248, 'steps': 783, 'loss/train': 5.3298211097717285} -09/20/2021 17:12:14 - INFO - __main__ - Step 12540: {'lr': 0.0001999997784432431, 'samples': 401280, 'steps': 783, 'loss/train': 4.0058064460754395} -09/20/2021 17:12:14 - INFO - __main__ - Step 12541: {'lr': 0.0001999997784432431, 'samples': 401312, 'steps': 783, 'loss/train': 4.306935787200928} -09/20/2021 17:12:15 - INFO - __main__ - Step 12542: {'lr': 0.0001999997784432431, 'samples': 401344, 'steps': 783, 'loss/train': 4.895886421203613} -09/20/2021 17:12:16 - INFO - __main__ - Step 12543: {'lr': 0.0001999997784432431, 'samples': 401376, 'steps': 783, 'loss/train': 3.379302740097046} -09/20/2021 17:12:17 - INFO - __main__ - Step 12544: {'lr': 0.0001999997784432431, 'samples': 401408, 'steps': 783, 'loss/train': 4.6935248374938965} -09/20/2021 17:12:18 - INFO - __main__ - Step 12545: {'lr': 0.00019999976481211646, 'samples': 401440, 'steps': 784, 'loss/train': 4.727725028991699} -09/20/2021 17:12:18 - INFO - __main__ - Step 12546: {'lr': 0.00019999976481211646, 'samples': 401472, 'steps': 784, 'loss/train': 4.463721752166748} -09/20/2021 17:12:19 - INFO - __main__ - Step 12547: {'lr': 0.00019999976481211646, 'samples': 401504, 'steps': 784, 'loss/train': 3.78352689743042} -09/20/2021 17:12:20 - INFO - __main__ - Step 12548: {'lr': 0.00019999976481211646, 'samples': 401536, 'steps': 784, 'loss/train': 4.067828178405762} -09/20/2021 17:12:21 - INFO - __main__ - Step 12549: {'lr': 0.00019999976481211646, 'samples': 401568, 'steps': 784, 'loss/train': 3.660893440246582} -09/20/2021 17:12:21 - INFO - __main__ - Step 12550: {'lr': 0.00019999976481211646, 'samples': 401600, 'steps': 784, 'loss/train': 4.8029985427856445} -09/20/2021 17:12:22 - INFO - __main__ - Step 12551: {'lr': 0.00019999976481211646, 'samples': 401632, 'steps': 784, 'loss/train': 3.880000591278076} -09/20/2021 17:12:23 - INFO - __main__ - Step 12552: {'lr': 0.00019999976481211646, 'samples': 401664, 'steps': 784, 'loss/train': 3.8686864376068115} -09/20/2021 17:12:24 - INFO - __main__ - Step 12553: {'lr': 0.00019999976481211646, 'samples': 401696, 'steps': 784, 'loss/train': 4.131222248077393} -09/20/2021 17:12:24 - INFO - __main__ - Step 12554: {'lr': 0.00019999976481211646, 'samples': 401728, 'steps': 784, 'loss/train': 4.687798500061035} -09/20/2021 17:12:25 - INFO - __main__ - Step 12555: {'lr': 0.00019999976481211646, 'samples': 401760, 'steps': 784, 'loss/train': 4.098946571350098} -09/20/2021 17:12:26 - INFO - __main__ - Step 12556: {'lr': 0.00019999976481211646, 'samples': 401792, 'steps': 784, 'loss/train': 5.406607627868652} -09/20/2021 17:12:27 - INFO - __main__ - Step 12557: {'lr': 0.00019999976481211646, 'samples': 401824, 'steps': 784, 'loss/train': 3.5756900310516357} -09/20/2021 17:12:27 - INFO - __main__ - Step 12558: {'lr': 0.00019999976481211646, 'samples': 401856, 'steps': 784, 'loss/train': 6.562992572784424} -09/20/2021 17:12:28 - INFO - __main__ - Step 12559: {'lr': 0.00019999976481211646, 'samples': 401888, 'steps': 784, 'loss/train': 6.555536270141602} -09/20/2021 17:12:29 - INFO - __main__ - Step 12560: {'lr': 0.00019999976481211646, 'samples': 401920, 'steps': 784, 'loss/train': 6.496168613433838} -09/20/2021 17:12:30 - INFO - __main__ - Step 12561: {'lr': 0.0001999997507740912, 'samples': 401952, 'steps': 785, 'loss/train': 6.295045852661133} -09/20/2021 17:12:31 - INFO - __main__ - Step 12562: {'lr': 0.0001999997507740912, 'samples': 401984, 'steps': 785, 'loss/train': 3.3719003200531006} -09/20/2021 17:12:31 - INFO - __main__ - Step 12563: {'lr': 0.0001999997507740912, 'samples': 402016, 'steps': 785, 'loss/train': 4.085517406463623} -09/20/2021 17:12:32 - INFO - __main__ - Step 12564: {'lr': 0.0001999997507740912, 'samples': 402048, 'steps': 785, 'loss/train': 4.348450660705566} -09/20/2021 17:12:33 - INFO - __main__ - Step 12565: {'lr': 0.0001999997507740912, 'samples': 402080, 'steps': 785, 'loss/train': 3.1453306674957275} -09/20/2021 17:12:34 - INFO - __main__ - Step 12566: {'lr': 0.0001999997507740912, 'samples': 402112, 'steps': 785, 'loss/train': 3.8636741638183594} -09/20/2021 17:12:34 - INFO - __main__ - Step 12567: {'lr': 0.0001999997507740912, 'samples': 402144, 'steps': 785, 'loss/train': 2.100806951522827} -09/20/2021 17:12:35 - INFO - __main__ - Step 12568: {'lr': 0.0001999997507740912, 'samples': 402176, 'steps': 785, 'loss/train': 4.265574932098389} -09/20/2021 17:12:36 - INFO - __main__ - Step 12569: {'lr': 0.0001999997507740912, 'samples': 402208, 'steps': 785, 'loss/train': 4.794382095336914} -09/20/2021 17:12:37 - INFO - __main__ - Step 12570: {'lr': 0.0001999997507740912, 'samples': 402240, 'steps': 785, 'loss/train': 4.579106330871582} -09/20/2021 17:12:38 - INFO - __main__ - Step 12571: {'lr': 0.0001999997507740912, 'samples': 402272, 'steps': 785, 'loss/train': 3.984381675720215} -09/20/2021 17:12:39 - INFO - __main__ - Step 12572: {'lr': 0.0001999997507740912, 'samples': 402304, 'steps': 785, 'loss/train': 3.441434860229492} -09/20/2021 17:12:39 - INFO - __main__ - Step 12573: {'lr': 0.0001999997507740912, 'samples': 402336, 'steps': 785, 'loss/train': 4.1097731590271} -09/20/2021 17:12:40 - INFO - __main__ - Step 12574: {'lr': 0.0001999997507740912, 'samples': 402368, 'steps': 785, 'loss/train': 4.286266326904297} -09/20/2021 17:12:41 - INFO - __main__ - Step 12575: {'lr': 0.0001999997507740912, 'samples': 402400, 'steps': 785, 'loss/train': 4.81972599029541} -09/20/2021 17:12:42 - INFO - __main__ - Step 12576: {'lr': 0.0001999997507740912, 'samples': 402432, 'steps': 785, 'loss/train': 4.577846527099609} -09/20/2021 17:12:42 - INFO - __main__ - Step 12577: {'lr': 0.0001999997363291673, 'samples': 402464, 'steps': 786, 'loss/train': 4.323163032531738} -09/20/2021 17:12:43 - INFO - __main__ - Step 12578: {'lr': 0.0001999997363291673, 'samples': 402496, 'steps': 786, 'loss/train': 4.977547645568848} -09/20/2021 17:12:44 - INFO - __main__ - Step 12579: {'lr': 0.0001999997363291673, 'samples': 402528, 'steps': 786, 'loss/train': 3.7276854515075684} -09/20/2021 17:12:45 - INFO - __main__ - Step 12580: {'lr': 0.0001999997363291673, 'samples': 402560, 'steps': 786, 'loss/train': 4.7800984382629395} -09/20/2021 17:12:45 - INFO - __main__ - Step 12581: {'lr': 0.0001999997363291673, 'samples': 402592, 'steps': 786, 'loss/train': 3.5546624660491943} -09/20/2021 17:12:46 - INFO - __main__ - Step 12582: {'lr': 0.0001999997363291673, 'samples': 402624, 'steps': 786, 'loss/train': 3.5458853244781494} -09/20/2021 17:12:47 - INFO - __main__ - Step 12583: {'lr': 0.0001999997363291673, 'samples': 402656, 'steps': 786, 'loss/train': 4.638569355010986} -09/20/2021 17:12:48 - INFO - __main__ - Step 12584: {'lr': 0.0001999997363291673, 'samples': 402688, 'steps': 786, 'loss/train': 4.285938739776611} -09/20/2021 17:12:48 - INFO - __main__ - Step 12585: {'lr': 0.0001999997363291673, 'samples': 402720, 'steps': 786, 'loss/train': 3.6391067504882812} -09/20/2021 17:12:49 - INFO - __main__ - Step 12586: {'lr': 0.0001999997363291673, 'samples': 402752, 'steps': 786, 'loss/train': 4.276482105255127} -09/20/2021 17:12:50 - INFO - __main__ - Step 12587: {'lr': 0.0001999997363291673, 'samples': 402784, 'steps': 786, 'loss/train': 4.656460762023926} -09/20/2021 17:12:51 - INFO - __main__ - Step 12588: {'lr': 0.0001999997363291673, 'samples': 402816, 'steps': 786, 'loss/train': 4.698629856109619} -09/20/2021 17:12:51 - INFO - __main__ - Step 12589: {'lr': 0.0001999997363291673, 'samples': 402848, 'steps': 786, 'loss/train': 3.775517463684082} -09/20/2021 17:12:52 - INFO - __main__ - Step 12590: {'lr': 0.0001999997363291673, 'samples': 402880, 'steps': 786, 'loss/train': 5.448059558868408} -09/20/2021 17:12:53 - INFO - __main__ - Step 12591: {'lr': 0.0001999997363291673, 'samples': 402912, 'steps': 786, 'loss/train': 5.289430618286133} -09/20/2021 17:12:54 - INFO - __main__ - Step 12592: {'lr': 0.0001999997363291673, 'samples': 402944, 'steps': 786, 'loss/train': 3.659522294998169} -09/20/2021 17:12:55 - INFO - __main__ - Step 12593: {'lr': 0.0001999997214773449, 'samples': 402976, 'steps': 787, 'loss/train': 3.788999080657959} -09/20/2021 17:12:55 - INFO - __main__ - Step 12594: {'lr': 0.0001999997214773449, 'samples': 403008, 'steps': 787, 'loss/train': 4.320240020751953} -09/20/2021 17:12:56 - INFO - __main__ - Step 12595: {'lr': 0.0001999997214773449, 'samples': 403040, 'steps': 787, 'loss/train': 4.526489734649658} -09/20/2021 17:12:57 - INFO - __main__ - Step 12596: {'lr': 0.0001999997214773449, 'samples': 403072, 'steps': 787, 'loss/train': 3.9936776161193848} -09/20/2021 17:12:58 - INFO - __main__ - Step 12597: {'lr': 0.0001999997214773449, 'samples': 403104, 'steps': 787, 'loss/train': 4.629432678222656} -09/20/2021 17:12:58 - INFO - __main__ - Step 12598: {'lr': 0.0001999997214773449, 'samples': 403136, 'steps': 787, 'loss/train': 4.162489414215088} -09/20/2021 17:12:59 - INFO - __main__ - Step 12599: {'lr': 0.0001999997214773449, 'samples': 403168, 'steps': 787, 'loss/train': 3.8919527530670166} -09/20/2021 17:13:00 - INFO - __main__ - Step 12600: {'lr': 0.0001999997214773449, 'samples': 403200, 'steps': 787, 'loss/train': 4.200564384460449} -09/20/2021 17:13:02 - INFO - __main__ - Step 12601: {'lr': 0.0001999997214773449, 'samples': 403232, 'steps': 787, 'loss/train': 5.568220138549805} -09/20/2021 17:13:02 - INFO - __main__ - Step 12602: {'lr': 0.0001999997214773449, 'samples': 403264, 'steps': 787, 'loss/train': 3.7410521507263184} -09/20/2021 17:13:03 - INFO - __main__ - Step 12603: {'lr': 0.0001999997214773449, 'samples': 403296, 'steps': 787, 'loss/train': 3.276329278945923} -09/20/2021 17:13:04 - INFO - __main__ - Step 12604: {'lr': 0.0001999997214773449, 'samples': 403328, 'steps': 787, 'loss/train': 4.607571601867676} -09/20/2021 17:13:05 - INFO - __main__ - Step 12605: {'lr': 0.0001999997214773449, 'samples': 403360, 'steps': 787, 'loss/train': 4.53736686706543} -09/20/2021 17:13:05 - INFO - __main__ - Step 12606: {'lr': 0.0001999997214773449, 'samples': 403392, 'steps': 787, 'loss/train': 4.656686305999756} -09/20/2021 17:13:06 - INFO - __main__ - Step 12607: {'lr': 0.0001999997214773449, 'samples': 403424, 'steps': 787, 'loss/train': 3.8067126274108887} -09/20/2021 17:13:07 - INFO - __main__ - Step 12608: {'lr': 0.0001999997214773449, 'samples': 403456, 'steps': 787, 'loss/train': 4.475351333618164} -09/20/2021 17:13:08 - INFO - __main__ - Step 12609: {'lr': 0.000199999706218624, 'samples': 403488, 'steps': 788, 'loss/train': 3.8731226921081543} -09/20/2021 17:13:08 - INFO - __main__ - Step 12610: {'lr': 0.000199999706218624, 'samples': 403520, 'steps': 788, 'loss/train': 4.302139759063721} -09/20/2021 17:13:09 - INFO - __main__ - Step 12611: {'lr': 0.000199999706218624, 'samples': 403552, 'steps': 788, 'loss/train': 3.6618666648864746} -09/20/2021 17:13:10 - INFO - __main__ - Step 12612: {'lr': 0.000199999706218624, 'samples': 403584, 'steps': 788, 'loss/train': 4.551875114440918} -09/20/2021 17:13:11 - INFO - __main__ - Step 12613: {'lr': 0.000199999706218624, 'samples': 403616, 'steps': 788, 'loss/train': 4.815613269805908} -09/20/2021 17:13:11 - INFO - __main__ - Step 12614: {'lr': 0.000199999706218624, 'samples': 403648, 'steps': 788, 'loss/train': 5.306308269500732} -09/20/2021 17:13:12 - INFO - __main__ - Step 12615: {'lr': 0.000199999706218624, 'samples': 403680, 'steps': 788, 'loss/train': 4.006840705871582} -09/20/2021 17:13:13 - INFO - __main__ - Step 12616: {'lr': 0.000199999706218624, 'samples': 403712, 'steps': 788, 'loss/train': 3.9847049713134766} -09/20/2021 17:13:14 - INFO - __main__ - Step 12617: {'lr': 0.000199999706218624, 'samples': 403744, 'steps': 788, 'loss/train': 3.9496262073516846} -09/20/2021 17:13:14 - INFO - __main__ - Step 12618: {'lr': 0.000199999706218624, 'samples': 403776, 'steps': 788, 'loss/train': 3.2324764728546143} -09/20/2021 17:13:15 - INFO - __main__ - Step 12619: {'lr': 0.000199999706218624, 'samples': 403808, 'steps': 788, 'loss/train': 4.1168904304504395} -09/20/2021 17:13:16 - INFO - __main__ - Step 12620: {'lr': 0.000199999706218624, 'samples': 403840, 'steps': 788, 'loss/train': 5.639684200286865} -09/20/2021 17:13:17 - INFO - __main__ - Step 12621: {'lr': 0.000199999706218624, 'samples': 403872, 'steps': 788, 'loss/train': 4.117878437042236} -09/20/2021 17:13:17 - INFO - __main__ - Step 12622: {'lr': 0.000199999706218624, 'samples': 403904, 'steps': 788, 'loss/train': 3.7949697971343994} -09/20/2021 17:13:18 - INFO - __main__ - Step 12623: {'lr': 0.000199999706218624, 'samples': 403936, 'steps': 788, 'loss/train': 4.827421188354492} -09/20/2021 17:13:19 - INFO - __main__ - Step 12624: {'lr': 0.000199999706218624, 'samples': 403968, 'steps': 788, 'loss/train': 4.804834842681885} -09/20/2021 17:13:20 - INFO - __main__ - Step 12625: {'lr': 0.0001999996905530047, 'samples': 404000, 'steps': 789, 'loss/train': 4.098694801330566} -09/20/2021 17:13:21 - INFO - __main__ - Step 12626: {'lr': 0.0001999996905530047, 'samples': 404032, 'steps': 789, 'loss/train': 4.552596092224121} -09/20/2021 17:13:21 - INFO - __main__ - Step 12627: {'lr': 0.0001999996905530047, 'samples': 404064, 'steps': 789, 'loss/train': 4.236587047576904} -09/20/2021 17:13:22 - INFO - __main__ - Step 12628: {'lr': 0.0001999996905530047, 'samples': 404096, 'steps': 789, 'loss/train': 3.398841381072998} -09/20/2021 17:13:23 - INFO - __main__ - Step 12629: {'lr': 0.0001999996905530047, 'samples': 404128, 'steps': 789, 'loss/train': 4.025099277496338} -09/20/2021 17:13:24 - INFO - __main__ - Step 12630: {'lr': 0.0001999996905530047, 'samples': 404160, 'steps': 789, 'loss/train': 4.033075332641602} -09/20/2021 17:13:24 - INFO - __main__ - Step 12631: {'lr': 0.0001999996905530047, 'samples': 404192, 'steps': 789, 'loss/train': 4.70956563949585} -09/20/2021 17:13:26 - INFO - __main__ - Step 12632: {'lr': 0.0001999996905530047, 'samples': 404224, 'steps': 789, 'loss/train': 2.9014546871185303} -09/20/2021 17:13:27 - INFO - __main__ - Step 12633: {'lr': 0.0001999996905530047, 'samples': 404256, 'steps': 789, 'loss/train': 3.5007097721099854} -09/20/2021 17:13:27 - INFO - __main__ - Step 12634: {'lr': 0.0001999996905530047, 'samples': 404288, 'steps': 789, 'loss/train': 4.25150728225708} -09/20/2021 17:13:28 - INFO - __main__ - Step 12635: {'lr': 0.0001999996905530047, 'samples': 404320, 'steps': 789, 'loss/train': 4.008569717407227} -09/20/2021 17:13:29 - INFO - __main__ - Step 12636: {'lr': 0.0001999996905530047, 'samples': 404352, 'steps': 789, 'loss/train': 4.518997669219971} -09/20/2021 17:13:30 - INFO - __main__ - Step 12637: {'lr': 0.0001999996905530047, 'samples': 404384, 'steps': 789, 'loss/train': 4.613321781158447} -09/20/2021 17:13:30 - INFO - __main__ - Step 12638: {'lr': 0.0001999996905530047, 'samples': 404416, 'steps': 789, 'loss/train': 4.284831523895264} -09/20/2021 17:13:31 - INFO - __main__ - Step 12639: {'lr': 0.0001999996905530047, 'samples': 404448, 'steps': 789, 'loss/train': 3.1150786876678467} -09/20/2021 17:13:32 - INFO - __main__ - Step 12640: {'lr': 0.0001999996905530047, 'samples': 404480, 'steps': 789, 'loss/train': 4.111393928527832} -09/20/2021 17:13:33 - INFO - __main__ - Step 12641: {'lr': 0.00019999967448048703, 'samples': 404512, 'steps': 790, 'loss/train': 1.2788642644882202} -09/20/2021 17:13:33 - INFO - __main__ - Step 12642: {'lr': 0.00019999967448048703, 'samples': 404544, 'steps': 790, 'loss/train': 1.6361844539642334} -09/20/2021 17:13:34 - INFO - __main__ - Step 12643: {'lr': 0.00019999967448048703, 'samples': 404576, 'steps': 790, 'loss/train': 1.865759015083313} -09/20/2021 17:13:35 - INFO - __main__ - Step 12644: {'lr': 0.00019999967448048703, 'samples': 404608, 'steps': 790, 'loss/train': 4.182620048522949} -09/20/2021 17:13:36 - INFO - __main__ - Step 12645: {'lr': 0.00019999967448048703, 'samples': 404640, 'steps': 790, 'loss/train': 4.037283420562744} -09/20/2021 17:13:36 - INFO - __main__ - Step 12646: {'lr': 0.00019999967448048703, 'samples': 404672, 'steps': 790, 'loss/train': 4.539785385131836} -09/20/2021 17:13:37 - INFO - __main__ - Step 12647: {'lr': 0.00019999967448048703, 'samples': 404704, 'steps': 790, 'loss/train': 4.4439473152160645} -09/20/2021 17:13:38 - INFO - __main__ - Step 12648: {'lr': 0.00019999967448048703, 'samples': 404736, 'steps': 790, 'loss/train': 4.713462829589844} -09/20/2021 17:13:39 - INFO - __main__ - Step 12649: {'lr': 0.00019999967448048703, 'samples': 404768, 'steps': 790, 'loss/train': 3.4617855548858643} -09/20/2021 17:13:39 - INFO - __main__ - Step 12650: {'lr': 0.00019999967448048703, 'samples': 404800, 'steps': 790, 'loss/train': 4.064929962158203} -09/20/2021 17:13:40 - INFO - __main__ - Step 12651: {'lr': 0.00019999967448048703, 'samples': 404832, 'steps': 790, 'loss/train': 4.078917026519775} -09/20/2021 17:13:41 - INFO - __main__ - Step 12652: {'lr': 0.00019999967448048703, 'samples': 404864, 'steps': 790, 'loss/train': 3.6188342571258545} -09/20/2021 17:13:42 - INFO - __main__ - Step 12653: {'lr': 0.00019999967448048703, 'samples': 404896, 'steps': 790, 'loss/train': 3.2485270500183105} -09/20/2021 17:13:42 - INFO - __main__ - Step 12654: {'lr': 0.00019999967448048703, 'samples': 404928, 'steps': 790, 'loss/train': 4.875603199005127} -09/20/2021 17:13:43 - INFO - __main__ - Step 12655: {'lr': 0.00019999967448048703, 'samples': 404960, 'steps': 790, 'loss/train': 4.447628498077393} -09/20/2021 17:13:44 - INFO - __main__ - Step 12656: {'lr': 0.00019999967448048703, 'samples': 404992, 'steps': 790, 'loss/train': 5.40305233001709} -09/20/2021 17:13:45 - INFO - __main__ - Step 12657: {'lr': 0.00019999965800107105, 'samples': 405024, 'steps': 791, 'loss/train': 3.771169424057007} -09/20/2021 17:13:46 - INFO - __main__ - Step 12658: {'lr': 0.00019999965800107105, 'samples': 405056, 'steps': 791, 'loss/train': 3.042668104171753} -09/20/2021 17:13:46 - INFO - __main__ - Step 12659: {'lr': 0.00019999965800107105, 'samples': 405088, 'steps': 791, 'loss/train': 2.0901999473571777} -09/20/2021 17:13:47 - INFO - __main__ - Step 12660: {'lr': 0.00019999965800107105, 'samples': 405120, 'steps': 791, 'loss/train': 1.6886872053146362} -09/20/2021 17:13:48 - INFO - __main__ - Step 12661: {'lr': 0.00019999965800107105, 'samples': 405152, 'steps': 791, 'loss/train': 1.7914494276046753} -09/20/2021 17:13:49 - INFO - __main__ - Step 12662: {'lr': 0.00019999965800107105, 'samples': 405184, 'steps': 791, 'loss/train': 1.5806825160980225} -09/20/2021 17:13:49 - INFO - __main__ - Step 12663: {'lr': 0.00019999965800107105, 'samples': 405216, 'steps': 791, 'loss/train': 4.283005237579346} -09/20/2021 17:13:51 - INFO - __main__ - Step 12664: {'lr': 0.00019999965800107105, 'samples': 405248, 'steps': 791, 'loss/train': 3.5687618255615234} -09/20/2021 17:13:51 - INFO - __main__ - Step 12665: {'lr': 0.00019999965800107105, 'samples': 405280, 'steps': 791, 'loss/train': 3.7513949871063232} -09/20/2021 17:13:52 - INFO - __main__ - Step 12666: {'lr': 0.00019999965800107105, 'samples': 405312, 'steps': 791, 'loss/train': 4.373179912567139} -09/20/2021 17:13:53 - INFO - __main__ - Step 12667: {'lr': 0.00019999965800107105, 'samples': 405344, 'steps': 791, 'loss/train': 4.815441131591797} -09/20/2021 17:13:54 - INFO - __main__ - Step 12668: {'lr': 0.00019999965800107105, 'samples': 405376, 'steps': 791, 'loss/train': 4.039748668670654} -09/20/2021 17:13:54 - INFO - __main__ - Step 12669: {'lr': 0.00019999965800107105, 'samples': 405408, 'steps': 791, 'loss/train': 3.0650994777679443} -09/20/2021 17:13:55 - INFO - __main__ - Step 12670: {'lr': 0.00019999965800107105, 'samples': 405440, 'steps': 791, 'loss/train': 4.859371185302734} -09/20/2021 17:13:56 - INFO - __main__ - Step 12671: {'lr': 0.00019999965800107105, 'samples': 405472, 'steps': 791, 'loss/train': 4.74815559387207} -09/20/2021 17:13:57 - INFO - __main__ - Step 12672: {'lr': 0.00019999965800107105, 'samples': 405504, 'steps': 791, 'loss/train': 4.2008538246154785} -09/20/2021 17:13:57 - INFO - __main__ - Step 12673: {'lr': 0.0001999996411147569, 'samples': 405536, 'steps': 792, 'loss/train': 3.3807411193847656} -09/20/2021 17:13:58 - INFO - __main__ - Step 12674: {'lr': 0.0001999996411147569, 'samples': 405568, 'steps': 792, 'loss/train': 4.667784214019775} -09/20/2021 17:13:59 - INFO - __main__ - Step 12675: {'lr': 0.0001999996411147569, 'samples': 405600, 'steps': 792, 'loss/train': 4.4388108253479} -09/20/2021 17:14:00 - INFO - __main__ - Step 12676: {'lr': 0.0001999996411147569, 'samples': 405632, 'steps': 792, 'loss/train': 3.99200177192688} -09/20/2021 17:14:00 - INFO - __main__ - Step 12677: {'lr': 0.0001999996411147569, 'samples': 405664, 'steps': 792, 'loss/train': 4.405107021331787} -09/20/2021 17:14:01 - INFO - __main__ - Step 12678: {'lr': 0.0001999996411147569, 'samples': 405696, 'steps': 792, 'loss/train': 4.658416271209717} -09/20/2021 17:14:02 - INFO - __main__ - Step 12679: {'lr': 0.0001999996411147569, 'samples': 405728, 'steps': 792, 'loss/train': 4.146568298339844} -09/20/2021 17:14:03 - INFO - __main__ - Step 12680: {'lr': 0.0001999996411147569, 'samples': 405760, 'steps': 792, 'loss/train': 3.9104764461517334} -09/20/2021 17:14:03 - INFO - __main__ - Step 12681: {'lr': 0.0001999996411147569, 'samples': 405792, 'steps': 792, 'loss/train': 2.3711800575256348} -09/20/2021 17:14:04 - INFO - __main__ - Step 12682: {'lr': 0.0001999996411147569, 'samples': 405824, 'steps': 792, 'loss/train': 4.204230785369873} -09/20/2021 17:14:05 - INFO - __main__ - Step 12683: {'lr': 0.0001999996411147569, 'samples': 405856, 'steps': 792, 'loss/train': 4.353430271148682} -09/20/2021 17:14:06 - INFO - __main__ - Step 12684: {'lr': 0.0001999996411147569, 'samples': 405888, 'steps': 792, 'loss/train': 3.5055551528930664} -09/20/2021 17:14:06 - INFO - __main__ - Step 12685: {'lr': 0.0001999996411147569, 'samples': 405920, 'steps': 792, 'loss/train': 1.769175410270691} -09/20/2021 17:14:07 - INFO - __main__ - Step 12686: {'lr': 0.0001999996411147569, 'samples': 405952, 'steps': 792, 'loss/train': 4.270269870758057} -09/20/2021 17:14:08 - INFO - __main__ - Step 12687: {'lr': 0.0001999996411147569, 'samples': 405984, 'steps': 792, 'loss/train': 3.72588849067688} -09/20/2021 17:14:09 - INFO - __main__ - Step 12688: {'lr': 0.0001999996411147569, 'samples': 406016, 'steps': 792, 'loss/train': 3.8085343837738037} -09/20/2021 17:14:10 - INFO - __main__ - Step 12689: {'lr': 0.00019999962382154457, 'samples': 406048, 'steps': 793, 'loss/train': 4.5633463859558105} -09/20/2021 17:14:10 - INFO - __main__ - Step 12690: {'lr': 0.00019999962382154457, 'samples': 406080, 'steps': 793, 'loss/train': 4.527415752410889} -09/20/2021 17:14:11 - INFO - __main__ - Step 12691: {'lr': 0.00019999962382154457, 'samples': 406112, 'steps': 793, 'loss/train': 4.173761367797852} -09/20/2021 17:14:12 - INFO - __main__ - Step 12692: {'lr': 0.00019999962382154457, 'samples': 406144, 'steps': 793, 'loss/train': 3.9749279022216797} -09/20/2021 17:14:13 - INFO - __main__ - Step 12693: {'lr': 0.00019999962382154457, 'samples': 406176, 'steps': 793, 'loss/train': 4.434247016906738} -09/20/2021 17:14:14 - INFO - __main__ - Step 12694: {'lr': 0.00019999962382154457, 'samples': 406208, 'steps': 793, 'loss/train': 3.4283623695373535} -09/20/2021 17:14:15 - INFO - __main__ - Step 12695: {'lr': 0.00019999962382154457, 'samples': 406240, 'steps': 793, 'loss/train': 3.8800108432769775} -09/20/2021 17:14:16 - INFO - __main__ - Step 12696: {'lr': 0.00019999962382154457, 'samples': 406272, 'steps': 793, 'loss/train': 4.921024322509766} -09/20/2021 17:14:16 - INFO - __main__ - Step 12697: {'lr': 0.00019999962382154457, 'samples': 406304, 'steps': 793, 'loss/train': 4.663579940795898} -09/20/2021 17:14:17 - INFO - __main__ - Step 12698: {'lr': 0.00019999962382154457, 'samples': 406336, 'steps': 793, 'loss/train': 6.421381950378418} -09/20/2021 17:14:18 - INFO - __main__ - Step 12699: {'lr': 0.00019999962382154457, 'samples': 406368, 'steps': 793, 'loss/train': 3.6944756507873535} -09/20/2021 17:14:19 - INFO - __main__ - Step 12700: {'lr': 0.00019999962382154457, 'samples': 406400, 'steps': 793, 'loss/train': 2.834099292755127} -09/20/2021 17:14:19 - INFO - __main__ - Step 12701: {'lr': 0.00019999962382154457, 'samples': 406432, 'steps': 793, 'loss/train': 3.8725485801696777} -09/20/2021 17:14:20 - INFO - __main__ - Step 12702: {'lr': 0.00019999962382154457, 'samples': 406464, 'steps': 793, 'loss/train': 3.161961317062378} -09/20/2021 17:14:21 - INFO - __main__ - Step 12703: {'lr': 0.00019999962382154457, 'samples': 406496, 'steps': 793, 'loss/train': 2.5714759826660156} -09/20/2021 17:14:22 - INFO - __main__ - Step 12704: {'lr': 0.00019999962382154457, 'samples': 406528, 'steps': 793, 'loss/train': 2.933316469192505} -09/20/2021 17:14:23 - INFO - __main__ - Step 12705: {'lr': 0.00019999960612143415, 'samples': 406560, 'steps': 794, 'loss/train': 2.8725757598876953} -09/20/2021 17:14:23 - INFO - __main__ - Step 12706: {'lr': 0.00019999960612143415, 'samples': 406592, 'steps': 794, 'loss/train': 2.66756272315979} -09/20/2021 17:14:24 - INFO - __main__ - Step 12707: {'lr': 0.00019999960612143415, 'samples': 406624, 'steps': 794, 'loss/train': 2.8853330612182617} -09/20/2021 17:14:25 - INFO - __main__ - Step 12708: {'lr': 0.00019999960612143415, 'samples': 406656, 'steps': 794, 'loss/train': 2.9812097549438477} -09/20/2021 17:14:26 - INFO - __main__ - Step 12709: {'lr': 0.00019999960612143415, 'samples': 406688, 'steps': 794, 'loss/train': 5.319435119628906} -09/20/2021 17:14:26 - INFO - __main__ - Step 12710: {'lr': 0.00019999960612143415, 'samples': 406720, 'steps': 794, 'loss/train': 3.6390159130096436} -09/20/2021 17:14:27 - INFO - __main__ - Step 12711: {'lr': 0.00019999960612143415, 'samples': 406752, 'steps': 794, 'loss/train': 4.441529750823975} -09/20/2021 17:14:28 - INFO - __main__ - Step 12712: {'lr': 0.00019999960612143415, 'samples': 406784, 'steps': 794, 'loss/train': 5.732016086578369} -09/20/2021 17:14:29 - INFO - __main__ - Step 12713: {'lr': 0.00019999960612143415, 'samples': 406816, 'steps': 794, 'loss/train': 3.931175947189331} -09/20/2021 17:14:29 - INFO - __main__ - Step 12714: {'lr': 0.00019999960612143415, 'samples': 406848, 'steps': 794, 'loss/train': 1.7380962371826172} -09/20/2021 17:14:30 - INFO - __main__ - Step 12715: {'lr': 0.00019999960612143415, 'samples': 406880, 'steps': 794, 'loss/train': 1.4228910207748413} -09/20/2021 17:14:31 - INFO - __main__ - Step 12716: {'lr': 0.00019999960612143415, 'samples': 406912, 'steps': 794, 'loss/train': 1.4544439315795898} -09/20/2021 17:14:32 - INFO - __main__ - Step 12717: {'lr': 0.00019999960612143415, 'samples': 406944, 'steps': 794, 'loss/train': 1.55228853225708} -09/20/2021 17:14:32 - INFO - __main__ - Step 12718: {'lr': 0.00019999960612143415, 'samples': 406976, 'steps': 794, 'loss/train': 2.8527441024780273} -09/20/2021 17:14:33 - INFO - __main__ - Step 12719: {'lr': 0.00019999960612143415, 'samples': 407008, 'steps': 794, 'loss/train': 3.9075746536254883} -09/20/2021 17:14:34 - INFO - __main__ - Step 12720: {'lr': 0.00019999960612143415, 'samples': 407040, 'steps': 794, 'loss/train': 4.512928485870361} -09/20/2021 17:14:35 - INFO - __main__ - Step 12721: {'lr': 0.00019999958801442575, 'samples': 407072, 'steps': 795, 'loss/train': 2.8840651512145996} -09/20/2021 17:14:35 - INFO - __main__ - Step 12722: {'lr': 0.00019999958801442575, 'samples': 407104, 'steps': 795, 'loss/train': 3.5160720348358154} -09/20/2021 17:14:36 - INFO - __main__ - Step 12723: {'lr': 0.00019999958801442575, 'samples': 407136, 'steps': 795, 'loss/train': 3.650529146194458} -09/20/2021 17:14:37 - INFO - __main__ - Step 12724: {'lr': 0.00019999958801442575, 'samples': 407168, 'steps': 795, 'loss/train': 3.347548007965088} -09/20/2021 17:14:38 - INFO - __main__ - Step 12725: {'lr': 0.00019999958801442575, 'samples': 407200, 'steps': 795, 'loss/train': 3.187016487121582} -09/20/2021 17:14:38 - INFO - __main__ - Step 12726: {'lr': 0.00019999958801442575, 'samples': 407232, 'steps': 795, 'loss/train': 3.9911141395568848} -09/20/2021 17:14:39 - INFO - __main__ - Step 12727: {'lr': 0.00019999958801442575, 'samples': 407264, 'steps': 795, 'loss/train': 5.092356204986572} -09/20/2021 17:14:40 - INFO - __main__ - Step 12728: {'lr': 0.00019999958801442575, 'samples': 407296, 'steps': 795, 'loss/train': 4.133018493652344} -09/20/2021 17:14:41 - INFO - __main__ - Step 12729: {'lr': 0.00019999958801442575, 'samples': 407328, 'steps': 795, 'loss/train': 4.703103065490723} -09/20/2021 17:14:41 - INFO - __main__ - Step 12730: {'lr': 0.00019999958801442575, 'samples': 407360, 'steps': 795, 'loss/train': 3.8282153606414795} -09/20/2021 17:14:42 - INFO - __main__ - Step 12731: {'lr': 0.00019999958801442575, 'samples': 407392, 'steps': 795, 'loss/train': 3.778618812561035} -09/20/2021 17:14:43 - INFO - __main__ - Step 12732: {'lr': 0.00019999958801442575, 'samples': 407424, 'steps': 795, 'loss/train': 3.0796656608581543} -09/20/2021 17:14:44 - INFO - __main__ - Step 12733: {'lr': 0.00019999958801442575, 'samples': 407456, 'steps': 795, 'loss/train': 6.693856239318848} -09/20/2021 17:14:45 - INFO - __main__ - Step 12734: {'lr': 0.00019999958801442575, 'samples': 407488, 'steps': 795, 'loss/train': 3.709261178970337} -09/20/2021 17:14:46 - INFO - __main__ - Step 12735: {'lr': 0.00019999958801442575, 'samples': 407520, 'steps': 795, 'loss/train': 5.123893737792969} -09/20/2021 17:14:47 - INFO - __main__ - Step 12736: {'lr': 0.00019999958801442575, 'samples': 407552, 'steps': 795, 'loss/train': 3.971078872680664} -09/20/2021 17:14:47 - INFO - __main__ - Step 12737: {'lr': 0.0001999995695005194, 'samples': 407584, 'steps': 796, 'loss/train': 4.554136753082275} -09/20/2021 17:14:48 - INFO - __main__ - Step 12738: {'lr': 0.0001999995695005194, 'samples': 407616, 'steps': 796, 'loss/train': 4.924213409423828} -09/20/2021 17:14:49 - INFO - __main__ - Step 12739: {'lr': 0.0001999995695005194, 'samples': 407648, 'steps': 796, 'loss/train': 4.666709899902344} -09/20/2021 17:14:50 - INFO - __main__ - Step 12740: {'lr': 0.0001999995695005194, 'samples': 407680, 'steps': 796, 'loss/train': 3.8874881267547607} -09/20/2021 17:14:50 - INFO - __main__ - Step 12741: {'lr': 0.0001999995695005194, 'samples': 407712, 'steps': 796, 'loss/train': 4.269143581390381} -09/20/2021 17:14:51 - INFO - __main__ - Step 12742: {'lr': 0.0001999995695005194, 'samples': 407744, 'steps': 796, 'loss/train': 4.488151550292969} -09/20/2021 17:14:52 - INFO - __main__ - Step 12743: {'lr': 0.0001999995695005194, 'samples': 407776, 'steps': 796, 'loss/train': 4.013187885284424} -09/20/2021 17:14:53 - INFO - __main__ - Step 12744: {'lr': 0.0001999995695005194, 'samples': 407808, 'steps': 796, 'loss/train': 4.224429607391357} -09/20/2021 17:14:53 - INFO - __main__ - Step 12745: {'lr': 0.0001999995695005194, 'samples': 407840, 'steps': 796, 'loss/train': 3.841801881790161} -09/20/2021 17:14:54 - INFO - __main__ - Step 12746: {'lr': 0.0001999995695005194, 'samples': 407872, 'steps': 796, 'loss/train': 4.469857692718506} -09/20/2021 17:14:55 - INFO - __main__ - Step 12747: {'lr': 0.0001999995695005194, 'samples': 407904, 'steps': 796, 'loss/train': 4.270907878875732} -09/20/2021 17:14:56 - INFO - __main__ - Step 12748: {'lr': 0.0001999995695005194, 'samples': 407936, 'steps': 796, 'loss/train': 3.7679483890533447} -09/20/2021 17:14:56 - INFO - __main__ - Step 12749: {'lr': 0.0001999995695005194, 'samples': 407968, 'steps': 796, 'loss/train': 1.8592296838760376} -09/20/2021 17:14:57 - INFO - __main__ - Step 12750: {'lr': 0.0001999995695005194, 'samples': 408000, 'steps': 796, 'loss/train': 3.814861297607422} -09/20/2021 17:14:58 - INFO - __main__ - Step 12751: {'lr': 0.0001999995695005194, 'samples': 408032, 'steps': 796, 'loss/train': 5.3074469566345215} -09/20/2021 17:14:59 - INFO - __main__ - Step 12752: {'lr': 0.0001999995695005194, 'samples': 408064, 'steps': 796, 'loss/train': 4.575798988342285} -09/20/2021 17:15:00 - INFO - __main__ - Step 12753: {'lr': 0.0001999995505797152, 'samples': 408096, 'steps': 797, 'loss/train': 4.979839324951172} -09/20/2021 17:15:00 - INFO - __main__ - Step 12754: {'lr': 0.0001999995505797152, 'samples': 408128, 'steps': 797, 'loss/train': 4.807497978210449} -09/20/2021 17:15:01 - INFO - __main__ - Step 12755: {'lr': 0.0001999995505797152, 'samples': 408160, 'steps': 797, 'loss/train': 0.8097463846206665} -09/20/2021 17:15:02 - INFO - __main__ - Step 12756: {'lr': 0.0001999995505797152, 'samples': 408192, 'steps': 797, 'loss/train': 3.9137065410614014} -09/20/2021 17:15:03 - INFO - __main__ - Step 12757: {'lr': 0.0001999995505797152, 'samples': 408224, 'steps': 797, 'loss/train': 3.8408777713775635} -09/20/2021 17:15:03 - INFO - __main__ - Step 12758: {'lr': 0.0001999995505797152, 'samples': 408256, 'steps': 797, 'loss/train': 1.2235063314437866} -09/20/2021 17:15:04 - INFO - __main__ - Step 12759: {'lr': 0.0001999995505797152, 'samples': 408288, 'steps': 797, 'loss/train': 1.499637484550476} -09/20/2021 17:15:05 - INFO - __main__ - Step 12760: {'lr': 0.0001999995505797152, 'samples': 408320, 'steps': 797, 'loss/train': 1.5969271659851074} -09/20/2021 17:15:06 - INFO - __main__ - Step 12761: {'lr': 0.0001999995505797152, 'samples': 408352, 'steps': 797, 'loss/train': 3.879056453704834} -09/20/2021 17:15:06 - INFO - __main__ - Step 12762: {'lr': 0.0001999995505797152, 'samples': 408384, 'steps': 797, 'loss/train': 3.9962475299835205} -09/20/2021 17:15:07 - INFO - __main__ - Step 12763: {'lr': 0.0001999995505797152, 'samples': 408416, 'steps': 797, 'loss/train': 4.15678071975708} -09/20/2021 17:15:08 - INFO - __main__ - Step 12764: {'lr': 0.0001999995505797152, 'samples': 408448, 'steps': 797, 'loss/train': 5.353755474090576} -09/20/2021 17:15:09 - INFO - __main__ - Step 12765: {'lr': 0.0001999995505797152, 'samples': 408480, 'steps': 797, 'loss/train': 3.9753506183624268} -09/20/2021 17:15:10 - INFO - __main__ - Step 12766: {'lr': 0.0001999995505797152, 'samples': 408512, 'steps': 797, 'loss/train': 4.509060382843018} -09/20/2021 17:15:11 - INFO - __main__ - Step 12767: {'lr': 0.0001999995505797152, 'samples': 408544, 'steps': 797, 'loss/train': 4.595391750335693} -09/20/2021 17:15:11 - INFO - __main__ - Step 12768: {'lr': 0.0001999995505797152, 'samples': 408576, 'steps': 797, 'loss/train': 3.6208441257476807} -09/20/2021 17:15:12 - INFO - __main__ - Step 12769: {'lr': 0.0001999995312520132, 'samples': 408608, 'steps': 798, 'loss/train': 3.8625388145446777} -09/20/2021 17:15:13 - INFO - __main__ - Step 12770: {'lr': 0.0001999995312520132, 'samples': 408640, 'steps': 798, 'loss/train': 4.477494239807129} -09/20/2021 17:15:14 - INFO - __main__ - Step 12771: {'lr': 0.0001999995312520132, 'samples': 408672, 'steps': 798, 'loss/train': 3.98857045173645} -09/20/2021 17:15:15 - INFO - __main__ - Step 12772: {'lr': 0.0001999995312520132, 'samples': 408704, 'steps': 798, 'loss/train': 3.9197356700897217} -09/20/2021 17:15:15 - INFO - __main__ - Step 12773: {'lr': 0.0001999995312520132, 'samples': 408736, 'steps': 798, 'loss/train': 4.816257476806641} -09/20/2021 17:15:16 - INFO - __main__ - Step 12774: {'lr': 0.0001999995312520132, 'samples': 408768, 'steps': 798, 'loss/train': 3.762073516845703} -09/20/2021 17:15:17 - INFO - __main__ - Step 12775: {'lr': 0.0001999995312520132, 'samples': 408800, 'steps': 798, 'loss/train': 3.909452438354492} -09/20/2021 17:15:18 - INFO - __main__ - Step 12776: {'lr': 0.0001999995312520132, 'samples': 408832, 'steps': 798, 'loss/train': 3.868509531021118} -09/20/2021 17:15:18 - INFO - __main__ - Step 12777: {'lr': 0.0001999995312520132, 'samples': 408864, 'steps': 798, 'loss/train': 4.992464065551758} -09/20/2021 17:15:19 - INFO - __main__ - Step 12778: {'lr': 0.0001999995312520132, 'samples': 408896, 'steps': 798, 'loss/train': 5.526097774505615} -09/20/2021 17:15:20 - INFO - __main__ - Step 12779: {'lr': 0.0001999995312520132, 'samples': 408928, 'steps': 798, 'loss/train': 2.774394989013672} -09/20/2021 17:15:21 - INFO - __main__ - Step 12780: {'lr': 0.0001999995312520132, 'samples': 408960, 'steps': 798, 'loss/train': 3.966214656829834} -09/20/2021 17:15:21 - INFO - __main__ - Step 12781: {'lr': 0.0001999995312520132, 'samples': 408992, 'steps': 798, 'loss/train': 3.8227667808532715} -09/20/2021 17:15:22 - INFO - __main__ - Step 12782: {'lr': 0.0001999995312520132, 'samples': 409024, 'steps': 798, 'loss/train': 1.8116611242294312} -09/20/2021 17:15:23 - INFO - __main__ - Step 12783: {'lr': 0.0001999995312520132, 'samples': 409056, 'steps': 798, 'loss/train': 5.003233909606934} -09/20/2021 17:15:24 - INFO - __main__ - Step 12784: {'lr': 0.0001999995312520132, 'samples': 409088, 'steps': 798, 'loss/train': 4.920543670654297} -09/20/2021 17:15:25 - INFO - __main__ - Step 12785: {'lr': 0.0001999995115174135, 'samples': 409120, 'steps': 799, 'loss/train': 4.630156993865967} -09/20/2021 17:15:25 - INFO - __main__ - Step 12786: {'lr': 0.0001999995115174135, 'samples': 409152, 'steps': 799, 'loss/train': 4.030745506286621} -09/20/2021 17:15:26 - INFO - __main__ - Step 12787: {'lr': 0.0001999995115174135, 'samples': 409184, 'steps': 799, 'loss/train': 3.667449951171875} -09/20/2021 17:15:27 - INFO - __main__ - Step 12788: {'lr': 0.0001999995115174135, 'samples': 409216, 'steps': 799, 'loss/train': 4.39162540435791} -09/20/2021 17:15:28 - INFO - __main__ - Step 12789: {'lr': 0.0001999995115174135, 'samples': 409248, 'steps': 799, 'loss/train': 4.323230743408203} -09/20/2021 17:15:28 - INFO - __main__ - Step 12790: {'lr': 0.0001999995115174135, 'samples': 409280, 'steps': 799, 'loss/train': 1.5934929847717285} -09/20/2021 17:15:29 - INFO - __main__ - Step 12791: {'lr': 0.0001999995115174135, 'samples': 409312, 'steps': 799, 'loss/train': 4.09921932220459} -09/20/2021 17:15:30 - INFO - __main__ - Step 12792: {'lr': 0.0001999995115174135, 'samples': 409344, 'steps': 799, 'loss/train': 4.621921539306641} -09/20/2021 17:15:31 - INFO - __main__ - Step 12793: {'lr': 0.0001999995115174135, 'samples': 409376, 'steps': 799, 'loss/train': 3.753744125366211} -09/20/2021 17:15:31 - INFO - __main__ - Step 12794: {'lr': 0.0001999995115174135, 'samples': 409408, 'steps': 799, 'loss/train': 4.1634016036987305} -09/20/2021 17:15:33 - INFO - __main__ - Step 12795: {'lr': 0.0001999995115174135, 'samples': 409440, 'steps': 799, 'loss/train': 4.4895501136779785} -09/20/2021 17:15:33 - INFO - __main__ - Step 12796: {'lr': 0.0001999995115174135, 'samples': 409472, 'steps': 799, 'loss/train': 3.673065185546875} -09/20/2021 17:15:34 - INFO - __main__ - Step 12797: {'lr': 0.0001999995115174135, 'samples': 409504, 'steps': 799, 'loss/train': 4.7223591804504395} -09/20/2021 17:15:35 - INFO - __main__ - Step 12798: {'lr': 0.0001999995115174135, 'samples': 409536, 'steps': 799, 'loss/train': 2.0831685066223145} -09/20/2021 17:15:36 - INFO - __main__ - Step 12799: {'lr': 0.0001999995115174135, 'samples': 409568, 'steps': 799, 'loss/train': 4.914181232452393} -09/20/2021 17:15:36 - INFO - __main__ - Step 12800: {'lr': 0.0001999995115174135, 'samples': 409600, 'steps': 799, 'loss/train': 4.333523273468018} -09/20/2021 17:15:37 - INFO - __main__ - Step 12801: {'lr': 0.0001999994913759162, 'samples': 409632, 'steps': 800, 'loss/train': 4.479361057281494} -09/20/2021 17:15:38 - INFO - __main__ - Step 12802: {'lr': 0.0001999994913759162, 'samples': 409664, 'steps': 800, 'loss/train': 3.5217130184173584} -09/20/2021 17:15:39 - INFO - __main__ - Step 12803: {'lr': 0.0001999994913759162, 'samples': 409696, 'steps': 800, 'loss/train': 3.7042903900146484} -09/20/2021 17:15:40 - INFO - __main__ - Step 12804: {'lr': 0.0001999994913759162, 'samples': 409728, 'steps': 800, 'loss/train': 4.6777024269104} -09/20/2021 17:15:40 - INFO - __main__ - Step 12805: {'lr': 0.0001999994913759162, 'samples': 409760, 'steps': 800, 'loss/train': 4.4436845779418945} -09/20/2021 17:15:41 - INFO - __main__ - Step 12806: {'lr': 0.0001999994913759162, 'samples': 409792, 'steps': 800, 'loss/train': 3.8864846229553223} -09/20/2021 17:15:42 - INFO - __main__ - Step 12807: {'lr': 0.0001999994913759162, 'samples': 409824, 'steps': 800, 'loss/train': 3.8775105476379395} -09/20/2021 17:15:43 - INFO - __main__ - Step 12808: {'lr': 0.0001999994913759162, 'samples': 409856, 'steps': 800, 'loss/train': 4.001714706420898} -09/20/2021 17:15:43 - INFO - __main__ - Step 12809: {'lr': 0.0001999994913759162, 'samples': 409888, 'steps': 800, 'loss/train': 4.601871967315674} -09/20/2021 17:15:44 - INFO - __main__ - Step 12810: {'lr': 0.0001999994913759162, 'samples': 409920, 'steps': 800, 'loss/train': 4.248022079467773} -09/20/2021 17:15:45 - INFO - __main__ - Step 12811: {'lr': 0.0001999994913759162, 'samples': 409952, 'steps': 800, 'loss/train': 4.577456951141357} -09/20/2021 17:15:46 - INFO - __main__ - Step 12812: {'lr': 0.0001999994913759162, 'samples': 409984, 'steps': 800, 'loss/train': 4.126646041870117} -09/20/2021 17:15:46 - INFO - __main__ - Step 12813: {'lr': 0.0001999994913759162, 'samples': 410016, 'steps': 800, 'loss/train': 4.038304805755615} -09/20/2021 17:15:47 - INFO - __main__ - Step 12814: {'lr': 0.0001999994913759162, 'samples': 410048, 'steps': 800, 'loss/train': 4.198471546173096} -09/20/2021 17:15:48 - INFO - __main__ - Step 12815: {'lr': 0.0001999994913759162, 'samples': 410080, 'steps': 800, 'loss/train': 4.805241107940674} -09/20/2021 17:15:49 - INFO - __main__ - Step 12816: {'lr': 0.0001999994913759162, 'samples': 410112, 'steps': 800, 'loss/train': 1.752308964729309} -09/20/2021 17:15:49 - INFO - __main__ - Step 12817: {'lr': 0.00019999947082752133, 'samples': 410144, 'steps': 801, 'loss/train': 1.0191107988357544} -09/20/2021 17:15:50 - INFO - __main__ - Step 12818: {'lr': 0.00019999947082752133, 'samples': 410176, 'steps': 801, 'loss/train': 1.482200264930725} -09/20/2021 17:15:51 - INFO - __main__ - Step 12819: {'lr': 0.00019999947082752133, 'samples': 410208, 'steps': 801, 'loss/train': 1.399036169052124} -09/20/2021 17:15:52 - INFO - __main__ - Step 12820: {'lr': 0.00019999947082752133, 'samples': 410240, 'steps': 801, 'loss/train': 2.6425721645355225} -09/20/2021 17:15:52 - INFO - __main__ - Step 12821: {'lr': 0.00019999947082752133, 'samples': 410272, 'steps': 801, 'loss/train': 4.623939037322998} -09/20/2021 17:15:53 - INFO - __main__ - Step 12822: {'lr': 0.00019999947082752133, 'samples': 410304, 'steps': 801, 'loss/train': 6.475821495056152} -09/20/2021 17:15:54 - INFO - __main__ - Step 12823: {'lr': 0.00019999947082752133, 'samples': 410336, 'steps': 801, 'loss/train': 3.7730748653411865} -09/20/2021 17:15:55 - INFO - __main__ - Step 12824: {'lr': 0.00019999947082752133, 'samples': 410368, 'steps': 801, 'loss/train': 3.432000160217285} -09/20/2021 17:15:55 - INFO - __main__ - Step 12825: {'lr': 0.00019999947082752133, 'samples': 410400, 'steps': 801, 'loss/train': 4.437355995178223} -09/20/2021 17:15:57 - INFO - __main__ - Step 12826: {'lr': 0.00019999947082752133, 'samples': 410432, 'steps': 801, 'loss/train': 4.269493579864502} -09/20/2021 17:15:58 - INFO - __main__ - Step 12827: {'lr': 0.00019999947082752133, 'samples': 410464, 'steps': 801, 'loss/train': 3.985626697540283} -09/20/2021 17:15:58 - INFO - __main__ - Step 12828: {'lr': 0.00019999947082752133, 'samples': 410496, 'steps': 801, 'loss/train': 4.480950832366943} -09/20/2021 17:15:59 - INFO - __main__ - Step 12829: {'lr': 0.00019999947082752133, 'samples': 410528, 'steps': 801, 'loss/train': 4.32623291015625} -09/20/2021 17:16:00 - INFO - __main__ - Step 12830: {'lr': 0.00019999947082752133, 'samples': 410560, 'steps': 801, 'loss/train': 4.270053386688232} -09/20/2021 17:16:01 - INFO - __main__ - Step 12831: {'lr': 0.00019999947082752133, 'samples': 410592, 'steps': 801, 'loss/train': 4.725941181182861} -09/20/2021 17:16:01 - INFO - __main__ - Step 12832: {'lr': 0.00019999947082752133, 'samples': 410624, 'steps': 801, 'loss/train': 3.536025047302246} -09/20/2021 17:16:02 - INFO - __main__ - Step 12833: {'lr': 0.00019999944987222898, 'samples': 410656, 'steps': 802, 'loss/train': 4.487989902496338} -09/20/2021 17:16:03 - INFO - __main__ - Step 12834: {'lr': 0.00019999944987222898, 'samples': 410688, 'steps': 802, 'loss/train': 5.282774448394775} -09/20/2021 17:16:04 - INFO - __main__ - Step 12835: {'lr': 0.00019999944987222898, 'samples': 410720, 'steps': 802, 'loss/train': 4.405673503875732} -09/20/2021 17:16:04 - INFO - __main__ - Step 12836: {'lr': 0.00019999944987222898, 'samples': 410752, 'steps': 802, 'loss/train': 4.267027378082275} -09/20/2021 17:16:05 - INFO - __main__ - Step 12837: {'lr': 0.00019999944987222898, 'samples': 410784, 'steps': 802, 'loss/train': 3.608248710632324} -09/20/2021 17:16:06 - INFO - __main__ - Step 12838: {'lr': 0.00019999944987222898, 'samples': 410816, 'steps': 802, 'loss/train': 4.401447296142578} -09/20/2021 17:16:07 - INFO - __main__ - Step 12839: {'lr': 0.00019999944987222898, 'samples': 410848, 'steps': 802, 'loss/train': 4.875267028808594} -09/20/2021 17:16:07 - INFO - __main__ - Step 12840: {'lr': 0.00019999944987222898, 'samples': 410880, 'steps': 802, 'loss/train': 4.09336519241333} -09/20/2021 17:16:08 - INFO - __main__ - Step 12841: {'lr': 0.00019999944987222898, 'samples': 410912, 'steps': 802, 'loss/train': 5.128800392150879} -09/20/2021 17:16:09 - INFO - __main__ - Step 12842: {'lr': 0.00019999944987222898, 'samples': 410944, 'steps': 802, 'loss/train': 4.331733226776123} -09/20/2021 17:16:10 - INFO - __main__ - Step 12843: {'lr': 0.00019999944987222898, 'samples': 410976, 'steps': 802, 'loss/train': 5.545936584472656} -09/20/2021 17:16:10 - INFO - __main__ - Step 12844: {'lr': 0.00019999944987222898, 'samples': 411008, 'steps': 802, 'loss/train': 4.6916961669921875} -09/20/2021 17:16:11 - INFO - __main__ - Step 12845: {'lr': 0.00019999944987222898, 'samples': 411040, 'steps': 802, 'loss/train': 4.241918087005615} -09/20/2021 17:16:12 - INFO - __main__ - Step 12846: {'lr': 0.00019999944987222898, 'samples': 411072, 'steps': 802, 'loss/train': 3.7814979553222656} -09/20/2021 17:16:13 - INFO - __main__ - Step 12847: {'lr': 0.00019999944987222898, 'samples': 411104, 'steps': 802, 'loss/train': 5.04267692565918} -09/20/2021 17:16:13 - INFO - __main__ - Step 12848: {'lr': 0.00019999944987222898, 'samples': 411136, 'steps': 802, 'loss/train': 4.478496074676514} -09/20/2021 17:16:14 - INFO - __main__ - Step 12849: {'lr': 0.0001999994285100393, 'samples': 411168, 'steps': 803, 'loss/train': 2.726240873336792} -09/20/2021 17:16:15 - INFO - __main__ - Step 12850: {'lr': 0.0001999994285100393, 'samples': 411200, 'steps': 803, 'loss/train': 4.528717994689941} -09/20/2021 17:16:16 - INFO - __main__ - Step 12851: {'lr': 0.0001999994285100393, 'samples': 411232, 'steps': 803, 'loss/train': 3.463517665863037} -09/20/2021 17:16:17 - INFO - __main__ - Step 12852: {'lr': 0.0001999994285100393, 'samples': 411264, 'steps': 803, 'loss/train': 4.610965251922607} -09/20/2021 17:16:17 - INFO - __main__ - Step 12853: {'lr': 0.0001999994285100393, 'samples': 411296, 'steps': 803, 'loss/train': 3.6529572010040283} -09/20/2021 17:16:18 - INFO - __main__ - Step 12854: {'lr': 0.0001999994285100393, 'samples': 411328, 'steps': 803, 'loss/train': 2.9992711544036865} -09/20/2021 17:16:19 - INFO - __main__ - Step 12855: {'lr': 0.0001999994285100393, 'samples': 411360, 'steps': 803, 'loss/train': 4.306686878204346} -09/20/2021 17:16:20 - INFO - __main__ - Step 12856: {'lr': 0.0001999994285100393, 'samples': 411392, 'steps': 803, 'loss/train': 4.595828056335449} -09/20/2021 17:16:21 - INFO - __main__ - Step 12857: {'lr': 0.0001999994285100393, 'samples': 411424, 'steps': 803, 'loss/train': 4.22176456451416} -09/20/2021 17:16:22 - INFO - __main__ - Step 12858: {'lr': 0.0001999994285100393, 'samples': 411456, 'steps': 803, 'loss/train': 1.6800777912139893} -09/20/2021 17:16:22 - INFO - __main__ - Step 12859: {'lr': 0.0001999994285100393, 'samples': 411488, 'steps': 803, 'loss/train': 3.1994121074676514} -09/20/2021 17:16:23 - INFO - __main__ - Step 12860: {'lr': 0.0001999994285100393, 'samples': 411520, 'steps': 803, 'loss/train': 3.820645332336426} -09/20/2021 17:16:24 - INFO - __main__ - Step 12861: {'lr': 0.0001999994285100393, 'samples': 411552, 'steps': 803, 'loss/train': 4.685145378112793} -09/20/2021 17:16:25 - INFO - __main__ - Step 12862: {'lr': 0.0001999994285100393, 'samples': 411584, 'steps': 803, 'loss/train': 4.325254440307617} -09/20/2021 17:16:25 - INFO - __main__ - Step 12863: {'lr': 0.0001999994285100393, 'samples': 411616, 'steps': 803, 'loss/train': 4.624445915222168} -09/20/2021 17:16:26 - INFO - __main__ - Step 12864: {'lr': 0.0001999994285100393, 'samples': 411648, 'steps': 803, 'loss/train': 4.209540367126465} -09/20/2021 17:16:27 - INFO - __main__ - Step 12865: {'lr': 0.00019999940674095233, 'samples': 411680, 'steps': 804, 'loss/train': 4.161425590515137} -09/20/2021 17:16:28 - INFO - __main__ - Step 12866: {'lr': 0.00019999940674095233, 'samples': 411712, 'steps': 804, 'loss/train': 3.726414680480957} -09/20/2021 17:16:28 - INFO - __main__ - Step 12867: {'lr': 0.00019999940674095233, 'samples': 411744, 'steps': 804, 'loss/train': 5.469222068786621} -09/20/2021 17:16:29 - INFO - __main__ - Step 12868: {'lr': 0.00019999940674095233, 'samples': 411776, 'steps': 804, 'loss/train': 3.8134045600891113} -09/20/2021 17:16:30 - INFO - __main__ - Step 12869: {'lr': 0.00019999940674095233, 'samples': 411808, 'steps': 804, 'loss/train': 3.1840062141418457} -09/20/2021 17:16:31 - INFO - __main__ - Step 12870: {'lr': 0.00019999940674095233, 'samples': 411840, 'steps': 804, 'loss/train': 4.664689064025879} -09/20/2021 17:16:31 - INFO - __main__ - Step 12871: {'lr': 0.00019999940674095233, 'samples': 411872, 'steps': 804, 'loss/train': 4.323614597320557} -09/20/2021 17:16:32 - INFO - __main__ - Step 12872: {'lr': 0.00019999940674095233, 'samples': 411904, 'steps': 804, 'loss/train': 5.871425151824951} -09/20/2021 17:16:33 - INFO - __main__ - Step 12873: {'lr': 0.00019999940674095233, 'samples': 411936, 'steps': 804, 'loss/train': 4.209181308746338} -09/20/2021 17:16:34 - INFO - __main__ - Step 12874: {'lr': 0.00019999940674095233, 'samples': 411968, 'steps': 804, 'loss/train': 4.664322376251221} -09/20/2021 17:16:34 - INFO - __main__ - Step 12875: {'lr': 0.00019999940674095233, 'samples': 412000, 'steps': 804, 'loss/train': 2.710369110107422} -09/20/2021 17:16:35 - INFO - __main__ - Step 12876: {'lr': 0.00019999940674095233, 'samples': 412032, 'steps': 804, 'loss/train': 4.192403793334961} -09/20/2021 17:16:36 - INFO - __main__ - Step 12877: {'lr': 0.00019999940674095233, 'samples': 412064, 'steps': 804, 'loss/train': 3.777350664138794} -09/20/2021 17:16:37 - INFO - __main__ - Step 12878: {'lr': 0.00019999940674095233, 'samples': 412096, 'steps': 804, 'loss/train': 4.102631092071533} -09/20/2021 17:16:37 - INFO - __main__ - Step 12879: {'lr': 0.00019999940674095233, 'samples': 412128, 'steps': 804, 'loss/train': 3.466933488845825} -09/20/2021 17:16:38 - INFO - __main__ - Step 12880: {'lr': 0.00019999940674095233, 'samples': 412160, 'steps': 804, 'loss/train': 4.880801677703857} -09/20/2021 17:16:39 - INFO - __main__ - Step 12881: {'lr': 0.00019999938456496813, 'samples': 412192, 'steps': 805, 'loss/train': 4.675688743591309} -09/20/2021 17:16:40 - INFO - __main__ - Step 12882: {'lr': 0.00019999938456496813, 'samples': 412224, 'steps': 805, 'loss/train': 4.207706451416016} -09/20/2021 17:16:41 - INFO - __main__ - Step 12883: {'lr': 0.00019999938456496813, 'samples': 412256, 'steps': 805, 'loss/train': 3.8505239486694336} -09/20/2021 17:16:41 - INFO - __main__ - Step 12884: {'lr': 0.00019999938456496813, 'samples': 412288, 'steps': 805, 'loss/train': 3.9367077350616455} -09/20/2021 17:16:42 - INFO - __main__ - Step 12885: {'lr': 0.00019999938456496813, 'samples': 412320, 'steps': 805, 'loss/train': 4.444403648376465} -09/20/2021 17:16:43 - INFO - __main__ - Step 12886: {'lr': 0.00019999938456496813, 'samples': 412352, 'steps': 805, 'loss/train': 4.363608360290527} -09/20/2021 17:16:44 - INFO - __main__ - Step 12887: {'lr': 0.00019999938456496813, 'samples': 412384, 'steps': 805, 'loss/train': 4.009427547454834} -09/20/2021 17:16:45 - INFO - __main__ - Step 12888: {'lr': 0.00019999938456496813, 'samples': 412416, 'steps': 805, 'loss/train': 3.874497652053833} -09/20/2021 17:16:46 - INFO - __main__ - Step 12889: {'lr': 0.00019999938456496813, 'samples': 412448, 'steps': 805, 'loss/train': 3.7231318950653076} -09/20/2021 17:16:47 - INFO - __main__ - Step 12890: {'lr': 0.00019999938456496813, 'samples': 412480, 'steps': 805, 'loss/train': 3.1723413467407227} -09/20/2021 17:16:48 - INFO - __main__ - Step 12891: {'lr': 0.00019999938456496813, 'samples': 412512, 'steps': 805, 'loss/train': 4.348320007324219} -09/20/2021 17:16:48 - INFO - __main__ - Step 12892: {'lr': 0.00019999938456496813, 'samples': 412544, 'steps': 805, 'loss/train': 4.037775039672852} -09/20/2021 17:16:49 - INFO - __main__ - Step 12893: {'lr': 0.00019999938456496813, 'samples': 412576, 'steps': 805, 'loss/train': 3.2021665573120117} -09/20/2021 17:16:50 - INFO - __main__ - Step 12894: {'lr': 0.00019999938456496813, 'samples': 412608, 'steps': 805, 'loss/train': 4.233974933624268} -09/20/2021 17:16:51 - INFO - __main__ - Step 12895: {'lr': 0.00019999938456496813, 'samples': 412640, 'steps': 805, 'loss/train': 3.5555572509765625} -09/20/2021 17:16:51 - INFO - __main__ - Step 12896: {'lr': 0.00019999938456496813, 'samples': 412672, 'steps': 805, 'loss/train': 3.577910900115967} -09/20/2021 17:16:52 - INFO - __main__ - Step 12897: {'lr': 0.00019999936198208685, 'samples': 412704, 'steps': 806, 'loss/train': 3.86767840385437} -09/20/2021 17:16:53 - INFO - __main__ - Step 12898: {'lr': 0.00019999936198208685, 'samples': 412736, 'steps': 806, 'loss/train': 3.8051583766937256} -09/20/2021 17:16:54 - INFO - __main__ - Step 12899: {'lr': 0.00019999936198208685, 'samples': 412768, 'steps': 806, 'loss/train': 4.123025417327881} -09/20/2021 17:16:54 - INFO - __main__ - Step 12900: {'lr': 0.00019999936198208685, 'samples': 412800, 'steps': 806, 'loss/train': 3.7604238986968994} -09/20/2021 17:16:55 - INFO - __main__ - Step 12901: {'lr': 0.00019999936198208685, 'samples': 412832, 'steps': 806, 'loss/train': 4.797454357147217} -09/20/2021 17:16:56 - INFO - __main__ - Step 12902: {'lr': 0.00019999936198208685, 'samples': 412864, 'steps': 806, 'loss/train': 4.247081756591797} -09/20/2021 17:16:57 - INFO - __main__ - Step 12903: {'lr': 0.00019999936198208685, 'samples': 412896, 'steps': 806, 'loss/train': 3.6742398738861084} -09/20/2021 17:16:57 - INFO - __main__ - Step 12904: {'lr': 0.00019999936198208685, 'samples': 412928, 'steps': 806, 'loss/train': 4.459545135498047} -09/20/2021 17:16:58 - INFO - __main__ - Step 12905: {'lr': 0.00019999936198208685, 'samples': 412960, 'steps': 806, 'loss/train': 3.588306427001953} -09/20/2021 17:16:59 - INFO - __main__ - Step 12906: {'lr': 0.00019999936198208685, 'samples': 412992, 'steps': 806, 'loss/train': 3.312713623046875} -09/20/2021 17:17:00 - INFO - __main__ - Step 12907: {'lr': 0.00019999936198208685, 'samples': 413024, 'steps': 806, 'loss/train': 3.9705610275268555} -09/20/2021 17:17:00 - INFO - __main__ - Step 12908: {'lr': 0.00019999936198208685, 'samples': 413056, 'steps': 806, 'loss/train': 3.6405045986175537} -09/20/2021 17:17:01 - INFO - __main__ - Step 12909: {'lr': 0.00019999936198208685, 'samples': 413088, 'steps': 806, 'loss/train': 3.3417856693267822} -09/20/2021 17:17:02 - INFO - __main__ - Step 12910: {'lr': 0.00019999936198208685, 'samples': 413120, 'steps': 806, 'loss/train': 4.256547451019287} -09/20/2021 17:17:03 - INFO - __main__ - Step 12911: {'lr': 0.00019999936198208685, 'samples': 413152, 'steps': 806, 'loss/train': 3.7995026111602783} -09/20/2021 17:17:03 - INFO - __main__ - Step 12912: {'lr': 0.00019999936198208685, 'samples': 413184, 'steps': 806, 'loss/train': 4.993103504180908} -09/20/2021 17:17:04 - INFO - __main__ - Step 12913: {'lr': 0.00019999933899230853, 'samples': 413216, 'steps': 807, 'loss/train': 2.989496946334839} -09/20/2021 17:17:05 - INFO - __main__ - Step 12914: {'lr': 0.00019999933899230853, 'samples': 413248, 'steps': 807, 'loss/train': 3.4254579544067383} -09/20/2021 17:17:06 - INFO - __main__ - Step 12915: {'lr': 0.00019999933899230853, 'samples': 413280, 'steps': 807, 'loss/train': 2.4548816680908203} -09/20/2021 17:17:07 - INFO - __main__ - Step 12916: {'lr': 0.00019999933899230853, 'samples': 413312, 'steps': 807, 'loss/train': 2.3366239070892334} -09/20/2021 17:17:07 - INFO - __main__ - Step 12917: {'lr': 0.00019999933899230853, 'samples': 413344, 'steps': 807, 'loss/train': 2.6334524154663086} -09/20/2021 17:17:08 - INFO - __main__ - Step 12918: {'lr': 0.00019999933899230853, 'samples': 413376, 'steps': 807, 'loss/train': 3.0323116779327393} -09/20/2021 17:17:09 - INFO - __main__ - Step 12919: {'lr': 0.00019999933899230853, 'samples': 413408, 'steps': 807, 'loss/train': 2.5405097007751465} -09/20/2021 17:17:10 - INFO - __main__ - Step 12920: {'lr': 0.00019999933899230853, 'samples': 413440, 'steps': 807, 'loss/train': 3.586425542831421} -09/20/2021 17:17:10 - INFO - __main__ - Step 12921: {'lr': 0.00019999933899230853, 'samples': 413472, 'steps': 807, 'loss/train': 3.27213978767395} -09/20/2021 17:17:11 - INFO - __main__ - Step 12922: {'lr': 0.00019999933899230853, 'samples': 413504, 'steps': 807, 'loss/train': 0.7695060968399048} -09/20/2021 17:17:12 - INFO - __main__ - Step 12923: {'lr': 0.00019999933899230853, 'samples': 413536, 'steps': 807, 'loss/train': 4.170294284820557} -09/20/2021 17:17:13 - INFO - __main__ - Step 12924: {'lr': 0.00019999933899230853, 'samples': 413568, 'steps': 807, 'loss/train': 4.229313850402832} -09/20/2021 17:17:13 - INFO - __main__ - Step 12925: {'lr': 0.00019999933899230853, 'samples': 413600, 'steps': 807, 'loss/train': 4.770866870880127} -09/20/2021 17:17:14 - INFO - __main__ - Step 12926: {'lr': 0.00019999933899230853, 'samples': 413632, 'steps': 807, 'loss/train': 4.6135149002075195} -09/20/2021 17:17:15 - INFO - __main__ - Step 12927: {'lr': 0.00019999933899230853, 'samples': 413664, 'steps': 807, 'loss/train': 4.230984687805176} -09/20/2021 17:17:16 - INFO - __main__ - Step 12928: {'lr': 0.00019999933899230853, 'samples': 413696, 'steps': 807, 'loss/train': 4.20033597946167} -09/20/2021 17:17:17 - INFO - __main__ - Step 12929: {'lr': 0.0001999993155956333, 'samples': 413728, 'steps': 808, 'loss/train': 2.8992180824279785} -09/20/2021 17:17:18 - INFO - __main__ - Step 12930: {'lr': 0.0001999993155956333, 'samples': 413760, 'steps': 808, 'loss/train': 4.954456329345703} -09/20/2021 17:17:18 - INFO - __main__ - Step 12931: {'lr': 0.0001999993155956333, 'samples': 413792, 'steps': 808, 'loss/train': 4.453046798706055} -09/20/2021 17:17:19 - INFO - __main__ - Step 12932: {'lr': 0.0001999993155956333, 'samples': 413824, 'steps': 808, 'loss/train': 4.331480979919434} -09/20/2021 17:17:20 - INFO - __main__ - Step 12933: {'lr': 0.0001999993155956333, 'samples': 413856, 'steps': 808, 'loss/train': 5.173374652862549} -09/20/2021 17:17:21 - INFO - __main__ - Step 12934: {'lr': 0.0001999993155956333, 'samples': 413888, 'steps': 808, 'loss/train': 4.010056972503662} -09/20/2021 17:17:21 - INFO - __main__ - Step 12935: {'lr': 0.0001999993155956333, 'samples': 413920, 'steps': 808, 'loss/train': 3.7238311767578125} -09/20/2021 17:17:22 - INFO - __main__ - Step 12936: {'lr': 0.0001999993155956333, 'samples': 413952, 'steps': 808, 'loss/train': 4.177578926086426} -09/20/2021 17:17:23 - INFO - __main__ - Step 12937: {'lr': 0.0001999993155956333, 'samples': 413984, 'steps': 808, 'loss/train': 4.395230770111084} -09/20/2021 17:17:24 - INFO - __main__ - Step 12938: {'lr': 0.0001999993155956333, 'samples': 414016, 'steps': 808, 'loss/train': 3.7393319606781006} -09/20/2021 17:17:24 - INFO - __main__ - Step 12939: {'lr': 0.0001999993155956333, 'samples': 414048, 'steps': 808, 'loss/train': 3.942636013031006} -09/20/2021 17:17:25 - INFO - __main__ - Step 12940: {'lr': 0.0001999993155956333, 'samples': 414080, 'steps': 808, 'loss/train': 4.3557024002075195} -09/20/2021 17:17:26 - INFO - __main__ - Step 12941: {'lr': 0.0001999993155956333, 'samples': 414112, 'steps': 808, 'loss/train': 4.230552673339844} -09/20/2021 17:17:27 - INFO - __main__ - Step 12942: {'lr': 0.0001999993155956333, 'samples': 414144, 'steps': 808, 'loss/train': 4.049747467041016} -09/20/2021 17:17:27 - INFO - __main__ - Step 12943: {'lr': 0.0001999993155956333, 'samples': 414176, 'steps': 808, 'loss/train': 3.8624613285064697} -09/20/2021 17:17:28 - INFO - __main__ - Step 12944: {'lr': 0.0001999993155956333, 'samples': 414208, 'steps': 808, 'loss/train': 3.895202875137329} -09/20/2021 17:17:29 - INFO - __main__ - Step 12945: {'lr': 0.00019999929179206126, 'samples': 414240, 'steps': 809, 'loss/train': 3.110624313354492} -09/20/2021 17:17:30 - INFO - __main__ - Step 12946: {'lr': 0.00019999929179206126, 'samples': 414272, 'steps': 809, 'loss/train': 3.1966984272003174} -09/20/2021 17:17:31 - INFO - __main__ - Step 12947: {'lr': 0.00019999929179206126, 'samples': 414304, 'steps': 809, 'loss/train': 2.967503547668457} -09/20/2021 17:17:31 - INFO - __main__ - Step 12948: {'lr': 0.00019999929179206126, 'samples': 414336, 'steps': 809, 'loss/train': 4.158684253692627} -09/20/2021 17:17:32 - INFO - __main__ - Step 12949: {'lr': 0.00019999929179206126, 'samples': 414368, 'steps': 809, 'loss/train': 4.5532546043396} -09/20/2021 17:17:33 - INFO - __main__ - Step 12950: {'lr': 0.00019999929179206126, 'samples': 414400, 'steps': 809, 'loss/train': 4.466666221618652} -09/20/2021 17:17:34 - INFO - __main__ - Step 12951: {'lr': 0.00019999929179206126, 'samples': 414432, 'steps': 809, 'loss/train': 5.262000560760498} -09/20/2021 17:17:34 - INFO - __main__ - Step 12952: {'lr': 0.00019999929179206126, 'samples': 414464, 'steps': 809, 'loss/train': 3.591419219970703} -09/20/2021 17:17:35 - INFO - __main__ - Step 12953: {'lr': 0.00019999929179206126, 'samples': 414496, 'steps': 809, 'loss/train': 4.929917335510254} -09/20/2021 17:17:36 - INFO - __main__ - Step 12954: {'lr': 0.00019999929179206126, 'samples': 414528, 'steps': 809, 'loss/train': 3.9523138999938965} -09/20/2021 17:17:37 - INFO - __main__ - Step 12955: {'lr': 0.00019999929179206126, 'samples': 414560, 'steps': 809, 'loss/train': 2.5679075717926025} -09/20/2021 17:17:37 - INFO - __main__ - Step 12956: {'lr': 0.00019999929179206126, 'samples': 414592, 'steps': 809, 'loss/train': 4.176979064941406} -09/20/2021 17:17:39 - INFO - __main__ - Step 12957: {'lr': 0.00019999929179206126, 'samples': 414624, 'steps': 809, 'loss/train': 4.171136856079102} -09/20/2021 17:17:40 - INFO - __main__ - Step 12958: {'lr': 0.00019999929179206126, 'samples': 414656, 'steps': 809, 'loss/train': 4.626184940338135} -09/20/2021 17:17:41 - INFO - __main__ - Step 12959: {'lr': 0.00019999929179206126, 'samples': 414688, 'steps': 809, 'loss/train': 3.3174257278442383} -09/20/2021 17:17:41 - INFO - __main__ - Step 12960: {'lr': 0.00019999929179206126, 'samples': 414720, 'steps': 809, 'loss/train': 4.287726879119873} -09/20/2021 17:17:42 - INFO - __main__ - Step 12961: {'lr': 0.00019999926758159248, 'samples': 414752, 'steps': 810, 'loss/train': 3.6757757663726807} -09/20/2021 17:17:43 - INFO - __main__ - Step 12962: {'lr': 0.00019999926758159248, 'samples': 414784, 'steps': 810, 'loss/train': 3.089817762374878} -09/20/2021 17:17:44 - INFO - __main__ - Step 12963: {'lr': 0.00019999926758159248, 'samples': 414816, 'steps': 810, 'loss/train': 3.897002696990967} -09/20/2021 17:17:44 - INFO - __main__ - Step 12964: {'lr': 0.00019999926758159248, 'samples': 414848, 'steps': 810, 'loss/train': 4.750665664672852} -09/20/2021 17:17:45 - INFO - __main__ - Step 12965: {'lr': 0.00019999926758159248, 'samples': 414880, 'steps': 810, 'loss/train': 3.8593311309814453} -09/20/2021 17:17:46 - INFO - __main__ - Step 12966: {'lr': 0.00019999926758159248, 'samples': 414912, 'steps': 810, 'loss/train': 4.242072582244873} -09/20/2021 17:17:47 - INFO - __main__ - Step 12967: {'lr': 0.00019999926758159248, 'samples': 414944, 'steps': 810, 'loss/train': 4.46863317489624} -09/20/2021 17:17:47 - INFO - __main__ - Step 12968: {'lr': 0.00019999926758159248, 'samples': 414976, 'steps': 810, 'loss/train': 3.658397912979126} -09/20/2021 17:17:48 - INFO - __main__ - Step 12969: {'lr': 0.00019999926758159248, 'samples': 415008, 'steps': 810, 'loss/train': 3.6949098110198975} -09/20/2021 17:17:49 - INFO - __main__ - Step 12970: {'lr': 0.00019999926758159248, 'samples': 415040, 'steps': 810, 'loss/train': 4.697622776031494} -09/20/2021 17:17:50 - INFO - __main__ - Step 12971: {'lr': 0.00019999926758159248, 'samples': 415072, 'steps': 810, 'loss/train': 5.458834171295166} -09/20/2021 17:17:50 - INFO - __main__ - Step 12972: {'lr': 0.00019999926758159248, 'samples': 415104, 'steps': 810, 'loss/train': 4.085319519042969} -09/20/2021 17:17:51 - INFO - __main__ - Step 12973: {'lr': 0.00019999926758159248, 'samples': 415136, 'steps': 810, 'loss/train': 3.618593692779541} -09/20/2021 17:17:52 - INFO - __main__ - Step 12974: {'lr': 0.00019999926758159248, 'samples': 415168, 'steps': 810, 'loss/train': 4.862817764282227} -09/20/2021 17:17:53 - INFO - __main__ - Step 12975: {'lr': 0.00019999926758159248, 'samples': 415200, 'steps': 810, 'loss/train': 4.190164566040039} -09/20/2021 17:17:53 - INFO - __main__ - Step 12976: {'lr': 0.00019999926758159248, 'samples': 415232, 'steps': 810, 'loss/train': 4.278195858001709} -09/20/2021 17:17:54 - INFO - __main__ - Step 12977: {'lr': 0.00019999924296422707, 'samples': 415264, 'steps': 811, 'loss/train': 4.9221625328063965} -09/20/2021 17:17:55 - INFO - __main__ - Step 12978: {'lr': 0.00019999924296422707, 'samples': 415296, 'steps': 811, 'loss/train': 3.768043279647827} -09/20/2021 17:17:56 - INFO - __main__ - Step 12979: {'lr': 0.00019999924296422707, 'samples': 415328, 'steps': 811, 'loss/train': 4.965723514556885} -09/20/2021 17:17:57 - INFO - __main__ - Step 12980: {'lr': 0.00019999924296422707, 'samples': 415360, 'steps': 811, 'loss/train': 3.3901405334472656} -09/20/2021 17:17:57 - INFO - __main__ - Step 12981: {'lr': 0.00019999924296422707, 'samples': 415392, 'steps': 811, 'loss/train': 3.256420373916626} -09/20/2021 17:17:58 - INFO - __main__ - Step 12982: {'lr': 0.00019999924296422707, 'samples': 415424, 'steps': 811, 'loss/train': 3.874894142150879} -09/20/2021 17:17:59 - INFO - __main__ - Step 12983: {'lr': 0.00019999924296422707, 'samples': 415456, 'steps': 811, 'loss/train': 4.589085102081299} -09/20/2021 17:18:00 - INFO - __main__ - Step 12984: {'lr': 0.00019999924296422707, 'samples': 415488, 'steps': 811, 'loss/train': 4.927199363708496} -09/20/2021 17:18:00 - INFO - __main__ - Step 12985: {'lr': 0.00019999924296422707, 'samples': 415520, 'steps': 811, 'loss/train': 3.268983840942383} -09/20/2021 17:18:01 - INFO - __main__ - Step 12986: {'lr': 0.00019999924296422707, 'samples': 415552, 'steps': 811, 'loss/train': 3.697288990020752} -09/20/2021 17:18:02 - INFO - __main__ - Step 12987: {'lr': 0.00019999924296422707, 'samples': 415584, 'steps': 811, 'loss/train': 3.276038408279419} -09/20/2021 17:18:03 - INFO - __main__ - Step 12988: {'lr': 0.00019999924296422707, 'samples': 415616, 'steps': 811, 'loss/train': 3.688748598098755} -09/20/2021 17:18:03 - INFO - __main__ - Step 12989: {'lr': 0.00019999924296422707, 'samples': 415648, 'steps': 811, 'loss/train': 1.863612413406372} -09/20/2021 17:18:05 - INFO - __main__ - Step 12990: {'lr': 0.00019999924296422707, 'samples': 415680, 'steps': 811, 'loss/train': 3.328345537185669} -09/20/2021 17:18:05 - INFO - __main__ - Step 12991: {'lr': 0.00019999924296422707, 'samples': 415712, 'steps': 811, 'loss/train': 4.7563323974609375} -09/20/2021 17:18:06 - INFO - __main__ - Step 12992: {'lr': 0.00019999924296422707, 'samples': 415744, 'steps': 811, 'loss/train': 3.752995491027832} -09/20/2021 17:18:07 - INFO - __main__ - Step 12993: {'lr': 0.00019999921793996514, 'samples': 415776, 'steps': 812, 'loss/train': 3.5120928287506104} -09/20/2021 17:18:08 - INFO - __main__ - Step 12994: {'lr': 0.00019999921793996514, 'samples': 415808, 'steps': 812, 'loss/train': 4.136435508728027} -09/20/2021 17:18:09 - INFO - __main__ - Step 12995: {'lr': 0.00019999921793996514, 'samples': 415840, 'steps': 812, 'loss/train': 3.9560863971710205} -09/20/2021 17:18:09 - INFO - __main__ - Step 12996: {'lr': 0.00019999921793996514, 'samples': 415872, 'steps': 812, 'loss/train': 4.741512298583984} -09/20/2021 17:18:10 - INFO - __main__ - Step 12997: {'lr': 0.00019999921793996514, 'samples': 415904, 'steps': 812, 'loss/train': 3.88960599899292} -09/20/2021 17:18:11 - INFO - __main__ - Step 12998: {'lr': 0.00019999921793996514, 'samples': 415936, 'steps': 812, 'loss/train': 3.82177734375} -09/20/2021 17:18:12 - INFO - __main__ - Step 12999: {'lr': 0.00019999921793996514, 'samples': 415968, 'steps': 812, 'loss/train': 4.25442361831665} -09/20/2021 17:18:12 - INFO - __main__ - Step 13000: {'lr': 0.00019999921793996514, 'samples': 416000, 'steps': 812, 'loss/train': 4.894994735717773} -09/20/2021 17:18:13 - INFO - __main__ - Step 13001: {'lr': 0.00019999921793996514, 'samples': 416032, 'steps': 812, 'loss/train': 4.986673355102539} -09/20/2021 17:18:14 - INFO - __main__ - Step 13002: {'lr': 0.00019999921793996514, 'samples': 416064, 'steps': 812, 'loss/train': 4.421505928039551} -09/20/2021 17:18:15 - INFO - __main__ - Step 13003: {'lr': 0.00019999921793996514, 'samples': 416096, 'steps': 812, 'loss/train': 4.806142330169678} -09/20/2021 17:18:15 - INFO - __main__ - Step 13004: {'lr': 0.00019999921793996514, 'samples': 416128, 'steps': 812, 'loss/train': 2.972053050994873} -09/20/2021 17:18:16 - INFO - __main__ - Step 13005: {'lr': 0.00019999921793996514, 'samples': 416160, 'steps': 812, 'loss/train': 0.7060786485671997} -09/20/2021 17:18:17 - INFO - __main__ - Step 13006: {'lr': 0.00019999921793996514, 'samples': 416192, 'steps': 812, 'loss/train': 3.8689796924591064} -09/20/2021 17:18:18 - INFO - __main__ - Step 13007: {'lr': 0.00019999921793996514, 'samples': 416224, 'steps': 812, 'loss/train': 4.819457054138184} -09/20/2021 17:18:18 - INFO - __main__ - Step 13008: {'lr': 0.00019999921793996514, 'samples': 416256, 'steps': 812, 'loss/train': 3.971144199371338} -09/20/2021 17:18:19 - INFO - __main__ - Step 13009: {'lr': 0.00019999919250880677, 'samples': 416288, 'steps': 813, 'loss/train': 3.816091299057007} -09/20/2021 17:18:20 - INFO - __main__ - Step 13010: {'lr': 0.00019999919250880677, 'samples': 416320, 'steps': 813, 'loss/train': 3.294355869293213} -09/20/2021 17:18:21 - INFO - __main__ - Step 13011: {'lr': 0.00019999919250880677, 'samples': 416352, 'steps': 813, 'loss/train': 5.456426620483398} -09/20/2021 17:18:22 - INFO - __main__ - Step 13012: {'lr': 0.00019999919250880677, 'samples': 416384, 'steps': 813, 'loss/train': 2.9135982990264893} -09/20/2021 17:18:22 - INFO - __main__ - Step 13013: {'lr': 0.00019999919250880677, 'samples': 416416, 'steps': 813, 'loss/train': 3.590325355529785} -09/20/2021 17:18:23 - INFO - __main__ - Step 13014: {'lr': 0.00019999919250880677, 'samples': 416448, 'steps': 813, 'loss/train': 4.435572147369385} -09/20/2021 17:18:24 - INFO - __main__ - Step 13015: {'lr': 0.00019999919250880677, 'samples': 416480, 'steps': 813, 'loss/train': 4.948478698730469} -09/20/2021 17:18:25 - INFO - __main__ - Step 13016: {'lr': 0.00019999919250880677, 'samples': 416512, 'steps': 813, 'loss/train': 4.25620698928833} -09/20/2021 17:18:25 - INFO - __main__ - Step 13017: {'lr': 0.00019999919250880677, 'samples': 416544, 'steps': 813, 'loss/train': 1.853776454925537} -09/20/2021 17:18:26 - INFO - __main__ - Step 13018: {'lr': 0.00019999919250880677, 'samples': 416576, 'steps': 813, 'loss/train': 4.1850433349609375} -09/20/2021 17:18:27 - INFO - __main__ - Step 13019: {'lr': 0.00019999919250880677, 'samples': 416608, 'steps': 813, 'loss/train': 3.7336790561676025} -09/20/2021 17:18:28 - INFO - __main__ - Step 13020: {'lr': 0.00019999919250880677, 'samples': 416640, 'steps': 813, 'loss/train': 3.9755337238311768} -09/20/2021 17:18:29 - INFO - __main__ - Step 13021: {'lr': 0.00019999919250880677, 'samples': 416672, 'steps': 813, 'loss/train': 4.997709274291992} -09/20/2021 17:18:30 - INFO - __main__ - Step 13022: {'lr': 0.00019999919250880677, 'samples': 416704, 'steps': 813, 'loss/train': 4.719659805297852} -09/20/2021 17:18:30 - INFO - __main__ - Step 13023: {'lr': 0.00019999919250880677, 'samples': 416736, 'steps': 813, 'loss/train': 3.9614779949188232} -09/20/2021 17:18:31 - INFO - __main__ - Step 13024: {'lr': 0.00019999919250880677, 'samples': 416768, 'steps': 813, 'loss/train': 4.967212200164795} -09/20/2021 17:18:32 - INFO - __main__ - Step 13025: {'lr': 0.00019999916667075204, 'samples': 416800, 'steps': 814, 'loss/train': 2.1083242893218994} -09/20/2021 17:18:33 - INFO - __main__ - Step 13026: {'lr': 0.00019999916667075204, 'samples': 416832, 'steps': 814, 'loss/train': 4.517325401306152} -09/20/2021 17:18:33 - INFO - __main__ - Step 13027: {'lr': 0.00019999916667075204, 'samples': 416864, 'steps': 814, 'loss/train': 3.996535062789917} -09/20/2021 17:18:34 - INFO - __main__ - Step 13028: {'lr': 0.00019999916667075204, 'samples': 416896, 'steps': 814, 'loss/train': 4.515016078948975} -09/20/2021 17:18:35 - INFO - __main__ - Step 13029: {'lr': 0.00019999916667075204, 'samples': 416928, 'steps': 814, 'loss/train': 3.7751452922821045} -09/20/2021 17:18:36 - INFO - __main__ - Step 13030: {'lr': 0.00019999916667075204, 'samples': 416960, 'steps': 814, 'loss/train': 4.138591289520264} -09/20/2021 17:18:36 - INFO - __main__ - Step 13031: {'lr': 0.00019999916667075204, 'samples': 416992, 'steps': 814, 'loss/train': 4.563834190368652} -09/20/2021 17:18:37 - INFO - __main__ - Step 13032: {'lr': 0.00019999916667075204, 'samples': 417024, 'steps': 814, 'loss/train': 3.748748540878296} -09/20/2021 17:18:38 - INFO - __main__ - Step 13033: {'lr': 0.00019999916667075204, 'samples': 417056, 'steps': 814, 'loss/train': 4.001470565795898} -09/20/2021 17:18:39 - INFO - __main__ - Step 13034: {'lr': 0.00019999916667075204, 'samples': 417088, 'steps': 814, 'loss/train': 4.543045997619629} -09/20/2021 17:18:39 - INFO - __main__ - Step 13035: {'lr': 0.00019999916667075204, 'samples': 417120, 'steps': 814, 'loss/train': 4.330716609954834} -09/20/2021 17:18:40 - INFO - __main__ - Step 13036: {'lr': 0.00019999916667075204, 'samples': 417152, 'steps': 814, 'loss/train': 1.6933741569519043} -09/20/2021 17:18:41 - INFO - __main__ - Step 13037: {'lr': 0.00019999916667075204, 'samples': 417184, 'steps': 814, 'loss/train': 4.624745845794678} -09/20/2021 17:18:42 - INFO - __main__ - Step 13038: {'lr': 0.00019999916667075204, 'samples': 417216, 'steps': 814, 'loss/train': 4.0459980964660645} -09/20/2021 17:18:42 - INFO - __main__ - Step 13039: {'lr': 0.00019999916667075204, 'samples': 417248, 'steps': 814, 'loss/train': 4.163773536682129} -09/20/2021 17:18:43 - INFO - __main__ - Step 13040: {'lr': 0.00019999916667075204, 'samples': 417280, 'steps': 814, 'loss/train': 4.162492752075195} -09/20/2021 17:18:44 - INFO - __main__ - Step 13041: {'lr': 0.00019999914042580114, 'samples': 417312, 'steps': 815, 'loss/train': 2.3723325729370117} -09/20/2021 17:18:45 - INFO - __main__ - Step 13042: {'lr': 0.00019999914042580114, 'samples': 417344, 'steps': 815, 'loss/train': 4.6562604904174805} -09/20/2021 17:18:46 - INFO - __main__ - Step 13043: {'lr': 0.00019999914042580114, 'samples': 417376, 'steps': 815, 'loss/train': 3.6044206619262695} -09/20/2021 17:18:46 - INFO - __main__ - Step 13044: {'lr': 0.00019999914042580114, 'samples': 417408, 'steps': 815, 'loss/train': 3.1532204151153564} -09/20/2021 17:18:47 - INFO - __main__ - Step 13045: {'lr': 0.00019999914042580114, 'samples': 417440, 'steps': 815, 'loss/train': 3.534578800201416} -09/20/2021 17:18:48 - INFO - __main__ - Step 13046: {'lr': 0.00019999914042580114, 'samples': 417472, 'steps': 815, 'loss/train': 4.04744815826416} -09/20/2021 17:18:49 - INFO - __main__ - Step 13047: {'lr': 0.00019999914042580114, 'samples': 417504, 'steps': 815, 'loss/train': 4.5633955001831055} -09/20/2021 17:18:49 - INFO - __main__ - Step 13048: {'lr': 0.00019999914042580114, 'samples': 417536, 'steps': 815, 'loss/train': 3.5225625038146973} -09/20/2021 17:18:50 - INFO - __main__ - Step 13049: {'lr': 0.00019999914042580114, 'samples': 417568, 'steps': 815, 'loss/train': 6.027340412139893} -09/20/2021 17:18:51 - INFO - __main__ - Step 13050: {'lr': 0.00019999914042580114, 'samples': 417600, 'steps': 815, 'loss/train': 4.035227298736572} -09/20/2021 17:18:52 - INFO - __main__ - Step 13051: {'lr': 0.00019999914042580114, 'samples': 417632, 'steps': 815, 'loss/train': 3.964585065841675} -09/20/2021 17:18:53 - INFO - __main__ - Step 13052: {'lr': 0.00019999914042580114, 'samples': 417664, 'steps': 815, 'loss/train': 3.547205924987793} -09/20/2021 17:18:54 - INFO - __main__ - Step 13053: {'lr': 0.00019999914042580114, 'samples': 417696, 'steps': 815, 'loss/train': 4.626123428344727} -09/20/2021 17:18:54 - INFO - __main__ - Step 13054: {'lr': 0.00019999914042580114, 'samples': 417728, 'steps': 815, 'loss/train': 6.119394302368164} -09/20/2021 17:18:55 - INFO - __main__ - Step 13055: {'lr': 0.00019999914042580114, 'samples': 417760, 'steps': 815, 'loss/train': 6.43768835067749} -09/20/2021 17:18:56 - INFO - __main__ - Step 13056: {'lr': 0.00019999914042580114, 'samples': 417792, 'steps': 815, 'loss/train': 4.9311137199401855} -09/20/2021 17:18:57 - INFO - __main__ - Step 13057: {'lr': 0.0001999991137739541, 'samples': 417824, 'steps': 816, 'loss/train': 3.740478515625} -09/20/2021 17:18:58 - INFO - __main__ - Step 13058: {'lr': 0.0001999991137739541, 'samples': 417856, 'steps': 816, 'loss/train': 3.99627685546875} -09/20/2021 17:18:58 - INFO - __main__ - Step 13059: {'lr': 0.0001999991137739541, 'samples': 417888, 'steps': 816, 'loss/train': 3.7142744064331055} -09/20/2021 17:18:59 - INFO - __main__ - Step 13060: {'lr': 0.0001999991137739541, 'samples': 417920, 'steps': 816, 'loss/train': 3.6847951412200928} -09/20/2021 17:19:00 - INFO - __main__ - Step 13061: {'lr': 0.0001999991137739541, 'samples': 417952, 'steps': 816, 'loss/train': 4.5298919677734375} -09/20/2021 17:19:01 - INFO - __main__ - Step 13062: {'lr': 0.0001999991137739541, 'samples': 417984, 'steps': 816, 'loss/train': 4.543121814727783} -09/20/2021 17:19:01 - INFO - __main__ - Step 13063: {'lr': 0.0001999991137739541, 'samples': 418016, 'steps': 816, 'loss/train': 3.8250067234039307} -09/20/2021 17:19:02 - INFO - __main__ - Step 13064: {'lr': 0.0001999991137739541, 'samples': 418048, 'steps': 816, 'loss/train': 3.8503987789154053} -09/20/2021 17:19:03 - INFO - __main__ - Step 13065: {'lr': 0.0001999991137739541, 'samples': 418080, 'steps': 816, 'loss/train': 4.6082377433776855} -09/20/2021 17:19:04 - INFO - __main__ - Step 13066: {'lr': 0.0001999991137739541, 'samples': 418112, 'steps': 816, 'loss/train': 4.01769495010376} -09/20/2021 17:19:04 - INFO - __main__ - Step 13067: {'lr': 0.0001999991137739541, 'samples': 418144, 'steps': 816, 'loss/train': 3.833949327468872} -09/20/2021 17:19:05 - INFO - __main__ - Step 13068: {'lr': 0.0001999991137739541, 'samples': 418176, 'steps': 816, 'loss/train': 3.96064829826355} -09/20/2021 17:19:06 - INFO - __main__ - Step 13069: {'lr': 0.0001999991137739541, 'samples': 418208, 'steps': 816, 'loss/train': 4.417924880981445} -09/20/2021 17:19:07 - INFO - __main__ - Step 13070: {'lr': 0.0001999991137739541, 'samples': 418240, 'steps': 816, 'loss/train': 4.8874921798706055} -09/20/2021 17:19:07 - INFO - __main__ - Step 13071: {'lr': 0.0001999991137739541, 'samples': 418272, 'steps': 816, 'loss/train': 3.9624836444854736} -09/20/2021 17:19:08 - INFO - __main__ - Step 13072: {'lr': 0.0001999991137739541, 'samples': 418304, 'steps': 816, 'loss/train': 3.7344353199005127} -09/20/2021 17:19:09 - INFO - __main__ - Step 13073: {'lr': 0.00019999908671521107, 'samples': 418336, 'steps': 817, 'loss/train': 3.710301160812378} -09/20/2021 17:19:10 - INFO - __main__ - Step 13074: {'lr': 0.00019999908671521107, 'samples': 418368, 'steps': 817, 'loss/train': 6.486268043518066} -09/20/2021 17:19:10 - INFO - __main__ - Step 13075: {'lr': 0.00019999908671521107, 'samples': 418400, 'steps': 817, 'loss/train': 5.118996620178223} -09/20/2021 17:19:11 - INFO - __main__ - Step 13076: {'lr': 0.00019999908671521107, 'samples': 418432, 'steps': 817, 'loss/train': 4.504016399383545} -09/20/2021 17:19:12 - INFO - __main__ - Step 13077: {'lr': 0.00019999908671521107, 'samples': 418464, 'steps': 817, 'loss/train': 3.926029682159424} -09/20/2021 17:19:13 - INFO - __main__ - Step 13078: {'lr': 0.00019999908671521107, 'samples': 418496, 'steps': 817, 'loss/train': 3.667083740234375} -09/20/2021 17:19:13 - INFO - __main__ - Step 13079: {'lr': 0.00019999908671521107, 'samples': 418528, 'steps': 817, 'loss/train': 3.5596494674682617} -09/20/2021 17:19:14 - INFO - __main__ - Step 13080: {'lr': 0.00019999908671521107, 'samples': 418560, 'steps': 817, 'loss/train': 4.160233974456787} -09/20/2021 17:19:15 - INFO - __main__ - Step 13081: {'lr': 0.00019999908671521107, 'samples': 418592, 'steps': 817, 'loss/train': 3.80606746673584} -09/20/2021 17:19:16 - INFO - __main__ - Step 13082: {'lr': 0.00019999908671521107, 'samples': 418624, 'steps': 817, 'loss/train': 3.7594311237335205} -09/20/2021 17:19:16 - INFO - __main__ - Step 13083: {'lr': 0.00019999908671521107, 'samples': 418656, 'steps': 817, 'loss/train': 4.124363899230957} -09/20/2021 17:19:18 - INFO - __main__ - Step 13084: {'lr': 0.00019999908671521107, 'samples': 418688, 'steps': 817, 'loss/train': 3.0843520164489746} -09/20/2021 17:19:18 - INFO - __main__ - Step 13085: {'lr': 0.00019999908671521107, 'samples': 418720, 'steps': 817, 'loss/train': 3.2347066402435303} -09/20/2021 17:19:19 - INFO - __main__ - Step 13086: {'lr': 0.00019999908671521107, 'samples': 418752, 'steps': 817, 'loss/train': 5.160746097564697} -09/20/2021 17:19:20 - INFO - __main__ - Step 13087: {'lr': 0.00019999908671521107, 'samples': 418784, 'steps': 817, 'loss/train': 4.8345417976379395} -09/20/2021 17:19:21 - INFO - __main__ - Step 13088: {'lr': 0.00019999908671521107, 'samples': 418816, 'steps': 817, 'loss/train': 4.392824649810791} -09/20/2021 17:19:22 - INFO - __main__ - Step 13089: {'lr': 0.0001999990592495721, 'samples': 418848, 'steps': 818, 'loss/train': 3.988158702850342} -09/20/2021 17:19:22 - INFO - __main__ - Step 13090: {'lr': 0.0001999990592495721, 'samples': 418880, 'steps': 818, 'loss/train': 5.734930038452148} -09/20/2021 17:19:23 - INFO - __main__ - Step 13091: {'lr': 0.0001999990592495721, 'samples': 418912, 'steps': 818, 'loss/train': 3.7697670459747314} -09/20/2021 17:19:24 - INFO - __main__ - Step 13092: {'lr': 0.0001999990592495721, 'samples': 418944, 'steps': 818, 'loss/train': 4.525407791137695} -09/20/2021 17:19:25 - INFO - __main__ - Step 13093: {'lr': 0.0001999990592495721, 'samples': 418976, 'steps': 818, 'loss/train': 4.395815849304199} -09/20/2021 17:19:25 - INFO - __main__ - Step 13094: {'lr': 0.0001999990592495721, 'samples': 419008, 'steps': 818, 'loss/train': 4.561460018157959} -09/20/2021 17:19:26 - INFO - __main__ - Step 13095: {'lr': 0.0001999990592495721, 'samples': 419040, 'steps': 818, 'loss/train': 3.7612640857696533} -09/20/2021 17:19:27 - INFO - __main__ - Step 13096: {'lr': 0.0001999990592495721, 'samples': 419072, 'steps': 818, 'loss/train': 4.162590026855469} -09/20/2021 17:19:28 - INFO - __main__ - Step 13097: {'lr': 0.0001999990592495721, 'samples': 419104, 'steps': 818, 'loss/train': 3.527508497238159} -09/20/2021 17:19:28 - INFO - __main__ - Step 13098: {'lr': 0.0001999990592495721, 'samples': 419136, 'steps': 818, 'loss/train': 3.8173654079437256} -09/20/2021 17:19:29 - INFO - __main__ - Step 13099: {'lr': 0.0001999990592495721, 'samples': 419168, 'steps': 818, 'loss/train': 4.949609279632568} -09/20/2021 17:19:30 - INFO - __main__ - Step 13100: {'lr': 0.0001999990592495721, 'samples': 419200, 'steps': 818, 'loss/train': 4.311455249786377} -09/20/2021 17:19:31 - INFO - __main__ - Step 13101: {'lr': 0.0001999990592495721, 'samples': 419232, 'steps': 818, 'loss/train': 3.917886257171631} -09/20/2021 17:19:31 - INFO - __main__ - Step 13102: {'lr': 0.0001999990592495721, 'samples': 419264, 'steps': 818, 'loss/train': 5.149755954742432} -09/20/2021 17:19:32 - INFO - __main__ - Step 13103: {'lr': 0.0001999990592495721, 'samples': 419296, 'steps': 818, 'loss/train': 4.18107271194458} -09/20/2021 17:19:33 - INFO - __main__ - Step 13104: {'lr': 0.0001999990592495721, 'samples': 419328, 'steps': 818, 'loss/train': 2.357550621032715} -09/20/2021 17:19:34 - INFO - __main__ - Step 13105: {'lr': 0.00019999903137703738, 'samples': 419360, 'steps': 819, 'loss/train': 3.000431537628174} -09/20/2021 17:19:34 - INFO - __main__ - Step 13106: {'lr': 0.00019999903137703738, 'samples': 419392, 'steps': 819, 'loss/train': 4.568227291107178} -09/20/2021 17:19:35 - INFO - __main__ - Step 13107: {'lr': 0.00019999903137703738, 'samples': 419424, 'steps': 819, 'loss/train': 4.409794807434082} -09/20/2021 17:19:36 - INFO - __main__ - Step 13108: {'lr': 0.00019999903137703738, 'samples': 419456, 'steps': 819, 'loss/train': 4.620377540588379} -09/20/2021 17:19:37 - INFO - __main__ - Step 13109: {'lr': 0.00019999903137703738, 'samples': 419488, 'steps': 819, 'loss/train': 4.22324800491333} -09/20/2021 17:19:37 - INFO - __main__ - Step 13110: {'lr': 0.00019999903137703738, 'samples': 419520, 'steps': 819, 'loss/train': 4.319800853729248} -09/20/2021 17:19:38 - INFO - __main__ - Step 13111: {'lr': 0.00019999903137703738, 'samples': 419552, 'steps': 819, 'loss/train': 5.313857555389404} -09/20/2021 17:19:39 - INFO - __main__ - Step 13112: {'lr': 0.00019999903137703738, 'samples': 419584, 'steps': 819, 'loss/train': 3.9986491203308105} -09/20/2021 17:19:40 - INFO - __main__ - Step 13113: {'lr': 0.00019999903137703738, 'samples': 419616, 'steps': 819, 'loss/train': 3.8317058086395264} -09/20/2021 17:19:40 - INFO - __main__ - Step 13114: {'lr': 0.00019999903137703738, 'samples': 419648, 'steps': 819, 'loss/train': 1.6799272298812866} -09/20/2021 17:19:41 - INFO - __main__ - Step 13115: {'lr': 0.00019999903137703738, 'samples': 419680, 'steps': 819, 'loss/train': 3.549971103668213} -09/20/2021 17:19:42 - INFO - __main__ - Step 13116: {'lr': 0.00019999903137703738, 'samples': 419712, 'steps': 819, 'loss/train': 3.6508541107177734} -09/20/2021 17:19:43 - INFO - __main__ - Step 13117: {'lr': 0.00019999903137703738, 'samples': 419744, 'steps': 819, 'loss/train': 4.423103332519531} -09/20/2021 17:19:44 - INFO - __main__ - Step 13118: {'lr': 0.00019999903137703738, 'samples': 419776, 'steps': 819, 'loss/train': 3.84169602394104} -09/20/2021 17:19:45 - INFO - __main__ - Step 13119: {'lr': 0.00019999903137703738, 'samples': 419808, 'steps': 819, 'loss/train': 4.629302501678467} -09/20/2021 17:19:45 - INFO - __main__ - Step 13120: {'lr': 0.00019999903137703738, 'samples': 419840, 'steps': 819, 'loss/train': 3.7894983291625977} -09/20/2021 17:19:46 - INFO - __main__ - Step 13121: {'lr': 0.000199999003097607, 'samples': 419872, 'steps': 820, 'loss/train': 3.8654751777648926} -09/20/2021 17:19:47 - INFO - __main__ - Step 13122: {'lr': 0.000199999003097607, 'samples': 419904, 'steps': 820, 'loss/train': 4.04419469833374} -09/20/2021 17:19:48 - INFO - __main__ - Step 13123: {'lr': 0.000199999003097607, 'samples': 419936, 'steps': 820, 'loss/train': 4.5442891120910645} -09/20/2021 17:19:49 - INFO - __main__ - Step 13124: {'lr': 0.000199999003097607, 'samples': 419968, 'steps': 820, 'loss/train': 4.324363708496094} -09/20/2021 17:19:49 - INFO - __main__ - Step 13125: {'lr': 0.000199999003097607, 'samples': 420000, 'steps': 820, 'loss/train': 4.145316123962402} -09/20/2021 17:19:50 - INFO - __main__ - Step 13126: {'lr': 0.000199999003097607, 'samples': 420032, 'steps': 820, 'loss/train': 3.8571486473083496} -09/20/2021 17:19:51 - INFO - __main__ - Step 13127: {'lr': 0.000199999003097607, 'samples': 420064, 'steps': 820, 'loss/train': 3.1921675205230713} -09/20/2021 17:19:52 - INFO - __main__ - Step 13128: {'lr': 0.000199999003097607, 'samples': 420096, 'steps': 820, 'loss/train': 4.533485412597656} -09/20/2021 17:19:52 - INFO - __main__ - Step 13129: {'lr': 0.000199999003097607, 'samples': 420128, 'steps': 820, 'loss/train': 5.369959831237793} -09/20/2021 17:19:53 - INFO - __main__ - Step 13130: {'lr': 0.000199999003097607, 'samples': 420160, 'steps': 820, 'loss/train': 2.9991097450256348} -09/20/2021 17:19:54 - INFO - __main__ - Step 13131: {'lr': 0.000199999003097607, 'samples': 420192, 'steps': 820, 'loss/train': 3.9169869422912598} -09/20/2021 17:19:55 - INFO - __main__ - Step 13132: {'lr': 0.000199999003097607, 'samples': 420224, 'steps': 820, 'loss/train': 4.067293643951416} -09/20/2021 17:19:55 - INFO - __main__ - Step 13133: {'lr': 0.000199999003097607, 'samples': 420256, 'steps': 820, 'loss/train': 4.5132527351379395} -09/20/2021 17:19:56 - INFO - __main__ - Step 13134: {'lr': 0.000199999003097607, 'samples': 420288, 'steps': 820, 'loss/train': 3.3676087856292725} -09/20/2021 17:19:57 - INFO - __main__ - Step 13135: {'lr': 0.000199999003097607, 'samples': 420320, 'steps': 820, 'loss/train': 3.2954962253570557} -09/20/2021 17:19:58 - INFO - __main__ - Step 13136: {'lr': 0.000199999003097607, 'samples': 420352, 'steps': 820, 'loss/train': 4.190021514892578} -09/20/2021 17:19:58 - INFO - __main__ - Step 13137: {'lr': 0.00019999897441128102, 'samples': 420384, 'steps': 821, 'loss/train': 3.9447250366210938} -09/20/2021 17:19:59 - INFO - __main__ - Step 13138: {'lr': 0.00019999897441128102, 'samples': 420416, 'steps': 821, 'loss/train': 3.9908769130706787} -09/20/2021 17:20:00 - INFO - __main__ - Step 13139: {'lr': 0.00019999897441128102, 'samples': 420448, 'steps': 821, 'loss/train': 4.152823448181152} -09/20/2021 17:20:01 - INFO - __main__ - Step 13140: {'lr': 0.00019999897441128102, 'samples': 420480, 'steps': 821, 'loss/train': 4.259876728057861} -09/20/2021 17:20:01 - INFO - __main__ - Step 13141: {'lr': 0.00019999897441128102, 'samples': 420512, 'steps': 821, 'loss/train': 3.294572114944458} -09/20/2021 17:20:02 - INFO - __main__ - Step 13142: {'lr': 0.00019999897441128102, 'samples': 420544, 'steps': 821, 'loss/train': 4.383772373199463} -09/20/2021 17:20:03 - INFO - __main__ - Step 13143: {'lr': 0.00019999897441128102, 'samples': 420576, 'steps': 821, 'loss/train': 3.5806918144226074} -09/20/2021 17:20:04 - INFO - __main__ - Step 13144: {'lr': 0.00019999897441128102, 'samples': 420608, 'steps': 821, 'loss/train': 4.047801971435547} -09/20/2021 17:20:04 - INFO - __main__ - Step 13145: {'lr': 0.00019999897441128102, 'samples': 420640, 'steps': 821, 'loss/train': 4.381851673126221} -09/20/2021 17:20:06 - INFO - __main__ - Step 13146: {'lr': 0.00019999897441128102, 'samples': 420672, 'steps': 821, 'loss/train': 3.588402271270752} -09/20/2021 17:20:06 - INFO - __main__ - Step 13147: {'lr': 0.00019999897441128102, 'samples': 420704, 'steps': 821, 'loss/train': 3.9576938152313232} -09/20/2021 17:20:07 - INFO - __main__ - Step 13148: {'lr': 0.00019999897441128102, 'samples': 420736, 'steps': 821, 'loss/train': 3.8063929080963135} -09/20/2021 17:20:08 - INFO - __main__ - Step 13149: {'lr': 0.00019999897441128102, 'samples': 420768, 'steps': 821, 'loss/train': 4.838873863220215} -09/20/2021 17:20:09 - INFO - __main__ - Step 13150: {'lr': 0.00019999897441128102, 'samples': 420800, 'steps': 821, 'loss/train': 3.8808107376098633} -09/20/2021 17:20:09 - INFO - __main__ - Step 13151: {'lr': 0.00019999897441128102, 'samples': 420832, 'steps': 821, 'loss/train': 3.265174627304077} -09/20/2021 17:20:10 - INFO - __main__ - Step 13152: {'lr': 0.00019999897441128102, 'samples': 420864, 'steps': 821, 'loss/train': 3.7900092601776123} -09/20/2021 17:20:11 - INFO - __main__ - Step 13153: {'lr': 0.00019999894531805965, 'samples': 420896, 'steps': 822, 'loss/train': 3.873499870300293} -09/20/2021 17:20:12 - INFO - __main__ - Step 13154: {'lr': 0.00019999894531805965, 'samples': 420928, 'steps': 822, 'loss/train': 3.4699881076812744} -09/20/2021 17:20:13 - INFO - __main__ - Step 13155: {'lr': 0.00019999894531805965, 'samples': 420960, 'steps': 822, 'loss/train': 3.799405097961426} -09/20/2021 17:20:13 - INFO - __main__ - Step 13156: {'lr': 0.00019999894531805965, 'samples': 420992, 'steps': 822, 'loss/train': 4.184645175933838} -09/20/2021 17:20:14 - INFO - __main__ - Step 13157: {'lr': 0.00019999894531805965, 'samples': 421024, 'steps': 822, 'loss/train': 4.4897847175598145} -09/20/2021 17:20:15 - INFO - __main__ - Step 13158: {'lr': 0.00019999894531805965, 'samples': 421056, 'steps': 822, 'loss/train': 4.005550384521484} -09/20/2021 17:20:16 - INFO - __main__ - Step 13159: {'lr': 0.00019999894531805965, 'samples': 421088, 'steps': 822, 'loss/train': 5.082205772399902} -09/20/2021 17:20:16 - INFO - __main__ - Step 13160: {'lr': 0.00019999894531805965, 'samples': 421120, 'steps': 822, 'loss/train': 3.8383688926696777} -09/20/2021 17:20:17 - INFO - __main__ - Step 13161: {'lr': 0.00019999894531805965, 'samples': 421152, 'steps': 822, 'loss/train': 4.6724677085876465} -09/20/2021 17:20:18 - INFO - __main__ - Step 13162: {'lr': 0.00019999894531805965, 'samples': 421184, 'steps': 822, 'loss/train': 4.3611297607421875} -09/20/2021 17:20:19 - INFO - __main__ - Step 13163: {'lr': 0.00019999894531805965, 'samples': 421216, 'steps': 822, 'loss/train': 5.093181610107422} -09/20/2021 17:20:19 - INFO - __main__ - Step 13164: {'lr': 0.00019999894531805965, 'samples': 421248, 'steps': 822, 'loss/train': 1.4154495000839233} -09/20/2021 17:20:20 - INFO - __main__ - Step 13165: {'lr': 0.00019999894531805965, 'samples': 421280, 'steps': 822, 'loss/train': 3.8266615867614746} -09/20/2021 17:20:21 - INFO - __main__ - Step 13166: {'lr': 0.00019999894531805965, 'samples': 421312, 'steps': 822, 'loss/train': 4.875917911529541} -09/20/2021 17:20:22 - INFO - __main__ - Step 13167: {'lr': 0.00019999894531805965, 'samples': 421344, 'steps': 822, 'loss/train': 3.4492154121398926} -09/20/2021 17:20:22 - INFO - __main__ - Step 13168: {'lr': 0.00019999894531805965, 'samples': 421376, 'steps': 822, 'loss/train': 4.762094974517822} -09/20/2021 17:20:23 - INFO - __main__ - Step 13169: {'lr': 0.00019999891581794294, 'samples': 421408, 'steps': 823, 'loss/train': 3.9263386726379395} -09/20/2021 17:20:24 - INFO - __main__ - Step 13170: {'lr': 0.00019999891581794294, 'samples': 421440, 'steps': 823, 'loss/train': 3.8450613021850586} -09/20/2021 17:20:25 - INFO - __main__ - Step 13171: {'lr': 0.00019999891581794294, 'samples': 421472, 'steps': 823, 'loss/train': 5.189791679382324} -09/20/2021 17:20:25 - INFO - __main__ - Step 13172: {'lr': 0.00019999891581794294, 'samples': 421504, 'steps': 823, 'loss/train': 4.623821258544922} -09/20/2021 17:20:26 - INFO - __main__ - Step 13173: {'lr': 0.00019999891581794294, 'samples': 421536, 'steps': 823, 'loss/train': 3.7993083000183105} -09/20/2021 17:20:27 - INFO - __main__ - Step 13174: {'lr': 0.00019999891581794294, 'samples': 421568, 'steps': 823, 'loss/train': 3.7883498668670654} -09/20/2021 17:20:28 - INFO - __main__ - Step 13175: {'lr': 0.00019999891581794294, 'samples': 421600, 'steps': 823, 'loss/train': 4.3107218742370605} -09/20/2021 17:20:28 - INFO - __main__ - Step 13176: {'lr': 0.00019999891581794294, 'samples': 421632, 'steps': 823, 'loss/train': 3.5190303325653076} -09/20/2021 17:20:30 - INFO - __main__ - Step 13177: {'lr': 0.00019999891581794294, 'samples': 421664, 'steps': 823, 'loss/train': 5.532691478729248} -09/20/2021 17:20:30 - INFO - __main__ - Step 13178: {'lr': 0.00019999891581794294, 'samples': 421696, 'steps': 823, 'loss/train': 4.468084812164307} -09/20/2021 17:20:31 - INFO - __main__ - Step 13179: {'lr': 0.00019999891581794294, 'samples': 421728, 'steps': 823, 'loss/train': 3.613095760345459} -09/20/2021 17:20:32 - INFO - __main__ - Step 13180: {'lr': 0.00019999891581794294, 'samples': 421760, 'steps': 823, 'loss/train': 4.983715057373047} -09/20/2021 17:20:33 - INFO - __main__ - Step 13181: {'lr': 0.00019999891581794294, 'samples': 421792, 'steps': 823, 'loss/train': 4.27334451675415} -09/20/2021 17:20:33 - INFO - __main__ - Step 13182: {'lr': 0.00019999891581794294, 'samples': 421824, 'steps': 823, 'loss/train': 3.832427978515625} -09/20/2021 17:20:34 - INFO - __main__ - Step 13183: {'lr': 0.00019999891581794294, 'samples': 421856, 'steps': 823, 'loss/train': 3.8133153915405273} -09/20/2021 17:20:35 - INFO - __main__ - Step 13184: {'lr': 0.00019999891581794294, 'samples': 421888, 'steps': 823, 'loss/train': 3.292112350463867} -09/20/2021 17:20:36 - INFO - __main__ - Step 13185: {'lr': 0.00019999888591093105, 'samples': 421920, 'steps': 824, 'loss/train': 1.8980093002319336} -09/20/2021 17:20:37 - INFO - __main__ - Step 13186: {'lr': 0.00019999888591093105, 'samples': 421952, 'steps': 824, 'loss/train': 1.529555082321167} -09/20/2021 17:20:37 - INFO - __main__ - Step 13187: {'lr': 0.00019999888591093105, 'samples': 421984, 'steps': 824, 'loss/train': 1.7998528480529785} -09/20/2021 17:20:38 - INFO - __main__ - Step 13188: {'lr': 0.00019999888591093105, 'samples': 422016, 'steps': 824, 'loss/train': 3.923703908920288} -09/20/2021 17:20:39 - INFO - __main__ - Step 13189: {'lr': 0.00019999888591093105, 'samples': 422048, 'steps': 824, 'loss/train': 3.42044997215271} -09/20/2021 17:20:40 - INFO - __main__ - Step 13190: {'lr': 0.00019999888591093105, 'samples': 422080, 'steps': 824, 'loss/train': 4.5185675621032715} -09/20/2021 17:20:40 - INFO - __main__ - Step 13191: {'lr': 0.00019999888591093105, 'samples': 422112, 'steps': 824, 'loss/train': 3.903902769088745} -09/20/2021 17:20:41 - INFO - __main__ - Step 13192: {'lr': 0.00019999888591093105, 'samples': 422144, 'steps': 824, 'loss/train': 4.212377548217773} -09/20/2021 17:20:42 - INFO - __main__ - Step 13193: {'lr': 0.00019999888591093105, 'samples': 422176, 'steps': 824, 'loss/train': 4.151421070098877} -09/20/2021 17:20:43 - INFO - __main__ - Step 13194: {'lr': 0.00019999888591093105, 'samples': 422208, 'steps': 824, 'loss/train': 4.032505512237549} -09/20/2021 17:20:43 - INFO - __main__ - Step 13195: {'lr': 0.00019999888591093105, 'samples': 422240, 'steps': 824, 'loss/train': 4.133058071136475} -09/20/2021 17:20:44 - INFO - __main__ - Step 13196: {'lr': 0.00019999888591093105, 'samples': 422272, 'steps': 824, 'loss/train': 4.406484603881836} -09/20/2021 17:20:45 - INFO - __main__ - Step 13197: {'lr': 0.00019999888591093105, 'samples': 422304, 'steps': 824, 'loss/train': 3.4926395416259766} -09/20/2021 17:20:46 - INFO - __main__ - Step 13198: {'lr': 0.00019999888591093105, 'samples': 422336, 'steps': 824, 'loss/train': 4.061985492706299} -09/20/2021 17:20:46 - INFO - __main__ - Step 13199: {'lr': 0.00019999888591093105, 'samples': 422368, 'steps': 824, 'loss/train': 3.6847875118255615} -09/20/2021 17:20:47 - INFO - __main__ - Step 13200: {'lr': 0.00019999888591093105, 'samples': 422400, 'steps': 824, 'loss/train': 4.28052282333374} -09/20/2021 17:20:48 - INFO - __main__ - Step 13201: {'lr': 0.00019999885559702406, 'samples': 422432, 'steps': 825, 'loss/train': 5.051398277282715} -09/20/2021 17:20:49 - INFO - __main__ - Step 13202: {'lr': 0.00019999885559702406, 'samples': 422464, 'steps': 825, 'loss/train': 4.976864814758301} -09/20/2021 17:20:49 - INFO - __main__ - Step 13203: {'lr': 0.00019999885559702406, 'samples': 422496, 'steps': 825, 'loss/train': 3.811652183532715} -09/20/2021 17:20:50 - INFO - __main__ - Step 13204: {'lr': 0.00019999885559702406, 'samples': 422528, 'steps': 825, 'loss/train': 5.1005754470825195} -09/20/2021 17:20:51 - INFO - __main__ - Step 13205: {'lr': 0.00019999885559702406, 'samples': 422560, 'steps': 825, 'loss/train': 4.4381585121154785} -09/20/2021 17:20:52 - INFO - __main__ - Step 13206: {'lr': 0.00019999885559702406, 'samples': 422592, 'steps': 825, 'loss/train': 4.072188377380371} -09/20/2021 17:20:52 - INFO - __main__ - Step 13207: {'lr': 0.00019999885559702406, 'samples': 422624, 'steps': 825, 'loss/train': 2.9990386962890625} -09/20/2021 17:20:54 - INFO - __main__ - Step 13208: {'lr': 0.00019999885559702406, 'samples': 422656, 'steps': 825, 'loss/train': 3.9877350330352783} -09/20/2021 17:20:55 - INFO - __main__ - Step 13209: {'lr': 0.00019999885559702406, 'samples': 422688, 'steps': 825, 'loss/train': 3.7556252479553223} -09/20/2021 17:20:55 - INFO - __main__ - Step 13210: {'lr': 0.00019999885559702406, 'samples': 422720, 'steps': 825, 'loss/train': 4.370273590087891} -09/20/2021 17:20:56 - INFO - __main__ - Step 13211: {'lr': 0.00019999885559702406, 'samples': 422752, 'steps': 825, 'loss/train': 4.448325157165527} -09/20/2021 17:20:57 - INFO - __main__ - Step 13212: {'lr': 0.00019999885559702406, 'samples': 422784, 'steps': 825, 'loss/train': 4.233177185058594} -09/20/2021 17:20:58 - INFO - __main__ - Step 13213: {'lr': 0.00019999885559702406, 'samples': 422816, 'steps': 825, 'loss/train': 3.5916619300842285} -09/20/2021 17:20:58 - INFO - __main__ - Step 13214: {'lr': 0.00019999885559702406, 'samples': 422848, 'steps': 825, 'loss/train': 3.816451072692871} -09/20/2021 17:20:59 - INFO - __main__ - Step 13215: {'lr': 0.00019999885559702406, 'samples': 422880, 'steps': 825, 'loss/train': 3.1629955768585205} -09/20/2021 17:21:00 - INFO - __main__ - Step 13216: {'lr': 0.00019999885559702406, 'samples': 422912, 'steps': 825, 'loss/train': 3.8705716133117676} -09/20/2021 17:21:01 - INFO - __main__ - Step 13217: {'lr': 0.00019999882487622213, 'samples': 422944, 'steps': 826, 'loss/train': 3.973865032196045} -09/20/2021 17:21:01 - INFO - __main__ - Step 13218: {'lr': 0.00019999882487622213, 'samples': 422976, 'steps': 826, 'loss/train': 3.267526626586914} -09/20/2021 17:21:02 - INFO - __main__ - Step 13219: {'lr': 0.00019999882487622213, 'samples': 423008, 'steps': 826, 'loss/train': 4.875021457672119} -09/20/2021 17:21:03 - INFO - __main__ - Step 13220: {'lr': 0.00019999882487622213, 'samples': 423040, 'steps': 826, 'loss/train': 4.033105850219727} -09/20/2021 17:21:04 - INFO - __main__ - Step 13221: {'lr': 0.00019999882487622213, 'samples': 423072, 'steps': 826, 'loss/train': 4.1432600021362305} -09/20/2021 17:21:04 - INFO - __main__ - Step 13222: {'lr': 0.00019999882487622213, 'samples': 423104, 'steps': 826, 'loss/train': 2.7281136512756348} -09/20/2021 17:21:05 - INFO - __main__ - Step 13223: {'lr': 0.00019999882487622213, 'samples': 423136, 'steps': 826, 'loss/train': 4.266306400299072} -09/20/2021 17:21:06 - INFO - __main__ - Step 13224: {'lr': 0.00019999882487622213, 'samples': 423168, 'steps': 826, 'loss/train': 4.288414478302002} -09/20/2021 17:21:07 - INFO - __main__ - Step 13225: {'lr': 0.00019999882487622213, 'samples': 423200, 'steps': 826, 'loss/train': 4.260138988494873} -09/20/2021 17:21:07 - INFO - __main__ - Step 13226: {'lr': 0.00019999882487622213, 'samples': 423232, 'steps': 826, 'loss/train': 4.099386692047119} -09/20/2021 17:21:08 - INFO - __main__ - Step 13227: {'lr': 0.00019999882487622213, 'samples': 423264, 'steps': 826, 'loss/train': 3.843125820159912} -09/20/2021 17:21:09 - INFO - __main__ - Step 13228: {'lr': 0.00019999882487622213, 'samples': 423296, 'steps': 826, 'loss/train': 4.079999923706055} -09/20/2021 17:21:10 - INFO - __main__ - Step 13229: {'lr': 0.00019999882487622213, 'samples': 423328, 'steps': 826, 'loss/train': 3.505723476409912} -09/20/2021 17:21:10 - INFO - __main__ - Step 13230: {'lr': 0.00019999882487622213, 'samples': 423360, 'steps': 826, 'loss/train': 3.692235231399536} -09/20/2021 17:21:11 - INFO - __main__ - Step 13231: {'lr': 0.00019999882487622213, 'samples': 423392, 'steps': 826, 'loss/train': 3.6967689990997314} -09/20/2021 17:21:12 - INFO - __main__ - Step 13232: {'lr': 0.00019999882487622213, 'samples': 423424, 'steps': 826, 'loss/train': 5.2038092613220215} -09/20/2021 17:21:13 - INFO - __main__ - Step 13233: {'lr': 0.00019999879374852535, 'samples': 423456, 'steps': 827, 'loss/train': 3.9057905673980713} -09/20/2021 17:21:14 - INFO - __main__ - Step 13234: {'lr': 0.00019999879374852535, 'samples': 423488, 'steps': 827, 'loss/train': 4.99953556060791} -09/20/2021 17:21:14 - INFO - __main__ - Step 13235: {'lr': 0.00019999879374852535, 'samples': 423520, 'steps': 827, 'loss/train': 3.6775457859039307} -09/20/2021 17:21:15 - INFO - __main__ - Step 13236: {'lr': 0.00019999879374852535, 'samples': 423552, 'steps': 827, 'loss/train': 3.1537187099456787} -09/20/2021 17:21:16 - INFO - __main__ - Step 13237: {'lr': 0.00019999879374852535, 'samples': 423584, 'steps': 827, 'loss/train': 4.449862480163574} -09/20/2021 17:21:17 - INFO - __main__ - Step 13238: {'lr': 0.00019999879374852535, 'samples': 423616, 'steps': 827, 'loss/train': 4.20688009262085} -09/20/2021 17:21:18 - INFO - __main__ - Step 13239: {'lr': 0.00019999879374852535, 'samples': 423648, 'steps': 827, 'loss/train': 5.13803243637085} -09/20/2021 17:21:19 - INFO - __main__ - Step 13240: {'lr': 0.00019999879374852535, 'samples': 423680, 'steps': 827, 'loss/train': 4.055980205535889} -09/20/2021 17:21:19 - INFO - __main__ - Step 13241: {'lr': 0.00019999879374852535, 'samples': 423712, 'steps': 827, 'loss/train': 3.34928822517395} -09/20/2021 17:21:20 - INFO - __main__ - Step 13242: {'lr': 0.00019999879374852535, 'samples': 423744, 'steps': 827, 'loss/train': 3.5202925205230713} -09/20/2021 17:21:21 - INFO - __main__ - Step 13243: {'lr': 0.00019999879374852535, 'samples': 423776, 'steps': 827, 'loss/train': 5.18527889251709} -09/20/2021 17:21:22 - INFO - __main__ - Step 13244: {'lr': 0.00019999879374852535, 'samples': 423808, 'steps': 827, 'loss/train': 5.793221950531006} -09/20/2021 17:21:22 - INFO - __main__ - Step 13245: {'lr': 0.00019999879374852535, 'samples': 423840, 'steps': 827, 'loss/train': 5.828436374664307} -09/20/2021 17:21:23 - INFO - __main__ - Step 13246: {'lr': 0.00019999879374852535, 'samples': 423872, 'steps': 827, 'loss/train': 5.189996719360352} -09/20/2021 17:21:24 - INFO - __main__ - Step 13247: {'lr': 0.00019999879374852535, 'samples': 423904, 'steps': 827, 'loss/train': 3.9045462608337402} -09/20/2021 17:21:25 - INFO - __main__ - Step 13248: {'lr': 0.00019999879374852535, 'samples': 423936, 'steps': 827, 'loss/train': 4.945547580718994} -09/20/2021 17:21:26 - INFO - __main__ - Step 13249: {'lr': 0.00019999876221393387, 'samples': 423968, 'steps': 828, 'loss/train': 4.257103443145752} -09/20/2021 17:21:26 - INFO - __main__ - Step 13250: {'lr': 0.00019999876221393387, 'samples': 424000, 'steps': 828, 'loss/train': 4.094753265380859} -09/20/2021 17:21:27 - INFO - __main__ - Step 13251: {'lr': 0.00019999876221393387, 'samples': 424032, 'steps': 828, 'loss/train': 5.531219482421875} -09/20/2021 17:21:28 - INFO - __main__ - Step 13252: {'lr': 0.00019999876221393387, 'samples': 424064, 'steps': 828, 'loss/train': 3.2762489318847656} -09/20/2021 17:21:29 - INFO - __main__ - Step 13253: {'lr': 0.00019999876221393387, 'samples': 424096, 'steps': 828, 'loss/train': 3.516158103942871} -09/20/2021 17:21:29 - INFO - __main__ - Step 13254: {'lr': 0.00019999876221393387, 'samples': 424128, 'steps': 828, 'loss/train': 4.65578556060791} -09/20/2021 17:21:30 - INFO - __main__ - Step 13255: {'lr': 0.00019999876221393387, 'samples': 424160, 'steps': 828, 'loss/train': 2.1630048751831055} -09/20/2021 17:21:31 - INFO - __main__ - Step 13256: {'lr': 0.00019999876221393387, 'samples': 424192, 'steps': 828, 'loss/train': 3.383293628692627} -09/20/2021 17:21:32 - INFO - __main__ - Step 13257: {'lr': 0.00019999876221393387, 'samples': 424224, 'steps': 828, 'loss/train': 3.8229122161865234} -09/20/2021 17:21:32 - INFO - __main__ - Step 13258: {'lr': 0.00019999876221393387, 'samples': 424256, 'steps': 828, 'loss/train': 4.09869384765625} -09/20/2021 17:21:33 - INFO - __main__ - Step 13259: {'lr': 0.00019999876221393387, 'samples': 424288, 'steps': 828, 'loss/train': 3.565784454345703} -09/20/2021 17:21:34 - INFO - __main__ - Step 13260: {'lr': 0.00019999876221393387, 'samples': 424320, 'steps': 828, 'loss/train': 3.6540894508361816} -09/20/2021 17:21:35 - INFO - __main__ - Step 13261: {'lr': 0.00019999876221393387, 'samples': 424352, 'steps': 828, 'loss/train': 3.017953872680664} -09/20/2021 17:21:35 - INFO - __main__ - Step 13262: {'lr': 0.00019999876221393387, 'samples': 424384, 'steps': 828, 'loss/train': 5.071017265319824} -09/20/2021 17:21:36 - INFO - __main__ - Step 13263: {'lr': 0.00019999876221393387, 'samples': 424416, 'steps': 828, 'loss/train': 3.397055149078369} -09/20/2021 17:21:37 - INFO - __main__ - Step 13264: {'lr': 0.00019999876221393387, 'samples': 424448, 'steps': 828, 'loss/train': 3.9200727939605713} -09/20/2021 17:21:38 - INFO - __main__ - Step 13265: {'lr': 0.00019999873027244782, 'samples': 424480, 'steps': 829, 'loss/train': 4.283830642700195} -09/20/2021 17:21:38 - INFO - __main__ - Step 13266: {'lr': 0.00019999873027244782, 'samples': 424512, 'steps': 829, 'loss/train': 4.236387252807617} -09/20/2021 17:21:39 - INFO - __main__ - Step 13267: {'lr': 0.00019999873027244782, 'samples': 424544, 'steps': 829, 'loss/train': 4.126161575317383} -09/20/2021 17:21:40 - INFO - __main__ - Step 13268: {'lr': 0.00019999873027244782, 'samples': 424576, 'steps': 829, 'loss/train': 3.8063323497772217} -09/20/2021 17:21:41 - INFO - __main__ - Step 13269: {'lr': 0.00019999873027244782, 'samples': 424608, 'steps': 829, 'loss/train': 4.093848705291748} -09/20/2021 17:21:41 - INFO - __main__ - Step 13270: {'lr': 0.00019999873027244782, 'samples': 424640, 'steps': 829, 'loss/train': 4.370362758636475} -09/20/2021 17:21:43 - INFO - __main__ - Step 13271: {'lr': 0.00019999873027244782, 'samples': 424672, 'steps': 829, 'loss/train': 3.6834042072296143} -09/20/2021 17:21:44 - INFO - __main__ - Step 13272: {'lr': 0.00019999873027244782, 'samples': 424704, 'steps': 829, 'loss/train': 4.198015213012695} -09/20/2021 17:21:45 - INFO - __main__ - Step 13273: {'lr': 0.00019999873027244782, 'samples': 424736, 'steps': 829, 'loss/train': 3.737574577331543} -09/20/2021 17:21:45 - INFO - __main__ - Step 13274: {'lr': 0.00019999873027244782, 'samples': 424768, 'steps': 829, 'loss/train': 4.294305324554443} -09/20/2021 17:21:46 - INFO - __main__ - Step 13275: {'lr': 0.00019999873027244782, 'samples': 424800, 'steps': 829, 'loss/train': 3.8784542083740234} -09/20/2021 17:21:47 - INFO - __main__ - Step 13276: {'lr': 0.00019999873027244782, 'samples': 424832, 'steps': 829, 'loss/train': 4.869704723358154} -09/20/2021 17:21:48 - INFO - __main__ - Step 13277: {'lr': 0.00019999873027244782, 'samples': 424864, 'steps': 829, 'loss/train': 4.494791030883789} -09/20/2021 17:21:48 - INFO - __main__ - Step 13278: {'lr': 0.00019999873027244782, 'samples': 424896, 'steps': 829, 'loss/train': 3.855742931365967} -09/20/2021 17:21:49 - INFO - __main__ - Step 13279: {'lr': 0.00019999873027244782, 'samples': 424928, 'steps': 829, 'loss/train': 3.4008359909057617} -09/20/2021 17:21:50 - INFO - __main__ - Step 13280: {'lr': 0.00019999873027244782, 'samples': 424960, 'steps': 829, 'loss/train': 3.58229398727417} -09/20/2021 17:21:51 - INFO - __main__ - Step 13281: {'lr': 0.00019999869792406734, 'samples': 424992, 'steps': 830, 'loss/train': 3.420916795730591} -09/20/2021 17:21:52 - INFO - __main__ - Step 13282: {'lr': 0.00019999869792406734, 'samples': 425024, 'steps': 830, 'loss/train': 3.5203356742858887} -09/20/2021 17:21:52 - INFO - __main__ - Step 13283: {'lr': 0.00019999869792406734, 'samples': 425056, 'steps': 830, 'loss/train': 4.247054100036621} -09/20/2021 17:21:53 - INFO - __main__ - Step 13284: {'lr': 0.00019999869792406734, 'samples': 425088, 'steps': 830, 'loss/train': 3.1218130588531494} -09/20/2021 17:21:54 - INFO - __main__ - Step 13285: {'lr': 0.00019999869792406734, 'samples': 425120, 'steps': 830, 'loss/train': 3.089711904525757} -09/20/2021 17:21:55 - INFO - __main__ - Step 13286: {'lr': 0.00019999869792406734, 'samples': 425152, 'steps': 830, 'loss/train': 3.3922767639160156} -09/20/2021 17:21:55 - INFO - __main__ - Step 13287: {'lr': 0.00019999869792406734, 'samples': 425184, 'steps': 830, 'loss/train': 3.6814217567443848} -09/20/2021 17:21:56 - INFO - __main__ - Step 13288: {'lr': 0.00019999869792406734, 'samples': 425216, 'steps': 830, 'loss/train': 4.001708507537842} -09/20/2021 17:21:57 - INFO - __main__ - Step 13289: {'lr': 0.00019999869792406734, 'samples': 425248, 'steps': 830, 'loss/train': 5.814835548400879} -09/20/2021 17:21:58 - INFO - __main__ - Step 13290: {'lr': 0.00019999869792406734, 'samples': 425280, 'steps': 830, 'loss/train': 4.085226535797119} -09/20/2021 17:21:58 - INFO - __main__ - Step 13291: {'lr': 0.00019999869792406734, 'samples': 425312, 'steps': 830, 'loss/train': 3.553964614868164} -09/20/2021 17:21:59 - INFO - __main__ - Step 13292: {'lr': 0.00019999869792406734, 'samples': 425344, 'steps': 830, 'loss/train': 3.1820015907287598} -09/20/2021 17:22:00 - INFO - __main__ - Step 13293: {'lr': 0.00019999869792406734, 'samples': 425376, 'steps': 830, 'loss/train': 3.829512357711792} -09/20/2021 17:22:01 - INFO - __main__ - Step 13294: {'lr': 0.00019999869792406734, 'samples': 425408, 'steps': 830, 'loss/train': 4.271641731262207} -09/20/2021 17:22:01 - INFO - __main__ - Step 13295: {'lr': 0.00019999869792406734, 'samples': 425440, 'steps': 830, 'loss/train': 4.214982032775879} -09/20/2021 17:22:02 - INFO - __main__ - Step 13296: {'lr': 0.00019999869792406734, 'samples': 425472, 'steps': 830, 'loss/train': 4.6274895668029785} -09/20/2021 17:22:03 - INFO - __main__ - Step 13297: {'lr': 0.0001999986651687925, 'samples': 425504, 'steps': 831, 'loss/train': 3.9100141525268555} -09/20/2021 17:22:04 - INFO - __main__ - Step 13298: {'lr': 0.0001999986651687925, 'samples': 425536, 'steps': 831, 'loss/train': 4.020129680633545} -09/20/2021 17:22:04 - INFO - __main__ - Step 13299: {'lr': 0.0001999986651687925, 'samples': 425568, 'steps': 831, 'loss/train': 4.175419330596924} -09/20/2021 17:22:05 - INFO - __main__ - Step 13300: {'lr': 0.0001999986651687925, 'samples': 425600, 'steps': 831, 'loss/train': 4.3551740646362305} -09/20/2021 17:22:06 - INFO - __main__ - Step 13301: {'lr': 0.0001999986651687925, 'samples': 425632, 'steps': 831, 'loss/train': 5.482379913330078} -09/20/2021 17:22:07 - INFO - __main__ - Step 13302: {'lr': 0.0001999986651687925, 'samples': 425664, 'steps': 831, 'loss/train': 3.911796808242798} -09/20/2021 17:22:08 - INFO - __main__ - Step 13303: {'lr': 0.0001999986651687925, 'samples': 425696, 'steps': 831, 'loss/train': 3.6945958137512207} -09/20/2021 17:22:09 - INFO - __main__ - Step 13304: {'lr': 0.0001999986651687925, 'samples': 425728, 'steps': 831, 'loss/train': 4.9799418449401855} -09/20/2021 17:22:10 - INFO - __main__ - Step 13305: {'lr': 0.0001999986651687925, 'samples': 425760, 'steps': 831, 'loss/train': 5.013979911804199} -09/20/2021 17:22:10 - INFO - __main__ - Step 13306: {'lr': 0.0001999986651687925, 'samples': 425792, 'steps': 831, 'loss/train': 3.7983241081237793} -09/20/2021 17:22:11 - INFO - __main__ - Step 13307: {'lr': 0.0001999986651687925, 'samples': 425824, 'steps': 831, 'loss/train': 4.011417865753174} -09/20/2021 17:22:12 - INFO - __main__ - Step 13308: {'lr': 0.0001999986651687925, 'samples': 425856, 'steps': 831, 'loss/train': 3.765367269515991} -09/20/2021 17:22:13 - INFO - __main__ - Step 13309: {'lr': 0.0001999986651687925, 'samples': 425888, 'steps': 831, 'loss/train': 4.747297286987305} -09/20/2021 17:22:13 - INFO - __main__ - Step 13310: {'lr': 0.0001999986651687925, 'samples': 425920, 'steps': 831, 'loss/train': 4.246455192565918} -09/20/2021 17:22:14 - INFO - __main__ - Step 13311: {'lr': 0.0001999986651687925, 'samples': 425952, 'steps': 831, 'loss/train': 4.195315361022949} -09/20/2021 17:22:15 - INFO - __main__ - Step 13312: {'lr': 0.0001999986651687925, 'samples': 425984, 'steps': 831, 'loss/train': 5.442715167999268} -09/20/2021 17:22:16 - INFO - __main__ - Step 13313: {'lr': 0.00019999863200662353, 'samples': 426016, 'steps': 832, 'loss/train': 4.470644474029541} -09/20/2021 17:22:16 - INFO - __main__ - Step 13314: {'lr': 0.00019999863200662353, 'samples': 426048, 'steps': 832, 'loss/train': 2.4253294467926025} -09/20/2021 17:22:17 - INFO - __main__ - Step 13315: {'lr': 0.00019999863200662353, 'samples': 426080, 'steps': 832, 'loss/train': 7.403284072875977} -09/20/2021 17:22:18 - INFO - __main__ - Step 13316: {'lr': 0.00019999863200662353, 'samples': 426112, 'steps': 832, 'loss/train': 7.365134239196777} -09/20/2021 17:22:19 - INFO - __main__ - Step 13317: {'lr': 0.00019999863200662353, 'samples': 426144, 'steps': 832, 'loss/train': 3.98517107963562} -09/20/2021 17:22:19 - INFO - __main__ - Step 13318: {'lr': 0.00019999863200662353, 'samples': 426176, 'steps': 832, 'loss/train': 4.587787628173828} -09/20/2021 17:22:20 - INFO - __main__ - Step 13319: {'lr': 0.00019999863200662353, 'samples': 426208, 'steps': 832, 'loss/train': 4.212495803833008} -09/20/2021 17:22:21 - INFO - __main__ - Step 13320: {'lr': 0.00019999863200662353, 'samples': 426240, 'steps': 832, 'loss/train': 4.192691326141357} -09/20/2021 17:22:22 - INFO - __main__ - Step 13321: {'lr': 0.00019999863200662353, 'samples': 426272, 'steps': 832, 'loss/train': 4.101686477661133} -09/20/2021 17:22:22 - INFO - __main__ - Step 13322: {'lr': 0.00019999863200662353, 'samples': 426304, 'steps': 832, 'loss/train': 4.46851110458374} -09/20/2021 17:22:23 - INFO - __main__ - Step 13323: {'lr': 0.00019999863200662353, 'samples': 426336, 'steps': 832, 'loss/train': 3.8579964637756348} -09/20/2021 17:22:24 - INFO - __main__ - Step 13324: {'lr': 0.00019999863200662353, 'samples': 426368, 'steps': 832, 'loss/train': 4.0081329345703125} -09/20/2021 17:22:25 - INFO - __main__ - Step 13325: {'lr': 0.00019999863200662353, 'samples': 426400, 'steps': 832, 'loss/train': 4.475008010864258} -09/20/2021 17:22:25 - INFO - __main__ - Step 13326: {'lr': 0.00019999863200662353, 'samples': 426432, 'steps': 832, 'loss/train': 4.317285060882568} -09/20/2021 17:22:26 - INFO - __main__ - Step 13327: {'lr': 0.00019999863200662353, 'samples': 426464, 'steps': 832, 'loss/train': 3.8131520748138428} -09/20/2021 17:22:27 - INFO - __main__ - Step 13328: {'lr': 0.00019999863200662353, 'samples': 426496, 'steps': 832, 'loss/train': 4.183721542358398} -09/20/2021 17:22:28 - INFO - __main__ - Step 13329: {'lr': 0.00019999859843756047, 'samples': 426528, 'steps': 833, 'loss/train': 3.4916162490844727} -09/20/2021 17:22:29 - INFO - __main__ - Step 13330: {'lr': 0.00019999859843756047, 'samples': 426560, 'steps': 833, 'loss/train': 4.584217548370361} -09/20/2021 17:22:29 - INFO - __main__ - Step 13331: {'lr': 0.00019999859843756047, 'samples': 426592, 'steps': 833, 'loss/train': 4.758711338043213} -09/20/2021 17:22:30 - INFO - __main__ - Step 13332: {'lr': 0.00019999859843756047, 'samples': 426624, 'steps': 833, 'loss/train': 4.019218921661377} -09/20/2021 17:22:31 - INFO - __main__ - Step 13333: {'lr': 0.00019999859843756047, 'samples': 426656, 'steps': 833, 'loss/train': 5.0515899658203125} -09/20/2021 17:22:32 - INFO - __main__ - Step 13334: {'lr': 0.00019999859843756047, 'samples': 426688, 'steps': 833, 'loss/train': 4.654232978820801} -09/20/2021 17:22:33 - INFO - __main__ - Step 13335: {'lr': 0.00019999859843756047, 'samples': 426720, 'steps': 833, 'loss/train': 4.093780040740967} -09/20/2021 17:22:34 - INFO - __main__ - Step 13336: {'lr': 0.00019999859843756047, 'samples': 426752, 'steps': 833, 'loss/train': 4.029789924621582} -09/20/2021 17:22:34 - INFO - __main__ - Step 13337: {'lr': 0.00019999859843756047, 'samples': 426784, 'steps': 833, 'loss/train': 4.181129455566406} -09/20/2021 17:22:35 - INFO - __main__ - Step 13338: {'lr': 0.00019999859843756047, 'samples': 426816, 'steps': 833, 'loss/train': 3.4623947143554688} -09/20/2021 17:22:36 - INFO - __main__ - Step 13339: {'lr': 0.00019999859843756047, 'samples': 426848, 'steps': 833, 'loss/train': 4.574141025543213} -09/20/2021 17:22:37 - INFO - __main__ - Step 13340: {'lr': 0.00019999859843756047, 'samples': 426880, 'steps': 833, 'loss/train': 3.234100341796875} -09/20/2021 17:22:37 - INFO - __main__ - Step 13341: {'lr': 0.00019999859843756047, 'samples': 426912, 'steps': 833, 'loss/train': 3.818758964538574} -09/20/2021 17:22:38 - INFO - __main__ - Step 13342: {'lr': 0.00019999859843756047, 'samples': 426944, 'steps': 833, 'loss/train': 4.386695861816406} -09/20/2021 17:22:39 - INFO - __main__ - Step 13343: {'lr': 0.00019999859843756047, 'samples': 426976, 'steps': 833, 'loss/train': 3.495774984359741} -09/20/2021 17:22:40 - INFO - __main__ - Step 13344: {'lr': 0.00019999859843756047, 'samples': 427008, 'steps': 833, 'loss/train': 3.393763303756714} -09/20/2021 17:22:41 - INFO - __main__ - Step 13345: {'lr': 0.00019999856446160355, 'samples': 427040, 'steps': 834, 'loss/train': 3.9988107681274414} -09/20/2021 17:22:41 - INFO - __main__ - Step 13346: {'lr': 0.00019999856446160355, 'samples': 427072, 'steps': 834, 'loss/train': 4.889581680297852} -09/20/2021 17:22:42 - INFO - __main__ - Step 13347: {'lr': 0.00019999856446160355, 'samples': 427104, 'steps': 834, 'loss/train': 3.3734734058380127} -09/20/2021 17:22:43 - INFO - __main__ - Step 13348: {'lr': 0.00019999856446160355, 'samples': 427136, 'steps': 834, 'loss/train': 3.2510318756103516} -09/20/2021 17:22:44 - INFO - __main__ - Step 13349: {'lr': 0.00019999856446160355, 'samples': 427168, 'steps': 834, 'loss/train': 4.89572811126709} -09/20/2021 17:22:44 - INFO - __main__ - Step 13350: {'lr': 0.00019999856446160355, 'samples': 427200, 'steps': 834, 'loss/train': 2.151693820953369} -09/20/2021 17:22:45 - INFO - __main__ - Step 13351: {'lr': 0.00019999856446160355, 'samples': 427232, 'steps': 834, 'loss/train': 2.9123122692108154} -09/20/2021 17:22:46 - INFO - __main__ - Step 13352: {'lr': 0.00019999856446160355, 'samples': 427264, 'steps': 834, 'loss/train': 4.649178504943848} -09/20/2021 17:22:47 - INFO - __main__ - Step 13353: {'lr': 0.00019999856446160355, 'samples': 427296, 'steps': 834, 'loss/train': 3.579908847808838} -09/20/2021 17:22:47 - INFO - __main__ - Step 13354: {'lr': 0.00019999856446160355, 'samples': 427328, 'steps': 834, 'loss/train': 3.917099952697754} -09/20/2021 17:22:48 - INFO - __main__ - Step 13355: {'lr': 0.00019999856446160355, 'samples': 427360, 'steps': 834, 'loss/train': 3.234571695327759} -09/20/2021 17:22:49 - INFO - __main__ - Step 13356: {'lr': 0.00019999856446160355, 'samples': 427392, 'steps': 834, 'loss/train': 4.424201965332031} -09/20/2021 17:22:50 - INFO - __main__ - Step 13357: {'lr': 0.00019999856446160355, 'samples': 427424, 'steps': 834, 'loss/train': 4.393004417419434} -09/20/2021 17:22:50 - INFO - __main__ - Step 13358: {'lr': 0.00019999856446160355, 'samples': 427456, 'steps': 834, 'loss/train': 4.471902847290039} -09/20/2021 17:22:51 - INFO - __main__ - Step 13359: {'lr': 0.00019999856446160355, 'samples': 427488, 'steps': 834, 'loss/train': 4.411074638366699} -09/20/2021 17:22:52 - INFO - __main__ - Step 13360: {'lr': 0.00019999856446160355, 'samples': 427520, 'steps': 834, 'loss/train': 3.4288508892059326} -09/20/2021 17:22:53 - INFO - __main__ - Step 13361: {'lr': 0.00019999853007875282, 'samples': 427552, 'steps': 835, 'loss/train': 4.675498962402344} -09/20/2021 17:22:53 - INFO - __main__ - Step 13362: {'lr': 0.00019999853007875282, 'samples': 427584, 'steps': 835, 'loss/train': 3.949014902114868} -09/20/2021 17:22:54 - INFO - __main__ - Step 13363: {'lr': 0.00019999853007875282, 'samples': 427616, 'steps': 835, 'loss/train': 4.53362512588501} -09/20/2021 17:22:55 - INFO - __main__ - Step 13364: {'lr': 0.00019999853007875282, 'samples': 427648, 'steps': 835, 'loss/train': 4.1190643310546875} -09/20/2021 17:22:56 - INFO - __main__ - Step 13365: {'lr': 0.00019999853007875282, 'samples': 427680, 'steps': 835, 'loss/train': 3.6188902854919434} -09/20/2021 17:22:57 - INFO - __main__ - Step 13366: {'lr': 0.00019999853007875282, 'samples': 427712, 'steps': 835, 'loss/train': 3.8958444595336914} -09/20/2021 17:22:58 - INFO - __main__ - Step 13367: {'lr': 0.00019999853007875282, 'samples': 427744, 'steps': 835, 'loss/train': 2.177649974822998} -09/20/2021 17:22:59 - INFO - __main__ - Step 13368: {'lr': 0.00019999853007875282, 'samples': 427776, 'steps': 835, 'loss/train': 4.183998107910156} -09/20/2021 17:22:59 - INFO - __main__ - Step 13369: {'lr': 0.00019999853007875282, 'samples': 427808, 'steps': 835, 'loss/train': 3.5582969188690186} -09/20/2021 17:23:00 - INFO - __main__ - Step 13370: {'lr': 0.00019999853007875282, 'samples': 427840, 'steps': 835, 'loss/train': 3.584099054336548} -09/20/2021 17:23:01 - INFO - __main__ - Step 13371: {'lr': 0.00019999853007875282, 'samples': 427872, 'steps': 835, 'loss/train': 3.7559878826141357} -09/20/2021 17:23:02 - INFO - __main__ - Step 13372: {'lr': 0.00019999853007875282, 'samples': 427904, 'steps': 835, 'loss/train': 3.95371675491333} -09/20/2021 17:23:02 - INFO - __main__ - Step 13373: {'lr': 0.00019999853007875282, 'samples': 427936, 'steps': 835, 'loss/train': 3.8867897987365723} -09/20/2021 17:23:03 - INFO - __main__ - Step 13374: {'lr': 0.00019999853007875282, 'samples': 427968, 'steps': 835, 'loss/train': 3.6724040508270264} -09/20/2021 17:23:04 - INFO - __main__ - Step 13375: {'lr': 0.00019999853007875282, 'samples': 428000, 'steps': 835, 'loss/train': 3.806276321411133} -09/20/2021 17:23:05 - INFO - __main__ - Step 13376: {'lr': 0.00019999853007875282, 'samples': 428032, 'steps': 835, 'loss/train': 1.8548110723495483} -09/20/2021 17:23:05 - INFO - __main__ - Step 13377: {'lr': 0.00019999849528900846, 'samples': 428064, 'steps': 836, 'loss/train': 3.808619976043701} -09/20/2021 17:23:06 - INFO - __main__ - Step 13378: {'lr': 0.00019999849528900846, 'samples': 428096, 'steps': 836, 'loss/train': 3.4945828914642334} -09/20/2021 17:23:07 - INFO - __main__ - Step 13379: {'lr': 0.00019999849528900846, 'samples': 428128, 'steps': 836, 'loss/train': 4.9143171310424805} -09/20/2021 17:23:08 - INFO - __main__ - Step 13380: {'lr': 0.00019999849528900846, 'samples': 428160, 'steps': 836, 'loss/train': 3.044736385345459} -09/20/2021 17:23:08 - INFO - __main__ - Step 13381: {'lr': 0.00019999849528900846, 'samples': 428192, 'steps': 836, 'loss/train': 3.397188901901245} -09/20/2021 17:23:09 - INFO - __main__ - Step 13382: {'lr': 0.00019999849528900846, 'samples': 428224, 'steps': 836, 'loss/train': 1.2731144428253174} -09/20/2021 17:23:10 - INFO - __main__ - Step 13383: {'lr': 0.00019999849528900846, 'samples': 428256, 'steps': 836, 'loss/train': 1.233879566192627} -09/20/2021 17:23:11 - INFO - __main__ - Step 13384: {'lr': 0.00019999849528900846, 'samples': 428288, 'steps': 836, 'loss/train': 1.3846274614334106} -09/20/2021 17:23:11 - INFO - __main__ - Step 13385: {'lr': 0.00019999849528900846, 'samples': 428320, 'steps': 836, 'loss/train': 3.344517469406128} -09/20/2021 17:23:12 - INFO - __main__ - Step 13386: {'lr': 0.00019999849528900846, 'samples': 428352, 'steps': 836, 'loss/train': 4.106280326843262} -09/20/2021 17:23:13 - INFO - __main__ - Step 13387: {'lr': 0.00019999849528900846, 'samples': 428384, 'steps': 836, 'loss/train': 4.245086193084717} -09/20/2021 17:23:14 - INFO - __main__ - Step 13388: {'lr': 0.00019999849528900846, 'samples': 428416, 'steps': 836, 'loss/train': 4.0856242179870605} -09/20/2021 17:23:14 - INFO - __main__ - Step 13389: {'lr': 0.00019999849528900846, 'samples': 428448, 'steps': 836, 'loss/train': 4.1073174476623535} -09/20/2021 17:23:15 - INFO - __main__ - Step 13390: {'lr': 0.00019999849528900846, 'samples': 428480, 'steps': 836, 'loss/train': 4.445667743682861} -09/20/2021 17:23:16 - INFO - __main__ - Step 13391: {'lr': 0.00019999849528900846, 'samples': 428512, 'steps': 836, 'loss/train': 3.539788007736206} -09/20/2021 17:23:17 - INFO - __main__ - Step 13392: {'lr': 0.00019999849528900846, 'samples': 428544, 'steps': 836, 'loss/train': 4.394167423248291} -09/20/2021 17:23:18 - INFO - __main__ - Step 13393: {'lr': 0.00019999846009237065, 'samples': 428576, 'steps': 837, 'loss/train': 4.429690837860107} -09/20/2021 17:23:18 - INFO - __main__ - Step 13394: {'lr': 0.00019999846009237065, 'samples': 428608, 'steps': 837, 'loss/train': 3.562028408050537} -09/20/2021 17:23:19 - INFO - __main__ - Step 13395: {'lr': 0.00019999846009237065, 'samples': 428640, 'steps': 837, 'loss/train': 3.478727102279663} -09/20/2021 17:23:20 - INFO - __main__ - Step 13396: {'lr': 0.00019999846009237065, 'samples': 428672, 'steps': 837, 'loss/train': 3.91408634185791} -09/20/2021 17:23:21 - INFO - __main__ - Step 13397: {'lr': 0.00019999846009237065, 'samples': 428704, 'steps': 837, 'loss/train': 3.5882785320281982} -09/20/2021 17:23:22 - INFO - __main__ - Step 13398: {'lr': 0.00019999846009237065, 'samples': 428736, 'steps': 837, 'loss/train': 3.5845634937286377} -09/20/2021 17:23:23 - INFO - __main__ - Step 13399: {'lr': 0.00019999846009237065, 'samples': 428768, 'steps': 837, 'loss/train': 3.313443660736084} -09/20/2021 17:23:23 - INFO - __main__ - Step 13400: {'lr': 0.00019999846009237065, 'samples': 428800, 'steps': 837, 'loss/train': 4.203221321105957} -09/20/2021 17:23:24 - INFO - __main__ - Step 13401: {'lr': 0.00019999846009237065, 'samples': 428832, 'steps': 837, 'loss/train': 4.2425079345703125} -09/20/2021 17:23:25 - INFO - __main__ - Step 13402: {'lr': 0.00019999846009237065, 'samples': 428864, 'steps': 837, 'loss/train': 3.560814142227173} -09/20/2021 17:23:26 - INFO - __main__ - Step 13403: {'lr': 0.00019999846009237065, 'samples': 428896, 'steps': 837, 'loss/train': 3.730058431625366} -09/20/2021 17:23:26 - INFO - __main__ - Step 13404: {'lr': 0.00019999846009237065, 'samples': 428928, 'steps': 837, 'loss/train': 4.604489803314209} -09/20/2021 17:23:27 - INFO - __main__ - Step 13405: {'lr': 0.00019999846009237065, 'samples': 428960, 'steps': 837, 'loss/train': 4.073885440826416} -09/20/2021 17:23:28 - INFO - __main__ - Step 13406: {'lr': 0.00019999846009237065, 'samples': 428992, 'steps': 837, 'loss/train': 3.4222068786621094} -09/20/2021 17:23:29 - INFO - __main__ - Step 13407: {'lr': 0.00019999846009237065, 'samples': 429024, 'steps': 837, 'loss/train': 3.235604763031006} -09/20/2021 17:23:29 - INFO - __main__ - Step 13408: {'lr': 0.00019999846009237065, 'samples': 429056, 'steps': 837, 'loss/train': 3.984450101852417} -09/20/2021 17:23:30 - INFO - __main__ - Step 13409: {'lr': 0.00019999842448883946, 'samples': 429088, 'steps': 838, 'loss/train': 4.2418646812438965} -09/20/2021 17:23:31 - INFO - __main__ - Step 13410: {'lr': 0.00019999842448883946, 'samples': 429120, 'steps': 838, 'loss/train': 3.9373550415039062} -09/20/2021 17:23:32 - INFO - __main__ - Step 13411: {'lr': 0.00019999842448883946, 'samples': 429152, 'steps': 838, 'loss/train': 4.209853649139404} -09/20/2021 17:23:32 - INFO - __main__ - Step 13412: {'lr': 0.00019999842448883946, 'samples': 429184, 'steps': 838, 'loss/train': 4.02140998840332} -09/20/2021 17:23:33 - INFO - __main__ - Step 13413: {'lr': 0.00019999842448883946, 'samples': 429216, 'steps': 838, 'loss/train': 4.428193092346191} -09/20/2021 17:23:34 - INFO - __main__ - Step 13414: {'lr': 0.00019999842448883946, 'samples': 429248, 'steps': 838, 'loss/train': 3.1932153701782227} -09/20/2021 17:23:35 - INFO - __main__ - Step 13415: {'lr': 0.00019999842448883946, 'samples': 429280, 'steps': 838, 'loss/train': 3.6262569427490234} -09/20/2021 17:23:35 - INFO - __main__ - Step 13416: {'lr': 0.00019999842448883946, 'samples': 429312, 'steps': 838, 'loss/train': 4.177759170532227} -09/20/2021 17:23:36 - INFO - __main__ - Step 13417: {'lr': 0.00019999842448883946, 'samples': 429344, 'steps': 838, 'loss/train': 1.5088119506835938} -09/20/2021 17:23:37 - INFO - __main__ - Step 13418: {'lr': 0.00019999842448883946, 'samples': 429376, 'steps': 838, 'loss/train': 3.6700706481933594} -09/20/2021 17:23:38 - INFO - __main__ - Step 13419: {'lr': 0.00019999842448883946, 'samples': 429408, 'steps': 838, 'loss/train': 4.676732063293457} -09/20/2021 17:23:38 - INFO - __main__ - Step 13420: {'lr': 0.00019999842448883946, 'samples': 429440, 'steps': 838, 'loss/train': 5.075088024139404} -09/20/2021 17:23:39 - INFO - __main__ - Step 13421: {'lr': 0.00019999842448883946, 'samples': 429472, 'steps': 838, 'loss/train': 3.9981164932250977} -09/20/2021 17:23:40 - INFO - __main__ - Step 13422: {'lr': 0.00019999842448883946, 'samples': 429504, 'steps': 838, 'loss/train': 3.7876875400543213} -09/20/2021 17:23:41 - INFO - __main__ - Step 13423: {'lr': 0.00019999842448883946, 'samples': 429536, 'steps': 838, 'loss/train': 3.63625168800354} -09/20/2021 17:23:41 - INFO - __main__ - Step 13424: {'lr': 0.00019999842448883946, 'samples': 429568, 'steps': 838, 'loss/train': 3.9871575832366943} -09/20/2021 17:23:42 - INFO - __main__ - Step 13425: {'lr': 0.00019999838847841508, 'samples': 429600, 'steps': 839, 'loss/train': 3.925133466720581} -09/20/2021 17:23:43 - INFO - __main__ - Step 13426: {'lr': 0.00019999838847841508, 'samples': 429632, 'steps': 839, 'loss/train': 7.362324237823486} -09/20/2021 17:23:45 - INFO - __main__ - Step 13427: {'lr': 0.00019999838847841508, 'samples': 429664, 'steps': 839, 'loss/train': 3.89479923248291} -09/20/2021 17:23:45 - INFO - __main__ - Step 13428: {'lr': 0.00019999838847841508, 'samples': 429696, 'steps': 839, 'loss/train': 1.6699892282485962} -09/20/2021 17:23:46 - INFO - __main__ - Step 13429: {'lr': 0.00019999838847841508, 'samples': 429728, 'steps': 839, 'loss/train': 2.147742986679077} -09/20/2021 17:23:47 - INFO - __main__ - Step 13430: {'lr': 0.00019999838847841508, 'samples': 429760, 'steps': 839, 'loss/train': 1.2476366758346558} -09/20/2021 17:23:48 - INFO - __main__ - Step 13431: {'lr': 0.00019999838847841508, 'samples': 429792, 'steps': 839, 'loss/train': 4.324377059936523} -09/20/2021 17:23:48 - INFO - __main__ - Step 13432: {'lr': 0.00019999838847841508, 'samples': 429824, 'steps': 839, 'loss/train': 4.01801872253418} -09/20/2021 17:23:49 - INFO - __main__ - Step 13433: {'lr': 0.00019999838847841508, 'samples': 429856, 'steps': 839, 'loss/train': 4.313638687133789} -09/20/2021 17:23:50 - INFO - __main__ - Step 13434: {'lr': 0.00019999838847841508, 'samples': 429888, 'steps': 839, 'loss/train': 4.491818428039551} -09/20/2021 17:23:51 - INFO - __main__ - Step 13435: {'lr': 0.00019999838847841508, 'samples': 429920, 'steps': 839, 'loss/train': 4.184451580047607} -09/20/2021 17:23:51 - INFO - __main__ - Step 13436: {'lr': 0.00019999838847841508, 'samples': 429952, 'steps': 839, 'loss/train': 3.725766181945801} -09/20/2021 17:23:52 - INFO - __main__ - Step 13437: {'lr': 0.00019999838847841508, 'samples': 429984, 'steps': 839, 'loss/train': 3.7597124576568604} -09/20/2021 17:23:53 - INFO - __main__ - Step 13438: {'lr': 0.00019999838847841508, 'samples': 430016, 'steps': 839, 'loss/train': 5.1381378173828125} -09/20/2021 17:23:54 - INFO - __main__ - Step 13439: {'lr': 0.00019999838847841508, 'samples': 430048, 'steps': 839, 'loss/train': 4.910434246063232} -09/20/2021 17:23:54 - INFO - __main__ - Step 13440: {'lr': 0.00019999838847841508, 'samples': 430080, 'steps': 839, 'loss/train': 3.940828323364258} -09/20/2021 17:23:55 - INFO - __main__ - Step 13441: {'lr': 0.00019999835206109765, 'samples': 430112, 'steps': 840, 'loss/train': 4.021162986755371} -09/20/2021 17:23:56 - INFO - __main__ - Step 13442: {'lr': 0.00019999835206109765, 'samples': 430144, 'steps': 840, 'loss/train': 4.530847072601318} -09/20/2021 17:23:57 - INFO - __main__ - Step 13443: {'lr': 0.00019999835206109765, 'samples': 430176, 'steps': 840, 'loss/train': 4.260108947753906} -09/20/2021 17:23:57 - INFO - __main__ - Step 13444: {'lr': 0.00019999835206109765, 'samples': 430208, 'steps': 840, 'loss/train': 5.751190662384033} -09/20/2021 17:23:58 - INFO - __main__ - Step 13445: {'lr': 0.00019999835206109765, 'samples': 430240, 'steps': 840, 'loss/train': 4.109583854675293} -09/20/2021 17:23:59 - INFO - __main__ - Step 13446: {'lr': 0.00019999835206109765, 'samples': 430272, 'steps': 840, 'loss/train': 3.3415322303771973} -09/20/2021 17:24:00 - INFO - __main__ - Step 13447: {'lr': 0.00019999835206109765, 'samples': 430304, 'steps': 840, 'loss/train': 3.989215850830078} -09/20/2021 17:24:00 - INFO - __main__ - Step 13448: {'lr': 0.00019999835206109765, 'samples': 430336, 'steps': 840, 'loss/train': 4.229532241821289} -09/20/2021 17:24:01 - INFO - __main__ - Step 13449: {'lr': 0.00019999835206109765, 'samples': 430368, 'steps': 840, 'loss/train': 3.810969591140747} -09/20/2021 17:24:02 - INFO - __main__ - Step 13450: {'lr': 0.00019999835206109765, 'samples': 430400, 'steps': 840, 'loss/train': 3.748198986053467} -09/20/2021 17:24:03 - INFO - __main__ - Step 13451: {'lr': 0.00019999835206109765, 'samples': 430432, 'steps': 840, 'loss/train': 3.940682888031006} -09/20/2021 17:24:03 - INFO - __main__ - Step 13452: {'lr': 0.00019999835206109765, 'samples': 430464, 'steps': 840, 'loss/train': 4.784289836883545} -09/20/2021 17:24:04 - INFO - __main__ - Step 13453: {'lr': 0.00019999835206109765, 'samples': 430496, 'steps': 840, 'loss/train': 4.788129806518555} -09/20/2021 17:24:05 - INFO - __main__ - Step 13454: {'lr': 0.00019999835206109765, 'samples': 430528, 'steps': 840, 'loss/train': 3.0674867630004883} -09/20/2021 17:24:06 - INFO - __main__ - Step 13455: {'lr': 0.00019999835206109765, 'samples': 430560, 'steps': 840, 'loss/train': 4.168207168579102} -09/20/2021 17:24:06 - INFO - __main__ - Step 13456: {'lr': 0.00019999835206109765, 'samples': 430592, 'steps': 840, 'loss/train': 2.915520429611206} -09/20/2021 17:24:08 - INFO - __main__ - Step 13457: {'lr': 0.0001999983152368873, 'samples': 430624, 'steps': 841, 'loss/train': 3.621305465698242} -09/20/2021 17:24:09 - INFO - __main__ - Step 13458: {'lr': 0.0001999983152368873, 'samples': 430656, 'steps': 841, 'loss/train': 4.567440032958984} -09/20/2021 17:24:10 - INFO - __main__ - Step 13459: {'lr': 0.0001999983152368873, 'samples': 430688, 'steps': 841, 'loss/train': 4.173653602600098} -09/20/2021 17:24:10 - INFO - __main__ - Step 13460: {'lr': 0.0001999983152368873, 'samples': 430720, 'steps': 841, 'loss/train': 3.573418378829956} -09/20/2021 17:24:11 - INFO - __main__ - Step 13461: {'lr': 0.0001999983152368873, 'samples': 430752, 'steps': 841, 'loss/train': 5.080088138580322} -09/20/2021 17:24:12 - INFO - __main__ - Step 13462: {'lr': 0.0001999983152368873, 'samples': 430784, 'steps': 841, 'loss/train': 3.4515562057495117} -09/20/2021 17:24:13 - INFO - __main__ - Step 13463: {'lr': 0.0001999983152368873, 'samples': 430816, 'steps': 841, 'loss/train': 5.4553022384643555} -09/20/2021 17:24:13 - INFO - __main__ - Step 13464: {'lr': 0.0001999983152368873, 'samples': 430848, 'steps': 841, 'loss/train': 1.0698779821395874} -09/20/2021 17:24:14 - INFO - __main__ - Step 13465: {'lr': 0.0001999983152368873, 'samples': 430880, 'steps': 841, 'loss/train': 1.2105644941329956} -09/20/2021 17:24:15 - INFO - __main__ - Step 13466: {'lr': 0.0001999983152368873, 'samples': 430912, 'steps': 841, 'loss/train': 1.7200340032577515} -09/20/2021 17:24:16 - INFO - __main__ - Step 13467: {'lr': 0.0001999983152368873, 'samples': 430944, 'steps': 841, 'loss/train': 1.0243021249771118} -09/20/2021 17:24:16 - INFO - __main__ - Step 13468: {'lr': 0.0001999983152368873, 'samples': 430976, 'steps': 841, 'loss/train': 3.773898124694824} -09/20/2021 17:24:17 - INFO - __main__ - Step 13469: {'lr': 0.0001999983152368873, 'samples': 431008, 'steps': 841, 'loss/train': 3.4114511013031006} -09/20/2021 17:24:18 - INFO - __main__ - Step 13470: {'lr': 0.0001999983152368873, 'samples': 431040, 'steps': 841, 'loss/train': 4.2145514488220215} -09/20/2021 17:24:19 - INFO - __main__ - Step 13471: {'lr': 0.0001999983152368873, 'samples': 431072, 'steps': 841, 'loss/train': 3.710703134536743} -09/20/2021 17:24:19 - INFO - __main__ - Step 13472: {'lr': 0.0001999983152368873, 'samples': 431104, 'steps': 841, 'loss/train': 4.5072021484375} -09/20/2021 17:24:20 - INFO - __main__ - Step 13473: {'lr': 0.0001999982780057842, 'samples': 431136, 'steps': 842, 'loss/train': 3.6873905658721924} -09/20/2021 17:24:21 - INFO - __main__ - Step 13474: {'lr': 0.0001999982780057842, 'samples': 431168, 'steps': 842, 'loss/train': 4.218286514282227} -09/20/2021 17:24:22 - INFO - __main__ - Step 13475: {'lr': 0.0001999982780057842, 'samples': 431200, 'steps': 842, 'loss/train': 3.9454970359802246} -09/20/2021 17:24:22 - INFO - __main__ - Step 13476: {'lr': 0.0001999982780057842, 'samples': 431232, 'steps': 842, 'loss/train': 3.9855082035064697} -09/20/2021 17:24:23 - INFO - __main__ - Step 13477: {'lr': 0.0001999982780057842, 'samples': 431264, 'steps': 842, 'loss/train': 4.368809700012207} -09/20/2021 17:24:24 - INFO - __main__ - Step 13478: {'lr': 0.0001999982780057842, 'samples': 431296, 'steps': 842, 'loss/train': 3.8177871704101562} -09/20/2021 17:24:25 - INFO - __main__ - Step 13479: {'lr': 0.0001999982780057842, 'samples': 431328, 'steps': 842, 'loss/train': 3.8631083965301514} -09/20/2021 17:24:25 - INFO - __main__ - Step 13480: {'lr': 0.0001999982780057842, 'samples': 431360, 'steps': 842, 'loss/train': 4.084607124328613} -09/20/2021 17:24:26 - INFO - __main__ - Step 13481: {'lr': 0.0001999982780057842, 'samples': 431392, 'steps': 842, 'loss/train': 4.787711143493652} -09/20/2021 17:24:27 - INFO - __main__ - Step 13482: {'lr': 0.0001999982780057842, 'samples': 431424, 'steps': 842, 'loss/train': 3.486072063446045} -09/20/2021 17:24:28 - INFO - __main__ - Step 13483: {'lr': 0.0001999982780057842, 'samples': 431456, 'steps': 842, 'loss/train': 3.045255184173584} -09/20/2021 17:24:28 - INFO - __main__ - Step 13484: {'lr': 0.0001999982780057842, 'samples': 431488, 'steps': 842, 'loss/train': 3.242844581604004} -09/20/2021 17:24:29 - INFO - __main__ - Step 13485: {'lr': 0.0001999982780057842, 'samples': 431520, 'steps': 842, 'loss/train': 3.694103240966797} -09/20/2021 17:24:30 - INFO - __main__ - Step 13486: {'lr': 0.0001999982780057842, 'samples': 431552, 'steps': 842, 'loss/train': 4.171317100524902} -09/20/2021 17:24:31 - INFO - __main__ - Step 13487: {'lr': 0.0001999982780057842, 'samples': 431584, 'steps': 842, 'loss/train': 3.8292698860168457} -09/20/2021 17:24:31 - INFO - __main__ - Step 13488: {'lr': 0.0001999982780057842, 'samples': 431616, 'steps': 842, 'loss/train': 4.092489719390869} -09/20/2021 17:24:33 - INFO - __main__ - Step 13489: {'lr': 0.0001999982403677885, 'samples': 431648, 'steps': 843, 'loss/train': 3.062756061553955} -09/20/2021 17:24:34 - INFO - __main__ - Step 13490: {'lr': 0.0001999982403677885, 'samples': 431680, 'steps': 843, 'loss/train': 3.4961097240448} -09/20/2021 17:24:35 - INFO - __main__ - Step 13491: {'lr': 0.0001999982403677885, 'samples': 431712, 'steps': 843, 'loss/train': 3.2242624759674072} -09/20/2021 17:24:35 - INFO - __main__ - Step 13492: {'lr': 0.0001999982403677885, 'samples': 431744, 'steps': 843, 'loss/train': 3.621858835220337} -09/20/2021 17:24:36 - INFO - __main__ - Step 13493: {'lr': 0.0001999982403677885, 'samples': 431776, 'steps': 843, 'loss/train': 1.2199958562850952} -09/20/2021 17:24:37 - INFO - __main__ - Step 13494: {'lr': 0.0001999982403677885, 'samples': 431808, 'steps': 843, 'loss/train': 3.3329193592071533} -09/20/2021 17:24:38 - INFO - __main__ - Step 13495: {'lr': 0.0001999982403677885, 'samples': 431840, 'steps': 843, 'loss/train': 4.071252822875977} -09/20/2021 17:24:38 - INFO - __main__ - Step 13496: {'lr': 0.0001999982403677885, 'samples': 431872, 'steps': 843, 'loss/train': 3.6085095405578613} -09/20/2021 17:24:39 - INFO - __main__ - Step 13497: {'lr': 0.0001999982403677885, 'samples': 431904, 'steps': 843, 'loss/train': 4.002532005310059} -09/20/2021 17:24:40 - INFO - __main__ - Step 13498: {'lr': 0.0001999982403677885, 'samples': 431936, 'steps': 843, 'loss/train': 2.639407157897949} -09/20/2021 17:24:41 - INFO - __main__ - Step 13499: {'lr': 0.0001999982403677885, 'samples': 431968, 'steps': 843, 'loss/train': 4.554128646850586} -09/20/2021 17:24:41 - INFO - __main__ - Step 13500: {'lr': 0.0001999982403677885, 'samples': 432000, 'steps': 843, 'loss/train': 4.2015461921691895} -09/20/2021 17:24:42 - INFO - __main__ - Step 13501: {'lr': 0.0001999982403677885, 'samples': 432032, 'steps': 843, 'loss/train': 3.550290822982788} -09/20/2021 17:24:43 - INFO - __main__ - Step 13502: {'lr': 0.0001999982403677885, 'samples': 432064, 'steps': 843, 'loss/train': 1.441927194595337} -09/20/2021 17:24:44 - INFO - __main__ - Step 13503: {'lr': 0.0001999982403677885, 'samples': 432096, 'steps': 843, 'loss/train': 1.0062355995178223} -09/20/2021 17:24:44 - INFO - __main__ - Step 13504: {'lr': 0.0001999982403677885, 'samples': 432128, 'steps': 843, 'loss/train': 1.016701340675354} -09/20/2021 17:24:45 - INFO - __main__ - Step 13505: {'lr': 0.00019999820232290033, 'samples': 432160, 'steps': 844, 'loss/train': 1.0851832628250122} -09/20/2021 17:24:46 - INFO - __main__ - Step 13506: {'lr': 0.00019999820232290033, 'samples': 432192, 'steps': 844, 'loss/train': 4.050252437591553} -09/20/2021 17:24:47 - INFO - __main__ - Step 13507: {'lr': 0.00019999820232290033, 'samples': 432224, 'steps': 844, 'loss/train': 4.127182960510254} -09/20/2021 17:24:47 - INFO - __main__ - Step 13508: {'lr': 0.00019999820232290033, 'samples': 432256, 'steps': 844, 'loss/train': 3.8045969009399414} -09/20/2021 17:24:48 - INFO - __main__ - Step 13509: {'lr': 0.00019999820232290033, 'samples': 432288, 'steps': 844, 'loss/train': 3.426367998123169} -09/20/2021 17:24:49 - INFO - __main__ - Step 13510: {'lr': 0.00019999820232290033, 'samples': 432320, 'steps': 844, 'loss/train': 4.10466194152832} -09/20/2021 17:24:50 - INFO - __main__ - Step 13511: {'lr': 0.00019999820232290033, 'samples': 432352, 'steps': 844, 'loss/train': 4.449901103973389} -09/20/2021 17:24:50 - INFO - __main__ - Step 13512: {'lr': 0.00019999820232290033, 'samples': 432384, 'steps': 844, 'loss/train': 4.040013790130615} -09/20/2021 17:24:51 - INFO - __main__ - Step 13513: {'lr': 0.00019999820232290033, 'samples': 432416, 'steps': 844, 'loss/train': 5.6263298988342285} -09/20/2021 17:24:52 - INFO - __main__ - Step 13514: {'lr': 0.00019999820232290033, 'samples': 432448, 'steps': 844, 'loss/train': 5.40472936630249} -09/20/2021 17:24:53 - INFO - __main__ - Step 13515: {'lr': 0.00019999820232290033, 'samples': 432480, 'steps': 844, 'loss/train': 4.386739730834961} -09/20/2021 17:24:53 - INFO - __main__ - Step 13516: {'lr': 0.00019999820232290033, 'samples': 432512, 'steps': 844, 'loss/train': 4.293882369995117} -09/20/2021 17:24:54 - INFO - __main__ - Step 13517: {'lr': 0.00019999820232290033, 'samples': 432544, 'steps': 844, 'loss/train': 2.0185258388519287} -09/20/2021 17:24:55 - INFO - __main__ - Step 13518: {'lr': 0.00019999820232290033, 'samples': 432576, 'steps': 844, 'loss/train': 3.5305490493774414} -09/20/2021 17:24:56 - INFO - __main__ - Step 13519: {'lr': 0.00019999820232290033, 'samples': 432608, 'steps': 844, 'loss/train': 3.0966837406158447} -09/20/2021 17:24:57 - INFO - __main__ - Step 13520: {'lr': 0.00019999820232290033, 'samples': 432640, 'steps': 844, 'loss/train': 4.073970317840576} -09/20/2021 17:24:58 - INFO - __main__ - Step 13521: {'lr': 0.00019999816387111986, 'samples': 432672, 'steps': 845, 'loss/train': 3.594139814376831} -09/20/2021 17:24:59 - INFO - __main__ - Step 13522: {'lr': 0.00019999816387111986, 'samples': 432704, 'steps': 845, 'loss/train': 4.462234973907471} -09/20/2021 17:24:59 - INFO - __main__ - Step 13523: {'lr': 0.00019999816387111986, 'samples': 432736, 'steps': 845, 'loss/train': 4.570359230041504} -09/20/2021 17:25:00 - INFO - __main__ - Step 13524: {'lr': 0.00019999816387111986, 'samples': 432768, 'steps': 845, 'loss/train': 4.179370403289795} -09/20/2021 17:25:01 - INFO - __main__ - Step 13525: {'lr': 0.00019999816387111986, 'samples': 432800, 'steps': 845, 'loss/train': 3.528158187866211} -09/20/2021 17:25:02 - INFO - __main__ - Step 13526: {'lr': 0.00019999816387111986, 'samples': 432832, 'steps': 845, 'loss/train': 3.429391860961914} -09/20/2021 17:25:02 - INFO - __main__ - Step 13527: {'lr': 0.00019999816387111986, 'samples': 432864, 'steps': 845, 'loss/train': 3.330670118331909} -09/20/2021 17:25:03 - INFO - __main__ - Step 13528: {'lr': 0.00019999816387111986, 'samples': 432896, 'steps': 845, 'loss/train': 3.8736350536346436} -09/20/2021 17:25:04 - INFO - __main__ - Step 13529: {'lr': 0.00019999816387111986, 'samples': 432928, 'steps': 845, 'loss/train': 4.104378700256348} -09/20/2021 17:25:05 - INFO - __main__ - Step 13530: {'lr': 0.00019999816387111986, 'samples': 432960, 'steps': 845, 'loss/train': 3.6573188304901123} -09/20/2021 17:25:05 - INFO - __main__ - Step 13531: {'lr': 0.00019999816387111986, 'samples': 432992, 'steps': 845, 'loss/train': 5.10708475112915} -09/20/2021 17:25:06 - INFO - __main__ - Step 13532: {'lr': 0.00019999816387111986, 'samples': 433024, 'steps': 845, 'loss/train': 4.5401763916015625} -09/20/2021 17:25:07 - INFO - __main__ - Step 13533: {'lr': 0.00019999816387111986, 'samples': 433056, 'steps': 845, 'loss/train': 3.9547195434570312} -09/20/2021 17:25:08 - INFO - __main__ - Step 13534: {'lr': 0.00019999816387111986, 'samples': 433088, 'steps': 845, 'loss/train': 4.321925640106201} -09/20/2021 17:25:08 - INFO - __main__ - Step 13535: {'lr': 0.00019999816387111986, 'samples': 433120, 'steps': 845, 'loss/train': 4.249927043914795} -09/20/2021 17:25:09 - INFO - __main__ - Step 13536: {'lr': 0.00019999816387111986, 'samples': 433152, 'steps': 845, 'loss/train': 4.336556911468506} -09/20/2021 17:25:10 - INFO - __main__ - Step 13537: {'lr': 0.00019999812501244729, 'samples': 433184, 'steps': 846, 'loss/train': 4.356725215911865} -09/20/2021 17:25:11 - INFO - __main__ - Step 13538: {'lr': 0.00019999812501244729, 'samples': 433216, 'steps': 846, 'loss/train': 4.922709941864014} -09/20/2021 17:25:12 - INFO - __main__ - Step 13539: {'lr': 0.00019999812501244729, 'samples': 433248, 'steps': 846, 'loss/train': 4.633336067199707} -09/20/2021 17:25:12 - INFO - __main__ - Step 13540: {'lr': 0.00019999812501244729, 'samples': 433280, 'steps': 846, 'loss/train': 4.838750839233398} -09/20/2021 17:25:13 - INFO - __main__ - Step 13541: {'lr': 0.00019999812501244729, 'samples': 433312, 'steps': 846, 'loss/train': 5.2673540115356445} -09/20/2021 17:25:14 - INFO - __main__ - Step 13542: {'lr': 0.00019999812501244729, 'samples': 433344, 'steps': 846, 'loss/train': 5.17922306060791} -09/20/2021 17:25:15 - INFO - __main__ - Step 13543: {'lr': 0.00019999812501244729, 'samples': 433376, 'steps': 846, 'loss/train': 4.117546081542969} -09/20/2021 17:25:15 - INFO - __main__ - Step 13544: {'lr': 0.00019999812501244729, 'samples': 433408, 'steps': 846, 'loss/train': 3.8183624744415283} -09/20/2021 17:25:16 - INFO - __main__ - Step 13545: {'lr': 0.00019999812501244729, 'samples': 433440, 'steps': 846, 'loss/train': 4.268054008483887} -09/20/2021 17:25:17 - INFO - __main__ - Step 13546: {'lr': 0.00019999812501244729, 'samples': 433472, 'steps': 846, 'loss/train': 3.347277879714966} -09/20/2021 17:25:18 - INFO - __main__ - Step 13547: {'lr': 0.00019999812501244729, 'samples': 433504, 'steps': 846, 'loss/train': 4.412509918212891} -09/20/2021 17:25:18 - INFO - __main__ - Step 13548: {'lr': 0.00019999812501244729, 'samples': 433536, 'steps': 846, 'loss/train': 3.899561643600464} -09/20/2021 17:25:19 - INFO - __main__ - Step 13549: {'lr': 0.00019999812501244729, 'samples': 433568, 'steps': 846, 'loss/train': 4.577779293060303} -09/20/2021 17:25:20 - INFO - __main__ - Step 13550: {'lr': 0.00019999812501244729, 'samples': 433600, 'steps': 846, 'loss/train': 4.743430137634277} -09/20/2021 17:25:21 - INFO - __main__ - Step 13551: {'lr': 0.00019999812501244729, 'samples': 433632, 'steps': 846, 'loss/train': 3.2888474464416504} -09/20/2021 17:25:22 - INFO - __main__ - Step 13552: {'lr': 0.00019999812501244729, 'samples': 433664, 'steps': 846, 'loss/train': 3.3221027851104736} -09/20/2021 17:25:23 - INFO - __main__ - Step 13553: {'lr': 0.0001999980857468827, 'samples': 433696, 'steps': 847, 'loss/train': 4.173206329345703} -09/20/2021 17:25:23 - INFO - __main__ - Step 13554: {'lr': 0.0001999980857468827, 'samples': 433728, 'steps': 847, 'loss/train': 3.251892328262329} -09/20/2021 17:25:24 - INFO - __main__ - Step 13555: {'lr': 0.0001999980857468827, 'samples': 433760, 'steps': 847, 'loss/train': 4.951797008514404} -09/20/2021 17:25:25 - INFO - __main__ - Step 13556: {'lr': 0.0001999980857468827, 'samples': 433792, 'steps': 847, 'loss/train': 3.7825350761413574} -09/20/2021 17:25:26 - INFO - __main__ - Step 13557: {'lr': 0.0001999980857468827, 'samples': 433824, 'steps': 847, 'loss/train': 4.662040710449219} -09/20/2021 17:25:26 - INFO - __main__ - Step 13558: {'lr': 0.0001999980857468827, 'samples': 433856, 'steps': 847, 'loss/train': 3.5977272987365723} -09/20/2021 17:25:27 - INFO - __main__ - Step 13559: {'lr': 0.0001999980857468827, 'samples': 433888, 'steps': 847, 'loss/train': 3.476016044616699} -09/20/2021 17:25:28 - INFO - __main__ - Step 13560: {'lr': 0.0001999980857468827, 'samples': 433920, 'steps': 847, 'loss/train': 4.048685550689697} -09/20/2021 17:25:29 - INFO - __main__ - Step 13561: {'lr': 0.0001999980857468827, 'samples': 433952, 'steps': 847, 'loss/train': 4.394377708435059} -09/20/2021 17:25:29 - INFO - __main__ - Step 13562: {'lr': 0.0001999980857468827, 'samples': 433984, 'steps': 847, 'loss/train': 5.051202774047852} -09/20/2021 17:25:30 - INFO - __main__ - Step 13563: {'lr': 0.0001999980857468827, 'samples': 434016, 'steps': 847, 'loss/train': 4.00152587890625} -09/20/2021 17:25:31 - INFO - __main__ - Step 13564: {'lr': 0.0001999980857468827, 'samples': 434048, 'steps': 847, 'loss/train': 4.474799156188965} -09/20/2021 17:25:32 - INFO - __main__ - Step 13565: {'lr': 0.0001999980857468827, 'samples': 434080, 'steps': 847, 'loss/train': 4.183254718780518} -09/20/2021 17:25:32 - INFO - __main__ - Step 13566: {'lr': 0.0001999980857468827, 'samples': 434112, 'steps': 847, 'loss/train': 3.8000428676605225} -09/20/2021 17:25:33 - INFO - __main__ - Step 13567: {'lr': 0.0001999980857468827, 'samples': 434144, 'steps': 847, 'loss/train': 3.6373589038848877} -09/20/2021 17:25:34 - INFO - __main__ - Step 13568: {'lr': 0.0001999980857468827, 'samples': 434176, 'steps': 847, 'loss/train': 4.7940354347229} -09/20/2021 17:25:35 - INFO - __main__ - Step 13569: {'lr': 0.00019999804607442632, 'samples': 434208, 'steps': 848, 'loss/train': 3.3990721702575684} -09/20/2021 17:25:36 - INFO - __main__ - Step 13570: {'lr': 0.00019999804607442632, 'samples': 434240, 'steps': 848, 'loss/train': 3.8665454387664795} -09/20/2021 17:25:36 - INFO - __main__ - Step 13571: {'lr': 0.00019999804607442632, 'samples': 434272, 'steps': 848, 'loss/train': 4.174686908721924} -09/20/2021 17:25:37 - INFO - __main__ - Step 13572: {'lr': 0.00019999804607442632, 'samples': 434304, 'steps': 848, 'loss/train': 4.11002254486084} -09/20/2021 17:25:38 - INFO - __main__ - Step 13573: {'lr': 0.00019999804607442632, 'samples': 434336, 'steps': 848, 'loss/train': 4.373510837554932} -09/20/2021 17:25:39 - INFO - __main__ - Step 13574: {'lr': 0.00019999804607442632, 'samples': 434368, 'steps': 848, 'loss/train': 3.3738856315612793} -09/20/2021 17:25:39 - INFO - __main__ - Step 13575: {'lr': 0.00019999804607442632, 'samples': 434400, 'steps': 848, 'loss/train': 3.9241650104522705} -09/20/2021 17:25:40 - INFO - __main__ - Step 13576: {'lr': 0.00019999804607442632, 'samples': 434432, 'steps': 848, 'loss/train': 4.4594950675964355} -09/20/2021 17:25:41 - INFO - __main__ - Step 13577: {'lr': 0.00019999804607442632, 'samples': 434464, 'steps': 848, 'loss/train': 4.4602861404418945} -09/20/2021 17:25:42 - INFO - __main__ - Step 13578: {'lr': 0.00019999804607442632, 'samples': 434496, 'steps': 848, 'loss/train': 5.1317830085754395} -09/20/2021 17:25:42 - INFO - __main__ - Step 13579: {'lr': 0.00019999804607442632, 'samples': 434528, 'steps': 848, 'loss/train': 0.6088433861732483} -09/20/2021 17:25:43 - INFO - __main__ - Step 13580: {'lr': 0.00019999804607442632, 'samples': 434560, 'steps': 848, 'loss/train': 1.6834524869918823} -09/20/2021 17:25:45 - INFO - __main__ - Step 13581: {'lr': 0.00019999804607442632, 'samples': 434592, 'steps': 848, 'loss/train': 5.391042709350586} -09/20/2021 17:25:46 - INFO - __main__ - Step 13582: {'lr': 0.00019999804607442632, 'samples': 434624, 'steps': 848, 'loss/train': 4.344334602355957} -09/20/2021 17:25:46 - INFO - __main__ - Step 13583: {'lr': 0.00019999804607442632, 'samples': 434656, 'steps': 848, 'loss/train': 5.233471870422363} -09/20/2021 17:25:47 - INFO - __main__ - Step 13584: {'lr': 0.00019999804607442632, 'samples': 434688, 'steps': 848, 'loss/train': 3.8413572311401367} -09/20/2021 17:25:48 - INFO - __main__ - Step 13585: {'lr': 0.00019999800599507825, 'samples': 434720, 'steps': 849, 'loss/train': 1.6976394653320312} -09/20/2021 17:25:49 - INFO - __main__ - Step 13586: {'lr': 0.00019999800599507825, 'samples': 434752, 'steps': 849, 'loss/train': 4.554813861846924} -09/20/2021 17:25:49 - INFO - __main__ - Step 13587: {'lr': 0.00019999800599507825, 'samples': 434784, 'steps': 849, 'loss/train': 3.2028303146362305} -09/20/2021 17:25:50 - INFO - __main__ - Step 13588: {'lr': 0.00019999800599507825, 'samples': 434816, 'steps': 849, 'loss/train': 4.1235575675964355} -09/20/2021 17:25:51 - INFO - __main__ - Step 13589: {'lr': 0.00019999800599507825, 'samples': 434848, 'steps': 849, 'loss/train': 4.624473571777344} -09/20/2021 17:25:52 - INFO - __main__ - Step 13590: {'lr': 0.00019999800599507825, 'samples': 434880, 'steps': 849, 'loss/train': 4.581003189086914} -09/20/2021 17:25:52 - INFO - __main__ - Step 13591: {'lr': 0.00019999800599507825, 'samples': 434912, 'steps': 849, 'loss/train': 5.538898468017578} -09/20/2021 17:25:53 - INFO - __main__ - Step 13592: {'lr': 0.00019999800599507825, 'samples': 434944, 'steps': 849, 'loss/train': 2.222236394882202} -09/20/2021 17:25:54 - INFO - __main__ - Step 13593: {'lr': 0.00019999800599507825, 'samples': 434976, 'steps': 849, 'loss/train': 4.410379409790039} -09/20/2021 17:25:55 - INFO - __main__ - Step 13594: {'lr': 0.00019999800599507825, 'samples': 435008, 'steps': 849, 'loss/train': 4.866135597229004} -09/20/2021 17:25:55 - INFO - __main__ - Step 13595: {'lr': 0.00019999800599507825, 'samples': 435040, 'steps': 849, 'loss/train': 3.6695427894592285} -09/20/2021 17:25:56 - INFO - __main__ - Step 13596: {'lr': 0.00019999800599507825, 'samples': 435072, 'steps': 849, 'loss/train': 3.677811861038208} -09/20/2021 17:25:57 - INFO - __main__ - Step 13597: {'lr': 0.00019999800599507825, 'samples': 435104, 'steps': 849, 'loss/train': 4.6106953620910645} -09/20/2021 17:25:58 - INFO - __main__ - Step 13598: {'lr': 0.00019999800599507825, 'samples': 435136, 'steps': 849, 'loss/train': 3.3901827335357666} -09/20/2021 17:25:58 - INFO - __main__ - Step 13599: {'lr': 0.00019999800599507825, 'samples': 435168, 'steps': 849, 'loss/train': 4.750954627990723} -09/20/2021 17:25:59 - INFO - __main__ - Step 13600: {'lr': 0.00019999800599507825, 'samples': 435200, 'steps': 849, 'loss/train': 3.6786444187164307} -09/20/2021 17:26:00 - INFO - __main__ - Step 13601: {'lr': 0.0001999979655088387, 'samples': 435232, 'steps': 850, 'loss/train': 4.09751558303833} -09/20/2021 17:26:01 - INFO - __main__ - Step 13602: {'lr': 0.0001999979655088387, 'samples': 435264, 'steps': 850, 'loss/train': 5.618940353393555} -09/20/2021 17:26:02 - INFO - __main__ - Step 13603: {'lr': 0.0001999979655088387, 'samples': 435296, 'steps': 850, 'loss/train': 3.8479835987091064} -09/20/2021 17:26:02 - INFO - __main__ - Step 13604: {'lr': 0.0001999979655088387, 'samples': 435328, 'steps': 850, 'loss/train': 4.51493501663208} -09/20/2021 17:26:03 - INFO - __main__ - Step 13605: {'lr': 0.0001999979655088387, 'samples': 435360, 'steps': 850, 'loss/train': 4.09794282913208} -09/20/2021 17:26:04 - INFO - __main__ - Step 13606: {'lr': 0.0001999979655088387, 'samples': 435392, 'steps': 850, 'loss/train': 3.8531157970428467} -09/20/2021 17:26:05 - INFO - __main__ - Step 13607: {'lr': 0.0001999979655088387, 'samples': 435424, 'steps': 850, 'loss/train': 1.3877215385437012} -09/20/2021 17:26:05 - INFO - __main__ - Step 13608: {'lr': 0.0001999979655088387, 'samples': 435456, 'steps': 850, 'loss/train': 3.5005953311920166} -09/20/2021 17:26:06 - INFO - __main__ - Step 13609: {'lr': 0.0001999979655088387, 'samples': 435488, 'steps': 850, 'loss/train': 5.871039867401123} -09/20/2021 17:26:07 - INFO - __main__ - Step 13610: {'lr': 0.0001999979655088387, 'samples': 435520, 'steps': 850, 'loss/train': 3.791339159011841} -09/20/2021 17:26:08 - INFO - __main__ - Step 13611: {'lr': 0.0001999979655088387, 'samples': 435552, 'steps': 850, 'loss/train': 5.495855331420898} -09/20/2021 17:26:09 - INFO - __main__ - Step 13612: {'lr': 0.0001999979655088387, 'samples': 435584, 'steps': 850, 'loss/train': 3.310189962387085} -09/20/2021 17:26:10 - INFO - __main__ - Step 13613: {'lr': 0.0001999979655088387, 'samples': 435616, 'steps': 850, 'loss/train': 4.2442498207092285} -09/20/2021 17:26:10 - INFO - __main__ - Step 13614: {'lr': 0.0001999979655088387, 'samples': 435648, 'steps': 850, 'loss/train': 4.379226207733154} -09/20/2021 17:26:11 - INFO - __main__ - Step 13615: {'lr': 0.0001999979655088387, 'samples': 435680, 'steps': 850, 'loss/train': 3.4740867614746094} -09/20/2021 17:26:12 - INFO - __main__ - Step 13616: {'lr': 0.0001999979655088387, 'samples': 435712, 'steps': 850, 'loss/train': 5.188986301422119} -09/20/2021 17:26:13 - INFO - __main__ - Step 13617: {'lr': 0.0001999979246157078, 'samples': 435744, 'steps': 851, 'loss/train': 3.454906463623047} -09/20/2021 17:26:14 - INFO - __main__ - Step 13618: {'lr': 0.0001999979246157078, 'samples': 435776, 'steps': 851, 'loss/train': 4.944936275482178} -09/20/2021 17:26:14 - INFO - __main__ - Step 13619: {'lr': 0.0001999979246157078, 'samples': 435808, 'steps': 851, 'loss/train': 3.4110090732574463} -09/20/2021 17:26:15 - INFO - __main__ - Step 13620: {'lr': 0.0001999979246157078, 'samples': 435840, 'steps': 851, 'loss/train': 4.251176834106445} -09/20/2021 17:26:16 - INFO - __main__ - Step 13621: {'lr': 0.0001999979246157078, 'samples': 435872, 'steps': 851, 'loss/train': 3.890280246734619} -09/20/2021 17:26:17 - INFO - __main__ - Step 13622: {'lr': 0.0001999979246157078, 'samples': 435904, 'steps': 851, 'loss/train': 5.254909515380859} -09/20/2021 17:26:17 - INFO - __main__ - Step 13623: {'lr': 0.0001999979246157078, 'samples': 435936, 'steps': 851, 'loss/train': 2.6076722145080566} -09/20/2021 17:26:18 - INFO - __main__ - Step 13624: {'lr': 0.0001999979246157078, 'samples': 435968, 'steps': 851, 'loss/train': 3.4124019145965576} -09/20/2021 17:26:19 - INFO - __main__ - Step 13625: {'lr': 0.0001999979246157078, 'samples': 436000, 'steps': 851, 'loss/train': 3.6725072860717773} -09/20/2021 17:26:20 - INFO - __main__ - Step 13626: {'lr': 0.0001999979246157078, 'samples': 436032, 'steps': 851, 'loss/train': 3.590291976928711} -09/20/2021 17:26:20 - INFO - __main__ - Step 13627: {'lr': 0.0001999979246157078, 'samples': 436064, 'steps': 851, 'loss/train': 3.2552616596221924} -09/20/2021 17:26:21 - INFO - __main__ - Step 13628: {'lr': 0.0001999979246157078, 'samples': 436096, 'steps': 851, 'loss/train': 1.460847020149231} -09/20/2021 17:26:22 - INFO - __main__ - Step 13629: {'lr': 0.0001999979246157078, 'samples': 436128, 'steps': 851, 'loss/train': 5.040970802307129} -09/20/2021 17:26:23 - INFO - __main__ - Step 13630: {'lr': 0.0001999979246157078, 'samples': 436160, 'steps': 851, 'loss/train': 4.233334064483643} -09/20/2021 17:26:23 - INFO - __main__ - Step 13631: {'lr': 0.0001999979246157078, 'samples': 436192, 'steps': 851, 'loss/train': 4.453797340393066} -09/20/2021 17:26:24 - INFO - __main__ - Step 13632: {'lr': 0.0001999979246157078, 'samples': 436224, 'steps': 851, 'loss/train': 4.1527228355407715} -09/20/2021 17:26:25 - INFO - __main__ - Step 13633: {'lr': 0.00019999788331568575, 'samples': 436256, 'steps': 852, 'loss/train': 3.6083691120147705} -09/20/2021 17:26:26 - INFO - __main__ - Step 13634: {'lr': 0.00019999788331568575, 'samples': 436288, 'steps': 852, 'loss/train': 3.165984630584717} -09/20/2021 17:26:26 - INFO - __main__ - Step 13635: {'lr': 0.00019999788331568575, 'samples': 436320, 'steps': 852, 'loss/train': 4.554512977600098} -09/20/2021 17:26:27 - INFO - __main__ - Step 13636: {'lr': 0.00019999788331568575, 'samples': 436352, 'steps': 852, 'loss/train': 3.700819969177246} -09/20/2021 17:26:28 - INFO - __main__ - Step 13637: {'lr': 0.00019999788331568575, 'samples': 436384, 'steps': 852, 'loss/train': 3.170443296432495} -09/20/2021 17:26:29 - INFO - __main__ - Step 13638: {'lr': 0.00019999788331568575, 'samples': 436416, 'steps': 852, 'loss/train': 4.9557623863220215} -09/20/2021 17:26:29 - INFO - __main__ - Step 13639: {'lr': 0.00019999788331568575, 'samples': 436448, 'steps': 852, 'loss/train': 4.066009998321533} -09/20/2021 17:26:30 - INFO - __main__ - Step 13640: {'lr': 0.00019999788331568575, 'samples': 436480, 'steps': 852, 'loss/train': 3.466407299041748} -09/20/2021 17:26:31 - INFO - __main__ - Step 13641: {'lr': 0.00019999788331568575, 'samples': 436512, 'steps': 852, 'loss/train': 2.587437391281128} -09/20/2021 17:26:32 - INFO - __main__ - Step 13642: {'lr': 0.00019999788331568575, 'samples': 436544, 'steps': 852, 'loss/train': 3.221467971801758} -09/20/2021 17:26:32 - INFO - __main__ - Step 13643: {'lr': 0.00019999788331568575, 'samples': 436576, 'steps': 852, 'loss/train': 3.6381022930145264} -09/20/2021 17:26:34 - INFO - __main__ - Step 13644: {'lr': 0.00019999788331568575, 'samples': 436608, 'steps': 852, 'loss/train': 4.37518310546875} -09/20/2021 17:26:35 - INFO - __main__ - Step 13645: {'lr': 0.00019999788331568575, 'samples': 436640, 'steps': 852, 'loss/train': 3.774585008621216} -09/20/2021 17:26:35 - INFO - __main__ - Step 13646: {'lr': 0.00019999788331568575, 'samples': 436672, 'steps': 852, 'loss/train': 3.873786211013794} -09/20/2021 17:26:36 - INFO - __main__ - Step 13647: {'lr': 0.00019999788331568575, 'samples': 436704, 'steps': 852, 'loss/train': 3.484182119369507} -09/20/2021 17:26:37 - INFO - __main__ - Step 13648: {'lr': 0.00019999788331568575, 'samples': 436736, 'steps': 852, 'loss/train': 4.1660284996032715} -09/20/2021 17:26:38 - INFO - __main__ - Step 13649: {'lr': 0.00019999784160877265, 'samples': 436768, 'steps': 853, 'loss/train': 3.334244966506958} -09/20/2021 17:26:38 - INFO - __main__ - Step 13650: {'lr': 0.00019999784160877265, 'samples': 436800, 'steps': 853, 'loss/train': 4.931953430175781} -09/20/2021 17:26:39 - INFO - __main__ - Step 13651: {'lr': 0.00019999784160877265, 'samples': 436832, 'steps': 853, 'loss/train': 3.4810993671417236} -09/20/2021 17:26:40 - INFO - __main__ - Step 13652: {'lr': 0.00019999784160877265, 'samples': 436864, 'steps': 853, 'loss/train': 2.905488967895508} -09/20/2021 17:26:41 - INFO - __main__ - Step 13653: {'lr': 0.00019999784160877265, 'samples': 436896, 'steps': 853, 'loss/train': 3.8477277755737305} -09/20/2021 17:26:41 - INFO - __main__ - Step 13654: {'lr': 0.00019999784160877265, 'samples': 436928, 'steps': 853, 'loss/train': 3.889946222305298} -09/20/2021 17:26:42 - INFO - __main__ - Step 13655: {'lr': 0.00019999784160877265, 'samples': 436960, 'steps': 853, 'loss/train': 3.9911863803863525} -09/20/2021 17:26:43 - INFO - __main__ - Step 13656: {'lr': 0.00019999784160877265, 'samples': 436992, 'steps': 853, 'loss/train': 3.4882731437683105} -09/20/2021 17:26:44 - INFO - __main__ - Step 13657: {'lr': 0.00019999784160877265, 'samples': 437024, 'steps': 853, 'loss/train': 4.492053985595703} -09/20/2021 17:26:44 - INFO - __main__ - Step 13658: {'lr': 0.00019999784160877265, 'samples': 437056, 'steps': 853, 'loss/train': 4.261109828948975} -09/20/2021 17:26:45 - INFO - __main__ - Step 13659: {'lr': 0.00019999784160877265, 'samples': 437088, 'steps': 853, 'loss/train': 4.401059150695801} -09/20/2021 17:26:46 - INFO - __main__ - Step 13660: {'lr': 0.00019999784160877265, 'samples': 437120, 'steps': 853, 'loss/train': 3.847898483276367} -09/20/2021 17:26:47 - INFO - __main__ - Step 13661: {'lr': 0.00019999784160877265, 'samples': 437152, 'steps': 853, 'loss/train': 3.832012414932251} -09/20/2021 17:26:47 - INFO - __main__ - Step 13662: {'lr': 0.00019999784160877265, 'samples': 437184, 'steps': 853, 'loss/train': 1.013859510421753} -09/20/2021 17:26:48 - INFO - __main__ - Step 13663: {'lr': 0.00019999784160877265, 'samples': 437216, 'steps': 853, 'loss/train': 4.141283988952637} -09/20/2021 17:26:49 - INFO - __main__ - Step 13664: {'lr': 0.00019999784160877265, 'samples': 437248, 'steps': 853, 'loss/train': 3.4317102432250977} -09/20/2021 17:26:50 - INFO - __main__ - Step 13665: {'lr': 0.0001999977994949688, 'samples': 437280, 'steps': 854, 'loss/train': 3.7386724948883057} -09/20/2021 17:26:51 - INFO - __main__ - Step 13666: {'lr': 0.0001999977994949688, 'samples': 437312, 'steps': 854, 'loss/train': 4.19016170501709} -09/20/2021 17:26:51 - INFO - __main__ - Step 13667: {'lr': 0.0001999977994949688, 'samples': 437344, 'steps': 854, 'loss/train': 3.690089225769043} -09/20/2021 17:26:52 - INFO - __main__ - Step 13668: {'lr': 0.0001999977994949688, 'samples': 437376, 'steps': 854, 'loss/train': 3.1137542724609375} -09/20/2021 17:26:53 - INFO - __main__ - Step 13669: {'lr': 0.0001999977994949688, 'samples': 437408, 'steps': 854, 'loss/train': 1.7201601266860962} -09/20/2021 17:26:54 - INFO - __main__ - Step 13670: {'lr': 0.0001999977994949688, 'samples': 437440, 'steps': 854, 'loss/train': 1.9999711513519287} -09/20/2021 17:26:54 - INFO - __main__ - Step 13671: {'lr': 0.0001999977994949688, 'samples': 437472, 'steps': 854, 'loss/train': 3.226975917816162} -09/20/2021 17:26:55 - INFO - __main__ - Step 13672: {'lr': 0.0001999977994949688, 'samples': 437504, 'steps': 854, 'loss/train': 3.315099000930786} -09/20/2021 17:26:56 - INFO - __main__ - Step 13673: {'lr': 0.0001999977994949688, 'samples': 437536, 'steps': 854, 'loss/train': 3.489169120788574} -09/20/2021 17:26:57 - INFO - __main__ - Step 13674: {'lr': 0.0001999977994949688, 'samples': 437568, 'steps': 854, 'loss/train': 3.9809930324554443} -09/20/2021 17:26:57 - INFO - __main__ - Step 13675: {'lr': 0.0001999977994949688, 'samples': 437600, 'steps': 854, 'loss/train': 4.608789920806885} -09/20/2021 17:26:59 - INFO - __main__ - Step 13676: {'lr': 0.0001999977994949688, 'samples': 437632, 'steps': 854, 'loss/train': 4.341854095458984} -09/20/2021 17:26:59 - INFO - __main__ - Step 13677: {'lr': 0.0001999977994949688, 'samples': 437664, 'steps': 854, 'loss/train': 4.39963436126709} -09/20/2021 17:27:00 - INFO - __main__ - Step 13678: {'lr': 0.0001999977994949688, 'samples': 437696, 'steps': 854, 'loss/train': 3.863450527191162} -09/20/2021 17:27:01 - INFO - __main__ - Step 13679: {'lr': 0.0001999977994949688, 'samples': 437728, 'steps': 854, 'loss/train': 3.6422030925750732} -09/20/2021 17:27:02 - INFO - __main__ - Step 13680: {'lr': 0.0001999977994949688, 'samples': 437760, 'steps': 854, 'loss/train': 3.4293835163116455} -09/20/2021 17:27:02 - INFO - __main__ - Step 13681: {'lr': 0.00019999775697427424, 'samples': 437792, 'steps': 855, 'loss/train': 3.0816245079040527} -09/20/2021 17:27:03 - INFO - __main__ - Step 13682: {'lr': 0.00019999775697427424, 'samples': 437824, 'steps': 855, 'loss/train': 4.5557861328125} -09/20/2021 17:27:04 - INFO - __main__ - Step 13683: {'lr': 0.00019999775697427424, 'samples': 437856, 'steps': 855, 'loss/train': 3.9676010608673096} -09/20/2021 17:27:05 - INFO - __main__ - Step 13684: {'lr': 0.00019999775697427424, 'samples': 437888, 'steps': 855, 'loss/train': 3.971341371536255} -09/20/2021 17:27:05 - INFO - __main__ - Step 13685: {'lr': 0.00019999775697427424, 'samples': 437920, 'steps': 855, 'loss/train': 3.6748461723327637} -09/20/2021 17:27:06 - INFO - __main__ - Step 13686: {'lr': 0.00019999775697427424, 'samples': 437952, 'steps': 855, 'loss/train': 4.837482929229736} -09/20/2021 17:27:07 - INFO - __main__ - Step 13687: {'lr': 0.00019999775697427424, 'samples': 437984, 'steps': 855, 'loss/train': 4.991029262542725} -09/20/2021 17:27:08 - INFO - __main__ - Step 13688: {'lr': 0.00019999775697427424, 'samples': 438016, 'steps': 855, 'loss/train': 3.6079797744750977} -09/20/2021 17:27:08 - INFO - __main__ - Step 13689: {'lr': 0.00019999775697427424, 'samples': 438048, 'steps': 855, 'loss/train': 3.7602643966674805} -09/20/2021 17:27:09 - INFO - __main__ - Step 13690: {'lr': 0.00019999775697427424, 'samples': 438080, 'steps': 855, 'loss/train': 3.769587993621826} -09/20/2021 17:27:10 - INFO - __main__ - Step 13691: {'lr': 0.00019999775697427424, 'samples': 438112, 'steps': 855, 'loss/train': 3.786303758621216} -09/20/2021 17:27:11 - INFO - __main__ - Step 13692: {'lr': 0.00019999775697427424, 'samples': 438144, 'steps': 855, 'loss/train': 4.613248348236084} -09/20/2021 17:27:11 - INFO - __main__ - Step 13693: {'lr': 0.00019999775697427424, 'samples': 438176, 'steps': 855, 'loss/train': 5.430627346038818} -09/20/2021 17:27:12 - INFO - __main__ - Step 13694: {'lr': 0.00019999775697427424, 'samples': 438208, 'steps': 855, 'loss/train': 4.7371697425842285} -09/20/2021 17:27:13 - INFO - __main__ - Step 13695: {'lr': 0.00019999775697427424, 'samples': 438240, 'steps': 855, 'loss/train': 5.0237202644348145} -09/20/2021 17:27:14 - INFO - __main__ - Step 13696: {'lr': 0.00019999775697427424, 'samples': 438272, 'steps': 855, 'loss/train': 4.895113468170166} -09/20/2021 17:27:15 - INFO - __main__ - Step 13697: {'lr': 0.0001999977140466892, 'samples': 438304, 'steps': 856, 'loss/train': 3.654959201812744} -09/20/2021 17:27:15 - INFO - __main__ - Step 13698: {'lr': 0.0001999977140466892, 'samples': 438336, 'steps': 856, 'loss/train': 4.829066276550293} -09/20/2021 17:27:16 - INFO - __main__ - Step 13699: {'lr': 0.0001999977140466892, 'samples': 438368, 'steps': 856, 'loss/train': 3.753678560256958} -09/20/2021 17:27:17 - INFO - __main__ - Step 13700: {'lr': 0.0001999977140466892, 'samples': 438400, 'steps': 856, 'loss/train': 4.475807189941406} -09/20/2021 17:27:18 - INFO - __main__ - Step 13701: {'lr': 0.0001999977140466892, 'samples': 438432, 'steps': 856, 'loss/train': 3.488558292388916} -09/20/2021 17:27:18 - INFO - __main__ - Step 13702: {'lr': 0.0001999977140466892, 'samples': 438464, 'steps': 856, 'loss/train': 4.0326666831970215} -09/20/2021 17:27:19 - INFO - __main__ - Step 13703: {'lr': 0.0001999977140466892, 'samples': 438496, 'steps': 856, 'loss/train': 3.5112826824188232} -09/20/2021 17:27:20 - INFO - __main__ - Step 13704: {'lr': 0.0001999977140466892, 'samples': 438528, 'steps': 856, 'loss/train': 4.463895320892334} -09/20/2021 17:27:21 - INFO - __main__ - Step 13705: {'lr': 0.0001999977140466892, 'samples': 438560, 'steps': 856, 'loss/train': 3.98983097076416} -09/20/2021 17:27:22 - INFO - __main__ - Step 13706: {'lr': 0.0001999977140466892, 'samples': 438592, 'steps': 856, 'loss/train': 3.6913604736328125} -09/20/2021 17:27:23 - INFO - __main__ - Step 13707: {'lr': 0.0001999977140466892, 'samples': 438624, 'steps': 856, 'loss/train': 1.3203134536743164} -09/20/2021 17:27:23 - INFO - __main__ - Step 13708: {'lr': 0.0001999977140466892, 'samples': 438656, 'steps': 856, 'loss/train': 2.3419830799102783} -09/20/2021 17:27:24 - INFO - __main__ - Step 13709: {'lr': 0.0001999977140466892, 'samples': 438688, 'steps': 856, 'loss/train': 1.085060477256775} -09/20/2021 17:27:25 - INFO - __main__ - Step 13710: {'lr': 0.0001999977140466892, 'samples': 438720, 'steps': 856, 'loss/train': 1.147442102432251} -09/20/2021 17:27:26 - INFO - __main__ - Step 13711: {'lr': 0.0001999977140466892, 'samples': 438752, 'steps': 856, 'loss/train': 3.8313558101654053} -09/20/2021 17:27:26 - INFO - __main__ - Step 13712: {'lr': 0.0001999977140466892, 'samples': 438784, 'steps': 856, 'loss/train': 3.9155964851379395} -09/20/2021 17:27:27 - INFO - __main__ - Step 13713: {'lr': 0.00019999767071221384, 'samples': 438816, 'steps': 857, 'loss/train': 3.6821625232696533} -09/20/2021 17:27:28 - INFO - __main__ - Step 13714: {'lr': 0.00019999767071221384, 'samples': 438848, 'steps': 857, 'loss/train': 4.1820292472839355} -09/20/2021 17:27:29 - INFO - __main__ - Step 13715: {'lr': 0.00019999767071221384, 'samples': 438880, 'steps': 857, 'loss/train': 4.1676530838012695} -09/20/2021 17:27:30 - INFO - __main__ - Step 13716: {'lr': 0.00019999767071221384, 'samples': 438912, 'steps': 857, 'loss/train': 3.809724807739258} -09/20/2021 17:27:30 - INFO - __main__ - Step 13717: {'lr': 0.00019999767071221384, 'samples': 438944, 'steps': 857, 'loss/train': 5.350722789764404} -09/20/2021 17:27:31 - INFO - __main__ - Step 13718: {'lr': 0.00019999767071221384, 'samples': 438976, 'steps': 857, 'loss/train': 3.512314796447754} -09/20/2021 17:27:32 - INFO - __main__ - Step 13719: {'lr': 0.00019999767071221384, 'samples': 439008, 'steps': 857, 'loss/train': 3.386605739593506} -09/20/2021 17:27:33 - INFO - __main__ - Step 13720: {'lr': 0.00019999767071221384, 'samples': 439040, 'steps': 857, 'loss/train': 3.4257447719573975} -09/20/2021 17:27:33 - INFO - __main__ - Step 13721: {'lr': 0.00019999767071221384, 'samples': 439072, 'steps': 857, 'loss/train': 3.760153293609619} -09/20/2021 17:27:34 - INFO - __main__ - Step 13722: {'lr': 0.00019999767071221384, 'samples': 439104, 'steps': 857, 'loss/train': 2.2076971530914307} -09/20/2021 17:27:35 - INFO - __main__ - Step 13723: {'lr': 0.00019999767071221384, 'samples': 439136, 'steps': 857, 'loss/train': 3.720167398452759} -09/20/2021 17:27:36 - INFO - __main__ - Step 13724: {'lr': 0.00019999767071221384, 'samples': 439168, 'steps': 857, 'loss/train': 3.2651801109313965} -09/20/2021 17:27:36 - INFO - __main__ - Step 13725: {'lr': 0.00019999767071221384, 'samples': 439200, 'steps': 857, 'loss/train': 3.901264190673828} -09/20/2021 17:27:37 - INFO - __main__ - Step 13726: {'lr': 0.00019999767071221384, 'samples': 439232, 'steps': 857, 'loss/train': 3.5587222576141357} -09/20/2021 17:27:38 - INFO - __main__ - Step 13727: {'lr': 0.00019999767071221384, 'samples': 439264, 'steps': 857, 'loss/train': 3.962092876434326} -09/20/2021 17:27:39 - INFO - __main__ - Step 13728: {'lr': 0.00019999767071221384, 'samples': 439296, 'steps': 857, 'loss/train': 4.317385673522949} -09/20/2021 17:27:39 - INFO - __main__ - Step 13729: {'lr': 0.00019999762697084838, 'samples': 439328, 'steps': 858, 'loss/train': 4.0132293701171875} -09/20/2021 17:27:40 - INFO - __main__ - Step 13730: {'lr': 0.00019999762697084838, 'samples': 439360, 'steps': 858, 'loss/train': 4.0892205238342285} -09/20/2021 17:27:41 - INFO - __main__ - Step 13731: {'lr': 0.00019999762697084838, 'samples': 439392, 'steps': 858, 'loss/train': 3.5622341632843018} -09/20/2021 17:27:42 - INFO - __main__ - Step 13732: {'lr': 0.00019999762697084838, 'samples': 439424, 'steps': 858, 'loss/train': 3.720393657684326} -09/20/2021 17:27:42 - INFO - __main__ - Step 13733: {'lr': 0.00019999762697084838, 'samples': 439456, 'steps': 858, 'loss/train': 3.888812780380249} -09/20/2021 17:27:43 - INFO - __main__ - Step 13734: {'lr': 0.00019999762697084838, 'samples': 439488, 'steps': 858, 'loss/train': 1.3453214168548584} -09/20/2021 17:27:44 - INFO - __main__ - Step 13735: {'lr': 0.00019999762697084838, 'samples': 439520, 'steps': 858, 'loss/train': 1.2492824792861938} -09/20/2021 17:27:45 - INFO - __main__ - Step 13736: {'lr': 0.00019999762697084838, 'samples': 439552, 'steps': 858, 'loss/train': 1.0021988153457642} -09/20/2021 17:27:46 - INFO - __main__ - Step 13737: {'lr': 0.00019999762697084838, 'samples': 439584, 'steps': 858, 'loss/train': 4.437636375427246} -09/20/2021 17:27:47 - INFO - __main__ - Step 13738: {'lr': 0.00019999762697084838, 'samples': 439616, 'steps': 858, 'loss/train': 3.3594613075256348} -09/20/2021 17:27:47 - INFO - __main__ - Step 13739: {'lr': 0.00019999762697084838, 'samples': 439648, 'steps': 858, 'loss/train': 4.091653823852539} -09/20/2021 17:27:48 - INFO - __main__ - Step 13740: {'lr': 0.00019999762697084838, 'samples': 439680, 'steps': 858, 'loss/train': 3.4296672344207764} -09/20/2021 17:27:49 - INFO - __main__ - Step 13741: {'lr': 0.00019999762697084838, 'samples': 439712, 'steps': 858, 'loss/train': 3.5813426971435547} -09/20/2021 17:27:50 - INFO - __main__ - Step 13742: {'lr': 0.00019999762697084838, 'samples': 439744, 'steps': 858, 'loss/train': 5.532720565795898} -09/20/2021 17:27:50 - INFO - __main__ - Step 13743: {'lr': 0.00019999762697084838, 'samples': 439776, 'steps': 858, 'loss/train': 3.143702983856201} -09/20/2021 17:27:51 - INFO - __main__ - Step 13744: {'lr': 0.00019999762697084838, 'samples': 439808, 'steps': 858, 'loss/train': 3.6935057640075684} -09/20/2021 17:27:52 - INFO - __main__ - Step 13745: {'lr': 0.00019999758282259297, 'samples': 439840, 'steps': 859, 'loss/train': 3.057760000228882} -09/20/2021 17:27:53 - INFO - __main__ - Step 13746: {'lr': 0.00019999758282259297, 'samples': 439872, 'steps': 859, 'loss/train': 4.138457298278809} -09/20/2021 17:27:54 - INFO - __main__ - Step 13747: {'lr': 0.00019999758282259297, 'samples': 439904, 'steps': 859, 'loss/train': 4.991602420806885} -09/20/2021 17:27:54 - INFO - __main__ - Step 13748: {'lr': 0.00019999758282259297, 'samples': 439936, 'steps': 859, 'loss/train': 3.9286413192749023} -09/20/2021 17:27:55 - INFO - __main__ - Step 13749: {'lr': 0.00019999758282259297, 'samples': 439968, 'steps': 859, 'loss/train': 3.7362120151519775} -09/20/2021 17:27:56 - INFO - __main__ - Step 13750: {'lr': 0.00019999758282259297, 'samples': 440000, 'steps': 859, 'loss/train': 4.201443672180176} -09/20/2021 17:27:57 - INFO - __main__ - Step 13751: {'lr': 0.00019999758282259297, 'samples': 440032, 'steps': 859, 'loss/train': 4.192630290985107} -09/20/2021 17:27:57 - INFO - __main__ - Step 13752: {'lr': 0.00019999758282259297, 'samples': 440064, 'steps': 859, 'loss/train': 3.6916873455047607} -09/20/2021 17:27:58 - INFO - __main__ - Step 13753: {'lr': 0.00019999758282259297, 'samples': 440096, 'steps': 859, 'loss/train': 4.151600360870361} -09/20/2021 17:27:59 - INFO - __main__ - Step 13754: {'lr': 0.00019999758282259297, 'samples': 440128, 'steps': 859, 'loss/train': 4.027298927307129} -09/20/2021 17:28:00 - INFO - __main__ - Step 13755: {'lr': 0.00019999758282259297, 'samples': 440160, 'steps': 859, 'loss/train': 3.6880245208740234} -09/20/2021 17:28:00 - INFO - __main__ - Step 13756: {'lr': 0.00019999758282259297, 'samples': 440192, 'steps': 859, 'loss/train': 3.9487595558166504} -09/20/2021 17:28:01 - INFO - __main__ - Step 13757: {'lr': 0.00019999758282259297, 'samples': 440224, 'steps': 859, 'loss/train': 3.0468530654907227} -09/20/2021 17:28:02 - INFO - __main__ - Step 13758: {'lr': 0.00019999758282259297, 'samples': 440256, 'steps': 859, 'loss/train': 4.381703853607178} -09/20/2021 17:28:03 - INFO - __main__ - Step 13759: {'lr': 0.00019999758282259297, 'samples': 440288, 'steps': 859, 'loss/train': 4.517544269561768} -09/20/2021 17:28:03 - INFO - __main__ - Step 13760: {'lr': 0.00019999758282259297, 'samples': 440320, 'steps': 859, 'loss/train': 5.339778423309326} -09/20/2021 17:28:04 - INFO - __main__ - Step 13761: {'lr': 0.00019999753826744775, 'samples': 440352, 'steps': 860, 'loss/train': 4.519352912902832} -09/20/2021 17:28:05 - INFO - __main__ - Step 13762: {'lr': 0.00019999753826744775, 'samples': 440384, 'steps': 860, 'loss/train': 3.4823598861694336} -09/20/2021 17:28:06 - INFO - __main__ - Step 13763: {'lr': 0.00019999753826744775, 'samples': 440416, 'steps': 860, 'loss/train': 3.7517778873443604} -09/20/2021 17:28:06 - INFO - __main__ - Step 13764: {'lr': 0.00019999753826744775, 'samples': 440448, 'steps': 860, 'loss/train': 4.301408767700195} -09/20/2021 17:28:07 - INFO - __main__ - Step 13765: {'lr': 0.00019999753826744775, 'samples': 440480, 'steps': 860, 'loss/train': 3.988205909729004} -09/20/2021 17:28:08 - INFO - __main__ - Step 13766: {'lr': 0.00019999753826744775, 'samples': 440512, 'steps': 860, 'loss/train': 3.511686086654663} -09/20/2021 17:28:09 - INFO - __main__ - Step 13767: {'lr': 0.00019999753826744775, 'samples': 440544, 'steps': 860, 'loss/train': 4.743406295776367} -09/20/2021 17:28:10 - INFO - __main__ - Step 13768: {'lr': 0.00019999753826744775, 'samples': 440576, 'steps': 860, 'loss/train': 3.9631404876708984} -09/20/2021 17:28:11 - INFO - __main__ - Step 13769: {'lr': 0.00019999753826744775, 'samples': 440608, 'steps': 860, 'loss/train': 4.005614757537842} -09/20/2021 17:28:11 - INFO - __main__ - Step 13770: {'lr': 0.00019999753826744775, 'samples': 440640, 'steps': 860, 'loss/train': 3.9820849895477295} -09/20/2021 17:28:12 - INFO - __main__ - Step 13771: {'lr': 0.00019999753826744775, 'samples': 440672, 'steps': 860, 'loss/train': 2.6663527488708496} -09/20/2021 17:28:13 - INFO - __main__ - Step 13772: {'lr': 0.00019999753826744775, 'samples': 440704, 'steps': 860, 'loss/train': 1.8962011337280273} -09/20/2021 17:28:14 - INFO - __main__ - Step 13773: {'lr': 0.00019999753826744775, 'samples': 440736, 'steps': 860, 'loss/train': 4.506433486938477} -09/20/2021 17:28:14 - INFO - __main__ - Step 13774: {'lr': 0.00019999753826744775, 'samples': 440768, 'steps': 860, 'loss/train': 3.8163769245147705} -09/20/2021 17:28:15 - INFO - __main__ - Step 13775: {'lr': 0.00019999753826744775, 'samples': 440800, 'steps': 860, 'loss/train': 2.707343578338623} -09/20/2021 17:28:16 - INFO - __main__ - Step 13776: {'lr': 0.00019999753826744775, 'samples': 440832, 'steps': 860, 'loss/train': 3.634850263595581} -09/20/2021 17:28:17 - INFO - __main__ - Step 13777: {'lr': 0.00019999749330541295, 'samples': 440864, 'steps': 861, 'loss/train': 2.989496946334839} -09/20/2021 17:28:18 - INFO - __main__ - Step 13778: {'lr': 0.00019999749330541295, 'samples': 440896, 'steps': 861, 'loss/train': 4.098989486694336} -09/20/2021 17:28:18 - INFO - __main__ - Step 13779: {'lr': 0.00019999749330541295, 'samples': 440928, 'steps': 861, 'loss/train': 5.327324867248535} -09/20/2021 17:28:19 - INFO - __main__ - Step 13780: {'lr': 0.00019999749330541295, 'samples': 440960, 'steps': 861, 'loss/train': 3.993441104888916} -09/20/2021 17:28:20 - INFO - __main__ - Step 13781: {'lr': 0.00019999749330541295, 'samples': 440992, 'steps': 861, 'loss/train': 4.781274318695068} -09/20/2021 17:28:21 - INFO - __main__ - Step 13782: {'lr': 0.00019999749330541295, 'samples': 441024, 'steps': 861, 'loss/train': 3.3141703605651855} -09/20/2021 17:28:21 - INFO - __main__ - Step 13783: {'lr': 0.00019999749330541295, 'samples': 441056, 'steps': 861, 'loss/train': 4.775904178619385} -09/20/2021 17:28:22 - INFO - __main__ - Step 13784: {'lr': 0.00019999749330541295, 'samples': 441088, 'steps': 861, 'loss/train': 4.249048233032227} -09/20/2021 17:28:23 - INFO - __main__ - Step 13785: {'lr': 0.00019999749330541295, 'samples': 441120, 'steps': 861, 'loss/train': 3.818708896636963} -09/20/2021 17:28:24 - INFO - __main__ - Step 13786: {'lr': 0.00019999749330541295, 'samples': 441152, 'steps': 861, 'loss/train': 3.9411332607269287} -09/20/2021 17:28:24 - INFO - __main__ - Step 13787: {'lr': 0.00019999749330541295, 'samples': 441184, 'steps': 861, 'loss/train': 3.7920515537261963} -09/20/2021 17:28:25 - INFO - __main__ - Step 13788: {'lr': 0.00019999749330541295, 'samples': 441216, 'steps': 861, 'loss/train': 4.692425727844238} -09/20/2021 17:28:26 - INFO - __main__ - Step 13789: {'lr': 0.00019999749330541295, 'samples': 441248, 'steps': 861, 'loss/train': 4.2795515060424805} -09/20/2021 17:28:27 - INFO - __main__ - Step 13790: {'lr': 0.00019999749330541295, 'samples': 441280, 'steps': 861, 'loss/train': 4.7114176750183105} -09/20/2021 17:28:27 - INFO - __main__ - Step 13791: {'lr': 0.00019999749330541295, 'samples': 441312, 'steps': 861, 'loss/train': 3.848135232925415} -09/20/2021 17:28:28 - INFO - __main__ - Step 13792: {'lr': 0.00019999749330541295, 'samples': 441344, 'steps': 861, 'loss/train': 3.3780694007873535} -09/20/2021 17:28:29 - INFO - __main__ - Step 13793: {'lr': 0.00019999744793648873, 'samples': 441376, 'steps': 862, 'loss/train': 3.859912872314453} -09/20/2021 17:28:30 - INFO - __main__ - Step 13794: {'lr': 0.00019999744793648873, 'samples': 441408, 'steps': 862, 'loss/train': 4.195104122161865} -09/20/2021 17:28:31 - INFO - __main__ - Step 13795: {'lr': 0.00019999744793648873, 'samples': 441440, 'steps': 862, 'loss/train': 3.3720920085906982} -09/20/2021 17:28:31 - INFO - __main__ - Step 13796: {'lr': 0.00019999744793648873, 'samples': 441472, 'steps': 862, 'loss/train': 4.116262435913086} -09/20/2021 17:28:32 - INFO - __main__ - Step 13797: {'lr': 0.00019999744793648873, 'samples': 441504, 'steps': 862, 'loss/train': 4.384119033813477} -09/20/2021 17:28:33 - INFO - __main__ - Step 13798: {'lr': 0.00019999744793648873, 'samples': 441536, 'steps': 862, 'loss/train': 3.767848014831543} -09/20/2021 17:28:34 - INFO - __main__ - Step 13799: {'lr': 0.00019999744793648873, 'samples': 441568, 'steps': 862, 'loss/train': 4.472550392150879} -09/20/2021 17:28:35 - INFO - __main__ - Step 13800: {'lr': 0.00019999744793648873, 'samples': 441600, 'steps': 862, 'loss/train': 3.5761706829071045} -09/20/2021 17:28:36 - INFO - __main__ - Step 13801: {'lr': 0.00019999744793648873, 'samples': 441632, 'steps': 862, 'loss/train': 1.9268826246261597} -09/20/2021 17:28:36 - INFO - __main__ - Step 13802: {'lr': 0.00019999744793648873, 'samples': 441664, 'steps': 862, 'loss/train': 3.7454724311828613} -09/20/2021 17:28:37 - INFO - __main__ - Step 13803: {'lr': 0.00019999744793648873, 'samples': 441696, 'steps': 862, 'loss/train': 3.456859588623047} -09/20/2021 17:28:38 - INFO - __main__ - Step 13804: {'lr': 0.00019999744793648873, 'samples': 441728, 'steps': 862, 'loss/train': 3.1675915718078613} -09/20/2021 17:28:39 - INFO - __main__ - Step 13805: {'lr': 0.00019999744793648873, 'samples': 441760, 'steps': 862, 'loss/train': 3.929959297180176} -09/20/2021 17:28:39 - INFO - __main__ - Step 13806: {'lr': 0.00019999744793648873, 'samples': 441792, 'steps': 862, 'loss/train': 4.335862636566162} -09/20/2021 17:28:40 - INFO - __main__ - Step 13807: {'lr': 0.00019999744793648873, 'samples': 441824, 'steps': 862, 'loss/train': 3.9436230659484863} -09/20/2021 17:28:41 - INFO - __main__ - Step 13808: {'lr': 0.00019999744793648873, 'samples': 441856, 'steps': 862, 'loss/train': 3.3080697059631348} -09/20/2021 17:28:42 - INFO - __main__ - Step 13809: {'lr': 0.00019999740216067527, 'samples': 441888, 'steps': 863, 'loss/train': 4.943742752075195} -09/20/2021 17:28:43 - INFO - __main__ - Step 13810: {'lr': 0.00019999740216067527, 'samples': 441920, 'steps': 863, 'loss/train': 4.225198745727539} -09/20/2021 17:28:43 - INFO - __main__ - Step 13811: {'lr': 0.00019999740216067527, 'samples': 441952, 'steps': 863, 'loss/train': 3.8717944622039795} -09/20/2021 17:28:44 - INFO - __main__ - Step 13812: {'lr': 0.00019999740216067527, 'samples': 441984, 'steps': 863, 'loss/train': 4.138514041900635} -09/20/2021 17:28:45 - INFO - __main__ - Step 13813: {'lr': 0.00019999740216067527, 'samples': 442016, 'steps': 863, 'loss/train': 3.6962058544158936} -09/20/2021 17:28:46 - INFO - __main__ - Step 13814: {'lr': 0.00019999740216067527, 'samples': 442048, 'steps': 863, 'loss/train': 4.088113307952881} -09/20/2021 17:28:46 - INFO - __main__ - Step 13815: {'lr': 0.00019999740216067527, 'samples': 442080, 'steps': 863, 'loss/train': 4.1552734375} -09/20/2021 17:28:47 - INFO - __main__ - Step 13816: {'lr': 0.00019999740216067527, 'samples': 442112, 'steps': 863, 'loss/train': 4.685675621032715} -09/20/2021 17:28:48 - INFO - __main__ - Step 13817: {'lr': 0.00019999740216067527, 'samples': 442144, 'steps': 863, 'loss/train': 4.324446678161621} -09/20/2021 17:28:49 - INFO - __main__ - Step 13818: {'lr': 0.00019999740216067527, 'samples': 442176, 'steps': 863, 'loss/train': 4.43963098526001} -09/20/2021 17:28:49 - INFO - __main__ - Step 13819: {'lr': 0.00019999740216067527, 'samples': 442208, 'steps': 863, 'loss/train': 3.808727741241455} -09/20/2021 17:28:50 - INFO - __main__ - Step 13820: {'lr': 0.00019999740216067527, 'samples': 442240, 'steps': 863, 'loss/train': 4.462586879730225} -09/20/2021 17:28:51 - INFO - __main__ - Step 13821: {'lr': 0.00019999740216067527, 'samples': 442272, 'steps': 863, 'loss/train': 4.17171049118042} -09/20/2021 17:28:52 - INFO - __main__ - Step 13822: {'lr': 0.00019999740216067527, 'samples': 442304, 'steps': 863, 'loss/train': 4.152982711791992} -09/20/2021 17:28:52 - INFO - __main__ - Step 13823: {'lr': 0.00019999740216067527, 'samples': 442336, 'steps': 863, 'loss/train': 4.141335487365723} -09/20/2021 17:28:53 - INFO - __main__ - Step 13824: {'lr': 0.00019999740216067527, 'samples': 442368, 'steps': 863, 'loss/train': 6.362804412841797} -09/20/2021 17:28:54 - INFO - __main__ - Step 13825: {'lr': 0.0001999973559779728, 'samples': 442400, 'steps': 864, 'loss/train': 3.8270606994628906} -09/20/2021 17:28:55 - INFO - __main__ - Step 13826: {'lr': 0.0001999973559779728, 'samples': 442432, 'steps': 864, 'loss/train': 3.3038856983184814} -09/20/2021 17:28:55 - INFO - __main__ - Step 13827: {'lr': 0.0001999973559779728, 'samples': 442464, 'steps': 864, 'loss/train': 4.271692276000977} -09/20/2021 17:28:57 - INFO - __main__ - Step 13828: {'lr': 0.0001999973559779728, 'samples': 442496, 'steps': 864, 'loss/train': 4.175492286682129} -09/20/2021 17:28:58 - INFO - __main__ - Step 13829: {'lr': 0.0001999973559779728, 'samples': 442528, 'steps': 864, 'loss/train': 3.829437732696533} -09/20/2021 17:28:58 - INFO - __main__ - Step 13830: {'lr': 0.0001999973559779728, 'samples': 442560, 'steps': 864, 'loss/train': 3.6317596435546875} -09/20/2021 17:28:59 - INFO - __main__ - Step 13831: {'lr': 0.0001999973559779728, 'samples': 442592, 'steps': 864, 'loss/train': 3.004007577896118} -09/20/2021 17:29:00 - INFO - __main__ - Step 13832: {'lr': 0.0001999973559779728, 'samples': 442624, 'steps': 864, 'loss/train': 3.2203736305236816} -09/20/2021 17:29:01 - INFO - __main__ - Step 13833: {'lr': 0.0001999973559779728, 'samples': 442656, 'steps': 864, 'loss/train': 4.999274253845215} -09/20/2021 17:29:01 - INFO - __main__ - Step 13834: {'lr': 0.0001999973559779728, 'samples': 442688, 'steps': 864, 'loss/train': 4.000890731811523} -09/20/2021 17:29:02 - INFO - __main__ - Step 13835: {'lr': 0.0001999973559779728, 'samples': 442720, 'steps': 864, 'loss/train': 4.3030805587768555} -09/20/2021 17:29:03 - INFO - __main__ - Step 13836: {'lr': 0.0001999973559779728, 'samples': 442752, 'steps': 864, 'loss/train': 4.356365203857422} -09/20/2021 17:29:04 - INFO - __main__ - Step 13837: {'lr': 0.0001999973559779728, 'samples': 442784, 'steps': 864, 'loss/train': 4.88618278503418} -09/20/2021 17:29:04 - INFO - __main__ - Step 13838: {'lr': 0.0001999973559779728, 'samples': 442816, 'steps': 864, 'loss/train': 7.019900798797607} -09/20/2021 17:29:05 - INFO - __main__ - Step 13839: {'lr': 0.0001999973559779728, 'samples': 442848, 'steps': 864, 'loss/train': 4.063394546508789} -09/20/2021 17:29:06 - INFO - __main__ - Step 13840: {'lr': 0.0001999973559779728, 'samples': 442880, 'steps': 864, 'loss/train': 3.394357442855835} -09/20/2021 17:29:07 - INFO - __main__ - Step 13841: {'lr': 0.00019999730938838147, 'samples': 442912, 'steps': 865, 'loss/train': 4.9127421379089355} -09/20/2021 17:29:07 - INFO - __main__ - Step 13842: {'lr': 0.00019999730938838147, 'samples': 442944, 'steps': 865, 'loss/train': 1.4038437604904175} -09/20/2021 17:29:08 - INFO - __main__ - Step 13843: {'lr': 0.00019999730938838147, 'samples': 442976, 'steps': 865, 'loss/train': 3.3789010047912598} -09/20/2021 17:29:09 - INFO - __main__ - Step 13844: {'lr': 0.00019999730938838147, 'samples': 443008, 'steps': 865, 'loss/train': 3.8932723999023438} -09/20/2021 17:29:10 - INFO - __main__ - Step 13845: {'lr': 0.00019999730938838147, 'samples': 443040, 'steps': 865, 'loss/train': 3.8936214447021484} -09/20/2021 17:29:10 - INFO - __main__ - Step 13846: {'lr': 0.00019999730938838147, 'samples': 443072, 'steps': 865, 'loss/train': 2.739809274673462} -09/20/2021 17:29:11 - INFO - __main__ - Step 13847: {'lr': 0.00019999730938838147, 'samples': 443104, 'steps': 865, 'loss/train': 3.6584770679473877} -09/20/2021 17:29:12 - INFO - __main__ - Step 13848: {'lr': 0.00019999730938838147, 'samples': 443136, 'steps': 865, 'loss/train': 3.8922252655029297} -09/20/2021 17:29:13 - INFO - __main__ - Step 13849: {'lr': 0.00019999730938838147, 'samples': 443168, 'steps': 865, 'loss/train': 3.8317644596099854} -09/20/2021 17:29:13 - INFO - __main__ - Step 13850: {'lr': 0.00019999730938838147, 'samples': 443200, 'steps': 865, 'loss/train': 3.9840333461761475} -09/20/2021 17:29:14 - INFO - __main__ - Step 13851: {'lr': 0.00019999730938838147, 'samples': 443232, 'steps': 865, 'loss/train': 3.8568191528320312} -09/20/2021 17:29:15 - INFO - __main__ - Step 13852: {'lr': 0.00019999730938838147, 'samples': 443264, 'steps': 865, 'loss/train': 3.675008773803711} -09/20/2021 17:29:16 - INFO - __main__ - Step 13853: {'lr': 0.00019999730938838147, 'samples': 443296, 'steps': 865, 'loss/train': 3.6260178089141846} -09/20/2021 17:29:16 - INFO - __main__ - Step 13854: {'lr': 0.00019999730938838147, 'samples': 443328, 'steps': 865, 'loss/train': 3.9886415004730225} -09/20/2021 17:29:17 - INFO - __main__ - Step 13855: {'lr': 0.00019999730938838147, 'samples': 443360, 'steps': 865, 'loss/train': 3.7074170112609863} -09/20/2021 17:29:18 - INFO - __main__ - Step 13856: {'lr': 0.00019999730938838147, 'samples': 443392, 'steps': 865, 'loss/train': 3.8737757205963135} -09/20/2021 17:29:19 - INFO - __main__ - Step 13857: {'lr': 0.00019999726239190146, 'samples': 443424, 'steps': 866, 'loss/train': 5.54691219329834} -09/20/2021 17:29:20 - INFO - __main__ - Step 13858: {'lr': 0.00019999726239190146, 'samples': 443456, 'steps': 866, 'loss/train': 4.470693588256836} -09/20/2021 17:29:21 - INFO - __main__ - Step 13859: {'lr': 0.00019999726239190146, 'samples': 443488, 'steps': 866, 'loss/train': 4.321222305297852} -09/20/2021 17:29:22 - INFO - __main__ - Step 13860: {'lr': 0.00019999726239190146, 'samples': 443520, 'steps': 866, 'loss/train': 4.125954627990723} -09/20/2021 17:29:22 - INFO - __main__ - Step 13861: {'lr': 0.00019999726239190146, 'samples': 443552, 'steps': 866, 'loss/train': 4.320698261260986} -09/20/2021 17:29:23 - INFO - __main__ - Step 13862: {'lr': 0.00019999726239190146, 'samples': 443584, 'steps': 866, 'loss/train': 3.3505799770355225} -09/20/2021 17:29:24 - INFO - __main__ - Step 13863: {'lr': 0.00019999726239190146, 'samples': 443616, 'steps': 866, 'loss/train': 3.337796449661255} -09/20/2021 17:29:25 - INFO - __main__ - Step 13864: {'lr': 0.00019999726239190146, 'samples': 443648, 'steps': 866, 'loss/train': 4.178014755249023} -09/20/2021 17:29:25 - INFO - __main__ - Step 13865: {'lr': 0.00019999726239190146, 'samples': 443680, 'steps': 866, 'loss/train': 4.507061958312988} -09/20/2021 17:29:26 - INFO - __main__ - Step 13866: {'lr': 0.00019999726239190146, 'samples': 443712, 'steps': 866, 'loss/train': 2.793649911880493} -09/20/2021 17:29:27 - INFO - __main__ - Step 13867: {'lr': 0.00019999726239190146, 'samples': 443744, 'steps': 866, 'loss/train': 4.162247657775879} -09/20/2021 17:29:28 - INFO - __main__ - Step 13868: {'lr': 0.00019999726239190146, 'samples': 443776, 'steps': 866, 'loss/train': 3.731031894683838} -09/20/2021 17:29:28 - INFO - __main__ - Step 13869: {'lr': 0.00019999726239190146, 'samples': 443808, 'steps': 866, 'loss/train': 2.922832489013672} -09/20/2021 17:29:29 - INFO - __main__ - Step 13870: {'lr': 0.00019999726239190146, 'samples': 443840, 'steps': 866, 'loss/train': 3.376594066619873} -09/20/2021 17:29:30 - INFO - __main__ - Step 13871: {'lr': 0.00019999726239190146, 'samples': 443872, 'steps': 866, 'loss/train': 4.060923099517822} -09/20/2021 17:29:31 - INFO - __main__ - Step 13872: {'lr': 0.00019999726239190146, 'samples': 443904, 'steps': 866, 'loss/train': 3.6475484371185303} -09/20/2021 17:29:31 - INFO - __main__ - Step 13873: {'lr': 0.000199997214988533, 'samples': 443936, 'steps': 867, 'loss/train': 5.425074577331543} -09/20/2021 17:29:32 - INFO - __main__ - Step 13874: {'lr': 0.000199997214988533, 'samples': 443968, 'steps': 867, 'loss/train': 2.917530059814453} -09/20/2021 17:29:33 - INFO - __main__ - Step 13875: {'lr': 0.000199997214988533, 'samples': 444000, 'steps': 867, 'loss/train': 4.221967697143555} -09/20/2021 17:29:34 - INFO - __main__ - Step 13876: {'lr': 0.000199997214988533, 'samples': 444032, 'steps': 867, 'loss/train': 3.9511051177978516} -09/20/2021 17:29:34 - INFO - __main__ - Step 13877: {'lr': 0.000199997214988533, 'samples': 444064, 'steps': 867, 'loss/train': 5.410984992980957} -09/20/2021 17:29:35 - INFO - __main__ - Step 13878: {'lr': 0.000199997214988533, 'samples': 444096, 'steps': 867, 'loss/train': 4.237882137298584} -09/20/2021 17:29:36 - INFO - __main__ - Step 13879: {'lr': 0.000199997214988533, 'samples': 444128, 'steps': 867, 'loss/train': 3.9435794353485107} -09/20/2021 17:29:37 - INFO - __main__ - Step 13880: {'lr': 0.000199997214988533, 'samples': 444160, 'steps': 867, 'loss/train': 3.981282949447632} -09/20/2021 17:29:37 - INFO - __main__ - Step 13881: {'lr': 0.000199997214988533, 'samples': 444192, 'steps': 867, 'loss/train': 5.170494556427002} -09/20/2021 17:29:38 - INFO - __main__ - Step 13882: {'lr': 0.000199997214988533, 'samples': 444224, 'steps': 867, 'loss/train': 5.174713134765625} -09/20/2021 17:29:39 - INFO - __main__ - Step 13883: {'lr': 0.000199997214988533, 'samples': 444256, 'steps': 867, 'loss/train': 5.155541896820068} -09/20/2021 17:29:40 - INFO - __main__ - Step 13884: {'lr': 0.000199997214988533, 'samples': 444288, 'steps': 867, 'loss/train': 2.596703052520752} -09/20/2021 17:29:40 - INFO - __main__ - Step 13885: {'lr': 0.000199997214988533, 'samples': 444320, 'steps': 867, 'loss/train': 1.1573774814605713} -09/20/2021 17:29:41 - INFO - __main__ - Step 13886: {'lr': 0.000199997214988533, 'samples': 444352, 'steps': 867, 'loss/train': 4.303823947906494} -09/20/2021 17:29:42 - INFO - __main__ - Step 13887: {'lr': 0.000199997214988533, 'samples': 444384, 'steps': 867, 'loss/train': 4.244650363922119} -09/20/2021 17:29:43 - INFO - __main__ - Step 13888: {'lr': 0.000199997214988533, 'samples': 444416, 'steps': 867, 'loss/train': 2.1723673343658447} -09/20/2021 17:29:44 - INFO - __main__ - Step 13889: {'lr': 0.00019999716717827623, 'samples': 444448, 'steps': 868, 'loss/train': 4.432715892791748} -09/20/2021 17:29:45 - INFO - __main__ - Step 13890: {'lr': 0.00019999716717827623, 'samples': 444480, 'steps': 868, 'loss/train': 4.630208492279053} -09/20/2021 17:29:46 - INFO - __main__ - Step 13891: {'lr': 0.00019999716717827623, 'samples': 444512, 'steps': 868, 'loss/train': 1.8534786701202393} -09/20/2021 17:29:46 - INFO - __main__ - Step 13892: {'lr': 0.00019999716717827623, 'samples': 444544, 'steps': 868, 'loss/train': 6.130279064178467} -09/20/2021 17:29:47 - INFO - __main__ - Step 13893: {'lr': 0.00019999716717827623, 'samples': 444576, 'steps': 868, 'loss/train': 3.3568100929260254} -09/20/2021 17:29:48 - INFO - __main__ - Step 13894: {'lr': 0.00019999716717827623, 'samples': 444608, 'steps': 868, 'loss/train': 4.50846529006958} -09/20/2021 17:29:49 - INFO - __main__ - Step 13895: {'lr': 0.00019999716717827623, 'samples': 444640, 'steps': 868, 'loss/train': 3.529101848602295} -09/20/2021 17:29:49 - INFO - __main__ - Step 13896: {'lr': 0.00019999716717827623, 'samples': 444672, 'steps': 868, 'loss/train': 3.5341973304748535} -09/20/2021 17:29:50 - INFO - __main__ - Step 13897: {'lr': 0.00019999716717827623, 'samples': 444704, 'steps': 868, 'loss/train': 4.10011100769043} -09/20/2021 17:29:51 - INFO - __main__ - Step 13898: {'lr': 0.00019999716717827623, 'samples': 444736, 'steps': 868, 'loss/train': 4.472707748413086} -09/20/2021 17:29:52 - INFO - __main__ - Step 13899: {'lr': 0.00019999716717827623, 'samples': 444768, 'steps': 868, 'loss/train': 3.755411386489868} -09/20/2021 17:29:52 - INFO - __main__ - Step 13900: {'lr': 0.00019999716717827623, 'samples': 444800, 'steps': 868, 'loss/train': 6.544638156890869} -09/20/2021 17:29:53 - INFO - __main__ - Step 13901: {'lr': 0.00019999716717827623, 'samples': 444832, 'steps': 868, 'loss/train': 3.8193163871765137} -09/20/2021 17:29:54 - INFO - __main__ - Step 13902: {'lr': 0.00019999716717827623, 'samples': 444864, 'steps': 868, 'loss/train': 4.553319454193115} -09/20/2021 17:29:55 - INFO - __main__ - Step 13903: {'lr': 0.00019999716717827623, 'samples': 444896, 'steps': 868, 'loss/train': 3.971046209335327} -09/20/2021 17:29:55 - INFO - __main__ - Step 13904: {'lr': 0.00019999716717827623, 'samples': 444928, 'steps': 868, 'loss/train': 4.35441255569458} -09/20/2021 17:29:56 - INFO - __main__ - Step 13905: {'lr': 0.00019999711896113138, 'samples': 444960, 'steps': 869, 'loss/train': 3.728933811187744} -09/20/2021 17:29:57 - INFO - __main__ - Step 13906: {'lr': 0.00019999711896113138, 'samples': 444992, 'steps': 869, 'loss/train': 3.615971803665161} -09/20/2021 17:29:58 - INFO - __main__ - Step 13907: {'lr': 0.00019999711896113138, 'samples': 445024, 'steps': 869, 'loss/train': 3.6404266357421875} -09/20/2021 17:29:58 - INFO - __main__ - Step 13908: {'lr': 0.00019999711896113138, 'samples': 445056, 'steps': 869, 'loss/train': 5.513003826141357} -09/20/2021 17:29:59 - INFO - __main__ - Step 13909: {'lr': 0.00019999711896113138, 'samples': 445088, 'steps': 869, 'loss/train': 4.097228050231934} -09/20/2021 17:30:00 - INFO - __main__ - Step 13910: {'lr': 0.00019999711896113138, 'samples': 445120, 'steps': 869, 'loss/train': 3.8358418941497803} -09/20/2021 17:30:01 - INFO - __main__ - Step 13911: {'lr': 0.00019999711896113138, 'samples': 445152, 'steps': 869, 'loss/train': 4.440773963928223} -09/20/2021 17:30:01 - INFO - __main__ - Step 13912: {'lr': 0.00019999711896113138, 'samples': 445184, 'steps': 869, 'loss/train': 3.9075515270233154} -09/20/2021 17:30:02 - INFO - __main__ - Step 13913: {'lr': 0.00019999711896113138, 'samples': 445216, 'steps': 869, 'loss/train': 3.727651834487915} -09/20/2021 17:30:03 - INFO - __main__ - Step 13914: {'lr': 0.00019999711896113138, 'samples': 445248, 'steps': 869, 'loss/train': 3.8654024600982666} -09/20/2021 17:30:04 - INFO - __main__ - Step 13915: {'lr': 0.00019999711896113138, 'samples': 445280, 'steps': 869, 'loss/train': 4.128149032592773} -09/20/2021 17:30:04 - INFO - __main__ - Step 13916: {'lr': 0.00019999711896113138, 'samples': 445312, 'steps': 869, 'loss/train': 3.9022951126098633} -09/20/2021 17:30:05 - INFO - __main__ - Step 13917: {'lr': 0.00019999711896113138, 'samples': 445344, 'steps': 869, 'loss/train': 4.064466953277588} -09/20/2021 17:30:06 - INFO - __main__ - Step 13918: {'lr': 0.00019999711896113138, 'samples': 445376, 'steps': 869, 'loss/train': 3.996948719024658} -09/20/2021 17:30:07 - INFO - __main__ - Step 13919: {'lr': 0.00019999711896113138, 'samples': 445408, 'steps': 869, 'loss/train': 4.719066619873047} -09/20/2021 17:30:07 - INFO - __main__ - Step 13920: {'lr': 0.00019999711896113138, 'samples': 445440, 'steps': 869, 'loss/train': 4.247080326080322} -09/20/2021 17:30:10 - INFO - __main__ - Step 13921: {'lr': 0.00019999707033709866, 'samples': 445472, 'steps': 870, 'loss/train': 4.696272850036621} -09/20/2021 17:30:10 - INFO - __main__ - Step 13922: {'lr': 0.00019999707033709866, 'samples': 445504, 'steps': 870, 'loss/train': 4.257717132568359} -09/20/2021 17:30:11 - INFO - __main__ - Step 13923: {'lr': 0.00019999707033709866, 'samples': 445536, 'steps': 870, 'loss/train': 3.9894778728485107} -09/20/2021 17:30:12 - INFO - __main__ - Step 13924: {'lr': 0.00019999707033709866, 'samples': 445568, 'steps': 870, 'loss/train': 3.8493285179138184} -09/20/2021 17:30:13 - INFO - __main__ - Step 13925: {'lr': 0.00019999707033709866, 'samples': 445600, 'steps': 870, 'loss/train': 3.5980591773986816} -09/20/2021 17:30:13 - INFO - __main__ - Step 13926: {'lr': 0.00019999707033709866, 'samples': 445632, 'steps': 870, 'loss/train': 4.05117654800415} -09/20/2021 17:30:14 - INFO - __main__ - Step 13927: {'lr': 0.00019999707033709866, 'samples': 445664, 'steps': 870, 'loss/train': 3.2454895973205566} -09/20/2021 17:30:15 - INFO - __main__ - Step 13928: {'lr': 0.00019999707033709866, 'samples': 445696, 'steps': 870, 'loss/train': 3.173541307449341} -09/20/2021 17:30:16 - INFO - __main__ - Step 13929: {'lr': 0.00019999707033709866, 'samples': 445728, 'steps': 870, 'loss/train': 4.269453525543213} -09/20/2021 17:30:16 - INFO - __main__ - Step 13930: {'lr': 0.00019999707033709866, 'samples': 445760, 'steps': 870, 'loss/train': 4.357816696166992} -09/20/2021 17:30:17 - INFO - __main__ - Step 13931: {'lr': 0.00019999707033709866, 'samples': 445792, 'steps': 870, 'loss/train': 3.4449687004089355} -09/20/2021 17:30:18 - INFO - __main__ - Step 13932: {'lr': 0.00019999707033709866, 'samples': 445824, 'steps': 870, 'loss/train': 0.6181684136390686} -09/20/2021 17:30:19 - INFO - __main__ - Step 13933: {'lr': 0.00019999707033709866, 'samples': 445856, 'steps': 870, 'loss/train': 1.130661964416504} -09/20/2021 17:30:19 - INFO - __main__ - Step 13934: {'lr': 0.00019999707033709866, 'samples': 445888, 'steps': 870, 'loss/train': 1.4369257688522339} -09/20/2021 17:30:20 - INFO - __main__ - Step 13935: {'lr': 0.00019999707033709866, 'samples': 445920, 'steps': 870, 'loss/train': 3.71763014793396} -09/20/2021 17:30:21 - INFO - __main__ - Step 13936: {'lr': 0.00019999707033709866, 'samples': 445952, 'steps': 870, 'loss/train': 3.771160364151001} -09/20/2021 17:30:22 - INFO - __main__ - Step 13937: {'lr': 0.00019999702130617825, 'samples': 445984, 'steps': 871, 'loss/train': 3.950888156890869} -09/20/2021 17:30:22 - INFO - __main__ - Step 13938: {'lr': 0.00019999702130617825, 'samples': 446016, 'steps': 871, 'loss/train': 5.559480667114258} -09/20/2021 17:30:23 - INFO - __main__ - Step 13939: {'lr': 0.00019999702130617825, 'samples': 446048, 'steps': 871, 'loss/train': 4.601937294006348} -09/20/2021 17:30:24 - INFO - __main__ - Step 13940: {'lr': 0.00019999702130617825, 'samples': 446080, 'steps': 871, 'loss/train': 5.038701057434082} -09/20/2021 17:30:25 - INFO - __main__ - Step 13941: {'lr': 0.00019999702130617825, 'samples': 446112, 'steps': 871, 'loss/train': 3.9746835231781006} -09/20/2021 17:30:25 - INFO - __main__ - Step 13942: {'lr': 0.00019999702130617825, 'samples': 446144, 'steps': 871, 'loss/train': 3.663844347000122} -09/20/2021 17:30:26 - INFO - __main__ - Step 13943: {'lr': 0.00019999702130617825, 'samples': 446176, 'steps': 871, 'loss/train': 3.73061466217041} -09/20/2021 17:30:27 - INFO - __main__ - Step 13944: {'lr': 0.00019999702130617825, 'samples': 446208, 'steps': 871, 'loss/train': 4.461034297943115} -09/20/2021 17:30:28 - INFO - __main__ - Step 13945: {'lr': 0.00019999702130617825, 'samples': 446240, 'steps': 871, 'loss/train': 3.505847215652466} -09/20/2021 17:30:28 - INFO - __main__ - Step 13946: {'lr': 0.00019999702130617825, 'samples': 446272, 'steps': 871, 'loss/train': 4.245022296905518} -09/20/2021 17:30:29 - INFO - __main__ - Step 13947: {'lr': 0.00019999702130617825, 'samples': 446304, 'steps': 871, 'loss/train': 5.914699554443359} -09/20/2021 17:30:30 - INFO - __main__ - Step 13948: {'lr': 0.00019999702130617825, 'samples': 446336, 'steps': 871, 'loss/train': 6.118843078613281} -09/20/2021 17:30:31 - INFO - __main__ - Step 13949: {'lr': 0.00019999702130617825, 'samples': 446368, 'steps': 871, 'loss/train': 5.660003662109375} -09/20/2021 17:30:31 - INFO - __main__ - Step 13950: {'lr': 0.00019999702130617825, 'samples': 446400, 'steps': 871, 'loss/train': 3.324514150619507} -09/20/2021 17:30:32 - INFO - __main__ - Step 13951: {'lr': 0.00019999702130617825, 'samples': 446432, 'steps': 871, 'loss/train': 4.718526363372803} -09/20/2021 17:30:33 - INFO - __main__ - Step 13952: {'lr': 0.00019999702130617825, 'samples': 446464, 'steps': 871, 'loss/train': 3.972304582595825} -09/20/2021 17:30:34 - INFO - __main__ - Step 13953: {'lr': 0.00019999697186837034, 'samples': 446496, 'steps': 872, 'loss/train': 4.235689163208008} -09/20/2021 17:30:35 - INFO - __main__ - Step 13954: {'lr': 0.00019999697186837034, 'samples': 446528, 'steps': 872, 'loss/train': 5.19511604309082} -09/20/2021 17:30:36 - INFO - __main__ - Step 13955: {'lr': 0.00019999697186837034, 'samples': 446560, 'steps': 872, 'loss/train': 4.688419818878174} -09/20/2021 17:30:37 - INFO - __main__ - Step 13956: {'lr': 0.00019999697186837034, 'samples': 446592, 'steps': 872, 'loss/train': 4.511555194854736} -09/20/2021 17:30:37 - INFO - __main__ - Step 13957: {'lr': 0.00019999697186837034, 'samples': 446624, 'steps': 872, 'loss/train': 3.7327475547790527} -09/20/2021 17:30:38 - INFO - __main__ - Step 13958: {'lr': 0.00019999697186837034, 'samples': 446656, 'steps': 872, 'loss/train': 3.5491247177124023} -09/20/2021 17:30:39 - INFO - __main__ - Step 13959: {'lr': 0.00019999697186837034, 'samples': 446688, 'steps': 872, 'loss/train': 4.020685195922852} -09/20/2021 17:30:40 - INFO - __main__ - Step 13960: {'lr': 0.00019999697186837034, 'samples': 446720, 'steps': 872, 'loss/train': 4.334100723266602} -09/20/2021 17:30:40 - INFO - __main__ - Step 13961: {'lr': 0.00019999697186837034, 'samples': 446752, 'steps': 872, 'loss/train': 3.4550888538360596} -09/20/2021 17:30:41 - INFO - __main__ - Step 13962: {'lr': 0.00019999697186837034, 'samples': 446784, 'steps': 872, 'loss/train': 4.6349077224731445} -09/20/2021 17:30:42 - INFO - __main__ - Step 13963: {'lr': 0.00019999697186837034, 'samples': 446816, 'steps': 872, 'loss/train': 3.5416407585144043} -09/20/2021 17:30:43 - INFO - __main__ - Step 13964: {'lr': 0.00019999697186837034, 'samples': 446848, 'steps': 872, 'loss/train': 5.855147838592529} -09/20/2021 17:30:43 - INFO - __main__ - Step 13965: {'lr': 0.00019999697186837034, 'samples': 446880, 'steps': 872, 'loss/train': 3.99454927444458} -09/20/2021 17:30:44 - INFO - __main__ - Step 13966: {'lr': 0.00019999697186837034, 'samples': 446912, 'steps': 872, 'loss/train': 3.4947726726531982} -09/20/2021 17:30:45 - INFO - __main__ - Step 13967: {'lr': 0.00019999697186837034, 'samples': 446944, 'steps': 872, 'loss/train': 3.8320631980895996} -09/20/2021 17:30:46 - INFO - __main__ - Step 13968: {'lr': 0.00019999697186837034, 'samples': 446976, 'steps': 872, 'loss/train': 5.114284038543701} -09/20/2021 17:30:47 - INFO - __main__ - Step 13969: {'lr': 0.00019999692202367513, 'samples': 447008, 'steps': 873, 'loss/train': 2.52602219581604} -09/20/2021 17:30:47 - INFO - __main__ - Step 13970: {'lr': 0.00019999692202367513, 'samples': 447040, 'steps': 873, 'loss/train': 5.414944171905518} -09/20/2021 17:30:48 - INFO - __main__ - Step 13971: {'lr': 0.00019999692202367513, 'samples': 447072, 'steps': 873, 'loss/train': 3.332202672958374} -09/20/2021 17:30:49 - INFO - __main__ - Step 13972: {'lr': 0.00019999692202367513, 'samples': 447104, 'steps': 873, 'loss/train': 3.6202352046966553} -09/20/2021 17:30:50 - INFO - __main__ - Step 13973: {'lr': 0.00019999692202367513, 'samples': 447136, 'steps': 873, 'loss/train': 2.345533609390259} -09/20/2021 17:30:50 - INFO - __main__ - Step 13974: {'lr': 0.00019999692202367513, 'samples': 447168, 'steps': 873, 'loss/train': 5.3161845207214355} -09/20/2021 17:30:51 - INFO - __main__ - Step 13975: {'lr': 0.00019999692202367513, 'samples': 447200, 'steps': 873, 'loss/train': 4.287130355834961} -09/20/2021 17:30:52 - INFO - __main__ - Step 13976: {'lr': 0.00019999692202367513, 'samples': 447232, 'steps': 873, 'loss/train': 5.336607933044434} -09/20/2021 17:30:53 - INFO - __main__ - Step 13977: {'lr': 0.00019999692202367513, 'samples': 447264, 'steps': 873, 'loss/train': 4.202427387237549} -09/20/2021 17:30:53 - INFO - __main__ - Step 13978: {'lr': 0.00019999692202367513, 'samples': 447296, 'steps': 873, 'loss/train': 3.6999247074127197} -09/20/2021 17:30:54 - INFO - __main__ - Step 13979: {'lr': 0.00019999692202367513, 'samples': 447328, 'steps': 873, 'loss/train': 4.137558937072754} -09/20/2021 17:30:55 - INFO - __main__ - Step 13980: {'lr': 0.00019999692202367513, 'samples': 447360, 'steps': 873, 'loss/train': 4.015655517578125} -09/20/2021 17:30:56 - INFO - __main__ - Step 13981: {'lr': 0.00019999692202367513, 'samples': 447392, 'steps': 873, 'loss/train': 3.5347509384155273} -09/20/2021 17:30:56 - INFO - __main__ - Step 13982: {'lr': 0.00019999692202367513, 'samples': 447424, 'steps': 873, 'loss/train': 4.03071928024292} -09/20/2021 17:30:57 - INFO - __main__ - Step 13983: {'lr': 0.00019999692202367513, 'samples': 447456, 'steps': 873, 'loss/train': 3.6768579483032227} -09/20/2021 17:30:58 - INFO - __main__ - Step 13984: {'lr': 0.00019999692202367513, 'samples': 447488, 'steps': 873, 'loss/train': 3.954387664794922} -09/20/2021 17:30:59 - INFO - __main__ - Step 13985: {'lr': 0.00019999687177209286, 'samples': 447520, 'steps': 874, 'loss/train': 3.8230743408203125} -09/20/2021 17:31:00 - INFO - __main__ - Step 13986: {'lr': 0.00019999687177209286, 'samples': 447552, 'steps': 874, 'loss/train': 4.427877426147461} -09/20/2021 17:31:01 - INFO - __main__ - Step 13987: {'lr': 0.00019999687177209286, 'samples': 447584, 'steps': 874, 'loss/train': 4.971517562866211} -09/20/2021 17:31:01 - INFO - __main__ - Step 13988: {'lr': 0.00019999687177209286, 'samples': 447616, 'steps': 874, 'loss/train': 3.801034688949585} -09/20/2021 17:31:02 - INFO - __main__ - Step 13989: {'lr': 0.00019999687177209286, 'samples': 447648, 'steps': 874, 'loss/train': 5.430682182312012} -09/20/2021 17:31:03 - INFO - __main__ - Step 13990: {'lr': 0.00019999687177209286, 'samples': 447680, 'steps': 874, 'loss/train': 4.838325023651123} -09/20/2021 17:31:04 - INFO - __main__ - Step 13991: {'lr': 0.00019999687177209286, 'samples': 447712, 'steps': 874, 'loss/train': 3.9484968185424805} -09/20/2021 17:31:04 - INFO - __main__ - Step 13992: {'lr': 0.00019999687177209286, 'samples': 447744, 'steps': 874, 'loss/train': 4.143830299377441} -09/20/2021 17:31:05 - INFO - __main__ - Step 13993: {'lr': 0.00019999687177209286, 'samples': 447776, 'steps': 874, 'loss/train': 4.430648326873779} -09/20/2021 17:31:06 - INFO - __main__ - Step 13994: {'lr': 0.00019999687177209286, 'samples': 447808, 'steps': 874, 'loss/train': 4.72411584854126} -09/20/2021 17:31:07 - INFO - __main__ - Step 13995: {'lr': 0.00019999687177209286, 'samples': 447840, 'steps': 874, 'loss/train': 4.392622947692871} -09/20/2021 17:31:07 - INFO - __main__ - Step 13996: {'lr': 0.00019999687177209286, 'samples': 447872, 'steps': 874, 'loss/train': 1.8926362991333008} -09/20/2021 17:31:08 - INFO - __main__ - Step 13997: {'lr': 0.00019999687177209286, 'samples': 447904, 'steps': 874, 'loss/train': 3.5407016277313232} -09/20/2021 17:31:09 - INFO - __main__ - Step 13998: {'lr': 0.00019999687177209286, 'samples': 447936, 'steps': 874, 'loss/train': 3.4222166538238525} -09/20/2021 17:31:10 - INFO - __main__ - Step 13999: {'lr': 0.00019999687177209286, 'samples': 447968, 'steps': 874, 'loss/train': 1.5405601263046265} -09/20/2021 17:31:10 - INFO - __main__ - Step 14000: {'lr': 0.00019999687177209286, 'samples': 448000, 'steps': 874, 'loss/train': 3.837585210800171} -09/20/2021 17:31:11 - INFO - __main__ - Step 14001: {'lr': 0.00019999682111362368, 'samples': 448032, 'steps': 875, 'loss/train': 3.8508036136627197} -09/20/2021 17:31:12 - INFO - __main__ - Step 14002: {'lr': 0.00019999682111362368, 'samples': 448064, 'steps': 875, 'loss/train': 3.4083142280578613} -09/20/2021 17:31:13 - INFO - __main__ - Step 14003: {'lr': 0.00019999682111362368, 'samples': 448096, 'steps': 875, 'loss/train': 4.128019332885742} -09/20/2021 17:31:14 - INFO - __main__ - Step 14004: {'lr': 0.00019999682111362368, 'samples': 448128, 'steps': 875, 'loss/train': 3.2533445358276367} -09/20/2021 17:31:14 - INFO - __main__ - Step 14005: {'lr': 0.00019999682111362368, 'samples': 448160, 'steps': 875, 'loss/train': 2.954454183578491} -09/20/2021 17:31:15 - INFO - __main__ - Step 14006: {'lr': 0.00019999682111362368, 'samples': 448192, 'steps': 875, 'loss/train': 4.120911598205566} -09/20/2021 17:31:16 - INFO - __main__ - Step 14007: {'lr': 0.00019999682111362368, 'samples': 448224, 'steps': 875, 'loss/train': 3.7798585891723633} -09/20/2021 17:31:17 - INFO - __main__ - Step 14008: {'lr': 0.00019999682111362368, 'samples': 448256, 'steps': 875, 'loss/train': 5.053905963897705} -09/20/2021 17:31:17 - INFO - __main__ - Step 14009: {'lr': 0.00019999682111362368, 'samples': 448288, 'steps': 875, 'loss/train': 4.104362964630127} -09/20/2021 17:31:18 - INFO - __main__ - Step 14010: {'lr': 0.00019999682111362368, 'samples': 448320, 'steps': 875, 'loss/train': 1.448917269706726} -09/20/2021 17:31:19 - INFO - __main__ - Step 14011: {'lr': 0.00019999682111362368, 'samples': 448352, 'steps': 875, 'loss/train': 3.8150899410247803} -09/20/2021 17:31:20 - INFO - __main__ - Step 14012: {'lr': 0.00019999682111362368, 'samples': 448384, 'steps': 875, 'loss/train': 3.7268881797790527} -09/20/2021 17:31:20 - INFO - __main__ - Step 14013: {'lr': 0.00019999682111362368, 'samples': 448416, 'steps': 875, 'loss/train': 3.4080746173858643} -09/20/2021 17:31:21 - INFO - __main__ - Step 14014: {'lr': 0.00019999682111362368, 'samples': 448448, 'steps': 875, 'loss/train': 5.543246746063232} -09/20/2021 17:31:22 - INFO - __main__ - Step 14015: {'lr': 0.00019999682111362368, 'samples': 448480, 'steps': 875, 'loss/train': 3.312747001647949} -09/20/2021 17:31:23 - INFO - __main__ - Step 14016: {'lr': 0.00019999682111362368, 'samples': 448512, 'steps': 875, 'loss/train': 4.5658111572265625} -09/20/2021 17:31:24 - INFO - __main__ - Step 14017: {'lr': 0.00019999677004826783, 'samples': 448544, 'steps': 876, 'loss/train': 4.766980171203613} -09/20/2021 17:31:25 - INFO - __main__ - Step 14018: {'lr': 0.00019999677004826783, 'samples': 448576, 'steps': 876, 'loss/train': 2.672924518585205} -09/20/2021 17:31:25 - INFO - __main__ - Step 14019: {'lr': 0.00019999677004826783, 'samples': 448608, 'steps': 876, 'loss/train': 4.094448566436768} -09/20/2021 17:31:26 - INFO - __main__ - Step 14020: {'lr': 0.00019999677004826783, 'samples': 448640, 'steps': 876, 'loss/train': 3.674529790878296} -09/20/2021 17:31:27 - INFO - __main__ - Step 14021: {'lr': 0.00019999677004826783, 'samples': 448672, 'steps': 876, 'loss/train': 4.119448184967041} -09/20/2021 17:31:28 - INFO - __main__ - Step 14022: {'lr': 0.00019999677004826783, 'samples': 448704, 'steps': 876, 'loss/train': 5.505594253540039} -09/20/2021 17:31:28 - INFO - __main__ - Step 14023: {'lr': 0.00019999677004826783, 'samples': 448736, 'steps': 876, 'loss/train': 3.779296398162842} -09/20/2021 17:31:29 - INFO - __main__ - Step 14024: {'lr': 0.00019999677004826783, 'samples': 448768, 'steps': 876, 'loss/train': 4.239679336547852} -09/20/2021 17:31:30 - INFO - __main__ - Step 14025: {'lr': 0.00019999677004826783, 'samples': 448800, 'steps': 876, 'loss/train': 3.498231887817383} -09/20/2021 17:31:31 - INFO - __main__ - Step 14026: {'lr': 0.00019999677004826783, 'samples': 448832, 'steps': 876, 'loss/train': 4.310726165771484} -09/20/2021 17:31:31 - INFO - __main__ - Step 14027: {'lr': 0.00019999677004826783, 'samples': 448864, 'steps': 876, 'loss/train': 4.801558971405029} -09/20/2021 17:31:32 - INFO - __main__ - Step 14028: {'lr': 0.00019999677004826783, 'samples': 448896, 'steps': 876, 'loss/train': 4.297584533691406} -09/20/2021 17:31:33 - INFO - __main__ - Step 14029: {'lr': 0.00019999677004826783, 'samples': 448928, 'steps': 876, 'loss/train': 4.3858561515808105} -09/20/2021 17:31:34 - INFO - __main__ - Step 14030: {'lr': 0.00019999677004826783, 'samples': 448960, 'steps': 876, 'loss/train': 3.776930332183838} -09/20/2021 17:31:34 - INFO - __main__ - Step 14031: {'lr': 0.00019999677004826783, 'samples': 448992, 'steps': 876, 'loss/train': 4.715627193450928} -09/20/2021 17:31:35 - INFO - __main__ - Step 14032: {'lr': 0.00019999677004826783, 'samples': 449024, 'steps': 876, 'loss/train': 3.3701608180999756} -09/20/2021 17:31:36 - INFO - __main__ - Step 14033: {'lr': 0.0001999967185760255, 'samples': 449056, 'steps': 877, 'loss/train': 4.737759590148926} -09/20/2021 17:31:37 - INFO - __main__ - Step 14034: {'lr': 0.0001999967185760255, 'samples': 449088, 'steps': 877, 'loss/train': 3.3763980865478516} -09/20/2021 17:31:38 - INFO - __main__ - Step 14035: {'lr': 0.0001999967185760255, 'samples': 449120, 'steps': 877, 'loss/train': 3.9879543781280518} -09/20/2021 17:31:38 - INFO - __main__ - Step 14036: {'lr': 0.0001999967185760255, 'samples': 449152, 'steps': 877, 'loss/train': 4.509870529174805} -09/20/2021 17:31:39 - INFO - __main__ - Step 14037: {'lr': 0.0001999967185760255, 'samples': 449184, 'steps': 877, 'loss/train': 4.226057052612305} -09/20/2021 17:31:40 - INFO - __main__ - Step 14038: {'lr': 0.0001999967185760255, 'samples': 449216, 'steps': 877, 'loss/train': 3.3488259315490723} -09/20/2021 17:31:41 - INFO - __main__ - Step 14039: {'lr': 0.0001999967185760255, 'samples': 449248, 'steps': 877, 'loss/train': 3.9901316165924072} -09/20/2021 17:31:41 - INFO - __main__ - Step 14040: {'lr': 0.0001999967185760255, 'samples': 449280, 'steps': 877, 'loss/train': 3.2054426670074463} -09/20/2021 17:31:42 - INFO - __main__ - Step 14041: {'lr': 0.0001999967185760255, 'samples': 449312, 'steps': 877, 'loss/train': 3.906161069869995} -09/20/2021 17:31:43 - INFO - __main__ - Step 14042: {'lr': 0.0001999967185760255, 'samples': 449344, 'steps': 877, 'loss/train': 3.874833822250366} -09/20/2021 17:31:44 - INFO - __main__ - Step 14043: {'lr': 0.0001999967185760255, 'samples': 449376, 'steps': 877, 'loss/train': 4.149228096008301} -09/20/2021 17:31:44 - INFO - __main__ - Step 14044: {'lr': 0.0001999967185760255, 'samples': 449408, 'steps': 877, 'loss/train': 3.7326226234436035} -09/20/2021 17:31:46 - INFO - __main__ - Step 14045: {'lr': 0.0001999967185760255, 'samples': 449440, 'steps': 877, 'loss/train': 3.662419557571411} -09/20/2021 17:31:47 - INFO - __main__ - Step 14046: {'lr': 0.0001999967185760255, 'samples': 449472, 'steps': 877, 'loss/train': 4.316903591156006} -09/20/2021 17:31:47 - INFO - __main__ - Step 14047: {'lr': 0.0001999967185760255, 'samples': 449504, 'steps': 877, 'loss/train': 4.439770221710205} -09/20/2021 17:31:48 - INFO - __main__ - Step 14048: {'lr': 0.0001999967185760255, 'samples': 449536, 'steps': 877, 'loss/train': 3.311342477798462} -09/20/2021 17:31:49 - INFO - __main__ - Step 14049: {'lr': 0.0001999966666968969, 'samples': 449568, 'steps': 878, 'loss/train': 4.603912830352783} -09/20/2021 17:31:50 - INFO - __main__ - Step 14050: {'lr': 0.0001999966666968969, 'samples': 449600, 'steps': 878, 'loss/train': 3.5469553470611572} -09/20/2021 17:31:50 - INFO - __main__ - Step 14051: {'lr': 0.0001999966666968969, 'samples': 449632, 'steps': 878, 'loss/train': 3.9709689617156982} -09/20/2021 17:31:51 - INFO - __main__ - Step 14052: {'lr': 0.0001999966666968969, 'samples': 449664, 'steps': 878, 'loss/train': 2.8770227432250977} -09/20/2021 17:31:52 - INFO - __main__ - Step 14053: {'lr': 0.0001999966666968969, 'samples': 449696, 'steps': 878, 'loss/train': 3.191934585571289} -09/20/2021 17:31:53 - INFO - __main__ - Step 14054: {'lr': 0.0001999966666968969, 'samples': 449728, 'steps': 878, 'loss/train': 4.361191272735596} -09/20/2021 17:31:53 - INFO - __main__ - Step 14055: {'lr': 0.0001999966666968969, 'samples': 449760, 'steps': 878, 'loss/train': 1.4261066913604736} -09/20/2021 17:31:54 - INFO - __main__ - Step 14056: {'lr': 0.0001999966666968969, 'samples': 449792, 'steps': 878, 'loss/train': 1.213817834854126} -09/20/2021 17:31:55 - INFO - __main__ - Step 14057: {'lr': 0.0001999966666968969, 'samples': 449824, 'steps': 878, 'loss/train': 0.7995688915252686} -09/20/2021 17:31:56 - INFO - __main__ - Step 14058: {'lr': 0.0001999966666968969, 'samples': 449856, 'steps': 878, 'loss/train': 1.251267910003662} -09/20/2021 17:31:56 - INFO - __main__ - Step 14059: {'lr': 0.0001999966666968969, 'samples': 449888, 'steps': 878, 'loss/train': 1.5758367776870728} -09/20/2021 17:31:57 - INFO - __main__ - Step 14060: {'lr': 0.0001999966666968969, 'samples': 449920, 'steps': 878, 'loss/train': 4.217048168182373} -09/20/2021 17:31:58 - INFO - __main__ - Step 14061: {'lr': 0.0001999966666968969, 'samples': 449952, 'steps': 878, 'loss/train': 3.1808552742004395} -09/20/2021 17:31:59 - INFO - __main__ - Step 14062: {'lr': 0.0001999966666968969, 'samples': 449984, 'steps': 878, 'loss/train': 4.445603847503662} -09/20/2021 17:31:59 - INFO - __main__ - Step 14063: {'lr': 0.0001999966666968969, 'samples': 450016, 'steps': 878, 'loss/train': 4.979335308074951} -09/20/2021 17:32:00 - INFO - __main__ - Step 14064: {'lr': 0.0001999966666968969, 'samples': 450048, 'steps': 878, 'loss/train': 5.031728744506836} -09/20/2021 17:32:01 - INFO - __main__ - Step 14065: {'lr': 0.00019999661441088228, 'samples': 450080, 'steps': 879, 'loss/train': 4.540170669555664} -09/20/2021 17:32:02 - INFO - __main__ - Step 14066: {'lr': 0.00019999661441088228, 'samples': 450112, 'steps': 879, 'loss/train': 5.239747524261475} -09/20/2021 17:32:03 - INFO - __main__ - Step 14067: {'lr': 0.00019999661441088228, 'samples': 450144, 'steps': 879, 'loss/train': 2.9676992893218994} -09/20/2021 17:32:03 - INFO - __main__ - Step 14068: {'lr': 0.00019999661441088228, 'samples': 450176, 'steps': 879, 'loss/train': 4.819594383239746} -09/20/2021 17:32:04 - INFO - __main__ - Step 14069: {'lr': 0.00019999661441088228, 'samples': 450208, 'steps': 879, 'loss/train': 4.19253396987915} -09/20/2021 17:32:05 - INFO - __main__ - Step 14070: {'lr': 0.00019999661441088228, 'samples': 450240, 'steps': 879, 'loss/train': 3.286149263381958} -09/20/2021 17:32:06 - INFO - __main__ - Step 14071: {'lr': 0.00019999661441088228, 'samples': 450272, 'steps': 879, 'loss/train': 4.9216132164001465} -09/20/2021 17:32:06 - INFO - __main__ - Step 14072: {'lr': 0.00019999661441088228, 'samples': 450304, 'steps': 879, 'loss/train': 1.5550153255462646} -09/20/2021 17:32:07 - INFO - __main__ - Step 14073: {'lr': 0.00019999661441088228, 'samples': 450336, 'steps': 879, 'loss/train': 3.2373788356781006} -09/20/2021 17:32:08 - INFO - __main__ - Step 14074: {'lr': 0.00019999661441088228, 'samples': 450368, 'steps': 879, 'loss/train': 3.916128635406494} -09/20/2021 17:32:09 - INFO - __main__ - Step 14075: {'lr': 0.00019999661441088228, 'samples': 450400, 'steps': 879, 'loss/train': 4.04241418838501} -09/20/2021 17:32:10 - INFO - __main__ - Step 14076: {'lr': 0.00019999661441088228, 'samples': 450432, 'steps': 879, 'loss/train': 4.544898986816406} -09/20/2021 17:32:11 - INFO - __main__ - Step 14077: {'lr': 0.00019999661441088228, 'samples': 450464, 'steps': 879, 'loss/train': 3.6476449966430664} -09/20/2021 17:32:11 - INFO - __main__ - Step 14078: {'lr': 0.00019999661441088228, 'samples': 450496, 'steps': 879, 'loss/train': 4.430802345275879} -09/20/2021 17:32:12 - INFO - __main__ - Step 14079: {'lr': 0.00019999661441088228, 'samples': 450528, 'steps': 879, 'loss/train': 4.79084587097168} -09/20/2021 17:32:13 - INFO - __main__ - Step 14080: {'lr': 0.00019999661441088228, 'samples': 450560, 'steps': 879, 'loss/train': 4.001932144165039} -09/20/2021 17:32:14 - INFO - __main__ - Step 14081: {'lr': 0.00019999656171798184, 'samples': 450592, 'steps': 880, 'loss/train': 3.742588520050049} -09/20/2021 17:32:14 - INFO - __main__ - Step 14082: {'lr': 0.00019999656171798184, 'samples': 450624, 'steps': 880, 'loss/train': 4.127896785736084} -09/20/2021 17:32:15 - INFO - __main__ - Step 14083: {'lr': 0.00019999656171798184, 'samples': 450656, 'steps': 880, 'loss/train': 3.638359308242798} -09/20/2021 17:32:16 - INFO - __main__ - Step 14084: {'lr': 0.00019999656171798184, 'samples': 450688, 'steps': 880, 'loss/train': 3.653564929962158} -09/20/2021 17:32:17 - INFO - __main__ - Step 14085: {'lr': 0.00019999656171798184, 'samples': 450720, 'steps': 880, 'loss/train': 4.943887710571289} -09/20/2021 17:32:17 - INFO - __main__ - Step 14086: {'lr': 0.00019999656171798184, 'samples': 450752, 'steps': 880, 'loss/train': 1.8787117004394531} -09/20/2021 17:32:18 - INFO - __main__ - Step 14087: {'lr': 0.00019999656171798184, 'samples': 450784, 'steps': 880, 'loss/train': 3.905472755432129} -09/20/2021 17:32:19 - INFO - __main__ - Step 14088: {'lr': 0.00019999656171798184, 'samples': 450816, 'steps': 880, 'loss/train': 3.7116341590881348} -09/20/2021 17:32:20 - INFO - __main__ - Step 14089: {'lr': 0.00019999656171798184, 'samples': 450848, 'steps': 880, 'loss/train': 3.2597789764404297} -09/20/2021 17:32:20 - INFO - __main__ - Step 14090: {'lr': 0.00019999656171798184, 'samples': 450880, 'steps': 880, 'loss/train': 3.7935516834259033} -09/20/2021 17:32:21 - INFO - __main__ - Step 14091: {'lr': 0.00019999656171798184, 'samples': 450912, 'steps': 880, 'loss/train': 4.121829986572266} -09/20/2021 17:32:22 - INFO - __main__ - Step 14092: {'lr': 0.00019999656171798184, 'samples': 450944, 'steps': 880, 'loss/train': 2.400770902633667} -09/20/2021 17:32:23 - INFO - __main__ - Step 14093: {'lr': 0.00019999656171798184, 'samples': 450976, 'steps': 880, 'loss/train': 2.049635648727417} -09/20/2021 17:32:23 - INFO - __main__ - Step 14094: {'lr': 0.00019999656171798184, 'samples': 451008, 'steps': 880, 'loss/train': 3.8026797771453857} -09/20/2021 17:32:24 - INFO - __main__ - Step 14095: {'lr': 0.00019999656171798184, 'samples': 451040, 'steps': 880, 'loss/train': 4.585050582885742} -09/20/2021 17:32:25 - INFO - __main__ - Step 14096: {'lr': 0.00019999656171798184, 'samples': 451072, 'steps': 880, 'loss/train': 3.5821213722229004} -09/20/2021 17:32:26 - INFO - __main__ - Step 14097: {'lr': 0.00019999650861819577, 'samples': 451104, 'steps': 881, 'loss/train': 2.9964845180511475} -09/20/2021 17:32:27 - INFO - __main__ - Step 14098: {'lr': 0.00019999650861819577, 'samples': 451136, 'steps': 881, 'loss/train': 5.187802314758301} -09/20/2021 17:32:27 - INFO - __main__ - Step 14099: {'lr': 0.00019999650861819577, 'samples': 451168, 'steps': 881, 'loss/train': 3.5530927181243896} -09/20/2021 17:32:28 - INFO - __main__ - Step 14100: {'lr': 0.00019999650861819577, 'samples': 451200, 'steps': 881, 'loss/train': 4.433169364929199} -09/20/2021 17:32:29 - INFO - __main__ - Step 14101: {'lr': 0.00019999650861819577, 'samples': 451232, 'steps': 881, 'loss/train': 3.4618113040924072} -09/20/2021 17:32:30 - INFO - __main__ - Step 14102: {'lr': 0.00019999650861819577, 'samples': 451264, 'steps': 881, 'loss/train': 3.6814966201782227} -09/20/2021 17:32:30 - INFO - __main__ - Step 14103: {'lr': 0.00019999650861819577, 'samples': 451296, 'steps': 881, 'loss/train': 3.4064009189605713} -09/20/2021 17:32:31 - INFO - __main__ - Step 14104: {'lr': 0.00019999650861819577, 'samples': 451328, 'steps': 881, 'loss/train': 3.5539536476135254} -09/20/2021 17:32:32 - INFO - __main__ - Step 14105: {'lr': 0.00019999650861819577, 'samples': 451360, 'steps': 881, 'loss/train': 4.3858442306518555} -09/20/2021 17:32:33 - INFO - __main__ - Step 14106: {'lr': 0.00019999650861819577, 'samples': 451392, 'steps': 881, 'loss/train': 3.6190614700317383} -09/20/2021 17:32:34 - INFO - __main__ - Step 14107: {'lr': 0.00019999650861819577, 'samples': 451424, 'steps': 881, 'loss/train': 4.012559413909912} -09/20/2021 17:32:35 - INFO - __main__ - Step 14108: {'lr': 0.00019999650861819577, 'samples': 451456, 'steps': 881, 'loss/train': 4.657374858856201} -09/20/2021 17:32:35 - INFO - __main__ - Step 14109: {'lr': 0.00019999650861819577, 'samples': 451488, 'steps': 881, 'loss/train': 4.701349258422852} -09/20/2021 17:32:36 - INFO - __main__ - Step 14110: {'lr': 0.00019999650861819577, 'samples': 451520, 'steps': 881, 'loss/train': 4.745386600494385} -09/20/2021 17:32:37 - INFO - __main__ - Step 14111: {'lr': 0.00019999650861819577, 'samples': 451552, 'steps': 881, 'loss/train': 3.3629915714263916} -09/20/2021 17:32:38 - INFO - __main__ - Step 14112: {'lr': 0.00019999650861819577, 'samples': 451584, 'steps': 881, 'loss/train': 3.517869710922241} -09/20/2021 17:32:39 - INFO - __main__ - Step 14113: {'lr': 0.00019999645511152426, 'samples': 451616, 'steps': 882, 'loss/train': 4.416726589202881} -09/20/2021 17:32:39 - INFO - __main__ - Step 14114: {'lr': 0.00019999645511152426, 'samples': 451648, 'steps': 882, 'loss/train': 4.508228302001953} -09/20/2021 17:32:40 - INFO - __main__ - Step 14115: {'lr': 0.00019999645511152426, 'samples': 451680, 'steps': 882, 'loss/train': 3.4421842098236084} -09/20/2021 17:32:41 - INFO - __main__ - Step 14116: {'lr': 0.00019999645511152426, 'samples': 451712, 'steps': 882, 'loss/train': 4.464772701263428} -09/20/2021 17:32:42 - INFO - __main__ - Step 14117: {'lr': 0.00019999645511152426, 'samples': 451744, 'steps': 882, 'loss/train': 4.3133087158203125} -09/20/2021 17:32:42 - INFO - __main__ - Step 14118: {'lr': 0.00019999645511152426, 'samples': 451776, 'steps': 882, 'loss/train': 3.5504417419433594} -09/20/2021 17:32:43 - INFO - __main__ - Step 14119: {'lr': 0.00019999645511152426, 'samples': 451808, 'steps': 882, 'loss/train': 3.8331329822540283} -09/20/2021 17:32:44 - INFO - __main__ - Step 14120: {'lr': 0.00019999645511152426, 'samples': 451840, 'steps': 882, 'loss/train': 4.105401515960693} -09/20/2021 17:32:45 - INFO - __main__ - Step 14121: {'lr': 0.00019999645511152426, 'samples': 451872, 'steps': 882, 'loss/train': 3.267214775085449} -09/20/2021 17:32:45 - INFO - __main__ - Step 14122: {'lr': 0.00019999645511152426, 'samples': 451904, 'steps': 882, 'loss/train': 4.163766860961914} -09/20/2021 17:32:46 - INFO - __main__ - Step 14123: {'lr': 0.00019999645511152426, 'samples': 451936, 'steps': 882, 'loss/train': 4.196110248565674} -09/20/2021 17:32:47 - INFO - __main__ - Step 14124: {'lr': 0.00019999645511152426, 'samples': 451968, 'steps': 882, 'loss/train': 4.402645587921143} -09/20/2021 17:32:48 - INFO - __main__ - Step 14125: {'lr': 0.00019999645511152426, 'samples': 452000, 'steps': 882, 'loss/train': 4.0338454246521} -09/20/2021 17:32:48 - INFO - __main__ - Step 14126: {'lr': 0.00019999645511152426, 'samples': 452032, 'steps': 882, 'loss/train': 4.100314140319824} -09/20/2021 17:32:49 - INFO - __main__ - Step 14127: {'lr': 0.00019999645511152426, 'samples': 452064, 'steps': 882, 'loss/train': 3.4314444065093994} -09/20/2021 17:32:50 - INFO - __main__ - Step 14128: {'lr': 0.00019999645511152426, 'samples': 452096, 'steps': 882, 'loss/train': 4.716648578643799} -09/20/2021 17:32:51 - INFO - __main__ - Step 14129: {'lr': 0.0001999964011979676, 'samples': 452128, 'steps': 883, 'loss/train': 3.6391236782073975} -09/20/2021 17:32:51 - INFO - __main__ - Step 14130: {'lr': 0.0001999964011979676, 'samples': 452160, 'steps': 883, 'loss/train': 3.0869340896606445} -09/20/2021 17:32:52 - INFO - __main__ - Step 14131: {'lr': 0.0001999964011979676, 'samples': 452192, 'steps': 883, 'loss/train': 3.994335412979126} -09/20/2021 17:32:53 - INFO - __main__ - Step 14132: {'lr': 0.0001999964011979676, 'samples': 452224, 'steps': 883, 'loss/train': 3.5463955402374268} -09/20/2021 17:32:54 - INFO - __main__ - Step 14133: {'lr': 0.0001999964011979676, 'samples': 452256, 'steps': 883, 'loss/train': 3.624479293823242} -09/20/2021 17:32:54 - INFO - __main__ - Step 14134: {'lr': 0.0001999964011979676, 'samples': 452288, 'steps': 883, 'loss/train': 3.4052021503448486} -09/20/2021 17:32:55 - INFO - __main__ - Step 14135: {'lr': 0.0001999964011979676, 'samples': 452320, 'steps': 883, 'loss/train': 4.418642044067383} -09/20/2021 17:32:56 - INFO - __main__ - Step 14136: {'lr': 0.0001999964011979676, 'samples': 452352, 'steps': 883, 'loss/train': 3.983520984649658} -09/20/2021 17:32:57 - INFO - __main__ - Step 14137: {'lr': 0.0001999964011979676, 'samples': 452384, 'steps': 883, 'loss/train': 3.4285597801208496} -09/20/2021 17:32:58 - INFO - __main__ - Step 14138: {'lr': 0.0001999964011979676, 'samples': 452416, 'steps': 883, 'loss/train': 0.9984701871871948} -09/20/2021 17:32:59 - INFO - __main__ - Step 14139: {'lr': 0.0001999964011979676, 'samples': 452448, 'steps': 883, 'loss/train': 1.1089884042739868} -09/20/2021 17:33:00 - INFO - __main__ - Step 14140: {'lr': 0.0001999964011979676, 'samples': 452480, 'steps': 883, 'loss/train': 3.5043396949768066} -09/20/2021 17:33:00 - INFO - __main__ - Step 14141: {'lr': 0.0001999964011979676, 'samples': 452512, 'steps': 883, 'loss/train': 3.586062431335449} -09/20/2021 17:33:01 - INFO - __main__ - Step 14142: {'lr': 0.0001999964011979676, 'samples': 452544, 'steps': 883, 'loss/train': 4.441938877105713} -09/20/2021 17:33:02 - INFO - __main__ - Step 14143: {'lr': 0.0001999964011979676, 'samples': 452576, 'steps': 883, 'loss/train': 3.1825528144836426} -09/20/2021 17:33:03 - INFO - __main__ - Step 14144: {'lr': 0.0001999964011979676, 'samples': 452608, 'steps': 883, 'loss/train': 4.4416327476501465} -09/20/2021 17:33:04 - INFO - __main__ - Step 14145: {'lr': 0.00019999634687752594, 'samples': 452640, 'steps': 884, 'loss/train': 3.5386877059936523} -09/20/2021 17:33:04 - INFO - __main__ - Step 14146: {'lr': 0.00019999634687752594, 'samples': 452672, 'steps': 884, 'loss/train': 2.912402391433716} -09/20/2021 17:33:05 - INFO - __main__ - Step 14147: {'lr': 0.00019999634687752594, 'samples': 452704, 'steps': 884, 'loss/train': 5.059581279754639} -09/20/2021 17:33:06 - INFO - __main__ - Step 14148: {'lr': 0.00019999634687752594, 'samples': 452736, 'steps': 884, 'loss/train': 3.448667049407959} -09/20/2021 17:33:07 - INFO - __main__ - Step 14149: {'lr': 0.00019999634687752594, 'samples': 452768, 'steps': 884, 'loss/train': 3.137357473373413} -09/20/2021 17:33:07 - INFO - __main__ - Step 14150: {'lr': 0.00019999634687752594, 'samples': 452800, 'steps': 884, 'loss/train': 4.08616304397583} -09/20/2021 17:33:08 - INFO - __main__ - Step 14151: {'lr': 0.00019999634687752594, 'samples': 452832, 'steps': 884, 'loss/train': 4.638679027557373} -09/20/2021 17:33:09 - INFO - __main__ - Step 14152: {'lr': 0.00019999634687752594, 'samples': 452864, 'steps': 884, 'loss/train': 4.66417121887207} -09/20/2021 17:33:10 - INFO - __main__ - Step 14153: {'lr': 0.00019999634687752594, 'samples': 452896, 'steps': 884, 'loss/train': 4.222921371459961} -09/20/2021 17:33:10 - INFO - __main__ - Step 14154: {'lr': 0.00019999634687752594, 'samples': 452928, 'steps': 884, 'loss/train': 3.700685977935791} -09/20/2021 17:33:11 - INFO - __main__ - Step 14155: {'lr': 0.00019999634687752594, 'samples': 452960, 'steps': 884, 'loss/train': 3.6142327785491943} -09/20/2021 17:33:12 - INFO - __main__ - Step 14156: {'lr': 0.00019999634687752594, 'samples': 452992, 'steps': 884, 'loss/train': 4.609636306762695} -09/20/2021 17:33:13 - INFO - __main__ - Step 14157: {'lr': 0.00019999634687752594, 'samples': 453024, 'steps': 884, 'loss/train': 4.083582401275635} -09/20/2021 17:33:13 - INFO - __main__ - Step 14158: {'lr': 0.00019999634687752594, 'samples': 453056, 'steps': 884, 'loss/train': 1.0340317487716675} -09/20/2021 17:33:14 - INFO - __main__ - Step 14159: {'lr': 0.00019999634687752594, 'samples': 453088, 'steps': 884, 'loss/train': 0.9586219191551208} -09/20/2021 17:33:15 - INFO - __main__ - Step 14160: {'lr': 0.00019999634687752594, 'samples': 453120, 'steps': 884, 'loss/train': 4.287863731384277} -09/20/2021 17:33:16 - INFO - __main__ - Step 14161: {'lr': 0.00019999629215019957, 'samples': 453152, 'steps': 885, 'loss/train': 5.669816017150879} -09/20/2021 17:33:17 - INFO - __main__ - Step 14162: {'lr': 0.00019999629215019957, 'samples': 453184, 'steps': 885, 'loss/train': 3.9796886444091797} -09/20/2021 17:33:17 - INFO - __main__ - Step 14163: {'lr': 0.00019999629215019957, 'samples': 453216, 'steps': 885, 'loss/train': 3.4385359287261963} -09/20/2021 17:33:18 - INFO - __main__ - Step 14164: {'lr': 0.00019999629215019957, 'samples': 453248, 'steps': 885, 'loss/train': 4.997025966644287} -09/20/2021 17:33:19 - INFO - __main__ - Step 14165: {'lr': 0.00019999629215019957, 'samples': 453280, 'steps': 885, 'loss/train': 4.575601100921631} -09/20/2021 17:33:20 - INFO - __main__ - Step 14166: {'lr': 0.00019999629215019957, 'samples': 453312, 'steps': 885, 'loss/train': 3.073178291320801} -09/20/2021 17:33:20 - INFO - __main__ - Step 14167: {'lr': 0.00019999629215019957, 'samples': 453344, 'steps': 885, 'loss/train': 4.165116786956787} -09/20/2021 17:33:21 - INFO - __main__ - Step 14168: {'lr': 0.00019999629215019957, 'samples': 453376, 'steps': 885, 'loss/train': 0.976802408695221} -09/20/2021 17:33:22 - INFO - __main__ - Step 14169: {'lr': 0.00019999629215019957, 'samples': 453408, 'steps': 885, 'loss/train': 1.908077359199524} -09/20/2021 17:33:23 - INFO - __main__ - Step 14170: {'lr': 0.00019999629215019957, 'samples': 453440, 'steps': 885, 'loss/train': 2.2058603763580322} -09/20/2021 17:33:24 - INFO - __main__ - Step 14171: {'lr': 0.00019999629215019957, 'samples': 453472, 'steps': 885, 'loss/train': 1.003435492515564} -09/20/2021 17:33:25 - INFO - __main__ - Step 14172: {'lr': 0.00019999629215019957, 'samples': 453504, 'steps': 885, 'loss/train': 4.343263149261475} -09/20/2021 17:33:25 - INFO - __main__ - Step 14173: {'lr': 0.00019999629215019957, 'samples': 453536, 'steps': 885, 'loss/train': 3.8132870197296143} -09/20/2021 17:33:26 - INFO - __main__ - Step 14174: {'lr': 0.00019999629215019957, 'samples': 453568, 'steps': 885, 'loss/train': 3.6254501342773438} -09/20/2021 17:33:27 - INFO - __main__ - Step 14175: {'lr': 0.00019999629215019957, 'samples': 453600, 'steps': 885, 'loss/train': 0.3301474153995514} -09/20/2021 17:33:28 - INFO - __main__ - Step 14176: {'lr': 0.00019999629215019957, 'samples': 453632, 'steps': 885, 'loss/train': 3.7329580783843994} -09/20/2021 17:33:28 - INFO - __main__ - Step 14177: {'lr': 0.00019999623701598865, 'samples': 453664, 'steps': 886, 'loss/train': 3.3061294555664062} -09/20/2021 17:33:29 - INFO - __main__ - Step 14178: {'lr': 0.00019999623701598865, 'samples': 453696, 'steps': 886, 'loss/train': 4.684664249420166} -09/20/2021 17:33:30 - INFO - __main__ - Step 14179: {'lr': 0.00019999623701598865, 'samples': 453728, 'steps': 886, 'loss/train': 3.4723668098449707} -09/20/2021 17:33:31 - INFO - __main__ - Step 14180: {'lr': 0.00019999623701598865, 'samples': 453760, 'steps': 886, 'loss/train': 4.138331890106201} -09/20/2021 17:33:31 - INFO - __main__ - Step 14181: {'lr': 0.00019999623701598865, 'samples': 453792, 'steps': 886, 'loss/train': 4.663036823272705} -09/20/2021 17:33:32 - INFO - __main__ - Step 14182: {'lr': 0.00019999623701598865, 'samples': 453824, 'steps': 886, 'loss/train': 4.363883972167969} -09/20/2021 17:33:33 - INFO - __main__ - Step 14183: {'lr': 0.00019999623701598865, 'samples': 453856, 'steps': 886, 'loss/train': 3.0882833003997803} -09/20/2021 17:33:34 - INFO - __main__ - Step 14184: {'lr': 0.00019999623701598865, 'samples': 453888, 'steps': 886, 'loss/train': 2.735745906829834} -09/20/2021 17:33:34 - INFO - __main__ - Step 14185: {'lr': 0.00019999623701598865, 'samples': 453920, 'steps': 886, 'loss/train': 3.795417070388794} -09/20/2021 17:33:35 - INFO - __main__ - Step 14186: {'lr': 0.00019999623701598865, 'samples': 453952, 'steps': 886, 'loss/train': 3.6938109397888184} -09/20/2021 17:33:36 - INFO - __main__ - Step 14187: {'lr': 0.00019999623701598865, 'samples': 453984, 'steps': 886, 'loss/train': 3.634232997894287} -09/20/2021 17:33:37 - INFO - __main__ - Step 14188: {'lr': 0.00019999623701598865, 'samples': 454016, 'steps': 886, 'loss/train': 2.2217016220092773} -09/20/2021 17:33:37 - INFO - __main__ - Step 14189: {'lr': 0.00019999623701598865, 'samples': 454048, 'steps': 886, 'loss/train': 2.1840391159057617} -09/20/2021 17:33:38 - INFO - __main__ - Step 14190: {'lr': 0.00019999623701598865, 'samples': 454080, 'steps': 886, 'loss/train': 2.1895272731781006} -09/20/2021 17:33:39 - INFO - __main__ - Step 14191: {'lr': 0.00019999623701598865, 'samples': 454112, 'steps': 886, 'loss/train': 3.5727524757385254} -09/20/2021 17:33:40 - INFO - __main__ - Step 14192: {'lr': 0.00019999623701598865, 'samples': 454144, 'steps': 886, 'loss/train': 3.9480364322662354} -09/20/2021 17:33:41 - INFO - __main__ - Step 14193: {'lr': 0.0001999961814748934, 'samples': 454176, 'steps': 887, 'loss/train': 3.159994602203369} -09/20/2021 17:33:41 - INFO - __main__ - Step 14194: {'lr': 0.0001999961814748934, 'samples': 454208, 'steps': 887, 'loss/train': 3.2468411922454834} -09/20/2021 17:33:42 - INFO - __main__ - Step 14195: {'lr': 0.0001999961814748934, 'samples': 454240, 'steps': 887, 'loss/train': 4.6597161293029785} -09/20/2021 17:33:43 - INFO - __main__ - Step 14196: {'lr': 0.0001999961814748934, 'samples': 454272, 'steps': 887, 'loss/train': 3.810650110244751} -09/20/2021 17:33:44 - INFO - __main__ - Step 14197: {'lr': 0.0001999961814748934, 'samples': 454304, 'steps': 887, 'loss/train': 3.9365234375} -09/20/2021 17:33:44 - INFO - __main__ - Step 14198: {'lr': 0.0001999961814748934, 'samples': 454336, 'steps': 887, 'loss/train': 3.781907796859741} -09/20/2021 17:33:45 - INFO - __main__ - Step 14199: {'lr': 0.0001999961814748934, 'samples': 454368, 'steps': 887, 'loss/train': 2.3987269401550293} -09/20/2021 17:33:46 - INFO - __main__ - Step 14200: {'lr': 0.0001999961814748934, 'samples': 454400, 'steps': 887, 'loss/train': 5.272470474243164} -09/20/2021 17:33:47 - INFO - __main__ - Step 14201: {'lr': 0.0001999961814748934, 'samples': 454432, 'steps': 887, 'loss/train': 4.102312088012695} -09/20/2021 17:33:47 - INFO - __main__ - Step 14202: {'lr': 0.0001999961814748934, 'samples': 454464, 'steps': 887, 'loss/train': 3.1621198654174805} -09/20/2021 17:33:48 - INFO - __main__ - Step 14203: {'lr': 0.0001999961814748934, 'samples': 454496, 'steps': 887, 'loss/train': 4.180722713470459} -09/20/2021 17:33:49 - INFO - __main__ - Step 14204: {'lr': 0.0001999961814748934, 'samples': 454528, 'steps': 887, 'loss/train': 3.2463226318359375} -09/20/2021 17:33:50 - INFO - __main__ - Step 14205: {'lr': 0.0001999961814748934, 'samples': 454560, 'steps': 887, 'loss/train': 3.9803802967071533} -09/20/2021 17:33:51 - INFO - __main__ - Step 14206: {'lr': 0.0001999961814748934, 'samples': 454592, 'steps': 887, 'loss/train': 3.7252864837646484} -09/20/2021 17:33:52 - INFO - __main__ - Step 14207: {'lr': 0.0001999961814748934, 'samples': 454624, 'steps': 887, 'loss/train': 4.834569454193115} -09/20/2021 17:33:52 - INFO - __main__ - Step 14208: {'lr': 0.0001999961814748934, 'samples': 454656, 'steps': 887, 'loss/train': 3.1781885623931885} -09/20/2021 17:33:53 - INFO - __main__ - Step 14209: {'lr': 0.00019999612552691414, 'samples': 454688, 'steps': 888, 'loss/train': 3.7497365474700928} -09/20/2021 17:33:54 - INFO - __main__ - Step 14210: {'lr': 0.00019999612552691414, 'samples': 454720, 'steps': 888, 'loss/train': 5.547143936157227} -09/20/2021 17:33:55 - INFO - __main__ - Step 14211: {'lr': 0.00019999612552691414, 'samples': 454752, 'steps': 888, 'loss/train': 2.2013285160064697} -09/20/2021 17:33:55 - INFO - __main__ - Step 14212: {'lr': 0.00019999612552691414, 'samples': 454784, 'steps': 888, 'loss/train': 4.688166618347168} -09/20/2021 17:33:56 - INFO - __main__ - Step 14213: {'lr': 0.00019999612552691414, 'samples': 454816, 'steps': 888, 'loss/train': 4.675026893615723} -09/20/2021 17:33:57 - INFO - __main__ - Step 14214: {'lr': 0.00019999612552691414, 'samples': 454848, 'steps': 888, 'loss/train': 4.196665287017822} -09/20/2021 17:33:58 - INFO - __main__ - Step 14215: {'lr': 0.00019999612552691414, 'samples': 454880, 'steps': 888, 'loss/train': 3.3849918842315674} -09/20/2021 17:33:58 - INFO - __main__ - Step 14216: {'lr': 0.00019999612552691414, 'samples': 454912, 'steps': 888, 'loss/train': 4.086844444274902} -09/20/2021 17:33:59 - INFO - __main__ - Step 14217: {'lr': 0.00019999612552691414, 'samples': 454944, 'steps': 888, 'loss/train': 3.475722551345825} -09/20/2021 17:34:00 - INFO - __main__ - Step 14218: {'lr': 0.00019999612552691414, 'samples': 454976, 'steps': 888, 'loss/train': 3.4984400272369385} -09/20/2021 17:34:01 - INFO - __main__ - Step 14219: {'lr': 0.00019999612552691414, 'samples': 455008, 'steps': 888, 'loss/train': 4.445842742919922} -09/20/2021 17:34:01 - INFO - __main__ - Step 14220: {'lr': 0.00019999612552691414, 'samples': 455040, 'steps': 888, 'loss/train': 3.7315847873687744} -09/20/2021 17:34:02 - INFO - __main__ - Step 14221: {'lr': 0.00019999612552691414, 'samples': 455072, 'steps': 888, 'loss/train': 2.968393087387085} -09/20/2021 17:34:03 - INFO - __main__ - Step 14222: {'lr': 0.00019999612552691414, 'samples': 455104, 'steps': 888, 'loss/train': 3.476762056350708} -09/20/2021 17:34:04 - INFO - __main__ - Step 14223: {'lr': 0.00019999612552691414, 'samples': 455136, 'steps': 888, 'loss/train': 3.3525731563568115} -09/20/2021 17:34:04 - INFO - __main__ - Step 14224: {'lr': 0.00019999612552691414, 'samples': 455168, 'steps': 888, 'loss/train': 5.110676288604736} -09/20/2021 17:34:05 - INFO - __main__ - Step 14225: {'lr': 0.000199996069172051, 'samples': 455200, 'steps': 889, 'loss/train': 4.389630317687988} -09/20/2021 17:34:06 - INFO - __main__ - Step 14226: {'lr': 0.000199996069172051, 'samples': 455232, 'steps': 889, 'loss/train': 4.004722595214844} -09/20/2021 17:34:07 - INFO - __main__ - Step 14227: {'lr': 0.000199996069172051, 'samples': 455264, 'steps': 889, 'loss/train': 3.9315147399902344} -09/20/2021 17:34:08 - INFO - __main__ - Step 14228: {'lr': 0.000199996069172051, 'samples': 455296, 'steps': 889, 'loss/train': 7.489767074584961} -09/20/2021 17:34:08 - INFO - __main__ - Step 14229: {'lr': 0.000199996069172051, 'samples': 455328, 'steps': 889, 'loss/train': 4.587721824645996} -09/20/2021 17:34:09 - INFO - __main__ - Step 14230: {'lr': 0.000199996069172051, 'samples': 455360, 'steps': 889, 'loss/train': 3.9245283603668213} -09/20/2021 17:34:10 - INFO - __main__ - Step 14231: {'lr': 0.000199996069172051, 'samples': 455392, 'steps': 889, 'loss/train': 3.3495235443115234} -09/20/2021 17:34:11 - INFO - __main__ - Step 14232: {'lr': 0.000199996069172051, 'samples': 455424, 'steps': 889, 'loss/train': 3.5921311378479004} -09/20/2021 17:34:11 - INFO - __main__ - Step 14233: {'lr': 0.000199996069172051, 'samples': 455456, 'steps': 889, 'loss/train': 2.418586492538452} -09/20/2021 17:34:12 - INFO - __main__ - Step 14234: {'lr': 0.000199996069172051, 'samples': 455488, 'steps': 889, 'loss/train': 3.689911365509033} -09/20/2021 17:34:14 - INFO - __main__ - Step 14235: {'lr': 0.000199996069172051, 'samples': 455520, 'steps': 889, 'loss/train': 3.203199625015259} -09/20/2021 17:34:15 - INFO - __main__ - Step 14236: {'lr': 0.000199996069172051, 'samples': 455552, 'steps': 889, 'loss/train': 2.956554889678955} -09/20/2021 17:34:15 - INFO - __main__ - Step 14237: {'lr': 0.000199996069172051, 'samples': 455584, 'steps': 889, 'loss/train': 4.4369707107543945} -09/20/2021 17:34:16 - INFO - __main__ - Step 14238: {'lr': 0.000199996069172051, 'samples': 455616, 'steps': 889, 'loss/train': 3.7545809745788574} -09/20/2021 17:34:17 - INFO - __main__ - Step 14239: {'lr': 0.000199996069172051, 'samples': 455648, 'steps': 889, 'loss/train': 4.099985599517822} -09/20/2021 17:34:18 - INFO - __main__ - Step 14240: {'lr': 0.000199996069172051, 'samples': 455680, 'steps': 889, 'loss/train': 3.6446921825408936} -09/20/2021 17:34:18 - INFO - __main__ - Step 14241: {'lr': 0.00019999601241030423, 'samples': 455712, 'steps': 890, 'loss/train': 4.055332660675049} -09/20/2021 17:34:19 - INFO - __main__ - Step 14242: {'lr': 0.00019999601241030423, 'samples': 455744, 'steps': 890, 'loss/train': 3.0729870796203613} -09/20/2021 17:34:20 - INFO - __main__ - Step 14243: {'lr': 0.00019999601241030423, 'samples': 455776, 'steps': 890, 'loss/train': 3.798668384552002} -09/20/2021 17:34:21 - INFO - __main__ - Step 14244: {'lr': 0.00019999601241030423, 'samples': 455808, 'steps': 890, 'loss/train': 2.6784987449645996} -09/20/2021 17:34:21 - INFO - __main__ - Step 14245: {'lr': 0.00019999601241030423, 'samples': 455840, 'steps': 890, 'loss/train': 3.3349549770355225} -09/20/2021 17:34:22 - INFO - __main__ - Step 14246: {'lr': 0.00019999601241030423, 'samples': 455872, 'steps': 890, 'loss/train': 3.4703614711761475} -09/20/2021 17:34:23 - INFO - __main__ - Step 14247: {'lr': 0.00019999601241030423, 'samples': 455904, 'steps': 890, 'loss/train': 3.428213596343994} -09/20/2021 17:34:24 - INFO - __main__ - Step 14248: {'lr': 0.00019999601241030423, 'samples': 455936, 'steps': 890, 'loss/train': 3.496842622756958} -09/20/2021 17:34:24 - INFO - __main__ - Step 14249: {'lr': 0.00019999601241030423, 'samples': 455968, 'steps': 890, 'loss/train': 4.45277214050293} -09/20/2021 17:34:25 - INFO - __main__ - Step 14250: {'lr': 0.00019999601241030423, 'samples': 456000, 'steps': 890, 'loss/train': 4.068141460418701} -09/20/2021 17:34:26 - INFO - __main__ - Step 14251: {'lr': 0.00019999601241030423, 'samples': 456032, 'steps': 890, 'loss/train': 6.562459945678711} -09/20/2021 17:34:27 - INFO - __main__ - Step 14252: {'lr': 0.00019999601241030423, 'samples': 456064, 'steps': 890, 'loss/train': 3.6213908195495605} -09/20/2021 17:34:27 - INFO - __main__ - Step 14253: {'lr': 0.00019999601241030423, 'samples': 456096, 'steps': 890, 'loss/train': 2.826777696609497} -09/20/2021 17:34:28 - INFO - __main__ - Step 14254: {'lr': 0.00019999601241030423, 'samples': 456128, 'steps': 890, 'loss/train': 4.325118541717529} -09/20/2021 17:34:29 - INFO - __main__ - Step 14255: {'lr': 0.00019999601241030423, 'samples': 456160, 'steps': 890, 'loss/train': 4.200131416320801} -09/20/2021 17:34:30 - INFO - __main__ - Step 14256: {'lr': 0.00019999601241030423, 'samples': 456192, 'steps': 890, 'loss/train': 3.9047789573669434} -09/20/2021 17:34:31 - INFO - __main__ - Step 14257: {'lr': 0.0001999959552416741, 'samples': 456224, 'steps': 891, 'loss/train': 3.3045499324798584} -09/20/2021 17:34:31 - INFO - __main__ - Step 14258: {'lr': 0.0001999959552416741, 'samples': 456256, 'steps': 891, 'loss/train': 1.3550549745559692} -09/20/2021 17:34:32 - INFO - __main__ - Step 14259: {'lr': 0.0001999959552416741, 'samples': 456288, 'steps': 891, 'loss/train': 3.748760461807251} -09/20/2021 17:34:33 - INFO - __main__ - Step 14260: {'lr': 0.0001999959552416741, 'samples': 456320, 'steps': 891, 'loss/train': 3.7354276180267334} -09/20/2021 17:34:34 - INFO - __main__ - Step 14261: {'lr': 0.0001999959552416741, 'samples': 456352, 'steps': 891, 'loss/train': 6.803324222564697} -09/20/2021 17:34:34 - INFO - __main__ - Step 14262: {'lr': 0.0001999959552416741, 'samples': 456384, 'steps': 891, 'loss/train': 4.129453182220459} -09/20/2021 17:34:35 - INFO - __main__ - Step 14263: {'lr': 0.0001999959552416741, 'samples': 456416, 'steps': 891, 'loss/train': 1.0126653909683228} -09/20/2021 17:34:36 - INFO - __main__ - Step 14264: {'lr': 0.0001999959552416741, 'samples': 456448, 'steps': 891, 'loss/train': 4.326703071594238} -09/20/2021 17:34:37 - INFO - __main__ - Step 14265: {'lr': 0.0001999959552416741, 'samples': 456480, 'steps': 891, 'loss/train': 3.3795597553253174} -09/20/2021 17:34:38 - INFO - __main__ - Step 14266: {'lr': 0.0001999959552416741, 'samples': 456512, 'steps': 891, 'loss/train': 3.750032901763916} -09/20/2021 17:34:39 - INFO - __main__ - Step 14267: {'lr': 0.0001999959552416741, 'samples': 456544, 'steps': 891, 'loss/train': 3.395491123199463} -09/20/2021 17:34:39 - INFO - __main__ - Step 14268: {'lr': 0.0001999959552416741, 'samples': 456576, 'steps': 891, 'loss/train': 4.3176589012146} -09/20/2021 17:34:40 - INFO - __main__ - Step 14269: {'lr': 0.0001999959552416741, 'samples': 456608, 'steps': 891, 'loss/train': 4.4143500328063965} -09/20/2021 17:34:41 - INFO - __main__ - Step 14270: {'lr': 0.0001999959552416741, 'samples': 456640, 'steps': 891, 'loss/train': 4.79584264755249} -09/20/2021 17:34:42 - INFO - __main__ - Step 14271: {'lr': 0.0001999959552416741, 'samples': 456672, 'steps': 891, 'loss/train': 5.563566207885742} -09/20/2021 17:34:42 - INFO - __main__ - Step 14272: {'lr': 0.0001999959552416741, 'samples': 456704, 'steps': 891, 'loss/train': 3.420776128768921} -09/20/2021 17:34:43 - INFO - __main__ - Step 14273: {'lr': 0.0001999958976661608, 'samples': 456736, 'steps': 892, 'loss/train': 3.6732516288757324} -09/20/2021 17:34:44 - INFO - __main__ - Step 14274: {'lr': 0.0001999958976661608, 'samples': 456768, 'steps': 892, 'loss/train': 4.22780179977417} -09/20/2021 17:34:45 - INFO - __main__ - Step 14275: {'lr': 0.0001999958976661608, 'samples': 456800, 'steps': 892, 'loss/train': 3.9223792552948} -09/20/2021 17:34:46 - INFO - __main__ - Step 14276: {'lr': 0.0001999958976661608, 'samples': 456832, 'steps': 892, 'loss/train': 4.007853984832764} -09/20/2021 17:34:46 - INFO - __main__ - Step 14277: {'lr': 0.0001999958976661608, 'samples': 456864, 'steps': 892, 'loss/train': 4.044539928436279} -09/20/2021 17:34:47 - INFO - __main__ - Step 14278: {'lr': 0.0001999958976661608, 'samples': 456896, 'steps': 892, 'loss/train': 3.9241721630096436} -09/20/2021 17:34:48 - INFO - __main__ - Step 14279: {'lr': 0.0001999958976661608, 'samples': 456928, 'steps': 892, 'loss/train': 4.275952339172363} -09/20/2021 17:34:49 - INFO - __main__ - Step 14280: {'lr': 0.0001999958976661608, 'samples': 456960, 'steps': 892, 'loss/train': 3.451869010925293} -09/20/2021 17:34:49 - INFO - __main__ - Step 14281: {'lr': 0.0001999958976661608, 'samples': 456992, 'steps': 892, 'loss/train': 4.713321208953857} -09/20/2021 17:34:50 - INFO - __main__ - Step 14282: {'lr': 0.0001999958976661608, 'samples': 457024, 'steps': 892, 'loss/train': 3.4416065216064453} -09/20/2021 17:34:51 - INFO - __main__ - Step 14283: {'lr': 0.0001999958976661608, 'samples': 457056, 'steps': 892, 'loss/train': 3.3103086948394775} -09/20/2021 17:34:52 - INFO - __main__ - Step 14284: {'lr': 0.0001999958976661608, 'samples': 457088, 'steps': 892, 'loss/train': 4.284217834472656} -09/20/2021 17:34:52 - INFO - __main__ - Step 14285: {'lr': 0.0001999958976661608, 'samples': 457120, 'steps': 892, 'loss/train': 3.473893642425537} -09/20/2021 17:34:53 - INFO - __main__ - Step 14286: {'lr': 0.0001999958976661608, 'samples': 457152, 'steps': 892, 'loss/train': 3.89640474319458} -09/20/2021 17:34:54 - INFO - __main__ - Step 14287: {'lr': 0.0001999958976661608, 'samples': 457184, 'steps': 892, 'loss/train': 4.736216068267822} -09/20/2021 17:34:55 - INFO - __main__ - Step 14288: {'lr': 0.0001999958976661608, 'samples': 457216, 'steps': 892, 'loss/train': 4.173854351043701} -09/20/2021 17:34:55 - INFO - __main__ - Step 14289: {'lr': 0.0001999958396837646, 'samples': 457248, 'steps': 893, 'loss/train': 1.9257144927978516} -09/20/2021 17:34:56 - INFO - __main__ - Step 14290: {'lr': 0.0001999958396837646, 'samples': 457280, 'steps': 893, 'loss/train': 3.8308286666870117} -09/20/2021 17:34:57 - INFO - __main__ - Step 14291: {'lr': 0.0001999958396837646, 'samples': 457312, 'steps': 893, 'loss/train': 4.4263739585876465} -09/20/2021 17:34:58 - INFO - __main__ - Step 14292: {'lr': 0.0001999958396837646, 'samples': 457344, 'steps': 893, 'loss/train': 4.798765182495117} -09/20/2021 17:34:58 - INFO - __main__ - Step 14293: {'lr': 0.0001999958396837646, 'samples': 457376, 'steps': 893, 'loss/train': 3.5186924934387207} -09/20/2021 17:34:59 - INFO - __main__ - Step 14294: {'lr': 0.0001999958396837646, 'samples': 457408, 'steps': 893, 'loss/train': 3.9332284927368164} -09/20/2021 17:35:00 - INFO - __main__ - Step 14295: {'lr': 0.0001999958396837646, 'samples': 457440, 'steps': 893, 'loss/train': 4.847353935241699} -09/20/2021 17:35:01 - INFO - __main__ - Step 14296: {'lr': 0.0001999958396837646, 'samples': 457472, 'steps': 893, 'loss/train': 3.4528286457061768} -09/20/2021 17:35:02 - INFO - __main__ - Step 14297: {'lr': 0.0001999958396837646, 'samples': 457504, 'steps': 893, 'loss/train': 4.484725475311279} -09/20/2021 17:35:03 - INFO - __main__ - Step 14298: {'lr': 0.0001999958396837646, 'samples': 457536, 'steps': 893, 'loss/train': 3.5472497940063477} -09/20/2021 17:35:03 - INFO - __main__ - Step 14299: {'lr': 0.0001999958396837646, 'samples': 457568, 'steps': 893, 'loss/train': 3.7722949981689453} -09/20/2021 17:35:04 - INFO - __main__ - Step 14300: {'lr': 0.0001999958396837646, 'samples': 457600, 'steps': 893, 'loss/train': 4.135725975036621} -09/20/2021 17:35:05 - INFO - __main__ - Step 14301: {'lr': 0.0001999958396837646, 'samples': 457632, 'steps': 893, 'loss/train': 3.8742940425872803} -09/20/2021 17:35:06 - INFO - __main__ - Step 14302: {'lr': 0.0001999958396837646, 'samples': 457664, 'steps': 893, 'loss/train': 2.8412318229675293} -09/20/2021 17:35:06 - INFO - __main__ - Step 14303: {'lr': 0.0001999958396837646, 'samples': 457696, 'steps': 893, 'loss/train': 2.2723135948181152} -09/20/2021 17:35:07 - INFO - __main__ - Step 14304: {'lr': 0.0001999958396837646, 'samples': 457728, 'steps': 893, 'loss/train': 2.0522844791412354} -09/20/2021 17:35:08 - INFO - __main__ - Step 14305: {'lr': 0.0001999957812944857, 'samples': 457760, 'steps': 894, 'loss/train': 3.971592903137207} -09/20/2021 17:35:09 - INFO - __main__ - Step 14306: {'lr': 0.0001999957812944857, 'samples': 457792, 'steps': 894, 'loss/train': 3.079878330230713} -09/20/2021 17:35:10 - INFO - __main__ - Step 14307: {'lr': 0.0001999957812944857, 'samples': 457824, 'steps': 894, 'loss/train': 4.1083269119262695} -09/20/2021 17:35:10 - INFO - __main__ - Step 14308: {'lr': 0.0001999957812944857, 'samples': 457856, 'steps': 894, 'loss/train': 3.7726681232452393} -09/20/2021 17:35:11 - INFO - __main__ - Step 14309: {'lr': 0.0001999957812944857, 'samples': 457888, 'steps': 894, 'loss/train': 3.980539321899414} -09/20/2021 17:35:12 - INFO - __main__ - Step 14310: {'lr': 0.0001999957812944857, 'samples': 457920, 'steps': 894, 'loss/train': 4.1372599601745605} -09/20/2021 17:35:13 - INFO - __main__ - Step 14311: {'lr': 0.0001999957812944857, 'samples': 457952, 'steps': 894, 'loss/train': 3.497279405593872} -09/20/2021 17:35:13 - INFO - __main__ - Step 14312: {'lr': 0.0001999957812944857, 'samples': 457984, 'steps': 894, 'loss/train': 3.672508716583252} -09/20/2021 17:35:14 - INFO - __main__ - Step 14313: {'lr': 0.0001999957812944857, 'samples': 458016, 'steps': 894, 'loss/train': 4.028905868530273} -09/20/2021 17:35:15 - INFO - __main__ - Step 14314: {'lr': 0.0001999957812944857, 'samples': 458048, 'steps': 894, 'loss/train': 3.566892385482788} -09/20/2021 17:35:16 - INFO - __main__ - Step 14315: {'lr': 0.0001999957812944857, 'samples': 458080, 'steps': 894, 'loss/train': 3.749706506729126} -09/20/2021 17:35:16 - INFO - __main__ - Step 14316: {'lr': 0.0001999957812944857, 'samples': 458112, 'steps': 894, 'loss/train': 4.612628936767578} -09/20/2021 17:35:17 - INFO - __main__ - Step 14317: {'lr': 0.0001999957812944857, 'samples': 458144, 'steps': 894, 'loss/train': 3.4004993438720703} -09/20/2021 17:35:18 - INFO - __main__ - Step 14318: {'lr': 0.0001999957812944857, 'samples': 458176, 'steps': 894, 'loss/train': 3.3172285556793213} -09/20/2021 17:35:19 - INFO - __main__ - Step 14319: {'lr': 0.0001999957812944857, 'samples': 458208, 'steps': 894, 'loss/train': 4.055354595184326} -09/20/2021 17:35:19 - INFO - __main__ - Step 14320: {'lr': 0.0001999957812944857, 'samples': 458240, 'steps': 894, 'loss/train': 4.446184158325195} -09/20/2021 17:35:20 - INFO - __main__ - Step 14321: {'lr': 0.00019999572249832434, 'samples': 458272, 'steps': 895, 'loss/train': 3.4823670387268066} -09/20/2021 17:35:21 - INFO - __main__ - Step 14322: {'lr': 0.00019999572249832434, 'samples': 458304, 'steps': 895, 'loss/train': 4.207427501678467} -09/20/2021 17:35:22 - INFO - __main__ - Step 14323: {'lr': 0.00019999572249832434, 'samples': 458336, 'steps': 895, 'loss/train': 4.603208065032959} -09/20/2021 17:35:23 - INFO - __main__ - Step 14324: {'lr': 0.00019999572249832434, 'samples': 458368, 'steps': 895, 'loss/train': 3.989581346511841} -09/20/2021 17:35:23 - INFO - __main__ - Step 14325: {'lr': 0.00019999572249832434, 'samples': 458400, 'steps': 895, 'loss/train': 2.830674886703491} -09/20/2021 17:35:24 - INFO - __main__ - Step 14326: {'lr': 0.00019999572249832434, 'samples': 458432, 'steps': 895, 'loss/train': 3.2072854042053223} -09/20/2021 17:35:25 - INFO - __main__ - Step 14327: {'lr': 0.00019999572249832434, 'samples': 458464, 'steps': 895, 'loss/train': 2.819275379180908} -09/20/2021 17:35:26 - INFO - __main__ - Step 14328: {'lr': 0.00019999572249832434, 'samples': 458496, 'steps': 895, 'loss/train': 2.6793699264526367} -09/20/2021 17:35:27 - INFO - __main__ - Step 14329: {'lr': 0.00019999572249832434, 'samples': 458528, 'steps': 895, 'loss/train': 3.5541908740997314} -09/20/2021 17:35:28 - INFO - __main__ - Step 14330: {'lr': 0.00019999572249832434, 'samples': 458560, 'steps': 895, 'loss/train': 4.294123649597168} -09/20/2021 17:35:28 - INFO - __main__ - Step 14331: {'lr': 0.00019999572249832434, 'samples': 458592, 'steps': 895, 'loss/train': 5.11336612701416} -09/20/2021 17:35:29 - INFO - __main__ - Step 14332: {'lr': 0.00019999572249832434, 'samples': 458624, 'steps': 895, 'loss/train': 2.192500352859497} -09/20/2021 17:35:30 - INFO - __main__ - Step 14333: {'lr': 0.00019999572249832434, 'samples': 458656, 'steps': 895, 'loss/train': 3.659363031387329} -09/20/2021 17:35:31 - INFO - __main__ - Step 14334: {'lr': 0.00019999572249832434, 'samples': 458688, 'steps': 895, 'loss/train': 2.8589208126068115} -09/20/2021 17:35:31 - INFO - __main__ - Step 14335: {'lr': 0.00019999572249832434, 'samples': 458720, 'steps': 895, 'loss/train': 3.612515449523926} -09/20/2021 17:35:32 - INFO - __main__ - Step 14336: {'lr': 0.00019999572249832434, 'samples': 458752, 'steps': 895, 'loss/train': 3.469770908355713} -09/20/2021 17:35:33 - INFO - __main__ - Step 14337: {'lr': 0.0001999956632952808, 'samples': 458784, 'steps': 896, 'loss/train': 3.740128755569458} -09/20/2021 17:35:34 - INFO - __main__ - Step 14338: {'lr': 0.0001999956632952808, 'samples': 458816, 'steps': 896, 'loss/train': 4.442699432373047} -09/20/2021 17:35:34 - INFO - __main__ - Step 14339: {'lr': 0.0001999956632952808, 'samples': 458848, 'steps': 896, 'loss/train': 1.4206053018569946} -09/20/2021 17:35:35 - INFO - __main__ - Step 14340: {'lr': 0.0001999956632952808, 'samples': 458880, 'steps': 896, 'loss/train': 3.730530261993408} -09/20/2021 17:35:36 - INFO - __main__ - Step 14341: {'lr': 0.0001999956632952808, 'samples': 458912, 'steps': 896, 'loss/train': 3.828738212585449} -09/20/2021 17:35:37 - INFO - __main__ - Step 14342: {'lr': 0.0001999956632952808, 'samples': 458944, 'steps': 896, 'loss/train': 3.6484951972961426} -09/20/2021 17:35:37 - INFO - __main__ - Step 14343: {'lr': 0.0001999956632952808, 'samples': 458976, 'steps': 896, 'loss/train': 4.0677266120910645} -09/20/2021 17:35:38 - INFO - __main__ - Step 14344: {'lr': 0.0001999956632952808, 'samples': 459008, 'steps': 896, 'loss/train': 4.479247570037842} -09/20/2021 17:35:39 - INFO - __main__ - Step 14345: {'lr': 0.0001999956632952808, 'samples': 459040, 'steps': 896, 'loss/train': 1.0978095531463623} -09/20/2021 17:35:40 - INFO - __main__ - Step 14346: {'lr': 0.0001999956632952808, 'samples': 459072, 'steps': 896, 'loss/train': 0.8933594822883606} -09/20/2021 17:35:40 - INFO - __main__ - Step 14347: {'lr': 0.0001999956632952808, 'samples': 459104, 'steps': 896, 'loss/train': 3.9150843620300293} -09/20/2021 17:35:41 - INFO - __main__ - Step 14348: {'lr': 0.0001999956632952808, 'samples': 459136, 'steps': 896, 'loss/train': 4.336253643035889} -09/20/2021 17:35:42 - INFO - __main__ - Step 14349: {'lr': 0.0001999956632952808, 'samples': 459168, 'steps': 896, 'loss/train': 2.47312068939209} -09/20/2021 17:35:43 - INFO - __main__ - Step 14350: {'lr': 0.0001999956632952808, 'samples': 459200, 'steps': 896, 'loss/train': 3.8009445667266846} -09/20/2021 17:35:43 - INFO - __main__ - Step 14351: {'lr': 0.0001999956632952808, 'samples': 459232, 'steps': 896, 'loss/train': 3.6520845890045166} -09/20/2021 17:35:44 - INFO - __main__ - Step 14352: {'lr': 0.0001999956632952808, 'samples': 459264, 'steps': 896, 'loss/train': 4.423449993133545} -09/20/2021 17:35:45 - INFO - __main__ - Step 14353: {'lr': 0.00019999560368535527, 'samples': 459296, 'steps': 897, 'loss/train': 4.300126552581787} -09/20/2021 17:35:46 - INFO - __main__ - Step 14354: {'lr': 0.00019999560368535527, 'samples': 459328, 'steps': 897, 'loss/train': 3.8466291427612305} -09/20/2021 17:35:47 - INFO - __main__ - Step 14355: {'lr': 0.00019999560368535527, 'samples': 459360, 'steps': 897, 'loss/train': 4.739898204803467} -09/20/2021 17:35:47 - INFO - __main__ - Step 14356: {'lr': 0.00019999560368535527, 'samples': 459392, 'steps': 897, 'loss/train': 3.385674476623535} -09/20/2021 17:35:48 - INFO - __main__ - Step 14357: {'lr': 0.00019999560368535527, 'samples': 459424, 'steps': 897, 'loss/train': 4.045036315917969} -09/20/2021 17:35:49 - INFO - __main__ - Step 14358: {'lr': 0.00019999560368535527, 'samples': 459456, 'steps': 897, 'loss/train': 3.239557981491089} -09/20/2021 17:35:50 - INFO - __main__ - Step 14359: {'lr': 0.00019999560368535527, 'samples': 459488, 'steps': 897, 'loss/train': 3.5903217792510986} -09/20/2021 17:35:51 - INFO - __main__ - Step 14360: {'lr': 0.00019999560368535527, 'samples': 459520, 'steps': 897, 'loss/train': 3.868828058242798} -09/20/2021 17:35:52 - INFO - __main__ - Step 14361: {'lr': 0.00019999560368535527, 'samples': 459552, 'steps': 897, 'loss/train': 4.1851043701171875} -09/20/2021 17:35:52 - INFO - __main__ - Step 14362: {'lr': 0.00019999560368535527, 'samples': 459584, 'steps': 897, 'loss/train': 5.226545810699463} -09/20/2021 17:35:53 - INFO - __main__ - Step 14363: {'lr': 0.00019999560368535527, 'samples': 459616, 'steps': 897, 'loss/train': 3.2903647422790527} -09/20/2021 17:35:54 - INFO - __main__ - Step 14364: {'lr': 0.00019999560368535527, 'samples': 459648, 'steps': 897, 'loss/train': 3.9427690505981445} -09/20/2021 17:35:55 - INFO - __main__ - Step 14365: {'lr': 0.00019999560368535527, 'samples': 459680, 'steps': 897, 'loss/train': 3.2080636024475098} -09/20/2021 17:35:55 - INFO - __main__ - Step 14366: {'lr': 0.00019999560368535527, 'samples': 459712, 'steps': 897, 'loss/train': 3.7739787101745605} -09/20/2021 17:35:56 - INFO - __main__ - Step 14367: {'lr': 0.00019999560368535527, 'samples': 459744, 'steps': 897, 'loss/train': 2.9151217937469482} -09/20/2021 17:35:57 - INFO - __main__ - Step 14368: {'lr': 0.00019999560368535527, 'samples': 459776, 'steps': 897, 'loss/train': 3.9292805194854736} -09/20/2021 17:35:58 - INFO - __main__ - Step 14369: {'lr': 0.00019999554366854802, 'samples': 459808, 'steps': 898, 'loss/train': 4.307036399841309} -09/20/2021 17:35:59 - INFO - __main__ - Step 14370: {'lr': 0.00019999554366854802, 'samples': 459840, 'steps': 898, 'loss/train': 4.507481575012207} -09/20/2021 17:35:59 - INFO - __main__ - Step 14371: {'lr': 0.00019999554366854802, 'samples': 459872, 'steps': 898, 'loss/train': 2.820399522781372} -09/20/2021 17:36:00 - INFO - __main__ - Step 14372: {'lr': 0.00019999554366854802, 'samples': 459904, 'steps': 898, 'loss/train': 3.159242630004883} -09/20/2021 17:36:01 - INFO - __main__ - Step 14373: {'lr': 0.00019999554366854802, 'samples': 459936, 'steps': 898, 'loss/train': 4.273611545562744} -09/20/2021 17:36:02 - INFO - __main__ - Step 14374: {'lr': 0.00019999554366854802, 'samples': 459968, 'steps': 898, 'loss/train': 4.017053127288818} -09/20/2021 17:36:02 - INFO - __main__ - Step 14375: {'lr': 0.00019999554366854802, 'samples': 460000, 'steps': 898, 'loss/train': 3.4386651515960693} -09/20/2021 17:36:03 - INFO - __main__ - Step 14376: {'lr': 0.00019999554366854802, 'samples': 460032, 'steps': 898, 'loss/train': 4.278730869293213} -09/20/2021 17:36:04 - INFO - __main__ - Step 14377: {'lr': 0.00019999554366854802, 'samples': 460064, 'steps': 898, 'loss/train': 4.641199588775635} -09/20/2021 17:36:05 - INFO - __main__ - Step 14378: {'lr': 0.00019999554366854802, 'samples': 460096, 'steps': 898, 'loss/train': 3.937304973602295} -09/20/2021 17:36:05 - INFO - __main__ - Step 14379: {'lr': 0.00019999554366854802, 'samples': 460128, 'steps': 898, 'loss/train': 3.4976749420166016} -09/20/2021 17:36:06 - INFO - __main__ - Step 14380: {'lr': 0.00019999554366854802, 'samples': 460160, 'steps': 898, 'loss/train': 4.3143229484558105} -09/20/2021 17:36:07 - INFO - __main__ - Step 14381: {'lr': 0.00019999554366854802, 'samples': 460192, 'steps': 898, 'loss/train': 4.169865131378174} -09/20/2021 17:36:08 - INFO - __main__ - Step 14382: {'lr': 0.00019999554366854802, 'samples': 460224, 'steps': 898, 'loss/train': 4.033476829528809} -09/20/2021 17:36:08 - INFO - __main__ - Step 14383: {'lr': 0.00019999554366854802, 'samples': 460256, 'steps': 898, 'loss/train': 3.6237411499023438} -09/20/2021 17:36:09 - INFO - __main__ - Step 14384: {'lr': 0.00019999554366854802, 'samples': 460288, 'steps': 898, 'loss/train': 3.6068150997161865} -09/20/2021 17:36:10 - INFO - __main__ - Step 14385: {'lr': 0.00019999548324485932, 'samples': 460320, 'steps': 899, 'loss/train': 4.116662502288818} -09/20/2021 17:36:11 - INFO - __main__ - Step 14386: {'lr': 0.00019999548324485932, 'samples': 460352, 'steps': 899, 'loss/train': 4.197206974029541} -09/20/2021 17:36:11 - INFO - __main__ - Step 14387: {'lr': 0.00019999548324485932, 'samples': 460384, 'steps': 899, 'loss/train': 3.0829038619995117} -09/20/2021 17:36:12 - INFO - __main__ - Step 14388: {'lr': 0.00019999548324485932, 'samples': 460416, 'steps': 899, 'loss/train': 3.534485340118408} -09/20/2021 17:36:13 - INFO - __main__ - Step 14389: {'lr': 0.00019999548324485932, 'samples': 460448, 'steps': 899, 'loss/train': 4.486137390136719} -09/20/2021 17:36:14 - INFO - __main__ - Step 14390: {'lr': 0.00019999548324485932, 'samples': 460480, 'steps': 899, 'loss/train': 0.892396092414856} -09/20/2021 17:36:15 - INFO - __main__ - Step 14391: {'lr': 0.00019999548324485932, 'samples': 460512, 'steps': 899, 'loss/train': 0.78476881980896} -09/20/2021 17:36:16 - INFO - __main__ - Step 14392: {'lr': 0.00019999548324485932, 'samples': 460544, 'steps': 899, 'loss/train': 4.431501388549805} -09/20/2021 17:36:16 - INFO - __main__ - Step 14393: {'lr': 0.00019999548324485932, 'samples': 460576, 'steps': 899, 'loss/train': 3.342336893081665} -09/20/2021 17:36:17 - INFO - __main__ - Step 14394: {'lr': 0.00019999548324485932, 'samples': 460608, 'steps': 899, 'loss/train': 3.0080010890960693} -09/20/2021 17:36:18 - INFO - __main__ - Step 14395: {'lr': 0.00019999548324485932, 'samples': 460640, 'steps': 899, 'loss/train': 3.2055013179779053} -09/20/2021 17:36:19 - INFO - __main__ - Step 14396: {'lr': 0.00019999548324485932, 'samples': 460672, 'steps': 899, 'loss/train': 3.5772719383239746} -09/20/2021 17:36:19 - INFO - __main__ - Step 14397: {'lr': 0.00019999548324485932, 'samples': 460704, 'steps': 899, 'loss/train': 4.400094509124756} -09/20/2021 17:36:20 - INFO - __main__ - Step 14398: {'lr': 0.00019999548324485932, 'samples': 460736, 'steps': 899, 'loss/train': 4.322717189788818} -09/20/2021 17:36:21 - INFO - __main__ - Step 14399: {'lr': 0.00019999548324485932, 'samples': 460768, 'steps': 899, 'loss/train': 3.7824082374572754} -09/20/2021 17:36:22 - INFO - __main__ - Step 14400: {'lr': 0.00019999548324485932, 'samples': 460800, 'steps': 899, 'loss/train': 3.612448215484619} -09/20/2021 17:36:23 - INFO - __main__ - Step 14401: {'lr': 0.00019999542241428935, 'samples': 460832, 'steps': 900, 'loss/train': 3.502251148223877} -09/20/2021 17:36:23 - INFO - __main__ - Step 14402: {'lr': 0.00019999542241428935, 'samples': 460864, 'steps': 900, 'loss/train': 3.649843692779541} -09/20/2021 17:36:24 - INFO - __main__ - Step 14403: {'lr': 0.00019999542241428935, 'samples': 460896, 'steps': 900, 'loss/train': 3.854386329650879} -09/20/2021 17:36:25 - INFO - __main__ - Step 14404: {'lr': 0.00019999542241428935, 'samples': 460928, 'steps': 900, 'loss/train': 3.511301279067993} -09/20/2021 17:36:26 - INFO - __main__ - Step 14405: {'lr': 0.00019999542241428935, 'samples': 460960, 'steps': 900, 'loss/train': 3.8575057983398438} -09/20/2021 17:36:26 - INFO - __main__ - Step 14406: {'lr': 0.00019999542241428935, 'samples': 460992, 'steps': 900, 'loss/train': 3.9269232749938965} -09/20/2021 17:36:27 - INFO - __main__ - Step 14407: {'lr': 0.00019999542241428935, 'samples': 461024, 'steps': 900, 'loss/train': 0.9656960964202881} -09/20/2021 17:36:28 - INFO - __main__ - Step 14408: {'lr': 0.00019999542241428935, 'samples': 461056, 'steps': 900, 'loss/train': 4.172285556793213} -09/20/2021 17:36:29 - INFO - __main__ - Step 14409: {'lr': 0.00019999542241428935, 'samples': 461088, 'steps': 900, 'loss/train': 4.445596218109131} -09/20/2021 17:36:29 - INFO - __main__ - Step 14410: {'lr': 0.00019999542241428935, 'samples': 461120, 'steps': 900, 'loss/train': 6.332667827606201} -09/20/2021 17:36:30 - INFO - __main__ - Step 14411: {'lr': 0.00019999542241428935, 'samples': 461152, 'steps': 900, 'loss/train': 6.463472843170166} -09/20/2021 17:36:31 - INFO - __main__ - Step 14412: {'lr': 0.00019999542241428935, 'samples': 461184, 'steps': 900, 'loss/train': 3.9127588272094727} -09/20/2021 17:36:32 - INFO - __main__ - Step 14413: {'lr': 0.00019999542241428935, 'samples': 461216, 'steps': 900, 'loss/train': 2.8502347469329834} -09/20/2021 17:36:32 - INFO - __main__ - Step 14414: {'lr': 0.00019999542241428935, 'samples': 461248, 'steps': 900, 'loss/train': 3.5371222496032715} -09/20/2021 17:36:33 - INFO - __main__ - Step 14415: {'lr': 0.00019999542241428935, 'samples': 461280, 'steps': 900, 'loss/train': 3.1613643169403076} -09/20/2021 17:36:34 - INFO - __main__ - Step 14416: {'lr': 0.00019999542241428935, 'samples': 461312, 'steps': 900, 'loss/train': 3.9629828929901123} -09/20/2021 17:36:35 - INFO - __main__ - Step 14417: {'lr': 0.00019999536117683842, 'samples': 461344, 'steps': 901, 'loss/train': 3.8340964317321777} -09/20/2021 17:36:35 - INFO - __main__ - Step 14418: {'lr': 0.00019999536117683842, 'samples': 461376, 'steps': 901, 'loss/train': 4.0475239753723145} -09/20/2021 17:36:36 - INFO - __main__ - Step 14419: {'lr': 0.00019999536117683842, 'samples': 461408, 'steps': 901, 'loss/train': 3.99713397026062} -09/20/2021 17:36:37 - INFO - __main__ - Step 14420: {'lr': 0.00019999536117683842, 'samples': 461440, 'steps': 901, 'loss/train': 4.108545303344727} -09/20/2021 17:36:38 - INFO - __main__ - Step 14421: {'lr': 0.00019999536117683842, 'samples': 461472, 'steps': 901, 'loss/train': 3.970038414001465} -09/20/2021 17:36:39 - INFO - __main__ - Step 14422: {'lr': 0.00019999536117683842, 'samples': 461504, 'steps': 901, 'loss/train': 3.8321659564971924} -09/20/2021 17:36:40 - INFO - __main__ - Step 14423: {'lr': 0.00019999536117683842, 'samples': 461536, 'steps': 901, 'loss/train': 4.421684265136719} -09/20/2021 17:36:41 - INFO - __main__ - Step 14424: {'lr': 0.00019999536117683842, 'samples': 461568, 'steps': 901, 'loss/train': 3.828491687774658} -09/20/2021 17:36:41 - INFO - __main__ - Step 14425: {'lr': 0.00019999536117683842, 'samples': 461600, 'steps': 901, 'loss/train': 3.917066812515259} -09/20/2021 17:36:42 - INFO - __main__ - Step 14426: {'lr': 0.00019999536117683842, 'samples': 461632, 'steps': 901, 'loss/train': 4.004735946655273} -09/20/2021 17:36:43 - INFO - __main__ - Step 14427: {'lr': 0.00019999536117683842, 'samples': 461664, 'steps': 901, 'loss/train': 4.562780857086182} -09/20/2021 17:36:44 - INFO - __main__ - Step 14428: {'lr': 0.00019999536117683842, 'samples': 461696, 'steps': 901, 'loss/train': 4.0611042976379395} -09/20/2021 17:36:44 - INFO - __main__ - Step 14429: {'lr': 0.00019999536117683842, 'samples': 461728, 'steps': 901, 'loss/train': 4.021551132202148} -09/20/2021 17:36:45 - INFO - __main__ - Step 14430: {'lr': 0.00019999536117683842, 'samples': 461760, 'steps': 901, 'loss/train': 3.415894031524658} -09/20/2021 17:36:46 - INFO - __main__ - Step 14431: {'lr': 0.00019999536117683842, 'samples': 461792, 'steps': 901, 'loss/train': 4.9330058097839355} -09/20/2021 17:36:47 - INFO - __main__ - Step 14432: {'lr': 0.00019999536117683842, 'samples': 461824, 'steps': 901, 'loss/train': 4.27390718460083} -09/20/2021 17:36:47 - INFO - __main__ - Step 14433: {'lr': 0.00019999529953250675, 'samples': 461856, 'steps': 902, 'loss/train': 4.038913726806641} -09/20/2021 17:36:48 - INFO - __main__ - Step 14434: {'lr': 0.00019999529953250675, 'samples': 461888, 'steps': 902, 'loss/train': 3.721398115158081} -09/20/2021 17:36:49 - INFO - __main__ - Step 14435: {'lr': 0.00019999529953250675, 'samples': 461920, 'steps': 902, 'loss/train': 3.924257278442383} -09/20/2021 17:36:50 - INFO - __main__ - Step 14436: {'lr': 0.00019999529953250675, 'samples': 461952, 'steps': 902, 'loss/train': 3.755751132965088} -09/20/2021 17:36:50 - INFO - __main__ - Step 14437: {'lr': 0.00019999529953250675, 'samples': 461984, 'steps': 902, 'loss/train': 4.089193344116211} -09/20/2021 17:36:51 - INFO - __main__ - Step 14438: {'lr': 0.00019999529953250675, 'samples': 462016, 'steps': 902, 'loss/train': 4.336679458618164} -09/20/2021 17:36:52 - INFO - __main__ - Step 14439: {'lr': 0.00019999529953250675, 'samples': 462048, 'steps': 902, 'loss/train': 4.638967514038086} -09/20/2021 17:36:53 - INFO - __main__ - Step 14440: {'lr': 0.00019999529953250675, 'samples': 462080, 'steps': 902, 'loss/train': 3.4716286659240723} -09/20/2021 17:36:53 - INFO - __main__ - Step 14441: {'lr': 0.00019999529953250675, 'samples': 462112, 'steps': 902, 'loss/train': 5.110100269317627} -09/20/2021 17:36:54 - INFO - __main__ - Step 14442: {'lr': 0.00019999529953250675, 'samples': 462144, 'steps': 902, 'loss/train': 4.246917247772217} -09/20/2021 17:36:55 - INFO - __main__ - Step 14443: {'lr': 0.00019999529953250675, 'samples': 462176, 'steps': 902, 'loss/train': 3.816041946411133} -09/20/2021 17:36:56 - INFO - __main__ - Step 14444: {'lr': 0.00019999529953250675, 'samples': 462208, 'steps': 902, 'loss/train': 3.5025339126586914} -09/20/2021 17:36:57 - INFO - __main__ - Step 14445: {'lr': 0.00019999529953250675, 'samples': 462240, 'steps': 902, 'loss/train': 4.315547466278076} -09/20/2021 17:36:57 - INFO - __main__ - Step 14446: {'lr': 0.00019999529953250675, 'samples': 462272, 'steps': 902, 'loss/train': 3.6464622020721436} -09/20/2021 17:36:58 - INFO - __main__ - Step 14447: {'lr': 0.00019999529953250675, 'samples': 462304, 'steps': 902, 'loss/train': 3.4933977127075195} -09/20/2021 17:36:59 - INFO - __main__ - Step 14448: {'lr': 0.00019999529953250675, 'samples': 462336, 'steps': 902, 'loss/train': 4.489396572113037} -09/20/2021 17:37:00 - INFO - __main__ - Step 14449: {'lr': 0.0001999952374812946, 'samples': 462368, 'steps': 903, 'loss/train': 2.1240198612213135} -09/20/2021 17:37:00 - INFO - __main__ - Step 14450: {'lr': 0.0001999952374812946, 'samples': 462400, 'steps': 903, 'loss/train': 3.98087739944458} -09/20/2021 17:37:01 - INFO - __main__ - Step 14451: {'lr': 0.0001999952374812946, 'samples': 462432, 'steps': 903, 'loss/train': 3.1818997859954834} -09/20/2021 17:37:02 - INFO - __main__ - Step 14452: {'lr': 0.0001999952374812946, 'samples': 462464, 'steps': 903, 'loss/train': 4.0845046043396} -09/20/2021 17:37:03 - INFO - __main__ - Step 14453: {'lr': 0.0001999952374812946, 'samples': 462496, 'steps': 903, 'loss/train': 4.246333122253418} -09/20/2021 17:37:04 - INFO - __main__ - Step 14454: {'lr': 0.0001999952374812946, 'samples': 462528, 'steps': 903, 'loss/train': 3.2745068073272705} -09/20/2021 17:37:05 - INFO - __main__ - Step 14455: {'lr': 0.0001999952374812946, 'samples': 462560, 'steps': 903, 'loss/train': 4.410967826843262} -09/20/2021 17:37:05 - INFO - __main__ - Step 14456: {'lr': 0.0001999952374812946, 'samples': 462592, 'steps': 903, 'loss/train': 3.5837576389312744} -09/20/2021 17:37:06 - INFO - __main__ - Step 14457: {'lr': 0.0001999952374812946, 'samples': 462624, 'steps': 903, 'loss/train': 5.606301784515381} -09/20/2021 17:37:07 - INFO - __main__ - Step 14458: {'lr': 0.0001999952374812946, 'samples': 462656, 'steps': 903, 'loss/train': 2.8199379444122314} -09/20/2021 17:37:08 - INFO - __main__ - Step 14459: {'lr': 0.0001999952374812946, 'samples': 462688, 'steps': 903, 'loss/train': 2.827216863632202} -09/20/2021 17:37:08 - INFO - __main__ - Step 14460: {'lr': 0.0001999952374812946, 'samples': 462720, 'steps': 903, 'loss/train': 3.503746271133423} -09/20/2021 17:37:09 - INFO - __main__ - Step 14461: {'lr': 0.0001999952374812946, 'samples': 462752, 'steps': 903, 'loss/train': 3.3171379566192627} -09/20/2021 17:37:10 - INFO - __main__ - Step 14462: {'lr': 0.0001999952374812946, 'samples': 462784, 'steps': 903, 'loss/train': 4.995660305023193} -09/20/2021 17:37:11 - INFO - __main__ - Step 14463: {'lr': 0.0001999952374812946, 'samples': 462816, 'steps': 903, 'loss/train': 2.5826306343078613} -09/20/2021 17:37:11 - INFO - __main__ - Step 14464: {'lr': 0.0001999952374812946, 'samples': 462848, 'steps': 903, 'loss/train': 3.6662991046905518} -09/20/2021 17:37:12 - INFO - __main__ - Step 14465: {'lr': 0.0001999951750232022, 'samples': 462880, 'steps': 904, 'loss/train': 3.3390674591064453} -09/20/2021 17:37:13 - INFO - __main__ - Step 14466: {'lr': 0.0001999951750232022, 'samples': 462912, 'steps': 904, 'loss/train': 4.314344882965088} -09/20/2021 17:37:14 - INFO - __main__ - Step 14467: {'lr': 0.0001999951750232022, 'samples': 462944, 'steps': 904, 'loss/train': 4.163910865783691} -09/20/2021 17:37:15 - INFO - __main__ - Step 14468: {'lr': 0.0001999951750232022, 'samples': 462976, 'steps': 904, 'loss/train': 3.75009822845459} -09/20/2021 17:37:15 - INFO - __main__ - Step 14469: {'lr': 0.0001999951750232022, 'samples': 463008, 'steps': 904, 'loss/train': 4.078174114227295} -09/20/2021 17:37:16 - INFO - __main__ - Step 14470: {'lr': 0.0001999951750232022, 'samples': 463040, 'steps': 904, 'loss/train': 4.112732887268066} -09/20/2021 17:37:17 - INFO - __main__ - Step 14471: {'lr': 0.0001999951750232022, 'samples': 463072, 'steps': 904, 'loss/train': 3.9413392543792725} -09/20/2021 17:37:18 - INFO - __main__ - Step 14472: {'lr': 0.0001999951750232022, 'samples': 463104, 'steps': 904, 'loss/train': 3.963028907775879} -09/20/2021 17:37:18 - INFO - __main__ - Step 14473: {'lr': 0.0001999951750232022, 'samples': 463136, 'steps': 904, 'loss/train': 3.784130811691284} -09/20/2021 17:37:19 - INFO - __main__ - Step 14474: {'lr': 0.0001999951750232022, 'samples': 463168, 'steps': 904, 'loss/train': 4.541180610656738} -09/20/2021 17:37:20 - INFO - __main__ - Step 14475: {'lr': 0.0001999951750232022, 'samples': 463200, 'steps': 904, 'loss/train': 3.6199724674224854} -09/20/2021 17:37:21 - INFO - __main__ - Step 14476: {'lr': 0.0001999951750232022, 'samples': 463232, 'steps': 904, 'loss/train': 3.6897387504577637} -09/20/2021 17:37:21 - INFO - __main__ - Step 14477: {'lr': 0.0001999951750232022, 'samples': 463264, 'steps': 904, 'loss/train': 4.410264015197754} -09/20/2021 17:37:22 - INFO - __main__ - Step 14478: {'lr': 0.0001999951750232022, 'samples': 463296, 'steps': 904, 'loss/train': 4.088655948638916} -09/20/2021 17:37:23 - INFO - __main__ - Step 14479: {'lr': 0.0001999951750232022, 'samples': 463328, 'steps': 904, 'loss/train': 4.197007656097412} -09/20/2021 17:37:24 - INFO - __main__ - Step 14480: {'lr': 0.0001999951750232022, 'samples': 463360, 'steps': 904, 'loss/train': 2.7657837867736816} -09/20/2021 17:37:24 - INFO - __main__ - Step 14481: {'lr': 0.00019999511215822985, 'samples': 463392, 'steps': 905, 'loss/train': 3.67195463180542} -09/20/2021 17:37:25 - INFO - __main__ - Step 14482: {'lr': 0.00019999511215822985, 'samples': 463424, 'steps': 905, 'loss/train': 3.0928854942321777} -09/20/2021 17:37:26 - INFO - __main__ - Step 14483: {'lr': 0.00019999511215822985, 'samples': 463456, 'steps': 905, 'loss/train': 3.8333184719085693} -09/20/2021 17:37:27 - INFO - __main__ - Step 14484: {'lr': 0.00019999511215822985, 'samples': 463488, 'steps': 905, 'loss/train': 4.056633949279785} -09/20/2021 17:37:28 - INFO - __main__ - Step 14485: {'lr': 0.00019999511215822985, 'samples': 463520, 'steps': 905, 'loss/train': 4.457232475280762} -09/20/2021 17:37:29 - INFO - __main__ - Step 14486: {'lr': 0.00019999511215822985, 'samples': 463552, 'steps': 905, 'loss/train': 3.8539817333221436} -09/20/2021 17:37:29 - INFO - __main__ - Step 14487: {'lr': 0.00019999511215822985, 'samples': 463584, 'steps': 905, 'loss/train': 3.6844022274017334} -09/20/2021 17:37:30 - INFO - __main__ - Step 14488: {'lr': 0.00019999511215822985, 'samples': 463616, 'steps': 905, 'loss/train': 3.3367514610290527} -09/20/2021 17:37:31 - INFO - __main__ - Step 14489: {'lr': 0.00019999511215822985, 'samples': 463648, 'steps': 905, 'loss/train': 3.968905210494995} -09/20/2021 17:37:32 - INFO - __main__ - Step 14490: {'lr': 0.00019999511215822985, 'samples': 463680, 'steps': 905, 'loss/train': 4.266056537628174} -09/20/2021 17:37:32 - INFO - __main__ - Step 14491: {'lr': 0.00019999511215822985, 'samples': 463712, 'steps': 905, 'loss/train': 3.79679274559021} -09/20/2021 17:37:33 - INFO - __main__ - Step 14492: {'lr': 0.00019999511215822985, 'samples': 463744, 'steps': 905, 'loss/train': 4.058928489685059} -09/20/2021 17:37:34 - INFO - __main__ - Step 14493: {'lr': 0.00019999511215822985, 'samples': 463776, 'steps': 905, 'loss/train': 4.571557521820068} -09/20/2021 17:37:35 - INFO - __main__ - Step 14494: {'lr': 0.00019999511215822985, 'samples': 463808, 'steps': 905, 'loss/train': 3.4852962493896484} -09/20/2021 17:37:35 - INFO - __main__ - Step 14495: {'lr': 0.00019999511215822985, 'samples': 463840, 'steps': 905, 'loss/train': 4.237942695617676} -09/20/2021 17:37:36 - INFO - __main__ - Step 14496: {'lr': 0.00019999511215822985, 'samples': 463872, 'steps': 905, 'loss/train': 5.767998218536377} -09/20/2021 17:37:37 - INFO - __main__ - Step 14497: {'lr': 0.00019999504888637773, 'samples': 463904, 'steps': 906, 'loss/train': 3.792215347290039} -09/20/2021 17:37:38 - INFO - __main__ - Step 14498: {'lr': 0.00019999504888637773, 'samples': 463936, 'steps': 906, 'loss/train': 3.693462371826172} -09/20/2021 17:37:39 - INFO - __main__ - Step 14499: {'lr': 0.00019999504888637773, 'samples': 463968, 'steps': 906, 'loss/train': 4.730345249176025} -09/20/2021 17:37:39 - INFO - __main__ - Step 14500: {'lr': 0.00019999504888637773, 'samples': 464000, 'steps': 906, 'loss/train': 3.153398036956787} -09/20/2021 17:37:40 - INFO - __main__ - Step 14501: {'lr': 0.00019999504888637773, 'samples': 464032, 'steps': 906, 'loss/train': 3.718950033187866} -09/20/2021 17:37:41 - INFO - __main__ - Step 14502: {'lr': 0.00019999504888637773, 'samples': 464064, 'steps': 906, 'loss/train': 2.918909788131714} -09/20/2021 17:37:42 - INFO - __main__ - Step 14503: {'lr': 0.00019999504888637773, 'samples': 464096, 'steps': 906, 'loss/train': 1.4005913734436035} -09/20/2021 17:37:42 - INFO - __main__ - Step 14504: {'lr': 0.00019999504888637773, 'samples': 464128, 'steps': 906, 'loss/train': 4.635822296142578} -09/20/2021 17:37:43 - INFO - __main__ - Step 14505: {'lr': 0.00019999504888637773, 'samples': 464160, 'steps': 906, 'loss/train': 2.225581169128418} -09/20/2021 17:37:44 - INFO - __main__ - Step 14506: {'lr': 0.00019999504888637773, 'samples': 464192, 'steps': 906, 'loss/train': 4.764238357543945} -09/20/2021 17:37:45 - INFO - __main__ - Step 14507: {'lr': 0.00019999504888637773, 'samples': 464224, 'steps': 906, 'loss/train': 2.6536450386047363} -09/20/2021 17:37:45 - INFO - __main__ - Step 14508: {'lr': 0.00019999504888637773, 'samples': 464256, 'steps': 906, 'loss/train': 3.3479061126708984} -09/20/2021 17:37:46 - INFO - __main__ - Step 14509: {'lr': 0.00019999504888637773, 'samples': 464288, 'steps': 906, 'loss/train': 3.680527448654175} -09/20/2021 17:37:47 - INFO - __main__ - Step 14510: {'lr': 0.00019999504888637773, 'samples': 464320, 'steps': 906, 'loss/train': 3.976078748703003} -09/20/2021 17:37:48 - INFO - __main__ - Step 14511: {'lr': 0.00019999504888637773, 'samples': 464352, 'steps': 906, 'loss/train': 3.3573875427246094} -09/20/2021 17:37:48 - INFO - __main__ - Step 14512: {'lr': 0.00019999504888637773, 'samples': 464384, 'steps': 906, 'loss/train': 3.51824951171875} -09/20/2021 17:37:49 - INFO - __main__ - Step 14513: {'lr': 0.00019999498520764615, 'samples': 464416, 'steps': 907, 'loss/train': 4.177755832672119} -09/20/2021 17:37:50 - INFO - __main__ - Step 14514: {'lr': 0.00019999498520764615, 'samples': 464448, 'steps': 907, 'loss/train': 3.932166814804077} -09/20/2021 17:37:52 - INFO - __main__ - Step 14515: {'lr': 0.00019999498520764615, 'samples': 464480, 'steps': 907, 'loss/train': 4.140517234802246} -09/20/2021 17:37:52 - INFO - __main__ - Step 14516: {'lr': 0.00019999498520764615, 'samples': 464512, 'steps': 907, 'loss/train': 4.9413743019104} -09/20/2021 17:37:53 - INFO - __main__ - Step 14517: {'lr': 0.00019999498520764615, 'samples': 464544, 'steps': 907, 'loss/train': 4.513391017913818} -09/20/2021 17:37:54 - INFO - __main__ - Step 14518: {'lr': 0.00019999498520764615, 'samples': 464576, 'steps': 907, 'loss/train': 3.519439697265625} -09/20/2021 17:37:55 - INFO - __main__ - Step 14519: {'lr': 0.00019999498520764615, 'samples': 464608, 'steps': 907, 'loss/train': 3.82440185546875} -09/20/2021 17:37:55 - INFO - __main__ - Step 14520: {'lr': 0.00019999498520764615, 'samples': 464640, 'steps': 907, 'loss/train': 0.5905527472496033} -09/20/2021 17:37:56 - INFO - __main__ - Step 14521: {'lr': 0.00019999498520764615, 'samples': 464672, 'steps': 907, 'loss/train': 4.165826320648193} -09/20/2021 17:37:57 - INFO - __main__ - Step 14522: {'lr': 0.00019999498520764615, 'samples': 464704, 'steps': 907, 'loss/train': 3.165074586868286} -09/20/2021 17:37:58 - INFO - __main__ - Step 14523: {'lr': 0.00019999498520764615, 'samples': 464736, 'steps': 907, 'loss/train': 4.904946327209473} -09/20/2021 17:37:58 - INFO - __main__ - Step 14524: {'lr': 0.00019999498520764615, 'samples': 464768, 'steps': 907, 'loss/train': 5.443978786468506} -09/20/2021 17:37:59 - INFO - __main__ - Step 14525: {'lr': 0.00019999498520764615, 'samples': 464800, 'steps': 907, 'loss/train': 4.882306098937988} -09/20/2021 17:38:00 - INFO - __main__ - Step 14526: {'lr': 0.00019999498520764615, 'samples': 464832, 'steps': 907, 'loss/train': 5.0945658683776855} -09/20/2021 17:38:01 - INFO - __main__ - Step 14527: {'lr': 0.00019999498520764615, 'samples': 464864, 'steps': 907, 'loss/train': 3.756913661956787} -09/20/2021 17:38:01 - INFO - __main__ - Step 14528: {'lr': 0.00019999498520764615, 'samples': 464896, 'steps': 907, 'loss/train': 3.5068812370300293} -09/20/2021 17:38:02 - INFO - __main__ - Step 14529: {'lr': 0.0001999949211220354, 'samples': 464928, 'steps': 908, 'loss/train': 4.530573844909668} -09/20/2021 17:38:03 - INFO - __main__ - Step 14530: {'lr': 0.0001999949211220354, 'samples': 464960, 'steps': 908, 'loss/train': 4.20059871673584} -09/20/2021 17:38:04 - INFO - __main__ - Step 14531: {'lr': 0.0001999949211220354, 'samples': 464992, 'steps': 908, 'loss/train': 5.080560207366943} -09/20/2021 17:38:04 - INFO - __main__ - Step 14532: {'lr': 0.0001999949211220354, 'samples': 465024, 'steps': 908, 'loss/train': 3.0027310848236084} -09/20/2021 17:38:05 - INFO - __main__ - Step 14533: {'lr': 0.0001999949211220354, 'samples': 465056, 'steps': 908, 'loss/train': 3.7919461727142334} -09/20/2021 17:38:06 - INFO - __main__ - Step 14534: {'lr': 0.0001999949211220354, 'samples': 465088, 'steps': 908, 'loss/train': 3.5029125213623047} -09/20/2021 17:38:07 - INFO - __main__ - Step 14535: {'lr': 0.0001999949211220354, 'samples': 465120, 'steps': 908, 'loss/train': 3.9976067543029785} -09/20/2021 17:38:07 - INFO - __main__ - Step 14536: {'lr': 0.0001999949211220354, 'samples': 465152, 'steps': 908, 'loss/train': 4.858298301696777} -09/20/2021 17:38:08 - INFO - __main__ - Step 14537: {'lr': 0.0001999949211220354, 'samples': 465184, 'steps': 908, 'loss/train': 3.5744776725769043} -09/20/2021 17:38:09 - INFO - __main__ - Step 14538: {'lr': 0.0001999949211220354, 'samples': 465216, 'steps': 908, 'loss/train': 4.389369964599609} -09/20/2021 17:38:10 - INFO - __main__ - Step 14539: {'lr': 0.0001999949211220354, 'samples': 465248, 'steps': 908, 'loss/train': 3.7485411167144775} -09/20/2021 17:38:10 - INFO - __main__ - Step 14540: {'lr': 0.0001999949211220354, 'samples': 465280, 'steps': 908, 'loss/train': 3.666156530380249} -09/20/2021 17:38:11 - INFO - __main__ - Step 14541: {'lr': 0.0001999949211220354, 'samples': 465312, 'steps': 908, 'loss/train': 3.9067656993865967} -09/20/2021 17:38:12 - INFO - __main__ - Step 14542: {'lr': 0.0001999949211220354, 'samples': 465344, 'steps': 908, 'loss/train': 3.886909246444702} -09/20/2021 17:38:13 - INFO - __main__ - Step 14543: {'lr': 0.0001999949211220354, 'samples': 465376, 'steps': 908, 'loss/train': 3.4079947471618652} -09/20/2021 17:38:13 - INFO - __main__ - Step 14544: {'lr': 0.0001999949211220354, 'samples': 465408, 'steps': 908, 'loss/train': 4.315451145172119} -09/20/2021 17:38:14 - INFO - __main__ - Step 14545: {'lr': 0.00019999485662954567, 'samples': 465440, 'steps': 909, 'loss/train': 3.9837486743927} -09/20/2021 17:38:15 - INFO - __main__ - Step 14546: {'lr': 0.00019999485662954567, 'samples': 465472, 'steps': 909, 'loss/train': 1.7519664764404297} -09/20/2021 17:38:16 - INFO - __main__ - Step 14547: {'lr': 0.00019999485662954567, 'samples': 465504, 'steps': 909, 'loss/train': 3.6075327396392822} -09/20/2021 17:38:17 - INFO - __main__ - Step 14548: {'lr': 0.00019999485662954567, 'samples': 465536, 'steps': 909, 'loss/train': 4.561975479125977} -09/20/2021 17:38:18 - INFO - __main__ - Step 14549: {'lr': 0.00019999485662954567, 'samples': 465568, 'steps': 909, 'loss/train': 3.799398899078369} -09/20/2021 17:38:19 - INFO - __main__ - Step 14550: {'lr': 0.00019999485662954567, 'samples': 465600, 'steps': 909, 'loss/train': 4.07563591003418} -09/20/2021 17:38:19 - INFO - __main__ - Step 14551: {'lr': 0.00019999485662954567, 'samples': 465632, 'steps': 909, 'loss/train': 2.8986871242523193} -09/20/2021 17:38:20 - INFO - __main__ - Step 14552: {'lr': 0.00019999485662954567, 'samples': 465664, 'steps': 909, 'loss/train': 1.8984307050704956} -09/20/2021 17:38:21 - INFO - __main__ - Step 14553: {'lr': 0.00019999485662954567, 'samples': 465696, 'steps': 909, 'loss/train': 3.9963326454162598} -09/20/2021 17:38:22 - INFO - __main__ - Step 14554: {'lr': 0.00019999485662954567, 'samples': 465728, 'steps': 909, 'loss/train': 4.288894176483154} -09/20/2021 17:38:22 - INFO - __main__ - Step 14555: {'lr': 0.00019999485662954567, 'samples': 465760, 'steps': 909, 'loss/train': 3.71744704246521} -09/20/2021 17:38:23 - INFO - __main__ - Step 14556: {'lr': 0.00019999485662954567, 'samples': 465792, 'steps': 909, 'loss/train': 3.091414451599121} -09/20/2021 17:38:24 - INFO - __main__ - Step 14557: {'lr': 0.00019999485662954567, 'samples': 465824, 'steps': 909, 'loss/train': 4.104827404022217} -09/20/2021 17:38:25 - INFO - __main__ - Step 14558: {'lr': 0.00019999485662954567, 'samples': 465856, 'steps': 909, 'loss/train': 3.5551369190216064} -09/20/2021 17:38:25 - INFO - __main__ - Step 14559: {'lr': 0.00019999485662954567, 'samples': 465888, 'steps': 909, 'loss/train': 2.4270429611206055} -09/20/2021 17:38:26 - INFO - __main__ - Step 14560: {'lr': 0.00019999485662954567, 'samples': 465920, 'steps': 909, 'loss/train': 3.5146749019622803} -09/20/2021 17:38:27 - INFO - __main__ - Step 14561: {'lr': 0.00019999479173017726, 'samples': 465952, 'steps': 910, 'loss/train': 4.02989387512207} -09/20/2021 17:38:28 - INFO - __main__ - Step 14562: {'lr': 0.00019999479173017726, 'samples': 465984, 'steps': 910, 'loss/train': 3.8797380924224854} -09/20/2021 17:38:28 - INFO - __main__ - Step 14563: {'lr': 0.00019999479173017726, 'samples': 466016, 'steps': 910, 'loss/train': 1.992167592048645} -09/20/2021 17:38:29 - INFO - __main__ - Step 14564: {'lr': 0.00019999479173017726, 'samples': 466048, 'steps': 910, 'loss/train': 3.5704967975616455} -09/20/2021 17:38:30 - INFO - __main__ - Step 14565: {'lr': 0.00019999479173017726, 'samples': 466080, 'steps': 910, 'loss/train': 3.535032272338867} -09/20/2021 17:38:31 - INFO - __main__ - Step 14566: {'lr': 0.00019999479173017726, 'samples': 466112, 'steps': 910, 'loss/train': 4.203611850738525} -09/20/2021 17:38:31 - INFO - __main__ - Step 14567: {'lr': 0.00019999479173017726, 'samples': 466144, 'steps': 910, 'loss/train': 3.2943594455718994} -09/20/2021 17:38:32 - INFO - __main__ - Step 14568: {'lr': 0.00019999479173017726, 'samples': 466176, 'steps': 910, 'loss/train': 3.807248592376709} -09/20/2021 17:38:33 - INFO - __main__ - Step 14569: {'lr': 0.00019999479173017726, 'samples': 466208, 'steps': 910, 'loss/train': 3.8929007053375244} -09/20/2021 17:38:34 - INFO - __main__ - Step 14570: {'lr': 0.00019999479173017726, 'samples': 466240, 'steps': 910, 'loss/train': 3.0332443714141846} -09/20/2021 17:38:34 - INFO - __main__ - Step 14571: {'lr': 0.00019999479173017726, 'samples': 466272, 'steps': 910, 'loss/train': 3.3652217388153076} -09/20/2021 17:38:35 - INFO - __main__ - Step 14572: {'lr': 0.00019999479173017726, 'samples': 466304, 'steps': 910, 'loss/train': 3.887589931488037} -09/20/2021 17:38:36 - INFO - __main__ - Step 14573: {'lr': 0.00019999479173017726, 'samples': 466336, 'steps': 910, 'loss/train': 4.21035623550415} -09/20/2021 17:38:37 - INFO - __main__ - Step 14574: {'lr': 0.00019999479173017726, 'samples': 466368, 'steps': 910, 'loss/train': 3.900583267211914} -09/20/2021 17:38:37 - INFO - __main__ - Step 14575: {'lr': 0.00019999479173017726, 'samples': 466400, 'steps': 910, 'loss/train': 4.719539642333984} -09/20/2021 17:38:38 - INFO - __main__ - Step 14576: {'lr': 0.00019999479173017726, 'samples': 466432, 'steps': 910, 'loss/train': 5.265089511871338} -09/20/2021 17:38:39 - INFO - __main__ - Step 14577: {'lr': 0.00019999472642393047, 'samples': 466464, 'steps': 911, 'loss/train': 4.16115140914917} -09/20/2021 17:38:41 - INFO - __main__ - Step 14578: {'lr': 0.00019999472642393047, 'samples': 466496, 'steps': 911, 'loss/train': 4.533095836639404} -09/20/2021 17:38:42 - INFO - __main__ - Step 14579: {'lr': 0.00019999472642393047, 'samples': 466528, 'steps': 911, 'loss/train': 4.285905838012695} -09/20/2021 17:38:43 - INFO - __main__ - Step 14580: {'lr': 0.00019999472642393047, 'samples': 466560, 'steps': 911, 'loss/train': 3.5989034175872803} -09/20/2021 17:38:43 - INFO - __main__ - Step 14581: {'lr': 0.00019999472642393047, 'samples': 466592, 'steps': 911, 'loss/train': 4.1346940994262695} -09/20/2021 17:38:44 - INFO - __main__ - Step 14582: {'lr': 0.00019999472642393047, 'samples': 466624, 'steps': 911, 'loss/train': 4.717152118682861} -09/20/2021 17:38:45 - INFO - __main__ - Step 14583: {'lr': 0.00019999472642393047, 'samples': 466656, 'steps': 911, 'loss/train': 3.7857041358947754} -09/20/2021 17:38:46 - INFO - __main__ - Step 14584: {'lr': 0.00019999472642393047, 'samples': 466688, 'steps': 911, 'loss/train': 4.605965614318848} -09/20/2021 17:38:46 - INFO - __main__ - Step 14585: {'lr': 0.00019999472642393047, 'samples': 466720, 'steps': 911, 'loss/train': 4.206153869628906} -09/20/2021 17:38:47 - INFO - __main__ - Step 14586: {'lr': 0.00019999472642393047, 'samples': 466752, 'steps': 911, 'loss/train': 3.249586582183838} -09/20/2021 17:38:48 - INFO - __main__ - Step 14587: {'lr': 0.00019999472642393047, 'samples': 466784, 'steps': 911, 'loss/train': 3.9466023445129395} -09/20/2021 17:38:49 - INFO - __main__ - Step 14588: {'lr': 0.00019999472642393047, 'samples': 466816, 'steps': 911, 'loss/train': 4.283313274383545} -09/20/2021 17:38:49 - INFO - __main__ - Step 14589: {'lr': 0.00019999472642393047, 'samples': 466848, 'steps': 911, 'loss/train': 4.4562482833862305} -09/20/2021 17:38:50 - INFO - __main__ - Step 14590: {'lr': 0.00019999472642393047, 'samples': 466880, 'steps': 911, 'loss/train': 4.0550312995910645} -09/20/2021 17:38:51 - INFO - __main__ - Step 14591: {'lr': 0.00019999472642393047, 'samples': 466912, 'steps': 911, 'loss/train': 3.7812390327453613} -09/20/2021 17:38:52 - INFO - __main__ - Step 14592: {'lr': 0.00019999472642393047, 'samples': 466944, 'steps': 911, 'loss/train': 3.375903606414795} -09/20/2021 17:38:53 - INFO - __main__ - Step 14593: {'lr': 0.0001999946607108055, 'samples': 466976, 'steps': 912, 'loss/train': 4.756021022796631} -09/20/2021 17:38:53 - INFO - __main__ - Step 14594: {'lr': 0.0001999946607108055, 'samples': 467008, 'steps': 912, 'loss/train': 3.1658012866973877} -09/20/2021 17:38:54 - INFO - __main__ - Step 14595: {'lr': 0.0001999946607108055, 'samples': 467040, 'steps': 912, 'loss/train': 3.3021676540374756} -09/20/2021 17:38:55 - INFO - __main__ - Step 14596: {'lr': 0.0001999946607108055, 'samples': 467072, 'steps': 912, 'loss/train': 3.2883288860321045} -09/20/2021 17:38:56 - INFO - __main__ - Step 14597: {'lr': 0.0001999946607108055, 'samples': 467104, 'steps': 912, 'loss/train': 2.762259006500244} -09/20/2021 17:38:56 - INFO - __main__ - Step 14598: {'lr': 0.0001999946607108055, 'samples': 467136, 'steps': 912, 'loss/train': 3.379985809326172} -09/20/2021 17:38:57 - INFO - __main__ - Step 14599: {'lr': 0.0001999946607108055, 'samples': 467168, 'steps': 912, 'loss/train': 2.4255211353302} -09/20/2021 17:38:58 - INFO - __main__ - Step 14600: {'lr': 0.0001999946607108055, 'samples': 467200, 'steps': 912, 'loss/train': 2.5284781455993652} -09/20/2021 17:38:59 - INFO - __main__ - Step 14601: {'lr': 0.0001999946607108055, 'samples': 467232, 'steps': 912, 'loss/train': 2.366633415222168} -09/20/2021 17:38:59 - INFO - __main__ - Step 14602: {'lr': 0.0001999946607108055, 'samples': 467264, 'steps': 912, 'loss/train': 3.779266595840454} -09/20/2021 17:39:00 - INFO - __main__ - Step 14603: {'lr': 0.0001999946607108055, 'samples': 467296, 'steps': 912, 'loss/train': 4.261382102966309} -09/20/2021 17:39:01 - INFO - __main__ - Step 14604: {'lr': 0.0001999946607108055, 'samples': 467328, 'steps': 912, 'loss/train': 3.5795116424560547} -09/20/2021 17:39:02 - INFO - __main__ - Step 14605: {'lr': 0.0001999946607108055, 'samples': 467360, 'steps': 912, 'loss/train': 4.100636959075928} -09/20/2021 17:39:02 - INFO - __main__ - Step 14606: {'lr': 0.0001999946607108055, 'samples': 467392, 'steps': 912, 'loss/train': 4.25731086730957} -09/20/2021 17:39:03 - INFO - __main__ - Step 14607: {'lr': 0.0001999946607108055, 'samples': 467424, 'steps': 912, 'loss/train': 5.1336517333984375} -09/20/2021 17:39:04 - INFO - __main__ - Step 14608: {'lr': 0.0001999946607108055, 'samples': 467456, 'steps': 912, 'loss/train': 3.959639310836792} -09/20/2021 17:39:05 - INFO - __main__ - Step 14609: {'lr': 0.00019999459459080264, 'samples': 467488, 'steps': 913, 'loss/train': 3.170132637023926} -09/20/2021 17:39:06 - INFO - __main__ - Step 14610: {'lr': 0.00019999459459080264, 'samples': 467520, 'steps': 913, 'loss/train': 3.32442569732666} -09/20/2021 17:39:07 - INFO - __main__ - Step 14611: {'lr': 0.00019999459459080264, 'samples': 467552, 'steps': 913, 'loss/train': 4.382776260375977} -09/20/2021 17:39:07 - INFO - __main__ - Step 14612: {'lr': 0.00019999459459080264, 'samples': 467584, 'steps': 913, 'loss/train': 4.171169281005859} -09/20/2021 17:39:08 - INFO - __main__ - Step 14613: {'lr': 0.00019999459459080264, 'samples': 467616, 'steps': 913, 'loss/train': 5.051274299621582} -09/20/2021 17:39:09 - INFO - __main__ - Step 14614: {'lr': 0.00019999459459080264, 'samples': 467648, 'steps': 913, 'loss/train': 4.208676338195801} -09/20/2021 17:39:10 - INFO - __main__ - Step 14615: {'lr': 0.00019999459459080264, 'samples': 467680, 'steps': 913, 'loss/train': 3.707965135574341} -09/20/2021 17:39:10 - INFO - __main__ - Step 14616: {'lr': 0.00019999459459080264, 'samples': 467712, 'steps': 913, 'loss/train': 3.2471706867218018} -09/20/2021 17:39:11 - INFO - __main__ - Step 14617: {'lr': 0.00019999459459080264, 'samples': 467744, 'steps': 913, 'loss/train': 3.646897077560425} -09/20/2021 17:39:12 - INFO - __main__ - Step 14618: {'lr': 0.00019999459459080264, 'samples': 467776, 'steps': 913, 'loss/train': 3.8915319442749023} -09/20/2021 17:39:13 - INFO - __main__ - Step 14619: {'lr': 0.00019999459459080264, 'samples': 467808, 'steps': 913, 'loss/train': 3.55007266998291} -09/20/2021 17:39:13 - INFO - __main__ - Step 14620: {'lr': 0.00019999459459080264, 'samples': 467840, 'steps': 913, 'loss/train': 3.787106513977051} -09/20/2021 17:39:14 - INFO - __main__ - Step 14621: {'lr': 0.00019999459459080264, 'samples': 467872, 'steps': 913, 'loss/train': 3.8526101112365723} -09/20/2021 17:39:15 - INFO - __main__ - Step 14622: {'lr': 0.00019999459459080264, 'samples': 467904, 'steps': 913, 'loss/train': 4.105713367462158} -09/20/2021 17:39:16 - INFO - __main__ - Step 14623: {'lr': 0.00019999459459080264, 'samples': 467936, 'steps': 913, 'loss/train': 3.426065444946289} -09/20/2021 17:39:16 - INFO - __main__ - Step 14624: {'lr': 0.00019999459459080264, 'samples': 467968, 'steps': 913, 'loss/train': 4.36418342590332} -09/20/2021 17:39:17 - INFO - __main__ - Step 14625: {'lr': 0.00019999452806392215, 'samples': 468000, 'steps': 914, 'loss/train': 4.439134120941162} -09/20/2021 17:39:18 - INFO - __main__ - Step 14626: {'lr': 0.00019999452806392215, 'samples': 468032, 'steps': 914, 'loss/train': 4.7662177085876465} -09/20/2021 17:39:19 - INFO - __main__ - Step 14627: {'lr': 0.00019999452806392215, 'samples': 468064, 'steps': 914, 'loss/train': 3.5509817600250244} -09/20/2021 17:39:20 - INFO - __main__ - Step 14628: {'lr': 0.00019999452806392215, 'samples': 468096, 'steps': 914, 'loss/train': 2.649240255355835} -09/20/2021 17:39:20 - INFO - __main__ - Step 14629: {'lr': 0.00019999452806392215, 'samples': 468128, 'steps': 914, 'loss/train': 3.4882822036743164} -09/20/2021 17:39:21 - INFO - __main__ - Step 14630: {'lr': 0.00019999452806392215, 'samples': 468160, 'steps': 914, 'loss/train': 4.75009298324585} -09/20/2021 17:39:22 - INFO - __main__ - Step 14631: {'lr': 0.00019999452806392215, 'samples': 468192, 'steps': 914, 'loss/train': 3.516494035720825} -09/20/2021 17:39:23 - INFO - __main__ - Step 14632: {'lr': 0.00019999452806392215, 'samples': 468224, 'steps': 914, 'loss/train': 3.264765977859497} -09/20/2021 17:39:23 - INFO - __main__ - Step 14633: {'lr': 0.00019999452806392215, 'samples': 468256, 'steps': 914, 'loss/train': 2.5334246158599854} -09/20/2021 17:39:24 - INFO - __main__ - Step 14634: {'lr': 0.00019999452806392215, 'samples': 468288, 'steps': 914, 'loss/train': 3.429535388946533} -09/20/2021 17:39:25 - INFO - __main__ - Step 14635: {'lr': 0.00019999452806392215, 'samples': 468320, 'steps': 914, 'loss/train': 3.7687268257141113} -09/20/2021 17:39:26 - INFO - __main__ - Step 14636: {'lr': 0.00019999452806392215, 'samples': 468352, 'steps': 914, 'loss/train': 3.9805822372436523} -09/20/2021 17:39:26 - INFO - __main__ - Step 14637: {'lr': 0.00019999452806392215, 'samples': 468384, 'steps': 914, 'loss/train': 3.4917590618133545} -09/20/2021 17:39:27 - INFO - __main__ - Step 14638: {'lr': 0.00019999452806392215, 'samples': 468416, 'steps': 914, 'loss/train': 3.386691093444824} -09/20/2021 17:39:28 - INFO - __main__ - Step 14639: {'lr': 0.00019999452806392215, 'samples': 468448, 'steps': 914, 'loss/train': 4.1083807945251465} -09/20/2021 17:39:29 - INFO - __main__ - Step 14640: {'lr': 0.00019999452806392215, 'samples': 468480, 'steps': 914, 'loss/train': 4.136220455169678} -09/20/2021 17:39:30 - INFO - __main__ - Step 14641: {'lr': 0.00019999446113016432, 'samples': 468512, 'steps': 915, 'loss/train': 4.6686224937438965} -09/20/2021 17:39:31 - INFO - __main__ - Step 14642: {'lr': 0.00019999446113016432, 'samples': 468544, 'steps': 915, 'loss/train': 3.9577126502990723} -09/20/2021 17:39:31 - INFO - __main__ - Step 14643: {'lr': 0.00019999446113016432, 'samples': 468576, 'steps': 915, 'loss/train': 3.730501890182495} -09/20/2021 17:39:32 - INFO - __main__ - Step 14644: {'lr': 0.00019999446113016432, 'samples': 468608, 'steps': 915, 'loss/train': 3.8163018226623535} -09/20/2021 17:39:33 - INFO - __main__ - Step 14645: {'lr': 0.00019999446113016432, 'samples': 468640, 'steps': 915, 'loss/train': 1.1583664417266846} -09/20/2021 17:39:34 - INFO - __main__ - Step 14646: {'lr': 0.00019999446113016432, 'samples': 468672, 'steps': 915, 'loss/train': 5.1588134765625} -09/20/2021 17:39:34 - INFO - __main__ - Step 14647: {'lr': 0.00019999446113016432, 'samples': 468704, 'steps': 915, 'loss/train': 5.014006614685059} -09/20/2021 17:39:35 - INFO - __main__ - Step 14648: {'lr': 0.00019999446113016432, 'samples': 468736, 'steps': 915, 'loss/train': 3.241452932357788} -09/20/2021 17:39:36 - INFO - __main__ - Step 14649: {'lr': 0.00019999446113016432, 'samples': 468768, 'steps': 915, 'loss/train': 3.5537452697753906} -09/20/2021 17:39:37 - INFO - __main__ - Step 14650: {'lr': 0.00019999446113016432, 'samples': 468800, 'steps': 915, 'loss/train': 4.533556938171387} -09/20/2021 17:39:37 - INFO - __main__ - Step 14651: {'lr': 0.00019999446113016432, 'samples': 468832, 'steps': 915, 'loss/train': 3.921095371246338} -09/20/2021 17:39:38 - INFO - __main__ - Step 14652: {'lr': 0.00019999446113016432, 'samples': 468864, 'steps': 915, 'loss/train': 2.924821615219116} -09/20/2021 17:39:39 - INFO - __main__ - Step 14653: {'lr': 0.00019999446113016432, 'samples': 468896, 'steps': 915, 'loss/train': 5.3980712890625} -09/20/2021 17:39:40 - INFO - __main__ - Step 14654: {'lr': 0.00019999446113016432, 'samples': 468928, 'steps': 915, 'loss/train': 4.501133441925049} -09/20/2021 17:39:40 - INFO - __main__ - Step 14655: {'lr': 0.00019999446113016432, 'samples': 468960, 'steps': 915, 'loss/train': 4.127435684204102} -09/20/2021 17:39:41 - INFO - __main__ - Step 14656: {'lr': 0.00019999446113016432, 'samples': 468992, 'steps': 915, 'loss/train': 3.471712589263916} -09/20/2021 17:39:42 - INFO - __main__ - Step 14657: {'lr': 0.00019999439378952944, 'samples': 469024, 'steps': 916, 'loss/train': 3.667846441268921} -09/20/2021 17:39:43 - INFO - __main__ - Step 14658: {'lr': 0.00019999439378952944, 'samples': 469056, 'steps': 916, 'loss/train': 3.4079430103302} -09/20/2021 17:39:44 - INFO - __main__ - Step 14659: {'lr': 0.00019999439378952944, 'samples': 469088, 'steps': 916, 'loss/train': 3.235903263092041} -09/20/2021 17:39:44 - INFO - __main__ - Step 14660: {'lr': 0.00019999439378952944, 'samples': 469120, 'steps': 916, 'loss/train': 4.120580196380615} -09/20/2021 17:39:45 - INFO - __main__ - Step 14661: {'lr': 0.00019999439378952944, 'samples': 469152, 'steps': 916, 'loss/train': 4.215738296508789} -09/20/2021 17:39:46 - INFO - __main__ - Step 14662: {'lr': 0.00019999439378952944, 'samples': 469184, 'steps': 916, 'loss/train': 3.7750422954559326} -09/20/2021 17:39:47 - INFO - __main__ - Step 14663: {'lr': 0.00019999439378952944, 'samples': 469216, 'steps': 916, 'loss/train': 3.8309876918792725} -09/20/2021 17:39:47 - INFO - __main__ - Step 14664: {'lr': 0.00019999439378952944, 'samples': 469248, 'steps': 916, 'loss/train': 3.7444021701812744} -09/20/2021 17:39:48 - INFO - __main__ - Step 14665: {'lr': 0.00019999439378952944, 'samples': 469280, 'steps': 916, 'loss/train': 4.213076114654541} -09/20/2021 17:39:49 - INFO - __main__ - Step 14666: {'lr': 0.00019999439378952944, 'samples': 469312, 'steps': 916, 'loss/train': 3.668179512023926} -09/20/2021 17:39:50 - INFO - __main__ - Step 14667: {'lr': 0.00019999439378952944, 'samples': 469344, 'steps': 916, 'loss/train': 4.403337001800537} -09/20/2021 17:39:50 - INFO - __main__ - Step 14668: {'lr': 0.00019999439378952944, 'samples': 469376, 'steps': 916, 'loss/train': 4.135979652404785} -09/20/2021 17:39:51 - INFO - __main__ - Step 14669: {'lr': 0.00019999439378952944, 'samples': 469408, 'steps': 916, 'loss/train': 4.964376449584961} -09/20/2021 17:39:52 - INFO - __main__ - Step 14670: {'lr': 0.00019999439378952944, 'samples': 469440, 'steps': 916, 'loss/train': 4.575099945068359} -09/20/2021 17:39:53 - INFO - __main__ - Step 14671: {'lr': 0.00019999439378952944, 'samples': 469472, 'steps': 916, 'loss/train': 5.187491416931152} -09/20/2021 17:39:54 - INFO - __main__ - Step 14672: {'lr': 0.00019999439378952944, 'samples': 469504, 'steps': 916, 'loss/train': 1.9469330310821533} -09/20/2021 17:39:55 - INFO - __main__ - Step 14673: {'lr': 0.00019999432604201776, 'samples': 469536, 'steps': 917, 'loss/train': 3.917232036590576} -09/20/2021 17:39:56 - INFO - __main__ - Step 14674: {'lr': 0.00019999432604201776, 'samples': 469568, 'steps': 917, 'loss/train': 3.24454665184021} -09/20/2021 17:39:56 - INFO - __main__ - Step 14675: {'lr': 0.00019999432604201776, 'samples': 469600, 'steps': 917, 'loss/train': 4.238831043243408} -09/20/2021 17:39:57 - INFO - __main__ - Step 14676: {'lr': 0.00019999432604201776, 'samples': 469632, 'steps': 917, 'loss/train': 4.593649864196777} -09/20/2021 17:39:58 - INFO - __main__ - Step 14677: {'lr': 0.00019999432604201776, 'samples': 469664, 'steps': 917, 'loss/train': 3.4187135696411133} -09/20/2021 17:39:59 - INFO - __main__ - Step 14678: {'lr': 0.00019999432604201776, 'samples': 469696, 'steps': 917, 'loss/train': 3.6330268383026123} -09/20/2021 17:39:59 - INFO - __main__ - Step 14679: {'lr': 0.00019999432604201776, 'samples': 469728, 'steps': 917, 'loss/train': 4.668287754058838} -09/20/2021 17:40:00 - INFO - __main__ - Step 14680: {'lr': 0.00019999432604201776, 'samples': 469760, 'steps': 917, 'loss/train': 5.136999607086182} -09/20/2021 17:40:01 - INFO - __main__ - Step 14681: {'lr': 0.00019999432604201776, 'samples': 469792, 'steps': 917, 'loss/train': 4.251902103424072} -09/20/2021 17:40:02 - INFO - __main__ - Step 14682: {'lr': 0.00019999432604201776, 'samples': 469824, 'steps': 917, 'loss/train': 4.49857759475708} -09/20/2021 17:40:02 - INFO - __main__ - Step 14683: {'lr': 0.00019999432604201776, 'samples': 469856, 'steps': 917, 'loss/train': 4.452916145324707} -09/20/2021 17:40:03 - INFO - __main__ - Step 14684: {'lr': 0.00019999432604201776, 'samples': 469888, 'steps': 917, 'loss/train': 4.326997756958008} -09/20/2021 17:40:04 - INFO - __main__ - Step 14685: {'lr': 0.00019999432604201776, 'samples': 469920, 'steps': 917, 'loss/train': 4.376492977142334} -09/20/2021 17:40:05 - INFO - __main__ - Step 14686: {'lr': 0.00019999432604201776, 'samples': 469952, 'steps': 917, 'loss/train': 2.7402868270874023} -09/20/2021 17:40:05 - INFO - __main__ - Step 14687: {'lr': 0.00019999432604201776, 'samples': 469984, 'steps': 917, 'loss/train': 4.169252872467041} -09/20/2021 17:40:06 - INFO - __main__ - Step 14688: {'lr': 0.00019999432604201776, 'samples': 470016, 'steps': 917, 'loss/train': 4.93079948425293} -09/20/2021 17:40:07 - INFO - __main__ - Step 14689: {'lr': 0.00019999425788762954, 'samples': 470048, 'steps': 918, 'loss/train': 3.1185264587402344} -09/20/2021 17:40:08 - INFO - __main__ - Step 14690: {'lr': 0.00019999425788762954, 'samples': 470080, 'steps': 918, 'loss/train': 3.5774085521698} -09/20/2021 17:40:08 - INFO - __main__ - Step 14691: {'lr': 0.00019999425788762954, 'samples': 470112, 'steps': 918, 'loss/train': 4.60957670211792} -09/20/2021 17:40:09 - INFO - __main__ - Step 14692: {'lr': 0.00019999425788762954, 'samples': 470144, 'steps': 918, 'loss/train': 4.683963298797607} -09/20/2021 17:40:10 - INFO - __main__ - Step 14693: {'lr': 0.00019999425788762954, 'samples': 470176, 'steps': 918, 'loss/train': 4.4314656257629395} -09/20/2021 17:40:11 - INFO - __main__ - Step 14694: {'lr': 0.00019999425788762954, 'samples': 470208, 'steps': 918, 'loss/train': 4.969517707824707} -09/20/2021 17:40:11 - INFO - __main__ - Step 14695: {'lr': 0.00019999425788762954, 'samples': 470240, 'steps': 918, 'loss/train': 3.0804152488708496} -09/20/2021 17:40:12 - INFO - __main__ - Step 14696: {'lr': 0.00019999425788762954, 'samples': 470272, 'steps': 918, 'loss/train': 4.523036956787109} -09/20/2021 17:40:13 - INFO - __main__ - Step 14697: {'lr': 0.00019999425788762954, 'samples': 470304, 'steps': 918, 'loss/train': 4.951265811920166} -09/20/2021 17:40:14 - INFO - __main__ - Step 14698: {'lr': 0.00019999425788762954, 'samples': 470336, 'steps': 918, 'loss/train': 3.716417074203491} -09/20/2021 17:40:14 - INFO - __main__ - Step 14699: {'lr': 0.00019999425788762954, 'samples': 470368, 'steps': 918, 'loss/train': 3.6824653148651123} -09/20/2021 17:40:15 - INFO - __main__ - Step 14700: {'lr': 0.00019999425788762954, 'samples': 470400, 'steps': 918, 'loss/train': 3.727421522140503} -09/20/2021 17:40:16 - INFO - __main__ - Step 14701: {'lr': 0.00019999425788762954, 'samples': 470432, 'steps': 918, 'loss/train': 4.204041957855225} -09/20/2021 17:40:17 - INFO - __main__ - Step 14702: {'lr': 0.00019999425788762954, 'samples': 470464, 'steps': 918, 'loss/train': 3.8032517433166504} -09/20/2021 17:40:18 - INFO - __main__ - Step 14703: {'lr': 0.00019999425788762954, 'samples': 470496, 'steps': 918, 'loss/train': 2.8659892082214355} -09/20/2021 17:40:19 - INFO - __main__ - Step 14704: {'lr': 0.00019999425788762954, 'samples': 470528, 'steps': 918, 'loss/train': 4.040616512298584} -09/20/2021 17:40:20 - INFO - __main__ - Step 14705: {'lr': 0.00019999418932636507, 'samples': 470560, 'steps': 919, 'loss/train': 3.525907278060913} -09/20/2021 17:40:20 - INFO - __main__ - Step 14706: {'lr': 0.00019999418932636507, 'samples': 470592, 'steps': 919, 'loss/train': 3.538576602935791} -09/20/2021 17:40:21 - INFO - __main__ - Step 14707: {'lr': 0.00019999418932636507, 'samples': 470624, 'steps': 919, 'loss/train': 3.539547920227051} -09/20/2021 17:40:22 - INFO - __main__ - Step 14708: {'lr': 0.00019999418932636507, 'samples': 470656, 'steps': 919, 'loss/train': 3.666938543319702} -09/20/2021 17:40:23 - INFO - __main__ - Step 14709: {'lr': 0.00019999418932636507, 'samples': 470688, 'steps': 919, 'loss/train': 4.689937114715576} -09/20/2021 17:40:23 - INFO - __main__ - Step 14710: {'lr': 0.00019999418932636507, 'samples': 470720, 'steps': 919, 'loss/train': 3.7508645057678223} -09/20/2021 17:40:24 - INFO - __main__ - Step 14711: {'lr': 0.00019999418932636507, 'samples': 470752, 'steps': 919, 'loss/train': 3.5235259532928467} -09/20/2021 17:40:25 - INFO - __main__ - Step 14712: {'lr': 0.00019999418932636507, 'samples': 470784, 'steps': 919, 'loss/train': 4.00644588470459} -09/20/2021 17:40:26 - INFO - __main__ - Step 14713: {'lr': 0.00019999418932636507, 'samples': 470816, 'steps': 919, 'loss/train': 4.014239311218262} -09/20/2021 17:40:26 - INFO - __main__ - Step 14714: {'lr': 0.00019999418932636507, 'samples': 470848, 'steps': 919, 'loss/train': 4.6989617347717285} -09/20/2021 17:40:27 - INFO - __main__ - Step 14715: {'lr': 0.00019999418932636507, 'samples': 470880, 'steps': 919, 'loss/train': 4.079406261444092} -09/20/2021 17:40:28 - INFO - __main__ - Step 14716: {'lr': 0.00019999418932636507, 'samples': 470912, 'steps': 919, 'loss/train': 3.7870047092437744} -09/20/2021 17:40:29 - INFO - __main__ - Step 14717: {'lr': 0.00019999418932636507, 'samples': 470944, 'steps': 919, 'loss/train': 3.035217523574829} -09/20/2021 17:40:29 - INFO - __main__ - Step 14718: {'lr': 0.00019999418932636507, 'samples': 470976, 'steps': 919, 'loss/train': 3.9783337116241455} -09/20/2021 17:40:30 - INFO - __main__ - Step 14719: {'lr': 0.00019999418932636507, 'samples': 471008, 'steps': 919, 'loss/train': 3.2537224292755127} -09/20/2021 17:40:31 - INFO - __main__ - Step 14720: {'lr': 0.00019999418932636507, 'samples': 471040, 'steps': 919, 'loss/train': 3.6646900177001953} -09/20/2021 17:40:32 - INFO - __main__ - Step 14721: {'lr': 0.00019999412035822463, 'samples': 471072, 'steps': 920, 'loss/train': 2.8926937580108643} -09/20/2021 17:40:33 - INFO - __main__ - Step 14722: {'lr': 0.00019999412035822463, 'samples': 471104, 'steps': 920, 'loss/train': 3.661036729812622} -09/20/2021 17:40:33 - INFO - __main__ - Step 14723: {'lr': 0.00019999412035822463, 'samples': 471136, 'steps': 920, 'loss/train': 4.082695484161377} -09/20/2021 17:40:34 - INFO - __main__ - Step 14724: {'lr': 0.00019999412035822463, 'samples': 471168, 'steps': 920, 'loss/train': 4.242680072784424} -09/20/2021 17:40:35 - INFO - __main__ - Step 14725: {'lr': 0.00019999412035822463, 'samples': 471200, 'steps': 920, 'loss/train': 3.1546027660369873} -09/20/2021 17:40:36 - INFO - __main__ - Step 14726: {'lr': 0.00019999412035822463, 'samples': 471232, 'steps': 920, 'loss/train': 3.9251961708068848} -09/20/2021 17:40:36 - INFO - __main__ - Step 14727: {'lr': 0.00019999412035822463, 'samples': 471264, 'steps': 920, 'loss/train': 3.350761651992798} -09/20/2021 17:40:37 - INFO - __main__ - Step 14728: {'lr': 0.00019999412035822463, 'samples': 471296, 'steps': 920, 'loss/train': 3.886363983154297} -09/20/2021 17:40:38 - INFO - __main__ - Step 14729: {'lr': 0.00019999412035822463, 'samples': 471328, 'steps': 920, 'loss/train': 5.549525260925293} -09/20/2021 17:40:39 - INFO - __main__ - Step 14730: {'lr': 0.00019999412035822463, 'samples': 471360, 'steps': 920, 'loss/train': 3.579272508621216} -09/20/2021 17:40:39 - INFO - __main__ - Step 14731: {'lr': 0.00019999412035822463, 'samples': 471392, 'steps': 920, 'loss/train': 3.6838669776916504} -09/20/2021 17:40:40 - INFO - __main__ - Step 14732: {'lr': 0.00019999412035822463, 'samples': 471424, 'steps': 920, 'loss/train': 3.983819007873535} -09/20/2021 17:40:41 - INFO - __main__ - Step 14733: {'lr': 0.00019999412035822463, 'samples': 471456, 'steps': 920, 'loss/train': 3.1176860332489014} -09/20/2021 17:40:42 - INFO - __main__ - Step 14734: {'lr': 0.00019999412035822463, 'samples': 471488, 'steps': 920, 'loss/train': 4.298069000244141} -09/20/2021 17:40:43 - INFO - __main__ - Step 14735: {'lr': 0.00019999412035822463, 'samples': 471520, 'steps': 920, 'loss/train': 4.382990837097168} -09/20/2021 17:40:44 - INFO - __main__ - Step 14736: {'lr': 0.00019999412035822463, 'samples': 471552, 'steps': 920, 'loss/train': 3.5047221183776855} -09/20/2021 17:40:45 - INFO - __main__ - Step 14737: {'lr': 0.0001999940509832085, 'samples': 471584, 'steps': 921, 'loss/train': 6.239818096160889} -09/20/2021 17:40:45 - INFO - __main__ - Step 14738: {'lr': 0.0001999940509832085, 'samples': 471616, 'steps': 921, 'loss/train': 3.70766282081604} -09/20/2021 17:40:46 - INFO - __main__ - Step 14739: {'lr': 0.0001999940509832085, 'samples': 471648, 'steps': 921, 'loss/train': 4.038074493408203} -09/20/2021 17:40:47 - INFO - __main__ - Step 14740: {'lr': 0.0001999940509832085, 'samples': 471680, 'steps': 921, 'loss/train': 4.146382808685303} -09/20/2021 17:40:48 - INFO - __main__ - Step 14741: {'lr': 0.0001999940509832085, 'samples': 471712, 'steps': 921, 'loss/train': 3.5727388858795166} -09/20/2021 17:40:48 - INFO - __main__ - Step 14742: {'lr': 0.0001999940509832085, 'samples': 471744, 'steps': 921, 'loss/train': 4.644150733947754} -09/20/2021 17:40:49 - INFO - __main__ - Step 14743: {'lr': 0.0001999940509832085, 'samples': 471776, 'steps': 921, 'loss/train': 2.2829668521881104} -09/20/2021 17:40:50 - INFO - __main__ - Step 14744: {'lr': 0.0001999940509832085, 'samples': 471808, 'steps': 921, 'loss/train': 4.1634602546691895} -09/20/2021 17:40:51 - INFO - __main__ - Step 14745: {'lr': 0.0001999940509832085, 'samples': 471840, 'steps': 921, 'loss/train': 4.651848793029785} -09/20/2021 17:40:51 - INFO - __main__ - Step 14746: {'lr': 0.0001999940509832085, 'samples': 471872, 'steps': 921, 'loss/train': 1.9962406158447266} -09/20/2021 17:40:52 - INFO - __main__ - Step 14747: {'lr': 0.0001999940509832085, 'samples': 471904, 'steps': 921, 'loss/train': 3.493278980255127} -09/20/2021 17:40:53 - INFO - __main__ - Step 14748: {'lr': 0.0001999940509832085, 'samples': 471936, 'steps': 921, 'loss/train': 2.47981333732605} -09/20/2021 17:40:54 - INFO - __main__ - Step 14749: {'lr': 0.0001999940509832085, 'samples': 471968, 'steps': 921, 'loss/train': 3.00272798538208} -09/20/2021 17:40:54 - INFO - __main__ - Step 14750: {'lr': 0.0001999940509832085, 'samples': 472000, 'steps': 921, 'loss/train': 3.1890413761138916} -09/20/2021 17:40:55 - INFO - __main__ - Step 14751: {'lr': 0.0001999940509832085, 'samples': 472032, 'steps': 921, 'loss/train': 3.59834361076355} -09/20/2021 17:40:56 - INFO - __main__ - Step 14752: {'lr': 0.0001999940509832085, 'samples': 472064, 'steps': 921, 'loss/train': 3.8705947399139404} -09/20/2021 17:40:57 - INFO - __main__ - Step 14753: {'lr': 0.00019999398120131695, 'samples': 472096, 'steps': 922, 'loss/train': 1.2573144435882568} -09/20/2021 17:40:57 - INFO - __main__ - Step 14754: {'lr': 0.00019999398120131695, 'samples': 472128, 'steps': 922, 'loss/train': 5.073368072509766} -09/20/2021 17:40:58 - INFO - __main__ - Step 14755: {'lr': 0.00019999398120131695, 'samples': 472160, 'steps': 922, 'loss/train': 3.0564682483673096} -09/20/2021 17:40:59 - INFO - __main__ - Step 14756: {'lr': 0.00019999398120131695, 'samples': 472192, 'steps': 922, 'loss/train': 3.5265309810638428} -09/20/2021 17:41:00 - INFO - __main__ - Step 14757: {'lr': 0.00019999398120131695, 'samples': 472224, 'steps': 922, 'loss/train': 3.706831455230713} -09/20/2021 17:41:00 - INFO - __main__ - Step 14758: {'lr': 0.00019999398120131695, 'samples': 472256, 'steps': 922, 'loss/train': 2.8620922565460205} -09/20/2021 17:41:01 - INFO - __main__ - Step 14759: {'lr': 0.00019999398120131695, 'samples': 472288, 'steps': 922, 'loss/train': 3.7208092212677} -09/20/2021 17:41:02 - INFO - __main__ - Step 14760: {'lr': 0.00019999398120131695, 'samples': 472320, 'steps': 922, 'loss/train': 3.9770607948303223} -09/20/2021 17:41:03 - INFO - __main__ - Step 14761: {'lr': 0.00019999398120131695, 'samples': 472352, 'steps': 922, 'loss/train': 3.8587114810943604} -09/20/2021 17:41:03 - INFO - __main__ - Step 14762: {'lr': 0.00019999398120131695, 'samples': 472384, 'steps': 922, 'loss/train': 5.027976989746094} -09/20/2021 17:41:05 - INFO - __main__ - Step 14763: {'lr': 0.00019999398120131695, 'samples': 472416, 'steps': 922, 'loss/train': 4.443924427032471} -09/20/2021 17:41:05 - INFO - __main__ - Step 14764: {'lr': 0.00019999398120131695, 'samples': 472448, 'steps': 922, 'loss/train': 5.364899158477783} -09/20/2021 17:41:06 - INFO - __main__ - Step 14765: {'lr': 0.00019999398120131695, 'samples': 472480, 'steps': 922, 'loss/train': 3.7052457332611084} -09/20/2021 17:41:07 - INFO - __main__ - Step 14766: {'lr': 0.00019999398120131695, 'samples': 472512, 'steps': 922, 'loss/train': 3.5141375064849854} -09/20/2021 17:41:08 - INFO - __main__ - Step 14767: {'lr': 0.00019999398120131695, 'samples': 472544, 'steps': 922, 'loss/train': 5.222323417663574} -09/20/2021 17:41:08 - INFO - __main__ - Step 14768: {'lr': 0.00019999398120131695, 'samples': 472576, 'steps': 922, 'loss/train': 4.241465091705322} -09/20/2021 17:41:09 - INFO - __main__ - Step 14769: {'lr': 0.00019999391101255034, 'samples': 472608, 'steps': 923, 'loss/train': 4.207173824310303} -09/20/2021 17:41:10 - INFO - __main__ - Step 14770: {'lr': 0.00019999391101255034, 'samples': 472640, 'steps': 923, 'loss/train': 3.815542697906494} -09/20/2021 17:41:11 - INFO - __main__ - Step 14771: {'lr': 0.00019999391101255034, 'samples': 472672, 'steps': 923, 'loss/train': 4.787763595581055} -09/20/2021 17:41:12 - INFO - __main__ - Step 14772: {'lr': 0.00019999391101255034, 'samples': 472704, 'steps': 923, 'loss/train': 4.190427303314209} -09/20/2021 17:41:12 - INFO - __main__ - Step 14773: {'lr': 0.00019999391101255034, 'samples': 472736, 'steps': 923, 'loss/train': 4.374410629272461} -09/20/2021 17:41:13 - INFO - __main__ - Step 14774: {'lr': 0.00019999391101255034, 'samples': 472768, 'steps': 923, 'loss/train': 4.627283573150635} -09/20/2021 17:41:14 - INFO - __main__ - Step 14775: {'lr': 0.00019999391101255034, 'samples': 472800, 'steps': 923, 'loss/train': 3.934094190597534} -09/20/2021 17:41:15 - INFO - __main__ - Step 14776: {'lr': 0.00019999391101255034, 'samples': 472832, 'steps': 923, 'loss/train': 4.312780857086182} -09/20/2021 17:41:15 - INFO - __main__ - Step 14777: {'lr': 0.00019999391101255034, 'samples': 472864, 'steps': 923, 'loss/train': 4.612746238708496} -09/20/2021 17:41:16 - INFO - __main__ - Step 14778: {'lr': 0.00019999391101255034, 'samples': 472896, 'steps': 923, 'loss/train': 3.169797897338867} -09/20/2021 17:41:17 - INFO - __main__ - Step 14779: {'lr': 0.00019999391101255034, 'samples': 472928, 'steps': 923, 'loss/train': 4.034718036651611} -09/20/2021 17:41:18 - INFO - __main__ - Step 14780: {'lr': 0.00019999391101255034, 'samples': 472960, 'steps': 923, 'loss/train': 4.639209747314453} -09/20/2021 17:41:18 - INFO - __main__ - Step 14781: {'lr': 0.00019999391101255034, 'samples': 472992, 'steps': 923, 'loss/train': 4.096138954162598} -09/20/2021 17:41:19 - INFO - __main__ - Step 14782: {'lr': 0.00019999391101255034, 'samples': 473024, 'steps': 923, 'loss/train': 3.7969367504119873} -09/20/2021 17:41:20 - INFO - __main__ - Step 14783: {'lr': 0.00019999391101255034, 'samples': 473056, 'steps': 923, 'loss/train': 3.718031883239746} -09/20/2021 17:41:21 - INFO - __main__ - Step 14784: {'lr': 0.00019999391101255034, 'samples': 473088, 'steps': 923, 'loss/train': 4.153254508972168} -09/20/2021 17:41:21 - INFO - __main__ - Step 14785: {'lr': 0.00019999384041690882, 'samples': 473120, 'steps': 924, 'loss/train': 3.704923152923584} -09/20/2021 17:41:22 - INFO - __main__ - Step 14786: {'lr': 0.00019999384041690882, 'samples': 473152, 'steps': 924, 'loss/train': 4.47373628616333} -09/20/2021 17:41:23 - INFO - __main__ - Step 14787: {'lr': 0.00019999384041690882, 'samples': 473184, 'steps': 924, 'loss/train': 3.443143129348755} -09/20/2021 17:41:24 - INFO - __main__ - Step 14788: {'lr': 0.00019999384041690882, 'samples': 473216, 'steps': 924, 'loss/train': 3.5606956481933594} -09/20/2021 17:41:24 - INFO - __main__ - Step 14789: {'lr': 0.00019999384041690882, 'samples': 473248, 'steps': 924, 'loss/train': 4.390476703643799} -09/20/2021 17:41:25 - INFO - __main__ - Step 14790: {'lr': 0.00019999384041690882, 'samples': 473280, 'steps': 924, 'loss/train': 3.106254816055298} -09/20/2021 17:41:26 - INFO - __main__ - Step 14791: {'lr': 0.00019999384041690882, 'samples': 473312, 'steps': 924, 'loss/train': 4.027798652648926} -09/20/2021 17:41:27 - INFO - __main__ - Step 14792: {'lr': 0.00019999384041690882, 'samples': 473344, 'steps': 924, 'loss/train': 3.977044105529785} -09/20/2021 17:41:28 - INFO - __main__ - Step 14793: {'lr': 0.00019999384041690882, 'samples': 473376, 'steps': 924, 'loss/train': 3.5621237754821777} -09/20/2021 17:41:29 - INFO - __main__ - Step 14794: {'lr': 0.00019999384041690882, 'samples': 473408, 'steps': 924, 'loss/train': 4.0142364501953125} -09/20/2021 17:41:30 - INFO - __main__ - Step 14795: {'lr': 0.00019999384041690882, 'samples': 473440, 'steps': 924, 'loss/train': 4.03265380859375} -09/20/2021 17:41:30 - INFO - __main__ - Step 14796: {'lr': 0.00019999384041690882, 'samples': 473472, 'steps': 924, 'loss/train': 3.452021837234497} -09/20/2021 17:41:31 - INFO - __main__ - Step 14797: {'lr': 0.00019999384041690882, 'samples': 473504, 'steps': 924, 'loss/train': 4.174952507019043} -09/20/2021 17:41:32 - INFO - __main__ - Step 14798: {'lr': 0.00019999384041690882, 'samples': 473536, 'steps': 924, 'loss/train': 2.0985617637634277} -09/20/2021 17:41:33 - INFO - __main__ - Step 14799: {'lr': 0.00019999384041690882, 'samples': 473568, 'steps': 924, 'loss/train': 2.926701784133911} -09/20/2021 17:41:33 - INFO - __main__ - Step 14800: {'lr': 0.00019999384041690882, 'samples': 473600, 'steps': 924, 'loss/train': 3.5102131366729736} -09/20/2021 17:41:34 - INFO - __main__ - Step 14801: {'lr': 0.0001999937694143928, 'samples': 473632, 'steps': 925, 'loss/train': 3.5692942142486572} -09/20/2021 17:41:35 - INFO - __main__ - Step 14802: {'lr': 0.0001999937694143928, 'samples': 473664, 'steps': 925, 'loss/train': 4.382085800170898} -09/20/2021 17:41:36 - INFO - __main__ - Step 14803: {'lr': 0.0001999937694143928, 'samples': 473696, 'steps': 925, 'loss/train': 4.134748935699463} -09/20/2021 17:41:37 - INFO - __main__ - Step 14804: {'lr': 0.0001999937694143928, 'samples': 473728, 'steps': 925, 'loss/train': 4.214677810668945} -09/20/2021 17:41:37 - INFO - __main__ - Step 14805: {'lr': 0.0001999937694143928, 'samples': 473760, 'steps': 925, 'loss/train': 3.1546471118927} -09/20/2021 17:41:38 - INFO - __main__ - Step 14806: {'lr': 0.0001999937694143928, 'samples': 473792, 'steps': 925, 'loss/train': 4.251882553100586} -09/20/2021 17:41:39 - INFO - __main__ - Step 14807: {'lr': 0.0001999937694143928, 'samples': 473824, 'steps': 925, 'loss/train': 1.5994555950164795} -09/20/2021 17:41:40 - INFO - __main__ - Step 14808: {'lr': 0.0001999937694143928, 'samples': 473856, 'steps': 925, 'loss/train': 4.1342387199401855} -09/20/2021 17:41:40 - INFO - __main__ - Step 14809: {'lr': 0.0001999937694143928, 'samples': 473888, 'steps': 925, 'loss/train': 4.926196575164795} -09/20/2021 17:41:41 - INFO - __main__ - Step 14810: {'lr': 0.0001999937694143928, 'samples': 473920, 'steps': 925, 'loss/train': 3.649384021759033} -09/20/2021 17:41:42 - INFO - __main__ - Step 14811: {'lr': 0.0001999937694143928, 'samples': 473952, 'steps': 925, 'loss/train': 3.283642053604126} -09/20/2021 17:41:43 - INFO - __main__ - Step 14812: {'lr': 0.0001999937694143928, 'samples': 473984, 'steps': 925, 'loss/train': 3.7773683071136475} -09/20/2021 17:41:43 - INFO - __main__ - Step 14813: {'lr': 0.0001999937694143928, 'samples': 474016, 'steps': 925, 'loss/train': 3.0027871131896973} -09/20/2021 17:41:44 - INFO - __main__ - Step 14814: {'lr': 0.0001999937694143928, 'samples': 474048, 'steps': 925, 'loss/train': 4.19696044921875} -09/20/2021 17:41:45 - INFO - __main__ - Step 14815: {'lr': 0.0001999937694143928, 'samples': 474080, 'steps': 925, 'loss/train': 4.494161128997803} -09/20/2021 17:41:46 - INFO - __main__ - Step 14816: {'lr': 0.0001999937694143928, 'samples': 474112, 'steps': 925, 'loss/train': 3.69498348236084} -09/20/2021 17:41:46 - INFO - __main__ - Step 14817: {'lr': 0.00019999369800500252, 'samples': 474144, 'steps': 926, 'loss/train': 3.5104739665985107} -09/20/2021 17:41:47 - INFO - __main__ - Step 14818: {'lr': 0.00019999369800500252, 'samples': 474176, 'steps': 926, 'loss/train': 4.857038974761963} -09/20/2021 17:41:48 - INFO - __main__ - Step 14819: {'lr': 0.00019999369800500252, 'samples': 474208, 'steps': 926, 'loss/train': 4.297270774841309} -09/20/2021 17:41:49 - INFO - __main__ - Step 14820: {'lr': 0.00019999369800500252, 'samples': 474240, 'steps': 926, 'loss/train': 5.098450660705566} -09/20/2021 17:41:49 - INFO - __main__ - Step 14821: {'lr': 0.00019999369800500252, 'samples': 474272, 'steps': 926, 'loss/train': 4.372534275054932} -09/20/2021 17:41:50 - INFO - __main__ - Step 14822: {'lr': 0.00019999369800500252, 'samples': 474304, 'steps': 926, 'loss/train': 3.401204824447632} -09/20/2021 17:41:51 - INFO - __main__ - Step 14823: {'lr': 0.00019999369800500252, 'samples': 474336, 'steps': 926, 'loss/train': 0.8698886632919312} -09/20/2021 17:41:52 - INFO - __main__ - Step 14824: {'lr': 0.00019999369800500252, 'samples': 474368, 'steps': 926, 'loss/train': 0.982926070690155} -09/20/2021 17:41:53 - INFO - __main__ - Step 14825: {'lr': 0.00019999369800500252, 'samples': 474400, 'steps': 926, 'loss/train': 1.4091498851776123} -09/20/2021 17:41:54 - INFO - __main__ - Step 14826: {'lr': 0.00019999369800500252, 'samples': 474432, 'steps': 926, 'loss/train': 3.6061127185821533} -09/20/2021 17:41:54 - INFO - __main__ - Step 14827: {'lr': 0.00019999369800500252, 'samples': 474464, 'steps': 926, 'loss/train': 2.865992307662964} -09/20/2021 17:41:55 - INFO - __main__ - Step 14828: {'lr': 0.00019999369800500252, 'samples': 474496, 'steps': 926, 'loss/train': 3.1331331729888916} -09/20/2021 17:41:56 - INFO - __main__ - Step 14829: {'lr': 0.00019999369800500252, 'samples': 474528, 'steps': 926, 'loss/train': 4.202727794647217} -09/20/2021 17:41:57 - INFO - __main__ - Step 14830: {'lr': 0.00019999369800500252, 'samples': 474560, 'steps': 926, 'loss/train': 4.5180816650390625} -09/20/2021 17:41:57 - INFO - __main__ - Step 14831: {'lr': 0.00019999369800500252, 'samples': 474592, 'steps': 926, 'loss/train': 3.7902700901031494} -09/20/2021 17:41:58 - INFO - __main__ - Step 14832: {'lr': 0.00019999369800500252, 'samples': 474624, 'steps': 926, 'loss/train': 4.110168933868408} -09/20/2021 17:41:59 - INFO - __main__ - Step 14833: {'lr': 0.00019999362618873824, 'samples': 474656, 'steps': 927, 'loss/train': 4.138016223907471} -09/20/2021 17:42:00 - INFO - __main__ - Step 14834: {'lr': 0.00019999362618873824, 'samples': 474688, 'steps': 927, 'loss/train': 3.8407905101776123} -09/20/2021 17:42:01 - INFO - __main__ - Step 14835: {'lr': 0.00019999362618873824, 'samples': 474720, 'steps': 927, 'loss/train': 2.843038558959961} -09/20/2021 17:42:01 - INFO - __main__ - Step 14836: {'lr': 0.00019999362618873824, 'samples': 474752, 'steps': 927, 'loss/train': 2.8295352458953857} -09/20/2021 17:42:02 - INFO - __main__ - Step 14837: {'lr': 0.00019999362618873824, 'samples': 474784, 'steps': 927, 'loss/train': 3.9715850353240967} -09/20/2021 17:42:03 - INFO - __main__ - Step 14838: {'lr': 0.00019999362618873824, 'samples': 474816, 'steps': 927, 'loss/train': 3.350080966949463} -09/20/2021 17:42:04 - INFO - __main__ - Step 14839: {'lr': 0.00019999362618873824, 'samples': 474848, 'steps': 927, 'loss/train': 3.275994300842285} -09/20/2021 17:42:04 - INFO - __main__ - Step 14840: {'lr': 0.00019999362618873824, 'samples': 474880, 'steps': 927, 'loss/train': 4.798832416534424} -09/20/2021 17:42:05 - INFO - __main__ - Step 14841: {'lr': 0.00019999362618873824, 'samples': 474912, 'steps': 927, 'loss/train': 3.2009437084198} -09/20/2021 17:42:06 - INFO - __main__ - Step 14842: {'lr': 0.00019999362618873824, 'samples': 474944, 'steps': 927, 'loss/train': 4.589803695678711} -09/20/2021 17:42:07 - INFO - __main__ - Step 14843: {'lr': 0.00019999362618873824, 'samples': 474976, 'steps': 927, 'loss/train': 4.174758434295654} -09/20/2021 17:42:07 - INFO - __main__ - Step 14844: {'lr': 0.00019999362618873824, 'samples': 475008, 'steps': 927, 'loss/train': 3.838822841644287} -09/20/2021 17:42:08 - INFO - __main__ - Step 14845: {'lr': 0.00019999362618873824, 'samples': 475040, 'steps': 927, 'loss/train': 3.1625397205352783} -09/20/2021 17:42:09 - INFO - __main__ - Step 14846: {'lr': 0.00019999362618873824, 'samples': 475072, 'steps': 927, 'loss/train': 3.417228937149048} -09/20/2021 17:42:10 - INFO - __main__ - Step 14847: {'lr': 0.00019999362618873824, 'samples': 475104, 'steps': 927, 'loss/train': 4.083000183105469} -09/20/2021 17:42:10 - INFO - __main__ - Step 14848: {'lr': 0.00019999362618873824, 'samples': 475136, 'steps': 927, 'loss/train': 5.4976630210876465} -09/20/2021 17:42:11 - INFO - __main__ - Step 14849: {'lr': 0.00019999355396560031, 'samples': 475168, 'steps': 928, 'loss/train': 3.4192044734954834} -09/20/2021 17:42:12 - INFO - __main__ - Step 14850: {'lr': 0.00019999355396560031, 'samples': 475200, 'steps': 928, 'loss/train': 4.899316310882568} -09/20/2021 17:42:13 - INFO - __main__ - Step 14851: {'lr': 0.00019999355396560031, 'samples': 475232, 'steps': 928, 'loss/train': 3.8079910278320312} -09/20/2021 17:42:13 - INFO - __main__ - Step 14852: {'lr': 0.00019999355396560031, 'samples': 475264, 'steps': 928, 'loss/train': 3.7759506702423096} -09/20/2021 17:42:14 - INFO - __main__ - Step 14853: {'lr': 0.00019999355396560031, 'samples': 475296, 'steps': 928, 'loss/train': 3.4978933334350586} -09/20/2021 17:42:15 - INFO - __main__ - Step 14854: {'lr': 0.00019999355396560031, 'samples': 475328, 'steps': 928, 'loss/train': 3.507459878921509} -09/20/2021 17:42:16 - INFO - __main__ - Step 14855: {'lr': 0.00019999355396560031, 'samples': 475360, 'steps': 928, 'loss/train': 4.398745536804199} -09/20/2021 17:42:17 - INFO - __main__ - Step 14856: {'lr': 0.00019999355396560031, 'samples': 475392, 'steps': 928, 'loss/train': 3.100440263748169} -09/20/2021 17:42:18 - INFO - __main__ - Step 14857: {'lr': 0.00019999355396560031, 'samples': 475424, 'steps': 928, 'loss/train': 3.917088508605957} -09/20/2021 17:42:18 - INFO - __main__ - Step 14858: {'lr': 0.00019999355396560031, 'samples': 475456, 'steps': 928, 'loss/train': 4.253096103668213} -09/20/2021 17:42:19 - INFO - __main__ - Step 14859: {'lr': 0.00019999355396560031, 'samples': 475488, 'steps': 928, 'loss/train': 3.9235615730285645} -09/20/2021 17:42:20 - INFO - __main__ - Step 14860: {'lr': 0.00019999355396560031, 'samples': 475520, 'steps': 928, 'loss/train': 4.41342306137085} -09/20/2021 17:42:21 - INFO - __main__ - Step 14861: {'lr': 0.00019999355396560031, 'samples': 475552, 'steps': 928, 'loss/train': 3.8987622261047363} -09/20/2021 17:42:21 - INFO - __main__ - Step 14862: {'lr': 0.00019999355396560031, 'samples': 475584, 'steps': 928, 'loss/train': 3.3810276985168457} -09/20/2021 17:42:22 - INFO - __main__ - Step 14863: {'lr': 0.00019999355396560031, 'samples': 475616, 'steps': 928, 'loss/train': 4.404519081115723} -09/20/2021 17:42:23 - INFO - __main__ - Step 14864: {'lr': 0.00019999355396560031, 'samples': 475648, 'steps': 928, 'loss/train': 3.6459248065948486} -09/20/2021 17:42:24 - INFO - __main__ - Step 14865: {'lr': 0.000199993481335589, 'samples': 475680, 'steps': 929, 'loss/train': 3.6290152072906494} -09/20/2021 17:42:25 - INFO - __main__ - Step 14866: {'lr': 0.000199993481335589, 'samples': 475712, 'steps': 929, 'loss/train': 3.747356653213501} -09/20/2021 17:42:25 - INFO - __main__ - Step 14867: {'lr': 0.000199993481335589, 'samples': 475744, 'steps': 929, 'loss/train': 3.940779447555542} -09/20/2021 17:42:26 - INFO - __main__ - Step 14868: {'lr': 0.000199993481335589, 'samples': 475776, 'steps': 929, 'loss/train': 3.7092626094818115} -09/20/2021 17:42:27 - INFO - __main__ - Step 14869: {'lr': 0.000199993481335589, 'samples': 475808, 'steps': 929, 'loss/train': 3.579545259475708} -09/20/2021 17:42:28 - INFO - __main__ - Step 14870: {'lr': 0.000199993481335589, 'samples': 475840, 'steps': 929, 'loss/train': 4.596546649932861} -09/20/2021 17:42:28 - INFO - __main__ - Step 14871: {'lr': 0.000199993481335589, 'samples': 475872, 'steps': 929, 'loss/train': 4.130242824554443} -09/20/2021 17:42:29 - INFO - __main__ - Step 14872: {'lr': 0.000199993481335589, 'samples': 475904, 'steps': 929, 'loss/train': 3.768577814102173} -09/20/2021 17:42:30 - INFO - __main__ - Step 14873: {'lr': 0.000199993481335589, 'samples': 475936, 'steps': 929, 'loss/train': 3.915268898010254} -09/20/2021 17:42:31 - INFO - __main__ - Step 14874: {'lr': 0.000199993481335589, 'samples': 475968, 'steps': 929, 'loss/train': 3.1050937175750732} -09/20/2021 17:42:31 - INFO - __main__ - Step 14875: {'lr': 0.000199993481335589, 'samples': 476000, 'steps': 929, 'loss/train': 2.862633466720581} -09/20/2021 17:42:32 - INFO - __main__ - Step 14876: {'lr': 0.000199993481335589, 'samples': 476032, 'steps': 929, 'loss/train': 3.862276315689087} -09/20/2021 17:42:33 - INFO - __main__ - Step 14877: {'lr': 0.000199993481335589, 'samples': 476064, 'steps': 929, 'loss/train': 4.4577226638793945} -09/20/2021 17:42:34 - INFO - __main__ - Step 14878: {'lr': 0.000199993481335589, 'samples': 476096, 'steps': 929, 'loss/train': 4.391833305358887} -09/20/2021 17:42:34 - INFO - __main__ - Step 14879: {'lr': 0.000199993481335589, 'samples': 476128, 'steps': 929, 'loss/train': 4.463728904724121} -09/20/2021 17:42:35 - INFO - __main__ - Step 14880: {'lr': 0.000199993481335589, 'samples': 476160, 'steps': 929, 'loss/train': 3.409025192260742} -09/20/2021 17:42:36 - INFO - __main__ - Step 14881: {'lr': 0.0001999934082987046, 'samples': 476192, 'steps': 930, 'loss/train': 4.672584533691406} -09/20/2021 17:42:37 - INFO - __main__ - Step 14882: {'lr': 0.0001999934082987046, 'samples': 476224, 'steps': 930, 'loss/train': 4.2855305671691895} -09/20/2021 17:42:37 - INFO - __main__ - Step 14883: {'lr': 0.0001999934082987046, 'samples': 476256, 'steps': 930, 'loss/train': 3.7221333980560303} -09/20/2021 17:42:38 - INFO - __main__ - Step 14884: {'lr': 0.0001999934082987046, 'samples': 476288, 'steps': 930, 'loss/train': 3.9898459911346436} -09/20/2021 17:42:39 - INFO - __main__ - Step 14885: {'lr': 0.0001999934082987046, 'samples': 476320, 'steps': 930, 'loss/train': 3.153094530105591} -09/20/2021 17:42:41 - INFO - __main__ - Step 14886: {'lr': 0.0001999934082987046, 'samples': 476352, 'steps': 930, 'loss/train': 3.986494779586792} -09/20/2021 17:42:42 - INFO - __main__ - Step 14887: {'lr': 0.0001999934082987046, 'samples': 476384, 'steps': 930, 'loss/train': 7.433053016662598} -09/20/2021 17:42:42 - INFO - __main__ - Step 14888: {'lr': 0.0001999934082987046, 'samples': 476416, 'steps': 930, 'loss/train': 1.535020351409912} -09/20/2021 17:42:43 - INFO - __main__ - Step 14889: {'lr': 0.0001999934082987046, 'samples': 476448, 'steps': 930, 'loss/train': 4.019839763641357} -09/20/2021 17:42:44 - INFO - __main__ - Step 14890: {'lr': 0.0001999934082987046, 'samples': 476480, 'steps': 930, 'loss/train': 3.994732141494751} -09/20/2021 17:42:45 - INFO - __main__ - Step 14891: {'lr': 0.0001999934082987046, 'samples': 476512, 'steps': 930, 'loss/train': 3.786637306213379} -09/20/2021 17:42:45 - INFO - __main__ - Step 14892: {'lr': 0.0001999934082987046, 'samples': 476544, 'steps': 930, 'loss/train': 3.4348323345184326} -09/20/2021 17:42:46 - INFO - __main__ - Step 14893: {'lr': 0.0001999934082987046, 'samples': 476576, 'steps': 930, 'loss/train': 4.195120811462402} -09/20/2021 17:42:47 - INFO - __main__ - Step 14894: {'lr': 0.0001999934082987046, 'samples': 476608, 'steps': 930, 'loss/train': 3.5174386501312256} -09/20/2021 17:42:48 - INFO - __main__ - Step 14895: {'lr': 0.0001999934082987046, 'samples': 476640, 'steps': 930, 'loss/train': 4.444658279418945} -09/20/2021 17:42:48 - INFO - __main__ - Step 14896: {'lr': 0.0001999934082987046, 'samples': 476672, 'steps': 930, 'loss/train': 3.617379903793335} -09/20/2021 17:42:49 - INFO - __main__ - Step 14897: {'lr': 0.00019999333485494738, 'samples': 476704, 'steps': 931, 'loss/train': 2.70151424407959} -09/20/2021 17:42:50 - INFO - __main__ - Step 14898: {'lr': 0.00019999333485494738, 'samples': 476736, 'steps': 931, 'loss/train': 3.4582366943359375} -09/20/2021 17:42:51 - INFO - __main__ - Step 14899: {'lr': 0.00019999333485494738, 'samples': 476768, 'steps': 931, 'loss/train': 3.5242912769317627} -09/20/2021 17:42:52 - INFO - __main__ - Step 14900: {'lr': 0.00019999333485494738, 'samples': 476800, 'steps': 931, 'loss/train': 3.4609756469726562} -09/20/2021 17:42:52 - INFO - __main__ - Step 14901: {'lr': 0.00019999333485494738, 'samples': 476832, 'steps': 931, 'loss/train': 4.020810604095459} -09/20/2021 17:42:53 - INFO - __main__ - Step 14902: {'lr': 0.00019999333485494738, 'samples': 476864, 'steps': 931, 'loss/train': 3.516003131866455} -09/20/2021 17:42:54 - INFO - __main__ - Step 14903: {'lr': 0.00019999333485494738, 'samples': 476896, 'steps': 931, 'loss/train': 3.5767743587493896} -09/20/2021 17:42:55 - INFO - __main__ - Step 14904: {'lr': 0.00019999333485494738, 'samples': 476928, 'steps': 931, 'loss/train': 4.603180885314941} -09/20/2021 17:42:55 - INFO - __main__ - Step 14905: {'lr': 0.00019999333485494738, 'samples': 476960, 'steps': 931, 'loss/train': 2.970198631286621} -09/20/2021 17:42:56 - INFO - __main__ - Step 14906: {'lr': 0.00019999333485494738, 'samples': 476992, 'steps': 931, 'loss/train': 3.9111998081207275} -09/20/2021 17:42:57 - INFO - __main__ - Step 14907: {'lr': 0.00019999333485494738, 'samples': 477024, 'steps': 931, 'loss/train': 4.240096569061279} -09/20/2021 17:42:58 - INFO - __main__ - Step 14908: {'lr': 0.00019999333485494738, 'samples': 477056, 'steps': 931, 'loss/train': 1.4329185485839844} -09/20/2021 17:42:58 - INFO - __main__ - Step 14909: {'lr': 0.00019999333485494738, 'samples': 477088, 'steps': 931, 'loss/train': 4.2575178146362305} -09/20/2021 17:42:59 - INFO - __main__ - Step 14910: {'lr': 0.00019999333485494738, 'samples': 477120, 'steps': 931, 'loss/train': 4.93565559387207} -09/20/2021 17:43:00 - INFO - __main__ - Step 14911: {'lr': 0.00019999333485494738, 'samples': 477152, 'steps': 931, 'loss/train': 4.084084510803223} -09/20/2021 17:43:01 - INFO - __main__ - Step 14912: {'lr': 0.00019999333485494738, 'samples': 477184, 'steps': 931, 'loss/train': 2.7918009757995605} -09/20/2021 17:43:01 - INFO - __main__ - Step 14913: {'lr': 0.00019999326100431767, 'samples': 477216, 'steps': 932, 'loss/train': 1.563263177871704} -09/20/2021 17:43:02 - INFO - __main__ - Step 14914: {'lr': 0.00019999326100431767, 'samples': 477248, 'steps': 932, 'loss/train': 0.8828915357589722} -09/20/2021 17:43:03 - INFO - __main__ - Step 14915: {'lr': 0.00019999326100431767, 'samples': 477280, 'steps': 932, 'loss/train': 1.1361149549484253} -09/20/2021 17:43:04 - INFO - __main__ - Step 14916: {'lr': 0.00019999326100431767, 'samples': 477312, 'steps': 932, 'loss/train': 1.61184561252594} -09/20/2021 17:43:05 - INFO - __main__ - Step 14917: {'lr': 0.00019999326100431767, 'samples': 477344, 'steps': 932, 'loss/train': 0.8874145150184631} -09/20/2021 17:43:06 - INFO - __main__ - Step 14918: {'lr': 0.00019999326100431767, 'samples': 477376, 'steps': 932, 'loss/train': 3.303671360015869} -09/20/2021 17:43:06 - INFO - __main__ - Step 14919: {'lr': 0.00019999326100431767, 'samples': 477408, 'steps': 932, 'loss/train': 3.931899309158325} -09/20/2021 17:43:07 - INFO - __main__ - Step 14920: {'lr': 0.00019999326100431767, 'samples': 477440, 'steps': 932, 'loss/train': 4.784920692443848} -09/20/2021 17:43:08 - INFO - __main__ - Step 14921: {'lr': 0.00019999326100431767, 'samples': 477472, 'steps': 932, 'loss/train': 3.311018943786621} -09/20/2021 17:43:09 - INFO - __main__ - Step 14922: {'lr': 0.00019999326100431767, 'samples': 477504, 'steps': 932, 'loss/train': 1.718665599822998} -09/20/2021 17:43:09 - INFO - __main__ - Step 14923: {'lr': 0.00019999326100431767, 'samples': 477536, 'steps': 932, 'loss/train': 3.3582804203033447} -09/20/2021 17:43:10 - INFO - __main__ - Step 14924: {'lr': 0.00019999326100431767, 'samples': 477568, 'steps': 932, 'loss/train': 3.5253443717956543} -09/20/2021 17:43:11 - INFO - __main__ - Step 14925: {'lr': 0.00019999326100431767, 'samples': 477600, 'steps': 932, 'loss/train': 4.12693977355957} -09/20/2021 17:43:12 - INFO - __main__ - Step 14926: {'lr': 0.00019999326100431767, 'samples': 477632, 'steps': 932, 'loss/train': 3.895509958267212} -09/20/2021 17:43:12 - INFO - __main__ - Step 14927: {'lr': 0.00019999326100431767, 'samples': 477664, 'steps': 932, 'loss/train': 3.500168561935425} -09/20/2021 17:43:13 - INFO - __main__ - Step 14928: {'lr': 0.00019999326100431767, 'samples': 477696, 'steps': 932, 'loss/train': 0.8505412936210632} -09/20/2021 17:43:14 - INFO - __main__ - Step 14929: {'lr': 0.0001999931867468158, 'samples': 477728, 'steps': 933, 'loss/train': 3.36470627784729} -09/20/2021 17:43:15 - INFO - __main__ - Step 14930: {'lr': 0.0001999931867468158, 'samples': 477760, 'steps': 933, 'loss/train': 3.5732645988464355} -09/20/2021 17:43:16 - INFO - __main__ - Step 14931: {'lr': 0.0001999931867468158, 'samples': 477792, 'steps': 933, 'loss/train': 3.201462984085083} -09/20/2021 17:43:16 - INFO - __main__ - Step 14932: {'lr': 0.0001999931867468158, 'samples': 477824, 'steps': 933, 'loss/train': 3.3896918296813965} -09/20/2021 17:43:17 - INFO - __main__ - Step 14933: {'lr': 0.0001999931867468158, 'samples': 477856, 'steps': 933, 'loss/train': 3.6070821285247803} -09/20/2021 17:43:18 - INFO - __main__ - Step 14934: {'lr': 0.0001999931867468158, 'samples': 477888, 'steps': 933, 'loss/train': 3.9093177318573} -09/20/2021 17:43:19 - INFO - __main__ - Step 14935: {'lr': 0.0001999931867468158, 'samples': 477920, 'steps': 933, 'loss/train': 3.9014859199523926} -09/20/2021 17:43:19 - INFO - __main__ - Step 14936: {'lr': 0.0001999931867468158, 'samples': 477952, 'steps': 933, 'loss/train': 3.9002835750579834} -09/20/2021 17:43:20 - INFO - __main__ - Step 14937: {'lr': 0.0001999931867468158, 'samples': 477984, 'steps': 933, 'loss/train': 3.9194376468658447} -09/20/2021 17:43:21 - INFO - __main__ - Step 14938: {'lr': 0.0001999931867468158, 'samples': 478016, 'steps': 933, 'loss/train': 4.182638168334961} -09/20/2021 17:43:22 - INFO - __main__ - Step 14939: {'lr': 0.0001999931867468158, 'samples': 478048, 'steps': 933, 'loss/train': 3.233388900756836} -09/20/2021 17:43:22 - INFO - __main__ - Step 14940: {'lr': 0.0001999931867468158, 'samples': 478080, 'steps': 933, 'loss/train': 3.820080518722534} -09/20/2021 17:43:23 - INFO - __main__ - Step 14941: {'lr': 0.0001999931867468158, 'samples': 478112, 'steps': 933, 'loss/train': 3.9353113174438477} -09/20/2021 17:43:24 - INFO - __main__ - Step 14942: {'lr': 0.0001999931867468158, 'samples': 478144, 'steps': 933, 'loss/train': 3.9722185134887695} -09/20/2021 17:43:25 - INFO - __main__ - Step 14943: {'lr': 0.0001999931867468158, 'samples': 478176, 'steps': 933, 'loss/train': 3.5528311729431152} -09/20/2021 17:43:25 - INFO - __main__ - Step 14944: {'lr': 0.0001999931867468158, 'samples': 478208, 'steps': 933, 'loss/train': 3.893462657928467} -09/20/2021 17:43:26 - INFO - __main__ - Step 14945: {'lr': 0.00019999311208244205, 'samples': 478240, 'steps': 934, 'loss/train': 3.8748199939727783} -09/20/2021 17:43:27 - INFO - __main__ - Step 14946: {'lr': 0.00019999311208244205, 'samples': 478272, 'steps': 934, 'loss/train': 4.190334796905518} -09/20/2021 17:43:28 - INFO - __main__ - Step 14947: {'lr': 0.00019999311208244205, 'samples': 478304, 'steps': 934, 'loss/train': 4.304593563079834} -09/20/2021 17:43:28 - INFO - __main__ - Step 14948: {'lr': 0.00019999311208244205, 'samples': 478336, 'steps': 934, 'loss/train': 3.2389891147613525} -09/20/2021 17:43:30 - INFO - __main__ - Step 14949: {'lr': 0.00019999311208244205, 'samples': 478368, 'steps': 934, 'loss/train': 3.396214723587036} -09/20/2021 17:43:31 - INFO - __main__ - Step 14950: {'lr': 0.00019999311208244205, 'samples': 478400, 'steps': 934, 'loss/train': 3.3987276554107666} -09/20/2021 17:43:31 - INFO - __main__ - Step 14951: {'lr': 0.00019999311208244205, 'samples': 478432, 'steps': 934, 'loss/train': 4.032411098480225} -09/20/2021 17:43:32 - INFO - __main__ - Step 14952: {'lr': 0.00019999311208244205, 'samples': 478464, 'steps': 934, 'loss/train': 4.235344409942627} -09/20/2021 17:43:33 - INFO - __main__ - Step 14953: {'lr': 0.00019999311208244205, 'samples': 478496, 'steps': 934, 'loss/train': 4.137333393096924} -09/20/2021 17:43:34 - INFO - __main__ - Step 14954: {'lr': 0.00019999311208244205, 'samples': 478528, 'steps': 934, 'loss/train': 3.7190310955047607} -09/20/2021 17:43:34 - INFO - __main__ - Step 14955: {'lr': 0.00019999311208244205, 'samples': 478560, 'steps': 934, 'loss/train': 3.8309478759765625} -09/20/2021 17:43:35 - INFO - __main__ - Step 14956: {'lr': 0.00019999311208244205, 'samples': 478592, 'steps': 934, 'loss/train': 3.8112199306488037} -09/20/2021 17:43:36 - INFO - __main__ - Step 14957: {'lr': 0.00019999311208244205, 'samples': 478624, 'steps': 934, 'loss/train': 3.5102453231811523} -09/20/2021 17:43:37 - INFO - __main__ - Step 14958: {'lr': 0.00019999311208244205, 'samples': 478656, 'steps': 934, 'loss/train': 3.6711130142211914} -09/20/2021 17:43:37 - INFO - __main__ - Step 14959: {'lr': 0.00019999311208244205, 'samples': 478688, 'steps': 934, 'loss/train': 4.144901752471924} -09/20/2021 17:43:38 - INFO - __main__ - Step 14960: {'lr': 0.00019999311208244205, 'samples': 478720, 'steps': 934, 'loss/train': 3.8977363109588623} -09/20/2021 17:43:39 - INFO - __main__ - Step 14961: {'lr': 0.00019999303701119666, 'samples': 478752, 'steps': 935, 'loss/train': 3.2438251972198486} -09/20/2021 17:43:40 - INFO - __main__ - Step 14962: {'lr': 0.00019999303701119666, 'samples': 478784, 'steps': 935, 'loss/train': 4.02119255065918} -09/20/2021 17:43:40 - INFO - __main__ - Step 14963: {'lr': 0.00019999303701119666, 'samples': 478816, 'steps': 935, 'loss/train': 3.107450485229492} -09/20/2021 17:43:41 - INFO - __main__ - Step 14964: {'lr': 0.00019999303701119666, 'samples': 478848, 'steps': 935, 'loss/train': 4.540010452270508} -09/20/2021 17:43:42 - INFO - __main__ - Step 14965: {'lr': 0.00019999303701119666, 'samples': 478880, 'steps': 935, 'loss/train': 3.0901103019714355} -09/20/2021 17:43:43 - INFO - __main__ - Step 14966: {'lr': 0.00019999303701119666, 'samples': 478912, 'steps': 935, 'loss/train': 4.182144641876221} -09/20/2021 17:43:43 - INFO - __main__ - Step 14967: {'lr': 0.00019999303701119666, 'samples': 478944, 'steps': 935, 'loss/train': 4.238659381866455} -09/20/2021 17:43:44 - INFO - __main__ - Step 14968: {'lr': 0.00019999303701119666, 'samples': 478976, 'steps': 935, 'loss/train': 3.588758707046509} -09/20/2021 17:43:45 - INFO - __main__ - Step 14969: {'lr': 0.00019999303701119666, 'samples': 479008, 'steps': 935, 'loss/train': 3.843505859375} -09/20/2021 17:43:46 - INFO - __main__ - Step 14970: {'lr': 0.00019999303701119666, 'samples': 479040, 'steps': 935, 'loss/train': 4.040332794189453} -09/20/2021 17:43:46 - INFO - __main__ - Step 14971: {'lr': 0.00019999303701119666, 'samples': 479072, 'steps': 935, 'loss/train': 3.0481550693511963} -09/20/2021 17:43:47 - INFO - __main__ - Step 14972: {'lr': 0.00019999303701119666, 'samples': 479104, 'steps': 935, 'loss/train': 3.4698503017425537} -09/20/2021 17:43:48 - INFO - __main__ - Step 14973: {'lr': 0.00019999303701119666, 'samples': 479136, 'steps': 935, 'loss/train': 3.919300079345703} -09/20/2021 17:43:49 - INFO - __main__ - Step 14974: {'lr': 0.00019999303701119666, 'samples': 479168, 'steps': 935, 'loss/train': 5.568083763122559} -09/20/2021 17:43:49 - INFO - __main__ - Step 14975: {'lr': 0.00019999303701119666, 'samples': 479200, 'steps': 935, 'loss/train': 4.151995658874512} -09/20/2021 17:43:50 - INFO - __main__ - Step 14976: {'lr': 0.00019999303701119666, 'samples': 479232, 'steps': 935, 'loss/train': 3.1670119762420654} -09/20/2021 17:43:51 - INFO - __main__ - Step 14977: {'lr': 0.00019999296153308004, 'samples': 479264, 'steps': 936, 'loss/train': 2.7973248958587646} -09/20/2021 17:43:52 - INFO - __main__ - Step 14978: {'lr': 0.00019999296153308004, 'samples': 479296, 'steps': 936, 'loss/train': 2.7121875286102295} -09/20/2021 17:43:53 - INFO - __main__ - Step 14979: {'lr': 0.00019999296153308004, 'samples': 479328, 'steps': 936, 'loss/train': 2.2648138999938965} -09/20/2021 17:43:54 - INFO - __main__ - Step 14980: {'lr': 0.00019999296153308004, 'samples': 479360, 'steps': 936, 'loss/train': 3.390758752822876} -09/20/2021 17:43:55 - INFO - __main__ - Step 14981: {'lr': 0.00019999296153308004, 'samples': 479392, 'steps': 936, 'loss/train': 4.402124881744385} -09/20/2021 17:43:55 - INFO - __main__ - Step 14982: {'lr': 0.00019999296153308004, 'samples': 479424, 'steps': 936, 'loss/train': 3.6164703369140625} -09/20/2021 17:43:56 - INFO - __main__ - Step 14983: {'lr': 0.00019999296153308004, 'samples': 479456, 'steps': 936, 'loss/train': 4.928025245666504} -09/20/2021 17:43:57 - INFO - __main__ - Step 14984: {'lr': 0.00019999296153308004, 'samples': 479488, 'steps': 936, 'loss/train': 3.326127290725708} -09/20/2021 17:43:58 - INFO - __main__ - Step 14985: {'lr': 0.00019999296153308004, 'samples': 479520, 'steps': 936, 'loss/train': 3.9613277912139893} -09/20/2021 17:43:58 - INFO - __main__ - Step 14986: {'lr': 0.00019999296153308004, 'samples': 479552, 'steps': 936, 'loss/train': 3.548144578933716} -09/20/2021 17:43:59 - INFO - __main__ - Step 14987: {'lr': 0.00019999296153308004, 'samples': 479584, 'steps': 936, 'loss/train': 4.597811698913574} -09/20/2021 17:44:00 - INFO - __main__ - Step 14988: {'lr': 0.00019999296153308004, 'samples': 479616, 'steps': 936, 'loss/train': 3.684746265411377} -09/20/2021 17:44:01 - INFO - __main__ - Step 14989: {'lr': 0.00019999296153308004, 'samples': 479648, 'steps': 936, 'loss/train': 3.59025239944458} -09/20/2021 17:44:01 - INFO - __main__ - Step 14990: {'lr': 0.00019999296153308004, 'samples': 479680, 'steps': 936, 'loss/train': 3.080814838409424} -09/20/2021 17:44:02 - INFO - __main__ - Step 14991: {'lr': 0.00019999296153308004, 'samples': 479712, 'steps': 936, 'loss/train': 4.175645351409912} -09/20/2021 17:44:03 - INFO - __main__ - Step 14992: {'lr': 0.00019999296153308004, 'samples': 479744, 'steps': 936, 'loss/train': 4.320689678192139} -09/20/2021 17:44:04 - INFO - __main__ - Step 14993: {'lr': 0.00019999288564809243, 'samples': 479776, 'steps': 937, 'loss/train': 4.425957202911377} -09/20/2021 17:44:04 - INFO - __main__ - Step 14994: {'lr': 0.00019999288564809243, 'samples': 479808, 'steps': 937, 'loss/train': 3.4705052375793457} -09/20/2021 17:44:05 - INFO - __main__ - Step 14995: {'lr': 0.00019999288564809243, 'samples': 479840, 'steps': 937, 'loss/train': 3.4695656299591064} -09/20/2021 17:44:06 - INFO - __main__ - Step 14996: {'lr': 0.00019999288564809243, 'samples': 479872, 'steps': 937, 'loss/train': 3.9328811168670654} -09/20/2021 17:44:07 - INFO - __main__ - Step 14997: {'lr': 0.00019999288564809243, 'samples': 479904, 'steps': 937, 'loss/train': 3.5153648853302} -09/20/2021 17:44:07 - INFO - __main__ - Step 14998: {'lr': 0.00019999288564809243, 'samples': 479936, 'steps': 937, 'loss/train': 4.469745635986328} -09/20/2021 17:44:08 - INFO - __main__ - Step 14999: {'lr': 0.00019999288564809243, 'samples': 479968, 'steps': 937, 'loss/train': 3.3477678298950195} -09/20/2021 17:44:09 - INFO - __main__ - Step 15000: {'lr': 0.00019999288564809243, 'samples': 480000, 'steps': 937, 'loss/train': 4.234356880187988} -09/20/2021 17:44:10 - INFO - __main__ - Step 15001: {'lr': 0.00019999288564809243, 'samples': 480032, 'steps': 937, 'loss/train': 4.018489360809326} -09/20/2021 17:44:10 - INFO - __main__ - Step 15002: {'lr': 0.00019999288564809243, 'samples': 480064, 'steps': 937, 'loss/train': 4.281285285949707} -09/20/2021 17:44:11 - INFO - __main__ - Step 15003: {'lr': 0.00019999288564809243, 'samples': 480096, 'steps': 937, 'loss/train': 2.7608394622802734} -09/20/2021 17:44:12 - INFO - __main__ - Step 15004: {'lr': 0.00019999288564809243, 'samples': 480128, 'steps': 937, 'loss/train': 4.3059844970703125} -09/20/2021 17:44:13 - INFO - __main__ - Step 15005: {'lr': 0.00019999288564809243, 'samples': 480160, 'steps': 937, 'loss/train': 4.483016014099121} -09/20/2021 17:44:13 - INFO - __main__ - Step 15006: {'lr': 0.00019999288564809243, 'samples': 480192, 'steps': 937, 'loss/train': 4.201278209686279} -09/20/2021 17:44:14 - INFO - __main__ - Step 15007: {'lr': 0.00019999288564809243, 'samples': 480224, 'steps': 937, 'loss/train': 3.580564022064209} -09/20/2021 17:44:15 - INFO - __main__ - Step 15008: {'lr': 0.00019999288564809243, 'samples': 480256, 'steps': 937, 'loss/train': 3.932734251022339} -09/20/2021 17:44:16 - INFO - __main__ - Step 15009: {'lr': 0.00019999280935623418, 'samples': 480288, 'steps': 938, 'loss/train': 4.841139793395996} -09/20/2021 17:44:17 - INFO - __main__ - Step 15010: {'lr': 0.00019999280935623418, 'samples': 480320, 'steps': 938, 'loss/train': 4.761340618133545} -09/20/2021 17:44:18 - INFO - __main__ - Step 15011: {'lr': 0.00019999280935623418, 'samples': 480352, 'steps': 938, 'loss/train': 2.0485732555389404} -09/20/2021 17:44:19 - INFO - __main__ - Step 15012: {'lr': 0.00019999280935623418, 'samples': 480384, 'steps': 938, 'loss/train': 3.2909719944000244} -09/20/2021 17:44:20 - INFO - __main__ - Step 15013: {'lr': 0.00019999280935623418, 'samples': 480416, 'steps': 938, 'loss/train': 3.1982805728912354} -09/20/2021 17:44:20 - INFO - __main__ - Step 15014: {'lr': 0.00019999280935623418, 'samples': 480448, 'steps': 938, 'loss/train': 6.323996543884277} -09/20/2021 17:44:21 - INFO - __main__ - Step 15015: {'lr': 0.00019999280935623418, 'samples': 480480, 'steps': 938, 'loss/train': 3.85353684425354} -09/20/2021 17:44:22 - INFO - __main__ - Step 15016: {'lr': 0.00019999280935623418, 'samples': 480512, 'steps': 938, 'loss/train': 2.3108274936676025} -09/20/2021 17:44:23 - INFO - __main__ - Step 15017: {'lr': 0.00019999280935623418, 'samples': 480544, 'steps': 938, 'loss/train': 3.7762465476989746} -09/20/2021 17:44:23 - INFO - __main__ - Step 15018: {'lr': 0.00019999280935623418, 'samples': 480576, 'steps': 938, 'loss/train': 5.941010475158691} -09/20/2021 17:44:24 - INFO - __main__ - Step 15019: {'lr': 0.00019999280935623418, 'samples': 480608, 'steps': 938, 'loss/train': 3.430311441421509} -09/20/2021 17:44:25 - INFO - __main__ - Step 15020: {'lr': 0.00019999280935623418, 'samples': 480640, 'steps': 938, 'loss/train': 3.0564966201782227} -09/20/2021 17:44:26 - INFO - __main__ - Step 15021: {'lr': 0.00019999280935623418, 'samples': 480672, 'steps': 938, 'loss/train': 2.670713424682617} -09/20/2021 17:44:26 - INFO - __main__ - Step 15022: {'lr': 0.00019999280935623418, 'samples': 480704, 'steps': 938, 'loss/train': 4.542950630187988} -09/20/2021 17:44:27 - INFO - __main__ - Step 15023: {'lr': 0.00019999280935623418, 'samples': 480736, 'steps': 938, 'loss/train': 4.364436149597168} -09/20/2021 17:44:28 - INFO - __main__ - Step 15024: {'lr': 0.00019999280935623418, 'samples': 480768, 'steps': 938, 'loss/train': 3.01997971534729} -09/20/2021 17:44:29 - INFO - __main__ - Step 15025: {'lr': 0.00019999273265750554, 'samples': 480800, 'steps': 939, 'loss/train': 3.649960994720459} -09/20/2021 17:44:29 - INFO - __main__ - Step 15026: {'lr': 0.00019999273265750554, 'samples': 480832, 'steps': 939, 'loss/train': 3.776329755783081} -09/20/2021 17:44:30 - INFO - __main__ - Step 15027: {'lr': 0.00019999273265750554, 'samples': 480864, 'steps': 939, 'loss/train': 5.463622570037842} -09/20/2021 17:44:31 - INFO - __main__ - Step 15028: {'lr': 0.00019999273265750554, 'samples': 480896, 'steps': 939, 'loss/train': 4.034764289855957} -09/20/2021 17:44:32 - INFO - __main__ - Step 15029: {'lr': 0.00019999273265750554, 'samples': 480928, 'steps': 939, 'loss/train': 4.92642879486084} -09/20/2021 17:44:32 - INFO - __main__ - Step 15030: {'lr': 0.00019999273265750554, 'samples': 480960, 'steps': 939, 'loss/train': 3.4317500591278076} -09/20/2021 17:44:33 - INFO - __main__ - Step 15031: {'lr': 0.00019999273265750554, 'samples': 480992, 'steps': 939, 'loss/train': 3.719024181365967} -09/20/2021 17:44:34 - INFO - __main__ - Step 15032: {'lr': 0.00019999273265750554, 'samples': 481024, 'steps': 939, 'loss/train': 2.7306511402130127} -09/20/2021 17:44:35 - INFO - __main__ - Step 15033: {'lr': 0.00019999273265750554, 'samples': 481056, 'steps': 939, 'loss/train': 2.83971905708313} -09/20/2021 17:44:35 - INFO - __main__ - Step 15034: {'lr': 0.00019999273265750554, 'samples': 481088, 'steps': 939, 'loss/train': 2.623387098312378} -09/20/2021 17:44:36 - INFO - __main__ - Step 15035: {'lr': 0.00019999273265750554, 'samples': 481120, 'steps': 939, 'loss/train': 4.26571798324585} -09/20/2021 17:44:37 - INFO - __main__ - Step 15036: {'lr': 0.00019999273265750554, 'samples': 481152, 'steps': 939, 'loss/train': 3.1520233154296875} -09/20/2021 17:44:38 - INFO - __main__ - Step 15037: {'lr': 0.00019999273265750554, 'samples': 481184, 'steps': 939, 'loss/train': 3.7500174045562744} -09/20/2021 17:44:38 - INFO - __main__ - Step 15038: {'lr': 0.00019999273265750554, 'samples': 481216, 'steps': 939, 'loss/train': 3.738579034805298} -09/20/2021 17:44:39 - INFO - __main__ - Step 15039: {'lr': 0.00019999273265750554, 'samples': 481248, 'steps': 939, 'loss/train': 4.6358747482299805} -09/20/2021 17:44:40 - INFO - __main__ - Step 15040: {'lr': 0.00019999273265750554, 'samples': 481280, 'steps': 939, 'loss/train': 4.210331916809082} -09/20/2021 17:44:41 - INFO - __main__ - Step 15041: {'lr': 0.00019999265555190686, 'samples': 481312, 'steps': 940, 'loss/train': 3.4247846603393555} -09/20/2021 17:44:42 - INFO - __main__ - Step 15042: {'lr': 0.00019999265555190686, 'samples': 481344, 'steps': 940, 'loss/train': 3.884979724884033} -09/20/2021 17:44:43 - INFO - __main__ - Step 15043: {'lr': 0.00019999265555190686, 'samples': 481376, 'steps': 940, 'loss/train': 3.661370277404785} -09/20/2021 17:44:44 - INFO - __main__ - Step 15044: {'lr': 0.00019999265555190686, 'samples': 481408, 'steps': 940, 'loss/train': 3.9328112602233887} -09/20/2021 17:44:44 - INFO - __main__ - Step 15045: {'lr': 0.00019999265555190686, 'samples': 481440, 'steps': 940, 'loss/train': 3.2877159118652344} -09/20/2021 17:44:45 - INFO - __main__ - Step 15046: {'lr': 0.00019999265555190686, 'samples': 481472, 'steps': 940, 'loss/train': 4.239045143127441} -09/20/2021 17:44:46 - INFO - __main__ - Step 15047: {'lr': 0.00019999265555190686, 'samples': 481504, 'steps': 940, 'loss/train': 2.0830650329589844} -09/20/2021 17:44:47 - INFO - __main__ - Step 15048: {'lr': 0.00019999265555190686, 'samples': 481536, 'steps': 940, 'loss/train': 4.713620662689209} -09/20/2021 17:44:47 - INFO - __main__ - Step 15049: {'lr': 0.00019999265555190686, 'samples': 481568, 'steps': 940, 'loss/train': 4.753978729248047} -09/20/2021 17:44:48 - INFO - __main__ - Step 15050: {'lr': 0.00019999265555190686, 'samples': 481600, 'steps': 940, 'loss/train': 5.315863132476807} -09/20/2021 17:44:49 - INFO - __main__ - Step 15051: {'lr': 0.00019999265555190686, 'samples': 481632, 'steps': 940, 'loss/train': 4.718224048614502} -09/20/2021 17:44:50 - INFO - __main__ - Step 15052: {'lr': 0.00019999265555190686, 'samples': 481664, 'steps': 940, 'loss/train': 5.074258804321289} -09/20/2021 17:44:50 - INFO - __main__ - Step 15053: {'lr': 0.00019999265555190686, 'samples': 481696, 'steps': 940, 'loss/train': 0.8252530097961426} -09/20/2021 17:44:51 - INFO - __main__ - Step 15054: {'lr': 0.00019999265555190686, 'samples': 481728, 'steps': 940, 'loss/train': 1.0652590990066528} -09/20/2021 17:44:52 - INFO - __main__ - Step 15055: {'lr': 0.00019999265555190686, 'samples': 481760, 'steps': 940, 'loss/train': 1.00490140914917} -09/20/2021 17:44:53 - INFO - __main__ - Step 15056: {'lr': 0.00019999265555190686, 'samples': 481792, 'steps': 940, 'loss/train': 3.2333011627197266} -09/20/2021 17:44:54 - INFO - __main__ - Step 15057: {'lr': 0.00019999257803943846, 'samples': 481824, 'steps': 941, 'loss/train': 3.7706081867218018} -09/20/2021 17:44:54 - INFO - __main__ - Step 15058: {'lr': 0.00019999257803943846, 'samples': 481856, 'steps': 941, 'loss/train': 4.31318473815918} -09/20/2021 17:44:55 - INFO - __main__ - Step 15059: {'lr': 0.00019999257803943846, 'samples': 481888, 'steps': 941, 'loss/train': 4.625682353973389} -09/20/2021 17:44:56 - INFO - __main__ - Step 15060: {'lr': 0.00019999257803943846, 'samples': 481920, 'steps': 941, 'loss/train': 0.7383083701133728} -09/20/2021 17:44:57 - INFO - __main__ - Step 15061: {'lr': 0.00019999257803943846, 'samples': 481952, 'steps': 941, 'loss/train': 0.7637101411819458} -09/20/2021 17:44:57 - INFO - __main__ - Step 15062: {'lr': 0.00019999257803943846, 'samples': 481984, 'steps': 941, 'loss/train': 3.321723699569702} -09/20/2021 17:44:58 - INFO - __main__ - Step 15063: {'lr': 0.00019999257803943846, 'samples': 482016, 'steps': 941, 'loss/train': 4.094365119934082} -09/20/2021 17:44:59 - INFO - __main__ - Step 15064: {'lr': 0.00019999257803943846, 'samples': 482048, 'steps': 941, 'loss/train': 4.1443939208984375} -09/20/2021 17:45:00 - INFO - __main__ - Step 15065: {'lr': 0.00019999257803943846, 'samples': 482080, 'steps': 941, 'loss/train': 4.026381492614746} -09/20/2021 17:45:00 - INFO - __main__ - Step 15066: {'lr': 0.00019999257803943846, 'samples': 482112, 'steps': 941, 'loss/train': 1.3727058172225952} -09/20/2021 17:45:01 - INFO - __main__ - Step 15067: {'lr': 0.00019999257803943846, 'samples': 482144, 'steps': 941, 'loss/train': 3.5967395305633545} -09/20/2021 17:45:02 - INFO - __main__ - Step 15068: {'lr': 0.00019999257803943846, 'samples': 482176, 'steps': 941, 'loss/train': 4.029372215270996} -09/20/2021 17:45:03 - INFO - __main__ - Step 15069: {'lr': 0.00019999257803943846, 'samples': 482208, 'steps': 941, 'loss/train': 4.011352062225342} -09/20/2021 17:45:03 - INFO - __main__ - Step 15070: {'lr': 0.00019999257803943846, 'samples': 482240, 'steps': 941, 'loss/train': 4.30413293838501} -09/20/2021 17:45:04 - INFO - __main__ - Step 15071: {'lr': 0.00019999257803943846, 'samples': 482272, 'steps': 941, 'loss/train': 3.2049999237060547} -09/20/2021 17:45:05 - INFO - __main__ - Step 15072: {'lr': 0.00019999257803943846, 'samples': 482304, 'steps': 941, 'loss/train': 3.18133544921875} -09/20/2021 17:45:06 - INFO - __main__ - Step 15073: {'lr': 0.00019999250012010068, 'samples': 482336, 'steps': 942, 'loss/train': 3.6436586380004883} -09/20/2021 17:45:07 - INFO - __main__ - Step 15074: {'lr': 0.00019999250012010068, 'samples': 482368, 'steps': 942, 'loss/train': 2.9064273834228516} -09/20/2021 17:45:08 - INFO - __main__ - Step 15075: {'lr': 0.00019999250012010068, 'samples': 482400, 'steps': 942, 'loss/train': 3.6099658012390137} -09/20/2021 17:45:08 - INFO - __main__ - Step 15076: {'lr': 0.00019999250012010068, 'samples': 482432, 'steps': 942, 'loss/train': 3.7416319847106934} -09/20/2021 17:45:09 - INFO - __main__ - Step 15077: {'lr': 0.00019999250012010068, 'samples': 482464, 'steps': 942, 'loss/train': 3.6332204341888428} -09/20/2021 17:45:10 - INFO - __main__ - Step 15078: {'lr': 0.00019999250012010068, 'samples': 482496, 'steps': 942, 'loss/train': 3.9622888565063477} -09/20/2021 17:45:11 - INFO - __main__ - Step 15079: {'lr': 0.00019999250012010068, 'samples': 482528, 'steps': 942, 'loss/train': 3.171161413192749} -09/20/2021 17:45:11 - INFO - __main__ - Step 15080: {'lr': 0.00019999250012010068, 'samples': 482560, 'steps': 942, 'loss/train': 4.440806865692139} -09/20/2021 17:45:12 - INFO - __main__ - Step 15081: {'lr': 0.00019999250012010068, 'samples': 482592, 'steps': 942, 'loss/train': 3.583645820617676} -09/20/2021 17:45:13 - INFO - __main__ - Step 15082: {'lr': 0.00019999250012010068, 'samples': 482624, 'steps': 942, 'loss/train': 2.8209762573242188} -09/20/2021 17:45:14 - INFO - __main__ - Step 15083: {'lr': 0.00019999250012010068, 'samples': 482656, 'steps': 942, 'loss/train': 4.084691524505615} -09/20/2021 17:45:14 - INFO - __main__ - Step 15084: {'lr': 0.00019999250012010068, 'samples': 482688, 'steps': 942, 'loss/train': 3.919086456298828} -09/20/2021 17:45:15 - INFO - __main__ - Step 15085: {'lr': 0.00019999250012010068, 'samples': 482720, 'steps': 942, 'loss/train': 4.901786804199219} -09/20/2021 17:45:16 - INFO - __main__ - Step 15086: {'lr': 0.00019999250012010068, 'samples': 482752, 'steps': 942, 'loss/train': 3.7820515632629395} -09/20/2021 17:45:17 - INFO - __main__ - Step 15087: {'lr': 0.00019999250012010068, 'samples': 482784, 'steps': 942, 'loss/train': 3.9370241165161133} -09/20/2021 17:45:17 - INFO - __main__ - Step 15088: {'lr': 0.00019999250012010068, 'samples': 482816, 'steps': 942, 'loss/train': 3.9588842391967773} -09/20/2021 17:45:18 - INFO - __main__ - Step 15089: {'lr': 0.00019999242179389378, 'samples': 482848, 'steps': 943, 'loss/train': 3.733891487121582} -09/20/2021 17:45:19 - INFO - __main__ - Step 15090: {'lr': 0.00019999242179389378, 'samples': 482880, 'steps': 943, 'loss/train': 0.5259603261947632} -09/20/2021 17:45:20 - INFO - __main__ - Step 15091: {'lr': 0.00019999242179389378, 'samples': 482912, 'steps': 943, 'loss/train': 3.593528985977173} -09/20/2021 17:45:21 - INFO - __main__ - Step 15092: {'lr': 0.00019999242179389378, 'samples': 482944, 'steps': 943, 'loss/train': 3.1095378398895264} -09/20/2021 17:45:21 - INFO - __main__ - Step 15093: {'lr': 0.00019999242179389378, 'samples': 482976, 'steps': 943, 'loss/train': 3.6069090366363525} -09/20/2021 17:45:22 - INFO - __main__ - Step 15094: {'lr': 0.00019999242179389378, 'samples': 483008, 'steps': 943, 'loss/train': 3.2523062229156494} -09/20/2021 17:45:23 - INFO - __main__ - Step 15095: {'lr': 0.00019999242179389378, 'samples': 483040, 'steps': 943, 'loss/train': 4.183604717254639} -09/20/2021 17:45:24 - INFO - __main__ - Step 15096: {'lr': 0.00019999242179389378, 'samples': 483072, 'steps': 943, 'loss/train': 4.023453712463379} -09/20/2021 17:45:24 - INFO - __main__ - Step 15097: {'lr': 0.00019999242179389378, 'samples': 483104, 'steps': 943, 'loss/train': 3.8463640213012695} -09/20/2021 17:45:25 - INFO - __main__ - Step 15098: {'lr': 0.00019999242179389378, 'samples': 483136, 'steps': 943, 'loss/train': 3.7608535289764404} -09/20/2021 17:45:26 - INFO - __main__ - Step 15099: {'lr': 0.00019999242179389378, 'samples': 483168, 'steps': 943, 'loss/train': 4.367311000823975} -09/20/2021 17:45:27 - INFO - __main__ - Step 15100: {'lr': 0.00019999242179389378, 'samples': 483200, 'steps': 943, 'loss/train': 4.831721782684326} -09/20/2021 17:45:27 - INFO - __main__ - Step 15101: {'lr': 0.00019999242179389378, 'samples': 483232, 'steps': 943, 'loss/train': 3.5862419605255127} -09/20/2021 17:45:28 - INFO - __main__ - Step 15102: {'lr': 0.00019999242179389378, 'samples': 483264, 'steps': 943, 'loss/train': 5.158838272094727} -09/20/2021 17:45:29 - INFO - __main__ - Step 15103: {'lr': 0.00019999242179389378, 'samples': 483296, 'steps': 943, 'loss/train': 2.5214269161224365} -09/20/2021 17:45:30 - INFO - __main__ - Step 15104: {'lr': 0.00019999242179389378, 'samples': 483328, 'steps': 943, 'loss/train': 3.428450345993042} -09/20/2021 17:45:31 - INFO - __main__ - Step 15105: {'lr': 0.0001999923430608181, 'samples': 483360, 'steps': 944, 'loss/train': 3.6047964096069336} -09/20/2021 17:45:32 - INFO - __main__ - Step 15106: {'lr': 0.0001999923430608181, 'samples': 483392, 'steps': 944, 'loss/train': 0.6337105631828308} -09/20/2021 17:45:33 - INFO - __main__ - Step 15107: {'lr': 0.0001999923430608181, 'samples': 483424, 'steps': 944, 'loss/train': 3.744260311126709} -09/20/2021 17:45:33 - INFO - __main__ - Step 15108: {'lr': 0.0001999923430608181, 'samples': 483456, 'steps': 944, 'loss/train': 4.22861909866333} -09/20/2021 17:45:34 - INFO - __main__ - Step 15109: {'lr': 0.0001999923430608181, 'samples': 483488, 'steps': 944, 'loss/train': 3.8723063468933105} -09/20/2021 17:45:35 - INFO - __main__ - Step 15110: {'lr': 0.0001999923430608181, 'samples': 483520, 'steps': 944, 'loss/train': 0.8661887645721436} -09/20/2021 17:45:36 - INFO - __main__ - Step 15111: {'lr': 0.0001999923430608181, 'samples': 483552, 'steps': 944, 'loss/train': 0.8030769228935242} -09/20/2021 17:45:36 - INFO - __main__ - Step 15112: {'lr': 0.0001999923430608181, 'samples': 483584, 'steps': 944, 'loss/train': 3.293856382369995} -09/20/2021 17:45:37 - INFO - __main__ - Step 15113: {'lr': 0.0001999923430608181, 'samples': 483616, 'steps': 944, 'loss/train': 3.705028772354126} -09/20/2021 17:45:38 - INFO - __main__ - Step 15114: {'lr': 0.0001999923430608181, 'samples': 483648, 'steps': 944, 'loss/train': 2.381950616836548} -09/20/2021 17:45:39 - INFO - __main__ - Step 15115: {'lr': 0.0001999923430608181, 'samples': 483680, 'steps': 944, 'loss/train': 3.3133912086486816} -09/20/2021 17:45:39 - INFO - __main__ - Step 15116: {'lr': 0.0001999923430608181, 'samples': 483712, 'steps': 944, 'loss/train': 3.2817928791046143} -09/20/2021 17:45:40 - INFO - __main__ - Step 15117: {'lr': 0.0001999923430608181, 'samples': 483744, 'steps': 944, 'loss/train': 4.273379325866699} -09/20/2021 17:45:41 - INFO - __main__ - Step 15118: {'lr': 0.0001999923430608181, 'samples': 483776, 'steps': 944, 'loss/train': 3.271415948867798} -09/20/2021 17:45:42 - INFO - __main__ - Step 15119: {'lr': 0.0001999923430608181, 'samples': 483808, 'steps': 944, 'loss/train': 3.897298574447632} -09/20/2021 17:45:42 - INFO - __main__ - Step 15120: {'lr': 0.0001999923430608181, 'samples': 483840, 'steps': 944, 'loss/train': 3.4297525882720947} -09/20/2021 17:45:43 - INFO - __main__ - Step 15121: {'lr': 0.00019999226392087394, 'samples': 483872, 'steps': 945, 'loss/train': 4.033904075622559} -09/20/2021 17:45:44 - INFO - __main__ - Step 15122: {'lr': 0.00019999226392087394, 'samples': 483904, 'steps': 945, 'loss/train': 3.313122034072876} -09/20/2021 17:45:45 - INFO - __main__ - Step 15123: {'lr': 0.00019999226392087394, 'samples': 483936, 'steps': 945, 'loss/train': 4.248556613922119} -09/20/2021 17:45:45 - INFO - __main__ - Step 15124: {'lr': 0.00019999226392087394, 'samples': 483968, 'steps': 945, 'loss/train': 2.6319658756256104} -09/20/2021 17:45:46 - INFO - __main__ - Step 15125: {'lr': 0.00019999226392087394, 'samples': 484000, 'steps': 945, 'loss/train': 3.6806788444519043} -09/20/2021 17:45:47 - INFO - __main__ - Step 15126: {'lr': 0.00019999226392087394, 'samples': 484032, 'steps': 945, 'loss/train': 3.4949450492858887} -09/20/2021 17:45:48 - INFO - __main__ - Step 15127: {'lr': 0.00019999226392087394, 'samples': 484064, 'steps': 945, 'loss/train': 4.170562267303467} -09/20/2021 17:45:48 - INFO - __main__ - Step 15128: {'lr': 0.00019999226392087394, 'samples': 484096, 'steps': 945, 'loss/train': 0.6684021353721619} -09/20/2021 17:45:49 - INFO - __main__ - Step 15129: {'lr': 0.00019999226392087394, 'samples': 484128, 'steps': 945, 'loss/train': 0.5702759623527527} -09/20/2021 17:45:50 - INFO - __main__ - Step 15130: {'lr': 0.00019999226392087394, 'samples': 484160, 'steps': 945, 'loss/train': 4.937928676605225} -09/20/2021 17:45:51 - INFO - __main__ - Step 15131: {'lr': 0.00019999226392087394, 'samples': 484192, 'steps': 945, 'loss/train': 4.502780437469482} -09/20/2021 17:45:51 - INFO - __main__ - Step 15132: {'lr': 0.00019999226392087394, 'samples': 484224, 'steps': 945, 'loss/train': 1.1939756870269775} -09/20/2021 17:45:52 - INFO - __main__ - Step 15133: {'lr': 0.00019999226392087394, 'samples': 484256, 'steps': 945, 'loss/train': 3.009443521499634} -09/20/2021 17:45:53 - INFO - __main__ - Step 15134: {'lr': 0.00019999226392087394, 'samples': 484288, 'steps': 945, 'loss/train': 4.176768779754639} -09/20/2021 17:45:55 - INFO - __main__ - Step 15135: {'lr': 0.00019999226392087394, 'samples': 484320, 'steps': 945, 'loss/train': 3.7353134155273438} -09/20/2021 17:45:55 - INFO - __main__ - Step 15136: {'lr': 0.00019999226392087394, 'samples': 484352, 'steps': 945, 'loss/train': 2.7586348056793213} -09/20/2021 17:45:56 - INFO - __main__ - Step 15137: {'lr': 0.00019999218437406172, 'samples': 484384, 'steps': 946, 'loss/train': 3.58156681060791} -09/20/2021 17:45:57 - INFO - __main__ - Step 15138: {'lr': 0.00019999218437406172, 'samples': 484416, 'steps': 946, 'loss/train': 3.7587592601776123} -09/20/2021 17:45:58 - INFO - __main__ - Step 15139: {'lr': 0.00019999218437406172, 'samples': 484448, 'steps': 946, 'loss/train': 3.8349335193634033} -09/20/2021 17:45:58 - INFO - __main__ - Step 15140: {'lr': 0.00019999218437406172, 'samples': 484480, 'steps': 946, 'loss/train': 3.3301749229431152} -09/20/2021 17:45:59 - INFO - __main__ - Step 15141: {'lr': 0.00019999218437406172, 'samples': 484512, 'steps': 946, 'loss/train': 3.9968667030334473} -09/20/2021 17:46:00 - INFO - __main__ - Step 15142: {'lr': 0.00019999218437406172, 'samples': 484544, 'steps': 946, 'loss/train': 4.477569580078125} -09/20/2021 17:46:01 - INFO - __main__ - Step 15143: {'lr': 0.00019999218437406172, 'samples': 484576, 'steps': 946, 'loss/train': 2.1225502490997314} -09/20/2021 17:46:01 - INFO - __main__ - Step 15144: {'lr': 0.00019999218437406172, 'samples': 484608, 'steps': 946, 'loss/train': 1.312957763671875} -09/20/2021 17:46:02 - INFO - __main__ - Step 15145: {'lr': 0.00019999218437406172, 'samples': 484640, 'steps': 946, 'loss/train': 1.0883363485336304} -09/20/2021 17:46:03 - INFO - __main__ - Step 15146: {'lr': 0.00019999218437406172, 'samples': 484672, 'steps': 946, 'loss/train': 0.7905543446540833} -09/20/2021 17:46:04 - INFO - __main__ - Step 15147: {'lr': 0.00019999218437406172, 'samples': 484704, 'steps': 946, 'loss/train': 0.9381816983222961} -09/20/2021 17:46:04 - INFO - __main__ - Step 15148: {'lr': 0.00019999218437406172, 'samples': 484736, 'steps': 946, 'loss/train': 0.8789581060409546} -09/20/2021 17:46:05 - INFO - __main__ - Step 15149: {'lr': 0.00019999218437406172, 'samples': 484768, 'steps': 946, 'loss/train': 3.461390972137451} -09/20/2021 17:46:06 - INFO - __main__ - Step 15150: {'lr': 0.00019999218437406172, 'samples': 484800, 'steps': 946, 'loss/train': 4.112685680389404} -09/20/2021 17:46:07 - INFO - __main__ - Step 15151: {'lr': 0.00019999218437406172, 'samples': 484832, 'steps': 946, 'loss/train': 3.789266347885132} -09/20/2021 17:46:07 - INFO - __main__ - Step 15152: {'lr': 0.00019999218437406172, 'samples': 484864, 'steps': 946, 'loss/train': 3.03033709526062} -09/20/2021 17:46:08 - INFO - __main__ - Step 15153: {'lr': 0.00019999210442038162, 'samples': 484896, 'steps': 947, 'loss/train': 3.2527050971984863} -09/20/2021 17:46:09 - INFO - __main__ - Step 15154: {'lr': 0.00019999210442038162, 'samples': 484928, 'steps': 947, 'loss/train': 3.4147322177886963} -09/20/2021 17:46:10 - INFO - __main__ - Step 15155: {'lr': 0.00019999210442038162, 'samples': 484960, 'steps': 947, 'loss/train': 4.660663604736328} -09/20/2021 17:46:11 - INFO - __main__ - Step 15156: {'lr': 0.00019999210442038162, 'samples': 484992, 'steps': 947, 'loss/train': 3.801121950149536} -09/20/2021 17:46:11 - INFO - __main__ - Step 15157: {'lr': 0.00019999210442038162, 'samples': 485024, 'steps': 947, 'loss/train': 4.881961345672607} -09/20/2021 17:46:12 - INFO - __main__ - Step 15158: {'lr': 0.00019999210442038162, 'samples': 485056, 'steps': 947, 'loss/train': 3.581481695175171} -09/20/2021 17:46:13 - INFO - __main__ - Step 15159: {'lr': 0.00019999210442038162, 'samples': 485088, 'steps': 947, 'loss/train': 3.704150915145874} -09/20/2021 17:46:14 - INFO - __main__ - Step 15160: {'lr': 0.00019999210442038162, 'samples': 485120, 'steps': 947, 'loss/train': 3.5911755561828613} -09/20/2021 17:46:14 - INFO - __main__ - Step 15161: {'lr': 0.00019999210442038162, 'samples': 485152, 'steps': 947, 'loss/train': 2.5466554164886475} -09/20/2021 17:46:15 - INFO - __main__ - Step 15162: {'lr': 0.00019999210442038162, 'samples': 485184, 'steps': 947, 'loss/train': 3.5356786251068115} -09/20/2021 17:46:16 - INFO - __main__ - Step 15163: {'lr': 0.00019999210442038162, 'samples': 485216, 'steps': 947, 'loss/train': 3.5980899333953857} -09/20/2021 17:46:17 - INFO - __main__ - Step 15164: {'lr': 0.00019999210442038162, 'samples': 485248, 'steps': 947, 'loss/train': 4.543637275695801} -09/20/2021 17:46:17 - INFO - __main__ - Step 15165: {'lr': 0.00019999210442038162, 'samples': 485280, 'steps': 947, 'loss/train': 4.918087005615234} -09/20/2021 17:46:19 - INFO - __main__ - Step 15166: {'lr': 0.00019999210442038162, 'samples': 485312, 'steps': 947, 'loss/train': 3.601954221725464} -09/20/2021 17:46:19 - INFO - __main__ - Step 15167: {'lr': 0.00019999210442038162, 'samples': 485344, 'steps': 947, 'loss/train': 3.9294748306274414} -09/20/2021 17:46:20 - INFO - __main__ - Step 15168: {'lr': 0.00019999210442038162, 'samples': 485376, 'steps': 947, 'loss/train': 3.7071352005004883} -09/20/2021 17:46:21 - INFO - __main__ - Step 15169: {'lr': 0.00019999202405983406, 'samples': 485408, 'steps': 948, 'loss/train': 5.553105354309082} -09/20/2021 17:46:22 - INFO - __main__ - Step 15170: {'lr': 0.00019999202405983406, 'samples': 485440, 'steps': 948, 'loss/train': 0.5113850831985474} -09/20/2021 17:46:22 - INFO - __main__ - Step 15171: {'lr': 0.00019999202405983406, 'samples': 485472, 'steps': 948, 'loss/train': 4.684269905090332} -09/20/2021 17:46:23 - INFO - __main__ - Step 15172: {'lr': 0.00019999202405983406, 'samples': 485504, 'steps': 948, 'loss/train': 3.5881192684173584} -09/20/2021 17:46:24 - INFO - __main__ - Step 15173: {'lr': 0.00019999202405983406, 'samples': 485536, 'steps': 948, 'loss/train': 4.00050163269043} -09/20/2021 17:46:25 - INFO - __main__ - Step 15174: {'lr': 0.00019999202405983406, 'samples': 485568, 'steps': 948, 'loss/train': 3.476200580596924} -09/20/2021 17:46:25 - INFO - __main__ - Step 15175: {'lr': 0.00019999202405983406, 'samples': 485600, 'steps': 948, 'loss/train': 4.028609752655029} -09/20/2021 17:46:26 - INFO - __main__ - Step 15176: {'lr': 0.00019999202405983406, 'samples': 485632, 'steps': 948, 'loss/train': 3.4487361907958984} -09/20/2021 17:46:27 - INFO - __main__ - Step 15177: {'lr': 0.00019999202405983406, 'samples': 485664, 'steps': 948, 'loss/train': 4.374684810638428} -09/20/2021 17:46:28 - INFO - __main__ - Step 15178: {'lr': 0.00019999202405983406, 'samples': 485696, 'steps': 948, 'loss/train': 3.3471920490264893} -09/20/2021 17:46:28 - INFO - __main__ - Step 15179: {'lr': 0.00019999202405983406, 'samples': 485728, 'steps': 948, 'loss/train': 3.5548434257507324} -09/20/2021 17:46:29 - INFO - __main__ - Step 15180: {'lr': 0.00019999202405983406, 'samples': 485760, 'steps': 948, 'loss/train': 3.3786916732788086} -09/20/2021 17:46:30 - INFO - __main__ - Step 15181: {'lr': 0.00019999202405983406, 'samples': 485792, 'steps': 948, 'loss/train': 3.885321617126465} -09/20/2021 17:46:31 - INFO - __main__ - Step 15182: {'lr': 0.00019999202405983406, 'samples': 485824, 'steps': 948, 'loss/train': 3.0775668621063232} -09/20/2021 17:46:31 - INFO - __main__ - Step 15183: {'lr': 0.00019999202405983406, 'samples': 485856, 'steps': 948, 'loss/train': 3.274806022644043} -09/20/2021 17:46:32 - INFO - __main__ - Step 15184: {'lr': 0.00019999202405983406, 'samples': 485888, 'steps': 948, 'loss/train': 5.33602237701416} -09/20/2021 17:46:33 - INFO - __main__ - Step 15185: {'lr': 0.00019999194329241933, 'samples': 485920, 'steps': 949, 'loss/train': 0.9817814826965332} -09/20/2021 17:46:34 - INFO - __main__ - Step 15186: {'lr': 0.00019999194329241933, 'samples': 485952, 'steps': 949, 'loss/train': 4.211426734924316} -09/20/2021 17:46:35 - INFO - __main__ - Step 15187: {'lr': 0.00019999194329241933, 'samples': 485984, 'steps': 949, 'loss/train': 4.715743064880371} -09/20/2021 17:46:35 - INFO - __main__ - Step 15188: {'lr': 0.00019999194329241933, 'samples': 486016, 'steps': 949, 'loss/train': 2.686408519744873} -09/20/2021 17:46:36 - INFO - __main__ - Step 15189: {'lr': 0.00019999194329241933, 'samples': 486048, 'steps': 949, 'loss/train': 1.0539387464523315} -09/20/2021 17:46:37 - INFO - __main__ - Step 15190: {'lr': 0.00019999194329241933, 'samples': 486080, 'steps': 949, 'loss/train': 0.8912505507469177} -09/20/2021 17:46:38 - INFO - __main__ - Step 15191: {'lr': 0.00019999194329241933, 'samples': 486112, 'steps': 949, 'loss/train': 4.116211414337158} -09/20/2021 17:46:38 - INFO - __main__ - Step 15192: {'lr': 0.00019999194329241933, 'samples': 486144, 'steps': 949, 'loss/train': 3.761652946472168} -09/20/2021 17:46:39 - INFO - __main__ - Step 15193: {'lr': 0.00019999194329241933, 'samples': 486176, 'steps': 949, 'loss/train': 3.588017225265503} -09/20/2021 17:46:40 - INFO - __main__ - Step 15194: {'lr': 0.00019999194329241933, 'samples': 486208, 'steps': 949, 'loss/train': 3.7681214809417725} -09/20/2021 17:46:41 - INFO - __main__ - Step 15195: {'lr': 0.00019999194329241933, 'samples': 486240, 'steps': 949, 'loss/train': 4.1371073722839355} -09/20/2021 17:46:41 - INFO - __main__ - Step 15196: {'lr': 0.00019999194329241933, 'samples': 486272, 'steps': 949, 'loss/train': 3.954378366470337} -09/20/2021 17:46:43 - INFO - __main__ - Step 15197: {'lr': 0.00019999194329241933, 'samples': 486304, 'steps': 949, 'loss/train': 4.148307800292969} -09/20/2021 17:46:44 - INFO - __main__ - Step 15198: {'lr': 0.00019999194329241933, 'samples': 486336, 'steps': 949, 'loss/train': 4.245765209197998} -09/20/2021 17:46:45 - INFO - __main__ - Step 15199: {'lr': 0.00019999194329241933, 'samples': 486368, 'steps': 949, 'loss/train': 4.0223469734191895} -09/20/2021 17:46:45 - INFO - __main__ - Step 15200: {'lr': 0.00019999194329241933, 'samples': 486400, 'steps': 949, 'loss/train': 3.1630449295043945} -09/20/2021 17:46:46 - INFO - __main__ - Step 15201: {'lr': 0.00019999186211813781, 'samples': 486432, 'steps': 950, 'loss/train': 4.842977523803711} -09/20/2021 17:46:47 - INFO - __main__ - Step 15202: {'lr': 0.00019999186211813781, 'samples': 486464, 'steps': 950, 'loss/train': 1.5179955959320068} -09/20/2021 17:46:48 - INFO - __main__ - Step 15203: {'lr': 0.00019999186211813781, 'samples': 486496, 'steps': 950, 'loss/train': 3.028104305267334} -09/20/2021 17:46:49 - INFO - __main__ - Step 15204: {'lr': 0.00019999186211813781, 'samples': 486528, 'steps': 950, 'loss/train': 4.659564018249512} -09/20/2021 17:46:49 - INFO - __main__ - Step 15205: {'lr': 0.00019999186211813781, 'samples': 486560, 'steps': 950, 'loss/train': 3.986283779144287} -09/20/2021 17:46:50 - INFO - __main__ - Step 15206: {'lr': 0.00019999186211813781, 'samples': 486592, 'steps': 950, 'loss/train': 4.0432353019714355} -09/20/2021 17:46:51 - INFO - __main__ - Step 15207: {'lr': 0.00019999186211813781, 'samples': 486624, 'steps': 950, 'loss/train': 3.9579832553863525} -09/20/2021 17:46:52 - INFO - __main__ - Step 15208: {'lr': 0.00019999186211813781, 'samples': 486656, 'steps': 950, 'loss/train': 3.9282567501068115} -09/20/2021 17:46:52 - INFO - __main__ - Step 15209: {'lr': 0.00019999186211813781, 'samples': 486688, 'steps': 950, 'loss/train': 4.1088762283325195} -09/20/2021 17:46:53 - INFO - __main__ - Step 15210: {'lr': 0.00019999186211813781, 'samples': 486720, 'steps': 950, 'loss/train': 4.032843112945557} -09/20/2021 17:46:54 - INFO - __main__ - Step 15211: {'lr': 0.00019999186211813781, 'samples': 486752, 'steps': 950, 'loss/train': 3.450953483581543} -09/20/2021 17:46:55 - INFO - __main__ - Step 15212: {'lr': 0.00019999186211813781, 'samples': 486784, 'steps': 950, 'loss/train': 3.3812265396118164} -09/20/2021 17:46:55 - INFO - __main__ - Step 15213: {'lr': 0.00019999186211813781, 'samples': 486816, 'steps': 950, 'loss/train': 3.5268421173095703} -09/20/2021 17:46:56 - INFO - __main__ - Step 15214: {'lr': 0.00019999186211813781, 'samples': 486848, 'steps': 950, 'loss/train': 4.19607400894165} -09/20/2021 17:46:57 - INFO - __main__ - Step 15215: {'lr': 0.00019999186211813781, 'samples': 486880, 'steps': 950, 'loss/train': 3.7512340545654297} -09/20/2021 17:46:58 - INFO - __main__ - Step 15216: {'lr': 0.00019999186211813781, 'samples': 486912, 'steps': 950, 'loss/train': 3.615049362182617} -09/20/2021 17:46:58 - INFO - __main__ - Step 15217: {'lr': 0.00019999178053698975, 'samples': 486944, 'steps': 951, 'loss/train': 3.9301536083221436} -09/20/2021 17:46:59 - INFO - __main__ - Step 15218: {'lr': 0.00019999178053698975, 'samples': 486976, 'steps': 951, 'loss/train': 5.4109392166137695} -09/20/2021 17:47:00 - INFO - __main__ - Step 15219: {'lr': 0.00019999178053698975, 'samples': 487008, 'steps': 951, 'loss/train': 1.253391146659851} -09/20/2021 17:47:01 - INFO - __main__ - Step 15220: {'lr': 0.00019999178053698975, 'samples': 487040, 'steps': 951, 'loss/train': 3.887329578399658} -09/20/2021 17:47:01 - INFO - __main__ - Step 15221: {'lr': 0.00019999178053698975, 'samples': 487072, 'steps': 951, 'loss/train': 3.855607509613037} -09/20/2021 17:47:02 - INFO - __main__ - Step 15222: {'lr': 0.00019999178053698975, 'samples': 487104, 'steps': 951, 'loss/train': 4.425135135650635} -09/20/2021 17:47:03 - INFO - __main__ - Step 15223: {'lr': 0.00019999178053698975, 'samples': 487136, 'steps': 951, 'loss/train': 4.075297832489014} -09/20/2021 17:47:04 - INFO - __main__ - Step 15224: {'lr': 0.00019999178053698975, 'samples': 487168, 'steps': 951, 'loss/train': 3.459522247314453} -09/20/2021 17:47:04 - INFO - __main__ - Step 15225: {'lr': 0.00019999178053698975, 'samples': 487200, 'steps': 951, 'loss/train': 3.5278329849243164} -09/20/2021 17:47:05 - INFO - __main__ - Step 15226: {'lr': 0.00019999178053698975, 'samples': 487232, 'steps': 951, 'loss/train': 4.121120929718018} -09/20/2021 17:47:06 - INFO - __main__ - Step 15227: {'lr': 0.00019999178053698975, 'samples': 487264, 'steps': 951, 'loss/train': 3.8917508125305176} -09/20/2021 17:47:07 - INFO - __main__ - Step 15228: {'lr': 0.00019999178053698975, 'samples': 487296, 'steps': 951, 'loss/train': 3.5738022327423096} -09/20/2021 17:47:08 - INFO - __main__ - Step 15229: {'lr': 0.00019999178053698975, 'samples': 487328, 'steps': 951, 'loss/train': 3.165102481842041} -09/20/2021 17:47:09 - INFO - __main__ - Step 15230: {'lr': 0.00019999178053698975, 'samples': 487360, 'steps': 951, 'loss/train': 4.045403957366943} -09/20/2021 17:47:10 - INFO - __main__ - Step 15231: {'lr': 0.00019999178053698975, 'samples': 487392, 'steps': 951, 'loss/train': 4.1224684715271} -09/20/2021 17:47:10 - INFO - __main__ - Step 15232: {'lr': 0.00019999178053698975, 'samples': 487424, 'steps': 951, 'loss/train': 3.8497989177703857} -09/20/2021 17:47:11 - INFO - __main__ - Step 15233: {'lr': 0.00019999169854897556, 'samples': 487456, 'steps': 952, 'loss/train': 3.921948194503784} -09/20/2021 17:47:12 - INFO - __main__ - Step 15234: {'lr': 0.00019999169854897556, 'samples': 487488, 'steps': 952, 'loss/train': 4.600345134735107} -09/20/2021 17:47:13 - INFO - __main__ - Step 15235: {'lr': 0.00019999169854897556, 'samples': 487520, 'steps': 952, 'loss/train': 4.383433818817139} -09/20/2021 17:47:13 - INFO - __main__ - Step 15236: {'lr': 0.00019999169854897556, 'samples': 487552, 'steps': 952, 'loss/train': 7.22796106338501} -09/20/2021 17:47:14 - INFO - __main__ - Step 15237: {'lr': 0.00019999169854897556, 'samples': 487584, 'steps': 952, 'loss/train': 0.8813254833221436} -09/20/2021 17:47:15 - INFO - __main__ - Step 15238: {'lr': 0.00019999169854897556, 'samples': 487616, 'steps': 952, 'loss/train': 0.86967933177948} -09/20/2021 17:47:16 - INFO - __main__ - Step 15239: {'lr': 0.00019999169854897556, 'samples': 487648, 'steps': 952, 'loss/train': 0.9204877018928528} -09/20/2021 17:47:16 - INFO - __main__ - Step 15240: {'lr': 0.00019999169854897556, 'samples': 487680, 'steps': 952, 'loss/train': 3.9438414573669434} -09/20/2021 17:47:17 - INFO - __main__ - Step 15241: {'lr': 0.00019999169854897556, 'samples': 487712, 'steps': 952, 'loss/train': 4.363726615905762} -09/20/2021 17:47:18 - INFO - __main__ - Step 15242: {'lr': 0.00019999169854897556, 'samples': 487744, 'steps': 952, 'loss/train': 4.116193771362305} -09/20/2021 17:47:19 - INFO - __main__ - Step 15243: {'lr': 0.00019999169854897556, 'samples': 487776, 'steps': 952, 'loss/train': 3.274158000946045} -09/20/2021 17:47:19 - INFO - __main__ - Step 15244: {'lr': 0.00019999169854897556, 'samples': 487808, 'steps': 952, 'loss/train': 3.276061534881592} -09/20/2021 17:47:20 - INFO - __main__ - Step 15245: {'lr': 0.00019999169854897556, 'samples': 487840, 'steps': 952, 'loss/train': 4.708544731140137} -09/20/2021 17:47:21 - INFO - __main__ - Step 15246: {'lr': 0.00019999169854897556, 'samples': 487872, 'steps': 952, 'loss/train': 4.153046131134033} -09/20/2021 17:47:22 - INFO - __main__ - Step 15247: {'lr': 0.00019999169854897556, 'samples': 487904, 'steps': 952, 'loss/train': 3.8060245513916016} -09/20/2021 17:47:22 - INFO - __main__ - Step 15248: {'lr': 0.00019999169854897556, 'samples': 487936, 'steps': 952, 'loss/train': 3.730842113494873} -09/20/2021 17:47:23 - INFO - __main__ - Step 15249: {'lr': 0.00019999161615409547, 'samples': 487968, 'steps': 953, 'loss/train': 3.737994909286499} -09/20/2021 17:47:24 - INFO - __main__ - Step 15250: {'lr': 0.00019999161615409547, 'samples': 488000, 'steps': 953, 'loss/train': 3.633044958114624} -09/20/2021 17:47:25 - INFO - __main__ - Step 15251: {'lr': 0.00019999161615409547, 'samples': 488032, 'steps': 953, 'loss/train': 3.546363592147827} -09/20/2021 17:47:26 - INFO - __main__ - Step 15252: {'lr': 0.00019999161615409547, 'samples': 488064, 'steps': 953, 'loss/train': 4.089874744415283} -09/20/2021 17:47:26 - INFO - __main__ - Step 15253: {'lr': 0.00019999161615409547, 'samples': 488096, 'steps': 953, 'loss/train': 4.343858242034912} -09/20/2021 17:47:27 - INFO - __main__ - Step 15254: {'lr': 0.00019999161615409547, 'samples': 488128, 'steps': 953, 'loss/train': 3.725341558456421} -09/20/2021 17:47:28 - INFO - __main__ - Step 15255: {'lr': 0.00019999161615409547, 'samples': 488160, 'steps': 953, 'loss/train': 3.528458833694458} -09/20/2021 17:47:29 - INFO - __main__ - Step 15256: {'lr': 0.00019999161615409547, 'samples': 488192, 'steps': 953, 'loss/train': 2.646463632583618} -09/20/2021 17:47:29 - INFO - __main__ - Step 15257: {'lr': 0.00019999161615409547, 'samples': 488224, 'steps': 953, 'loss/train': 4.211952209472656} -09/20/2021 17:47:30 - INFO - __main__ - Step 15258: {'lr': 0.00019999161615409547, 'samples': 488256, 'steps': 953, 'loss/train': 3.4662342071533203} -09/20/2021 17:47:31 - INFO - __main__ - Step 15259: {'lr': 0.00019999161615409547, 'samples': 488288, 'steps': 953, 'loss/train': 3.752490282058716} -09/20/2021 17:47:32 - INFO - __main__ - Step 15260: {'lr': 0.00019999161615409547, 'samples': 488320, 'steps': 953, 'loss/train': 1.1469383239746094} -09/20/2021 17:47:33 - INFO - __main__ - Step 15261: {'lr': 0.00019999161615409547, 'samples': 488352, 'steps': 953, 'loss/train': 0.9053558111190796} -09/20/2021 17:47:34 - INFO - __main__ - Step 15262: {'lr': 0.00019999161615409547, 'samples': 488384, 'steps': 953, 'loss/train': 0.8065220713615417} -09/20/2021 17:47:34 - INFO - __main__ - Step 15263: {'lr': 0.00019999161615409547, 'samples': 488416, 'steps': 953, 'loss/train': 0.9651960730552673} -09/20/2021 17:47:35 - INFO - __main__ - Step 15264: {'lr': 0.00019999161615409547, 'samples': 488448, 'steps': 953, 'loss/train': 1.2737071514129639} -09/20/2021 17:47:36 - INFO - __main__ - Step 15265: {'lr': 0.00019999153335234995, 'samples': 488480, 'steps': 954, 'loss/train': 3.1366710662841797} -09/20/2021 17:47:37 - INFO - __main__ - Step 15266: {'lr': 0.00019999153335234995, 'samples': 488512, 'steps': 954, 'loss/train': 4.365438461303711} -09/20/2021 17:47:38 - INFO - __main__ - Step 15267: {'lr': 0.00019999153335234995, 'samples': 488544, 'steps': 954, 'loss/train': 4.320596218109131} -09/20/2021 17:47:38 - INFO - __main__ - Step 15268: {'lr': 0.00019999153335234995, 'samples': 488576, 'steps': 954, 'loss/train': 3.1824166774749756} -09/20/2021 17:47:39 - INFO - __main__ - Step 15269: {'lr': 0.00019999153335234995, 'samples': 488608, 'steps': 954, 'loss/train': 3.9437203407287598} -09/20/2021 17:47:40 - INFO - __main__ - Step 15270: {'lr': 0.00019999153335234995, 'samples': 488640, 'steps': 954, 'loss/train': 3.543034553527832} -09/20/2021 17:47:41 - INFO - __main__ - Step 15271: {'lr': 0.00019999153335234995, 'samples': 488672, 'steps': 954, 'loss/train': 4.705565929412842} -09/20/2021 17:47:41 - INFO - __main__ - Step 15272: {'lr': 0.00019999153335234995, 'samples': 488704, 'steps': 954, 'loss/train': 3.688345432281494} -09/20/2021 17:47:42 - INFO - __main__ - Step 15273: {'lr': 0.00019999153335234995, 'samples': 488736, 'steps': 954, 'loss/train': 1.9637141227722168} -09/20/2021 17:47:43 - INFO - __main__ - Step 15274: {'lr': 0.00019999153335234995, 'samples': 488768, 'steps': 954, 'loss/train': 3.638390064239502} -09/20/2021 17:47:44 - INFO - __main__ - Step 15275: {'lr': 0.00019999153335234995, 'samples': 488800, 'steps': 954, 'loss/train': 3.2445478439331055} -09/20/2021 17:47:44 - INFO - __main__ - Step 15276: {'lr': 0.00019999153335234995, 'samples': 488832, 'steps': 954, 'loss/train': 4.459997177124023} -09/20/2021 17:47:45 - INFO - __main__ - Step 15277: {'lr': 0.00019999153335234995, 'samples': 488864, 'steps': 954, 'loss/train': 3.9828531742095947} -09/20/2021 17:47:46 - INFO - __main__ - Step 15278: {'lr': 0.00019999153335234995, 'samples': 488896, 'steps': 954, 'loss/train': 3.938371181488037} -09/20/2021 17:47:47 - INFO - __main__ - Step 15279: {'lr': 0.00019999153335234995, 'samples': 488928, 'steps': 954, 'loss/train': 4.312215805053711} -09/20/2021 17:47:47 - INFO - __main__ - Step 15280: {'lr': 0.00019999153335234995, 'samples': 488960, 'steps': 954, 'loss/train': 4.277616024017334} -09/20/2021 17:47:48 - INFO - __main__ - Step 15281: {'lr': 0.00019999145014373924, 'samples': 488992, 'steps': 955, 'loss/train': 3.151466131210327} -09/20/2021 17:47:49 - INFO - __main__ - Step 15282: {'lr': 0.00019999145014373924, 'samples': 489024, 'steps': 955, 'loss/train': 4.302523612976074} -09/20/2021 17:47:50 - INFO - __main__ - Step 15283: {'lr': 0.00019999145014373924, 'samples': 489056, 'steps': 955, 'loss/train': 4.264550685882568} -09/20/2021 17:47:50 - INFO - __main__ - Step 15284: {'lr': 0.00019999145014373924, 'samples': 489088, 'steps': 955, 'loss/train': 3.9399688243865967} -09/20/2021 17:47:51 - INFO - __main__ - Step 15285: {'lr': 0.00019999145014373924, 'samples': 489120, 'steps': 955, 'loss/train': 4.132872104644775} -09/20/2021 17:47:52 - INFO - __main__ - Step 15286: {'lr': 0.00019999145014373924, 'samples': 489152, 'steps': 955, 'loss/train': 2.7709767818450928} -09/20/2021 17:47:53 - INFO - __main__ - Step 15287: {'lr': 0.00019999145014373924, 'samples': 489184, 'steps': 955, 'loss/train': 3.2692441940307617} -09/20/2021 17:47:53 - INFO - __main__ - Step 15288: {'lr': 0.00019999145014373924, 'samples': 489216, 'steps': 955, 'loss/train': 0.7596940398216248} -09/20/2021 17:47:55 - INFO - __main__ - Step 15289: {'lr': 0.00019999145014373924, 'samples': 489248, 'steps': 955, 'loss/train': 0.9874200224876404} -09/20/2021 17:47:55 - INFO - __main__ - Step 15290: {'lr': 0.00019999145014373924, 'samples': 489280, 'steps': 955, 'loss/train': 3.7392611503601074} -09/20/2021 17:47:56 - INFO - __main__ - Step 15291: {'lr': 0.00019999145014373924, 'samples': 489312, 'steps': 955, 'loss/train': 3.3496828079223633} -09/20/2021 17:47:57 - INFO - __main__ - Step 15292: {'lr': 0.00019999145014373924, 'samples': 489344, 'steps': 955, 'loss/train': 3.6532387733459473} -09/20/2021 17:47:58 - INFO - __main__ - Step 15293: {'lr': 0.00019999145014373924, 'samples': 489376, 'steps': 955, 'loss/train': 3.3011903762817383} -09/20/2021 17:47:58 - INFO - __main__ - Step 15294: {'lr': 0.00019999145014373924, 'samples': 489408, 'steps': 955, 'loss/train': 3.973137140274048} -09/20/2021 17:47:59 - INFO - __main__ - Step 15295: {'lr': 0.00019999145014373924, 'samples': 489440, 'steps': 955, 'loss/train': 4.239051818847656} -09/20/2021 17:48:00 - INFO - __main__ - Step 15296: {'lr': 0.00019999145014373924, 'samples': 489472, 'steps': 955, 'loss/train': 3.4143011569976807} -09/20/2021 17:48:01 - INFO - __main__ - Step 15297: {'lr': 0.00019999136652826372, 'samples': 489504, 'steps': 956, 'loss/train': 4.049868106842041} -09/20/2021 17:48:02 - INFO - __main__ - Step 15298: {'lr': 0.00019999136652826372, 'samples': 489536, 'steps': 956, 'loss/train': 3.1799981594085693} -09/20/2021 17:48:02 - INFO - __main__ - Step 15299: {'lr': 0.00019999136652826372, 'samples': 489568, 'steps': 956, 'loss/train': 4.020306587219238} -09/20/2021 17:48:03 - INFO - __main__ - Step 15300: {'lr': 0.00019999136652826372, 'samples': 489600, 'steps': 956, 'loss/train': 4.217194080352783} -09/20/2021 17:48:04 - INFO - __main__ - Step 15301: {'lr': 0.00019999136652826372, 'samples': 489632, 'steps': 956, 'loss/train': 3.4428582191467285} -09/20/2021 17:48:05 - INFO - __main__ - Step 15302: {'lr': 0.00019999136652826372, 'samples': 489664, 'steps': 956, 'loss/train': 4.056758880615234} -09/20/2021 17:48:05 - INFO - __main__ - Step 15303: {'lr': 0.00019999136652826372, 'samples': 489696, 'steps': 956, 'loss/train': 4.843712329864502} -09/20/2021 17:48:06 - INFO - __main__ - Step 15304: {'lr': 0.00019999136652826372, 'samples': 489728, 'steps': 956, 'loss/train': 3.426893472671509} -09/20/2021 17:48:07 - INFO - __main__ - Step 15305: {'lr': 0.00019999136652826372, 'samples': 489760, 'steps': 956, 'loss/train': 4.585038185119629} -09/20/2021 17:48:08 - INFO - __main__ - Step 15306: {'lr': 0.00019999136652826372, 'samples': 489792, 'steps': 956, 'loss/train': 3.9242312908172607} -09/20/2021 17:48:08 - INFO - __main__ - Step 15307: {'lr': 0.00019999136652826372, 'samples': 489824, 'steps': 956, 'loss/train': 4.322389125823975} -09/20/2021 17:48:09 - INFO - __main__ - Step 15308: {'lr': 0.00019999136652826372, 'samples': 489856, 'steps': 956, 'loss/train': 3.469235897064209} -09/20/2021 17:48:10 - INFO - __main__ - Step 15309: {'lr': 0.00019999136652826372, 'samples': 489888, 'steps': 956, 'loss/train': 3.2267346382141113} -09/20/2021 17:48:11 - INFO - __main__ - Step 15310: {'lr': 0.00019999136652826372, 'samples': 489920, 'steps': 956, 'loss/train': 6.057393550872803} -09/20/2021 17:48:11 - INFO - __main__ - Step 15311: {'lr': 0.00019999136652826372, 'samples': 489952, 'steps': 956, 'loss/train': 3.743861675262451} -09/20/2021 17:48:12 - INFO - __main__ - Step 15312: {'lr': 0.00019999136652826372, 'samples': 489984, 'steps': 956, 'loss/train': 4.179612636566162} -09/20/2021 17:48:13 - INFO - __main__ - Step 15313: {'lr': 0.00019999128250592371, 'samples': 490016, 'steps': 957, 'loss/train': 3.1034960746765137} -09/20/2021 17:48:14 - INFO - __main__ - Step 15314: {'lr': 0.00019999128250592371, 'samples': 490048, 'steps': 957, 'loss/train': 4.0528244972229} -09/20/2021 17:48:14 - INFO - __main__ - Step 15315: {'lr': 0.00019999128250592371, 'samples': 490080, 'steps': 957, 'loss/train': 3.3612112998962402} -09/20/2021 17:48:15 - INFO - __main__ - Step 15316: {'lr': 0.00019999128250592371, 'samples': 490112, 'steps': 957, 'loss/train': 4.736362934112549} -09/20/2021 17:48:16 - INFO - __main__ - Step 15317: {'lr': 0.00019999128250592371, 'samples': 490144, 'steps': 957, 'loss/train': 5.134712219238281} -09/20/2021 17:48:17 - INFO - __main__ - Step 15318: {'lr': 0.00019999128250592371, 'samples': 490176, 'steps': 957, 'loss/train': 4.041910171508789} -09/20/2021 17:48:17 - INFO - __main__ - Step 15319: {'lr': 0.00019999128250592371, 'samples': 490208, 'steps': 957, 'loss/train': 3.41738224029541} -09/20/2021 17:48:19 - INFO - __main__ - Step 15320: {'lr': 0.00019999128250592371, 'samples': 490240, 'steps': 957, 'loss/train': 3.65769624710083} -09/20/2021 17:48:20 - INFO - __main__ - Step 15321: {'lr': 0.00019999128250592371, 'samples': 490272, 'steps': 957, 'loss/train': 3.6448028087615967} -09/20/2021 17:48:20 - INFO - __main__ - Step 15322: {'lr': 0.00019999128250592371, 'samples': 490304, 'steps': 957, 'loss/train': 3.0535786151885986} -09/20/2021 17:48:21 - INFO - __main__ - Step 15323: {'lr': 0.00019999128250592371, 'samples': 490336, 'steps': 957, 'loss/train': 1.339119553565979} -09/20/2021 17:48:22 - INFO - __main__ - Step 15324: {'lr': 0.00019999128250592371, 'samples': 490368, 'steps': 957, 'loss/train': 2.707810401916504} -09/20/2021 17:48:23 - INFO - __main__ - Step 15325: {'lr': 0.00019999128250592371, 'samples': 490400, 'steps': 957, 'loss/train': 3.834379196166992} -09/20/2021 17:48:23 - INFO - __main__ - Step 15326: {'lr': 0.00019999128250592371, 'samples': 490432, 'steps': 957, 'loss/train': 3.3730552196502686} -09/20/2021 17:48:24 - INFO - __main__ - Step 15327: {'lr': 0.00019999128250592371, 'samples': 490464, 'steps': 957, 'loss/train': 3.8404765129089355} -09/20/2021 17:48:25 - INFO - __main__ - Step 15328: {'lr': 0.00019999128250592371, 'samples': 490496, 'steps': 957, 'loss/train': 3.6148159503936768} -09/20/2021 17:48:26 - INFO - __main__ - Step 15329: {'lr': 0.00019999119807671955, 'samples': 490528, 'steps': 958, 'loss/train': 3.4026224613189697} -09/20/2021 17:48:26 - INFO - __main__ - Step 15330: {'lr': 0.00019999119807671955, 'samples': 490560, 'steps': 958, 'loss/train': 3.826504945755005} -09/20/2021 17:48:27 - INFO - __main__ - Step 15331: {'lr': 0.00019999119807671955, 'samples': 490592, 'steps': 958, 'loss/train': 4.067816734313965} -09/20/2021 17:48:28 - INFO - __main__ - Step 15332: {'lr': 0.00019999119807671955, 'samples': 490624, 'steps': 958, 'loss/train': 3.031010150909424} -09/20/2021 17:48:29 - INFO - __main__ - Step 15333: {'lr': 0.00019999119807671955, 'samples': 490656, 'steps': 958, 'loss/train': 3.900480270385742} -09/20/2021 17:48:29 - INFO - __main__ - Step 15334: {'lr': 0.00019999119807671955, 'samples': 490688, 'steps': 958, 'loss/train': 2.0202112197875977} -09/20/2021 17:48:30 - INFO - __main__ - Step 15335: {'lr': 0.00019999119807671955, 'samples': 490720, 'steps': 958, 'loss/train': 5.045182228088379} -09/20/2021 17:48:31 - INFO - __main__ - Step 15336: {'lr': 0.00019999119807671955, 'samples': 490752, 'steps': 958, 'loss/train': 3.4136297702789307} -09/20/2021 17:48:32 - INFO - __main__ - Step 15337: {'lr': 0.00019999119807671955, 'samples': 490784, 'steps': 958, 'loss/train': 4.489741325378418} -09/20/2021 17:48:32 - INFO - __main__ - Step 15338: {'lr': 0.00019999119807671955, 'samples': 490816, 'steps': 958, 'loss/train': 3.378007173538208} -09/20/2021 17:48:33 - INFO - __main__ - Step 15339: {'lr': 0.00019999119807671955, 'samples': 490848, 'steps': 958, 'loss/train': 3.4118244647979736} -09/20/2021 17:48:34 - INFO - __main__ - Step 15340: {'lr': 0.00019999119807671955, 'samples': 490880, 'steps': 958, 'loss/train': 4.928621292114258} -09/20/2021 17:48:35 - INFO - __main__ - Step 15341: {'lr': 0.00019999119807671955, 'samples': 490912, 'steps': 958, 'loss/train': 3.4796640872955322} -09/20/2021 17:48:35 - INFO - __main__ - Step 15342: {'lr': 0.00019999119807671955, 'samples': 490944, 'steps': 958, 'loss/train': 4.110263824462891} -09/20/2021 17:48:36 - INFO - __main__ - Step 15343: {'lr': 0.00019999119807671955, 'samples': 490976, 'steps': 958, 'loss/train': 3.5834834575653076} -09/20/2021 17:48:37 - INFO - __main__ - Step 15344: {'lr': 0.00019999119807671955, 'samples': 491008, 'steps': 958, 'loss/train': 4.364543437957764} -09/20/2021 17:48:38 - INFO - __main__ - Step 15345: {'lr': 0.00019999111324065161, 'samples': 491040, 'steps': 959, 'loss/train': 4.104925632476807} -09/20/2021 17:48:39 - INFO - __main__ - Step 15346: {'lr': 0.00019999111324065161, 'samples': 491072, 'steps': 959, 'loss/train': 4.53737211227417} -09/20/2021 17:48:39 - INFO - __main__ - Step 15347: {'lr': 0.00019999111324065161, 'samples': 491104, 'steps': 959, 'loss/train': 3.798635959625244} -09/20/2021 17:48:40 - INFO - __main__ - Step 15348: {'lr': 0.00019999111324065161, 'samples': 491136, 'steps': 959, 'loss/train': 4.544741153717041} -09/20/2021 17:48:41 - INFO - __main__ - Step 15349: {'lr': 0.00019999111324065161, 'samples': 491168, 'steps': 959, 'loss/train': 3.433138608932495} -09/20/2021 17:48:42 - INFO - __main__ - Step 15350: {'lr': 0.00019999111324065161, 'samples': 491200, 'steps': 959, 'loss/train': 2.831509590148926} -09/20/2021 17:48:42 - INFO - __main__ - Step 15351: {'lr': 0.00019999111324065161, 'samples': 491232, 'steps': 959, 'loss/train': 5.935950756072998} -09/20/2021 17:48:44 - INFO - __main__ - Step 15352: {'lr': 0.00019999111324065161, 'samples': 491264, 'steps': 959, 'loss/train': 5.015537738800049} -09/20/2021 17:48:44 - INFO - __main__ - Step 15353: {'lr': 0.00019999111324065161, 'samples': 491296, 'steps': 959, 'loss/train': 3.1550328731536865} -09/20/2021 17:48:45 - INFO - __main__ - Step 15354: {'lr': 0.00019999111324065161, 'samples': 491328, 'steps': 959, 'loss/train': 3.7366442680358887} -09/20/2021 17:48:46 - INFO - __main__ - Step 15355: {'lr': 0.00019999111324065161, 'samples': 491360, 'steps': 959, 'loss/train': 2.920161247253418} -09/20/2021 17:48:47 - INFO - __main__ - Step 15356: {'lr': 0.00019999111324065161, 'samples': 491392, 'steps': 959, 'loss/train': 4.033753871917725} -09/20/2021 17:48:47 - INFO - __main__ - Step 15357: {'lr': 0.00019999111324065161, 'samples': 491424, 'steps': 959, 'loss/train': 0.7438740730285645} -09/20/2021 17:48:48 - INFO - __main__ - Step 15358: {'lr': 0.00019999111324065161, 'samples': 491456, 'steps': 959, 'loss/train': 3.4468135833740234} -09/20/2021 17:48:49 - INFO - __main__ - Step 15359: {'lr': 0.00019999111324065161, 'samples': 491488, 'steps': 959, 'loss/train': 4.929225921630859} -09/20/2021 17:48:50 - INFO - __main__ - Step 15360: {'lr': 0.00019999111324065161, 'samples': 491520, 'steps': 959, 'loss/train': 3.8927364349365234} -09/20/2021 17:48:50 - INFO - __main__ - Step 15361: {'lr': 0.0001999910279977202, 'samples': 491552, 'steps': 960, 'loss/train': 3.129554510116577} -09/20/2021 17:48:51 - INFO - __main__ - Step 15362: {'lr': 0.0001999910279977202, 'samples': 491584, 'steps': 960, 'loss/train': 4.384795665740967} -09/20/2021 17:48:52 - INFO - __main__ - Step 15363: {'lr': 0.0001999910279977202, 'samples': 491616, 'steps': 960, 'loss/train': 3.790430784225464} -09/20/2021 17:48:53 - INFO - __main__ - Step 15364: {'lr': 0.0001999910279977202, 'samples': 491648, 'steps': 960, 'loss/train': 3.5339460372924805} -09/20/2021 17:48:53 - INFO - __main__ - Step 15365: {'lr': 0.0001999910279977202, 'samples': 491680, 'steps': 960, 'loss/train': 3.774608612060547} -09/20/2021 17:48:54 - INFO - __main__ - Step 15366: {'lr': 0.0001999910279977202, 'samples': 491712, 'steps': 960, 'loss/train': 3.716017723083496} -09/20/2021 17:48:55 - INFO - __main__ - Step 15367: {'lr': 0.0001999910279977202, 'samples': 491744, 'steps': 960, 'loss/train': 3.8201792240142822} -09/20/2021 17:48:56 - INFO - __main__ - Step 15368: {'lr': 0.0001999910279977202, 'samples': 491776, 'steps': 960, 'loss/train': 2.3856992721557617} -09/20/2021 17:48:56 - INFO - __main__ - Step 15369: {'lr': 0.0001999910279977202, 'samples': 491808, 'steps': 960, 'loss/train': 4.833596706390381} -09/20/2021 17:48:57 - INFO - __main__ - Step 15370: {'lr': 0.0001999910279977202, 'samples': 491840, 'steps': 960, 'loss/train': 2.6234512329101562} -09/20/2021 17:48:58 - INFO - __main__ - Step 15371: {'lr': 0.0001999910279977202, 'samples': 491872, 'steps': 960, 'loss/train': 4.057507038116455} -09/20/2021 17:48:59 - INFO - __main__ - Step 15372: {'lr': 0.0001999910279977202, 'samples': 491904, 'steps': 960, 'loss/train': 4.724687576293945} -09/20/2021 17:48:59 - INFO - __main__ - Step 15373: {'lr': 0.0001999910279977202, 'samples': 491936, 'steps': 960, 'loss/train': 4.724023342132568} -09/20/2021 17:49:00 - INFO - __main__ - Step 15374: {'lr': 0.0001999910279977202, 'samples': 491968, 'steps': 960, 'loss/train': 4.20528507232666} -09/20/2021 17:49:01 - INFO - __main__ - Step 15375: {'lr': 0.0001999910279977202, 'samples': 492000, 'steps': 960, 'loss/train': 3.7362864017486572} -09/20/2021 17:49:02 - INFO - __main__ - Step 15376: {'lr': 0.0001999910279977202, 'samples': 492032, 'steps': 960, 'loss/train': 3.1015875339508057} -09/20/2021 17:49:03 - INFO - __main__ - Step 15377: {'lr': 0.0001999909423479257, 'samples': 492064, 'steps': 961, 'loss/train': 2.5233564376831055} -09/20/2021 17:49:03 - INFO - __main__ - Step 15378: {'lr': 0.0001999909423479257, 'samples': 492096, 'steps': 961, 'loss/train': 4.02951192855835} -09/20/2021 17:49:04 - INFO - __main__ - Step 15379: {'lr': 0.0001999909423479257, 'samples': 492128, 'steps': 961, 'loss/train': 3.9006052017211914} -09/20/2021 17:49:05 - INFO - __main__ - Step 15380: {'lr': 0.0001999909423479257, 'samples': 492160, 'steps': 961, 'loss/train': 3.842994451522827} -09/20/2021 17:49:06 - INFO - __main__ - Step 15381: {'lr': 0.0001999909423479257, 'samples': 492192, 'steps': 961, 'loss/train': 3.434438705444336} -09/20/2021 17:49:06 - INFO - __main__ - Step 15382: {'lr': 0.0001999909423479257, 'samples': 492224, 'steps': 961, 'loss/train': 5.283512115478516} -09/20/2021 17:49:08 - INFO - __main__ - Step 15383: {'lr': 0.0001999909423479257, 'samples': 492256, 'steps': 961, 'loss/train': 4.301599025726318} -09/20/2021 17:49:08 - INFO - __main__ - Step 15384: {'lr': 0.0001999909423479257, 'samples': 492288, 'steps': 961, 'loss/train': 4.881410121917725} -09/20/2021 17:49:09 - INFO - __main__ - Step 15385: {'lr': 0.0001999909423479257, 'samples': 492320, 'steps': 961, 'loss/train': 4.4525370597839355} -09/20/2021 17:49:10 - INFO - __main__ - Step 15386: {'lr': 0.0001999909423479257, 'samples': 492352, 'steps': 961, 'loss/train': 4.132844924926758} -09/20/2021 17:49:11 - INFO - __main__ - Step 15387: {'lr': 0.0001999909423479257, 'samples': 492384, 'steps': 961, 'loss/train': 4.524295330047607} -09/20/2021 17:49:11 - INFO - __main__ - Step 15388: {'lr': 0.0001999909423479257, 'samples': 492416, 'steps': 961, 'loss/train': 4.471034049987793} -09/20/2021 17:49:12 - INFO - __main__ - Step 15389: {'lr': 0.0001999909423479257, 'samples': 492448, 'steps': 961, 'loss/train': 4.668882846832275} -09/20/2021 17:49:13 - INFO - __main__ - Step 15390: {'lr': 0.0001999909423479257, 'samples': 492480, 'steps': 961, 'loss/train': 3.2645931243896484} -09/20/2021 17:49:14 - INFO - __main__ - Step 15391: {'lr': 0.0001999909423479257, 'samples': 492512, 'steps': 961, 'loss/train': 4.08186674118042} -09/20/2021 17:49:14 - INFO - __main__ - Step 15392: {'lr': 0.0001999909423479257, 'samples': 492544, 'steps': 961, 'loss/train': 2.940678596496582} -09/20/2021 17:49:15 - INFO - __main__ - Step 15393: {'lr': 0.00019999085629126843, 'samples': 492576, 'steps': 962, 'loss/train': 3.39446759223938} -09/20/2021 17:49:16 - INFO - __main__ - Step 15394: {'lr': 0.00019999085629126843, 'samples': 492608, 'steps': 962, 'loss/train': 4.1032023429870605} -09/20/2021 17:49:17 - INFO - __main__ - Step 15395: {'lr': 0.00019999085629126843, 'samples': 492640, 'steps': 962, 'loss/train': 4.001509189605713} -09/20/2021 17:49:17 - INFO - __main__ - Step 15396: {'lr': 0.00019999085629126843, 'samples': 492672, 'steps': 962, 'loss/train': 3.6501312255859375} -09/20/2021 17:49:18 - INFO - __main__ - Step 15397: {'lr': 0.00019999085629126843, 'samples': 492704, 'steps': 962, 'loss/train': 3.8947560787200928} -09/20/2021 17:49:19 - INFO - __main__ - Step 15398: {'lr': 0.00019999085629126843, 'samples': 492736, 'steps': 962, 'loss/train': 3.6432344913482666} -09/20/2021 17:49:20 - INFO - __main__ - Step 15399: {'lr': 0.00019999085629126843, 'samples': 492768, 'steps': 962, 'loss/train': 3.5778732299804688} -09/20/2021 17:49:20 - INFO - __main__ - Step 15400: {'lr': 0.00019999085629126843, 'samples': 492800, 'steps': 962, 'loss/train': 3.8717734813690186} -09/20/2021 17:49:21 - INFO - __main__ - Step 15401: {'lr': 0.00019999085629126843, 'samples': 492832, 'steps': 962, 'loss/train': 3.4828970432281494} -09/20/2021 17:49:22 - INFO - __main__ - Step 15402: {'lr': 0.00019999085629126843, 'samples': 492864, 'steps': 962, 'loss/train': 3.6273422241210938} -09/20/2021 17:49:23 - INFO - __main__ - Step 15403: {'lr': 0.00019999085629126843, 'samples': 492896, 'steps': 962, 'loss/train': 1.7504913806915283} -09/20/2021 17:49:23 - INFO - __main__ - Step 15404: {'lr': 0.00019999085629126843, 'samples': 492928, 'steps': 962, 'loss/train': 4.049380302429199} -09/20/2021 17:49:24 - INFO - __main__ - Step 15405: {'lr': 0.00019999085629126843, 'samples': 492960, 'steps': 962, 'loss/train': 3.2789101600646973} -09/20/2021 17:49:25 - INFO - __main__ - Step 15406: {'lr': 0.00019999085629126843, 'samples': 492992, 'steps': 962, 'loss/train': 3.2404956817626953} -09/20/2021 17:49:26 - INFO - __main__ - Step 15407: {'lr': 0.00019999085629126843, 'samples': 493024, 'steps': 962, 'loss/train': 3.450011968612671} -09/20/2021 17:49:26 - INFO - __main__ - Step 15408: {'lr': 0.00019999085629126843, 'samples': 493056, 'steps': 962, 'loss/train': 2.802114725112915} -09/20/2021 17:49:27 - INFO - __main__ - Step 15409: {'lr': 0.0001999907698277488, 'samples': 493088, 'steps': 963, 'loss/train': 4.0629377365112305} -09/20/2021 17:49:28 - INFO - __main__ - Step 15410: {'lr': 0.0001999907698277488, 'samples': 493120, 'steps': 963, 'loss/train': 3.6722447872161865} -09/20/2021 17:49:29 - INFO - __main__ - Step 15411: {'lr': 0.0001999907698277488, 'samples': 493152, 'steps': 963, 'loss/train': 4.025364875793457} -09/20/2021 17:49:30 - INFO - __main__ - Step 15412: {'lr': 0.0001999907698277488, 'samples': 493184, 'steps': 963, 'loss/train': 3.007467269897461} -09/20/2021 17:49:30 - INFO - __main__ - Step 15413: {'lr': 0.0001999907698277488, 'samples': 493216, 'steps': 963, 'loss/train': 3.638395071029663} -09/20/2021 17:49:32 - INFO - __main__ - Step 15414: {'lr': 0.0001999907698277488, 'samples': 493248, 'steps': 963, 'loss/train': 3.87575364112854} -09/20/2021 17:49:32 - INFO - __main__ - Step 15415: {'lr': 0.0001999907698277488, 'samples': 493280, 'steps': 963, 'loss/train': 4.35186767578125} -09/20/2021 17:49:33 - INFO - __main__ - Step 15416: {'lr': 0.0001999907698277488, 'samples': 493312, 'steps': 963, 'loss/train': 2.0064218044281006} -09/20/2021 17:49:34 - INFO - __main__ - Step 15417: {'lr': 0.0001999907698277488, 'samples': 493344, 'steps': 963, 'loss/train': 4.6065673828125} -09/20/2021 17:49:35 - INFO - __main__ - Step 15418: {'lr': 0.0001999907698277488, 'samples': 493376, 'steps': 963, 'loss/train': 3.0563406944274902} -09/20/2021 17:49:35 - INFO - __main__ - Step 15419: {'lr': 0.0001999907698277488, 'samples': 493408, 'steps': 963, 'loss/train': 3.3879213333129883} -09/20/2021 17:49:36 - INFO - __main__ - Step 15420: {'lr': 0.0001999907698277488, 'samples': 493440, 'steps': 963, 'loss/train': 4.527543067932129} -09/20/2021 17:49:37 - INFO - __main__ - Step 15421: {'lr': 0.0001999907698277488, 'samples': 493472, 'steps': 963, 'loss/train': 3.7360734939575195} -09/20/2021 17:49:38 - INFO - __main__ - Step 15422: {'lr': 0.0001999907698277488, 'samples': 493504, 'steps': 963, 'loss/train': 3.1778392791748047} -09/20/2021 17:49:38 - INFO - __main__ - Step 15423: {'lr': 0.0001999907698277488, 'samples': 493536, 'steps': 963, 'loss/train': 3.6200544834136963} -09/20/2021 17:49:39 - INFO - __main__ - Step 15424: {'lr': 0.0001999907698277488, 'samples': 493568, 'steps': 963, 'loss/train': 3.617187023162842} -09/20/2021 17:49:40 - INFO - __main__ - Step 15425: {'lr': 0.00019999068295736705, 'samples': 493600, 'steps': 964, 'loss/train': 3.668743133544922} -09/20/2021 17:49:41 - INFO - __main__ - Step 15426: {'lr': 0.00019999068295736705, 'samples': 493632, 'steps': 964, 'loss/train': 4.017232418060303} -09/20/2021 17:49:42 - INFO - __main__ - Step 15427: {'lr': 0.00019999068295736705, 'samples': 493664, 'steps': 964, 'loss/train': 2.980766534805298} -09/20/2021 17:49:42 - INFO - __main__ - Step 15428: {'lr': 0.00019999068295736705, 'samples': 493696, 'steps': 964, 'loss/train': 3.634857177734375} -09/20/2021 17:49:43 - INFO - __main__ - Step 15429: {'lr': 0.00019999068295736705, 'samples': 493728, 'steps': 964, 'loss/train': 4.104218006134033} -09/20/2021 17:49:44 - INFO - __main__ - Step 15430: {'lr': 0.00019999068295736705, 'samples': 493760, 'steps': 964, 'loss/train': 1.8345166444778442} -09/20/2021 17:49:45 - INFO - __main__ - Step 15431: {'lr': 0.00019999068295736705, 'samples': 493792, 'steps': 964, 'loss/train': 3.496290683746338} -09/20/2021 17:49:45 - INFO - __main__ - Step 15432: {'lr': 0.00019999068295736705, 'samples': 493824, 'steps': 964, 'loss/train': 3.743063449859619} -09/20/2021 17:49:46 - INFO - __main__ - Step 15433: {'lr': 0.00019999068295736705, 'samples': 493856, 'steps': 964, 'loss/train': 4.166558265686035} -09/20/2021 17:49:47 - INFO - __main__ - Step 15434: {'lr': 0.00019999068295736705, 'samples': 493888, 'steps': 964, 'loss/train': 5.955277442932129} -09/20/2021 17:49:48 - INFO - __main__ - Step 15435: {'lr': 0.00019999068295736705, 'samples': 493920, 'steps': 964, 'loss/train': 3.493891954421997} -09/20/2021 17:49:48 - INFO - __main__ - Step 15436: {'lr': 0.00019999068295736705, 'samples': 493952, 'steps': 964, 'loss/train': 4.882965087890625} -09/20/2021 17:49:49 - INFO - __main__ - Step 15437: {'lr': 0.00019999068295736705, 'samples': 493984, 'steps': 964, 'loss/train': 3.684812307357788} -09/20/2021 17:49:50 - INFO - __main__ - Step 15438: {'lr': 0.00019999068295736705, 'samples': 494016, 'steps': 964, 'loss/train': 3.7084922790527344} -09/20/2021 17:49:51 - INFO - __main__ - Step 15439: {'lr': 0.00019999068295736705, 'samples': 494048, 'steps': 964, 'loss/train': 4.231238842010498} -09/20/2021 17:49:51 - INFO - __main__ - Step 15440: {'lr': 0.00019999068295736705, 'samples': 494080, 'steps': 964, 'loss/train': 3.9345967769622803} -09/20/2021 17:49:52 - INFO - __main__ - Step 15441: {'lr': 0.00019999059568012362, 'samples': 494112, 'steps': 965, 'loss/train': 4.382338523864746} -09/20/2021 17:49:53 - INFO - __main__ - Step 15442: {'lr': 0.00019999059568012362, 'samples': 494144, 'steps': 965, 'loss/train': 6.670938014984131} -09/20/2021 17:49:54 - INFO - __main__ - Step 15443: {'lr': 0.00019999059568012362, 'samples': 494176, 'steps': 965, 'loss/train': 3.3426170349121094} -09/20/2021 17:49:54 - INFO - __main__ - Step 15444: {'lr': 0.00019999059568012362, 'samples': 494208, 'steps': 965, 'loss/train': 3.2018980979919434} -09/20/2021 17:49:55 - INFO - __main__ - Step 15445: {'lr': 0.00019999059568012362, 'samples': 494240, 'steps': 965, 'loss/train': 4.178408145904541} -09/20/2021 17:49:56 - INFO - __main__ - Step 15446: {'lr': 0.00019999059568012362, 'samples': 494272, 'steps': 965, 'loss/train': 6.485602855682373} -09/20/2021 17:49:57 - INFO - __main__ - Step 15447: {'lr': 0.00019999059568012362, 'samples': 494304, 'steps': 965, 'loss/train': 3.877664804458618} -09/20/2021 17:49:58 - INFO - __main__ - Step 15448: {'lr': 0.00019999059568012362, 'samples': 494336, 'steps': 965, 'loss/train': 3.594282627105713} -09/20/2021 17:49:59 - INFO - __main__ - Step 15449: {'lr': 0.00019999059568012362, 'samples': 494368, 'steps': 965, 'loss/train': 3.746500253677368} -09/20/2021 17:49:59 - INFO - __main__ - Step 15450: {'lr': 0.00019999059568012362, 'samples': 494400, 'steps': 965, 'loss/train': 4.100342273712158} -09/20/2021 17:50:00 - INFO - __main__ - Step 15451: {'lr': 0.00019999059568012362, 'samples': 494432, 'steps': 965, 'loss/train': 3.6633946895599365} -09/20/2021 17:50:01 - INFO - __main__ - Step 15452: {'lr': 0.00019999059568012362, 'samples': 494464, 'steps': 965, 'loss/train': 4.270843505859375} -09/20/2021 17:50:02 - INFO - __main__ - Step 15453: {'lr': 0.00019999059568012362, 'samples': 494496, 'steps': 965, 'loss/train': 3.917304754257202} -09/20/2021 17:50:02 - INFO - __main__ - Step 15454: {'lr': 0.00019999059568012362, 'samples': 494528, 'steps': 965, 'loss/train': 5.139296054840088} -09/20/2021 17:50:03 - INFO - __main__ - Step 15455: {'lr': 0.00019999059568012362, 'samples': 494560, 'steps': 965, 'loss/train': 6.311926364898682} -09/20/2021 17:50:04 - INFO - __main__ - Step 15456: {'lr': 0.00019999059568012362, 'samples': 494592, 'steps': 965, 'loss/train': 3.832594394683838} -09/20/2021 17:50:05 - INFO - __main__ - Step 15457: {'lr': 0.00019999050799601885, 'samples': 494624, 'steps': 966, 'loss/train': 3.1965432167053223} -09/20/2021 17:50:06 - INFO - __main__ - Step 15458: {'lr': 0.00019999050799601885, 'samples': 494656, 'steps': 966, 'loss/train': 3.9191391468048096} -09/20/2021 17:50:06 - INFO - __main__ - Step 15459: {'lr': 0.00019999050799601885, 'samples': 494688, 'steps': 966, 'loss/train': 4.563853740692139} -09/20/2021 17:50:07 - INFO - __main__ - Step 15460: {'lr': 0.00019999050799601885, 'samples': 494720, 'steps': 966, 'loss/train': 4.255546569824219} -09/20/2021 17:50:08 - INFO - __main__ - Step 15461: {'lr': 0.00019999050799601885, 'samples': 494752, 'steps': 966, 'loss/train': 5.321107864379883} -09/20/2021 17:50:09 - INFO - __main__ - Step 15462: {'lr': 0.00019999050799601885, 'samples': 494784, 'steps': 966, 'loss/train': 3.051715135574341} -09/20/2021 17:50:09 - INFO - __main__ - Step 15463: {'lr': 0.00019999050799601885, 'samples': 494816, 'steps': 966, 'loss/train': 3.0950160026550293} -09/20/2021 17:50:10 - INFO - __main__ - Step 15464: {'lr': 0.00019999050799601885, 'samples': 494848, 'steps': 966, 'loss/train': 3.646501064300537} -09/20/2021 17:50:11 - INFO - __main__ - Step 15465: {'lr': 0.00019999050799601885, 'samples': 494880, 'steps': 966, 'loss/train': 1.8775535821914673} -09/20/2021 17:50:12 - INFO - __main__ - Step 15466: {'lr': 0.00019999050799601885, 'samples': 494912, 'steps': 966, 'loss/train': 3.9674785137176514} -09/20/2021 17:50:12 - INFO - __main__ - Step 15467: {'lr': 0.00019999050799601885, 'samples': 494944, 'steps': 966, 'loss/train': 4.037417411804199} -09/20/2021 17:50:13 - INFO - __main__ - Step 15468: {'lr': 0.00019999050799601885, 'samples': 494976, 'steps': 966, 'loss/train': 3.8833253383636475} -09/20/2021 17:50:14 - INFO - __main__ - Step 15469: {'lr': 0.00019999050799601885, 'samples': 495008, 'steps': 966, 'loss/train': 3.5254757404327393} -09/20/2021 17:50:15 - INFO - __main__ - Step 15470: {'lr': 0.00019999050799601885, 'samples': 495040, 'steps': 966, 'loss/train': 2.250178575515747} -09/20/2021 17:50:15 - INFO - __main__ - Step 15471: {'lr': 0.00019999050799601885, 'samples': 495072, 'steps': 966, 'loss/train': 2.418513298034668} -09/20/2021 17:50:16 - INFO - __main__ - Step 15472: {'lr': 0.00019999050799601885, 'samples': 495104, 'steps': 966, 'loss/train': 3.3306870460510254} -09/20/2021 17:50:17 - INFO - __main__ - Step 15473: {'lr': 0.00019999041990505313, 'samples': 495136, 'steps': 967, 'loss/train': 4.529281139373779} -09/20/2021 17:50:18 - INFO - __main__ - Step 15474: {'lr': 0.00019999041990505313, 'samples': 495168, 'steps': 967, 'loss/train': 3.7763500213623047} -09/20/2021 17:50:18 - INFO - __main__ - Step 15475: {'lr': 0.00019999041990505313, 'samples': 495200, 'steps': 967, 'loss/train': 5.636317253112793} -09/20/2021 17:50:19 - INFO - __main__ - Step 15476: {'lr': 0.00019999041990505313, 'samples': 495232, 'steps': 967, 'loss/train': 4.034103870391846} -09/20/2021 17:50:21 - INFO - __main__ - Step 15477: {'lr': 0.00019999041990505313, 'samples': 495264, 'steps': 967, 'loss/train': 3.844130039215088} -09/20/2021 17:50:21 - INFO - __main__ - Step 15478: {'lr': 0.00019999041990505313, 'samples': 495296, 'steps': 967, 'loss/train': 4.7058234214782715} -09/20/2021 17:50:22 - INFO - __main__ - Step 15479: {'lr': 0.00019999041990505313, 'samples': 495328, 'steps': 967, 'loss/train': 3.1494758129119873} -09/20/2021 17:50:23 - INFO - __main__ - Step 15480: {'lr': 0.00019999041990505313, 'samples': 495360, 'steps': 967, 'loss/train': 4.278605937957764} -09/20/2021 17:50:24 - INFO - __main__ - Step 15481: {'lr': 0.00019999041990505313, 'samples': 495392, 'steps': 967, 'loss/train': 3.35823655128479} -09/20/2021 17:50:24 - INFO - __main__ - Step 15482: {'lr': 0.00019999041990505313, 'samples': 495424, 'steps': 967, 'loss/train': 3.1367745399475098} -09/20/2021 17:50:25 - INFO - __main__ - Step 15483: {'lr': 0.00019999041990505313, 'samples': 495456, 'steps': 967, 'loss/train': 4.047829627990723} -09/20/2021 17:50:26 - INFO - __main__ - Step 15484: {'lr': 0.00019999041990505313, 'samples': 495488, 'steps': 967, 'loss/train': 2.3776729106903076} -09/20/2021 17:50:27 - INFO - __main__ - Step 15485: {'lr': 0.00019999041990505313, 'samples': 495520, 'steps': 967, 'loss/train': 4.26890230178833} -09/20/2021 17:50:27 - INFO - __main__ - Step 15486: {'lr': 0.00019999041990505313, 'samples': 495552, 'steps': 967, 'loss/train': 2.990880012512207} -09/20/2021 17:50:28 - INFO - __main__ - Step 15487: {'lr': 0.00019999041990505313, 'samples': 495584, 'steps': 967, 'loss/train': 4.252338409423828} -09/20/2021 17:50:29 - INFO - __main__ - Step 15488: {'lr': 0.00019999041990505313, 'samples': 495616, 'steps': 967, 'loss/train': 3.3828041553497314} -09/20/2021 17:50:30 - INFO - __main__ - Step 15489: {'lr': 0.0001999903314072267, 'samples': 495648, 'steps': 968, 'loss/train': 3.0456180572509766} -09/20/2021 17:50:30 - INFO - __main__ - Step 15490: {'lr': 0.0001999903314072267, 'samples': 495680, 'steps': 968, 'loss/train': 2.2284915447235107} -09/20/2021 17:50:31 - INFO - __main__ - Step 15491: {'lr': 0.0001999903314072267, 'samples': 495712, 'steps': 968, 'loss/train': 3.502208709716797} -09/20/2021 17:50:32 - INFO - __main__ - Step 15492: {'lr': 0.0001999903314072267, 'samples': 495744, 'steps': 968, 'loss/train': 4.049108982086182} -09/20/2021 17:50:33 - INFO - __main__ - Step 15493: {'lr': 0.0001999903314072267, 'samples': 495776, 'steps': 968, 'loss/train': 2.7363152503967285} -09/20/2021 17:50:33 - INFO - __main__ - Step 15494: {'lr': 0.0001999903314072267, 'samples': 495808, 'steps': 968, 'loss/train': 3.5726847648620605} -09/20/2021 17:50:34 - INFO - __main__ - Step 15495: {'lr': 0.0001999903314072267, 'samples': 495840, 'steps': 968, 'loss/train': 3.6956591606140137} -09/20/2021 17:50:35 - INFO - __main__ - Step 15496: {'lr': 0.0001999903314072267, 'samples': 495872, 'steps': 968, 'loss/train': 4.597193241119385} -09/20/2021 17:50:36 - INFO - __main__ - Step 15497: {'lr': 0.0001999903314072267, 'samples': 495904, 'steps': 968, 'loss/train': 2.1451056003570557} -09/20/2021 17:50:36 - INFO - __main__ - Step 15498: {'lr': 0.0001999903314072267, 'samples': 495936, 'steps': 968, 'loss/train': 4.068268775939941} -09/20/2021 17:50:37 - INFO - __main__ - Step 15499: {'lr': 0.0001999903314072267, 'samples': 495968, 'steps': 968, 'loss/train': 3.565836191177368} -09/20/2021 17:50:38 - INFO - __main__ - Step 15500: {'lr': 0.0001999903314072267, 'samples': 496000, 'steps': 968, 'loss/train': 4.077301979064941} -09/20/2021 17:50:39 - INFO - __main__ - Step 15501: {'lr': 0.0001999903314072267, 'samples': 496032, 'steps': 968, 'loss/train': 3.8878531455993652} -09/20/2021 17:50:39 - INFO - __main__ - Step 15502: {'lr': 0.0001999903314072267, 'samples': 496064, 'steps': 968, 'loss/train': 2.908829927444458} -09/20/2021 17:50:40 - INFO - __main__ - Step 15503: {'lr': 0.0001999903314072267, 'samples': 496096, 'steps': 968, 'loss/train': 5.863828182220459} -09/20/2021 17:50:41 - INFO - __main__ - Step 15504: {'lr': 0.0001999903314072267, 'samples': 496128, 'steps': 968, 'loss/train': 3.4330081939697266} -09/20/2021 17:50:42 - INFO - __main__ - Step 15505: {'lr': 0.00019999024250254006, 'samples': 496160, 'steps': 969, 'loss/train': 1.1848762035369873} -09/20/2021 17:50:43 - INFO - __main__ - Step 15506: {'lr': 0.00019999024250254006, 'samples': 496192, 'steps': 969, 'loss/train': 4.913367748260498} -09/20/2021 17:50:43 - INFO - __main__ - Step 15507: {'lr': 0.00019999024250254006, 'samples': 496224, 'steps': 969, 'loss/train': 6.168879508972168} -09/20/2021 17:50:45 - INFO - __main__ - Step 15508: {'lr': 0.00019999024250254006, 'samples': 496256, 'steps': 969, 'loss/train': 1.4060355424880981} -09/20/2021 17:50:45 - INFO - __main__ - Step 15509: {'lr': 0.00019999024250254006, 'samples': 496288, 'steps': 969, 'loss/train': 3.408432960510254} -09/20/2021 17:50:46 - INFO - __main__ - Step 15510: {'lr': 0.00019999024250254006, 'samples': 496320, 'steps': 969, 'loss/train': 3.736100435256958} -09/20/2021 17:50:47 - INFO - __main__ - Step 15511: {'lr': 0.00019999024250254006, 'samples': 496352, 'steps': 969, 'loss/train': 3.916964292526245} -09/20/2021 17:50:48 - INFO - __main__ - Step 15512: {'lr': 0.00019999024250254006, 'samples': 496384, 'steps': 969, 'loss/train': 4.023538589477539} -09/20/2021 17:50:48 - INFO - __main__ - Step 15513: {'lr': 0.00019999024250254006, 'samples': 496416, 'steps': 969, 'loss/train': 4.767122745513916} -09/20/2021 17:50:49 - INFO - __main__ - Step 15514: {'lr': 0.00019999024250254006, 'samples': 496448, 'steps': 969, 'loss/train': 4.7230634689331055} -09/20/2021 17:50:50 - INFO - __main__ - Step 15515: {'lr': 0.00019999024250254006, 'samples': 496480, 'steps': 969, 'loss/train': 3.9197771549224854} -09/20/2021 17:50:51 - INFO - __main__ - Step 15516: {'lr': 0.00019999024250254006, 'samples': 496512, 'steps': 969, 'loss/train': 4.303018093109131} -09/20/2021 17:50:51 - INFO - __main__ - Step 15517: {'lr': 0.00019999024250254006, 'samples': 496544, 'steps': 969, 'loss/train': 3.6342365741729736} -09/20/2021 17:50:52 - INFO - __main__ - Step 15518: {'lr': 0.00019999024250254006, 'samples': 496576, 'steps': 969, 'loss/train': 2.8394758701324463} -09/20/2021 17:50:53 - INFO - __main__ - Step 15519: {'lr': 0.00019999024250254006, 'samples': 496608, 'steps': 969, 'loss/train': 3.594820499420166} -09/20/2021 17:50:54 - INFO - __main__ - Step 15520: {'lr': 0.00019999024250254006, 'samples': 496640, 'steps': 969, 'loss/train': 3.4083211421966553} -09/20/2021 17:50:54 - INFO - __main__ - Step 15521: {'lr': 0.0001999901531909935, 'samples': 496672, 'steps': 970, 'loss/train': 3.368712902069092} -09/20/2021 17:50:55 - INFO - __main__ - Step 15522: {'lr': 0.0001999901531909935, 'samples': 496704, 'steps': 970, 'loss/train': 4.553531646728516} -09/20/2021 17:50:56 - INFO - __main__ - Step 15523: {'lr': 0.0001999901531909935, 'samples': 496736, 'steps': 970, 'loss/train': 2.920720338821411} -09/20/2021 17:50:57 - INFO - __main__ - Step 15524: {'lr': 0.0001999901531909935, 'samples': 496768, 'steps': 970, 'loss/train': 1.4950330257415771} -09/20/2021 17:50:57 - INFO - __main__ - Step 15525: {'lr': 0.0001999901531909935, 'samples': 496800, 'steps': 970, 'loss/train': 3.951267719268799} -09/20/2021 17:50:58 - INFO - __main__ - Step 15526: {'lr': 0.0001999901531909935, 'samples': 496832, 'steps': 970, 'loss/train': 4.173757076263428} -09/20/2021 17:50:59 - INFO - __main__ - Step 15527: {'lr': 0.0001999901531909935, 'samples': 496864, 'steps': 970, 'loss/train': 4.4405951499938965} -09/20/2021 17:51:00 - INFO - __main__ - Step 15528: {'lr': 0.0001999901531909935, 'samples': 496896, 'steps': 970, 'loss/train': 4.554479598999023} -09/20/2021 17:51:00 - INFO - __main__ - Step 15529: {'lr': 0.0001999901531909935, 'samples': 496928, 'steps': 970, 'loss/train': 3.3547818660736084} -09/20/2021 17:51:01 - INFO - __main__ - Step 15530: {'lr': 0.0001999901531909935, 'samples': 496960, 'steps': 970, 'loss/train': 4.516754150390625} -09/20/2021 17:51:02 - INFO - __main__ - Step 15531: {'lr': 0.0001999901531909935, 'samples': 496992, 'steps': 970, 'loss/train': 3.3575551509857178} -09/20/2021 17:51:03 - INFO - __main__ - Step 15532: {'lr': 0.0001999901531909935, 'samples': 497024, 'steps': 970, 'loss/train': 3.317713975906372} -09/20/2021 17:51:03 - INFO - __main__ - Step 15533: {'lr': 0.0001999901531909935, 'samples': 497056, 'steps': 970, 'loss/train': 3.4174675941467285} -09/20/2021 17:51:04 - INFO - __main__ - Step 15534: {'lr': 0.0001999901531909935, 'samples': 497088, 'steps': 970, 'loss/train': 3.521207332611084} -09/20/2021 17:51:05 - INFO - __main__ - Step 15535: {'lr': 0.0001999901531909935, 'samples': 497120, 'steps': 970, 'loss/train': 3.068398952484131} -09/20/2021 17:51:06 - INFO - __main__ - Step 15536: {'lr': 0.0001999901531909935, 'samples': 497152, 'steps': 970, 'loss/train': 4.053470134735107} -09/20/2021 17:51:07 - INFO - __main__ - Step 15537: {'lr': 0.0001999900634725874, 'samples': 497184, 'steps': 971, 'loss/train': 3.617158889770508} -09/20/2021 17:51:08 - INFO - __main__ - Step 15538: {'lr': 0.0001999900634725874, 'samples': 497216, 'steps': 971, 'loss/train': 3.1720895767211914} -09/20/2021 17:51:09 - INFO - __main__ - Step 15539: {'lr': 0.0001999900634725874, 'samples': 497248, 'steps': 971, 'loss/train': 0.9541934132575989} -09/20/2021 17:51:10 - INFO - __main__ - Step 15540: {'lr': 0.0001999900634725874, 'samples': 497280, 'steps': 971, 'loss/train': 1.246850848197937} -09/20/2021 17:51:11 - INFO - __main__ - Step 15541: {'lr': 0.0001999900634725874, 'samples': 497312, 'steps': 971, 'loss/train': 3.223706007003784} -09/20/2021 17:51:11 - INFO - __main__ - Step 15542: {'lr': 0.0001999900634725874, 'samples': 497344, 'steps': 971, 'loss/train': 5.1987762451171875} -09/20/2021 17:51:12 - INFO - __main__ - Step 15543: {'lr': 0.0001999900634725874, 'samples': 497376, 'steps': 971, 'loss/train': 3.3555612564086914} -09/20/2021 17:51:13 - INFO - __main__ - Step 15544: {'lr': 0.0001999900634725874, 'samples': 497408, 'steps': 971, 'loss/train': 3.174546718597412} -09/20/2021 17:51:14 - INFO - __main__ - Step 15545: {'lr': 0.0001999900634725874, 'samples': 497440, 'steps': 971, 'loss/train': 3.6519339084625244} -09/20/2021 17:51:14 - INFO - __main__ - Step 15546: {'lr': 0.0001999900634725874, 'samples': 497472, 'steps': 971, 'loss/train': 3.815666437149048} -09/20/2021 17:51:15 - INFO - __main__ - Step 15547: {'lr': 0.0001999900634725874, 'samples': 497504, 'steps': 971, 'loss/train': 3.1025004386901855} -09/20/2021 17:51:16 - INFO - __main__ - Step 15548: {'lr': 0.0001999900634725874, 'samples': 497536, 'steps': 971, 'loss/train': 1.1086899042129517} -09/20/2021 17:51:17 - INFO - __main__ - Step 15549: {'lr': 0.0001999900634725874, 'samples': 497568, 'steps': 971, 'loss/train': 4.692831516265869} -09/20/2021 17:51:17 - INFO - __main__ - Step 15550: {'lr': 0.0001999900634725874, 'samples': 497600, 'steps': 971, 'loss/train': 3.933811902999878} -09/20/2021 17:51:18 - INFO - __main__ - Step 15551: {'lr': 0.0001999900634725874, 'samples': 497632, 'steps': 971, 'loss/train': 4.493006706237793} -09/20/2021 17:51:19 - INFO - __main__ - Step 15552: {'lr': 0.0001999900634725874, 'samples': 497664, 'steps': 971, 'loss/train': 3.9021153450012207} -09/20/2021 17:51:20 - INFO - __main__ - Step 15553: {'lr': 0.0001999899733473221, 'samples': 497696, 'steps': 972, 'loss/train': 3.597290515899658} -09/20/2021 17:51:21 - INFO - __main__ - Step 15554: {'lr': 0.0001999899733473221, 'samples': 497728, 'steps': 972, 'loss/train': 4.374988079071045} -09/20/2021 17:51:21 - INFO - __main__ - Step 15555: {'lr': 0.0001999899733473221, 'samples': 497760, 'steps': 972, 'loss/train': 4.1182684898376465} -09/20/2021 17:51:22 - INFO - __main__ - Step 15556: {'lr': 0.0001999899733473221, 'samples': 497792, 'steps': 972, 'loss/train': 3.8587493896484375} -09/20/2021 17:51:23 - INFO - __main__ - Step 15557: {'lr': 0.0001999899733473221, 'samples': 497824, 'steps': 972, 'loss/train': 3.935605525970459} -09/20/2021 17:51:24 - INFO - __main__ - Step 15558: {'lr': 0.0001999899733473221, 'samples': 497856, 'steps': 972, 'loss/train': 3.5611376762390137} -09/20/2021 17:51:24 - INFO - __main__ - Step 15559: {'lr': 0.0001999899733473221, 'samples': 497888, 'steps': 972, 'loss/train': 4.864984035491943} -09/20/2021 17:51:25 - INFO - __main__ - Step 15560: {'lr': 0.0001999899733473221, 'samples': 497920, 'steps': 972, 'loss/train': 4.400440692901611} -09/20/2021 17:51:26 - INFO - __main__ - Step 15561: {'lr': 0.0001999899733473221, 'samples': 497952, 'steps': 972, 'loss/train': 3.570797920227051} -09/20/2021 17:51:27 - INFO - __main__ - Step 15562: {'lr': 0.0001999899733473221, 'samples': 497984, 'steps': 972, 'loss/train': 3.903348684310913} -09/20/2021 17:51:27 - INFO - __main__ - Step 15563: {'lr': 0.0001999899733473221, 'samples': 498016, 'steps': 972, 'loss/train': 4.116324424743652} -09/20/2021 17:51:28 - INFO - __main__ - Step 15564: {'lr': 0.0001999899733473221, 'samples': 498048, 'steps': 972, 'loss/train': 3.524843215942383} -09/20/2021 17:51:29 - INFO - __main__ - Step 15565: {'lr': 0.0001999899733473221, 'samples': 498080, 'steps': 972, 'loss/train': 4.077313423156738} -09/20/2021 17:51:30 - INFO - __main__ - Step 15566: {'lr': 0.0001999899733473221, 'samples': 498112, 'steps': 972, 'loss/train': 4.67933464050293} -09/20/2021 17:51:30 - INFO - __main__ - Step 15567: {'lr': 0.0001999899733473221, 'samples': 498144, 'steps': 972, 'loss/train': 4.395967483520508} -09/20/2021 17:51:31 - INFO - __main__ - Step 15568: {'lr': 0.0001999899733473221, 'samples': 498176, 'steps': 972, 'loss/train': 5.2856221199035645} -09/20/2021 17:51:33 - INFO - __main__ - Step 15569: {'lr': 0.000199989882815198, 'samples': 498208, 'steps': 973, 'loss/train': 3.2566473484039307} -09/20/2021 17:51:33 - INFO - __main__ - Step 15570: {'lr': 0.000199989882815198, 'samples': 498240, 'steps': 973, 'loss/train': 2.9752182960510254} -09/20/2021 17:51:34 - INFO - __main__ - Step 15571: {'lr': 0.000199989882815198, 'samples': 498272, 'steps': 973, 'loss/train': 3.8662595748901367} -09/20/2021 17:51:35 - INFO - __main__ - Step 15572: {'lr': 0.000199989882815198, 'samples': 498304, 'steps': 973, 'loss/train': 3.520627975463867} -09/20/2021 17:51:36 - INFO - __main__ - Step 15573: {'lr': 0.000199989882815198, 'samples': 498336, 'steps': 973, 'loss/train': 3.3922431468963623} -09/20/2021 17:51:36 - INFO - __main__ - Step 15574: {'lr': 0.000199989882815198, 'samples': 498368, 'steps': 973, 'loss/train': 3.9149677753448486} -09/20/2021 17:51:37 - INFO - __main__ - Step 15575: {'lr': 0.000199989882815198, 'samples': 498400, 'steps': 973, 'loss/train': 3.5352699756622314} -09/20/2021 17:51:38 - INFO - __main__ - Step 15576: {'lr': 0.000199989882815198, 'samples': 498432, 'steps': 973, 'loss/train': 3.1632237434387207} -09/20/2021 17:51:39 - INFO - __main__ - Step 15577: {'lr': 0.000199989882815198, 'samples': 498464, 'steps': 973, 'loss/train': 3.035367012023926} -09/20/2021 17:51:39 - INFO - __main__ - Step 15578: {'lr': 0.000199989882815198, 'samples': 498496, 'steps': 973, 'loss/train': 6.132573127746582} -09/20/2021 17:51:40 - INFO - __main__ - Step 15579: {'lr': 0.000199989882815198, 'samples': 498528, 'steps': 973, 'loss/train': 3.8739991188049316} -09/20/2021 17:51:41 - INFO - __main__ - Step 15580: {'lr': 0.000199989882815198, 'samples': 498560, 'steps': 973, 'loss/train': 0.6291259527206421} -09/20/2021 17:51:42 - INFO - __main__ - Step 15581: {'lr': 0.000199989882815198, 'samples': 498592, 'steps': 973, 'loss/train': 4.0214715003967285} -09/20/2021 17:51:42 - INFO - __main__ - Step 15582: {'lr': 0.000199989882815198, 'samples': 498624, 'steps': 973, 'loss/train': 2.2569494247436523} -09/20/2021 17:51:43 - INFO - __main__ - Step 15583: {'lr': 0.000199989882815198, 'samples': 498656, 'steps': 973, 'loss/train': 0.6171169281005859} -09/20/2021 17:51:44 - INFO - __main__ - Step 15584: {'lr': 0.000199989882815198, 'samples': 498688, 'steps': 973, 'loss/train': 4.116447925567627} -09/20/2021 17:51:45 - INFO - __main__ - Step 15585: {'lr': 0.00019998979187621542, 'samples': 498720, 'steps': 974, 'loss/train': 3.786821126937866} -09/20/2021 17:51:46 - INFO - __main__ - Step 15586: {'lr': 0.00019998979187621542, 'samples': 498752, 'steps': 974, 'loss/train': 3.924081802368164} -09/20/2021 17:51:46 - INFO - __main__ - Step 15587: {'lr': 0.00019998979187621542, 'samples': 498784, 'steps': 974, 'loss/train': 3.368699312210083} -09/20/2021 17:51:47 - INFO - __main__ - Step 15588: {'lr': 0.00019998979187621542, 'samples': 498816, 'steps': 974, 'loss/train': 4.445293426513672} -09/20/2021 17:51:48 - INFO - __main__ - Step 15589: {'lr': 0.00019998979187621542, 'samples': 498848, 'steps': 974, 'loss/train': 1.9764013290405273} -09/20/2021 17:51:49 - INFO - __main__ - Step 15590: {'lr': 0.00019998979187621542, 'samples': 498880, 'steps': 974, 'loss/train': 1.1063538789749146} -09/20/2021 17:51:49 - INFO - __main__ - Step 15591: {'lr': 0.00019998979187621542, 'samples': 498912, 'steps': 974, 'loss/train': 1.5640087127685547} -09/20/2021 17:51:50 - INFO - __main__ - Step 15592: {'lr': 0.00019998979187621542, 'samples': 498944, 'steps': 974, 'loss/train': 0.8527233600616455} -09/20/2021 17:51:51 - INFO - __main__ - Step 15593: {'lr': 0.00019998979187621542, 'samples': 498976, 'steps': 974, 'loss/train': 0.8820142149925232} -09/20/2021 17:51:52 - INFO - __main__ - Step 15594: {'lr': 0.00019998979187621542, 'samples': 499008, 'steps': 974, 'loss/train': 3.2949752807617188} -09/20/2021 17:51:52 - INFO - __main__ - Step 15595: {'lr': 0.00019998979187621542, 'samples': 499040, 'steps': 974, 'loss/train': 4.209493637084961} -09/20/2021 17:51:53 - INFO - __main__ - Step 15596: {'lr': 0.00019998979187621542, 'samples': 499072, 'steps': 974, 'loss/train': 3.1518259048461914} -09/20/2021 17:51:54 - INFO - __main__ - Step 15597: {'lr': 0.00019998979187621542, 'samples': 499104, 'steps': 974, 'loss/train': 4.545456886291504} -09/20/2021 17:51:54 - INFO - __main__ - Step 15598: {'lr': 0.00019998979187621542, 'samples': 499136, 'steps': 974, 'loss/train': 3.329596996307373} -09/20/2021 17:51:55 - INFO - __main__ - Step 15599: {'lr': 0.00019998979187621542, 'samples': 499168, 'steps': 974, 'loss/train': 3.20947527885437} -09/20/2021 17:51:57 - INFO - __main__ - Step 15600: {'lr': 0.00019998979187621542, 'samples': 499200, 'steps': 974, 'loss/train': 2.7873547077178955} -09/20/2021 17:51:58 - INFO - __main__ - Step 15601: {'lr': 0.0001999897005303748, 'samples': 499232, 'steps': 975, 'loss/train': 3.865007162094116} -09/20/2021 17:51:58 - INFO - __main__ - Step 15602: {'lr': 0.0001999897005303748, 'samples': 499264, 'steps': 975, 'loss/train': 3.657151937484741} -09/20/2021 17:51:59 - INFO - __main__ - Step 15603: {'lr': 0.0001999897005303748, 'samples': 499296, 'steps': 975, 'loss/train': 3.335709810256958} -09/20/2021 17:52:00 - INFO - __main__ - Step 15604: {'lr': 0.0001999897005303748, 'samples': 499328, 'steps': 975, 'loss/train': 3.9065098762512207} -09/20/2021 17:52:01 - INFO - __main__ - Step 15605: {'lr': 0.0001999897005303748, 'samples': 499360, 'steps': 975, 'loss/train': 1.1403229236602783} -09/20/2021 17:52:01 - INFO - __main__ - Step 15606: {'lr': 0.0001999897005303748, 'samples': 499392, 'steps': 975, 'loss/train': 3.7656660079956055} -09/20/2021 17:52:02 - INFO - __main__ - Step 15607: {'lr': 0.0001999897005303748, 'samples': 499424, 'steps': 975, 'loss/train': 3.4572296142578125} -09/20/2021 17:52:03 - INFO - __main__ - Step 15608: {'lr': 0.0001999897005303748, 'samples': 499456, 'steps': 975, 'loss/train': 3.5201306343078613} -09/20/2021 17:52:04 - INFO - __main__ - Step 15609: {'lr': 0.0001999897005303748, 'samples': 499488, 'steps': 975, 'loss/train': 4.145495891571045} -09/20/2021 17:52:04 - INFO - __main__ - Step 15610: {'lr': 0.0001999897005303748, 'samples': 499520, 'steps': 975, 'loss/train': 4.966415882110596} -09/20/2021 17:52:05 - INFO - __main__ - Step 15611: {'lr': 0.0001999897005303748, 'samples': 499552, 'steps': 975, 'loss/train': 3.950831174850464} -09/20/2021 17:52:06 - INFO - __main__ - Step 15612: {'lr': 0.0001999897005303748, 'samples': 499584, 'steps': 975, 'loss/train': 3.3853919506073} -09/20/2021 17:52:07 - INFO - __main__ - Step 15613: {'lr': 0.0001999897005303748, 'samples': 499616, 'steps': 975, 'loss/train': 4.023794174194336} -09/20/2021 17:52:07 - INFO - __main__ - Step 15614: {'lr': 0.0001999897005303748, 'samples': 499648, 'steps': 975, 'loss/train': 4.391129493713379} -09/20/2021 17:52:08 - INFO - __main__ - Step 15615: {'lr': 0.0001999897005303748, 'samples': 499680, 'steps': 975, 'loss/train': 0.9586086869239807} -09/20/2021 17:52:09 - INFO - __main__ - Step 15616: {'lr': 0.0001999897005303748, 'samples': 499712, 'steps': 975, 'loss/train': 3.6062352657318115} -09/20/2021 17:52:10 - INFO - __main__ - Step 15617: {'lr': 0.00019998960877767646, 'samples': 499744, 'steps': 976, 'loss/train': 3.8969266414642334} -09/20/2021 17:52:10 - INFO - __main__ - Step 15618: {'lr': 0.00019998960877767646, 'samples': 499776, 'steps': 976, 'loss/train': 3.788522243499756} -09/20/2021 17:52:11 - INFO - __main__ - Step 15619: {'lr': 0.00019998960877767646, 'samples': 499808, 'steps': 976, 'loss/train': 3.7178194522857666} -09/20/2021 17:52:12 - INFO - __main__ - Step 15620: {'lr': 0.00019998960877767646, 'samples': 499840, 'steps': 976, 'loss/train': 3.1741020679473877} -09/20/2021 17:52:13 - INFO - __main__ - Step 15621: {'lr': 0.00019998960877767646, 'samples': 499872, 'steps': 976, 'loss/train': 4.333766937255859} -09/20/2021 17:52:13 - INFO - __main__ - Step 15622: {'lr': 0.00019998960877767646, 'samples': 499904, 'steps': 976, 'loss/train': 0.9017714262008667} -09/20/2021 17:52:14 - INFO - __main__ - Step 15623: {'lr': 0.00019998960877767646, 'samples': 499936, 'steps': 976, 'loss/train': 4.829098701477051} -09/20/2021 17:52:15 - INFO - __main__ - Step 15624: {'lr': 0.00019998960877767646, 'samples': 499968, 'steps': 976, 'loss/train': 3.7374660968780518} -09/20/2021 17:52:16 - INFO - __main__ - Step 15625: {'lr': 0.00019998960877767646, 'samples': 500000, 'steps': 976, 'loss/train': 3.2748687267303467} -09/20/2021 17:52:16 - INFO - __main__ - Step 15626: {'lr': 0.00019998960877767646, 'samples': 500032, 'steps': 976, 'loss/train': 3.1313092708587646} -09/20/2021 17:52:17 - INFO - __main__ - Step 15627: {'lr': 0.00019998960877767646, 'samples': 500064, 'steps': 976, 'loss/train': 4.64542293548584} -09/20/2021 17:52:18 - INFO - __main__ - Step 15628: {'lr': 0.00019998960877767646, 'samples': 500096, 'steps': 976, 'loss/train': 3.89001727104187} -09/20/2021 17:52:19 - INFO - __main__ - Step 15629: {'lr': 0.00019998960877767646, 'samples': 500128, 'steps': 976, 'loss/train': 3.006126642227173} -09/20/2021 17:52:19 - INFO - __main__ - Step 15630: {'lr': 0.00019998960877767646, 'samples': 500160, 'steps': 976, 'loss/train': 4.357333660125732} -09/20/2021 17:52:21 - INFO - __main__ - Step 15631: {'lr': 0.00019998960877767646, 'samples': 500192, 'steps': 976, 'loss/train': 3.148820161819458} -09/20/2021 17:52:22 - INFO - __main__ - Step 15632: {'lr': 0.00019998960877767646, 'samples': 500224, 'steps': 976, 'loss/train': 3.608330249786377} -09/20/2021 17:52:22 - INFO - __main__ - Step 15633: {'lr': 0.0001999895166181208, 'samples': 500256, 'steps': 977, 'loss/train': 2.1353771686553955} -09/20/2021 17:52:23 - INFO - __main__ - Step 15634: {'lr': 0.0001999895166181208, 'samples': 500288, 'steps': 977, 'loss/train': 3.7013611793518066} -09/20/2021 17:52:24 - INFO - __main__ - Step 15635: {'lr': 0.0001999895166181208, 'samples': 500320, 'steps': 977, 'loss/train': 4.078956127166748} -09/20/2021 17:52:25 - INFO - __main__ - Step 15636: {'lr': 0.0001999895166181208, 'samples': 500352, 'steps': 977, 'loss/train': 2.954307794570923} -09/20/2021 17:52:25 - INFO - __main__ - Step 15637: {'lr': 0.0001999895166181208, 'samples': 500384, 'steps': 977, 'loss/train': 3.3710148334503174} -09/20/2021 17:52:26 - INFO - __main__ - Step 15638: {'lr': 0.0001999895166181208, 'samples': 500416, 'steps': 977, 'loss/train': 3.5391793251037598} -09/20/2021 17:52:27 - INFO - __main__ - Step 15639: {'lr': 0.0001999895166181208, 'samples': 500448, 'steps': 977, 'loss/train': 3.307457685470581} -09/20/2021 17:52:28 - INFO - __main__ - Step 15640: {'lr': 0.0001999895166181208, 'samples': 500480, 'steps': 977, 'loss/train': 3.160266160964966} -09/20/2021 17:52:28 - INFO - __main__ - Step 15641: {'lr': 0.0001999895166181208, 'samples': 500512, 'steps': 977, 'loss/train': 3.811797618865967} -09/20/2021 17:52:29 - INFO - __main__ - Step 15642: {'lr': 0.0001999895166181208, 'samples': 500544, 'steps': 977, 'loss/train': 1.1107995510101318} -09/20/2021 17:52:30 - INFO - __main__ - Step 15643: {'lr': 0.0001999895166181208, 'samples': 500576, 'steps': 977, 'loss/train': 0.6471940279006958} -09/20/2021 17:52:31 - INFO - __main__ - Step 15644: {'lr': 0.0001999895166181208, 'samples': 500608, 'steps': 977, 'loss/train': 0.8877522945404053} -09/20/2021 17:52:31 - INFO - __main__ - Step 15645: {'lr': 0.0001999895166181208, 'samples': 500640, 'steps': 977, 'loss/train': 4.9239583015441895} -09/20/2021 17:52:32 - INFO - __main__ - Step 15646: {'lr': 0.0001999895166181208, 'samples': 500672, 'steps': 977, 'loss/train': 3.965597629547119} -09/20/2021 17:52:33 - INFO - __main__ - Step 15647: {'lr': 0.0001999895166181208, 'samples': 500704, 'steps': 977, 'loss/train': 3.706423282623291} -09/20/2021 17:52:34 - INFO - __main__ - Step 15648: {'lr': 0.0001999895166181208, 'samples': 500736, 'steps': 977, 'loss/train': 3.9913957118988037} -09/20/2021 17:52:35 - INFO - __main__ - Step 15649: {'lr': 0.00019998942405170822, 'samples': 500768, 'steps': 978, 'loss/train': 3.106586217880249} -09/20/2021 17:52:35 - INFO - __main__ - Step 15650: {'lr': 0.00019998942405170822, 'samples': 500800, 'steps': 978, 'loss/train': 3.5538084506988525} -09/20/2021 17:52:36 - INFO - __main__ - Step 15651: {'lr': 0.00019998942405170822, 'samples': 500832, 'steps': 978, 'loss/train': 4.453087329864502} -09/20/2021 17:52:37 - INFO - __main__ - Step 15652: {'lr': 0.00019998942405170822, 'samples': 500864, 'steps': 978, 'loss/train': 3.817089796066284} -09/20/2021 17:52:38 - INFO - __main__ - Step 15653: {'lr': 0.00019998942405170822, 'samples': 500896, 'steps': 978, 'loss/train': 3.944350004196167} -09/20/2021 17:52:38 - INFO - __main__ - Step 15654: {'lr': 0.00019998942405170822, 'samples': 500928, 'steps': 978, 'loss/train': 3.8037853240966797} -09/20/2021 17:52:39 - INFO - __main__ - Step 15655: {'lr': 0.00019998942405170822, 'samples': 500960, 'steps': 978, 'loss/train': 3.5621747970581055} -09/20/2021 17:52:40 - INFO - __main__ - Step 15656: {'lr': 0.00019998942405170822, 'samples': 500992, 'steps': 978, 'loss/train': 3.275416135787964} -09/20/2021 17:52:41 - INFO - __main__ - Step 15657: {'lr': 0.00019998942405170822, 'samples': 501024, 'steps': 978, 'loss/train': 3.058722496032715} -09/20/2021 17:52:41 - INFO - __main__ - Step 15658: {'lr': 0.00019998942405170822, 'samples': 501056, 'steps': 978, 'loss/train': 3.29244065284729} -09/20/2021 17:52:42 - INFO - __main__ - Step 15659: {'lr': 0.00019998942405170822, 'samples': 501088, 'steps': 978, 'loss/train': 4.404748439788818} -09/20/2021 17:52:43 - INFO - __main__ - Step 15660: {'lr': 0.00019998942405170822, 'samples': 501120, 'steps': 978, 'loss/train': 4.575806140899658} -09/20/2021 17:52:44 - INFO - __main__ - Step 15661: {'lr': 0.00019998942405170822, 'samples': 501152, 'steps': 978, 'loss/train': 4.37198543548584} -09/20/2021 17:52:45 - INFO - __main__ - Step 15662: {'lr': 0.00019998942405170822, 'samples': 501184, 'steps': 978, 'loss/train': 4.585623741149902} -09/20/2021 17:52:46 - INFO - __main__ - Step 15663: {'lr': 0.00019998942405170822, 'samples': 501216, 'steps': 978, 'loss/train': 3.7112913131713867} -09/20/2021 17:52:46 - INFO - __main__ - Step 15664: {'lr': 0.00019998942405170822, 'samples': 501248, 'steps': 978, 'loss/train': 4.957189559936523} -09/20/2021 17:52:47 - INFO - __main__ - Step 15665: {'lr': 0.00019998933107843902, 'samples': 501280, 'steps': 979, 'loss/train': 3.2685959339141846} -09/20/2021 17:52:48 - INFO - __main__ - Step 15666: {'lr': 0.00019998933107843902, 'samples': 501312, 'steps': 979, 'loss/train': 2.907823324203491} -09/20/2021 17:52:49 - INFO - __main__ - Step 15667: {'lr': 0.00019998933107843902, 'samples': 501344, 'steps': 979, 'loss/train': 4.521307468414307} -09/20/2021 17:52:50 - INFO - __main__ - Step 15668: {'lr': 0.00019998933107843902, 'samples': 501376, 'steps': 979, 'loss/train': 3.467026472091675} -09/20/2021 17:52:50 - INFO - __main__ - Step 15669: {'lr': 0.00019998933107843902, 'samples': 501408, 'steps': 979, 'loss/train': 3.6265859603881836} -09/20/2021 17:52:51 - INFO - __main__ - Step 15670: {'lr': 0.00019998933107843902, 'samples': 501440, 'steps': 979, 'loss/train': 1.2089229822158813} -09/20/2021 17:52:52 - INFO - __main__ - Step 15671: {'lr': 0.00019998933107843902, 'samples': 501472, 'steps': 979, 'loss/train': 3.989795684814453} -09/20/2021 17:52:53 - INFO - __main__ - Step 15672: {'lr': 0.00019998933107843902, 'samples': 501504, 'steps': 979, 'loss/train': 3.648200035095215} -09/20/2021 17:52:53 - INFO - __main__ - Step 15673: {'lr': 0.00019998933107843902, 'samples': 501536, 'steps': 979, 'loss/train': 4.577778339385986} -09/20/2021 17:52:54 - INFO - __main__ - Step 15674: {'lr': 0.00019998933107843902, 'samples': 501568, 'steps': 979, 'loss/train': 3.6090574264526367} -09/20/2021 17:52:55 - INFO - __main__ - Step 15675: {'lr': 0.00019998933107843902, 'samples': 501600, 'steps': 979, 'loss/train': 3.295799970626831} -09/20/2021 17:52:56 - INFO - __main__ - Step 15676: {'lr': 0.00019998933107843902, 'samples': 501632, 'steps': 979, 'loss/train': 1.174192190170288} -09/20/2021 17:52:56 - INFO - __main__ - Step 15677: {'lr': 0.00019998933107843902, 'samples': 501664, 'steps': 979, 'loss/train': 2.4245688915252686} -09/20/2021 17:52:57 - INFO - __main__ - Step 15678: {'lr': 0.00019998933107843902, 'samples': 501696, 'steps': 979, 'loss/train': 3.664276361465454} -09/20/2021 17:52:58 - INFO - __main__ - Step 15679: {'lr': 0.00019998933107843902, 'samples': 501728, 'steps': 979, 'loss/train': 4.250544548034668} -09/20/2021 17:52:59 - INFO - __main__ - Step 15680: {'lr': 0.00019998933107843902, 'samples': 501760, 'steps': 979, 'loss/train': 4.032130241394043} -09/20/2021 17:52:59 - INFO - __main__ - Step 15681: {'lr': 0.00019998923769831364, 'samples': 501792, 'steps': 980, 'loss/train': 3.588466167449951} -09/20/2021 17:53:00 - INFO - __main__ - Step 15682: {'lr': 0.00019998923769831364, 'samples': 501824, 'steps': 980, 'loss/train': 3.51802659034729} -09/20/2021 17:53:01 - INFO - __main__ - Step 15683: {'lr': 0.00019998923769831364, 'samples': 501856, 'steps': 980, 'loss/train': 4.156248092651367} -09/20/2021 17:53:02 - INFO - __main__ - Step 15684: {'lr': 0.00019998923769831364, 'samples': 501888, 'steps': 980, 'loss/train': 3.4777848720550537} -09/20/2021 17:53:02 - INFO - __main__ - Step 15685: {'lr': 0.00019998923769831364, 'samples': 501920, 'steps': 980, 'loss/train': 3.6892592906951904} -09/20/2021 17:53:03 - INFO - __main__ - Step 15686: {'lr': 0.00019998923769831364, 'samples': 501952, 'steps': 980, 'loss/train': 2.3349075317382812} -09/20/2021 17:53:04 - INFO - __main__ - Step 15687: {'lr': 0.00019998923769831364, 'samples': 501984, 'steps': 980, 'loss/train': 3.372523307800293} -09/20/2021 17:53:05 - INFO - __main__ - Step 15688: {'lr': 0.00019998923769831364, 'samples': 502016, 'steps': 980, 'loss/train': 0.4864799678325653} -09/20/2021 17:53:05 - INFO - __main__ - Step 15689: {'lr': 0.00019998923769831364, 'samples': 502048, 'steps': 980, 'loss/train': 4.188755035400391} -09/20/2021 17:53:06 - INFO - __main__ - Step 15690: {'lr': 0.00019998923769831364, 'samples': 502080, 'steps': 980, 'loss/train': 3.2645766735076904} -09/20/2021 17:53:07 - INFO - __main__ - Step 15691: {'lr': 0.00019998923769831364, 'samples': 502112, 'steps': 980, 'loss/train': 4.567110061645508} -09/20/2021 17:53:08 - INFO - __main__ - Step 15692: {'lr': 0.00019998923769831364, 'samples': 502144, 'steps': 980, 'loss/train': 4.689562797546387} -09/20/2021 17:53:09 - INFO - __main__ - Step 15693: {'lr': 0.00019998923769831364, 'samples': 502176, 'steps': 980, 'loss/train': 3.3124890327453613} -09/20/2021 17:53:10 - INFO - __main__ - Step 15694: {'lr': 0.00019998923769831364, 'samples': 502208, 'steps': 980, 'loss/train': 3.086172103881836} -09/20/2021 17:53:11 - INFO - __main__ - Step 15695: {'lr': 0.00019998923769831364, 'samples': 502240, 'steps': 980, 'loss/train': 3.1168811321258545} -09/20/2021 17:53:11 - INFO - __main__ - Step 15696: {'lr': 0.00019998923769831364, 'samples': 502272, 'steps': 980, 'loss/train': 3.3481056690216064} -09/20/2021 17:53:12 - INFO - __main__ - Step 15697: {'lr': 0.00019998914391133242, 'samples': 502304, 'steps': 981, 'loss/train': 2.7666850090026855} -09/20/2021 17:53:13 - INFO - __main__ - Step 15698: {'lr': 0.00019998914391133242, 'samples': 502336, 'steps': 981, 'loss/train': 3.8500783443450928} -09/20/2021 17:53:14 - INFO - __main__ - Step 15699: {'lr': 0.00019998914391133242, 'samples': 502368, 'steps': 981, 'loss/train': 3.615238666534424} -09/20/2021 17:53:14 - INFO - __main__ - Step 15700: {'lr': 0.00019998914391133242, 'samples': 502400, 'steps': 981, 'loss/train': 4.378839492797852} -09/20/2021 17:53:15 - INFO - __main__ - Step 15701: {'lr': 0.00019998914391133242, 'samples': 502432, 'steps': 981, 'loss/train': 3.6758530139923096} -09/20/2021 17:53:16 - INFO - __main__ - Step 15702: {'lr': 0.00019998914391133242, 'samples': 502464, 'steps': 981, 'loss/train': 3.2463817596435547} -09/20/2021 17:53:17 - INFO - __main__ - Step 15703: {'lr': 0.00019998914391133242, 'samples': 502496, 'steps': 981, 'loss/train': 4.2016682624816895} -09/20/2021 17:53:17 - INFO - __main__ - Step 15704: {'lr': 0.00019998914391133242, 'samples': 502528, 'steps': 981, 'loss/train': 3.8306984901428223} -09/20/2021 17:53:18 - INFO - __main__ - Step 15705: {'lr': 0.00019998914391133242, 'samples': 502560, 'steps': 981, 'loss/train': 3.807548999786377} -09/20/2021 17:53:19 - INFO - __main__ - Step 15706: {'lr': 0.00019998914391133242, 'samples': 502592, 'steps': 981, 'loss/train': 3.3776752948760986} -09/20/2021 17:53:20 - INFO - __main__ - Step 15707: {'lr': 0.00019998914391133242, 'samples': 502624, 'steps': 981, 'loss/train': 3.5825035572052} -09/20/2021 17:53:20 - INFO - __main__ - Step 15708: {'lr': 0.00019998914391133242, 'samples': 502656, 'steps': 981, 'loss/train': 0.5322588086128235} -09/20/2021 17:53:21 - INFO - __main__ - Step 15709: {'lr': 0.00019998914391133242, 'samples': 502688, 'steps': 981, 'loss/train': 4.744424343109131} -09/20/2021 17:53:22 - INFO - __main__ - Step 15710: {'lr': 0.00019998914391133242, 'samples': 502720, 'steps': 981, 'loss/train': 4.33983039855957} -09/20/2021 17:53:23 - INFO - __main__ - Step 15711: {'lr': 0.00019998914391133242, 'samples': 502752, 'steps': 981, 'loss/train': 3.803800582885742} -09/20/2021 17:53:23 - INFO - __main__ - Step 15712: {'lr': 0.00019998914391133242, 'samples': 502784, 'steps': 981, 'loss/train': 3.668105125427246} -09/20/2021 17:53:24 - INFO - __main__ - Step 15713: {'lr': 0.00019998904971749577, 'samples': 502816, 'steps': 982, 'loss/train': 4.279098987579346} -09/20/2021 17:53:25 - INFO - __main__ - Step 15714: {'lr': 0.00019998904971749577, 'samples': 502848, 'steps': 982, 'loss/train': 3.9963157176971436} -09/20/2021 17:53:26 - INFO - __main__ - Step 15715: {'lr': 0.00019998904971749577, 'samples': 502880, 'steps': 982, 'loss/train': 4.851997375488281} -09/20/2021 17:53:27 - INFO - __main__ - Step 15716: {'lr': 0.00019998904971749577, 'samples': 502912, 'steps': 982, 'loss/train': 3.10443377494812} -09/20/2021 17:53:27 - INFO - __main__ - Step 15717: {'lr': 0.00019998904971749577, 'samples': 502944, 'steps': 982, 'loss/train': 3.499799966812134} -09/20/2021 17:53:28 - INFO - __main__ - Step 15718: {'lr': 0.00019998904971749577, 'samples': 502976, 'steps': 982, 'loss/train': 4.140439033508301} -09/20/2021 17:53:29 - INFO - __main__ - Step 15719: {'lr': 0.00019998904971749577, 'samples': 503008, 'steps': 982, 'loss/train': 2.5152981281280518} -09/20/2021 17:53:30 - INFO - __main__ - Step 15720: {'lr': 0.00019998904971749577, 'samples': 503040, 'steps': 982, 'loss/train': 3.371954917907715} -09/20/2021 17:53:30 - INFO - __main__ - Step 15721: {'lr': 0.00019998904971749577, 'samples': 503072, 'steps': 982, 'loss/train': 3.6869330406188965} -09/20/2021 17:53:32 - INFO - __main__ - Step 15722: {'lr': 0.00019998904971749577, 'samples': 503104, 'steps': 982, 'loss/train': 4.411525249481201} -09/20/2021 17:53:32 - INFO - __main__ - Step 15723: {'lr': 0.00019998904971749577, 'samples': 503136, 'steps': 982, 'loss/train': 5.075201511383057} -09/20/2021 17:53:33 - INFO - __main__ - Step 15724: {'lr': 0.00019998904971749577, 'samples': 503168, 'steps': 982, 'loss/train': 3.25459885597229} -09/20/2021 17:53:34 - INFO - __main__ - Step 15725: {'lr': 0.00019998904971749577, 'samples': 503200, 'steps': 982, 'loss/train': 3.2622034549713135} -09/20/2021 17:53:35 - INFO - __main__ - Step 15726: {'lr': 0.00019998904971749577, 'samples': 503232, 'steps': 982, 'loss/train': 3.6800100803375244} -09/20/2021 17:53:35 - INFO - __main__ - Step 15727: {'lr': 0.00019998904971749577, 'samples': 503264, 'steps': 982, 'loss/train': 4.201226234436035} -09/20/2021 17:53:36 - INFO - __main__ - Step 15728: {'lr': 0.00019998904971749577, 'samples': 503296, 'steps': 982, 'loss/train': 3.9123287200927734} -09/20/2021 17:53:37 - INFO - __main__ - Step 15729: {'lr': 0.00019998895511680407, 'samples': 503328, 'steps': 983, 'loss/train': 3.9432449340820312} -09/20/2021 17:53:38 - INFO - __main__ - Step 15730: {'lr': 0.00019998895511680407, 'samples': 503360, 'steps': 983, 'loss/train': 4.537878513336182} -09/20/2021 17:53:38 - INFO - __main__ - Step 15731: {'lr': 0.00019998895511680407, 'samples': 503392, 'steps': 983, 'loss/train': 3.443787097930908} -09/20/2021 17:53:39 - INFO - __main__ - Step 15732: {'lr': 0.00019998895511680407, 'samples': 503424, 'steps': 983, 'loss/train': 3.7268173694610596} -09/20/2021 17:53:40 - INFO - __main__ - Step 15733: {'lr': 0.00019998895511680407, 'samples': 503456, 'steps': 983, 'loss/train': 3.1473307609558105} -09/20/2021 17:53:41 - INFO - __main__ - Step 15734: {'lr': 0.00019998895511680407, 'samples': 503488, 'steps': 983, 'loss/train': 3.7384955883026123} -09/20/2021 17:53:41 - INFO - __main__ - Step 15735: {'lr': 0.00019998895511680407, 'samples': 503520, 'steps': 983, 'loss/train': 3.5855321884155273} -09/20/2021 17:53:42 - INFO - __main__ - Step 15736: {'lr': 0.00019998895511680407, 'samples': 503552, 'steps': 983, 'loss/train': 3.1496784687042236} -09/20/2021 17:53:43 - INFO - __main__ - Step 15737: {'lr': 0.00019998895511680407, 'samples': 503584, 'steps': 983, 'loss/train': 5.280541896820068} -09/20/2021 17:53:44 - INFO - __main__ - Step 15738: {'lr': 0.00019998895511680407, 'samples': 503616, 'steps': 983, 'loss/train': 4.258530139923096} -09/20/2021 17:53:44 - INFO - __main__ - Step 15739: {'lr': 0.00019998895511680407, 'samples': 503648, 'steps': 983, 'loss/train': 3.6767680644989014} -09/20/2021 17:53:45 - INFO - __main__ - Step 15740: {'lr': 0.00019998895511680407, 'samples': 503680, 'steps': 983, 'loss/train': 4.120012283325195} -09/20/2021 17:53:46 - INFO - __main__ - Step 15741: {'lr': 0.00019998895511680407, 'samples': 503712, 'steps': 983, 'loss/train': 4.7123613357543945} -09/20/2021 17:53:47 - INFO - __main__ - Step 15742: {'lr': 0.00019998895511680407, 'samples': 503744, 'steps': 983, 'loss/train': 4.37725305557251} -09/20/2021 17:53:47 - INFO - __main__ - Step 15743: {'lr': 0.00019998895511680407, 'samples': 503776, 'steps': 983, 'loss/train': 3.7843360900878906} -09/20/2021 17:53:48 - INFO - __main__ - Step 15744: {'lr': 0.00019998895511680407, 'samples': 503808, 'steps': 983, 'loss/train': 3.4609384536743164} -09/20/2021 17:53:49 - INFO - __main__ - Step 15745: {'lr': 0.00019998886010925767, 'samples': 503840, 'steps': 984, 'loss/train': 4.073824405670166} -09/20/2021 17:53:50 - INFO - __main__ - Step 15746: {'lr': 0.00019998886010925767, 'samples': 503872, 'steps': 984, 'loss/train': 4.070682048797607} -09/20/2021 17:53:51 - INFO - __main__ - Step 15747: {'lr': 0.00019998886010925767, 'samples': 503904, 'steps': 984, 'loss/train': 3.6423425674438477} -09/20/2021 17:53:51 - INFO - __main__ - Step 15748: {'lr': 0.00019998886010925767, 'samples': 503936, 'steps': 984, 'loss/train': 3.8760087490081787} -09/20/2021 17:53:52 - INFO - __main__ - Step 15749: {'lr': 0.00019998886010925767, 'samples': 503968, 'steps': 984, 'loss/train': 3.6478896141052246} -09/20/2021 17:53:53 - INFO - __main__ - Step 15750: {'lr': 0.00019998886010925767, 'samples': 504000, 'steps': 984, 'loss/train': 2.9186549186706543} -09/20/2021 17:53:54 - INFO - __main__ - Step 15751: {'lr': 0.00019998886010925767, 'samples': 504032, 'steps': 984, 'loss/train': 3.7928640842437744} -09/20/2021 17:53:55 - INFO - __main__ - Step 15752: {'lr': 0.00019998886010925767, 'samples': 504064, 'steps': 984, 'loss/train': 4.082446575164795} -09/20/2021 17:53:56 - INFO - __main__ - Step 15753: {'lr': 0.00019998886010925767, 'samples': 504096, 'steps': 984, 'loss/train': 3.6985995769500732} -09/20/2021 17:53:56 - INFO - __main__ - Step 15754: {'lr': 0.00019998886010925767, 'samples': 504128, 'steps': 984, 'loss/train': 3.7316765785217285} -09/20/2021 17:53:57 - INFO - __main__ - Step 15755: {'lr': 0.00019998886010925767, 'samples': 504160, 'steps': 984, 'loss/train': 4.612216472625732} -09/20/2021 17:53:58 - INFO - __main__ - Step 15756: {'lr': 0.00019998886010925767, 'samples': 504192, 'steps': 984, 'loss/train': 2.6236488819122314} -09/20/2021 17:53:59 - INFO - __main__ - Step 15757: {'lr': 0.00019998886010925767, 'samples': 504224, 'steps': 984, 'loss/train': 2.561459541320801} -09/20/2021 17:53:59 - INFO - __main__ - Step 15758: {'lr': 0.00019998886010925767, 'samples': 504256, 'steps': 984, 'loss/train': 3.3263211250305176} -09/20/2021 17:54:00 - INFO - __main__ - Step 15759: {'lr': 0.00019998886010925767, 'samples': 504288, 'steps': 984, 'loss/train': 4.646740436553955} -09/20/2021 17:54:01 - INFO - __main__ - Step 15760: {'lr': 0.00019998886010925767, 'samples': 504320, 'steps': 984, 'loss/train': 3.9170315265655518} -09/20/2021 17:54:02 - INFO - __main__ - Step 15761: {'lr': 0.000199988764694857, 'samples': 504352, 'steps': 985, 'loss/train': 3.42199969291687} -09/20/2021 17:54:02 - INFO - __main__ - Step 15762: {'lr': 0.000199988764694857, 'samples': 504384, 'steps': 985, 'loss/train': 3.7465124130249023} -09/20/2021 17:54:03 - INFO - __main__ - Step 15763: {'lr': 0.000199988764694857, 'samples': 504416, 'steps': 985, 'loss/train': 3.6238341331481934} -09/20/2021 17:54:04 - INFO - __main__ - Step 15764: {'lr': 0.000199988764694857, 'samples': 504448, 'steps': 985, 'loss/train': 3.3449296951293945} -09/20/2021 17:54:05 - INFO - __main__ - Step 15765: {'lr': 0.000199988764694857, 'samples': 504480, 'steps': 985, 'loss/train': 3.0846354961395264} -09/20/2021 17:54:05 - INFO - __main__ - Step 15766: {'lr': 0.000199988764694857, 'samples': 504512, 'steps': 985, 'loss/train': 4.318047523498535} -09/20/2021 17:54:06 - INFO - __main__ - Step 15767: {'lr': 0.000199988764694857, 'samples': 504544, 'steps': 985, 'loss/train': 4.0249762535095215} -09/20/2021 17:54:07 - INFO - __main__ - Step 15768: {'lr': 0.000199988764694857, 'samples': 504576, 'steps': 985, 'loss/train': 2.672302722930908} -09/20/2021 17:54:08 - INFO - __main__ - Step 15769: {'lr': 0.000199988764694857, 'samples': 504608, 'steps': 985, 'loss/train': 3.1712911128997803} -09/20/2021 17:54:08 - INFO - __main__ - Step 15770: {'lr': 0.000199988764694857, 'samples': 504640, 'steps': 985, 'loss/train': 3.421593427658081} -09/20/2021 17:54:09 - INFO - __main__ - Step 15771: {'lr': 0.000199988764694857, 'samples': 504672, 'steps': 985, 'loss/train': 3.5375239849090576} -09/20/2021 17:54:10 - INFO - __main__ - Step 15772: {'lr': 0.000199988764694857, 'samples': 504704, 'steps': 985, 'loss/train': 3.3306472301483154} -09/20/2021 17:54:11 - INFO - __main__ - Step 15773: {'lr': 0.000199988764694857, 'samples': 504736, 'steps': 985, 'loss/train': 4.60683536529541} -09/20/2021 17:54:11 - INFO - __main__ - Step 15774: {'lr': 0.000199988764694857, 'samples': 504768, 'steps': 985, 'loss/train': 5.125966548919678} -09/20/2021 17:54:12 - INFO - __main__ - Step 15775: {'lr': 0.000199988764694857, 'samples': 504800, 'steps': 985, 'loss/train': 3.2316396236419678} -09/20/2021 17:54:13 - INFO - __main__ - Step 15776: {'lr': 0.000199988764694857, 'samples': 504832, 'steps': 985, 'loss/train': 3.695277690887451} -09/20/2021 17:54:14 - INFO - __main__ - Step 15777: {'lr': 0.00019998866887360248, 'samples': 504864, 'steps': 986, 'loss/train': 2.1260738372802734} -09/20/2021 17:54:15 - INFO - __main__ - Step 15778: {'lr': 0.00019998866887360248, 'samples': 504896, 'steps': 986, 'loss/train': 3.5090298652648926} -09/20/2021 17:54:15 - INFO - __main__ - Step 15779: {'lr': 0.00019998866887360248, 'samples': 504928, 'steps': 986, 'loss/train': 2.506908893585205} -09/20/2021 17:54:16 - INFO - __main__ - Step 15780: {'lr': 0.00019998866887360248, 'samples': 504960, 'steps': 986, 'loss/train': 3.5584466457366943} -09/20/2021 17:54:17 - INFO - __main__ - Step 15781: {'lr': 0.00019998866887360248, 'samples': 504992, 'steps': 986, 'loss/train': 3.534876823425293} -09/20/2021 17:54:18 - INFO - __main__ - Step 15782: {'lr': 0.00019998866887360248, 'samples': 505024, 'steps': 986, 'loss/train': 2.6416971683502197} -09/20/2021 17:54:19 - INFO - __main__ - Step 15783: {'lr': 0.00019998866887360248, 'samples': 505056, 'steps': 986, 'loss/train': 3.1517536640167236} -09/20/2021 17:54:20 - INFO - __main__ - Step 15784: {'lr': 0.00019998866887360248, 'samples': 505088, 'steps': 986, 'loss/train': 3.1156086921691895} -09/20/2021 17:54:20 - INFO - __main__ - Step 15785: {'lr': 0.00019998866887360248, 'samples': 505120, 'steps': 986, 'loss/train': 2.9740710258483887} -09/20/2021 17:54:21 - INFO - __main__ - Step 15786: {'lr': 0.00019998866887360248, 'samples': 505152, 'steps': 986, 'loss/train': 3.5666732788085938} -09/20/2021 17:54:22 - INFO - __main__ - Step 15787: {'lr': 0.00019998866887360248, 'samples': 505184, 'steps': 986, 'loss/train': 3.710219383239746} -09/20/2021 17:54:23 - INFO - __main__ - Step 15788: {'lr': 0.00019998866887360248, 'samples': 505216, 'steps': 986, 'loss/train': 4.723977088928223} -09/20/2021 17:54:23 - INFO - __main__ - Step 15789: {'lr': 0.00019998866887360248, 'samples': 505248, 'steps': 986, 'loss/train': 3.8268682956695557} -09/20/2021 17:54:24 - INFO - __main__ - Step 15790: {'lr': 0.00019998866887360248, 'samples': 505280, 'steps': 986, 'loss/train': 4.058739185333252} -09/20/2021 17:54:25 - INFO - __main__ - Step 15791: {'lr': 0.00019998866887360248, 'samples': 505312, 'steps': 986, 'loss/train': 3.0393524169921875} -09/20/2021 17:54:26 - INFO - __main__ - Step 15792: {'lr': 0.00019998866887360248, 'samples': 505344, 'steps': 986, 'loss/train': 3.4837262630462646} -09/20/2021 17:54:27 - INFO - __main__ - Step 15793: {'lr': 0.00019998857264549443, 'samples': 505376, 'steps': 987, 'loss/train': 3.427565813064575} -09/20/2021 17:54:27 - INFO - __main__ - Step 15794: {'lr': 0.00019998857264549443, 'samples': 505408, 'steps': 987, 'loss/train': 3.4298512935638428} -09/20/2021 17:54:28 - INFO - __main__ - Step 15795: {'lr': 0.00019998857264549443, 'samples': 505440, 'steps': 987, 'loss/train': 4.1193766593933105} -09/20/2021 17:54:29 - INFO - __main__ - Step 15796: {'lr': 0.00019998857264549443, 'samples': 505472, 'steps': 987, 'loss/train': 3.939636468887329} -09/20/2021 17:54:30 - INFO - __main__ - Step 15797: {'lr': 0.00019998857264549443, 'samples': 505504, 'steps': 987, 'loss/train': 4.967914581298828} -09/20/2021 17:54:30 - INFO - __main__ - Step 15798: {'lr': 0.00019998857264549443, 'samples': 505536, 'steps': 987, 'loss/train': 4.949335098266602} -09/20/2021 17:54:31 - INFO - __main__ - Step 15799: {'lr': 0.00019998857264549443, 'samples': 505568, 'steps': 987, 'loss/train': 0.7096419930458069} -09/20/2021 17:54:32 - INFO - __main__ - Step 15800: {'lr': 0.00019998857264549443, 'samples': 505600, 'steps': 987, 'loss/train': 0.9553905129432678} -09/20/2021 17:54:33 - INFO - __main__ - Step 15801: {'lr': 0.00019998857264549443, 'samples': 505632, 'steps': 987, 'loss/train': 2.602663993835449} -09/20/2021 17:54:33 - INFO - __main__ - Step 15802: {'lr': 0.00019998857264549443, 'samples': 505664, 'steps': 987, 'loss/train': 3.4622061252593994} -09/20/2021 17:54:34 - INFO - __main__ - Step 15803: {'lr': 0.00019998857264549443, 'samples': 505696, 'steps': 987, 'loss/train': 3.0206854343414307} -09/20/2021 17:54:35 - INFO - __main__ - Step 15804: {'lr': 0.00019998857264549443, 'samples': 505728, 'steps': 987, 'loss/train': 2.8686411380767822} -09/20/2021 17:54:36 - INFO - __main__ - Step 15805: {'lr': 0.00019998857264549443, 'samples': 505760, 'steps': 987, 'loss/train': 3.9081268310546875} -09/20/2021 17:54:36 - INFO - __main__ - Step 15806: {'lr': 0.00019998857264549443, 'samples': 505792, 'steps': 987, 'loss/train': 3.458800792694092} -09/20/2021 17:54:37 - INFO - __main__ - Step 15807: {'lr': 0.00019998857264549443, 'samples': 505824, 'steps': 987, 'loss/train': 6.208954334259033} -09/20/2021 17:54:38 - INFO - __main__ - Step 15808: {'lr': 0.00019998857264549443, 'samples': 505856, 'steps': 987, 'loss/train': 3.4337551593780518} -09/20/2021 17:54:39 - INFO - __main__ - Step 15809: {'lr': 0.00019998847601053322, 'samples': 505888, 'steps': 988, 'loss/train': 3.010859727859497} -09/20/2021 17:54:40 - INFO - __main__ - Step 15810: {'lr': 0.00019998847601053322, 'samples': 505920, 'steps': 988, 'loss/train': 3.2033817768096924} -09/20/2021 17:54:40 - INFO - __main__ - Step 15811: {'lr': 0.00019998847601053322, 'samples': 505952, 'steps': 988, 'loss/train': 3.7468101978302} -09/20/2021 17:54:41 - INFO - __main__ - Step 15812: {'lr': 0.00019998847601053322, 'samples': 505984, 'steps': 988, 'loss/train': 3.2692065238952637} -09/20/2021 17:54:42 - INFO - __main__ - Step 15813: {'lr': 0.00019998847601053322, 'samples': 506016, 'steps': 988, 'loss/train': 2.763157606124878} -09/20/2021 17:54:43 - INFO - __main__ - Step 15814: {'lr': 0.00019998847601053322, 'samples': 506048, 'steps': 988, 'loss/train': 3.598121166229248} -09/20/2021 17:54:44 - INFO - __main__ - Step 15815: {'lr': 0.00019998847601053322, 'samples': 506080, 'steps': 988, 'loss/train': 3.29661226272583} -09/20/2021 17:54:45 - INFO - __main__ - Step 15816: {'lr': 0.00019998847601053322, 'samples': 506112, 'steps': 988, 'loss/train': 3.2501251697540283} -09/20/2021 17:54:45 - INFO - __main__ - Step 15817: {'lr': 0.00019998847601053322, 'samples': 506144, 'steps': 988, 'loss/train': 3.7564144134521484} -09/20/2021 17:54:46 - INFO - __main__ - Step 15818: {'lr': 0.00019998847601053322, 'samples': 506176, 'steps': 988, 'loss/train': 5.150450229644775} -09/20/2021 17:54:47 - INFO - __main__ - Step 15819: {'lr': 0.00019998847601053322, 'samples': 506208, 'steps': 988, 'loss/train': 3.3039848804473877} -09/20/2021 17:54:48 - INFO - __main__ - Step 15820: {'lr': 0.00019998847601053322, 'samples': 506240, 'steps': 988, 'loss/train': 3.326143503189087} -09/20/2021 17:54:48 - INFO - __main__ - Step 15821: {'lr': 0.00019998847601053322, 'samples': 506272, 'steps': 988, 'loss/train': 3.928778648376465} -09/20/2021 17:54:49 - INFO - __main__ - Step 15822: {'lr': 0.00019998847601053322, 'samples': 506304, 'steps': 988, 'loss/train': 3.796295642852783} -09/20/2021 17:54:50 - INFO - __main__ - Step 15823: {'lr': 0.00019998847601053322, 'samples': 506336, 'steps': 988, 'loss/train': 3.6045162677764893} -09/20/2021 17:54:51 - INFO - __main__ - Step 15824: {'lr': 0.00019998847601053322, 'samples': 506368, 'steps': 988, 'loss/train': 4.095033645629883} -09/20/2021 17:54:51 - INFO - __main__ - Step 15825: {'lr': 0.00019998837896871934, 'samples': 506400, 'steps': 989, 'loss/train': 3.760841131210327} -09/20/2021 17:54:52 - INFO - __main__ - Step 15826: {'lr': 0.00019998837896871934, 'samples': 506432, 'steps': 989, 'loss/train': 3.876896858215332} -09/20/2021 17:54:53 - INFO - __main__ - Step 15827: {'lr': 0.00019998837896871934, 'samples': 506464, 'steps': 989, 'loss/train': 4.587381362915039} -09/20/2021 17:54:54 - INFO - __main__ - Step 15828: {'lr': 0.00019998837896871934, 'samples': 506496, 'steps': 989, 'loss/train': 3.9840080738067627} -09/20/2021 17:54:54 - INFO - __main__ - Step 15829: {'lr': 0.00019998837896871934, 'samples': 506528, 'steps': 989, 'loss/train': 3.8803653717041016} -09/20/2021 17:54:55 - INFO - __main__ - Step 15830: {'lr': 0.00019998837896871934, 'samples': 506560, 'steps': 989, 'loss/train': 3.301253080368042} -09/20/2021 17:54:56 - INFO - __main__ - Step 15831: {'lr': 0.00019998837896871934, 'samples': 506592, 'steps': 989, 'loss/train': 3.638490915298462} -09/20/2021 17:54:57 - INFO - __main__ - Step 15832: {'lr': 0.00019998837896871934, 'samples': 506624, 'steps': 989, 'loss/train': 4.078593730926514} -09/20/2021 17:54:57 - INFO - __main__ - Step 15833: {'lr': 0.00019998837896871934, 'samples': 506656, 'steps': 989, 'loss/train': 2.807096004486084} -09/20/2021 17:54:58 - INFO - __main__ - Step 15834: {'lr': 0.00019998837896871934, 'samples': 506688, 'steps': 989, 'loss/train': 2.58888840675354} -09/20/2021 17:54:59 - INFO - __main__ - Step 15835: {'lr': 0.00019998837896871934, 'samples': 506720, 'steps': 989, 'loss/train': 0.8801530003547668} -09/20/2021 17:55:00 - INFO - __main__ - Step 15836: {'lr': 0.00019998837896871934, 'samples': 506752, 'steps': 989, 'loss/train': 4.020409107208252} -09/20/2021 17:55:00 - INFO - __main__ - Step 15837: {'lr': 0.00019998837896871934, 'samples': 506784, 'steps': 989, 'loss/train': 4.006494522094727} -09/20/2021 17:55:01 - INFO - __main__ - Step 15838: {'lr': 0.00019998837896871934, 'samples': 506816, 'steps': 989, 'loss/train': 3.4485013484954834} -09/20/2021 17:55:02 - INFO - __main__ - Step 15839: {'lr': 0.00019998837896871934, 'samples': 506848, 'steps': 989, 'loss/train': 3.3330373764038086} -09/20/2021 17:55:03 - INFO - __main__ - Step 15840: {'lr': 0.00019998837896871934, 'samples': 506880, 'steps': 989, 'loss/train': 4.929409980773926} -09/20/2021 17:55:04 - INFO - __main__ - Step 15841: {'lr': 0.0001999882815200531, 'samples': 506912, 'steps': 990, 'loss/train': 5.332210540771484} -09/20/2021 17:55:04 - INFO - __main__ - Step 15842: {'lr': 0.0001999882815200531, 'samples': 506944, 'steps': 990, 'loss/train': 3.463209390640259} -09/20/2021 17:55:05 - INFO - __main__ - Step 15843: {'lr': 0.0001999882815200531, 'samples': 506976, 'steps': 990, 'loss/train': 1.8434772491455078} -09/20/2021 17:55:06 - INFO - __main__ - Step 15844: {'lr': 0.0001999882815200531, 'samples': 507008, 'steps': 990, 'loss/train': 3.0817654132843018} -09/20/2021 17:55:08 - INFO - __main__ - Step 15845: {'lr': 0.0001999882815200531, 'samples': 507040, 'steps': 990, 'loss/train': 3.6217169761657715} -09/20/2021 17:55:08 - INFO - __main__ - Step 15846: {'lr': 0.0001999882815200531, 'samples': 507072, 'steps': 990, 'loss/train': 4.14897346496582} -09/20/2021 17:55:09 - INFO - __main__ - Step 15847: {'lr': 0.0001999882815200531, 'samples': 507104, 'steps': 990, 'loss/train': 3.9192023277282715} -09/20/2021 17:55:10 - INFO - __main__ - Step 15848: {'lr': 0.0001999882815200531, 'samples': 507136, 'steps': 990, 'loss/train': 3.369290351867676} -09/20/2021 17:55:11 - INFO - __main__ - Step 15849: {'lr': 0.0001999882815200531, 'samples': 507168, 'steps': 990, 'loss/train': 4.416330337524414} -09/20/2021 17:55:11 - INFO - __main__ - Step 15850: {'lr': 0.0001999882815200531, 'samples': 507200, 'steps': 990, 'loss/train': 3.4564712047576904} -09/20/2021 17:55:12 - INFO - __main__ - Step 15851: {'lr': 0.0001999882815200531, 'samples': 507232, 'steps': 990, 'loss/train': 2.8457658290863037} -09/20/2021 17:55:13 - INFO - __main__ - Step 15852: {'lr': 0.0001999882815200531, 'samples': 507264, 'steps': 990, 'loss/train': 3.656369686126709} -09/20/2021 17:55:14 - INFO - __main__ - Step 15853: {'lr': 0.0001999882815200531, 'samples': 507296, 'steps': 990, 'loss/train': 3.959324836730957} -09/20/2021 17:55:14 - INFO - __main__ - Step 15854: {'lr': 0.0001999882815200531, 'samples': 507328, 'steps': 990, 'loss/train': 3.2679741382598877} -09/20/2021 17:55:15 - INFO - __main__ - Step 15855: {'lr': 0.0001999882815200531, 'samples': 507360, 'steps': 990, 'loss/train': 3.0334482192993164} -09/20/2021 17:55:16 - INFO - __main__ - Step 15856: {'lr': 0.0001999882815200531, 'samples': 507392, 'steps': 990, 'loss/train': 1.3019797801971436} -09/20/2021 17:55:17 - INFO - __main__ - Step 15857: {'lr': 0.00019998818366453498, 'samples': 507424, 'steps': 991, 'loss/train': 1.370937466621399} -09/20/2021 17:55:18 - INFO - __main__ - Step 15858: {'lr': 0.00019998818366453498, 'samples': 507456, 'steps': 991, 'loss/train': 0.8150690197944641} -09/20/2021 17:55:18 - INFO - __main__ - Step 15859: {'lr': 0.00019998818366453498, 'samples': 507488, 'steps': 991, 'loss/train': 0.5938019752502441} -09/20/2021 17:55:19 - INFO - __main__ - Step 15860: {'lr': 0.00019998818366453498, 'samples': 507520, 'steps': 991, 'loss/train': 3.4728293418884277} -09/20/2021 17:55:20 - INFO - __main__ - Step 15861: {'lr': 0.00019998818366453498, 'samples': 507552, 'steps': 991, 'loss/train': 3.4313149452209473} -09/20/2021 17:55:21 - INFO - __main__ - Step 15862: {'lr': 0.00019998818366453498, 'samples': 507584, 'steps': 991, 'loss/train': 3.9473776817321777} -09/20/2021 17:55:21 - INFO - __main__ - Step 15863: {'lr': 0.00019998818366453498, 'samples': 507616, 'steps': 991, 'loss/train': 3.608335256576538} -09/20/2021 17:55:22 - INFO - __main__ - Step 15864: {'lr': 0.00019998818366453498, 'samples': 507648, 'steps': 991, 'loss/train': 3.241823434829712} -09/20/2021 17:55:23 - INFO - __main__ - Step 15865: {'lr': 0.00019998818366453498, 'samples': 507680, 'steps': 991, 'loss/train': 0.6642243266105652} -09/20/2021 17:55:24 - INFO - __main__ - Step 15866: {'lr': 0.00019998818366453498, 'samples': 507712, 'steps': 991, 'loss/train': 3.7225284576416016} -09/20/2021 17:55:24 - INFO - __main__ - Step 15867: {'lr': 0.00019998818366453498, 'samples': 507744, 'steps': 991, 'loss/train': 4.7160491943359375} -09/20/2021 17:55:25 - INFO - __main__ - Step 15868: {'lr': 0.00019998818366453498, 'samples': 507776, 'steps': 991, 'loss/train': 4.721347332000732} -09/20/2021 17:55:26 - INFO - __main__ - Step 15869: {'lr': 0.00019998818366453498, 'samples': 507808, 'steps': 991, 'loss/train': 3.508544921875} -09/20/2021 17:55:27 - INFO - __main__ - Step 15870: {'lr': 0.00019998818366453498, 'samples': 507840, 'steps': 991, 'loss/train': 3.4258835315704346} -09/20/2021 17:55:27 - INFO - __main__ - Step 15871: {'lr': 0.00019998818366453498, 'samples': 507872, 'steps': 991, 'loss/train': 4.518589973449707} -09/20/2021 17:55:28 - INFO - __main__ - Step 15872: {'lr': 0.00019998818366453498, 'samples': 507904, 'steps': 991, 'loss/train': 3.712761402130127} -09/20/2021 17:55:29 - INFO - __main__ - Step 15873: {'lr': 0.0001999880854021653, 'samples': 507936, 'steps': 992, 'loss/train': 3.778977870941162} -09/20/2021 17:55:30 - INFO - __main__ - Step 15874: {'lr': 0.0001999880854021653, 'samples': 507968, 'steps': 992, 'loss/train': 1.820471167564392} -09/20/2021 17:55:31 - INFO - __main__ - Step 15875: {'lr': 0.0001999880854021653, 'samples': 508000, 'steps': 992, 'loss/train': 4.1739349365234375} -09/20/2021 17:55:32 - INFO - __main__ - Step 15876: {'lr': 0.0001999880854021653, 'samples': 508032, 'steps': 992, 'loss/train': 3.7391698360443115} -09/20/2021 17:55:33 - INFO - __main__ - Step 15877: {'lr': 0.0001999880854021653, 'samples': 508064, 'steps': 992, 'loss/train': 3.0802338123321533} -09/20/2021 17:55:33 - INFO - __main__ - Step 15878: {'lr': 0.0001999880854021653, 'samples': 508096, 'steps': 992, 'loss/train': 3.6124556064605713} -09/20/2021 17:55:34 - INFO - __main__ - Step 15879: {'lr': 0.0001999880854021653, 'samples': 508128, 'steps': 992, 'loss/train': 3.9067647457122803} -09/20/2021 17:55:35 - INFO - __main__ - Step 15880: {'lr': 0.0001999880854021653, 'samples': 508160, 'steps': 992, 'loss/train': 3.65932559967041} -09/20/2021 17:55:36 - INFO - __main__ - Step 15881: {'lr': 0.0001999880854021653, 'samples': 508192, 'steps': 992, 'loss/train': 3.288418769836426} -09/20/2021 17:55:36 - INFO - __main__ - Step 15882: {'lr': 0.0001999880854021653, 'samples': 508224, 'steps': 992, 'loss/train': 3.1588590145111084} -09/20/2021 17:55:37 - INFO - __main__ - Step 15883: {'lr': 0.0001999880854021653, 'samples': 508256, 'steps': 992, 'loss/train': 3.3695545196533203} -09/20/2021 17:55:38 - INFO - __main__ - Step 15884: {'lr': 0.0001999880854021653, 'samples': 508288, 'steps': 992, 'loss/train': 3.204225778579712} -09/20/2021 17:55:39 - INFO - __main__ - Step 15885: {'lr': 0.0001999880854021653, 'samples': 508320, 'steps': 992, 'loss/train': 4.3637542724609375} -09/20/2021 17:55:39 - INFO - __main__ - Step 15886: {'lr': 0.0001999880854021653, 'samples': 508352, 'steps': 992, 'loss/train': 4.953799247741699} -09/20/2021 17:55:40 - INFO - __main__ - Step 15887: {'lr': 0.0001999880854021653, 'samples': 508384, 'steps': 992, 'loss/train': 5.4251813888549805} -09/20/2021 17:55:41 - INFO - __main__ - Step 15888: {'lr': 0.0001999880854021653, 'samples': 508416, 'steps': 992, 'loss/train': 3.1516311168670654} -09/20/2021 17:55:42 - INFO - __main__ - Step 15889: {'lr': 0.00019998798673294448, 'samples': 508448, 'steps': 993, 'loss/train': 4.1034955978393555} -09/20/2021 17:55:42 - INFO - __main__ - Step 15890: {'lr': 0.00019998798673294448, 'samples': 508480, 'steps': 993, 'loss/train': 3.6606616973876953} -09/20/2021 17:55:43 - INFO - __main__ - Step 15891: {'lr': 0.00019998798673294448, 'samples': 508512, 'steps': 993, 'loss/train': 3.0563836097717285} -09/20/2021 17:55:44 - INFO - __main__ - Step 15892: {'lr': 0.00019998798673294448, 'samples': 508544, 'steps': 993, 'loss/train': 3.4956679344177246} -09/20/2021 17:55:45 - INFO - __main__ - Step 15893: {'lr': 0.00019998798673294448, 'samples': 508576, 'steps': 993, 'loss/train': 4.310747146606445} -09/20/2021 17:55:45 - INFO - __main__ - Step 15894: {'lr': 0.00019998798673294448, 'samples': 508608, 'steps': 993, 'loss/train': 3.6150612831115723} -09/20/2021 17:55:46 - INFO - __main__ - Step 15895: {'lr': 0.00019998798673294448, 'samples': 508640, 'steps': 993, 'loss/train': 4.783689975738525} -09/20/2021 17:55:47 - INFO - __main__ - Step 15896: {'lr': 0.00019998798673294448, 'samples': 508672, 'steps': 993, 'loss/train': 3.903834342956543} -09/20/2021 17:55:48 - INFO - __main__ - Step 15897: {'lr': 0.00019998798673294448, 'samples': 508704, 'steps': 993, 'loss/train': 3.284327268600464} -09/20/2021 17:55:48 - INFO - __main__ - Step 15898: {'lr': 0.00019998798673294448, 'samples': 508736, 'steps': 993, 'loss/train': 4.112295150756836} -09/20/2021 17:55:49 - INFO - __main__ - Step 15899: {'lr': 0.00019998798673294448, 'samples': 508768, 'steps': 993, 'loss/train': 3.291200637817383} -09/20/2021 17:55:50 - INFO - __main__ - Step 15900: {'lr': 0.00019998798673294448, 'samples': 508800, 'steps': 993, 'loss/train': 3.427443027496338} -09/20/2021 17:55:51 - INFO - __main__ - Step 15901: {'lr': 0.00019998798673294448, 'samples': 508832, 'steps': 993, 'loss/train': 3.4598917961120605} -09/20/2021 17:55:51 - INFO - __main__ - Step 15902: {'lr': 0.00019998798673294448, 'samples': 508864, 'steps': 993, 'loss/train': 4.226787090301514} -09/20/2021 17:55:52 - INFO - __main__ - Step 15903: {'lr': 0.00019998798673294448, 'samples': 508896, 'steps': 993, 'loss/train': 3.0156795978546143} -09/20/2021 17:55:53 - INFO - __main__ - Step 15904: {'lr': 0.00019998798673294448, 'samples': 508928, 'steps': 993, 'loss/train': 4.574108600616455} -09/20/2021 17:55:54 - INFO - __main__ - Step 15905: {'lr': 0.00019998788765687294, 'samples': 508960, 'steps': 994, 'loss/train': 2.916872501373291} -09/20/2021 17:55:55 - INFO - __main__ - Step 15906: {'lr': 0.00019998788765687294, 'samples': 508992, 'steps': 994, 'loss/train': 4.24338960647583} -09/20/2021 17:55:56 - INFO - __main__ - Step 15907: {'lr': 0.00019998788765687294, 'samples': 509024, 'steps': 994, 'loss/train': 3.5770764350891113} -09/20/2021 17:55:57 - INFO - __main__ - Step 15908: {'lr': 0.00019998788765687294, 'samples': 509056, 'steps': 994, 'loss/train': 3.471336603164673} -09/20/2021 17:55:57 - INFO - __main__ - Step 15909: {'lr': 0.00019998788765687294, 'samples': 509088, 'steps': 994, 'loss/train': 4.01750373840332} -09/20/2021 17:55:58 - INFO - __main__ - Step 15910: {'lr': 0.00019998788765687294, 'samples': 509120, 'steps': 994, 'loss/train': 1.3558377027511597} -09/20/2021 17:55:59 - INFO - __main__ - Step 15911: {'lr': 0.00019998788765687294, 'samples': 509152, 'steps': 994, 'loss/train': 4.336276054382324} -09/20/2021 17:56:00 - INFO - __main__ - Step 15912: {'lr': 0.00019998788765687294, 'samples': 509184, 'steps': 994, 'loss/train': 3.857409954071045} -09/20/2021 17:56:00 - INFO - __main__ - Step 15913: {'lr': 0.00019998788765687294, 'samples': 509216, 'steps': 994, 'loss/train': 3.4272263050079346} -09/20/2021 17:56:01 - INFO - __main__ - Step 15914: {'lr': 0.00019998788765687294, 'samples': 509248, 'steps': 994, 'loss/train': 4.195802688598633} -09/20/2021 17:56:02 - INFO - __main__ - Step 15915: {'lr': 0.00019998788765687294, 'samples': 509280, 'steps': 994, 'loss/train': 4.213019847869873} -09/20/2021 17:56:03 - INFO - __main__ - Step 15916: {'lr': 0.00019998788765687294, 'samples': 509312, 'steps': 994, 'loss/train': 4.863793849945068} -09/20/2021 17:56:03 - INFO - __main__ - Step 15917: {'lr': 0.00019998788765687294, 'samples': 509344, 'steps': 994, 'loss/train': 4.954282760620117} -09/20/2021 17:56:04 - INFO - __main__ - Step 15918: {'lr': 0.00019998788765687294, 'samples': 509376, 'steps': 994, 'loss/train': 4.591910362243652} -09/20/2021 17:56:05 - INFO - __main__ - Step 15919: {'lr': 0.00019998788765687294, 'samples': 509408, 'steps': 994, 'loss/train': 3.154350757598877} -09/20/2021 17:56:06 - INFO - __main__ - Step 15920: {'lr': 0.00019998788765687294, 'samples': 509440, 'steps': 994, 'loss/train': 3.836885690689087} -09/20/2021 17:56:07 - INFO - __main__ - Step 15921: {'lr': 0.00019998778817395104, 'samples': 509472, 'steps': 995, 'loss/train': 3.590794324874878} -09/20/2021 17:56:07 - INFO - __main__ - Step 15922: {'lr': 0.00019998778817395104, 'samples': 509504, 'steps': 995, 'loss/train': 4.060523986816406} -09/20/2021 17:56:08 - INFO - __main__ - Step 15923: {'lr': 0.00019998778817395104, 'samples': 509536, 'steps': 995, 'loss/train': 3.5149295330047607} -09/20/2021 17:56:09 - INFO - __main__ - Step 15924: {'lr': 0.00019998778817395104, 'samples': 509568, 'steps': 995, 'loss/train': 3.7733681201934814} -09/20/2021 17:56:10 - INFO - __main__ - Step 15925: {'lr': 0.00019998778817395104, 'samples': 509600, 'steps': 995, 'loss/train': 3.2622385025024414} -09/20/2021 17:56:10 - INFO - __main__ - Step 15926: {'lr': 0.00019998778817395104, 'samples': 509632, 'steps': 995, 'loss/train': 3.7827484607696533} -09/20/2021 17:56:11 - INFO - __main__ - Step 15927: {'lr': 0.00019998778817395104, 'samples': 509664, 'steps': 995, 'loss/train': 3.5026962757110596} -09/20/2021 17:56:12 - INFO - __main__ - Step 15928: {'lr': 0.00019998778817395104, 'samples': 509696, 'steps': 995, 'loss/train': 3.098813056945801} -09/20/2021 17:56:13 - INFO - __main__ - Step 15929: {'lr': 0.00019998778817395104, 'samples': 509728, 'steps': 995, 'loss/train': 4.2027201652526855} -09/20/2021 17:56:13 - INFO - __main__ - Step 15930: {'lr': 0.00019998778817395104, 'samples': 509760, 'steps': 995, 'loss/train': 4.129007816314697} -09/20/2021 17:56:14 - INFO - __main__ - Step 15931: {'lr': 0.00019998778817395104, 'samples': 509792, 'steps': 995, 'loss/train': 4.283318996429443} -09/20/2021 17:56:15 - INFO - __main__ - Step 15932: {'lr': 0.00019998778817395104, 'samples': 509824, 'steps': 995, 'loss/train': 3.899501085281372} -09/20/2021 17:56:16 - INFO - __main__ - Step 15933: {'lr': 0.00019998778817395104, 'samples': 509856, 'steps': 995, 'loss/train': 3.609429359436035} -09/20/2021 17:56:16 - INFO - __main__ - Step 15934: {'lr': 0.00019998778817395104, 'samples': 509888, 'steps': 995, 'loss/train': 3.436026096343994} -09/20/2021 17:56:17 - INFO - __main__ - Step 15935: {'lr': 0.00019998778817395104, 'samples': 509920, 'steps': 995, 'loss/train': 3.7281577587127686} -09/20/2021 17:56:18 - INFO - __main__ - Step 15936: {'lr': 0.00019998778817395104, 'samples': 509952, 'steps': 995, 'loss/train': 4.283090114593506} -09/20/2021 17:56:19 - INFO - __main__ - Step 15937: {'lr': 0.00019998768828417927, 'samples': 509984, 'steps': 996, 'loss/train': 3.7275285720825195} -09/20/2021 17:56:20 - INFO - __main__ - Step 15938: {'lr': 0.00019998768828417927, 'samples': 510016, 'steps': 996, 'loss/train': 3.841311454772949} -09/20/2021 17:56:21 - INFO - __main__ - Step 15939: {'lr': 0.00019998768828417927, 'samples': 510048, 'steps': 996, 'loss/train': 3.949129819869995} -09/20/2021 17:56:22 - INFO - __main__ - Step 15940: {'lr': 0.00019998768828417927, 'samples': 510080, 'steps': 996, 'loss/train': 4.167607307434082} -09/20/2021 17:56:22 - INFO - __main__ - Step 15941: {'lr': 0.00019998768828417927, 'samples': 510112, 'steps': 996, 'loss/train': 3.765897750854492} -09/20/2021 17:56:23 - INFO - __main__ - Step 15942: {'lr': 0.00019998768828417927, 'samples': 510144, 'steps': 996, 'loss/train': 2.869473457336426} -09/20/2021 17:56:24 - INFO - __main__ - Step 15943: {'lr': 0.00019998768828417927, 'samples': 510176, 'steps': 996, 'loss/train': 3.7261550426483154} -09/20/2021 17:56:25 - INFO - __main__ - Step 15944: {'lr': 0.00019998768828417927, 'samples': 510208, 'steps': 996, 'loss/train': 3.1183652877807617} -09/20/2021 17:56:25 - INFO - __main__ - Step 15945: {'lr': 0.00019998768828417927, 'samples': 510240, 'steps': 996, 'loss/train': 4.125201225280762} -09/20/2021 17:56:26 - INFO - __main__ - Step 15946: {'lr': 0.00019998768828417927, 'samples': 510272, 'steps': 996, 'loss/train': 3.636979103088379} -09/20/2021 17:56:27 - INFO - __main__ - Step 15947: {'lr': 0.00019998768828417927, 'samples': 510304, 'steps': 996, 'loss/train': 4.270755767822266} -09/20/2021 17:56:28 - INFO - __main__ - Step 15948: {'lr': 0.00019998768828417927, 'samples': 510336, 'steps': 996, 'loss/train': 4.24249267578125} -09/20/2021 17:56:28 - INFO - __main__ - Step 15949: {'lr': 0.00019998768828417927, 'samples': 510368, 'steps': 996, 'loss/train': 3.8593926429748535} -09/20/2021 17:56:29 - INFO - __main__ - Step 15950: {'lr': 0.00019998768828417927, 'samples': 510400, 'steps': 996, 'loss/train': 2.8321197032928467} -09/20/2021 17:56:30 - INFO - __main__ - Step 15951: {'lr': 0.00019998768828417927, 'samples': 510432, 'steps': 996, 'loss/train': 0.89643394947052} -09/20/2021 17:56:31 - INFO - __main__ - Step 15952: {'lr': 0.00019998768828417927, 'samples': 510464, 'steps': 996, 'loss/train': 3.9051733016967773} -09/20/2021 17:56:31 - INFO - __main__ - Step 15953: {'lr': 0.00019998758798755797, 'samples': 510496, 'steps': 997, 'loss/train': 3.450491428375244} -09/20/2021 17:56:32 - INFO - __main__ - Step 15954: {'lr': 0.00019998758798755797, 'samples': 510528, 'steps': 997, 'loss/train': 3.9038801193237305} -09/20/2021 17:56:33 - INFO - __main__ - Step 15955: {'lr': 0.00019998758798755797, 'samples': 510560, 'steps': 997, 'loss/train': 3.2207207679748535} -09/20/2021 17:56:34 - INFO - __main__ - Step 15956: {'lr': 0.00019998758798755797, 'samples': 510592, 'steps': 997, 'loss/train': 3.095268487930298} -09/20/2021 17:56:34 - INFO - __main__ - Step 15957: {'lr': 0.00019998758798755797, 'samples': 510624, 'steps': 997, 'loss/train': 3.617495536804199} -09/20/2021 17:56:35 - INFO - __main__ - Step 15958: {'lr': 0.00019998758798755797, 'samples': 510656, 'steps': 997, 'loss/train': 3.327066421508789} -09/20/2021 17:56:36 - INFO - __main__ - Step 15959: {'lr': 0.00019998758798755797, 'samples': 510688, 'steps': 997, 'loss/train': 3.6858041286468506} -09/20/2021 17:56:37 - INFO - __main__ - Step 15960: {'lr': 0.00019998758798755797, 'samples': 510720, 'steps': 997, 'loss/train': 3.862600564956665} -09/20/2021 17:56:37 - INFO - __main__ - Step 15961: {'lr': 0.00019998758798755797, 'samples': 510752, 'steps': 997, 'loss/train': 4.44608736038208} -09/20/2021 17:56:38 - INFO - __main__ - Step 15962: {'lr': 0.00019998758798755797, 'samples': 510784, 'steps': 997, 'loss/train': 3.990675210952759} -09/20/2021 17:56:39 - INFO - __main__ - Step 15963: {'lr': 0.00019998758798755797, 'samples': 510816, 'steps': 997, 'loss/train': 3.821347713470459} -09/20/2021 17:56:40 - INFO - __main__ - Step 15964: {'lr': 0.00019998758798755797, 'samples': 510848, 'steps': 997, 'loss/train': 2.9744255542755127} -09/20/2021 17:56:40 - INFO - __main__ - Step 15965: {'lr': 0.00019998758798755797, 'samples': 510880, 'steps': 997, 'loss/train': 3.9907727241516113} -09/20/2021 17:56:41 - INFO - __main__ - Step 15966: {'lr': 0.00019998758798755797, 'samples': 510912, 'steps': 997, 'loss/train': 3.8450379371643066} -09/20/2021 17:56:42 - INFO - __main__ - Step 15967: {'lr': 0.00019998758798755797, 'samples': 510944, 'steps': 997, 'loss/train': 3.8558828830718994} -09/20/2021 17:56:43 - INFO - __main__ - Step 15968: {'lr': 0.00019998758798755797, 'samples': 510976, 'steps': 997, 'loss/train': 4.258852005004883} -09/20/2021 17:56:44 - INFO - __main__ - Step 15969: {'lr': 0.00019998748728408753, 'samples': 511008, 'steps': 998, 'loss/train': 3.7409865856170654} -09/20/2021 17:56:45 - INFO - __main__ - Step 15970: {'lr': 0.00019998748728408753, 'samples': 511040, 'steps': 998, 'loss/train': 3.570101499557495} -09/20/2021 17:56:46 - INFO - __main__ - Step 15971: {'lr': 0.00019998748728408753, 'samples': 511072, 'steps': 998, 'loss/train': 3.643702268600464} -09/20/2021 17:56:47 - INFO - __main__ - Step 15972: {'lr': 0.00019998748728408753, 'samples': 511104, 'steps': 998, 'loss/train': 2.4884071350097656} -09/20/2021 17:56:47 - INFO - __main__ - Step 15973: {'lr': 0.00019998748728408753, 'samples': 511136, 'steps': 998, 'loss/train': 3.3155083656311035} -09/20/2021 17:56:48 - INFO - __main__ - Step 15974: {'lr': 0.00019998748728408753, 'samples': 511168, 'steps': 998, 'loss/train': 1.4916459321975708} -09/20/2021 17:56:49 - INFO - __main__ - Step 15975: {'lr': 0.00019998748728408753, 'samples': 511200, 'steps': 998, 'loss/train': 4.410026550292969} -09/20/2021 17:56:50 - INFO - __main__ - Step 15976: {'lr': 0.00019998748728408753, 'samples': 511232, 'steps': 998, 'loss/train': 2.394763469696045} -09/20/2021 17:56:50 - INFO - __main__ - Step 15977: {'lr': 0.00019998748728408753, 'samples': 511264, 'steps': 998, 'loss/train': 3.169173240661621} -09/20/2021 17:56:51 - INFO - __main__ - Step 15978: {'lr': 0.00019998748728408753, 'samples': 511296, 'steps': 998, 'loss/train': 3.681849241256714} -09/20/2021 17:56:52 - INFO - __main__ - Step 15979: {'lr': 0.00019998748728408753, 'samples': 511328, 'steps': 998, 'loss/train': 3.4413552284240723} -09/20/2021 17:56:53 - INFO - __main__ - Step 15980: {'lr': 0.00019998748728408753, 'samples': 511360, 'steps': 998, 'loss/train': 3.414424419403076} -09/20/2021 17:56:53 - INFO - __main__ - Step 15981: {'lr': 0.00019998748728408753, 'samples': 511392, 'steps': 998, 'loss/train': 3.5984768867492676} -09/20/2021 17:56:54 - INFO - __main__ - Step 15982: {'lr': 0.00019998748728408753, 'samples': 511424, 'steps': 998, 'loss/train': 4.704044818878174} -09/20/2021 17:56:55 - INFO - __main__ - Step 15983: {'lr': 0.00019998748728408753, 'samples': 511456, 'steps': 998, 'loss/train': 3.395101308822632} -09/20/2021 17:56:56 - INFO - __main__ - Step 15984: {'lr': 0.00019998748728408753, 'samples': 511488, 'steps': 998, 'loss/train': 3.7598307132720947} -09/20/2021 17:56:56 - INFO - __main__ - Step 15985: {'lr': 0.00019998738617376844, 'samples': 511520, 'steps': 999, 'loss/train': 3.614213228225708} -09/20/2021 17:56:57 - INFO - __main__ - Step 15986: {'lr': 0.00019998738617376844, 'samples': 511552, 'steps': 999, 'loss/train': 3.372999668121338} -09/20/2021 17:56:58 - INFO - __main__ - Step 15987: {'lr': 0.00019998738617376844, 'samples': 511584, 'steps': 999, 'loss/train': 0.6250375509262085} -09/20/2021 17:56:59 - INFO - __main__ - Step 15988: {'lr': 0.00019998738617376844, 'samples': 511616, 'steps': 999, 'loss/train': 0.7566878795623779} -09/20/2021 17:56:59 - INFO - __main__ - Step 15989: {'lr': 0.00019998738617376844, 'samples': 511648, 'steps': 999, 'loss/train': 0.9840039610862732} -09/20/2021 17:57:00 - INFO - __main__ - Step 15990: {'lr': 0.00019998738617376844, 'samples': 511680, 'steps': 999, 'loss/train': 1.062923789024353} -09/20/2021 17:57:01 - INFO - __main__ - Step 15991: {'lr': 0.00019998738617376844, 'samples': 511712, 'steps': 999, 'loss/train': 3.4294121265411377} -09/20/2021 17:57:02 - INFO - __main__ - Step 15992: {'lr': 0.00019998738617376844, 'samples': 511744, 'steps': 999, 'loss/train': 3.9780004024505615} -09/20/2021 17:57:02 - INFO - __main__ - Step 15993: {'lr': 0.00019998738617376844, 'samples': 511776, 'steps': 999, 'loss/train': 3.254194498062134} -09/20/2021 17:57:03 - INFO - __main__ - Step 15994: {'lr': 0.00019998738617376844, 'samples': 511808, 'steps': 999, 'loss/train': 3.965348958969116} -09/20/2021 17:57:04 - INFO - __main__ - Step 15995: {'lr': 0.00019998738617376844, 'samples': 511840, 'steps': 999, 'loss/train': 4.57406759262085} -09/20/2021 17:57:05 - INFO - __main__ - Step 15996: {'lr': 0.00019998738617376844, 'samples': 511872, 'steps': 999, 'loss/train': 4.009472370147705} -09/20/2021 17:57:05 - INFO - __main__ - Step 15997: {'lr': 0.00019998738617376844, 'samples': 511904, 'steps': 999, 'loss/train': 3.450841188430786} -09/20/2021 17:57:06 - INFO - __main__ - Step 15998: {'lr': 0.00019998738617376844, 'samples': 511936, 'steps': 999, 'loss/train': 2.88623309135437} -09/20/2021 17:57:08 - INFO - __main__ - Step 15999: {'lr': 0.00019998738617376844, 'samples': 511968, 'steps': 999, 'loss/train': 3.6503114700317383} -09/20/2021 17:57:09 - INFO - __main__ - Step 16000: {'lr': 0.00019998738617376844, 'samples': 512000, 'steps': 999, 'loss/train': 4.239576816558838} -09/20/2021 17:57:09 - INFO - __main__ - Step 16001: {'lr': 0.00019998728465660105, 'samples': 512032, 'steps': 1000, 'loss/train': 3.6915314197540283} -09/20/2021 17:57:10 - INFO - __main__ - Step 16002: {'lr': 0.00019998728465660105, 'samples': 512064, 'steps': 1000, 'loss/train': 3.315316677093506} -09/20/2021 17:57:11 - INFO - __main__ - Step 16003: {'lr': 0.00019998728465660105, 'samples': 512096, 'steps': 1000, 'loss/train': 4.4364166259765625} -09/20/2021 17:57:12 - INFO - __main__ - Step 16004: {'lr': 0.00019998728465660105, 'samples': 512128, 'steps': 1000, 'loss/train': 3.436793804168701} -09/20/2021 17:57:12 - INFO - __main__ - Step 16005: {'lr': 0.00019998728465660105, 'samples': 512160, 'steps': 1000, 'loss/train': 3.002697467803955} -09/20/2021 17:57:13 - INFO - __main__ - Step 16006: {'lr': 0.00019998728465660105, 'samples': 512192, 'steps': 1000, 'loss/train': 4.395937442779541} -09/20/2021 17:57:14 - INFO - __main__ - Step 16007: {'lr': 0.00019998728465660105, 'samples': 512224, 'steps': 1000, 'loss/train': 3.79020619392395} -09/20/2021 17:57:15 - INFO - __main__ - Step 16008: {'lr': 0.00019998728465660105, 'samples': 512256, 'steps': 1000, 'loss/train': 4.190907955169678} -09/20/2021 17:57:15 - INFO - __main__ - Step 16009: {'lr': 0.00019998728465660105, 'samples': 512288, 'steps': 1000, 'loss/train': 3.9536361694335938} -09/20/2021 17:57:16 - INFO - __main__ - Step 16010: {'lr': 0.00019998728465660105, 'samples': 512320, 'steps': 1000, 'loss/train': 3.944126844406128} -09/20/2021 17:57:17 - INFO - __main__ - Step 16011: {'lr': 0.00019998728465660105, 'samples': 512352, 'steps': 1000, 'loss/train': 2.9513800144195557} -09/20/2021 17:57:18 - INFO - __main__ - Step 16012: {'lr': 0.00019998728465660105, 'samples': 512384, 'steps': 1000, 'loss/train': 2.251518726348877} -09/20/2021 17:57:18 - INFO - __main__ - Step 16013: {'lr': 0.00019998728465660105, 'samples': 512416, 'steps': 1000, 'loss/train': 2.4143190383911133} -09/20/2021 17:57:19 - INFO - __main__ - Step 16014: {'lr': 0.00019998728465660105, 'samples': 512448, 'steps': 1000, 'loss/train': 2.887258529663086} -09/20/2021 17:57:20 - INFO - __main__ - Step 16015: {'lr': 0.00019998728465660105, 'samples': 512480, 'steps': 1000, 'loss/train': 3.0335655212402344} -09/20/2021 17:57:21 - INFO - __main__ - Step 16016: {'lr': 0.00019998728465660105, 'samples': 512512, 'steps': 1000, 'loss/train': 2.3525593280792236} -09/20/2021 17:57:22 - INFO - __main__ - Step 16017: {'lr': 0.00019998718273258576, 'samples': 512544, 'steps': 1001, 'loss/train': 2.520092010498047} -09/20/2021 17:57:22 - INFO - __main__ - Step 16018: {'lr': 0.00019998718273258576, 'samples': 512576, 'steps': 1001, 'loss/train': 2.4529261589050293} -09/20/2021 17:57:23 - INFO - __main__ - Step 16019: {'lr': 0.00019998718273258576, 'samples': 512608, 'steps': 1001, 'loss/train': 2.9826929569244385} -09/20/2021 17:57:24 - INFO - __main__ - Step 16020: {'lr': 0.00019998718273258576, 'samples': 512640, 'steps': 1001, 'loss/train': 2.4821627140045166} -09/20/2021 17:57:25 - INFO - __main__ - Step 16021: {'lr': 0.00019998718273258576, 'samples': 512672, 'steps': 1001, 'loss/train': 4.204830646514893} -09/20/2021 17:57:25 - INFO - __main__ - Step 16022: {'lr': 0.00019998718273258576, 'samples': 512704, 'steps': 1001, 'loss/train': 3.795896530151367} -09/20/2021 17:57:26 - INFO - __main__ - Step 16023: {'lr': 0.00019998718273258576, 'samples': 512736, 'steps': 1001, 'loss/train': 5.11868953704834} -09/20/2021 17:57:27 - INFO - __main__ - Step 16024: {'lr': 0.00019998718273258576, 'samples': 512768, 'steps': 1001, 'loss/train': 2.996929407119751} -09/20/2021 17:57:28 - INFO - __main__ - Step 16025: {'lr': 0.00019998718273258576, 'samples': 512800, 'steps': 1001, 'loss/train': 3.1076643466949463} -09/20/2021 17:57:28 - INFO - __main__ - Step 16026: {'lr': 0.00019998718273258576, 'samples': 512832, 'steps': 1001, 'loss/train': 3.7157480716705322} -09/20/2021 17:57:29 - INFO - __main__ - Step 16027: {'lr': 0.00019998718273258576, 'samples': 512864, 'steps': 1001, 'loss/train': 2.520082473754883} -09/20/2021 17:57:30 - INFO - __main__ - Step 16028: {'lr': 0.00019998718273258576, 'samples': 512896, 'steps': 1001, 'loss/train': 2.4452428817749023} -09/20/2021 17:57:31 - INFO - __main__ - Step 16029: {'lr': 0.00019998718273258576, 'samples': 512928, 'steps': 1001, 'loss/train': 3.396850347518921} -09/20/2021 17:57:31 - INFO - __main__ - Step 16030: {'lr': 0.00019998718273258576, 'samples': 512960, 'steps': 1001, 'loss/train': 4.59843111038208} -09/20/2021 17:57:32 - INFO - __main__ - Step 16031: {'lr': 0.00019998718273258576, 'samples': 512992, 'steps': 1001, 'loss/train': 3.3161978721618652} -09/20/2021 17:57:33 - INFO - __main__ - Step 16032: {'lr': 0.00019998718273258576, 'samples': 513024, 'steps': 1001, 'loss/train': 2.938370943069458} -09/20/2021 17:57:34 - INFO - __main__ - Step 16033: {'lr': 0.00019998708040172303, 'samples': 513056, 'steps': 1002, 'loss/train': 4.4612650871276855} -09/20/2021 17:57:35 - INFO - __main__ - Step 16034: {'lr': 0.00019998708040172303, 'samples': 513088, 'steps': 1002, 'loss/train': 3.973130226135254} -09/20/2021 17:57:35 - INFO - __main__ - Step 16035: {'lr': 0.00019998708040172303, 'samples': 513120, 'steps': 1002, 'loss/train': 3.731865406036377} -09/20/2021 17:57:37 - INFO - __main__ - Step 16036: {'lr': 0.00019998708040172303, 'samples': 513152, 'steps': 1002, 'loss/train': 4.1545891761779785} -09/20/2021 17:57:37 - INFO - __main__ - Step 16037: {'lr': 0.00019998708040172303, 'samples': 513184, 'steps': 1002, 'loss/train': 3.9249746799468994} -09/20/2021 17:57:38 - INFO - __main__ - Step 16038: {'lr': 0.00019998708040172303, 'samples': 513216, 'steps': 1002, 'loss/train': 3.9705920219421387} -09/20/2021 17:57:39 - INFO - __main__ - Step 16039: {'lr': 0.00019998708040172303, 'samples': 513248, 'steps': 1002, 'loss/train': 4.0617170333862305} -09/20/2021 17:57:40 - INFO - __main__ - Step 16040: {'lr': 0.00019998708040172303, 'samples': 513280, 'steps': 1002, 'loss/train': 1.1372779607772827} -09/20/2021 17:57:40 - INFO - __main__ - Step 16041: {'lr': 0.00019998708040172303, 'samples': 513312, 'steps': 1002, 'loss/train': 1.0925617218017578} -09/20/2021 17:57:41 - INFO - __main__ - Step 16042: {'lr': 0.00019998708040172303, 'samples': 513344, 'steps': 1002, 'loss/train': 4.077350616455078} -09/20/2021 17:57:42 - INFO - __main__ - Step 16043: {'lr': 0.00019998708040172303, 'samples': 513376, 'steps': 1002, 'loss/train': 3.640183925628662} -09/20/2021 17:57:43 - INFO - __main__ - Step 16044: {'lr': 0.00019998708040172303, 'samples': 513408, 'steps': 1002, 'loss/train': 3.8515870571136475} -09/20/2021 17:57:43 - INFO - __main__ - Step 16045: {'lr': 0.00019998708040172303, 'samples': 513440, 'steps': 1002, 'loss/train': 2.9993038177490234} -09/20/2021 17:57:44 - INFO - __main__ - Step 16046: {'lr': 0.00019998708040172303, 'samples': 513472, 'steps': 1002, 'loss/train': 3.6386685371398926} -09/20/2021 17:57:45 - INFO - __main__ - Step 16047: {'lr': 0.00019998708040172303, 'samples': 513504, 'steps': 1002, 'loss/train': 3.6409099102020264} -09/20/2021 17:57:46 - INFO - __main__ - Step 16048: {'lr': 0.00019998708040172303, 'samples': 513536, 'steps': 1002, 'loss/train': 3.451484203338623} -09/20/2021 17:57:46 - INFO - __main__ - Step 16049: {'lr': 0.00019998697766401326, 'samples': 513568, 'steps': 1003, 'loss/train': 3.107962131500244} -09/20/2021 17:57:47 - INFO - __main__ - Step 16050: {'lr': 0.00019998697766401326, 'samples': 513600, 'steps': 1003, 'loss/train': 0.9931305050849915} -09/20/2021 17:57:48 - INFO - __main__ - Step 16051: {'lr': 0.00019998697766401326, 'samples': 513632, 'steps': 1003, 'loss/train': 3.05751371383667} -09/20/2021 17:57:49 - INFO - __main__ - Step 16052: {'lr': 0.00019998697766401326, 'samples': 513664, 'steps': 1003, 'loss/train': 0.8549700379371643} -09/20/2021 17:57:49 - INFO - __main__ - Step 16053: {'lr': 0.00019998697766401326, 'samples': 513696, 'steps': 1003, 'loss/train': 4.05575704574585} -09/20/2021 17:57:50 - INFO - __main__ - Step 16054: {'lr': 0.00019998697766401326, 'samples': 513728, 'steps': 1003, 'loss/train': 4.348228931427002} -09/20/2021 17:57:51 - INFO - __main__ - Step 16055: {'lr': 0.00019998697766401326, 'samples': 513760, 'steps': 1003, 'loss/train': 4.310413837432861} -09/20/2021 17:57:52 - INFO - __main__ - Step 16056: {'lr': 0.00019998697766401326, 'samples': 513792, 'steps': 1003, 'loss/train': 3.004060983657837} -09/20/2021 17:57:52 - INFO - __main__ - Step 16057: {'lr': 0.00019998697766401326, 'samples': 513824, 'steps': 1003, 'loss/train': 3.6554079055786133} -09/20/2021 17:57:53 - INFO - __main__ - Step 16058: {'lr': 0.00019998697766401326, 'samples': 513856, 'steps': 1003, 'loss/train': 3.503734588623047} -09/20/2021 17:57:54 - INFO - __main__ - Step 16059: {'lr': 0.00019998697766401326, 'samples': 513888, 'steps': 1003, 'loss/train': 3.218723773956299} -09/20/2021 17:57:55 - INFO - __main__ - Step 16060: {'lr': 0.00019998697766401326, 'samples': 513920, 'steps': 1003, 'loss/train': 3.2607169151306152} -09/20/2021 17:57:55 - INFO - __main__ - Step 16061: {'lr': 0.00019998697766401326, 'samples': 513952, 'steps': 1003, 'loss/train': 3.0453081130981445} -09/20/2021 17:57:56 - INFO - __main__ - Step 16062: {'lr': 0.00019998697766401326, 'samples': 513984, 'steps': 1003, 'loss/train': 4.802391052246094} -09/20/2021 17:57:57 - INFO - __main__ - Step 16063: {'lr': 0.00019998697766401326, 'samples': 514016, 'steps': 1003, 'loss/train': 3.1268837451934814} -09/20/2021 17:57:58 - INFO - __main__ - Step 16064: {'lr': 0.00019998697766401326, 'samples': 514048, 'steps': 1003, 'loss/train': 3.239445209503174} -09/20/2021 17:57:59 - INFO - __main__ - Step 16065: {'lr': 0.00019998687451945686, 'samples': 514080, 'steps': 1004, 'loss/train': 3.999701738357544} -09/20/2021 17:57:59 - INFO - __main__ - Step 16066: {'lr': 0.00019998687451945686, 'samples': 514112, 'steps': 1004, 'loss/train': 4.390561580657959} -09/20/2021 17:58:00 - INFO - __main__ - Step 16067: {'lr': 0.00019998687451945686, 'samples': 514144, 'steps': 1004, 'loss/train': 3.8088371753692627} -09/20/2021 17:58:01 - INFO - __main__ - Step 16068: {'lr': 0.00019998687451945686, 'samples': 514176, 'steps': 1004, 'loss/train': 4.649652004241943} -09/20/2021 17:58:02 - INFO - __main__ - Step 16069: {'lr': 0.00019998687451945686, 'samples': 514208, 'steps': 1004, 'loss/train': 3.7594308853149414} -09/20/2021 17:58:03 - INFO - __main__ - Step 16070: {'lr': 0.00019998687451945686, 'samples': 514240, 'steps': 1004, 'loss/train': 1.8322734832763672} -09/20/2021 17:58:04 - INFO - __main__ - Step 16071: {'lr': 0.00019998687451945686, 'samples': 514272, 'steps': 1004, 'loss/train': 4.647418975830078} -09/20/2021 17:58:04 - INFO - __main__ - Step 16072: {'lr': 0.00019998687451945686, 'samples': 514304, 'steps': 1004, 'loss/train': 3.6016547679901123} -09/20/2021 17:58:05 - INFO - __main__ - Step 16073: {'lr': 0.00019998687451945686, 'samples': 514336, 'steps': 1004, 'loss/train': 2.2471091747283936} -09/20/2021 17:58:06 - INFO - __main__ - Step 16074: {'lr': 0.00019998687451945686, 'samples': 514368, 'steps': 1004, 'loss/train': 3.779372215270996} -09/20/2021 17:58:07 - INFO - __main__ - Step 16075: {'lr': 0.00019998687451945686, 'samples': 514400, 'steps': 1004, 'loss/train': 3.2067461013793945} -09/20/2021 17:58:07 - INFO - __main__ - Step 16076: {'lr': 0.00019998687451945686, 'samples': 514432, 'steps': 1004, 'loss/train': 3.9586434364318848} -09/20/2021 17:58:08 - INFO - __main__ - Step 16077: {'lr': 0.00019998687451945686, 'samples': 514464, 'steps': 1004, 'loss/train': 6.689398288726807} -09/20/2021 17:58:09 - INFO - __main__ - Step 16078: {'lr': 0.00019998687451945686, 'samples': 514496, 'steps': 1004, 'loss/train': 3.302316188812256} -09/20/2021 17:58:10 - INFO - __main__ - Step 16079: {'lr': 0.00019998687451945686, 'samples': 514528, 'steps': 1004, 'loss/train': 3.653433322906494} -09/20/2021 17:58:10 - INFO - __main__ - Step 16080: {'lr': 0.00019998687451945686, 'samples': 514560, 'steps': 1004, 'loss/train': 4.723154067993164} -09/20/2021 17:58:11 - INFO - __main__ - Step 16081: {'lr': 0.00019998677096805427, 'samples': 514592, 'steps': 1005, 'loss/train': 4.227768421173096} -09/20/2021 17:58:12 - INFO - __main__ - Step 16082: {'lr': 0.00019998677096805427, 'samples': 514624, 'steps': 1005, 'loss/train': 3.7734274864196777} -09/20/2021 17:58:13 - INFO - __main__ - Step 16083: {'lr': 0.00019998677096805427, 'samples': 514656, 'steps': 1005, 'loss/train': 3.234647035598755} -09/20/2021 17:58:13 - INFO - __main__ - Step 16084: {'lr': 0.00019998677096805427, 'samples': 514688, 'steps': 1005, 'loss/train': 2.7285423278808594} -09/20/2021 17:58:14 - INFO - __main__ - Step 16085: {'lr': 0.00019998677096805427, 'samples': 514720, 'steps': 1005, 'loss/train': 3.405611753463745} -09/20/2021 17:58:15 - INFO - __main__ - Step 16086: {'lr': 0.00019998677096805427, 'samples': 514752, 'steps': 1005, 'loss/train': 3.7042062282562256} -09/20/2021 17:58:16 - INFO - __main__ - Step 16087: {'lr': 0.00019998677096805427, 'samples': 514784, 'steps': 1005, 'loss/train': 3.4121592044830322} -09/20/2021 17:58:16 - INFO - __main__ - Step 16088: {'lr': 0.00019998677096805427, 'samples': 514816, 'steps': 1005, 'loss/train': 3.1505320072174072} -09/20/2021 17:58:17 - INFO - __main__ - Step 16089: {'lr': 0.00019998677096805427, 'samples': 514848, 'steps': 1005, 'loss/train': 4.167568206787109} -09/20/2021 17:58:18 - INFO - __main__ - Step 16090: {'lr': 0.00019998677096805427, 'samples': 514880, 'steps': 1005, 'loss/train': 3.2527871131896973} -09/20/2021 17:58:19 - INFO - __main__ - Step 16091: {'lr': 0.00019998677096805427, 'samples': 514912, 'steps': 1005, 'loss/train': 4.273815631866455} -09/20/2021 17:58:19 - INFO - __main__ - Step 16092: {'lr': 0.00019998677096805427, 'samples': 514944, 'steps': 1005, 'loss/train': 3.814617156982422} -09/20/2021 17:58:20 - INFO - __main__ - Step 16093: {'lr': 0.00019998677096805427, 'samples': 514976, 'steps': 1005, 'loss/train': 3.9943039417266846} -09/20/2021 17:58:21 - INFO - __main__ - Step 16094: {'lr': 0.00019998677096805427, 'samples': 515008, 'steps': 1005, 'loss/train': 3.6091549396514893} -09/20/2021 17:58:22 - INFO - __main__ - Step 16095: {'lr': 0.00019998677096805427, 'samples': 515040, 'steps': 1005, 'loss/train': 3.922313928604126} -09/20/2021 17:58:22 - INFO - __main__ - Step 16096: {'lr': 0.00019998677096805427, 'samples': 515072, 'steps': 1005, 'loss/train': 1.4743494987487793} -09/20/2021 17:58:23 - INFO - __main__ - Step 16097: {'lr': 0.00019998666700980587, 'samples': 515104, 'steps': 1006, 'loss/train': 3.4936015605926514} -09/20/2021 17:58:24 - INFO - __main__ - Step 16098: {'lr': 0.00019998666700980587, 'samples': 515136, 'steps': 1006, 'loss/train': 1.4057832956314087} -09/20/2021 17:58:25 - INFO - __main__ - Step 16099: {'lr': 0.00019998666700980587, 'samples': 515168, 'steps': 1006, 'loss/train': 3.435076951980591} -09/20/2021 17:58:26 - INFO - __main__ - Step 16100: {'lr': 0.00019998666700980587, 'samples': 515200, 'steps': 1006, 'loss/train': 3.726776361465454} -09/20/2021 17:58:27 - INFO - __main__ - Step 16101: {'lr': 0.00019998666700980587, 'samples': 515232, 'steps': 1006, 'loss/train': 3.6486947536468506} -09/20/2021 17:58:28 - INFO - __main__ - Step 16102: {'lr': 0.00019998666700980587, 'samples': 515264, 'steps': 1006, 'loss/train': 3.016871929168701} -09/20/2021 17:58:28 - INFO - __main__ - Step 16103: {'lr': 0.00019998666700980587, 'samples': 515296, 'steps': 1006, 'loss/train': 3.426051378250122} -09/20/2021 17:58:29 - INFO - __main__ - Step 16104: {'lr': 0.00019998666700980587, 'samples': 515328, 'steps': 1006, 'loss/train': 3.910250186920166} -09/20/2021 17:58:30 - INFO - __main__ - Step 16105: {'lr': 0.00019998666700980587, 'samples': 515360, 'steps': 1006, 'loss/train': 3.8291122913360596} -09/20/2021 17:58:31 - INFO - __main__ - Step 16106: {'lr': 0.00019998666700980587, 'samples': 515392, 'steps': 1006, 'loss/train': 3.384821653366089} -09/20/2021 17:58:31 - INFO - __main__ - Step 16107: {'lr': 0.00019998666700980587, 'samples': 515424, 'steps': 1006, 'loss/train': 4.797665596008301} -09/20/2021 17:58:32 - INFO - __main__ - Step 16108: {'lr': 0.00019998666700980587, 'samples': 515456, 'steps': 1006, 'loss/train': 4.7918877601623535} -09/20/2021 17:58:33 - INFO - __main__ - Step 16109: {'lr': 0.00019998666700980587, 'samples': 515488, 'steps': 1006, 'loss/train': 4.033017158508301} -09/20/2021 17:58:34 - INFO - __main__ - Step 16110: {'lr': 0.00019998666700980587, 'samples': 515520, 'steps': 1006, 'loss/train': 3.72586989402771} -09/20/2021 17:58:34 - INFO - __main__ - Step 16111: {'lr': 0.00019998666700980587, 'samples': 515552, 'steps': 1006, 'loss/train': 1.9619593620300293} -09/20/2021 17:58:35 - INFO - __main__ - Step 16112: {'lr': 0.00019998666700980587, 'samples': 515584, 'steps': 1006, 'loss/train': 4.357485294342041} -09/20/2021 17:58:36 - INFO - __main__ - Step 16113: {'lr': 0.00019998656264471213, 'samples': 515616, 'steps': 1007, 'loss/train': 3.4105467796325684} -09/20/2021 17:58:37 - INFO - __main__ - Step 16114: {'lr': 0.00019998656264471213, 'samples': 515648, 'steps': 1007, 'loss/train': 4.25531005859375} -09/20/2021 17:58:37 - INFO - __main__ - Step 16115: {'lr': 0.00019998656264471213, 'samples': 515680, 'steps': 1007, 'loss/train': 4.66260290145874} -09/20/2021 17:58:38 - INFO - __main__ - Step 16116: {'lr': 0.00019998656264471213, 'samples': 515712, 'steps': 1007, 'loss/train': 2.6990463733673096} -09/20/2021 17:58:39 - INFO - __main__ - Step 16117: {'lr': 0.00019998656264471213, 'samples': 515744, 'steps': 1007, 'loss/train': 3.147958993911743} -09/20/2021 17:58:40 - INFO - __main__ - Step 16118: {'lr': 0.00019998656264471213, 'samples': 515776, 'steps': 1007, 'loss/train': 4.133133411407471} -09/20/2021 17:58:40 - INFO - __main__ - Step 16119: {'lr': 0.00019998656264471213, 'samples': 515808, 'steps': 1007, 'loss/train': 3.648719072341919} -09/20/2021 17:58:41 - INFO - __main__ - Step 16120: {'lr': 0.00019998656264471213, 'samples': 515840, 'steps': 1007, 'loss/train': 3.984060764312744} -09/20/2021 17:58:42 - INFO - __main__ - Step 16121: {'lr': 0.00019998656264471213, 'samples': 515872, 'steps': 1007, 'loss/train': 4.3640289306640625} -09/20/2021 17:58:43 - INFO - __main__ - Step 16122: {'lr': 0.00019998656264471213, 'samples': 515904, 'steps': 1007, 'loss/train': 3.938654899597168} -09/20/2021 17:58:43 - INFO - __main__ - Step 16123: {'lr': 0.00019998656264471213, 'samples': 515936, 'steps': 1007, 'loss/train': 3.415696620941162} -09/20/2021 17:58:44 - INFO - __main__ - Step 16124: {'lr': 0.00019998656264471213, 'samples': 515968, 'steps': 1007, 'loss/train': 6.04343843460083} -09/20/2021 17:58:45 - INFO - __main__ - Step 16125: {'lr': 0.00019998656264471213, 'samples': 516000, 'steps': 1007, 'loss/train': 4.319607734680176} -09/20/2021 17:58:46 - INFO - __main__ - Step 16126: {'lr': 0.00019998656264471213, 'samples': 516032, 'steps': 1007, 'loss/train': 2.8789451122283936} -09/20/2021 17:58:46 - INFO - __main__ - Step 16127: {'lr': 0.00019998656264471213, 'samples': 516064, 'steps': 1007, 'loss/train': 3.1329598426818848} -09/20/2021 17:58:47 - INFO - __main__ - Step 16128: {'lr': 0.00019998656264471213, 'samples': 516096, 'steps': 1007, 'loss/train': 3.4441094398498535} -09/20/2021 17:58:49 - INFO - __main__ - Step 16129: {'lr': 0.00019998645787277345, 'samples': 516128, 'steps': 1008, 'loss/train': 5.480945587158203} -09/20/2021 17:58:49 - INFO - __main__ - Step 16130: {'lr': 0.00019998645787277345, 'samples': 516160, 'steps': 1008, 'loss/train': 3.0596587657928467} -09/20/2021 17:58:50 - INFO - __main__ - Step 16131: {'lr': 0.00019998645787277345, 'samples': 516192, 'steps': 1008, 'loss/train': 3.3060033321380615} -09/20/2021 17:58:51 - INFO - __main__ - Step 16132: {'lr': 0.00019998645787277345, 'samples': 516224, 'steps': 1008, 'loss/train': 4.165552616119385} -09/20/2021 17:58:52 - INFO - __main__ - Step 16133: {'lr': 0.00019998645787277345, 'samples': 516256, 'steps': 1008, 'loss/train': 2.809051752090454} -09/20/2021 17:58:52 - INFO - __main__ - Step 16134: {'lr': 0.00019998645787277345, 'samples': 516288, 'steps': 1008, 'loss/train': 3.151676654815674} -09/20/2021 17:58:53 - INFO - __main__ - Step 16135: {'lr': 0.00019998645787277345, 'samples': 516320, 'steps': 1008, 'loss/train': 3.954951524734497} -09/20/2021 17:58:54 - INFO - __main__ - Step 16136: {'lr': 0.00019998645787277345, 'samples': 516352, 'steps': 1008, 'loss/train': 3.4410791397094727} -09/20/2021 17:58:55 - INFO - __main__ - Step 16137: {'lr': 0.00019998645787277345, 'samples': 516384, 'steps': 1008, 'loss/train': 2.8260838985443115} -09/20/2021 17:58:55 - INFO - __main__ - Step 16138: {'lr': 0.00019998645787277345, 'samples': 516416, 'steps': 1008, 'loss/train': 2.919102191925049} -09/20/2021 17:58:56 - INFO - __main__ - Step 16139: {'lr': 0.00019998645787277345, 'samples': 516448, 'steps': 1008, 'loss/train': 3.703247308731079} -09/20/2021 17:58:57 - INFO - __main__ - Step 16140: {'lr': 0.00019998645787277345, 'samples': 516480, 'steps': 1008, 'loss/train': 4.2796783447265625} -09/20/2021 17:58:58 - INFO - __main__ - Step 16141: {'lr': 0.00019998645787277345, 'samples': 516512, 'steps': 1008, 'loss/train': 5.169033527374268} -09/20/2021 17:58:58 - INFO - __main__ - Step 16142: {'lr': 0.00019998645787277345, 'samples': 516544, 'steps': 1008, 'loss/train': 0.4310355484485626} -09/20/2021 17:58:59 - INFO - __main__ - Step 16143: {'lr': 0.00019998645787277345, 'samples': 516576, 'steps': 1008, 'loss/train': 3.7963781356811523} -09/20/2021 17:59:00 - INFO - __main__ - Step 16144: {'lr': 0.00019998645787277345, 'samples': 516608, 'steps': 1008, 'loss/train': 3.3849740028381348} -09/20/2021 17:59:01 - INFO - __main__ - Step 16145: {'lr': 0.00019998635269399028, 'samples': 516640, 'steps': 1009, 'loss/train': 2.038330554962158} -09/20/2021 17:59:02 - INFO - __main__ - Step 16146: {'lr': 0.00019998635269399028, 'samples': 516672, 'steps': 1009, 'loss/train': 3.0835044384002686} -09/20/2021 17:59:02 - INFO - __main__ - Step 16147: {'lr': 0.00019998635269399028, 'samples': 516704, 'steps': 1009, 'loss/train': 4.201567649841309} -09/20/2021 17:59:03 - INFO - __main__ - Step 16148: {'lr': 0.00019998635269399028, 'samples': 516736, 'steps': 1009, 'loss/train': 3.7115819454193115} -09/20/2021 17:59:04 - INFO - __main__ - Step 16149: {'lr': 0.00019998635269399028, 'samples': 516768, 'steps': 1009, 'loss/train': 2.642718553543091} -09/20/2021 17:59:05 - INFO - __main__ - Step 16150: {'lr': 0.00019998635269399028, 'samples': 516800, 'steps': 1009, 'loss/train': 3.8588390350341797} -09/20/2021 17:59:05 - INFO - __main__ - Step 16151: {'lr': 0.00019998635269399028, 'samples': 516832, 'steps': 1009, 'loss/train': 2.2619385719299316} -09/20/2021 17:59:06 - INFO - __main__ - Step 16152: {'lr': 0.00019998635269399028, 'samples': 516864, 'steps': 1009, 'loss/train': 4.16005277633667} -09/20/2021 17:59:07 - INFO - __main__ - Step 16153: {'lr': 0.00019998635269399028, 'samples': 516896, 'steps': 1009, 'loss/train': 3.630361795425415} -09/20/2021 17:59:08 - INFO - __main__ - Step 16154: {'lr': 0.00019998635269399028, 'samples': 516928, 'steps': 1009, 'loss/train': 3.9931814670562744} -09/20/2021 17:59:08 - INFO - __main__ - Step 16155: {'lr': 0.00019998635269399028, 'samples': 516960, 'steps': 1009, 'loss/train': 3.5368406772613525} -09/20/2021 17:59:09 - INFO - __main__ - Step 16156: {'lr': 0.00019998635269399028, 'samples': 516992, 'steps': 1009, 'loss/train': 3.230665445327759} -09/20/2021 17:59:10 - INFO - __main__ - Step 16157: {'lr': 0.00019998635269399028, 'samples': 517024, 'steps': 1009, 'loss/train': 3.358604669570923} -09/20/2021 17:59:11 - INFO - __main__ - Step 16158: {'lr': 0.00019998635269399028, 'samples': 517056, 'steps': 1009, 'loss/train': 3.572463274002075} -09/20/2021 17:59:11 - INFO - __main__ - Step 16159: {'lr': 0.00019998635269399028, 'samples': 517088, 'steps': 1009, 'loss/train': 3.98758864402771} -09/20/2021 17:59:12 - INFO - __main__ - Step 16160: {'lr': 0.00019998635269399028, 'samples': 517120, 'steps': 1009, 'loss/train': 2.6083576679229736} -09/20/2021 17:59:14 - INFO - __main__ - Step 16161: {'lr': 0.000199986247108363, 'samples': 517152, 'steps': 1010, 'loss/train': 2.951728105545044} -09/20/2021 17:59:15 - INFO - __main__ - Step 16162: {'lr': 0.000199986247108363, 'samples': 517184, 'steps': 1010, 'loss/train': 5.956739902496338} -09/20/2021 17:59:16 - INFO - __main__ - Step 16163: {'lr': 0.000199986247108363, 'samples': 517216, 'steps': 1010, 'loss/train': 3.9013683795928955} -09/20/2021 17:59:17 - INFO - __main__ - Step 16164: {'lr': 0.000199986247108363, 'samples': 517248, 'steps': 1010, 'loss/train': 3.105844020843506} -09/20/2021 17:59:17 - INFO - __main__ - Step 16165: {'lr': 0.000199986247108363, 'samples': 517280, 'steps': 1010, 'loss/train': 4.361906051635742} -09/20/2021 17:59:18 - INFO - __main__ - Step 16166: {'lr': 0.000199986247108363, 'samples': 517312, 'steps': 1010, 'loss/train': 3.111755847930908} -09/20/2021 17:59:19 - INFO - __main__ - Step 16167: {'lr': 0.000199986247108363, 'samples': 517344, 'steps': 1010, 'loss/train': 0.9241458773612976} -09/20/2021 17:59:20 - INFO - __main__ - Step 16168: {'lr': 0.000199986247108363, 'samples': 517376, 'steps': 1010, 'loss/train': 1.2265263795852661} -09/20/2021 17:59:20 - INFO - __main__ - Step 16169: {'lr': 0.000199986247108363, 'samples': 517408, 'steps': 1010, 'loss/train': 1.0863972902297974} -09/20/2021 17:59:21 - INFO - __main__ - Step 16170: {'lr': 0.000199986247108363, 'samples': 517440, 'steps': 1010, 'loss/train': 0.8797239661216736} -09/20/2021 17:59:22 - INFO - __main__ - Step 16171: {'lr': 0.000199986247108363, 'samples': 517472, 'steps': 1010, 'loss/train': 1.1410683393478394} -09/20/2021 17:59:23 - INFO - __main__ - Step 16172: {'lr': 0.000199986247108363, 'samples': 517504, 'steps': 1010, 'loss/train': 3.771864652633667} -09/20/2021 17:59:23 - INFO - __main__ - Step 16173: {'lr': 0.000199986247108363, 'samples': 517536, 'steps': 1010, 'loss/train': 5.468175888061523} -09/20/2021 17:59:24 - INFO - __main__ - Step 16174: {'lr': 0.000199986247108363, 'samples': 517568, 'steps': 1010, 'loss/train': 3.966752052307129} -09/20/2021 17:59:25 - INFO - __main__ - Step 16175: {'lr': 0.000199986247108363, 'samples': 517600, 'steps': 1010, 'loss/train': 3.449098587036133} -09/20/2021 17:59:26 - INFO - __main__ - Step 16176: {'lr': 0.000199986247108363, 'samples': 517632, 'steps': 1010, 'loss/train': 3.618473529815674} -09/20/2021 17:59:26 - INFO - __main__ - Step 16177: {'lr': 0.0001999861411158921, 'samples': 517664, 'steps': 1011, 'loss/train': 3.7077786922454834} -09/20/2021 17:59:27 - INFO - __main__ - Step 16178: {'lr': 0.0001999861411158921, 'samples': 517696, 'steps': 1011, 'loss/train': 2.9738316535949707} -09/20/2021 17:59:28 - INFO - __main__ - Step 16179: {'lr': 0.0001999861411158921, 'samples': 517728, 'steps': 1011, 'loss/train': 3.4771957397460938} -09/20/2021 17:59:29 - INFO - __main__ - Step 16180: {'lr': 0.0001999861411158921, 'samples': 517760, 'steps': 1011, 'loss/train': 2.9120383262634277} -09/20/2021 17:59:29 - INFO - __main__ - Step 16181: {'lr': 0.0001999861411158921, 'samples': 517792, 'steps': 1011, 'loss/train': 4.003663063049316} -09/20/2021 17:59:30 - INFO - __main__ - Step 16182: {'lr': 0.0001999861411158921, 'samples': 517824, 'steps': 1011, 'loss/train': 4.4059929847717285} -09/20/2021 17:59:31 - INFO - __main__ - Step 16183: {'lr': 0.0001999861411158921, 'samples': 517856, 'steps': 1011, 'loss/train': 3.9342617988586426} -09/20/2021 17:59:32 - INFO - __main__ - Step 16184: {'lr': 0.0001999861411158921, 'samples': 517888, 'steps': 1011, 'loss/train': 4.56647253036499} -09/20/2021 17:59:32 - INFO - __main__ - Step 16185: {'lr': 0.0001999861411158921, 'samples': 517920, 'steps': 1011, 'loss/train': 3.5698344707489014} -09/20/2021 17:59:33 - INFO - __main__ - Step 16186: {'lr': 0.0001999861411158921, 'samples': 517952, 'steps': 1011, 'loss/train': 3.3634724617004395} -09/20/2021 17:59:34 - INFO - __main__ - Step 16187: {'lr': 0.0001999861411158921, 'samples': 517984, 'steps': 1011, 'loss/train': 2.7736997604370117} -09/20/2021 17:59:35 - INFO - __main__ - Step 16188: {'lr': 0.0001999861411158921, 'samples': 518016, 'steps': 1011, 'loss/train': 3.922589063644409} -09/20/2021 17:59:35 - INFO - __main__ - Step 16189: {'lr': 0.0001999861411158921, 'samples': 518048, 'steps': 1011, 'loss/train': 3.7026305198669434} -09/20/2021 17:59:36 - INFO - __main__ - Step 16190: {'lr': 0.0001999861411158921, 'samples': 518080, 'steps': 1011, 'loss/train': 3.125936985015869} -09/20/2021 17:59:38 - INFO - __main__ - Step 16191: {'lr': 0.0001999861411158921, 'samples': 518112, 'steps': 1011, 'loss/train': 3.6138393878936768} -09/20/2021 17:59:38 - INFO - __main__ - Step 16192: {'lr': 0.0001999861411158921, 'samples': 518144, 'steps': 1011, 'loss/train': 3.4523074626922607} -09/20/2021 17:59:39 - INFO - __main__ - Step 16193: {'lr': 0.00019998603471657793, 'samples': 518176, 'steps': 1012, 'loss/train': 3.764824867248535} -09/20/2021 17:59:40 - INFO - __main__ - Step 16194: {'lr': 0.00019998603471657793, 'samples': 518208, 'steps': 1012, 'loss/train': 4.240139484405518} -09/20/2021 17:59:41 - INFO - __main__ - Step 16195: {'lr': 0.00019998603471657793, 'samples': 518240, 'steps': 1012, 'loss/train': 2.864414930343628} -09/20/2021 17:59:41 - INFO - __main__ - Step 16196: {'lr': 0.00019998603471657793, 'samples': 518272, 'steps': 1012, 'loss/train': 3.434279680252075} -09/20/2021 17:59:42 - INFO - __main__ - Step 16197: {'lr': 0.00019998603471657793, 'samples': 518304, 'steps': 1012, 'loss/train': 4.229237079620361} -09/20/2021 17:59:43 - INFO - __main__ - Step 16198: {'lr': 0.00019998603471657793, 'samples': 518336, 'steps': 1012, 'loss/train': 2.783200740814209} -09/20/2021 17:59:44 - INFO - __main__ - Step 16199: {'lr': 0.00019998603471657793, 'samples': 518368, 'steps': 1012, 'loss/train': 3.4406962394714355} -09/20/2021 17:59:44 - INFO - __main__ - Step 16200: {'lr': 0.00019998603471657793, 'samples': 518400, 'steps': 1012, 'loss/train': 4.131840229034424} -09/20/2021 17:59:45 - INFO - __main__ - Step 16201: {'lr': 0.00019998603471657793, 'samples': 518432, 'steps': 1012, 'loss/train': 3.6698431968688965} -09/20/2021 17:59:46 - INFO - __main__ - Step 16202: {'lr': 0.00019998603471657793, 'samples': 518464, 'steps': 1012, 'loss/train': 3.7140510082244873} -09/20/2021 17:59:47 - INFO - __main__ - Step 16203: {'lr': 0.00019998603471657793, 'samples': 518496, 'steps': 1012, 'loss/train': 4.029637336730957} -09/20/2021 17:59:47 - INFO - __main__ - Step 16204: {'lr': 0.00019998603471657793, 'samples': 518528, 'steps': 1012, 'loss/train': 3.123328447341919} -09/20/2021 17:59:48 - INFO - __main__ - Step 16205: {'lr': 0.00019998603471657793, 'samples': 518560, 'steps': 1012, 'loss/train': 2.962404489517212} -09/20/2021 17:59:49 - INFO - __main__ - Step 16206: {'lr': 0.00019998603471657793, 'samples': 518592, 'steps': 1012, 'loss/train': 4.222660064697266} -09/20/2021 17:59:50 - INFO - __main__ - Step 16207: {'lr': 0.00019998603471657793, 'samples': 518624, 'steps': 1012, 'loss/train': 3.579965353012085} -09/20/2021 17:59:51 - INFO - __main__ - Step 16208: {'lr': 0.00019998603471657793, 'samples': 518656, 'steps': 1012, 'loss/train': 4.011941432952881} -09/20/2021 17:59:51 - INFO - __main__ - Step 16209: {'lr': 0.00019998592791042102, 'samples': 518688, 'steps': 1013, 'loss/train': 2.9698901176452637} -09/20/2021 17:59:52 - INFO - __main__ - Step 16210: {'lr': 0.00019998592791042102, 'samples': 518720, 'steps': 1013, 'loss/train': 3.4776034355163574} -09/20/2021 17:59:53 - INFO - __main__ - Step 16211: {'lr': 0.00019998592791042102, 'samples': 518752, 'steps': 1013, 'loss/train': 4.4357991218566895} -09/20/2021 17:59:54 - INFO - __main__ - Step 16212: {'lr': 0.00019998592791042102, 'samples': 518784, 'steps': 1013, 'loss/train': 3.9312613010406494} -09/20/2021 17:59:54 - INFO - __main__ - Step 16213: {'lr': 0.00019998592791042102, 'samples': 518816, 'steps': 1013, 'loss/train': 3.272785186767578} -09/20/2021 17:59:55 - INFO - __main__ - Step 16214: {'lr': 0.00019998592791042102, 'samples': 518848, 'steps': 1013, 'loss/train': 1.2235506772994995} -09/20/2021 17:59:56 - INFO - __main__ - Step 16215: {'lr': 0.00019998592791042102, 'samples': 518880, 'steps': 1013, 'loss/train': 3.1111998558044434} -09/20/2021 17:59:57 - INFO - __main__ - Step 16216: {'lr': 0.00019998592791042102, 'samples': 518912, 'steps': 1013, 'loss/train': 2.8822178840637207} -09/20/2021 17:59:57 - INFO - __main__ - Step 16217: {'lr': 0.00019998592791042102, 'samples': 518944, 'steps': 1013, 'loss/train': 3.204272508621216} -09/20/2021 17:59:58 - INFO - __main__ - Step 16218: {'lr': 0.00019998592791042102, 'samples': 518976, 'steps': 1013, 'loss/train': 6.268996238708496} -09/20/2021 17:59:59 - INFO - __main__ - Step 16219: {'lr': 0.00019998592791042102, 'samples': 519008, 'steps': 1013, 'loss/train': 3.7576277256011963} -09/20/2021 18:00:00 - INFO - __main__ - Step 16220: {'lr': 0.00019998592791042102, 'samples': 519040, 'steps': 1013, 'loss/train': 3.9940803050994873} -09/20/2021 18:00:00 - INFO - __main__ - Step 16221: {'lr': 0.00019998592791042102, 'samples': 519072, 'steps': 1013, 'loss/train': 3.7167611122131348} -09/20/2021 18:00:02 - INFO - __main__ - Step 16222: {'lr': 0.00019998592791042102, 'samples': 519104, 'steps': 1013, 'loss/train': 3.753918409347534} -09/20/2021 18:00:02 - INFO - __main__ - Step 16223: {'lr': 0.00019998592791042102, 'samples': 519136, 'steps': 1013, 'loss/train': 3.717944383621216} -09/20/2021 18:00:03 - INFO - __main__ - Step 16224: {'lr': 0.00019998592791042102, 'samples': 519168, 'steps': 1013, 'loss/train': 3.0987932682037354} -09/20/2021 18:00:04 - INFO - __main__ - Step 16225: {'lr': 0.00019998582069742174, 'samples': 519200, 'steps': 1014, 'loss/train': 2.4567813873291016} -09/20/2021 18:00:05 - INFO - __main__ - Step 16226: {'lr': 0.00019998582069742174, 'samples': 519232, 'steps': 1014, 'loss/train': 3.4428396224975586} -09/20/2021 18:00:06 - INFO - __main__ - Step 16227: {'lr': 0.00019998582069742174, 'samples': 519264, 'steps': 1014, 'loss/train': 5.14805269241333} -09/20/2021 18:00:06 - INFO - __main__ - Step 16228: {'lr': 0.00019998582069742174, 'samples': 519296, 'steps': 1014, 'loss/train': 5.245973110198975} -09/20/2021 18:00:07 - INFO - __main__ - Step 16229: {'lr': 0.00019998582069742174, 'samples': 519328, 'steps': 1014, 'loss/train': 5.230166435241699} -09/20/2021 18:00:08 - INFO - __main__ - Step 16230: {'lr': 0.00019998582069742174, 'samples': 519360, 'steps': 1014, 'loss/train': 3.0847103595733643} -09/20/2021 18:00:09 - INFO - __main__ - Step 16231: {'lr': 0.00019998582069742174, 'samples': 519392, 'steps': 1014, 'loss/train': 3.5275418758392334} -09/20/2021 18:00:09 - INFO - __main__ - Step 16232: {'lr': 0.00019998582069742174, 'samples': 519424, 'steps': 1014, 'loss/train': 4.312446117401123} -09/20/2021 18:00:10 - INFO - __main__ - Step 16233: {'lr': 0.00019998582069742174, 'samples': 519456, 'steps': 1014, 'loss/train': 3.7435503005981445} -09/20/2021 18:00:11 - INFO - __main__ - Step 16234: {'lr': 0.00019998582069742174, 'samples': 519488, 'steps': 1014, 'loss/train': 3.338655471801758} -09/20/2021 18:00:12 - INFO - __main__ - Step 16235: {'lr': 0.00019998582069742174, 'samples': 519520, 'steps': 1014, 'loss/train': 5.144443511962891} -09/20/2021 18:00:12 - INFO - __main__ - Step 16236: {'lr': 0.00019998582069742174, 'samples': 519552, 'steps': 1014, 'loss/train': 3.228353500366211} -09/20/2021 18:00:13 - INFO - __main__ - Step 16237: {'lr': 0.00019998582069742174, 'samples': 519584, 'steps': 1014, 'loss/train': 3.216973304748535} -09/20/2021 18:00:14 - INFO - __main__ - Step 16238: {'lr': 0.00019998582069742174, 'samples': 519616, 'steps': 1014, 'loss/train': 3.4668173789978027} -09/20/2021 18:00:15 - INFO - __main__ - Step 16239: {'lr': 0.00019998582069742174, 'samples': 519648, 'steps': 1014, 'loss/train': 4.054415702819824} -09/20/2021 18:00:15 - INFO - __main__ - Step 16240: {'lr': 0.00019998582069742174, 'samples': 519680, 'steps': 1014, 'loss/train': 3.7273776531219482} -09/20/2021 18:00:16 - INFO - __main__ - Step 16241: {'lr': 0.00019998571307758053, 'samples': 519712, 'steps': 1015, 'loss/train': 2.4931700229644775} -09/20/2021 18:00:17 - INFO - __main__ - Step 16242: {'lr': 0.00019998571307758053, 'samples': 519744, 'steps': 1015, 'loss/train': 3.729112386703491} -09/20/2021 18:00:18 - INFO - __main__ - Step 16243: {'lr': 0.00019998571307758053, 'samples': 519776, 'steps': 1015, 'loss/train': 2.8137457370758057} -09/20/2021 18:00:19 - INFO - __main__ - Step 16244: {'lr': 0.00019998571307758053, 'samples': 519808, 'steps': 1015, 'loss/train': 3.202610731124878} -09/20/2021 18:00:19 - INFO - __main__ - Step 16245: {'lr': 0.00019998571307758053, 'samples': 519840, 'steps': 1015, 'loss/train': 3.4855968952178955} -09/20/2021 18:00:20 - INFO - __main__ - Step 16246: {'lr': 0.00019998571307758053, 'samples': 519872, 'steps': 1015, 'loss/train': 3.3659133911132812} -09/20/2021 18:00:21 - INFO - __main__ - Step 16247: {'lr': 0.00019998571307758053, 'samples': 519904, 'steps': 1015, 'loss/train': 2.914597988128662} -09/20/2021 18:00:22 - INFO - __main__ - Step 16248: {'lr': 0.00019998571307758053, 'samples': 519936, 'steps': 1015, 'loss/train': 3.6340384483337402} -09/20/2021 18:00:22 - INFO - __main__ - Step 16249: {'lr': 0.00019998571307758053, 'samples': 519968, 'steps': 1015, 'loss/train': 3.147368907928467} -09/20/2021 18:00:23 - INFO - __main__ - Step 16250: {'lr': 0.00019998571307758053, 'samples': 520000, 'steps': 1015, 'loss/train': 3.042914628982544} -09/20/2021 18:00:24 - INFO - __main__ - Step 16251: {'lr': 0.00019998571307758053, 'samples': 520032, 'steps': 1015, 'loss/train': 4.125889778137207} -09/20/2021 18:00:25 - INFO - __main__ - Step 16252: {'lr': 0.00019998571307758053, 'samples': 520064, 'steps': 1015, 'loss/train': 3.2137279510498047} -09/20/2021 18:00:26 - INFO - __main__ - Step 16253: {'lr': 0.00019998571307758053, 'samples': 520096, 'steps': 1015, 'loss/train': 3.5654642581939697} -09/20/2021 18:00:27 - INFO - __main__ - Step 16254: {'lr': 0.00019998571307758053, 'samples': 520128, 'steps': 1015, 'loss/train': 3.650127649307251} -09/20/2021 18:00:28 - INFO - __main__ - Step 16255: {'lr': 0.00019998571307758053, 'samples': 520160, 'steps': 1015, 'loss/train': 3.7793731689453125} -09/20/2021 18:00:28 - INFO - __main__ - Step 16256: {'lr': 0.00019998571307758053, 'samples': 520192, 'steps': 1015, 'loss/train': 1.9674828052520752} -09/20/2021 18:00:29 - INFO - __main__ - Step 16257: {'lr': 0.00019998560505089788, 'samples': 520224, 'steps': 1016, 'loss/train': 4.122433662414551} -09/20/2021 18:00:30 - INFO - __main__ - Step 16258: {'lr': 0.00019998560505089788, 'samples': 520256, 'steps': 1016, 'loss/train': 3.3258116245269775} -09/20/2021 18:00:31 - INFO - __main__ - Step 16259: {'lr': 0.00019998560505089788, 'samples': 520288, 'steps': 1016, 'loss/train': 3.7192468643188477} -09/20/2021 18:00:31 - INFO - __main__ - Step 16260: {'lr': 0.00019998560505089788, 'samples': 520320, 'steps': 1016, 'loss/train': 3.238250732421875} -09/20/2021 18:00:32 - INFO - __main__ - Step 16261: {'lr': 0.00019998560505089788, 'samples': 520352, 'steps': 1016, 'loss/train': 3.933090925216675} -09/20/2021 18:00:33 - INFO - __main__ - Step 16262: {'lr': 0.00019998560505089788, 'samples': 520384, 'steps': 1016, 'loss/train': 2.971858501434326} -09/20/2021 18:00:34 - INFO - __main__ - Step 16263: {'lr': 0.00019998560505089788, 'samples': 520416, 'steps': 1016, 'loss/train': 4.171779632568359} -09/20/2021 18:00:34 - INFO - __main__ - Step 16264: {'lr': 0.00019998560505089788, 'samples': 520448, 'steps': 1016, 'loss/train': 3.553072452545166} -09/20/2021 18:00:35 - INFO - __main__ - Step 16265: {'lr': 0.00019998560505089788, 'samples': 520480, 'steps': 1016, 'loss/train': 2.9982705116271973} -09/20/2021 18:00:36 - INFO - __main__ - Step 16266: {'lr': 0.00019998560505089788, 'samples': 520512, 'steps': 1016, 'loss/train': 3.8458869457244873} -09/20/2021 18:00:37 - INFO - __main__ - Step 16267: {'lr': 0.00019998560505089788, 'samples': 520544, 'steps': 1016, 'loss/train': 3.1676828861236572} -09/20/2021 18:00:37 - INFO - __main__ - Step 16268: {'lr': 0.00019998560505089788, 'samples': 520576, 'steps': 1016, 'loss/train': 3.1005749702453613} -09/20/2021 18:00:38 - INFO - __main__ - Step 16269: {'lr': 0.00019998560505089788, 'samples': 520608, 'steps': 1016, 'loss/train': 3.7665185928344727} -09/20/2021 18:00:39 - INFO - __main__ - Step 16270: {'lr': 0.00019998560505089788, 'samples': 520640, 'steps': 1016, 'loss/train': 3.5328567028045654} -09/20/2021 18:00:40 - INFO - __main__ - Step 16271: {'lr': 0.00019998560505089788, 'samples': 520672, 'steps': 1016, 'loss/train': 2.487091541290283} -09/20/2021 18:00:40 - INFO - __main__ - Step 16272: {'lr': 0.00019998560505089788, 'samples': 520704, 'steps': 1016, 'loss/train': 3.4343292713165283} -09/20/2021 18:00:41 - INFO - __main__ - Step 16273: {'lr': 0.00019998549661737417, 'samples': 520736, 'steps': 1017, 'loss/train': 3.518709182739258} -09/20/2021 18:00:42 - INFO - __main__ - Step 16274: {'lr': 0.00019998549661737417, 'samples': 520768, 'steps': 1017, 'loss/train': 3.5611023902893066} -09/20/2021 18:00:43 - INFO - __main__ - Step 16275: {'lr': 0.00019998549661737417, 'samples': 520800, 'steps': 1017, 'loss/train': 3.3488059043884277} -09/20/2021 18:00:44 - INFO - __main__ - Step 16276: {'lr': 0.00019998549661737417, 'samples': 520832, 'steps': 1017, 'loss/train': 3.9737908840179443} -09/20/2021 18:00:44 - INFO - __main__ - Step 16277: {'lr': 0.00019998549661737417, 'samples': 520864, 'steps': 1017, 'loss/train': 1.8740953207015991} -09/20/2021 18:00:45 - INFO - __main__ - Step 16278: {'lr': 0.00019998549661737417, 'samples': 520896, 'steps': 1017, 'loss/train': 3.608269691467285} -09/20/2021 18:00:46 - INFO - __main__ - Step 16279: {'lr': 0.00019998549661737417, 'samples': 520928, 'steps': 1017, 'loss/train': 3.0913870334625244} -09/20/2021 18:00:47 - INFO - __main__ - Step 16280: {'lr': 0.00019998549661737417, 'samples': 520960, 'steps': 1017, 'loss/train': 3.9596238136291504} -09/20/2021 18:00:47 - INFO - __main__ - Step 16281: {'lr': 0.00019998549661737417, 'samples': 520992, 'steps': 1017, 'loss/train': 0.690735936164856} -09/20/2021 18:00:48 - INFO - __main__ - Step 16282: {'lr': 0.00019998549661737417, 'samples': 521024, 'steps': 1017, 'loss/train': 0.8680158853530884} -09/20/2021 18:00:49 - INFO - __main__ - Step 16283: {'lr': 0.00019998549661737417, 'samples': 521056, 'steps': 1017, 'loss/train': 0.7781879305839539} -09/20/2021 18:00:50 - INFO - __main__ - Step 16284: {'lr': 0.00019998549661737417, 'samples': 521088, 'steps': 1017, 'loss/train': 1.0393385887145996} -09/20/2021 18:00:51 - INFO - __main__ - Step 16285: {'lr': 0.00019998549661737417, 'samples': 521120, 'steps': 1017, 'loss/train': 3.910341739654541} -09/20/2021 18:00:52 - INFO - __main__ - Step 16286: {'lr': 0.00019998549661737417, 'samples': 521152, 'steps': 1017, 'loss/train': 4.052924156188965} -09/20/2021 18:00:52 - INFO - __main__ - Step 16287: {'lr': 0.00019998549661737417, 'samples': 521184, 'steps': 1017, 'loss/train': 2.921952724456787} -09/20/2021 18:00:53 - INFO - __main__ - Step 16288: {'lr': 0.00019998549661737417, 'samples': 521216, 'steps': 1017, 'loss/train': 4.6393513679504395} -09/20/2021 18:00:54 - INFO - __main__ - Step 16289: {'lr': 0.00019998538777700985, 'samples': 521248, 'steps': 1018, 'loss/train': 3.132366180419922} -09/20/2021 18:00:55 - INFO - __main__ - Step 16290: {'lr': 0.00019998538777700985, 'samples': 521280, 'steps': 1018, 'loss/train': 3.4729037284851074} -09/20/2021 18:00:56 - INFO - __main__ - Step 16291: {'lr': 0.00019998538777700985, 'samples': 521312, 'steps': 1018, 'loss/train': 3.613501787185669} -09/20/2021 18:00:56 - INFO - __main__ - Step 16292: {'lr': 0.00019998538777700985, 'samples': 521344, 'steps': 1018, 'loss/train': 3.880370616912842} -09/20/2021 18:00:57 - INFO - __main__ - Step 16293: {'lr': 0.00019998538777700985, 'samples': 521376, 'steps': 1018, 'loss/train': 4.375450134277344} -09/20/2021 18:00:58 - INFO - __main__ - Step 16294: {'lr': 0.00019998538777700985, 'samples': 521408, 'steps': 1018, 'loss/train': 4.618492603302002} -09/20/2021 18:00:59 - INFO - __main__ - Step 16295: {'lr': 0.00019998538777700985, 'samples': 521440, 'steps': 1018, 'loss/train': 3.3559281826019287} -09/20/2021 18:00:59 - INFO - __main__ - Step 16296: {'lr': 0.00019998538777700985, 'samples': 521472, 'steps': 1018, 'loss/train': 3.153653621673584} -09/20/2021 18:01:00 - INFO - __main__ - Step 16297: {'lr': 0.00019998538777700985, 'samples': 521504, 'steps': 1018, 'loss/train': 2.692232847213745} -09/20/2021 18:01:01 - INFO - __main__ - Step 16298: {'lr': 0.00019998538777700985, 'samples': 521536, 'steps': 1018, 'loss/train': 2.7918667793273926} -09/20/2021 18:01:02 - INFO - __main__ - Step 16299: {'lr': 0.00019998538777700985, 'samples': 521568, 'steps': 1018, 'loss/train': 2.782586097717285} -09/20/2021 18:01:02 - INFO - __main__ - Step 16300: {'lr': 0.00019998538777700985, 'samples': 521600, 'steps': 1018, 'loss/train': 2.9303994178771973} -09/20/2021 18:01:03 - INFO - __main__ - Step 16301: {'lr': 0.00019998538777700985, 'samples': 521632, 'steps': 1018, 'loss/train': 3.983285903930664} -09/20/2021 18:01:04 - INFO - __main__ - Step 16302: {'lr': 0.00019998538777700985, 'samples': 521664, 'steps': 1018, 'loss/train': 3.816537380218506} -09/20/2021 18:01:05 - INFO - __main__ - Step 16303: {'lr': 0.00019998538777700985, 'samples': 521696, 'steps': 1018, 'loss/train': 4.156362056732178} -09/20/2021 18:01:05 - INFO - __main__ - Step 16304: {'lr': 0.00019998538777700985, 'samples': 521728, 'steps': 1018, 'loss/train': 4.140986442565918} -09/20/2021 18:01:06 - INFO - __main__ - Step 16305: {'lr': 0.00019998527852980538, 'samples': 521760, 'steps': 1019, 'loss/train': 2.7823240756988525} -09/20/2021 18:01:07 - INFO - __main__ - Step 16306: {'lr': 0.00019998527852980538, 'samples': 521792, 'steps': 1019, 'loss/train': 3.674727439880371} -09/20/2021 18:01:08 - INFO - __main__ - Step 16307: {'lr': 0.00019998527852980538, 'samples': 521824, 'steps': 1019, 'loss/train': 2.5253779888153076} -09/20/2021 18:01:09 - INFO - __main__ - Step 16308: {'lr': 0.00019998527852980538, 'samples': 521856, 'steps': 1019, 'loss/train': 2.981658697128296} -09/20/2021 18:01:09 - INFO - __main__ - Step 16309: {'lr': 0.00019998527852980538, 'samples': 521888, 'steps': 1019, 'loss/train': 4.077123641967773} -09/20/2021 18:01:10 - INFO - __main__ - Step 16310: {'lr': 0.00019998527852980538, 'samples': 521920, 'steps': 1019, 'loss/train': 3.6450040340423584} -09/20/2021 18:01:11 - INFO - __main__ - Step 16311: {'lr': 0.00019998527852980538, 'samples': 521952, 'steps': 1019, 'loss/train': 4.32492733001709} -09/20/2021 18:01:12 - INFO - __main__ - Step 16312: {'lr': 0.00019998527852980538, 'samples': 521984, 'steps': 1019, 'loss/train': 3.173368453979492} -09/20/2021 18:01:12 - INFO - __main__ - Step 16313: {'lr': 0.00019998527852980538, 'samples': 522016, 'steps': 1019, 'loss/train': 3.3301167488098145} -09/20/2021 18:01:13 - INFO - __main__ - Step 16314: {'lr': 0.00019998527852980538, 'samples': 522048, 'steps': 1019, 'loss/train': 2.7219338417053223} -09/20/2021 18:01:14 - INFO - __main__ - Step 16315: {'lr': 0.00019998527852980538, 'samples': 522080, 'steps': 1019, 'loss/train': 3.1370046138763428} -09/20/2021 18:01:15 - INFO - __main__ - Step 16316: {'lr': 0.00019998527852980538, 'samples': 522112, 'steps': 1019, 'loss/train': 4.035208225250244} -09/20/2021 18:01:16 - INFO - __main__ - Step 16317: {'lr': 0.00019998527852980538, 'samples': 522144, 'steps': 1019, 'loss/train': 5.2658467292785645} -09/20/2021 18:01:17 - INFO - __main__ - Step 16318: {'lr': 0.00019998527852980538, 'samples': 522176, 'steps': 1019, 'loss/train': 4.24972677230835} -09/20/2021 18:01:17 - INFO - __main__ - Step 16319: {'lr': 0.00019998527852980538, 'samples': 522208, 'steps': 1019, 'loss/train': 3.637037992477417} -09/20/2021 18:01:18 - INFO - __main__ - Step 16320: {'lr': 0.00019998527852980538, 'samples': 522240, 'steps': 1019, 'loss/train': 3.4241485595703125} -09/20/2021 18:01:19 - INFO - __main__ - Step 16321: {'lr': 0.00019998516887576118, 'samples': 522272, 'steps': 1020, 'loss/train': 3.5273921489715576} -09/20/2021 18:01:20 - INFO - __main__ - Step 16322: {'lr': 0.00019998516887576118, 'samples': 522304, 'steps': 1020, 'loss/train': 4.885688304901123} -09/20/2021 18:01:20 - INFO - __main__ - Step 16323: {'lr': 0.00019998516887576118, 'samples': 522336, 'steps': 1020, 'loss/train': 3.2045812606811523} -09/20/2021 18:01:21 - INFO - __main__ - Step 16324: {'lr': 0.00019998516887576118, 'samples': 522368, 'steps': 1020, 'loss/train': 4.113254070281982} -09/20/2021 18:01:22 - INFO - __main__ - Step 16325: {'lr': 0.00019998516887576118, 'samples': 522400, 'steps': 1020, 'loss/train': 3.859143018722534} -09/20/2021 18:01:23 - INFO - __main__ - Step 16326: {'lr': 0.00019998516887576118, 'samples': 522432, 'steps': 1020, 'loss/train': 4.370606899261475} -09/20/2021 18:01:23 - INFO - __main__ - Step 16327: {'lr': 0.00019998516887576118, 'samples': 522464, 'steps': 1020, 'loss/train': 2.945362091064453} -09/20/2021 18:01:24 - INFO - __main__ - Step 16328: {'lr': 0.00019998516887576118, 'samples': 522496, 'steps': 1020, 'loss/train': 4.132382869720459} -09/20/2021 18:01:25 - INFO - __main__ - Step 16329: {'lr': 0.00019998516887576118, 'samples': 522528, 'steps': 1020, 'loss/train': 3.7648115158081055} -09/20/2021 18:01:26 - INFO - __main__ - Step 16330: {'lr': 0.00019998516887576118, 'samples': 522560, 'steps': 1020, 'loss/train': 4.062252044677734} -09/20/2021 18:01:26 - INFO - __main__ - Step 16331: {'lr': 0.00019998516887576118, 'samples': 522592, 'steps': 1020, 'loss/train': 2.905266523361206} -09/20/2021 18:01:27 - INFO - __main__ - Step 16332: {'lr': 0.00019998516887576118, 'samples': 522624, 'steps': 1020, 'loss/train': 3.296480655670166} -09/20/2021 18:01:28 - INFO - __main__ - Step 16333: {'lr': 0.00019998516887576118, 'samples': 522656, 'steps': 1020, 'loss/train': 5.322028636932373} -09/20/2021 18:01:29 - INFO - __main__ - Step 16334: {'lr': 0.00019998516887576118, 'samples': 522688, 'steps': 1020, 'loss/train': 3.7151031494140625} -09/20/2021 18:01:29 - INFO - __main__ - Step 16335: {'lr': 0.00019998516887576118, 'samples': 522720, 'steps': 1020, 'loss/train': 5.356051445007324} -09/20/2021 18:01:30 - INFO - __main__ - Step 16336: {'lr': 0.00019998516887576118, 'samples': 522752, 'steps': 1020, 'loss/train': 3.935054302215576} -09/20/2021 18:01:31 - INFO - __main__ - Step 16337: {'lr': 0.00019998505881487776, 'samples': 522784, 'steps': 1021, 'loss/train': 1.4198598861694336} -09/20/2021 18:01:32 - INFO - __main__ - Step 16338: {'lr': 0.00019998505881487776, 'samples': 522816, 'steps': 1021, 'loss/train': 0.8410055041313171} -09/20/2021 18:01:33 - INFO - __main__ - Step 16339: {'lr': 0.00019998505881487776, 'samples': 522848, 'steps': 1021, 'loss/train': 0.9813398718833923} -09/20/2021 18:01:33 - INFO - __main__ - Step 16340: {'lr': 0.00019998505881487776, 'samples': 522880, 'steps': 1021, 'loss/train': 3.8008291721343994} -09/20/2021 18:01:34 - INFO - __main__ - Step 16341: {'lr': 0.00019998505881487776, 'samples': 522912, 'steps': 1021, 'loss/train': 4.146449565887451} -09/20/2021 18:01:35 - INFO - __main__ - Step 16342: {'lr': 0.00019998505881487776, 'samples': 522944, 'steps': 1021, 'loss/train': 4.558727264404297} -09/20/2021 18:01:36 - INFO - __main__ - Step 16343: {'lr': 0.00019998505881487776, 'samples': 522976, 'steps': 1021, 'loss/train': 2.3747141361236572} -09/20/2021 18:01:36 - INFO - __main__ - Step 16344: {'lr': 0.00019998505881487776, 'samples': 523008, 'steps': 1021, 'loss/train': 4.000399112701416} -09/20/2021 18:01:37 - INFO - __main__ - Step 16345: {'lr': 0.00019998505881487776, 'samples': 523040, 'steps': 1021, 'loss/train': 3.433439016342163} -09/20/2021 18:01:38 - INFO - __main__ - Step 16346: {'lr': 0.00019998505881487776, 'samples': 523072, 'steps': 1021, 'loss/train': 3.9325778484344482} -09/20/2021 18:01:39 - INFO - __main__ - Step 16347: {'lr': 0.00019998505881487776, 'samples': 523104, 'steps': 1021, 'loss/train': 4.3516845703125} -09/20/2021 18:01:40 - INFO - __main__ - Step 16348: {'lr': 0.00019998505881487776, 'samples': 523136, 'steps': 1021, 'loss/train': 3.409386396408081} -09/20/2021 18:01:41 - INFO - __main__ - Step 16349: {'lr': 0.00019998505881487776, 'samples': 523168, 'steps': 1021, 'loss/train': 3.4404661655426025} -09/20/2021 18:01:41 - INFO - __main__ - Step 16350: {'lr': 0.00019998505881487776, 'samples': 523200, 'steps': 1021, 'loss/train': 3.4126908779144287} -09/20/2021 18:01:42 - INFO - __main__ - Step 16351: {'lr': 0.00019998505881487776, 'samples': 523232, 'steps': 1021, 'loss/train': 3.991340398788452} -09/20/2021 18:01:43 - INFO - __main__ - Step 16352: {'lr': 0.00019998505881487776, 'samples': 523264, 'steps': 1021, 'loss/train': 3.8097856044769287} -09/20/2021 18:01:44 - INFO - __main__ - Step 16353: {'lr': 0.0001999849483471555, 'samples': 523296, 'steps': 1022, 'loss/train': 4.7481369972229} -09/20/2021 18:01:45 - INFO - __main__ - Step 16354: {'lr': 0.0001999849483471555, 'samples': 523328, 'steps': 1022, 'loss/train': 3.154947519302368} -09/20/2021 18:01:45 - INFO - __main__ - Step 16355: {'lr': 0.0001999849483471555, 'samples': 523360, 'steps': 1022, 'loss/train': 3.855118989944458} -09/20/2021 18:01:46 - INFO - __main__ - Step 16356: {'lr': 0.0001999849483471555, 'samples': 523392, 'steps': 1022, 'loss/train': 3.970745801925659} -09/20/2021 18:01:47 - INFO - __main__ - Step 16357: {'lr': 0.0001999849483471555, 'samples': 523424, 'steps': 1022, 'loss/train': 3.402665376663208} -09/20/2021 18:01:48 - INFO - __main__ - Step 16358: {'lr': 0.0001999849483471555, 'samples': 523456, 'steps': 1022, 'loss/train': 3.3956243991851807} -09/20/2021 18:01:48 - INFO - __main__ - Step 16359: {'lr': 0.0001999849483471555, 'samples': 523488, 'steps': 1022, 'loss/train': 3.1386494636535645} -09/20/2021 18:01:49 - INFO - __main__ - Step 16360: {'lr': 0.0001999849483471555, 'samples': 523520, 'steps': 1022, 'loss/train': 3.4696004390716553} -09/20/2021 18:01:50 - INFO - __main__ - Step 16361: {'lr': 0.0001999849483471555, 'samples': 523552, 'steps': 1022, 'loss/train': 3.61580753326416} -09/20/2021 18:01:51 - INFO - __main__ - Step 16362: {'lr': 0.0001999849483471555, 'samples': 523584, 'steps': 1022, 'loss/train': 2.9891161918640137} -09/20/2021 18:01:51 - INFO - __main__ - Step 16363: {'lr': 0.0001999849483471555, 'samples': 523616, 'steps': 1022, 'loss/train': 3.878293037414551} -09/20/2021 18:01:52 - INFO - __main__ - Step 16364: {'lr': 0.0001999849483471555, 'samples': 523648, 'steps': 1022, 'loss/train': 4.113058090209961} -09/20/2021 18:01:53 - INFO - __main__ - Step 16365: {'lr': 0.0001999849483471555, 'samples': 523680, 'steps': 1022, 'loss/train': 6.420399188995361} -09/20/2021 18:01:54 - INFO - __main__ - Step 16366: {'lr': 0.0001999849483471555, 'samples': 523712, 'steps': 1022, 'loss/train': 4.688931941986084} -09/20/2021 18:01:54 - INFO - __main__ - Step 16367: {'lr': 0.0001999849483471555, 'samples': 523744, 'steps': 1022, 'loss/train': 2.4787063598632812} -09/20/2021 18:01:55 - INFO - __main__ - Step 16368: {'lr': 0.0001999849483471555, 'samples': 523776, 'steps': 1022, 'loss/train': 2.873718500137329} -09/20/2021 18:01:56 - INFO - __main__ - Step 16369: {'lr': 0.00019998483747259485, 'samples': 523808, 'steps': 1023, 'loss/train': 3.352414846420288} -09/20/2021 18:01:57 - INFO - __main__ - Step 16370: {'lr': 0.00019998483747259485, 'samples': 523840, 'steps': 1023, 'loss/train': 3.298740863800049} -09/20/2021 18:01:57 - INFO - __main__ - Step 16371: {'lr': 0.00019998483747259485, 'samples': 523872, 'steps': 1023, 'loss/train': 3.4934113025665283} -09/20/2021 18:01:58 - INFO - __main__ - Step 16372: {'lr': 0.00019998483747259485, 'samples': 523904, 'steps': 1023, 'loss/train': 4.732107639312744} -09/20/2021 18:01:59 - INFO - __main__ - Step 16373: {'lr': 0.00019998483747259485, 'samples': 523936, 'steps': 1023, 'loss/train': 2.107717990875244} -09/20/2021 18:02:00 - INFO - __main__ - Step 16374: {'lr': 0.00019998483747259485, 'samples': 523968, 'steps': 1023, 'loss/train': 3.4457154273986816} -09/20/2021 18:02:00 - INFO - __main__ - Step 16375: {'lr': 0.00019998483747259485, 'samples': 524000, 'steps': 1023, 'loss/train': 3.5539634227752686} -09/20/2021 18:02:01 - INFO - __main__ - Step 16376: {'lr': 0.00019998483747259485, 'samples': 524032, 'steps': 1023, 'loss/train': 1.9539785385131836} -09/20/2021 18:02:03 - INFO - __main__ - Step 16377: {'lr': 0.00019998483747259485, 'samples': 524064, 'steps': 1023, 'loss/train': 4.332353115081787} -09/20/2021 18:02:03 - INFO - __main__ - Step 16378: {'lr': 0.00019998483747259485, 'samples': 524096, 'steps': 1023, 'loss/train': 3.5412511825561523} -09/20/2021 18:02:04 - INFO - __main__ - Step 16379: {'lr': 0.00019998483747259485, 'samples': 524128, 'steps': 1023, 'loss/train': 4.41445779800415} -09/20/2021 18:02:05 - INFO - __main__ - Step 16380: {'lr': 0.00019998483747259485, 'samples': 524160, 'steps': 1023, 'loss/train': 4.436588287353516} -09/20/2021 18:02:06 - INFO - __main__ - Step 16381: {'lr': 0.00019998483747259485, 'samples': 524192, 'steps': 1023, 'loss/train': 3.289426565170288} -09/20/2021 18:02:06 - INFO - __main__ - Step 16382: {'lr': 0.00019998483747259485, 'samples': 524224, 'steps': 1023, 'loss/train': 3.814120054244995} -09/20/2021 18:02:07 - INFO - __main__ - Step 16383: {'lr': 0.00019998483747259485, 'samples': 524256, 'steps': 1023, 'loss/train': 3.748422622680664} -09/20/2021 18:02:08 - INFO - __main__ - Step 16384: {'lr': 0.00019998483747259485, 'samples': 524288, 'steps': 1023, 'loss/train': 4.332422256469727} -09/20/2021 18:02:09 - INFO - __main__ - Step 16385: {'lr': 0.00019998472619119632, 'samples': 524320, 'steps': 1024, 'loss/train': 4.1946868896484375} -09/20/2021 18:02:10 - INFO - __main__ - Step 16386: {'lr': 0.00019998472619119632, 'samples': 524352, 'steps': 1024, 'loss/train': 4.3815693855285645} -09/20/2021 18:02:10 - INFO - __main__ - Step 16387: {'lr': 0.00019998472619119632, 'samples': 524384, 'steps': 1024, 'loss/train': 3.7051265239715576} -09/20/2021 18:02:11 - INFO - __main__ - Step 16388: {'lr': 0.00019998472619119632, 'samples': 524416, 'steps': 1024, 'loss/train': 4.096824645996094} -09/20/2021 18:02:12 - INFO - __main__ - Step 16389: {'lr': 0.00019998472619119632, 'samples': 524448, 'steps': 1024, 'loss/train': 4.114298343658447} -09/20/2021 18:02:13 - INFO - __main__ - Step 16390: {'lr': 0.00019998472619119632, 'samples': 524480, 'steps': 1024, 'loss/train': 3.6279184818267822} -09/20/2021 18:02:13 - INFO - __main__ - Step 16391: {'lr': 0.00019998472619119632, 'samples': 524512, 'steps': 1024, 'loss/train': 4.410857677459717} -09/20/2021 18:02:14 - INFO - __main__ - Step 16392: {'lr': 0.00019998472619119632, 'samples': 524544, 'steps': 1024, 'loss/train': 4.36497688293457} -09/20/2021 18:02:15 - INFO - __main__ - Step 16393: {'lr': 0.00019998472619119632, 'samples': 524576, 'steps': 1024, 'loss/train': 4.208351135253906} -09/20/2021 18:02:16 - INFO - __main__ - Step 16394: {'lr': 0.00019998472619119632, 'samples': 524608, 'steps': 1024, 'loss/train': 5.059843063354492} -09/20/2021 18:02:16 - INFO - __main__ - Step 16395: {'lr': 0.00019998472619119632, 'samples': 524640, 'steps': 1024, 'loss/train': 4.070626258850098} -09/20/2021 18:02:17 - INFO - __main__ - Step 16396: {'lr': 0.00019998472619119632, 'samples': 524672, 'steps': 1024, 'loss/train': 3.5299692153930664} -09/20/2021 18:02:18 - INFO - __main__ - Step 16397: {'lr': 0.00019998472619119632, 'samples': 524704, 'steps': 1024, 'loss/train': 3.210362672805786} -09/20/2021 18:02:19 - INFO - __main__ - Step 16398: {'lr': 0.00019998472619119632, 'samples': 524736, 'steps': 1024, 'loss/train': 4.868376731872559} -09/20/2021 18:02:19 - INFO - __main__ - Step 16399: {'lr': 0.00019998472619119632, 'samples': 524768, 'steps': 1024, 'loss/train': 4.634317874908447} -09/20/2021 18:02:20 - INFO - __main__ - Step 16400: {'lr': 0.00019998472619119632, 'samples': 524800, 'steps': 1024, 'loss/train': 4.416247844696045} -09/20/2021 18:02:21 - INFO - __main__ - Step 16401: {'lr': 0.00019998461450296035, 'samples': 524832, 'steps': 1025, 'loss/train': 3.7022910118103027} -09/20/2021 18:02:22 - INFO - __main__ - Step 16402: {'lr': 0.00019998461450296035, 'samples': 524864, 'steps': 1025, 'loss/train': 4.132094860076904} -09/20/2021 18:02:23 - INFO - __main__ - Step 16403: {'lr': 0.00019998461450296035, 'samples': 524896, 'steps': 1025, 'loss/train': 4.005939483642578} -09/20/2021 18:02:23 - INFO - __main__ - Step 16404: {'lr': 0.00019998461450296035, 'samples': 524928, 'steps': 1025, 'loss/train': 3.7306926250457764} -09/20/2021 18:02:24 - INFO - __main__ - Step 16405: {'lr': 0.00019998461450296035, 'samples': 524960, 'steps': 1025, 'loss/train': 3.446471691131592} -09/20/2021 18:02:25 - INFO - __main__ - Step 16406: {'lr': 0.00019998461450296035, 'samples': 524992, 'steps': 1025, 'loss/train': 3.6605513095855713} -09/20/2021 18:02:26 - INFO - __main__ - Step 16407: {'lr': 0.00019998461450296035, 'samples': 525024, 'steps': 1025, 'loss/train': 3.862619638442993} -09/20/2021 18:02:26 - INFO - __main__ - Step 16408: {'lr': 0.00019998461450296035, 'samples': 525056, 'steps': 1025, 'loss/train': 4.039466857910156} -09/20/2021 18:02:27 - INFO - __main__ - Step 16409: {'lr': 0.00019998461450296035, 'samples': 525088, 'steps': 1025, 'loss/train': 3.1368064880371094} -09/20/2021 18:02:28 - INFO - __main__ - Step 16410: {'lr': 0.00019998461450296035, 'samples': 525120, 'steps': 1025, 'loss/train': 4.196860313415527} -09/20/2021 18:02:29 - INFO - __main__ - Step 16411: {'lr': 0.00019998461450296035, 'samples': 525152, 'steps': 1025, 'loss/train': 4.140643119812012} -09/20/2021 18:02:30 - INFO - __main__ - Step 16412: {'lr': 0.00019998461450296035, 'samples': 525184, 'steps': 1025, 'loss/train': 3.6725456714630127} -09/20/2021 18:02:31 - INFO - __main__ - Step 16413: {'lr': 0.00019998461450296035, 'samples': 525216, 'steps': 1025, 'loss/train': 3.2749550342559814} -09/20/2021 18:02:31 - INFO - __main__ - Step 16414: {'lr': 0.00019998461450296035, 'samples': 525248, 'steps': 1025, 'loss/train': 4.657914161682129} -09/20/2021 18:02:32 - INFO - __main__ - Step 16415: {'lr': 0.00019998461450296035, 'samples': 525280, 'steps': 1025, 'loss/train': 3.5573480129241943} -09/20/2021 18:02:33 - INFO - __main__ - Step 16416: {'lr': 0.00019998461450296035, 'samples': 525312, 'steps': 1025, 'loss/train': 2.419579029083252} -09/20/2021 18:02:34 - INFO - __main__ - Step 16417: {'lr': 0.00019998450240788732, 'samples': 525344, 'steps': 1026, 'loss/train': 2.5515875816345215} -09/20/2021 18:02:35 - INFO - __main__ - Step 16418: {'lr': 0.00019998450240788732, 'samples': 525376, 'steps': 1026, 'loss/train': 2.4988181591033936} -09/20/2021 18:02:35 - INFO - __main__ - Step 16419: {'lr': 0.00019998450240788732, 'samples': 525408, 'steps': 1026, 'loss/train': 3.971752882003784} -09/20/2021 18:02:36 - INFO - __main__ - Step 16420: {'lr': 0.00019998450240788732, 'samples': 525440, 'steps': 1026, 'loss/train': 3.1762285232543945} -09/20/2021 18:02:37 - INFO - __main__ - Step 16421: {'lr': 0.00019998450240788732, 'samples': 525472, 'steps': 1026, 'loss/train': 1.5635325908660889} -09/20/2021 18:02:38 - INFO - __main__ - Step 16422: {'lr': 0.00019998450240788732, 'samples': 525504, 'steps': 1026, 'loss/train': 3.9341652393341064} -09/20/2021 18:02:38 - INFO - __main__ - Step 16423: {'lr': 0.00019998450240788732, 'samples': 525536, 'steps': 1026, 'loss/train': 3.7796285152435303} -09/20/2021 18:02:39 - INFO - __main__ - Step 16424: {'lr': 0.00019998450240788732, 'samples': 525568, 'steps': 1026, 'loss/train': 3.450078010559082} -09/20/2021 18:02:40 - INFO - __main__ - Step 16425: {'lr': 0.00019998450240788732, 'samples': 525600, 'steps': 1026, 'loss/train': 3.9474620819091797} -09/20/2021 18:02:41 - INFO - __main__ - Step 16426: {'lr': 0.00019998450240788732, 'samples': 525632, 'steps': 1026, 'loss/train': 3.564650774002075} -09/20/2021 18:02:41 - INFO - __main__ - Step 16427: {'lr': 0.00019998450240788732, 'samples': 525664, 'steps': 1026, 'loss/train': 3.341826915740967} -09/20/2021 18:02:42 - INFO - __main__ - Step 16428: {'lr': 0.00019998450240788732, 'samples': 525696, 'steps': 1026, 'loss/train': 3.9062838554382324} -09/20/2021 18:02:43 - INFO - __main__ - Step 16429: {'lr': 0.00019998450240788732, 'samples': 525728, 'steps': 1026, 'loss/train': 4.202979564666748} -09/20/2021 18:02:44 - INFO - __main__ - Step 16430: {'lr': 0.00019998450240788732, 'samples': 525760, 'steps': 1026, 'loss/train': 3.1804261207580566} -09/20/2021 18:02:44 - INFO - __main__ - Step 16431: {'lr': 0.00019998450240788732, 'samples': 525792, 'steps': 1026, 'loss/train': 4.856154918670654} -09/20/2021 18:02:45 - INFO - __main__ - Step 16432: {'lr': 0.00019998450240788732, 'samples': 525824, 'steps': 1026, 'loss/train': 2.9293570518493652} -09/20/2021 18:02:46 - INFO - __main__ - Step 16433: {'lr': 0.00019998438990597776, 'samples': 525856, 'steps': 1027, 'loss/train': 3.604722738265991} -09/20/2021 18:02:47 - INFO - __main__ - Step 16434: {'lr': 0.00019998438990597776, 'samples': 525888, 'steps': 1027, 'loss/train': 3.2783050537109375} -09/20/2021 18:02:47 - INFO - __main__ - Step 16435: {'lr': 0.00019998438990597776, 'samples': 525920, 'steps': 1027, 'loss/train': 3.405156135559082} -09/20/2021 18:02:48 - INFO - __main__ - Step 16436: {'lr': 0.00019998438990597776, 'samples': 525952, 'steps': 1027, 'loss/train': 3.9823334217071533} -09/20/2021 18:02:49 - INFO - __main__ - Step 16437: {'lr': 0.00019998438990597776, 'samples': 525984, 'steps': 1027, 'loss/train': 3.370699882507324} -09/20/2021 18:02:50 - INFO - __main__ - Step 16438: {'lr': 0.00019998438990597776, 'samples': 526016, 'steps': 1027, 'loss/train': 6.087665557861328} -09/20/2021 18:02:50 - INFO - __main__ - Step 16439: {'lr': 0.00019998438990597776, 'samples': 526048, 'steps': 1027, 'loss/train': 3.6560964584350586} -09/20/2021 18:02:51 - INFO - __main__ - Step 16440: {'lr': 0.00019998438990597776, 'samples': 526080, 'steps': 1027, 'loss/train': 3.3894588947296143} -09/20/2021 18:02:52 - INFO - __main__ - Step 16441: {'lr': 0.00019998438990597776, 'samples': 526112, 'steps': 1027, 'loss/train': 4.334916114807129} -09/20/2021 18:02:53 - INFO - __main__ - Step 16442: {'lr': 0.00019998438990597776, 'samples': 526144, 'steps': 1027, 'loss/train': 4.305843830108643} -09/20/2021 18:02:54 - INFO - __main__ - Step 16443: {'lr': 0.00019998438990597776, 'samples': 526176, 'steps': 1027, 'loss/train': 6.251089096069336} -09/20/2021 18:02:55 - INFO - __main__ - Step 16444: {'lr': 0.00019998438990597776, 'samples': 526208, 'steps': 1027, 'loss/train': 3.0477232933044434} -09/20/2021 18:02:55 - INFO - __main__ - Step 16445: {'lr': 0.00019998438990597776, 'samples': 526240, 'steps': 1027, 'loss/train': 4.437353610992432} -09/20/2021 18:02:56 - INFO - __main__ - Step 16446: {'lr': 0.00019998438990597776, 'samples': 526272, 'steps': 1027, 'loss/train': 4.029785633087158} -09/20/2021 18:02:57 - INFO - __main__ - Step 16447: {'lr': 0.00019998438990597776, 'samples': 526304, 'steps': 1027, 'loss/train': 2.3912527561187744} -09/20/2021 18:02:58 - INFO - __main__ - Step 16448: {'lr': 0.00019998438990597776, 'samples': 526336, 'steps': 1027, 'loss/train': 3.5135912895202637} -09/20/2021 18:02:59 - INFO - __main__ - Step 16449: {'lr': 0.0001999842769972321, 'samples': 526368, 'steps': 1028, 'loss/train': 4.100309371948242} -09/20/2021 18:02:59 - INFO - __main__ - Step 16450: {'lr': 0.0001999842769972321, 'samples': 526400, 'steps': 1028, 'loss/train': 3.8180670738220215} -09/20/2021 18:03:00 - INFO - __main__ - Step 16451: {'lr': 0.0001999842769972321, 'samples': 526432, 'steps': 1028, 'loss/train': 3.932492733001709} -09/20/2021 18:03:01 - INFO - __main__ - Step 16452: {'lr': 0.0001999842769972321, 'samples': 526464, 'steps': 1028, 'loss/train': 3.9454119205474854} -09/20/2021 18:03:02 - INFO - __main__ - Step 16453: {'lr': 0.0001999842769972321, 'samples': 526496, 'steps': 1028, 'loss/train': 3.166383981704712} -09/20/2021 18:03:02 - INFO - __main__ - Step 16454: {'lr': 0.0001999842769972321, 'samples': 526528, 'steps': 1028, 'loss/train': 4.204378128051758} -09/20/2021 18:03:03 - INFO - __main__ - Step 16455: {'lr': 0.0001999842769972321, 'samples': 526560, 'steps': 1028, 'loss/train': 2.989276170730591} -09/20/2021 18:03:04 - INFO - __main__ - Step 16456: {'lr': 0.0001999842769972321, 'samples': 526592, 'steps': 1028, 'loss/train': 3.8674116134643555} -09/20/2021 18:03:05 - INFO - __main__ - Step 16457: {'lr': 0.0001999842769972321, 'samples': 526624, 'steps': 1028, 'loss/train': 4.086343288421631} -09/20/2021 18:03:05 - INFO - __main__ - Step 16458: {'lr': 0.0001999842769972321, 'samples': 526656, 'steps': 1028, 'loss/train': 4.3911848068237305} -09/20/2021 18:03:06 - INFO - __main__ - Step 16459: {'lr': 0.0001999842769972321, 'samples': 526688, 'steps': 1028, 'loss/train': 5.406864166259766} -09/20/2021 18:03:07 - INFO - __main__ - Step 16460: {'lr': 0.0001999842769972321, 'samples': 526720, 'steps': 1028, 'loss/train': 3.6873974800109863} -09/20/2021 18:03:08 - INFO - __main__ - Step 16461: {'lr': 0.0001999842769972321, 'samples': 526752, 'steps': 1028, 'loss/train': 4.014548301696777} -09/20/2021 18:03:08 - INFO - __main__ - Step 16462: {'lr': 0.0001999842769972321, 'samples': 526784, 'steps': 1028, 'loss/train': 4.054057598114014} -09/20/2021 18:03:09 - INFO - __main__ - Step 16463: {'lr': 0.0001999842769972321, 'samples': 526816, 'steps': 1028, 'loss/train': 3.694007635116577} -09/20/2021 18:03:10 - INFO - __main__ - Step 16464: {'lr': 0.0001999842769972321, 'samples': 526848, 'steps': 1028, 'loss/train': 3.1213555335998535} -09/20/2021 18:03:11 - INFO - __main__ - Step 16465: {'lr': 0.0001999841636816508, 'samples': 526880, 'steps': 1029, 'loss/train': 3.7819719314575195} -09/20/2021 18:03:11 - INFO - __main__ - Step 16466: {'lr': 0.0001999841636816508, 'samples': 526912, 'steps': 1029, 'loss/train': 3.380856513977051} -09/20/2021 18:03:12 - INFO - __main__ - Step 16467: {'lr': 0.0001999841636816508, 'samples': 526944, 'steps': 1029, 'loss/train': 4.050007343292236} -09/20/2021 18:03:13 - INFO - __main__ - Step 16468: {'lr': 0.0001999841636816508, 'samples': 526976, 'steps': 1029, 'loss/train': 3.5644540786743164} -09/20/2021 18:03:14 - INFO - __main__ - Step 16469: {'lr': 0.0001999841636816508, 'samples': 527008, 'steps': 1029, 'loss/train': 4.422165393829346} -09/20/2021 18:03:14 - INFO - __main__ - Step 16470: {'lr': 0.0001999841636816508, 'samples': 527040, 'steps': 1029, 'loss/train': 4.002499103546143} -09/20/2021 18:03:15 - INFO - __main__ - Step 16471: {'lr': 0.0001999841636816508, 'samples': 527072, 'steps': 1029, 'loss/train': 3.996476173400879} -09/20/2021 18:03:16 - INFO - __main__ - Step 16472: {'lr': 0.0001999841636816508, 'samples': 527104, 'steps': 1029, 'loss/train': 3.37630295753479} -09/20/2021 18:03:17 - INFO - __main__ - Step 16473: {'lr': 0.0001999841636816508, 'samples': 527136, 'steps': 1029, 'loss/train': 3.254631519317627} -09/20/2021 18:03:18 - INFO - __main__ - Step 16474: {'lr': 0.0001999841636816508, 'samples': 527168, 'steps': 1029, 'loss/train': 4.036822319030762} -09/20/2021 18:03:19 - INFO - __main__ - Step 16475: {'lr': 0.0001999841636816508, 'samples': 527200, 'steps': 1029, 'loss/train': 3.6507070064544678} -09/20/2021 18:03:20 - INFO - __main__ - Step 16476: {'lr': 0.0001999841636816508, 'samples': 527232, 'steps': 1029, 'loss/train': 3.7061314582824707} -09/20/2021 18:03:20 - INFO - __main__ - Step 16477: {'lr': 0.0001999841636816508, 'samples': 527264, 'steps': 1029, 'loss/train': 2.828780174255371} -09/20/2021 18:03:21 - INFO - __main__ - Step 16478: {'lr': 0.0001999841636816508, 'samples': 527296, 'steps': 1029, 'loss/train': 1.7872546911239624} -09/20/2021 18:03:22 - INFO - __main__ - Step 16479: {'lr': 0.0001999841636816508, 'samples': 527328, 'steps': 1029, 'loss/train': 2.4388794898986816} -09/20/2021 18:03:23 - INFO - __main__ - Step 16480: {'lr': 0.0001999841636816508, 'samples': 527360, 'steps': 1029, 'loss/train': 3.958207845687866} -09/20/2021 18:03:24 - INFO - __main__ - Step 16481: {'lr': 0.00019998404995923434, 'samples': 527392, 'steps': 1030, 'loss/train': 3.9042084217071533} -09/20/2021 18:03:24 - INFO - __main__ - Step 16482: {'lr': 0.00019998404995923434, 'samples': 527424, 'steps': 1030, 'loss/train': 3.691758155822754} -09/20/2021 18:03:25 - INFO - __main__ - Step 16483: {'lr': 0.00019998404995923434, 'samples': 527456, 'steps': 1030, 'loss/train': 3.170401096343994} -09/20/2021 18:03:26 - INFO - __main__ - Step 16484: {'lr': 0.00019998404995923434, 'samples': 527488, 'steps': 1030, 'loss/train': 3.633188486099243} -09/20/2021 18:03:27 - INFO - __main__ - Step 16485: {'lr': 0.00019998404995923434, 'samples': 527520, 'steps': 1030, 'loss/train': 3.434131383895874} -09/20/2021 18:03:27 - INFO - __main__ - Step 16486: {'lr': 0.00019998404995923434, 'samples': 527552, 'steps': 1030, 'loss/train': 4.099277496337891} -09/20/2021 18:03:28 - INFO - __main__ - Step 16487: {'lr': 0.00019998404995923434, 'samples': 527584, 'steps': 1030, 'loss/train': 3.667020797729492} -09/20/2021 18:03:29 - INFO - __main__ - Step 16488: {'lr': 0.00019998404995923434, 'samples': 527616, 'steps': 1030, 'loss/train': 3.7777087688446045} -09/20/2021 18:03:30 - INFO - __main__ - Step 16489: {'lr': 0.00019998404995923434, 'samples': 527648, 'steps': 1030, 'loss/train': 4.093032360076904} -09/20/2021 18:03:30 - INFO - __main__ - Step 16490: {'lr': 0.00019998404995923434, 'samples': 527680, 'steps': 1030, 'loss/train': 3.9190480709075928} -09/20/2021 18:03:31 - INFO - __main__ - Step 16491: {'lr': 0.00019998404995923434, 'samples': 527712, 'steps': 1030, 'loss/train': 3.175905704498291} -09/20/2021 18:03:32 - INFO - __main__ - Step 16492: {'lr': 0.00019998404995923434, 'samples': 527744, 'steps': 1030, 'loss/train': 2.7355217933654785} -09/20/2021 18:03:33 - INFO - __main__ - Step 16493: {'lr': 0.00019998404995923434, 'samples': 527776, 'steps': 1030, 'loss/train': 4.340100288391113} -09/20/2021 18:03:33 - INFO - __main__ - Step 16494: {'lr': 0.00019998404995923434, 'samples': 527808, 'steps': 1030, 'loss/train': 4.106299877166748} -09/20/2021 18:03:34 - INFO - __main__ - Step 16495: {'lr': 0.00019998404995923434, 'samples': 527840, 'steps': 1030, 'loss/train': 4.276596546173096} -09/20/2021 18:03:35 - INFO - __main__ - Step 16496: {'lr': 0.00019998404995923434, 'samples': 527872, 'steps': 1030, 'loss/train': 4.370373249053955} -09/20/2021 18:03:36 - INFO - __main__ - Step 16497: {'lr': 0.00019998393582998318, 'samples': 527904, 'steps': 1031, 'loss/train': 3.700868606567383} -09/20/2021 18:03:36 - INFO - __main__ - Step 16498: {'lr': 0.00019998393582998318, 'samples': 527936, 'steps': 1031, 'loss/train': 4.190204620361328} -09/20/2021 18:03:37 - INFO - __main__ - Step 16499: {'lr': 0.00019998393582998318, 'samples': 527968, 'steps': 1031, 'loss/train': 3.414203643798828} -09/20/2021 18:03:38 - INFO - __main__ - Step 16500: {'lr': 0.00019998393582998318, 'samples': 528000, 'steps': 1031, 'loss/train': 3.2259905338287354} -09/20/2021 18:03:39 - INFO - __main__ - Step 16501: {'lr': 0.00019998393582998318, 'samples': 528032, 'steps': 1031, 'loss/train': 4.0448899269104} -09/20/2021 18:03:39 - INFO - __main__ - Step 16502: {'lr': 0.00019998393582998318, 'samples': 528064, 'steps': 1031, 'loss/train': 4.0846452713012695} -09/20/2021 18:03:40 - INFO - __main__ - Step 16503: {'lr': 0.00019998393582998318, 'samples': 528096, 'steps': 1031, 'loss/train': 3.0677943229675293} -09/20/2021 18:03:41 - INFO - __main__ - Step 16504: {'lr': 0.00019998393582998318, 'samples': 528128, 'steps': 1031, 'loss/train': 1.807217001914978} -09/20/2021 18:03:42 - INFO - __main__ - Step 16505: {'lr': 0.00019998393582998318, 'samples': 528160, 'steps': 1031, 'loss/train': 1.2731133699417114} -09/20/2021 18:03:42 - INFO - __main__ - Step 16506: {'lr': 0.00019998393582998318, 'samples': 528192, 'steps': 1031, 'loss/train': 1.3215466737747192} -09/20/2021 18:03:45 - INFO - __main__ - Step 16507: {'lr': 0.00019998393582998318, 'samples': 528224, 'steps': 1031, 'loss/train': 1.237776517868042} -09/20/2021 18:03:45 - INFO - __main__ - Step 16508: {'lr': 0.00019998393582998318, 'samples': 528256, 'steps': 1031, 'loss/train': 3.9223055839538574} -09/20/2021 18:03:46 - INFO - __main__ - Step 16509: {'lr': 0.00019998393582998318, 'samples': 528288, 'steps': 1031, 'loss/train': 3.194568634033203} -09/20/2021 18:03:47 - INFO - __main__ - Step 16510: {'lr': 0.00019998393582998318, 'samples': 528320, 'steps': 1031, 'loss/train': 5.500072002410889} -09/20/2021 18:03:48 - INFO - __main__ - Step 16511: {'lr': 0.00019998393582998318, 'samples': 528352, 'steps': 1031, 'loss/train': 3.4632225036621094} -09/20/2021 18:03:48 - INFO - __main__ - Step 16512: {'lr': 0.00019998393582998318, 'samples': 528384, 'steps': 1031, 'loss/train': 3.923215389251709} -09/20/2021 18:03:49 - INFO - __main__ - Step 16513: {'lr': 0.00019998382129389773, 'samples': 528416, 'steps': 1032, 'loss/train': 3.471193552017212} -09/20/2021 18:03:50 - INFO - __main__ - Step 16514: {'lr': 0.00019998382129389773, 'samples': 528448, 'steps': 1032, 'loss/train': 3.001368761062622} -09/20/2021 18:03:51 - INFO - __main__ - Step 16515: {'lr': 0.00019998382129389773, 'samples': 528480, 'steps': 1032, 'loss/train': 2.8679230213165283} -09/20/2021 18:03:51 - INFO - __main__ - Step 16516: {'lr': 0.00019998382129389773, 'samples': 528512, 'steps': 1032, 'loss/train': 4.008815765380859} -09/20/2021 18:03:52 - INFO - __main__ - Step 16517: {'lr': 0.00019998382129389773, 'samples': 528544, 'steps': 1032, 'loss/train': 3.480799436569214} -09/20/2021 18:03:53 - INFO - __main__ - Step 16518: {'lr': 0.00019998382129389773, 'samples': 528576, 'steps': 1032, 'loss/train': 3.9378585815429688} -09/20/2021 18:03:54 - INFO - __main__ - Step 16519: {'lr': 0.00019998382129389773, 'samples': 528608, 'steps': 1032, 'loss/train': 3.664881944656372} -09/20/2021 18:03:54 - INFO - __main__ - Step 16520: {'lr': 0.00019998382129389773, 'samples': 528640, 'steps': 1032, 'loss/train': 3.7621235847473145} -09/20/2021 18:03:55 - INFO - __main__ - Step 16521: {'lr': 0.00019998382129389773, 'samples': 528672, 'steps': 1032, 'loss/train': 2.7076637744903564} -09/20/2021 18:03:56 - INFO - __main__ - Step 16522: {'lr': 0.00019998382129389773, 'samples': 528704, 'steps': 1032, 'loss/train': 3.852762460708618} -09/20/2021 18:03:57 - INFO - __main__ - Step 16523: {'lr': 0.00019998382129389773, 'samples': 528736, 'steps': 1032, 'loss/train': 4.377217769622803} -09/20/2021 18:03:57 - INFO - __main__ - Step 16524: {'lr': 0.00019998382129389773, 'samples': 528768, 'steps': 1032, 'loss/train': 3.644244909286499} -09/20/2021 18:03:58 - INFO - __main__ - Step 16525: {'lr': 0.00019998382129389773, 'samples': 528800, 'steps': 1032, 'loss/train': 0.8158081769943237} -09/20/2021 18:03:59 - INFO - __main__ - Step 16526: {'lr': 0.00019998382129389773, 'samples': 528832, 'steps': 1032, 'loss/train': 0.7980261445045471} -09/20/2021 18:04:00 - INFO - __main__ - Step 16527: {'lr': 0.00019998382129389773, 'samples': 528864, 'steps': 1032, 'loss/train': 0.7420592904090881} -09/20/2021 18:04:00 - INFO - __main__ - Step 16528: {'lr': 0.00019998382129389773, 'samples': 528896, 'steps': 1032, 'loss/train': 0.615780770778656} -09/20/2021 18:04:01 - INFO - __main__ - Step 16529: {'lr': 0.00019998370635097853, 'samples': 528928, 'steps': 1033, 'loss/train': 0.7426031231880188} -09/20/2021 18:04:02 - INFO - __main__ - Step 16530: {'lr': 0.00019998370635097853, 'samples': 528960, 'steps': 1033, 'loss/train': 3.9045562744140625} -09/20/2021 18:04:03 - INFO - __main__ - Step 16531: {'lr': 0.00019998370635097853, 'samples': 528992, 'steps': 1033, 'loss/train': 3.4601895809173584} -09/20/2021 18:04:04 - INFO - __main__ - Step 16532: {'lr': 0.00019998370635097853, 'samples': 529024, 'steps': 1033, 'loss/train': 4.338687896728516} -09/20/2021 18:04:04 - INFO - __main__ - Step 16533: {'lr': 0.00019998370635097853, 'samples': 529056, 'steps': 1033, 'loss/train': 3.3891451358795166} -09/20/2021 18:04:05 - INFO - __main__ - Step 16534: {'lr': 0.00019998370635097853, 'samples': 529088, 'steps': 1033, 'loss/train': 3.7262656688690186} -09/20/2021 18:04:06 - INFO - __main__ - Step 16535: {'lr': 0.00019998370635097853, 'samples': 529120, 'steps': 1033, 'loss/train': 2.8974828720092773} -09/20/2021 18:04:07 - INFO - __main__ - Step 16536: {'lr': 0.00019998370635097853, 'samples': 529152, 'steps': 1033, 'loss/train': 3.737288475036621} -09/20/2021 18:04:08 - INFO - __main__ - Step 16537: {'lr': 0.00019998370635097853, 'samples': 529184, 'steps': 1033, 'loss/train': 4.7995195388793945} -09/20/2021 18:04:09 - INFO - __main__ - Step 16538: {'lr': 0.00019998370635097853, 'samples': 529216, 'steps': 1033, 'loss/train': 3.714038133621216} -09/20/2021 18:04:09 - INFO - __main__ - Step 16539: {'lr': 0.00019998370635097853, 'samples': 529248, 'steps': 1033, 'loss/train': 3.4763777256011963} -09/20/2021 18:04:10 - INFO - __main__ - Step 16540: {'lr': 0.00019998370635097853, 'samples': 529280, 'steps': 1033, 'loss/train': 3.50475811958313} -09/20/2021 18:04:11 - INFO - __main__ - Step 16541: {'lr': 0.00019998370635097853, 'samples': 529312, 'steps': 1033, 'loss/train': 4.080432891845703} -09/20/2021 18:04:12 - INFO - __main__ - Step 16542: {'lr': 0.00019998370635097853, 'samples': 529344, 'steps': 1033, 'loss/train': 3.6232595443725586} -09/20/2021 18:04:12 - INFO - __main__ - Step 16543: {'lr': 0.00019998370635097853, 'samples': 529376, 'steps': 1033, 'loss/train': 3.831475257873535} -09/20/2021 18:04:13 - INFO - __main__ - Step 16544: {'lr': 0.00019998370635097853, 'samples': 529408, 'steps': 1033, 'loss/train': 4.1569952964782715} -09/20/2021 18:04:14 - INFO - __main__ - Step 16545: {'lr': 0.00019998359100122603, 'samples': 529440, 'steps': 1034, 'loss/train': 3.7530670166015625} -09/20/2021 18:04:15 - INFO - __main__ - Step 16546: {'lr': 0.00019998359100122603, 'samples': 529472, 'steps': 1034, 'loss/train': 3.540478467941284} -09/20/2021 18:04:15 - INFO - __main__ - Step 16547: {'lr': 0.00019998359100122603, 'samples': 529504, 'steps': 1034, 'loss/train': 3.6593329906463623} -09/20/2021 18:04:16 - INFO - __main__ - Step 16548: {'lr': 0.00019998359100122603, 'samples': 529536, 'steps': 1034, 'loss/train': 3.656977891921997} -09/20/2021 18:04:17 - INFO - __main__ - Step 16549: {'lr': 0.00019998359100122603, 'samples': 529568, 'steps': 1034, 'loss/train': 2.3365530967712402} -09/20/2021 18:04:18 - INFO - __main__ - Step 16550: {'lr': 0.00019998359100122603, 'samples': 529600, 'steps': 1034, 'loss/train': 3.583519697189331} -09/20/2021 18:04:18 - INFO - __main__ - Step 16551: {'lr': 0.00019998359100122603, 'samples': 529632, 'steps': 1034, 'loss/train': 3.4824187755584717} -09/20/2021 18:04:19 - INFO - __main__ - Step 16552: {'lr': 0.00019998359100122603, 'samples': 529664, 'steps': 1034, 'loss/train': 2.9997940063476562} -09/20/2021 18:04:20 - INFO - __main__ - Step 16553: {'lr': 0.00019998359100122603, 'samples': 529696, 'steps': 1034, 'loss/train': 3.820903778076172} -09/20/2021 18:04:21 - INFO - __main__ - Step 16554: {'lr': 0.00019998359100122603, 'samples': 529728, 'steps': 1034, 'loss/train': 3.3477861881256104} -09/20/2021 18:04:21 - INFO - __main__ - Step 16555: {'lr': 0.00019998359100122603, 'samples': 529760, 'steps': 1034, 'loss/train': 4.328876495361328} -09/20/2021 18:04:22 - INFO - __main__ - Step 16556: {'lr': 0.00019998359100122603, 'samples': 529792, 'steps': 1034, 'loss/train': 3.2440903186798096} -09/20/2021 18:04:23 - INFO - __main__ - Step 16557: {'lr': 0.00019998359100122603, 'samples': 529824, 'steps': 1034, 'loss/train': 3.96077036857605} -09/20/2021 18:04:24 - INFO - __main__ - Step 16558: {'lr': 0.00019998359100122603, 'samples': 529856, 'steps': 1034, 'loss/train': 4.774746417999268} -09/20/2021 18:04:24 - INFO - __main__ - Step 16559: {'lr': 0.00019998359100122603, 'samples': 529888, 'steps': 1034, 'loss/train': 3.0278544425964355} -09/20/2021 18:04:25 - INFO - __main__ - Step 16560: {'lr': 0.00019998359100122603, 'samples': 529920, 'steps': 1034, 'loss/train': 3.826037883758545} -09/20/2021 18:04:26 - INFO - __main__ - Step 16561: {'lr': 0.00019998347524464064, 'samples': 529952, 'steps': 1035, 'loss/train': 3.7343928813934326} -09/20/2021 18:04:27 - INFO - __main__ - Step 16562: {'lr': 0.00019998347524464064, 'samples': 529984, 'steps': 1035, 'loss/train': 3.0122368335723877} -09/20/2021 18:04:28 - INFO - __main__ - Step 16563: {'lr': 0.00019998347524464064, 'samples': 530016, 'steps': 1035, 'loss/train': 3.8015496730804443} -09/20/2021 18:04:28 - INFO - __main__ - Step 16564: {'lr': 0.00019998347524464064, 'samples': 530048, 'steps': 1035, 'loss/train': 3.731990098953247} -09/20/2021 18:04:29 - INFO - __main__ - Step 16565: {'lr': 0.00019998347524464064, 'samples': 530080, 'steps': 1035, 'loss/train': 3.0814175605773926} -09/20/2021 18:04:30 - INFO - __main__ - Step 16566: {'lr': 0.00019998347524464064, 'samples': 530112, 'steps': 1035, 'loss/train': 4.64395809173584} -09/20/2021 18:04:31 - INFO - __main__ - Step 16567: {'lr': 0.00019998347524464064, 'samples': 530144, 'steps': 1035, 'loss/train': 2.886988878250122} -09/20/2021 18:04:32 - INFO - __main__ - Step 16568: {'lr': 0.00019998347524464064, 'samples': 530176, 'steps': 1035, 'loss/train': 3.4870622158050537} -09/20/2021 18:04:33 - INFO - __main__ - Step 16569: {'lr': 0.00019998347524464064, 'samples': 530208, 'steps': 1035, 'loss/train': 3.1984376907348633} -09/20/2021 18:04:33 - INFO - __main__ - Step 16570: {'lr': 0.00019998347524464064, 'samples': 530240, 'steps': 1035, 'loss/train': 4.359239101409912} -09/20/2021 18:04:34 - INFO - __main__ - Step 16571: {'lr': 0.00019998347524464064, 'samples': 530272, 'steps': 1035, 'loss/train': 3.8747451305389404} -09/20/2021 18:04:35 - INFO - __main__ - Step 16572: {'lr': 0.00019998347524464064, 'samples': 530304, 'steps': 1035, 'loss/train': 3.3348593711853027} -09/20/2021 18:04:36 - INFO - __main__ - Step 16573: {'lr': 0.00019998347524464064, 'samples': 530336, 'steps': 1035, 'loss/train': 3.5825202465057373} -09/20/2021 18:04:36 - INFO - __main__ - Step 16574: {'lr': 0.00019998347524464064, 'samples': 530368, 'steps': 1035, 'loss/train': 4.727541446685791} -09/20/2021 18:04:37 - INFO - __main__ - Step 16575: {'lr': 0.00019998347524464064, 'samples': 530400, 'steps': 1035, 'loss/train': 3.3586063385009766} -09/20/2021 18:04:38 - INFO - __main__ - Step 16576: {'lr': 0.00019998347524464064, 'samples': 530432, 'steps': 1035, 'loss/train': 3.2420551776885986} -09/20/2021 18:04:39 - INFO - __main__ - Step 16577: {'lr': 0.0001999833590812229, 'samples': 530464, 'steps': 1036, 'loss/train': 4.66723108291626} -09/20/2021 18:04:39 - INFO - __main__ - Step 16578: {'lr': 0.0001999833590812229, 'samples': 530496, 'steps': 1036, 'loss/train': 4.40952730178833} -09/20/2021 18:04:40 - INFO - __main__ - Step 16579: {'lr': 0.0001999833590812229, 'samples': 530528, 'steps': 1036, 'loss/train': 3.5527243614196777} -09/20/2021 18:04:41 - INFO - __main__ - Step 16580: {'lr': 0.0001999833590812229, 'samples': 530560, 'steps': 1036, 'loss/train': 3.524953603744507} -09/20/2021 18:04:42 - INFO - __main__ - Step 16581: {'lr': 0.0001999833590812229, 'samples': 530592, 'steps': 1036, 'loss/train': 4.145423412322998} -09/20/2021 18:04:42 - INFO - __main__ - Step 16582: {'lr': 0.0001999833590812229, 'samples': 530624, 'steps': 1036, 'loss/train': 3.6920180320739746} -09/20/2021 18:04:43 - INFO - __main__ - Step 16583: {'lr': 0.0001999833590812229, 'samples': 530656, 'steps': 1036, 'loss/train': 3.5184946060180664} -09/20/2021 18:04:44 - INFO - __main__ - Step 16584: {'lr': 0.0001999833590812229, 'samples': 530688, 'steps': 1036, 'loss/train': 3.0217978954315186} -09/20/2021 18:04:45 - INFO - __main__ - Step 16585: {'lr': 0.0001999833590812229, 'samples': 530720, 'steps': 1036, 'loss/train': 4.573349475860596} -09/20/2021 18:04:45 - INFO - __main__ - Step 16586: {'lr': 0.0001999833590812229, 'samples': 530752, 'steps': 1036, 'loss/train': 4.433746814727783} -09/20/2021 18:04:46 - INFO - __main__ - Step 16587: {'lr': 0.0001999833590812229, 'samples': 530784, 'steps': 1036, 'loss/train': 3.7431857585906982} -09/20/2021 18:04:47 - INFO - __main__ - Step 16588: {'lr': 0.0001999833590812229, 'samples': 530816, 'steps': 1036, 'loss/train': 2.688737630844116} -09/20/2021 18:04:48 - INFO - __main__ - Step 16589: {'lr': 0.0001999833590812229, 'samples': 530848, 'steps': 1036, 'loss/train': 3.6040337085723877} -09/20/2021 18:04:48 - INFO - __main__ - Step 16590: {'lr': 0.0001999833590812229, 'samples': 530880, 'steps': 1036, 'loss/train': 4.700527667999268} -09/20/2021 18:04:49 - INFO - __main__ - Step 16591: {'lr': 0.0001999833590812229, 'samples': 530912, 'steps': 1036, 'loss/train': 4.577286243438721} -09/20/2021 18:04:50 - INFO - __main__ - Step 16592: {'lr': 0.0001999833590812229, 'samples': 530944, 'steps': 1036, 'loss/train': 3.9559030532836914} -09/20/2021 18:04:51 - INFO - __main__ - Step 16593: {'lr': 0.00019998324251097328, 'samples': 530976, 'steps': 1037, 'loss/train': 3.2623486518859863} -09/20/2021 18:04:52 - INFO - __main__ - Step 16594: {'lr': 0.00019998324251097328, 'samples': 531008, 'steps': 1037, 'loss/train': 3.1785831451416016} -09/20/2021 18:04:52 - INFO - __main__ - Step 16595: {'lr': 0.00019998324251097328, 'samples': 531040, 'steps': 1037, 'loss/train': 3.1013360023498535} -09/20/2021 18:04:53 - INFO - __main__ - Step 16596: {'lr': 0.00019998324251097328, 'samples': 531072, 'steps': 1037, 'loss/train': 3.5455541610717773} -09/20/2021 18:04:54 - INFO - __main__ - Step 16597: {'lr': 0.00019998324251097328, 'samples': 531104, 'steps': 1037, 'loss/train': 4.103350639343262} -09/20/2021 18:04:55 - INFO - __main__ - Step 16598: {'lr': 0.00019998324251097328, 'samples': 531136, 'steps': 1037, 'loss/train': 4.860375881195068} -09/20/2021 18:04:56 - INFO - __main__ - Step 16599: {'lr': 0.00019998324251097328, 'samples': 531168, 'steps': 1037, 'loss/train': 3.932957172393799} -09/20/2021 18:04:57 - INFO - __main__ - Step 16600: {'lr': 0.00019998324251097328, 'samples': 531200, 'steps': 1037, 'loss/train': 3.8463497161865234} -09/20/2021 18:04:58 - INFO - __main__ - Step 16601: {'lr': 0.00019998324251097328, 'samples': 531232, 'steps': 1037, 'loss/train': 3.6361236572265625} -09/20/2021 18:04:58 - INFO - __main__ - Step 16602: {'lr': 0.00019998324251097328, 'samples': 531264, 'steps': 1037, 'loss/train': 3.7539119720458984} -09/20/2021 18:04:59 - INFO - __main__ - Step 16603: {'lr': 0.00019998324251097328, 'samples': 531296, 'steps': 1037, 'loss/train': 3.2256925106048584} -09/20/2021 18:05:00 - INFO - __main__ - Step 16604: {'lr': 0.00019998324251097328, 'samples': 531328, 'steps': 1037, 'loss/train': 2.9747684001922607} -09/20/2021 18:05:01 - INFO - __main__ - Step 16605: {'lr': 0.00019998324251097328, 'samples': 531360, 'steps': 1037, 'loss/train': 3.9172072410583496} -09/20/2021 18:05:01 - INFO - __main__ - Step 16606: {'lr': 0.00019998324251097328, 'samples': 531392, 'steps': 1037, 'loss/train': 3.2066810131073} -09/20/2021 18:05:02 - INFO - __main__ - Step 16607: {'lr': 0.00019998324251097328, 'samples': 531424, 'steps': 1037, 'loss/train': 4.101933002471924} -09/20/2021 18:05:03 - INFO - __main__ - Step 16608: {'lr': 0.00019998324251097328, 'samples': 531456, 'steps': 1037, 'loss/train': 3.1109230518341064} -09/20/2021 18:05:04 - INFO - __main__ - Step 16609: {'lr': 0.00019998312553389224, 'samples': 531488, 'steps': 1038, 'loss/train': 3.3259775638580322} -09/20/2021 18:05:04 - INFO - __main__ - Step 16610: {'lr': 0.00019998312553389224, 'samples': 531520, 'steps': 1038, 'loss/train': 3.6884591579437256} -09/20/2021 18:05:05 - INFO - __main__ - Step 16611: {'lr': 0.00019998312553389224, 'samples': 531552, 'steps': 1038, 'loss/train': 3.7201762199401855} -09/20/2021 18:05:06 - INFO - __main__ - Step 16612: {'lr': 0.00019998312553389224, 'samples': 531584, 'steps': 1038, 'loss/train': 3.2767391204833984} -09/20/2021 18:05:07 - INFO - __main__ - Step 16613: {'lr': 0.00019998312553389224, 'samples': 531616, 'steps': 1038, 'loss/train': 3.6445493698120117} -09/20/2021 18:05:07 - INFO - __main__ - Step 16614: {'lr': 0.00019998312553389224, 'samples': 531648, 'steps': 1038, 'loss/train': 0.8100234270095825} -09/20/2021 18:05:08 - INFO - __main__ - Step 16615: {'lr': 0.00019998312553389224, 'samples': 531680, 'steps': 1038, 'loss/train': 0.9531813263893127} -09/20/2021 18:05:09 - INFO - __main__ - Step 16616: {'lr': 0.00019998312553389224, 'samples': 531712, 'steps': 1038, 'loss/train': 0.8042693734169006} -09/20/2021 18:05:10 - INFO - __main__ - Step 16617: {'lr': 0.00019998312553389224, 'samples': 531744, 'steps': 1038, 'loss/train': 1.6012649536132812} -09/20/2021 18:05:10 - INFO - __main__ - Step 16618: {'lr': 0.00019998312553389224, 'samples': 531776, 'steps': 1038, 'loss/train': 3.3947134017944336} -09/20/2021 18:05:11 - INFO - __main__ - Step 16619: {'lr': 0.00019998312553389224, 'samples': 531808, 'steps': 1038, 'loss/train': 5.1922383308410645} -09/20/2021 18:05:12 - INFO - __main__ - Step 16620: {'lr': 0.00019998312553389224, 'samples': 531840, 'steps': 1038, 'loss/train': 4.328996181488037} -09/20/2021 18:05:13 - INFO - __main__ - Step 16621: {'lr': 0.00019998312553389224, 'samples': 531872, 'steps': 1038, 'loss/train': 4.681717872619629} -09/20/2021 18:05:13 - INFO - __main__ - Step 16622: {'lr': 0.00019998312553389224, 'samples': 531904, 'steps': 1038, 'loss/train': 4.190087795257568} -09/20/2021 18:05:14 - INFO - __main__ - Step 16623: {'lr': 0.00019998312553389224, 'samples': 531936, 'steps': 1038, 'loss/train': 4.798686981201172} -09/20/2021 18:05:15 - INFO - __main__ - Step 16624: {'lr': 0.00019998312553389224, 'samples': 531968, 'steps': 1038, 'loss/train': 3.725139856338501} -09/20/2021 18:05:16 - INFO - __main__ - Step 16625: {'lr': 0.00019998300814998024, 'samples': 532000, 'steps': 1039, 'loss/train': 3.4024953842163086} -09/20/2021 18:05:17 - INFO - __main__ - Step 16626: {'lr': 0.00019998300814998024, 'samples': 532032, 'steps': 1039, 'loss/train': 3.7391197681427} -09/20/2021 18:05:17 - INFO - __main__ - Step 16627: {'lr': 0.00019998300814998024, 'samples': 532064, 'steps': 1039, 'loss/train': 5.8079142570495605} -09/20/2021 18:05:18 - INFO - __main__ - Step 16628: {'lr': 0.00019998300814998024, 'samples': 532096, 'steps': 1039, 'loss/train': 3.5929856300354004} -09/20/2021 18:05:19 - INFO - __main__ - Step 16629: {'lr': 0.00019998300814998024, 'samples': 532128, 'steps': 1039, 'loss/train': 3.4654593467712402} -09/20/2021 18:05:20 - INFO - __main__ - Step 16630: {'lr': 0.00019998300814998024, 'samples': 532160, 'steps': 1039, 'loss/train': 3.8866968154907227} -09/20/2021 18:05:20 - INFO - __main__ - Step 16631: {'lr': 0.00019998300814998024, 'samples': 532192, 'steps': 1039, 'loss/train': 4.476890563964844} -09/20/2021 18:05:22 - INFO - __main__ - Step 16632: {'lr': 0.00019998300814998024, 'samples': 532224, 'steps': 1039, 'loss/train': 3.5627031326293945} -09/20/2021 18:05:22 - INFO - __main__ - Step 16633: {'lr': 0.00019998300814998024, 'samples': 532256, 'steps': 1039, 'loss/train': 4.154208183288574} -09/20/2021 18:05:23 - INFO - __main__ - Step 16634: {'lr': 0.00019998300814998024, 'samples': 532288, 'steps': 1039, 'loss/train': 3.3633663654327393} -09/20/2021 18:05:24 - INFO - __main__ - Step 16635: {'lr': 0.00019998300814998024, 'samples': 532320, 'steps': 1039, 'loss/train': 3.692441940307617} -09/20/2021 18:05:25 - INFO - __main__ - Step 16636: {'lr': 0.00019998300814998024, 'samples': 532352, 'steps': 1039, 'loss/train': 3.3315846920013428} -09/20/2021 18:05:25 - INFO - __main__ - Step 16637: {'lr': 0.00019998300814998024, 'samples': 532384, 'steps': 1039, 'loss/train': 3.4026997089385986} -09/20/2021 18:05:26 - INFO - __main__ - Step 16638: {'lr': 0.00019998300814998024, 'samples': 532416, 'steps': 1039, 'loss/train': 4.636527061462402} -09/20/2021 18:05:27 - INFO - __main__ - Step 16639: {'lr': 0.00019998300814998024, 'samples': 532448, 'steps': 1039, 'loss/train': 5.6681928634643555} -09/20/2021 18:05:28 - INFO - __main__ - Step 16640: {'lr': 0.00019998300814998024, 'samples': 532480, 'steps': 1039, 'loss/train': 4.024558067321777} -09/20/2021 18:05:29 - INFO - __main__ - Step 16641: {'lr': 0.00019998289035923775, 'samples': 532512, 'steps': 1040, 'loss/train': 3.651212215423584} -09/20/2021 18:05:29 - INFO - __main__ - Step 16642: {'lr': 0.00019998289035923775, 'samples': 532544, 'steps': 1040, 'loss/train': 2.8716917037963867} -09/20/2021 18:05:30 - INFO - __main__ - Step 16643: {'lr': 0.00019998289035923775, 'samples': 532576, 'steps': 1040, 'loss/train': 1.5371826887130737} -09/20/2021 18:05:31 - INFO - __main__ - Step 16644: {'lr': 0.00019998289035923775, 'samples': 532608, 'steps': 1040, 'loss/train': 1.1693741083145142} -09/20/2021 18:05:32 - INFO - __main__ - Step 16645: {'lr': 0.00019998289035923775, 'samples': 532640, 'steps': 1040, 'loss/train': 3.62518572807312} -09/20/2021 18:05:32 - INFO - __main__ - Step 16646: {'lr': 0.00019998289035923775, 'samples': 532672, 'steps': 1040, 'loss/train': 3.3450353145599365} -09/20/2021 18:05:33 - INFO - __main__ - Step 16647: {'lr': 0.00019998289035923775, 'samples': 532704, 'steps': 1040, 'loss/train': 5.003314971923828} -09/20/2021 18:05:34 - INFO - __main__ - Step 16648: {'lr': 0.00019998289035923775, 'samples': 532736, 'steps': 1040, 'loss/train': 3.443206787109375} -09/20/2021 18:05:35 - INFO - __main__ - Step 16649: {'lr': 0.00019998289035923775, 'samples': 532768, 'steps': 1040, 'loss/train': 2.5930163860321045} -09/20/2021 18:05:35 - INFO - __main__ - Step 16650: {'lr': 0.00019998289035923775, 'samples': 532800, 'steps': 1040, 'loss/train': 3.523033380508423} -09/20/2021 18:05:36 - INFO - __main__ - Step 16651: {'lr': 0.00019998289035923775, 'samples': 532832, 'steps': 1040, 'loss/train': 4.033337116241455} -09/20/2021 18:05:37 - INFO - __main__ - Step 16652: {'lr': 0.00019998289035923775, 'samples': 532864, 'steps': 1040, 'loss/train': 3.6043691635131836} -09/20/2021 18:05:38 - INFO - __main__ - Step 16653: {'lr': 0.00019998289035923775, 'samples': 532896, 'steps': 1040, 'loss/train': 5.015673637390137} -09/20/2021 18:05:38 - INFO - __main__ - Step 16654: {'lr': 0.00019998289035923775, 'samples': 532928, 'steps': 1040, 'loss/train': 3.1545791625976562} -09/20/2021 18:05:39 - INFO - __main__ - Step 16655: {'lr': 0.00019998289035923775, 'samples': 532960, 'steps': 1040, 'loss/train': 3.677264451980591} -09/20/2021 18:05:40 - INFO - __main__ - Step 16656: {'lr': 0.00019998289035923775, 'samples': 532992, 'steps': 1040, 'loss/train': 3.2735211849212646} -09/20/2021 18:05:41 - INFO - __main__ - Step 16657: {'lr': 0.00019998277216166525, 'samples': 533024, 'steps': 1041, 'loss/train': 2.4100589752197266} -09/20/2021 18:05:41 - INFO - __main__ - Step 16658: {'lr': 0.00019998277216166525, 'samples': 533056, 'steps': 1041, 'loss/train': 4.246482849121094} -09/20/2021 18:05:42 - INFO - __main__ - Step 16659: {'lr': 0.00019998277216166525, 'samples': 533088, 'steps': 1041, 'loss/train': 3.9572973251342773} -09/20/2021 18:05:43 - INFO - __main__ - Step 16660: {'lr': 0.00019998277216166525, 'samples': 533120, 'steps': 1041, 'loss/train': 2.9618775844573975} -09/20/2021 18:05:44 - INFO - __main__ - Step 16661: {'lr': 0.00019998277216166525, 'samples': 533152, 'steps': 1041, 'loss/train': 3.5377328395843506} -09/20/2021 18:05:45 - INFO - __main__ - Step 16662: {'lr': 0.00019998277216166525, 'samples': 533184, 'steps': 1041, 'loss/train': 3.61527156829834} -09/20/2021 18:05:46 - INFO - __main__ - Step 16663: {'lr': 0.00019998277216166525, 'samples': 533216, 'steps': 1041, 'loss/train': 3.5853025913238525} -09/20/2021 18:05:46 - INFO - __main__ - Step 16664: {'lr': 0.00019998277216166525, 'samples': 533248, 'steps': 1041, 'loss/train': 4.283520221710205} -09/20/2021 18:05:47 - INFO - __main__ - Step 16665: {'lr': 0.00019998277216166525, 'samples': 533280, 'steps': 1041, 'loss/train': 3.293860912322998} -09/20/2021 18:05:48 - INFO - __main__ - Step 16666: {'lr': 0.00019998277216166525, 'samples': 533312, 'steps': 1041, 'loss/train': 3.958580255508423} -09/20/2021 18:05:49 - INFO - __main__ - Step 16667: {'lr': 0.00019998277216166525, 'samples': 533344, 'steps': 1041, 'loss/train': 3.4716336727142334} -09/20/2021 18:05:49 - INFO - __main__ - Step 16668: {'lr': 0.00019998277216166525, 'samples': 533376, 'steps': 1041, 'loss/train': 3.1465837955474854} -09/20/2021 18:05:50 - INFO - __main__ - Step 16669: {'lr': 0.00019998277216166525, 'samples': 533408, 'steps': 1041, 'loss/train': 4.16018533706665} -09/20/2021 18:05:51 - INFO - __main__ - Step 16670: {'lr': 0.00019998277216166525, 'samples': 533440, 'steps': 1041, 'loss/train': 3.695578098297119} -09/20/2021 18:05:52 - INFO - __main__ - Step 16671: {'lr': 0.00019998277216166525, 'samples': 533472, 'steps': 1041, 'loss/train': 1.2696036100387573} -09/20/2021 18:05:52 - INFO - __main__ - Step 16672: {'lr': 0.00019998277216166525, 'samples': 533504, 'steps': 1041, 'loss/train': 0.6227737069129944} -09/20/2021 18:05:53 - INFO - __main__ - Step 16673: {'lr': 0.0001999826535572633, 'samples': 533536, 'steps': 1042, 'loss/train': 0.8833807706832886} -09/20/2021 18:05:54 - INFO - __main__ - Step 16674: {'lr': 0.0001999826535572633, 'samples': 533568, 'steps': 1042, 'loss/train': 4.090945720672607} -09/20/2021 18:05:55 - INFO - __main__ - Step 16675: {'lr': 0.0001999826535572633, 'samples': 533600, 'steps': 1042, 'loss/train': 2.5054609775543213} -09/20/2021 18:05:56 - INFO - __main__ - Step 16676: {'lr': 0.0001999826535572633, 'samples': 533632, 'steps': 1042, 'loss/train': 2.845505475997925} -09/20/2021 18:05:56 - INFO - __main__ - Step 16677: {'lr': 0.0001999826535572633, 'samples': 533664, 'steps': 1042, 'loss/train': 5.936513900756836} -09/20/2021 18:05:57 - INFO - __main__ - Step 16678: {'lr': 0.0001999826535572633, 'samples': 533696, 'steps': 1042, 'loss/train': 4.064140319824219} -09/20/2021 18:05:58 - INFO - __main__ - Step 16679: {'lr': 0.0001999826535572633, 'samples': 533728, 'steps': 1042, 'loss/train': 3.350720167160034} -09/20/2021 18:05:59 - INFO - __main__ - Step 16680: {'lr': 0.0001999826535572633, 'samples': 533760, 'steps': 1042, 'loss/train': 3.491398334503174} -09/20/2021 18:05:59 - INFO - __main__ - Step 16681: {'lr': 0.0001999826535572633, 'samples': 533792, 'steps': 1042, 'loss/train': 2.787506103515625} -09/20/2021 18:06:00 - INFO - __main__ - Step 16682: {'lr': 0.0001999826535572633, 'samples': 533824, 'steps': 1042, 'loss/train': 3.1041507720947266} -09/20/2021 18:06:01 - INFO - __main__ - Step 16683: {'lr': 0.0001999826535572633, 'samples': 533856, 'steps': 1042, 'loss/train': 3.225217342376709} -09/20/2021 18:06:02 - INFO - __main__ - Step 16684: {'lr': 0.0001999826535572633, 'samples': 533888, 'steps': 1042, 'loss/train': 3.7715957164764404} -09/20/2021 18:06:02 - INFO - __main__ - Step 16685: {'lr': 0.0001999826535572633, 'samples': 533920, 'steps': 1042, 'loss/train': 2.7826642990112305} -09/20/2021 18:06:03 - INFO - __main__ - Step 16686: {'lr': 0.0001999826535572633, 'samples': 533952, 'steps': 1042, 'loss/train': 3.3865559101104736} -09/20/2021 18:06:04 - INFO - __main__ - Step 16687: {'lr': 0.0001999826535572633, 'samples': 533984, 'steps': 1042, 'loss/train': 3.6230132579803467} -09/20/2021 18:06:05 - INFO - __main__ - Step 16688: {'lr': 0.0001999826535572633, 'samples': 534016, 'steps': 1042, 'loss/train': 4.331969738006592} -09/20/2021 18:06:06 - INFO - __main__ - Step 16689: {'lr': 0.00019998253454603227, 'samples': 534048, 'steps': 1043, 'loss/train': 1.6730564832687378} -09/20/2021 18:06:06 - INFO - __main__ - Step 16690: {'lr': 0.00019998253454603227, 'samples': 534080, 'steps': 1043, 'loss/train': 3.6857972145080566} -09/20/2021 18:06:07 - INFO - __main__ - Step 16691: {'lr': 0.00019998253454603227, 'samples': 534112, 'steps': 1043, 'loss/train': 4.517242908477783} -09/20/2021 18:06:08 - INFO - __main__ - Step 16692: {'lr': 0.00019998253454603227, 'samples': 534144, 'steps': 1043, 'loss/train': 4.143437385559082} -09/20/2021 18:06:09 - INFO - __main__ - Step 16693: {'lr': 0.00019998253454603227, 'samples': 534176, 'steps': 1043, 'loss/train': 2.9003372192382812} -09/20/2021 18:06:10 - INFO - __main__ - Step 16694: {'lr': 0.00019998253454603227, 'samples': 534208, 'steps': 1043, 'loss/train': 3.5045042037963867} -09/20/2021 18:06:11 - INFO - __main__ - Step 16695: {'lr': 0.00019998253454603227, 'samples': 534240, 'steps': 1043, 'loss/train': 3.939918279647827} -09/20/2021 18:06:11 - INFO - __main__ - Step 16696: {'lr': 0.00019998253454603227, 'samples': 534272, 'steps': 1043, 'loss/train': 3.5052075386047363} -09/20/2021 18:06:12 - INFO - __main__ - Step 16697: {'lr': 0.00019998253454603227, 'samples': 534304, 'steps': 1043, 'loss/train': 3.4959557056427} -09/20/2021 18:06:13 - INFO - __main__ - Step 16698: {'lr': 0.00019998253454603227, 'samples': 534336, 'steps': 1043, 'loss/train': 2.5918335914611816} -09/20/2021 18:06:14 - INFO - __main__ - Step 16699: {'lr': 0.00019998253454603227, 'samples': 534368, 'steps': 1043, 'loss/train': 3.6683273315429688} -09/20/2021 18:06:14 - INFO - __main__ - Step 16700: {'lr': 0.00019998253454603227, 'samples': 534400, 'steps': 1043, 'loss/train': 3.5288431644439697} -09/20/2021 18:06:15 - INFO - __main__ - Step 16701: {'lr': 0.00019998253454603227, 'samples': 534432, 'steps': 1043, 'loss/train': 4.774542331695557} -09/20/2021 18:06:16 - INFO - __main__ - Step 16702: {'lr': 0.00019998253454603227, 'samples': 534464, 'steps': 1043, 'loss/train': 3.024761438369751} -09/20/2021 18:06:17 - INFO - __main__ - Step 16703: {'lr': 0.00019998253454603227, 'samples': 534496, 'steps': 1043, 'loss/train': 3.2792649269104004} -09/20/2021 18:06:17 - INFO - __main__ - Step 16704: {'lr': 0.00019998253454603227, 'samples': 534528, 'steps': 1043, 'loss/train': 4.079090595245361} -09/20/2021 18:06:18 - INFO - __main__ - Step 16705: {'lr': 0.0001999824151279727, 'samples': 534560, 'steps': 1044, 'loss/train': 4.431405544281006} -09/20/2021 18:06:19 - INFO - __main__ - Step 16706: {'lr': 0.0001999824151279727, 'samples': 534592, 'steps': 1044, 'loss/train': 3.932323932647705} -09/20/2021 18:06:20 - INFO - __main__ - Step 16707: {'lr': 0.0001999824151279727, 'samples': 534624, 'steps': 1044, 'loss/train': 3.1898000240325928} -09/20/2021 18:06:20 - INFO - __main__ - Step 16708: {'lr': 0.0001999824151279727, 'samples': 534656, 'steps': 1044, 'loss/train': 3.788959503173828} -09/20/2021 18:06:21 - INFO - __main__ - Step 16709: {'lr': 0.0001999824151279727, 'samples': 534688, 'steps': 1044, 'loss/train': 3.8991785049438477} -09/20/2021 18:06:22 - INFO - __main__ - Step 16710: {'lr': 0.0001999824151279727, 'samples': 534720, 'steps': 1044, 'loss/train': 3.39921498298645} -09/20/2021 18:06:23 - INFO - __main__ - Step 16711: {'lr': 0.0001999824151279727, 'samples': 534752, 'steps': 1044, 'loss/train': 3.4678637981414795} -09/20/2021 18:06:23 - INFO - __main__ - Step 16712: {'lr': 0.0001999824151279727, 'samples': 534784, 'steps': 1044, 'loss/train': 2.690793037414551} -09/20/2021 18:06:24 - INFO - __main__ - Step 16713: {'lr': 0.0001999824151279727, 'samples': 534816, 'steps': 1044, 'loss/train': 3.3082213401794434} -09/20/2021 18:06:25 - INFO - __main__ - Step 16714: {'lr': 0.0001999824151279727, 'samples': 534848, 'steps': 1044, 'loss/train': 3.8465607166290283} -09/20/2021 18:06:26 - INFO - __main__ - Step 16715: {'lr': 0.0001999824151279727, 'samples': 534880, 'steps': 1044, 'loss/train': 3.630502223968506} -09/20/2021 18:06:26 - INFO - __main__ - Step 16716: {'lr': 0.0001999824151279727, 'samples': 534912, 'steps': 1044, 'loss/train': 4.15920352935791} -09/20/2021 18:06:27 - INFO - __main__ - Step 16717: {'lr': 0.0001999824151279727, 'samples': 534944, 'steps': 1044, 'loss/train': 3.9471073150634766} -09/20/2021 18:06:28 - INFO - __main__ - Step 16718: {'lr': 0.0001999824151279727, 'samples': 534976, 'steps': 1044, 'loss/train': 4.795300006866455} -09/20/2021 18:06:29 - INFO - __main__ - Step 16719: {'lr': 0.0001999824151279727, 'samples': 535008, 'steps': 1044, 'loss/train': 3.729912757873535} -09/20/2021 18:06:29 - INFO - __main__ - Step 16720: {'lr': 0.0001999824151279727, 'samples': 535040, 'steps': 1044, 'loss/train': 4.993076324462891} -09/20/2021 18:06:30 - INFO - __main__ - Step 16721: {'lr': 0.00019998229530308507, 'samples': 535072, 'steps': 1045, 'loss/train': 3.0749881267547607} -09/20/2021 18:06:31 - INFO - __main__ - Step 16722: {'lr': 0.00019998229530308507, 'samples': 535104, 'steps': 1045, 'loss/train': 3.7621097564697266} -09/20/2021 18:06:32 - INFO - __main__ - Step 16723: {'lr': 0.00019998229530308507, 'samples': 535136, 'steps': 1045, 'loss/train': 3.3572170734405518} -09/20/2021 18:06:33 - INFO - __main__ - Step 16724: {'lr': 0.00019998229530308507, 'samples': 535168, 'steps': 1045, 'loss/train': 3.0984435081481934} -09/20/2021 18:06:34 - INFO - __main__ - Step 16725: {'lr': 0.00019998229530308507, 'samples': 535200, 'steps': 1045, 'loss/train': 4.082749843597412} -09/20/2021 18:06:35 - INFO - __main__ - Step 16726: {'lr': 0.00019998229530308507, 'samples': 535232, 'steps': 1045, 'loss/train': 3.8843815326690674} -09/20/2021 18:06:35 - INFO - __main__ - Step 16727: {'lr': 0.00019998229530308507, 'samples': 535264, 'steps': 1045, 'loss/train': 1.0940040349960327} -09/20/2021 18:06:36 - INFO - __main__ - Step 16728: {'lr': 0.00019998229530308507, 'samples': 535296, 'steps': 1045, 'loss/train': 3.1853253841400146} -09/20/2021 18:06:37 - INFO - __main__ - Step 16729: {'lr': 0.00019998229530308507, 'samples': 535328, 'steps': 1045, 'loss/train': 4.682921409606934} -09/20/2021 18:06:38 - INFO - __main__ - Step 16730: {'lr': 0.00019998229530308507, 'samples': 535360, 'steps': 1045, 'loss/train': 3.0535714626312256} -09/20/2021 18:06:38 - INFO - __main__ - Step 16731: {'lr': 0.00019998229530308507, 'samples': 535392, 'steps': 1045, 'loss/train': 3.2208175659179688} -09/20/2021 18:06:39 - INFO - __main__ - Step 16732: {'lr': 0.00019998229530308507, 'samples': 535424, 'steps': 1045, 'loss/train': 3.994400978088379} -09/20/2021 18:06:40 - INFO - __main__ - Step 16733: {'lr': 0.00019998229530308507, 'samples': 535456, 'steps': 1045, 'loss/train': 2.91633939743042} -09/20/2021 18:06:41 - INFO - __main__ - Step 16734: {'lr': 0.00019998229530308507, 'samples': 535488, 'steps': 1045, 'loss/train': 3.2458748817443848} -09/20/2021 18:06:41 - INFO - __main__ - Step 16735: {'lr': 0.00019998229530308507, 'samples': 535520, 'steps': 1045, 'loss/train': 3.3968429565429688} -09/20/2021 18:06:42 - INFO - __main__ - Step 16736: {'lr': 0.00019998229530308507, 'samples': 535552, 'steps': 1045, 'loss/train': 3.071950674057007} -09/20/2021 18:06:43 - INFO - __main__ - Step 16737: {'lr': 0.00019998217507136991, 'samples': 535584, 'steps': 1046, 'loss/train': 3.5875046253204346} -09/20/2021 18:06:44 - INFO - __main__ - Step 16738: {'lr': 0.00019998217507136991, 'samples': 535616, 'steps': 1046, 'loss/train': 2.5334420204162598} -09/20/2021 18:06:44 - INFO - __main__ - Step 16739: {'lr': 0.00019998217507136991, 'samples': 535648, 'steps': 1046, 'loss/train': 3.599472761154175} -09/20/2021 18:06:45 - INFO - __main__ - Step 16740: {'lr': 0.00019998217507136991, 'samples': 535680, 'steps': 1046, 'loss/train': 5.043292999267578} -09/20/2021 18:06:46 - INFO - __main__ - Step 16741: {'lr': 0.00019998217507136991, 'samples': 535712, 'steps': 1046, 'loss/train': 3.3073647022247314} -09/20/2021 18:06:47 - INFO - __main__ - Step 16742: {'lr': 0.00019998217507136991, 'samples': 535744, 'steps': 1046, 'loss/train': 2.894519090652466} -09/20/2021 18:06:47 - INFO - __main__ - Step 16743: {'lr': 0.00019998217507136991, 'samples': 535776, 'steps': 1046, 'loss/train': 3.3407039642333984} -09/20/2021 18:06:48 - INFO - __main__ - Step 16744: {'lr': 0.00019998217507136991, 'samples': 535808, 'steps': 1046, 'loss/train': 2.3100175857543945} -09/20/2021 18:06:49 - INFO - __main__ - Step 16745: {'lr': 0.00019998217507136991, 'samples': 535840, 'steps': 1046, 'loss/train': 2.7651073932647705} -09/20/2021 18:06:50 - INFO - __main__ - Step 16746: {'lr': 0.00019998217507136991, 'samples': 535872, 'steps': 1046, 'loss/train': 4.825153350830078} -09/20/2021 18:06:50 - INFO - __main__ - Step 16747: {'lr': 0.00019998217507136991, 'samples': 535904, 'steps': 1046, 'loss/train': 4.159490585327148} -09/20/2021 18:06:51 - INFO - __main__ - Step 16748: {'lr': 0.00019998217507136991, 'samples': 535936, 'steps': 1046, 'loss/train': 3.5899600982666016} -09/20/2021 18:06:52 - INFO - __main__ - Step 16749: {'lr': 0.00019998217507136991, 'samples': 535968, 'steps': 1046, 'loss/train': 1.2981040477752686} -09/20/2021 18:06:53 - INFO - __main__ - Step 16750: {'lr': 0.00019998217507136991, 'samples': 536000, 'steps': 1046, 'loss/train': 3.7502951622009277} -09/20/2021 18:06:53 - INFO - __main__ - Step 16751: {'lr': 0.00019998217507136991, 'samples': 536032, 'steps': 1046, 'loss/train': 2.9190614223480225} -09/20/2021 18:06:54 - INFO - __main__ - Step 16752: {'lr': 0.00019998217507136991, 'samples': 536064, 'steps': 1046, 'loss/train': 3.2573013305664062} -09/20/2021 18:06:55 - INFO - __main__ - Step 16753: {'lr': 0.00019998205443282763, 'samples': 536096, 'steps': 1047, 'loss/train': 3.879910707473755} -09/20/2021 18:06:56 - INFO - __main__ - Step 16754: {'lr': 0.00019998205443282763, 'samples': 536128, 'steps': 1047, 'loss/train': 3.5953664779663086} -09/20/2021 18:06:57 - INFO - __main__ - Step 16755: {'lr': 0.00019998205443282763, 'samples': 536160, 'steps': 1047, 'loss/train': 2.758835554122925} -09/20/2021 18:06:58 - INFO - __main__ - Step 16756: {'lr': 0.00019998205443282763, 'samples': 536192, 'steps': 1047, 'loss/train': 4.240242958068848} -09/20/2021 18:06:59 - INFO - __main__ - Step 16757: {'lr': 0.00019998205443282763, 'samples': 536224, 'steps': 1047, 'loss/train': 3.6662187576293945} -09/20/2021 18:06:59 - INFO - __main__ - Step 16758: {'lr': 0.00019998205443282763, 'samples': 536256, 'steps': 1047, 'loss/train': 4.212280750274658} -09/20/2021 18:07:00 - INFO - __main__ - Step 16759: {'lr': 0.00019998205443282763, 'samples': 536288, 'steps': 1047, 'loss/train': 2.489072322845459} -09/20/2021 18:07:01 - INFO - __main__ - Step 16760: {'lr': 0.00019998205443282763, 'samples': 536320, 'steps': 1047, 'loss/train': 3.421570062637329} -09/20/2021 18:07:02 - INFO - __main__ - Step 16761: {'lr': 0.00019998205443282763, 'samples': 536352, 'steps': 1047, 'loss/train': 3.643789052963257} -09/20/2021 18:07:02 - INFO - __main__ - Step 16762: {'lr': 0.00019998205443282763, 'samples': 536384, 'steps': 1047, 'loss/train': 2.792843818664551} -09/20/2021 18:07:03 - INFO - __main__ - Step 16763: {'lr': 0.00019998205443282763, 'samples': 536416, 'steps': 1047, 'loss/train': 4.047513961791992} -09/20/2021 18:07:04 - INFO - __main__ - Step 16764: {'lr': 0.00019998205443282763, 'samples': 536448, 'steps': 1047, 'loss/train': 4.205016136169434} -09/20/2021 18:07:05 - INFO - __main__ - Step 16765: {'lr': 0.00019998205443282763, 'samples': 536480, 'steps': 1047, 'loss/train': 2.671858310699463} -09/20/2021 18:07:05 - INFO - __main__ - Step 16766: {'lr': 0.00019998205443282763, 'samples': 536512, 'steps': 1047, 'loss/train': 3.928185224533081} -09/20/2021 18:07:06 - INFO - __main__ - Step 16767: {'lr': 0.00019998205443282763, 'samples': 536544, 'steps': 1047, 'loss/train': 3.631340980529785} -09/20/2021 18:07:07 - INFO - __main__ - Step 16768: {'lr': 0.00019998205443282763, 'samples': 536576, 'steps': 1047, 'loss/train': 3.6760854721069336} -09/20/2021 18:07:08 - INFO - __main__ - Step 16769: {'lr': 0.00019998193338745878, 'samples': 536608, 'steps': 1048, 'loss/train': 4.380958557128906} -09/20/2021 18:07:08 - INFO - __main__ - Step 16770: {'lr': 0.00019998193338745878, 'samples': 536640, 'steps': 1048, 'loss/train': 3.254359722137451} -09/20/2021 18:07:09 - INFO - __main__ - Step 16771: {'lr': 0.00019998193338745878, 'samples': 536672, 'steps': 1048, 'loss/train': 3.3833577632904053} -09/20/2021 18:07:10 - INFO - __main__ - Step 16772: {'lr': 0.00019998193338745878, 'samples': 536704, 'steps': 1048, 'loss/train': 3.217024087905884} -09/20/2021 18:07:11 - INFO - __main__ - Step 16773: {'lr': 0.00019998193338745878, 'samples': 536736, 'steps': 1048, 'loss/train': 4.260434627532959} -09/20/2021 18:07:11 - INFO - __main__ - Step 16774: {'lr': 0.00019998193338745878, 'samples': 536768, 'steps': 1048, 'loss/train': 4.555595874786377} -09/20/2021 18:07:12 - INFO - __main__ - Step 16775: {'lr': 0.00019998193338745878, 'samples': 536800, 'steps': 1048, 'loss/train': 3.912597179412842} -09/20/2021 18:07:13 - INFO - __main__ - Step 16776: {'lr': 0.00019998193338745878, 'samples': 536832, 'steps': 1048, 'loss/train': 3.7169015407562256} -09/20/2021 18:07:14 - INFO - __main__ - Step 16777: {'lr': 0.00019998193338745878, 'samples': 536864, 'steps': 1048, 'loss/train': 3.221226453781128} -09/20/2021 18:07:14 - INFO - __main__ - Step 16778: {'lr': 0.00019998193338745878, 'samples': 536896, 'steps': 1048, 'loss/train': 3.2712316513061523} -09/20/2021 18:07:15 - INFO - __main__ - Step 16779: {'lr': 0.00019998193338745878, 'samples': 536928, 'steps': 1048, 'loss/train': 4.090991020202637} -09/20/2021 18:07:16 - INFO - __main__ - Step 16780: {'lr': 0.00019998193338745878, 'samples': 536960, 'steps': 1048, 'loss/train': 2.955341339111328} -09/20/2021 18:07:17 - INFO - __main__ - Step 16781: {'lr': 0.00019998193338745878, 'samples': 536992, 'steps': 1048, 'loss/train': 4.00939416885376} -09/20/2021 18:07:17 - INFO - __main__ - Step 16782: {'lr': 0.00019998193338745878, 'samples': 537024, 'steps': 1048, 'loss/train': 4.460675239562988} -09/20/2021 18:07:18 - INFO - __main__ - Step 16783: {'lr': 0.00019998193338745878, 'samples': 537056, 'steps': 1048, 'loss/train': 4.545979976654053} -09/20/2021 18:07:19 - INFO - __main__ - Step 16784: {'lr': 0.00019998193338745878, 'samples': 537088, 'steps': 1048, 'loss/train': 4.196645259857178} -09/20/2021 18:07:20 - INFO - __main__ - Step 16785: {'lr': 0.0001999818119352638, 'samples': 537120, 'steps': 1049, 'loss/train': 3.3064708709716797} -09/20/2021 18:07:21 - INFO - __main__ - Step 16786: {'lr': 0.0001999818119352638, 'samples': 537152, 'steps': 1049, 'loss/train': 3.7998836040496826} -09/20/2021 18:07:22 - INFO - __main__ - Step 16787: {'lr': 0.0001999818119352638, 'samples': 537184, 'steps': 1049, 'loss/train': 3.1801328659057617} -09/20/2021 18:07:23 - INFO - __main__ - Step 16788: {'lr': 0.0001999818119352638, 'samples': 537216, 'steps': 1049, 'loss/train': 4.33720588684082} -09/20/2021 18:07:23 - INFO - __main__ - Step 16789: {'lr': 0.0001999818119352638, 'samples': 537248, 'steps': 1049, 'loss/train': 3.2251155376434326} -09/20/2021 18:07:24 - INFO - __main__ - Step 16790: {'lr': 0.0001999818119352638, 'samples': 537280, 'steps': 1049, 'loss/train': 4.281871318817139} -09/20/2021 18:07:25 - INFO - __main__ - Step 16791: {'lr': 0.0001999818119352638, 'samples': 537312, 'steps': 1049, 'loss/train': 3.8183252811431885} -09/20/2021 18:07:26 - INFO - __main__ - Step 16792: {'lr': 0.0001999818119352638, 'samples': 537344, 'steps': 1049, 'loss/train': 4.890797138214111} -09/20/2021 18:07:26 - INFO - __main__ - Step 16793: {'lr': 0.0001999818119352638, 'samples': 537376, 'steps': 1049, 'loss/train': 4.084529876708984} -09/20/2021 18:07:27 - INFO - __main__ - Step 16794: {'lr': 0.0001999818119352638, 'samples': 537408, 'steps': 1049, 'loss/train': 5.218423366546631} -09/20/2021 18:07:28 - INFO - __main__ - Step 16795: {'lr': 0.0001999818119352638, 'samples': 537440, 'steps': 1049, 'loss/train': 3.291177988052368} -09/20/2021 18:07:29 - INFO - __main__ - Step 16796: {'lr': 0.0001999818119352638, 'samples': 537472, 'steps': 1049, 'loss/train': 3.215453624725342} -09/20/2021 18:07:29 - INFO - __main__ - Step 16797: {'lr': 0.0001999818119352638, 'samples': 537504, 'steps': 1049, 'loss/train': 3.392221689224243} -09/20/2021 18:07:30 - INFO - __main__ - Step 16798: {'lr': 0.0001999818119352638, 'samples': 537536, 'steps': 1049, 'loss/train': 3.5328409671783447} -09/20/2021 18:07:31 - INFO - __main__ - Step 16799: {'lr': 0.0001999818119352638, 'samples': 537568, 'steps': 1049, 'loss/train': 3.921236753463745} -09/20/2021 18:07:32 - INFO - __main__ - Step 16800: {'lr': 0.0001999818119352638, 'samples': 537600, 'steps': 1049, 'loss/train': 3.335270881652832} -09/20/2021 18:07:33 - INFO - __main__ - Step 16801: {'lr': 0.00019998169007624323, 'samples': 537632, 'steps': 1050, 'loss/train': 2.969036340713501} -09/20/2021 18:07:33 - INFO - __main__ - Step 16802: {'lr': 0.00019998169007624323, 'samples': 537664, 'steps': 1050, 'loss/train': 3.9002559185028076} -09/20/2021 18:07:34 - INFO - __main__ - Step 16803: {'lr': 0.00019998169007624323, 'samples': 537696, 'steps': 1050, 'loss/train': 3.0262908935546875} -09/20/2021 18:07:35 - INFO - __main__ - Step 16804: {'lr': 0.00019998169007624323, 'samples': 537728, 'steps': 1050, 'loss/train': 3.9211809635162354} -09/20/2021 18:07:36 - INFO - __main__ - Step 16805: {'lr': 0.00019998169007624323, 'samples': 537760, 'steps': 1050, 'loss/train': 2.0337109565734863} -09/20/2021 18:07:36 - INFO - __main__ - Step 16806: {'lr': 0.00019998169007624323, 'samples': 537792, 'steps': 1050, 'loss/train': 3.820755958557129} -09/20/2021 18:07:37 - INFO - __main__ - Step 16807: {'lr': 0.00019998169007624323, 'samples': 537824, 'steps': 1050, 'loss/train': 3.3865489959716797} -09/20/2021 18:07:38 - INFO - __main__ - Step 16808: {'lr': 0.00019998169007624323, 'samples': 537856, 'steps': 1050, 'loss/train': 3.2281980514526367} -09/20/2021 18:07:39 - INFO - __main__ - Step 16809: {'lr': 0.00019998169007624323, 'samples': 537888, 'steps': 1050, 'loss/train': 4.406471252441406} -09/20/2021 18:07:39 - INFO - __main__ - Step 16810: {'lr': 0.00019998169007624323, 'samples': 537920, 'steps': 1050, 'loss/train': 4.266855716705322} -09/20/2021 18:07:40 - INFO - __main__ - Step 16811: {'lr': 0.00019998169007624323, 'samples': 537952, 'steps': 1050, 'loss/train': 3.340578556060791} -09/20/2021 18:07:41 - INFO - __main__ - Step 16812: {'lr': 0.00019998169007624323, 'samples': 537984, 'steps': 1050, 'loss/train': 4.529384613037109} -09/20/2021 18:07:42 - INFO - __main__ - Step 16813: {'lr': 0.00019998169007624323, 'samples': 538016, 'steps': 1050, 'loss/train': 3.6432480812072754} -09/20/2021 18:07:42 - INFO - __main__ - Step 16814: {'lr': 0.00019998169007624323, 'samples': 538048, 'steps': 1050, 'loss/train': 2.8714141845703125} -09/20/2021 18:07:43 - INFO - __main__ - Step 16815: {'lr': 0.00019998169007624323, 'samples': 538080, 'steps': 1050, 'loss/train': 4.00825834274292} -09/20/2021 18:07:44 - INFO - __main__ - Step 16816: {'lr': 0.00019998169007624323, 'samples': 538112, 'steps': 1050, 'loss/train': 3.80550217628479} -09/20/2021 18:07:46 - INFO - __main__ - Step 16817: {'lr': 0.00019998156781039756, 'samples': 538144, 'steps': 1051, 'loss/train': 3.863064765930176} -09/20/2021 18:07:47 - INFO - __main__ - Step 16818: {'lr': 0.00019998156781039756, 'samples': 538176, 'steps': 1051, 'loss/train': 3.8865065574645996} -09/20/2021 18:07:47 - INFO - __main__ - Step 16819: {'lr': 0.00019998156781039756, 'samples': 538208, 'steps': 1051, 'loss/train': 3.4489426612854004} -09/20/2021 18:07:48 - INFO - __main__ - Step 16820: {'lr': 0.00019998156781039756, 'samples': 538240, 'steps': 1051, 'loss/train': 3.9931557178497314} -09/20/2021 18:07:49 - INFO - __main__ - Step 16821: {'lr': 0.00019998156781039756, 'samples': 538272, 'steps': 1051, 'loss/train': 2.49748158454895} -09/20/2021 18:07:50 - INFO - __main__ - Step 16822: {'lr': 0.00019998156781039756, 'samples': 538304, 'steps': 1051, 'loss/train': 3.116647481918335} -09/20/2021 18:07:50 - INFO - __main__ - Step 16823: {'lr': 0.00019998156781039756, 'samples': 538336, 'steps': 1051, 'loss/train': 3.2152955532073975} -09/20/2021 18:07:51 - INFO - __main__ - Step 16824: {'lr': 0.00019998156781039756, 'samples': 538368, 'steps': 1051, 'loss/train': 3.3891818523406982} -09/20/2021 18:07:52 - INFO - __main__ - Step 16825: {'lr': 0.00019998156781039756, 'samples': 538400, 'steps': 1051, 'loss/train': 5.054455280303955} -09/20/2021 18:07:53 - INFO - __main__ - Step 16826: {'lr': 0.00019998156781039756, 'samples': 538432, 'steps': 1051, 'loss/train': 4.061713695526123} -09/20/2021 18:07:53 - INFO - __main__ - Step 16827: {'lr': 0.00019998156781039756, 'samples': 538464, 'steps': 1051, 'loss/train': 3.5643198490142822} -09/20/2021 18:07:54 - INFO - __main__ - Step 16828: {'lr': 0.00019998156781039756, 'samples': 538496, 'steps': 1051, 'loss/train': 2.4089717864990234} -09/20/2021 18:07:55 - INFO - __main__ - Step 16829: {'lr': 0.00019998156781039756, 'samples': 538528, 'steps': 1051, 'loss/train': 3.5304417610168457} -09/20/2021 18:07:56 - INFO - __main__ - Step 16830: {'lr': 0.00019998156781039756, 'samples': 538560, 'steps': 1051, 'loss/train': 3.1227643489837646} -09/20/2021 18:07:56 - INFO - __main__ - Step 16831: {'lr': 0.00019998156781039756, 'samples': 538592, 'steps': 1051, 'loss/train': 3.8267602920532227} -09/20/2021 18:07:57 - INFO - __main__ - Step 16832: {'lr': 0.00019998156781039756, 'samples': 538624, 'steps': 1051, 'loss/train': 3.494011402130127} -09/20/2021 18:07:58 - INFO - __main__ - Step 16833: {'lr': 0.00019998144513772728, 'samples': 538656, 'steps': 1052, 'loss/train': 3.235513210296631} -09/20/2021 18:07:59 - INFO - __main__ - Step 16834: {'lr': 0.00019998144513772728, 'samples': 538688, 'steps': 1052, 'loss/train': 3.3894548416137695} -09/20/2021 18:07:59 - INFO - __main__ - Step 16835: {'lr': 0.00019998144513772728, 'samples': 538720, 'steps': 1052, 'loss/train': 3.688854694366455} -09/20/2021 18:08:00 - INFO - __main__ - Step 16836: {'lr': 0.00019998144513772728, 'samples': 538752, 'steps': 1052, 'loss/train': 3.5891592502593994} -09/20/2021 18:08:01 - INFO - __main__ - Step 16837: {'lr': 0.00019998144513772728, 'samples': 538784, 'steps': 1052, 'loss/train': 3.8703153133392334} -09/20/2021 18:08:02 - INFO - __main__ - Step 16838: {'lr': 0.00019998144513772728, 'samples': 538816, 'steps': 1052, 'loss/train': 4.1790452003479} -09/20/2021 18:08:02 - INFO - __main__ - Step 16839: {'lr': 0.00019998144513772728, 'samples': 538848, 'steps': 1052, 'loss/train': 4.598097324371338} -09/20/2021 18:08:03 - INFO - __main__ - Step 16840: {'lr': 0.00019998144513772728, 'samples': 538880, 'steps': 1052, 'loss/train': 2.50809645652771} -09/20/2021 18:08:04 - INFO - __main__ - Step 16841: {'lr': 0.00019998144513772728, 'samples': 538912, 'steps': 1052, 'loss/train': 4.109065532684326} -09/20/2021 18:08:05 - INFO - __main__ - Step 16842: {'lr': 0.00019998144513772728, 'samples': 538944, 'steps': 1052, 'loss/train': 3.6665430068969727} -09/20/2021 18:08:05 - INFO - __main__ - Step 16843: {'lr': 0.00019998144513772728, 'samples': 538976, 'steps': 1052, 'loss/train': 3.4539542198181152} -09/20/2021 18:08:06 - INFO - __main__ - Step 16844: {'lr': 0.00019998144513772728, 'samples': 539008, 'steps': 1052, 'loss/train': 3.999936103820801} -09/20/2021 18:08:07 - INFO - __main__ - Step 16845: {'lr': 0.00019998144513772728, 'samples': 539040, 'steps': 1052, 'loss/train': 0.8475849032402039} -09/20/2021 18:08:08 - INFO - __main__ - Step 16846: {'lr': 0.00019998144513772728, 'samples': 539072, 'steps': 1052, 'loss/train': 4.318583965301514} -09/20/2021 18:08:09 - INFO - __main__ - Step 16847: {'lr': 0.00019998144513772728, 'samples': 539104, 'steps': 1052, 'loss/train': 3.716236114501953} -09/20/2021 18:08:10 - INFO - __main__ - Step 16848: {'lr': 0.00019998144513772728, 'samples': 539136, 'steps': 1052, 'loss/train': 3.2833282947540283} -09/20/2021 18:08:11 - INFO - __main__ - Step 16849: {'lr': 0.00019998132205823285, 'samples': 539168, 'steps': 1053, 'loss/train': 3.5787577629089355} -09/20/2021 18:08:11 - INFO - __main__ - Step 16850: {'lr': 0.00019998132205823285, 'samples': 539200, 'steps': 1053, 'loss/train': 3.5662615299224854} -09/20/2021 18:08:12 - INFO - __main__ - Step 16851: {'lr': 0.00019998132205823285, 'samples': 539232, 'steps': 1053, 'loss/train': 4.208986282348633} -09/20/2021 18:08:13 - INFO - __main__ - Step 16852: {'lr': 0.00019998132205823285, 'samples': 539264, 'steps': 1053, 'loss/train': 3.965467929840088} -09/20/2021 18:08:14 - INFO - __main__ - Step 16853: {'lr': 0.00019998132205823285, 'samples': 539296, 'steps': 1053, 'loss/train': 3.9240360260009766} -09/20/2021 18:08:14 - INFO - __main__ - Step 16854: {'lr': 0.00019998132205823285, 'samples': 539328, 'steps': 1053, 'loss/train': 3.0337138175964355} -09/20/2021 18:08:15 - INFO - __main__ - Step 16855: {'lr': 0.00019998132205823285, 'samples': 539360, 'steps': 1053, 'loss/train': 3.037470817565918} -09/20/2021 18:08:16 - INFO - __main__ - Step 16856: {'lr': 0.00019998132205823285, 'samples': 539392, 'steps': 1053, 'loss/train': 3.4429819583892822} -09/20/2021 18:08:17 - INFO - __main__ - Step 16857: {'lr': 0.00019998132205823285, 'samples': 539424, 'steps': 1053, 'loss/train': 3.8651742935180664} -09/20/2021 18:08:17 - INFO - __main__ - Step 16858: {'lr': 0.00019998132205823285, 'samples': 539456, 'steps': 1053, 'loss/train': 3.6102983951568604} -09/20/2021 18:08:18 - INFO - __main__ - Step 16859: {'lr': 0.00019998132205823285, 'samples': 539488, 'steps': 1053, 'loss/train': 1.6846070289611816} -09/20/2021 18:08:19 - INFO - __main__ - Step 16860: {'lr': 0.00019998132205823285, 'samples': 539520, 'steps': 1053, 'loss/train': 3.8176310062408447} -09/20/2021 18:08:20 - INFO - __main__ - Step 16861: {'lr': 0.00019998132205823285, 'samples': 539552, 'steps': 1053, 'loss/train': 3.7209465503692627} -09/20/2021 18:08:20 - INFO - __main__ - Step 16862: {'lr': 0.00019998132205823285, 'samples': 539584, 'steps': 1053, 'loss/train': 2.6408603191375732} -09/20/2021 18:08:21 - INFO - __main__ - Step 16863: {'lr': 0.00019998132205823285, 'samples': 539616, 'steps': 1053, 'loss/train': 3.0525946617126465} -09/20/2021 18:08:22 - INFO - __main__ - Step 16864: {'lr': 0.00019998132205823285, 'samples': 539648, 'steps': 1053, 'loss/train': 4.4272589683532715} -09/20/2021 18:08:23 - INFO - __main__ - Step 16865: {'lr': 0.00019998119857191483, 'samples': 539680, 'steps': 1054, 'loss/train': 3.990583658218384} -09/20/2021 18:08:24 - INFO - __main__ - Step 16866: {'lr': 0.00019998119857191483, 'samples': 539712, 'steps': 1054, 'loss/train': 3.818596363067627} -09/20/2021 18:08:24 - INFO - __main__ - Step 16867: {'lr': 0.00019998119857191483, 'samples': 539744, 'steps': 1054, 'loss/train': 3.630061149597168} -09/20/2021 18:08:25 - INFO - __main__ - Step 16868: {'lr': 0.00019998119857191483, 'samples': 539776, 'steps': 1054, 'loss/train': 3.154045820236206} -09/20/2021 18:08:26 - INFO - __main__ - Step 16869: {'lr': 0.00019998119857191483, 'samples': 539808, 'steps': 1054, 'loss/train': 3.421318769454956} -09/20/2021 18:08:27 - INFO - __main__ - Step 16870: {'lr': 0.00019998119857191483, 'samples': 539840, 'steps': 1054, 'loss/train': 3.885298013687134} -09/20/2021 18:08:27 - INFO - __main__ - Step 16871: {'lr': 0.00019998119857191483, 'samples': 539872, 'steps': 1054, 'loss/train': 3.853231191635132} -09/20/2021 18:08:28 - INFO - __main__ - Step 16872: {'lr': 0.00019998119857191483, 'samples': 539904, 'steps': 1054, 'loss/train': 2.8972384929656982} -09/20/2021 18:08:29 - INFO - __main__ - Step 16873: {'lr': 0.00019998119857191483, 'samples': 539936, 'steps': 1054, 'loss/train': 3.367562770843506} -09/20/2021 18:08:30 - INFO - __main__ - Step 16874: {'lr': 0.00019998119857191483, 'samples': 539968, 'steps': 1054, 'loss/train': 3.5108160972595215} -09/20/2021 18:08:30 - INFO - __main__ - Step 16875: {'lr': 0.00019998119857191483, 'samples': 540000, 'steps': 1054, 'loss/train': 3.5231196880340576} -09/20/2021 18:08:31 - INFO - __main__ - Step 16876: {'lr': 0.00019998119857191483, 'samples': 540032, 'steps': 1054, 'loss/train': 3.8781545162200928} -09/20/2021 18:08:32 - INFO - __main__ - Step 16877: {'lr': 0.00019998119857191483, 'samples': 540064, 'steps': 1054, 'loss/train': 3.6633541584014893} -09/20/2021 18:08:33 - INFO - __main__ - Step 16878: {'lr': 0.00019998119857191483, 'samples': 540096, 'steps': 1054, 'loss/train': 4.499164581298828} -09/20/2021 18:08:34 - INFO - __main__ - Step 16879: {'lr': 0.00019998119857191483, 'samples': 540128, 'steps': 1054, 'loss/train': 2.7106192111968994} -09/20/2021 18:08:35 - INFO - __main__ - Step 16880: {'lr': 0.00019998119857191483, 'samples': 540160, 'steps': 1054, 'loss/train': 4.610044002532959} -09/20/2021 18:08:35 - INFO - __main__ - Step 16881: {'lr': 0.00019998107467877373, 'samples': 540192, 'steps': 1055, 'loss/train': 3.7248291969299316} -09/20/2021 18:08:36 - INFO - __main__ - Step 16882: {'lr': 0.00019998107467877373, 'samples': 540224, 'steps': 1055, 'loss/train': 1.6894441843032837} -09/20/2021 18:08:37 - INFO - __main__ - Step 16883: {'lr': 0.00019998107467877373, 'samples': 540256, 'steps': 1055, 'loss/train': 2.878610610961914} -09/20/2021 18:08:38 - INFO - __main__ - Step 16884: {'lr': 0.00019998107467877373, 'samples': 540288, 'steps': 1055, 'loss/train': 4.684802532196045} -09/20/2021 18:08:38 - INFO - __main__ - Step 16885: {'lr': 0.00019998107467877373, 'samples': 540320, 'steps': 1055, 'loss/train': 4.093372821807861} -09/20/2021 18:08:39 - INFO - __main__ - Step 16886: {'lr': 0.00019998107467877373, 'samples': 540352, 'steps': 1055, 'loss/train': 3.5180106163024902} -09/20/2021 18:08:40 - INFO - __main__ - Step 16887: {'lr': 0.00019998107467877373, 'samples': 540384, 'steps': 1055, 'loss/train': 6.370876789093018} -09/20/2021 18:08:41 - INFO - __main__ - Step 16888: {'lr': 0.00019998107467877373, 'samples': 540416, 'steps': 1055, 'loss/train': 3.144209861755371} -09/20/2021 18:08:41 - INFO - __main__ - Step 16889: {'lr': 0.00019998107467877373, 'samples': 540448, 'steps': 1055, 'loss/train': 4.075575351715088} -09/20/2021 18:08:42 - INFO - __main__ - Step 16890: {'lr': 0.00019998107467877373, 'samples': 540480, 'steps': 1055, 'loss/train': 4.197078227996826} -09/20/2021 18:08:43 - INFO - __main__ - Step 16891: {'lr': 0.00019998107467877373, 'samples': 540512, 'steps': 1055, 'loss/train': 3.839778423309326} -09/20/2021 18:08:44 - INFO - __main__ - Step 16892: {'lr': 0.00019998107467877373, 'samples': 540544, 'steps': 1055, 'loss/train': 1.1069176197052002} -09/20/2021 18:08:44 - INFO - __main__ - Step 16893: {'lr': 0.00019998107467877373, 'samples': 540576, 'steps': 1055, 'loss/train': 3.3869824409484863} -09/20/2021 18:08:45 - INFO - __main__ - Step 16894: {'lr': 0.00019998107467877373, 'samples': 540608, 'steps': 1055, 'loss/train': 3.4179129600524902} -09/20/2021 18:08:46 - INFO - __main__ - Step 16895: {'lr': 0.00019998107467877373, 'samples': 540640, 'steps': 1055, 'loss/train': 3.698887348175049} -09/20/2021 18:08:47 - INFO - __main__ - Step 16896: {'lr': 0.00019998107467877373, 'samples': 540672, 'steps': 1055, 'loss/train': 2.9622910022735596} -09/20/2021 18:08:48 - INFO - __main__ - Step 16897: {'lr': 0.00019998095037881, 'samples': 540704, 'steps': 1056, 'loss/train': 4.8670220375061035} -09/20/2021 18:08:48 - INFO - __main__ - Step 16898: {'lr': 0.00019998095037881, 'samples': 540736, 'steps': 1056, 'loss/train': 3.8693273067474365} -09/20/2021 18:08:49 - INFO - __main__ - Step 16899: {'lr': 0.00019998095037881, 'samples': 540768, 'steps': 1056, 'loss/train': 1.3836541175842285} -09/20/2021 18:08:50 - INFO - __main__ - Step 16900: {'lr': 0.00019998095037881, 'samples': 540800, 'steps': 1056, 'loss/train': 3.8244035243988037} -09/20/2021 18:08:51 - INFO - __main__ - Step 16901: {'lr': 0.00019998095037881, 'samples': 540832, 'steps': 1056, 'loss/train': 3.955554246902466} -09/20/2021 18:08:51 - INFO - __main__ - Step 16902: {'lr': 0.00019998095037881, 'samples': 540864, 'steps': 1056, 'loss/train': 3.189166307449341} -09/20/2021 18:08:52 - INFO - __main__ - Step 16903: {'lr': 0.00019998095037881, 'samples': 540896, 'steps': 1056, 'loss/train': 3.8263847827911377} -09/20/2021 18:08:53 - INFO - __main__ - Step 16904: {'lr': 0.00019998095037881, 'samples': 540928, 'steps': 1056, 'loss/train': 3.7855255603790283} -09/20/2021 18:08:54 - INFO - __main__ - Step 16905: {'lr': 0.00019998095037881, 'samples': 540960, 'steps': 1056, 'loss/train': 3.5899269580841064} -09/20/2021 18:08:54 - INFO - __main__ - Step 16906: {'lr': 0.00019998095037881, 'samples': 540992, 'steps': 1056, 'loss/train': 3.7504260540008545} -09/20/2021 18:08:55 - INFO - __main__ - Step 16907: {'lr': 0.00019998095037881, 'samples': 541024, 'steps': 1056, 'loss/train': 3.770010471343994} -09/20/2021 18:08:56 - INFO - __main__ - Step 16908: {'lr': 0.00019998095037881, 'samples': 541056, 'steps': 1056, 'loss/train': 3.4628729820251465} -09/20/2021 18:08:57 - INFO - __main__ - Step 16909: {'lr': 0.00019998095037881, 'samples': 541088, 'steps': 1056, 'loss/train': 3.5846707820892334} -09/20/2021 18:08:58 - INFO - __main__ - Step 16910: {'lr': 0.00019998095037881, 'samples': 541120, 'steps': 1056, 'loss/train': 4.717772006988525} -09/20/2021 18:08:59 - INFO - __main__ - Step 16911: {'lr': 0.00019998095037881, 'samples': 541152, 'steps': 1056, 'loss/train': 3.9743053913116455} -09/20/2021 18:08:59 - INFO - __main__ - Step 16912: {'lr': 0.00019998095037881, 'samples': 541184, 'steps': 1056, 'loss/train': 3.947540521621704} -09/20/2021 18:09:00 - INFO - __main__ - Step 16913: {'lr': 0.00019998082567202418, 'samples': 541216, 'steps': 1057, 'loss/train': 2.871150255203247} -09/20/2021 18:09:01 - INFO - __main__ - Step 16914: {'lr': 0.00019998082567202418, 'samples': 541248, 'steps': 1057, 'loss/train': 3.294588804244995} -09/20/2021 18:09:02 - INFO - __main__ - Step 16915: {'lr': 0.00019998082567202418, 'samples': 541280, 'steps': 1057, 'loss/train': 3.3109586238861084} -09/20/2021 18:09:03 - INFO - __main__ - Step 16916: {'lr': 0.00019998082567202418, 'samples': 541312, 'steps': 1057, 'loss/train': 3.8044207096099854} -09/20/2021 18:09:03 - INFO - __main__ - Step 16917: {'lr': 0.00019998082567202418, 'samples': 541344, 'steps': 1057, 'loss/train': 4.136190891265869} -09/20/2021 18:09:04 - INFO - __main__ - Step 16918: {'lr': 0.00019998082567202418, 'samples': 541376, 'steps': 1057, 'loss/train': 3.6928374767303467} -09/20/2021 18:09:05 - INFO - __main__ - Step 16919: {'lr': 0.00019998082567202418, 'samples': 541408, 'steps': 1057, 'loss/train': 3.785771369934082} -09/20/2021 18:09:06 - INFO - __main__ - Step 16920: {'lr': 0.00019998082567202418, 'samples': 541440, 'steps': 1057, 'loss/train': 3.32150936126709} -09/20/2021 18:09:06 - INFO - __main__ - Step 16921: {'lr': 0.00019998082567202418, 'samples': 541472, 'steps': 1057, 'loss/train': 4.546048164367676} -09/20/2021 18:09:07 - INFO - __main__ - Step 16922: {'lr': 0.00019998082567202418, 'samples': 541504, 'steps': 1057, 'loss/train': 3.3360562324523926} -09/20/2021 18:09:08 - INFO - __main__ - Step 16923: {'lr': 0.00019998082567202418, 'samples': 541536, 'steps': 1057, 'loss/train': 2.501148223876953} -09/20/2021 18:09:09 - INFO - __main__ - Step 16924: {'lr': 0.00019998082567202418, 'samples': 541568, 'steps': 1057, 'loss/train': 3.2228991985321045} -09/20/2021 18:09:09 - INFO - __main__ - Step 16925: {'lr': 0.00019998082567202418, 'samples': 541600, 'steps': 1057, 'loss/train': 4.0208539962768555} -09/20/2021 18:09:10 - INFO - __main__ - Step 16926: {'lr': 0.00019998082567202418, 'samples': 541632, 'steps': 1057, 'loss/train': 4.658174514770508} -09/20/2021 18:09:11 - INFO - __main__ - Step 16927: {'lr': 0.00019998082567202418, 'samples': 541664, 'steps': 1057, 'loss/train': 4.27024507522583} -09/20/2021 18:09:12 - INFO - __main__ - Step 16928: {'lr': 0.00019998082567202418, 'samples': 541696, 'steps': 1057, 'loss/train': 4.0556416511535645} -09/20/2021 18:09:12 - INFO - __main__ - Step 16929: {'lr': 0.00019998070055841674, 'samples': 541728, 'steps': 1058, 'loss/train': 3.438617467880249} -09/20/2021 18:09:13 - INFO - __main__ - Step 16930: {'lr': 0.00019998070055841674, 'samples': 541760, 'steps': 1058, 'loss/train': 4.519624710083008} -09/20/2021 18:09:14 - INFO - __main__ - Step 16931: {'lr': 0.00019998070055841674, 'samples': 541792, 'steps': 1058, 'loss/train': 5.182056903839111} -09/20/2021 18:09:15 - INFO - __main__ - Step 16932: {'lr': 0.00019998070055841674, 'samples': 541824, 'steps': 1058, 'loss/train': 2.828852891921997} -09/20/2021 18:09:15 - INFO - __main__ - Step 16933: {'lr': 0.00019998070055841674, 'samples': 541856, 'steps': 1058, 'loss/train': 4.333621025085449} -09/20/2021 18:09:16 - INFO - __main__ - Step 16934: {'lr': 0.00019998070055841674, 'samples': 541888, 'steps': 1058, 'loss/train': 3.4318459033966064} -09/20/2021 18:09:17 - INFO - __main__ - Step 16935: {'lr': 0.00019998070055841674, 'samples': 541920, 'steps': 1058, 'loss/train': 3.0851404666900635} -09/20/2021 18:09:18 - INFO - __main__ - Step 16936: {'lr': 0.00019998070055841674, 'samples': 541952, 'steps': 1058, 'loss/train': 3.37569260597229} -09/20/2021 18:09:18 - INFO - __main__ - Step 16937: {'lr': 0.00019998070055841674, 'samples': 541984, 'steps': 1058, 'loss/train': 3.7098190784454346} -09/20/2021 18:09:19 - INFO - __main__ - Step 16938: {'lr': 0.00019998070055841674, 'samples': 542016, 'steps': 1058, 'loss/train': 3.541321277618408} -09/20/2021 18:09:20 - INFO - __main__ - Step 16939: {'lr': 0.00019998070055841674, 'samples': 542048, 'steps': 1058, 'loss/train': 2.4415767192840576} -09/20/2021 18:09:21 - INFO - __main__ - Step 16940: {'lr': 0.00019998070055841674, 'samples': 542080, 'steps': 1058, 'loss/train': 2.1062636375427246} -09/20/2021 18:09:22 - INFO - __main__ - Step 16941: {'lr': 0.00019998070055841674, 'samples': 542112, 'steps': 1058, 'loss/train': 3.783799648284912} -09/20/2021 18:09:23 - INFO - __main__ - Step 16942: {'lr': 0.00019998070055841674, 'samples': 542144, 'steps': 1058, 'loss/train': 3.2608578205108643} -09/20/2021 18:09:23 - INFO - __main__ - Step 16943: {'lr': 0.00019998070055841674, 'samples': 542176, 'steps': 1058, 'loss/train': 3.8335790634155273} -09/20/2021 18:09:24 - INFO - __main__ - Step 16944: {'lr': 0.00019998070055841674, 'samples': 542208, 'steps': 1058, 'loss/train': 0.9509866237640381} -09/20/2021 18:09:25 - INFO - __main__ - Step 16945: {'lr': 0.00019998057503798825, 'samples': 542240, 'steps': 1059, 'loss/train': 3.338118314743042} -09/20/2021 18:09:26 - INFO - __main__ - Step 16946: {'lr': 0.00019998057503798825, 'samples': 542272, 'steps': 1059, 'loss/train': 4.110389232635498} -09/20/2021 18:09:27 - INFO - __main__ - Step 16947: {'lr': 0.00019998057503798825, 'samples': 542304, 'steps': 1059, 'loss/train': 3.480997323989868} -09/20/2021 18:09:27 - INFO - __main__ - Step 16948: {'lr': 0.00019998057503798825, 'samples': 542336, 'steps': 1059, 'loss/train': 3.1882100105285645} -09/20/2021 18:09:28 - INFO - __main__ - Step 16949: {'lr': 0.00019998057503798825, 'samples': 542368, 'steps': 1059, 'loss/train': 3.794365882873535} -09/20/2021 18:09:29 - INFO - __main__ - Step 16950: {'lr': 0.00019998057503798825, 'samples': 542400, 'steps': 1059, 'loss/train': 3.4773690700531006} -09/20/2021 18:09:30 - INFO - __main__ - Step 16951: {'lr': 0.00019998057503798825, 'samples': 542432, 'steps': 1059, 'loss/train': 3.5111424922943115} -09/20/2021 18:09:30 - INFO - __main__ - Step 16952: {'lr': 0.00019998057503798825, 'samples': 542464, 'steps': 1059, 'loss/train': 3.391751289367676} -09/20/2021 18:09:31 - INFO - __main__ - Step 16953: {'lr': 0.00019998057503798825, 'samples': 542496, 'steps': 1059, 'loss/train': 3.382645606994629} -09/20/2021 18:09:32 - INFO - __main__ - Step 16954: {'lr': 0.00019998057503798825, 'samples': 542528, 'steps': 1059, 'loss/train': 3.787097454071045} -09/20/2021 18:09:33 - INFO - __main__ - Step 16955: {'lr': 0.00019998057503798825, 'samples': 542560, 'steps': 1059, 'loss/train': 3.959488868713379} -09/20/2021 18:09:33 - INFO - __main__ - Step 16956: {'lr': 0.00019998057503798825, 'samples': 542592, 'steps': 1059, 'loss/train': 3.277066946029663} -09/20/2021 18:09:34 - INFO - __main__ - Step 16957: {'lr': 0.00019998057503798825, 'samples': 542624, 'steps': 1059, 'loss/train': 4.400177001953125} -09/20/2021 18:09:35 - INFO - __main__ - Step 16958: {'lr': 0.00019998057503798825, 'samples': 542656, 'steps': 1059, 'loss/train': 5.604701995849609} -09/20/2021 18:09:36 - INFO - __main__ - Step 16959: {'lr': 0.00019998057503798825, 'samples': 542688, 'steps': 1059, 'loss/train': 2.979703426361084} -09/20/2021 18:09:36 - INFO - __main__ - Step 16960: {'lr': 0.00019998057503798825, 'samples': 542720, 'steps': 1059, 'loss/train': 2.6892504692077637} -09/20/2021 18:09:37 - INFO - __main__ - Step 16961: {'lr': 0.00019998044911073918, 'samples': 542752, 'steps': 1060, 'loss/train': 2.835958242416382} -09/20/2021 18:09:38 - INFO - __main__ - Step 16962: {'lr': 0.00019998044911073918, 'samples': 542784, 'steps': 1060, 'loss/train': 3.8414745330810547} -09/20/2021 18:09:39 - INFO - __main__ - Step 16963: {'lr': 0.00019998044911073918, 'samples': 542816, 'steps': 1060, 'loss/train': 3.753891944885254} -09/20/2021 18:09:39 - INFO - __main__ - Step 16964: {'lr': 0.00019998044911073918, 'samples': 542848, 'steps': 1060, 'loss/train': 2.712916851043701} -09/20/2021 18:09:40 - INFO - __main__ - Step 16965: {'lr': 0.00019998044911073918, 'samples': 542880, 'steps': 1060, 'loss/train': 3.4759726524353027} -09/20/2021 18:09:41 - INFO - __main__ - Step 16966: {'lr': 0.00019998044911073918, 'samples': 542912, 'steps': 1060, 'loss/train': 3.744464159011841} -09/20/2021 18:09:42 - INFO - __main__ - Step 16967: {'lr': 0.00019998044911073918, 'samples': 542944, 'steps': 1060, 'loss/train': 3.2778701782226562} -09/20/2021 18:09:42 - INFO - __main__ - Step 16968: {'lr': 0.00019998044911073918, 'samples': 542976, 'steps': 1060, 'loss/train': 4.282745838165283} -09/20/2021 18:09:43 - INFO - __main__ - Step 16969: {'lr': 0.00019998044911073918, 'samples': 543008, 'steps': 1060, 'loss/train': 3.3072967529296875} -09/20/2021 18:09:45 - INFO - __main__ - Step 16970: {'lr': 0.00019998044911073918, 'samples': 543040, 'steps': 1060, 'loss/train': 3.6660664081573486} -09/20/2021 18:09:45 - INFO - __main__ - Step 16971: {'lr': 0.00019998044911073918, 'samples': 543072, 'steps': 1060, 'loss/train': 4.4134674072265625} -09/20/2021 18:09:46 - INFO - __main__ - Step 16972: {'lr': 0.00019998044911073918, 'samples': 543104, 'steps': 1060, 'loss/train': 2.990266799926758} -09/20/2021 18:09:47 - INFO - __main__ - Step 16973: {'lr': 0.00019998044911073918, 'samples': 543136, 'steps': 1060, 'loss/train': 3.7321205139160156} -09/20/2021 18:09:48 - INFO - __main__ - Step 16974: {'lr': 0.00019998044911073918, 'samples': 543168, 'steps': 1060, 'loss/train': 4.67315149307251} -09/20/2021 18:09:48 - INFO - __main__ - Step 16975: {'lr': 0.00019998044911073918, 'samples': 543200, 'steps': 1060, 'loss/train': 5.159298896789551} -09/20/2021 18:09:49 - INFO - __main__ - Step 16976: {'lr': 0.00019998044911073918, 'samples': 543232, 'steps': 1060, 'loss/train': 5.5198445320129395} -09/20/2021 18:09:50 - INFO - __main__ - Step 16977: {'lr': 0.00019998032277667008, 'samples': 543264, 'steps': 1061, 'loss/train': 4.390657424926758} -09/20/2021 18:09:51 - INFO - __main__ - Step 16978: {'lr': 0.00019998032277667008, 'samples': 543296, 'steps': 1061, 'loss/train': 3.901240825653076} -09/20/2021 18:09:52 - INFO - __main__ - Step 16979: {'lr': 0.00019998032277667008, 'samples': 543328, 'steps': 1061, 'loss/train': 4.686474323272705} -09/20/2021 18:09:52 - INFO - __main__ - Step 16980: {'lr': 0.00019998032277667008, 'samples': 543360, 'steps': 1061, 'loss/train': 3.581338405609131} -09/20/2021 18:09:53 - INFO - __main__ - Step 16981: {'lr': 0.00019998032277667008, 'samples': 543392, 'steps': 1061, 'loss/train': 4.514243125915527} -09/20/2021 18:09:54 - INFO - __main__ - Step 16982: {'lr': 0.00019998032277667008, 'samples': 543424, 'steps': 1061, 'loss/train': 3.948465585708618} -09/20/2021 18:09:55 - INFO - __main__ - Step 16983: {'lr': 0.00019998032277667008, 'samples': 543456, 'steps': 1061, 'loss/train': 3.425469160079956} -09/20/2021 18:09:55 - INFO - __main__ - Step 16984: {'lr': 0.00019998032277667008, 'samples': 543488, 'steps': 1061, 'loss/train': 3.3655753135681152} -09/20/2021 18:09:56 - INFO - __main__ - Step 16985: {'lr': 0.00019998032277667008, 'samples': 543520, 'steps': 1061, 'loss/train': 3.4256701469421387} -09/20/2021 18:09:57 - INFO - __main__ - Step 16986: {'lr': 0.00019998032277667008, 'samples': 543552, 'steps': 1061, 'loss/train': 1.1294279098510742} -09/20/2021 18:09:58 - INFO - __main__ - Step 16987: {'lr': 0.00019998032277667008, 'samples': 543584, 'steps': 1061, 'loss/train': 3.2075397968292236} -09/20/2021 18:09:58 - INFO - __main__ - Step 16988: {'lr': 0.00019998032277667008, 'samples': 543616, 'steps': 1061, 'loss/train': 3.4164483547210693} -09/20/2021 18:09:59 - INFO - __main__ - Step 16989: {'lr': 0.00019998032277667008, 'samples': 543648, 'steps': 1061, 'loss/train': 4.044127941131592} -09/20/2021 18:10:00 - INFO - __main__ - Step 16990: {'lr': 0.00019998032277667008, 'samples': 543680, 'steps': 1061, 'loss/train': 3.848381996154785} -09/20/2021 18:10:01 - INFO - __main__ - Step 16991: {'lr': 0.00019998032277667008, 'samples': 543712, 'steps': 1061, 'loss/train': 3.682746171951294} -09/20/2021 18:10:01 - INFO - __main__ - Step 16992: {'lr': 0.00019998032277667008, 'samples': 543744, 'steps': 1061, 'loss/train': 4.126366138458252} -09/20/2021 18:10:02 - INFO - __main__ - Step 16993: {'lr': 0.0001999801960357814, 'samples': 543776, 'steps': 1062, 'loss/train': 3.601876974105835} -09/20/2021 18:10:03 - INFO - __main__ - Step 16994: {'lr': 0.0001999801960357814, 'samples': 543808, 'steps': 1062, 'loss/train': 4.7384867668151855} -09/20/2021 18:10:04 - INFO - __main__ - Step 16995: {'lr': 0.0001999801960357814, 'samples': 543840, 'steps': 1062, 'loss/train': 3.0181941986083984} -09/20/2021 18:10:04 - INFO - __main__ - Step 16996: {'lr': 0.0001999801960357814, 'samples': 543872, 'steps': 1062, 'loss/train': 3.4198038578033447} -09/20/2021 18:10:05 - INFO - __main__ - Step 16997: {'lr': 0.0001999801960357814, 'samples': 543904, 'steps': 1062, 'loss/train': 3.929853677749634} -09/20/2021 18:10:06 - INFO - __main__ - Step 16998: {'lr': 0.0001999801960357814, 'samples': 543936, 'steps': 1062, 'loss/train': 3.0626158714294434} -09/20/2021 18:10:07 - INFO - __main__ - Step 16999: {'lr': 0.0001999801960357814, 'samples': 543968, 'steps': 1062, 'loss/train': 4.050693988800049} -09/20/2021 18:10:07 - INFO - __main__ - Step 17000: {'lr': 0.0001999801960357814, 'samples': 544000, 'steps': 1062, 'loss/train': 3.7101783752441406} -09/20/2021 18:10:08 - INFO - __main__ - Step 17001: {'lr': 0.0001999801960357814, 'samples': 544032, 'steps': 1062, 'loss/train': 2.969670057296753} -09/20/2021 18:10:09 - INFO - __main__ - Step 17002: {'lr': 0.0001999801960357814, 'samples': 544064, 'steps': 1062, 'loss/train': 4.4741315841674805} -09/20/2021 18:10:10 - INFO - __main__ - Step 17003: {'lr': 0.0001999801960357814, 'samples': 544096, 'steps': 1062, 'loss/train': 4.081254959106445} -09/20/2021 18:10:11 - INFO - __main__ - Step 17004: {'lr': 0.0001999801960357814, 'samples': 544128, 'steps': 1062, 'loss/train': 3.4876348972320557} -09/20/2021 18:10:12 - INFO - __main__ - Step 17005: {'lr': 0.0001999801960357814, 'samples': 544160, 'steps': 1062, 'loss/train': 3.837064504623413} -09/20/2021 18:10:12 - INFO - __main__ - Step 17006: {'lr': 0.0001999801960357814, 'samples': 544192, 'steps': 1062, 'loss/train': 4.4514288902282715} -09/20/2021 18:10:13 - INFO - __main__ - Step 17007: {'lr': 0.0001999801960357814, 'samples': 544224, 'steps': 1062, 'loss/train': 1.78705632686615} -09/20/2021 18:10:14 - INFO - __main__ - Step 17008: {'lr': 0.0001999801960357814, 'samples': 544256, 'steps': 1062, 'loss/train': 3.822801351547241} -09/20/2021 18:10:15 - INFO - __main__ - Step 17009: {'lr': 0.0001999800688880737, 'samples': 544288, 'steps': 1063, 'loss/train': 3.6699650287628174} -09/20/2021 18:10:16 - INFO - __main__ - Step 17010: {'lr': 0.0001999800688880737, 'samples': 544320, 'steps': 1063, 'loss/train': 3.0358150005340576} -09/20/2021 18:10:16 - INFO - __main__ - Step 17011: {'lr': 0.0001999800688880737, 'samples': 544352, 'steps': 1063, 'loss/train': 2.1285173892974854} -09/20/2021 18:10:17 - INFO - __main__ - Step 17012: {'lr': 0.0001999800688880737, 'samples': 544384, 'steps': 1063, 'loss/train': 4.638071537017822} -09/20/2021 18:10:18 - INFO - __main__ - Step 17013: {'lr': 0.0001999800688880737, 'samples': 544416, 'steps': 1063, 'loss/train': 3.4655234813690186} -09/20/2021 18:10:19 - INFO - __main__ - Step 17014: {'lr': 0.0001999800688880737, 'samples': 544448, 'steps': 1063, 'loss/train': 3.566868782043457} -09/20/2021 18:10:19 - INFO - __main__ - Step 17015: {'lr': 0.0001999800688880737, 'samples': 544480, 'steps': 1063, 'loss/train': 4.883727550506592} -09/20/2021 18:10:20 - INFO - __main__ - Step 17016: {'lr': 0.0001999800688880737, 'samples': 544512, 'steps': 1063, 'loss/train': 4.461665630340576} -09/20/2021 18:10:21 - INFO - __main__ - Step 17017: {'lr': 0.0001999800688880737, 'samples': 544544, 'steps': 1063, 'loss/train': 3.531468152999878} -09/20/2021 18:10:22 - INFO - __main__ - Step 17018: {'lr': 0.0001999800688880737, 'samples': 544576, 'steps': 1063, 'loss/train': 3.3178870677948} -09/20/2021 18:10:22 - INFO - __main__ - Step 17019: {'lr': 0.0001999800688880737, 'samples': 544608, 'steps': 1063, 'loss/train': 3.543440341949463} -09/20/2021 18:10:23 - INFO - __main__ - Step 17020: {'lr': 0.0001999800688880737, 'samples': 544640, 'steps': 1063, 'loss/train': 4.412588596343994} -09/20/2021 18:10:24 - INFO - __main__ - Step 17021: {'lr': 0.0001999800688880737, 'samples': 544672, 'steps': 1063, 'loss/train': 3.31209135055542} -09/20/2021 18:10:25 - INFO - __main__ - Step 17022: {'lr': 0.0001999800688880737, 'samples': 544704, 'steps': 1063, 'loss/train': 3.8392906188964844} -09/20/2021 18:10:25 - INFO - __main__ - Step 17023: {'lr': 0.0001999800688880737, 'samples': 544736, 'steps': 1063, 'loss/train': 3.654419183731079} -09/20/2021 18:10:26 - INFO - __main__ - Step 17024: {'lr': 0.0001999800688880737, 'samples': 544768, 'steps': 1063, 'loss/train': 3.9207422733306885} -09/20/2021 18:10:27 - INFO - __main__ - Step 17025: {'lr': 0.00019997994133354746, 'samples': 544800, 'steps': 1064, 'loss/train': 3.5027883052825928} -09/20/2021 18:10:28 - INFO - __main__ - Step 17026: {'lr': 0.00019997994133354746, 'samples': 544832, 'steps': 1064, 'loss/train': 3.727745771408081} -09/20/2021 18:10:28 - INFO - __main__ - Step 17027: {'lr': 0.00019997994133354746, 'samples': 544864, 'steps': 1064, 'loss/train': 3.2077488899230957} -09/20/2021 18:10:29 - INFO - __main__ - Step 17028: {'lr': 0.00019997994133354746, 'samples': 544896, 'steps': 1064, 'loss/train': 2.8728277683258057} -09/20/2021 18:10:30 - INFO - __main__ - Step 17029: {'lr': 0.00019997994133354746, 'samples': 544928, 'steps': 1064, 'loss/train': 4.028125286102295} -09/20/2021 18:10:31 - INFO - __main__ - Step 17030: {'lr': 0.00019997994133354746, 'samples': 544960, 'steps': 1064, 'loss/train': 3.6383469104766846} -09/20/2021 18:10:31 - INFO - __main__ - Step 17031: {'lr': 0.00019997994133354746, 'samples': 544992, 'steps': 1064, 'loss/train': 3.5072131156921387} -09/20/2021 18:10:32 - INFO - __main__ - Step 17032: {'lr': 0.00019997994133354746, 'samples': 545024, 'steps': 1064, 'loss/train': 3.6979079246520996} -09/20/2021 18:10:34 - INFO - __main__ - Step 17033: {'lr': 0.00019997994133354746, 'samples': 545056, 'steps': 1064, 'loss/train': 3.418806314468384} -09/20/2021 18:10:34 - INFO - __main__ - Step 17034: {'lr': 0.00019997994133354746, 'samples': 545088, 'steps': 1064, 'loss/train': 3.425065040588379} -09/20/2021 18:10:35 - INFO - __main__ - Step 17035: {'lr': 0.00019997994133354746, 'samples': 545120, 'steps': 1064, 'loss/train': 3.304159164428711} -09/20/2021 18:10:36 - INFO - __main__ - Step 17036: {'lr': 0.00019997994133354746, 'samples': 545152, 'steps': 1064, 'loss/train': 2.1664371490478516} -09/20/2021 18:10:37 - INFO - __main__ - Step 17037: {'lr': 0.00019997994133354746, 'samples': 545184, 'steps': 1064, 'loss/train': 3.333399534225464} -09/20/2021 18:10:37 - INFO - __main__ - Step 17038: {'lr': 0.00019997994133354746, 'samples': 545216, 'steps': 1064, 'loss/train': 4.209219455718994} -09/20/2021 18:10:38 - INFO - __main__ - Step 17039: {'lr': 0.00019997994133354746, 'samples': 545248, 'steps': 1064, 'loss/train': 3.4240570068359375} -09/20/2021 18:10:39 - INFO - __main__ - Step 17040: {'lr': 0.00019997994133354746, 'samples': 545280, 'steps': 1064, 'loss/train': 4.085305690765381} -09/20/2021 18:10:40 - INFO - __main__ - Step 17041: {'lr': 0.00019997981337220325, 'samples': 545312, 'steps': 1065, 'loss/train': 4.296023368835449} -09/20/2021 18:10:40 - INFO - __main__ - Step 17042: {'lr': 0.00019997981337220325, 'samples': 545344, 'steps': 1065, 'loss/train': 1.0962077379226685} -09/20/2021 18:10:41 - INFO - __main__ - Step 17043: {'lr': 0.00019997981337220325, 'samples': 545376, 'steps': 1065, 'loss/train': 3.485684871673584} -09/20/2021 18:10:42 - INFO - __main__ - Step 17044: {'lr': 0.00019997981337220325, 'samples': 545408, 'steps': 1065, 'loss/train': 3.7710273265838623} -09/20/2021 18:10:43 - INFO - __main__ - Step 17045: {'lr': 0.00019997981337220325, 'samples': 545440, 'steps': 1065, 'loss/train': 3.390886068344116} -09/20/2021 18:10:43 - INFO - __main__ - Step 17046: {'lr': 0.00019997981337220325, 'samples': 545472, 'steps': 1065, 'loss/train': 4.365361213684082} -09/20/2021 18:10:44 - INFO - __main__ - Step 17047: {'lr': 0.00019997981337220325, 'samples': 545504, 'steps': 1065, 'loss/train': 3.94008207321167} -09/20/2021 18:10:45 - INFO - __main__ - Step 17048: {'lr': 0.00019997981337220325, 'samples': 545536, 'steps': 1065, 'loss/train': 4.37620735168457} -09/20/2021 18:10:46 - INFO - __main__ - Step 17049: {'lr': 0.00019997981337220325, 'samples': 545568, 'steps': 1065, 'loss/train': 3.7043402194976807} -09/20/2021 18:10:46 - INFO - __main__ - Step 17050: {'lr': 0.00019997981337220325, 'samples': 545600, 'steps': 1065, 'loss/train': 3.1791558265686035} -09/20/2021 18:10:47 - INFO - __main__ - Step 17051: {'lr': 0.00019997981337220325, 'samples': 545632, 'steps': 1065, 'loss/train': 0.7819957733154297} -09/20/2021 18:10:48 - INFO - __main__ - Step 17052: {'lr': 0.00019997981337220325, 'samples': 545664, 'steps': 1065, 'loss/train': 0.6468230485916138} -09/20/2021 18:10:49 - INFO - __main__ - Step 17053: {'lr': 0.00019997981337220325, 'samples': 545696, 'steps': 1065, 'loss/train': 1.2623262405395508} -09/20/2021 18:10:49 - INFO - __main__ - Step 17054: {'lr': 0.00019997981337220325, 'samples': 545728, 'steps': 1065, 'loss/train': 3.5067973136901855} -09/20/2021 18:10:50 - INFO - __main__ - Step 17055: {'lr': 0.00019997981337220325, 'samples': 545760, 'steps': 1065, 'loss/train': 3.6998960971832275} -09/20/2021 18:10:51 - INFO - __main__ - Step 17056: {'lr': 0.00019997981337220325, 'samples': 545792, 'steps': 1065, 'loss/train': 4.0744476318359375} -09/20/2021 18:10:52 - INFO - __main__ - Step 17057: {'lr': 0.00019997968500404159, 'samples': 545824, 'steps': 1066, 'loss/train': 3.8427865505218506} -09/20/2021 18:10:53 - INFO - __main__ - Step 17058: {'lr': 0.00019997968500404159, 'samples': 545856, 'steps': 1066, 'loss/train': 3.482158899307251} -09/20/2021 18:10:53 - INFO - __main__ - Step 17059: {'lr': 0.00019997968500404159, 'samples': 545888, 'steps': 1066, 'loss/train': 3.9152748584747314} -09/20/2021 18:10:54 - INFO - __main__ - Step 17060: {'lr': 0.00019997968500404159, 'samples': 545920, 'steps': 1066, 'loss/train': 4.102587699890137} -09/20/2021 18:10:55 - INFO - __main__ - Step 17061: {'lr': 0.00019997968500404159, 'samples': 545952, 'steps': 1066, 'loss/train': 0.5740601420402527} -09/20/2021 18:10:56 - INFO - __main__ - Step 17062: {'lr': 0.00019997968500404159, 'samples': 545984, 'steps': 1066, 'loss/train': 3.4771134853363037} -09/20/2021 18:10:57 - INFO - __main__ - Step 17063: {'lr': 0.00019997968500404159, 'samples': 546016, 'steps': 1066, 'loss/train': 3.3358235359191895} -09/20/2021 18:10:58 - INFO - __main__ - Step 17064: {'lr': 0.00019997968500404159, 'samples': 546048, 'steps': 1066, 'loss/train': 3.825294256210327} -09/20/2021 18:10:58 - INFO - __main__ - Step 17065: {'lr': 0.00019997968500404159, 'samples': 546080, 'steps': 1066, 'loss/train': 2.0221385955810547} -09/20/2021 18:10:59 - INFO - __main__ - Step 17066: {'lr': 0.00019997968500404159, 'samples': 546112, 'steps': 1066, 'loss/train': 1.287052869796753} -09/20/2021 18:11:00 - INFO - __main__ - Step 17067: {'lr': 0.00019997968500404159, 'samples': 546144, 'steps': 1066, 'loss/train': 3.4848344326019287} -09/20/2021 18:11:01 - INFO - __main__ - Step 17068: {'lr': 0.00019997968500404159, 'samples': 546176, 'steps': 1066, 'loss/train': 4.490293979644775} -09/20/2021 18:11:01 - INFO - __main__ - Step 17069: {'lr': 0.00019997968500404159, 'samples': 546208, 'steps': 1066, 'loss/train': 4.2978596687316895} -09/20/2021 18:11:02 - INFO - __main__ - Step 17070: {'lr': 0.00019997968500404159, 'samples': 546240, 'steps': 1066, 'loss/train': 3.2635297775268555} -09/20/2021 18:11:03 - INFO - __main__ - Step 17071: {'lr': 0.00019997968500404159, 'samples': 546272, 'steps': 1066, 'loss/train': 4.308074474334717} -09/20/2021 18:11:04 - INFO - __main__ - Step 17072: {'lr': 0.00019997968500404159, 'samples': 546304, 'steps': 1066, 'loss/train': 4.872340202331543} -09/20/2021 18:11:05 - INFO - __main__ - Step 17073: {'lr': 0.00019997955622906295, 'samples': 546336, 'steps': 1067, 'loss/train': 3.0136592388153076} -09/20/2021 18:11:05 - INFO - __main__ - Step 17074: {'lr': 0.00019997955622906295, 'samples': 546368, 'steps': 1067, 'loss/train': 2.984980583190918} -09/20/2021 18:11:06 - INFO - __main__ - Step 17075: {'lr': 0.00019997955622906295, 'samples': 546400, 'steps': 1067, 'loss/train': 3.6877870559692383} -09/20/2021 18:11:07 - INFO - __main__ - Step 17076: {'lr': 0.00019997955622906295, 'samples': 546432, 'steps': 1067, 'loss/train': 1.709344506263733} -09/20/2021 18:11:08 - INFO - __main__ - Step 17077: {'lr': 0.00019997955622906295, 'samples': 546464, 'steps': 1067, 'loss/train': 3.053096055984497} -09/20/2021 18:11:08 - INFO - __main__ - Step 17078: {'lr': 0.00019997955622906295, 'samples': 546496, 'steps': 1067, 'loss/train': 3.5002572536468506} -09/20/2021 18:11:09 - INFO - __main__ - Step 17079: {'lr': 0.00019997955622906295, 'samples': 546528, 'steps': 1067, 'loss/train': 4.124425888061523} -09/20/2021 18:11:10 - INFO - __main__ - Step 17080: {'lr': 0.00019997955622906295, 'samples': 546560, 'steps': 1067, 'loss/train': 3.776350259780884} -09/20/2021 18:11:11 - INFO - __main__ - Step 17081: {'lr': 0.00019997955622906295, 'samples': 546592, 'steps': 1067, 'loss/train': 3.261061191558838} -09/20/2021 18:11:11 - INFO - __main__ - Step 17082: {'lr': 0.00019997955622906295, 'samples': 546624, 'steps': 1067, 'loss/train': 2.023804187774658} -09/20/2021 18:11:12 - INFO - __main__ - Step 17083: {'lr': 0.00019997955622906295, 'samples': 546656, 'steps': 1067, 'loss/train': 4.976048469543457} -09/20/2021 18:11:13 - INFO - __main__ - Step 17084: {'lr': 0.00019997955622906295, 'samples': 546688, 'steps': 1067, 'loss/train': 4.677020072937012} -09/20/2021 18:11:14 - INFO - __main__ - Step 17085: {'lr': 0.00019997955622906295, 'samples': 546720, 'steps': 1067, 'loss/train': 4.4656877517700195} -09/20/2021 18:11:14 - INFO - __main__ - Step 17086: {'lr': 0.00019997955622906295, 'samples': 546752, 'steps': 1067, 'loss/train': 3.9679081439971924} -09/20/2021 18:11:15 - INFO - __main__ - Step 17087: {'lr': 0.00019997955622906295, 'samples': 546784, 'steps': 1067, 'loss/train': 4.687368392944336} -09/20/2021 18:11:16 - INFO - __main__ - Step 17088: {'lr': 0.00019997955622906295, 'samples': 546816, 'steps': 1067, 'loss/train': 4.792401313781738} -09/20/2021 18:11:17 - INFO - __main__ - Step 17089: {'lr': 0.00019997942704726789, 'samples': 546848, 'steps': 1068, 'loss/train': 3.74300217628479} -09/20/2021 18:11:17 - INFO - __main__ - Step 17090: {'lr': 0.00019997942704726789, 'samples': 546880, 'steps': 1068, 'loss/train': 4.557161808013916} -09/20/2021 18:11:18 - INFO - __main__ - Step 17091: {'lr': 0.00019997942704726789, 'samples': 546912, 'steps': 1068, 'loss/train': 2.936548948287964} -09/20/2021 18:11:19 - INFO - __main__ - Step 17092: {'lr': 0.00019997942704726789, 'samples': 546944, 'steps': 1068, 'loss/train': 3.4190213680267334} -09/20/2021 18:11:20 - INFO - __main__ - Step 17093: {'lr': 0.00019997942704726789, 'samples': 546976, 'steps': 1068, 'loss/train': 3.705875873565674} -09/20/2021 18:11:21 - INFO - __main__ - Step 17094: {'lr': 0.00019997942704726789, 'samples': 547008, 'steps': 1068, 'loss/train': 4.104268550872803} -09/20/2021 18:11:22 - INFO - __main__ - Step 17095: {'lr': 0.00019997942704726789, 'samples': 547040, 'steps': 1068, 'loss/train': 4.378350257873535} -09/20/2021 18:11:23 - INFO - __main__ - Step 17096: {'lr': 0.00019997942704726789, 'samples': 547072, 'steps': 1068, 'loss/train': 2.4405367374420166} -09/20/2021 18:11:23 - INFO - __main__ - Step 17097: {'lr': 0.00019997942704726789, 'samples': 547104, 'steps': 1068, 'loss/train': 4.392155647277832} -09/20/2021 18:11:24 - INFO - __main__ - Step 17098: {'lr': 0.00019997942704726789, 'samples': 547136, 'steps': 1068, 'loss/train': 3.9798343181610107} -09/20/2021 18:11:25 - INFO - __main__ - Step 17099: {'lr': 0.00019997942704726789, 'samples': 547168, 'steps': 1068, 'loss/train': 2.606336832046509} -09/20/2021 18:11:26 - INFO - __main__ - Step 17100: {'lr': 0.00019997942704726789, 'samples': 547200, 'steps': 1068, 'loss/train': 2.5945160388946533} -09/20/2021 18:11:26 - INFO - __main__ - Step 17101: {'lr': 0.00019997942704726789, 'samples': 547232, 'steps': 1068, 'loss/train': 3.4416558742523193} -09/20/2021 18:11:27 - INFO - __main__ - Step 17102: {'lr': 0.00019997942704726789, 'samples': 547264, 'steps': 1068, 'loss/train': 2.961930990219116} -09/20/2021 18:11:28 - INFO - __main__ - Step 17103: {'lr': 0.00019997942704726789, 'samples': 547296, 'steps': 1068, 'loss/train': 2.467632532119751} -09/20/2021 18:11:29 - INFO - __main__ - Step 17104: {'lr': 0.00019997942704726789, 'samples': 547328, 'steps': 1068, 'loss/train': 2.750871419906616} -09/20/2021 18:11:29 - INFO - __main__ - Step 17105: {'lr': 0.0001999792974586569, 'samples': 547360, 'steps': 1069, 'loss/train': 3.3246254920959473} -09/20/2021 18:11:30 - INFO - __main__ - Step 17106: {'lr': 0.0001999792974586569, 'samples': 547392, 'steps': 1069, 'loss/train': 3.3619961738586426} -09/20/2021 18:11:31 - INFO - __main__ - Step 17107: {'lr': 0.0001999792974586569, 'samples': 547424, 'steps': 1069, 'loss/train': 3.46787691116333} -09/20/2021 18:11:32 - INFO - __main__ - Step 17108: {'lr': 0.0001999792974586569, 'samples': 547456, 'steps': 1069, 'loss/train': 3.2269484996795654} -09/20/2021 18:11:32 - INFO - __main__ - Step 17109: {'lr': 0.0001999792974586569, 'samples': 547488, 'steps': 1069, 'loss/train': 4.127511024475098} -09/20/2021 18:11:33 - INFO - __main__ - Step 17110: {'lr': 0.0001999792974586569, 'samples': 547520, 'steps': 1069, 'loss/train': 4.170283317565918} -09/20/2021 18:11:34 - INFO - __main__ - Step 17111: {'lr': 0.0001999792974586569, 'samples': 547552, 'steps': 1069, 'loss/train': 3.4197685718536377} -09/20/2021 18:11:35 - INFO - __main__ - Step 17112: {'lr': 0.0001999792974586569, 'samples': 547584, 'steps': 1069, 'loss/train': 1.3165533542633057} -09/20/2021 18:11:35 - INFO - __main__ - Step 17113: {'lr': 0.0001999792974586569, 'samples': 547616, 'steps': 1069, 'loss/train': 3.381608724594116} -09/20/2021 18:11:36 - INFO - __main__ - Step 17114: {'lr': 0.0001999792974586569, 'samples': 547648, 'steps': 1069, 'loss/train': 3.430040121078491} -09/20/2021 18:11:37 - INFO - __main__ - Step 17115: {'lr': 0.0001999792974586569, 'samples': 547680, 'steps': 1069, 'loss/train': 4.076831340789795} -09/20/2021 18:11:38 - INFO - __main__ - Step 17116: {'lr': 0.0001999792974586569, 'samples': 547712, 'steps': 1069, 'loss/train': 2.2818329334259033} -09/20/2021 18:11:38 - INFO - __main__ - Step 17117: {'lr': 0.0001999792974586569, 'samples': 547744, 'steps': 1069, 'loss/train': 3.2548093795776367} -09/20/2021 18:11:39 - INFO - __main__ - Step 17118: {'lr': 0.0001999792974586569, 'samples': 547776, 'steps': 1069, 'loss/train': 4.154721260070801} -09/20/2021 18:11:40 - INFO - __main__ - Step 17119: {'lr': 0.0001999792974586569, 'samples': 547808, 'steps': 1069, 'loss/train': 3.5303776264190674} -09/20/2021 18:11:41 - INFO - __main__ - Step 17120: {'lr': 0.0001999792974586569, 'samples': 547840, 'steps': 1069, 'loss/train': 3.778474807739258} -09/20/2021 18:11:42 - INFO - __main__ - Step 17121: {'lr': 0.00019997916746323057, 'samples': 547872, 'steps': 1070, 'loss/train': 2.7792882919311523} -09/20/2021 18:11:42 - INFO - __main__ - Step 17122: {'lr': 0.00019997916746323057, 'samples': 547904, 'steps': 1070, 'loss/train': 1.5557265281677246} -09/20/2021 18:11:43 - INFO - __main__ - Step 17123: {'lr': 0.00019997916746323057, 'samples': 547936, 'steps': 1070, 'loss/train': 3.0957095623016357} -09/20/2021 18:11:44 - INFO - __main__ - Step 17124: {'lr': 0.00019997916746323057, 'samples': 547968, 'steps': 1070, 'loss/train': 4.117905139923096} -09/20/2021 18:11:45 - INFO - __main__ - Step 17125: {'lr': 0.00019997916746323057, 'samples': 548000, 'steps': 1070, 'loss/train': 3.530704975128174} -09/20/2021 18:11:46 - INFO - __main__ - Step 17126: {'lr': 0.00019997916746323057, 'samples': 548032, 'steps': 1070, 'loss/train': 4.6350998878479} -09/20/2021 18:11:47 - INFO - __main__ - Step 17127: {'lr': 0.00019997916746323057, 'samples': 548064, 'steps': 1070, 'loss/train': 3.100841999053955} -09/20/2021 18:11:48 - INFO - __main__ - Step 17128: {'lr': 0.00019997916746323057, 'samples': 548096, 'steps': 1070, 'loss/train': 1.1815621852874756} -09/20/2021 18:11:48 - INFO - __main__ - Step 17129: {'lr': 0.00019997916746323057, 'samples': 548128, 'steps': 1070, 'loss/train': 3.9023385047912598} -09/20/2021 18:11:49 - INFO - __main__ - Step 17130: {'lr': 0.00019997916746323057, 'samples': 548160, 'steps': 1070, 'loss/train': 3.632877826690674} -09/20/2021 18:11:50 - INFO - __main__ - Step 17131: {'lr': 0.00019997916746323057, 'samples': 548192, 'steps': 1070, 'loss/train': 4.473901271820068} -09/20/2021 18:11:51 - INFO - __main__ - Step 17132: {'lr': 0.00019997916746323057, 'samples': 548224, 'steps': 1070, 'loss/train': 3.4901270866394043} -09/20/2021 18:11:51 - INFO - __main__ - Step 17133: {'lr': 0.00019997916746323057, 'samples': 548256, 'steps': 1070, 'loss/train': 2.0593624114990234} -09/20/2021 18:11:52 - INFO - __main__ - Step 17134: {'lr': 0.00019997916746323057, 'samples': 548288, 'steps': 1070, 'loss/train': 2.0840511322021484} -09/20/2021 18:11:53 - INFO - __main__ - Step 17135: {'lr': 0.00019997916746323057, 'samples': 548320, 'steps': 1070, 'loss/train': 4.7242512702941895} -09/20/2021 18:11:54 - INFO - __main__ - Step 17136: {'lr': 0.00019997916746323057, 'samples': 548352, 'steps': 1070, 'loss/train': 3.8145205974578857} -09/20/2021 18:11:55 - INFO - __main__ - Step 17137: {'lr': 0.00019997903706098943, 'samples': 548384, 'steps': 1071, 'loss/train': 4.209229946136475} -09/20/2021 18:11:55 - INFO - __main__ - Step 17138: {'lr': 0.00019997903706098943, 'samples': 548416, 'steps': 1071, 'loss/train': 3.2134695053100586} -09/20/2021 18:11:56 - INFO - __main__ - Step 17139: {'lr': 0.00019997903706098943, 'samples': 548448, 'steps': 1071, 'loss/train': 1.271873116493225} -09/20/2021 18:11:57 - INFO - __main__ - Step 17140: {'lr': 0.00019997903706098943, 'samples': 548480, 'steps': 1071, 'loss/train': 2.7998318672180176} -09/20/2021 18:11:58 - INFO - __main__ - Step 17141: {'lr': 0.00019997903706098943, 'samples': 548512, 'steps': 1071, 'loss/train': 3.9835879802703857} -09/20/2021 18:11:58 - INFO - __main__ - Step 17142: {'lr': 0.00019997903706098943, 'samples': 548544, 'steps': 1071, 'loss/train': 3.0611793994903564} -09/20/2021 18:11:59 - INFO - __main__ - Step 17143: {'lr': 0.00019997903706098943, 'samples': 548576, 'steps': 1071, 'loss/train': 3.2432498931884766} -09/20/2021 18:12:00 - INFO - __main__ - Step 17144: {'lr': 0.00019997903706098943, 'samples': 548608, 'steps': 1071, 'loss/train': 3.1225788593292236} -09/20/2021 18:12:01 - INFO - __main__ - Step 17145: {'lr': 0.00019997903706098943, 'samples': 548640, 'steps': 1071, 'loss/train': 3.5013809204101562} -09/20/2021 18:12:01 - INFO - __main__ - Step 17146: {'lr': 0.00019997903706098943, 'samples': 548672, 'steps': 1071, 'loss/train': 4.256361961364746} -09/20/2021 18:12:02 - INFO - __main__ - Step 17147: {'lr': 0.00019997903706098943, 'samples': 548704, 'steps': 1071, 'loss/train': 3.2435214519500732} -09/20/2021 18:12:03 - INFO - __main__ - Step 17148: {'lr': 0.00019997903706098943, 'samples': 548736, 'steps': 1071, 'loss/train': 3.305837631225586} -09/20/2021 18:12:04 - INFO - __main__ - Step 17149: {'lr': 0.00019997903706098943, 'samples': 548768, 'steps': 1071, 'loss/train': 3.8071131706237793} -09/20/2021 18:12:04 - INFO - __main__ - Step 17150: {'lr': 0.00019997903706098943, 'samples': 548800, 'steps': 1071, 'loss/train': 3.4972875118255615} -09/20/2021 18:12:05 - INFO - __main__ - Step 17151: {'lr': 0.00019997903706098943, 'samples': 548832, 'steps': 1071, 'loss/train': 3.8648438453674316} -09/20/2021 18:12:06 - INFO - __main__ - Step 17152: {'lr': 0.00019997903706098943, 'samples': 548864, 'steps': 1071, 'loss/train': 3.870227336883545} -09/20/2021 18:12:07 - INFO - __main__ - Step 17153: {'lr': 0.00019997890625193392, 'samples': 548896, 'steps': 1072, 'loss/train': 3.6408164501190186} -09/20/2021 18:12:07 - INFO - __main__ - Step 17154: {'lr': 0.00019997890625193392, 'samples': 548928, 'steps': 1072, 'loss/train': 3.7811288833618164} -09/20/2021 18:12:08 - INFO - __main__ - Step 17155: {'lr': 0.00019997890625193392, 'samples': 548960, 'steps': 1072, 'loss/train': 3.6605353355407715} -09/20/2021 18:12:09 - INFO - __main__ - Step 17156: {'lr': 0.00019997890625193392, 'samples': 548992, 'steps': 1072, 'loss/train': 3.749324083328247} -09/20/2021 18:12:10 - INFO - __main__ - Step 17157: {'lr': 0.00019997890625193392, 'samples': 549024, 'steps': 1072, 'loss/train': 3.7356667518615723} -09/20/2021 18:12:11 - INFO - __main__ - Step 17158: {'lr': 0.00019997890625193392, 'samples': 549056, 'steps': 1072, 'loss/train': 4.370121955871582} -09/20/2021 18:12:12 - INFO - __main__ - Step 17159: {'lr': 0.00019997890625193392, 'samples': 549088, 'steps': 1072, 'loss/train': 4.658548831939697} -09/20/2021 18:12:13 - INFO - __main__ - Step 17160: {'lr': 0.00019997890625193392, 'samples': 549120, 'steps': 1072, 'loss/train': 2.640592575073242} -09/20/2021 18:12:14 - INFO - __main__ - Step 17161: {'lr': 0.00019997890625193392, 'samples': 549152, 'steps': 1072, 'loss/train': 3.2599239349365234} -09/20/2021 18:12:14 - INFO - __main__ - Step 17162: {'lr': 0.00019997890625193392, 'samples': 549184, 'steps': 1072, 'loss/train': 3.9821524620056152} -09/20/2021 18:12:15 - INFO - __main__ - Step 17163: {'lr': 0.00019997890625193392, 'samples': 549216, 'steps': 1072, 'loss/train': 4.2325849533081055} -09/20/2021 18:12:16 - INFO - __main__ - Step 17164: {'lr': 0.00019997890625193392, 'samples': 549248, 'steps': 1072, 'loss/train': 3.761512517929077} -09/20/2021 18:12:17 - INFO - __main__ - Step 17165: {'lr': 0.00019997890625193392, 'samples': 549280, 'steps': 1072, 'loss/train': 0.5541580319404602} -09/20/2021 18:12:17 - INFO - __main__ - Step 17166: {'lr': 0.00019997890625193392, 'samples': 549312, 'steps': 1072, 'loss/train': 3.619112253189087} -09/20/2021 18:12:18 - INFO - __main__ - Step 17167: {'lr': 0.00019997890625193392, 'samples': 549344, 'steps': 1072, 'loss/train': 3.7980809211730957} -09/20/2021 18:12:19 - INFO - __main__ - Step 17168: {'lr': 0.00019997890625193392, 'samples': 549376, 'steps': 1072, 'loss/train': 3.2897024154663086} -09/20/2021 18:12:20 - INFO - __main__ - Step 17169: {'lr': 0.00019997877503606467, 'samples': 549408, 'steps': 1073, 'loss/train': 0.5069391131401062} -09/20/2021 18:12:20 - INFO - __main__ - Step 17170: {'lr': 0.00019997877503606467, 'samples': 549440, 'steps': 1073, 'loss/train': 3.464791774749756} -09/20/2021 18:12:21 - INFO - __main__ - Step 17171: {'lr': 0.00019997877503606467, 'samples': 549472, 'steps': 1073, 'loss/train': 3.6760740280151367} -09/20/2021 18:12:22 - INFO - __main__ - Step 17172: {'lr': 0.00019997877503606467, 'samples': 549504, 'steps': 1073, 'loss/train': 3.2919037342071533} -09/20/2021 18:12:23 - INFO - __main__ - Step 17173: {'lr': 0.00019997877503606467, 'samples': 549536, 'steps': 1073, 'loss/train': 3.3008458614349365} -09/20/2021 18:12:23 - INFO - __main__ - Step 17174: {'lr': 0.00019997877503606467, 'samples': 549568, 'steps': 1073, 'loss/train': 3.9827773571014404} -09/20/2021 18:12:24 - INFO - __main__ - Step 17175: {'lr': 0.00019997877503606467, 'samples': 549600, 'steps': 1073, 'loss/train': 3.90019154548645} -09/20/2021 18:12:25 - INFO - __main__ - Step 17176: {'lr': 0.00019997877503606467, 'samples': 549632, 'steps': 1073, 'loss/train': 4.102543354034424} -09/20/2021 18:12:26 - INFO - __main__ - Step 17177: {'lr': 0.00019997877503606467, 'samples': 549664, 'steps': 1073, 'loss/train': 3.4354238510131836} -09/20/2021 18:12:26 - INFO - __main__ - Step 17178: {'lr': 0.00019997877503606467, 'samples': 549696, 'steps': 1073, 'loss/train': 3.8169350624084473} -09/20/2021 18:12:27 - INFO - __main__ - Step 17179: {'lr': 0.00019997877503606467, 'samples': 549728, 'steps': 1073, 'loss/train': 4.200454235076904} -09/20/2021 18:12:28 - INFO - __main__ - Step 17180: {'lr': 0.00019997877503606467, 'samples': 549760, 'steps': 1073, 'loss/train': 2.3291375637054443} -09/20/2021 18:12:29 - INFO - __main__ - Step 17181: {'lr': 0.00019997877503606467, 'samples': 549792, 'steps': 1073, 'loss/train': 2.906252861022949} -09/20/2021 18:12:29 - INFO - __main__ - Step 17182: {'lr': 0.00019997877503606467, 'samples': 549824, 'steps': 1073, 'loss/train': 3.418529987335205} -09/20/2021 18:12:30 - INFO - __main__ - Step 17183: {'lr': 0.00019997877503606467, 'samples': 549856, 'steps': 1073, 'loss/train': 3.3055672645568848} -09/20/2021 18:12:31 - INFO - __main__ - Step 17184: {'lr': 0.00019997877503606467, 'samples': 549888, 'steps': 1073, 'loss/train': 3.5368473529815674} -09/20/2021 18:12:32 - INFO - __main__ - Step 17185: {'lr': 0.00019997864341338213, 'samples': 549920, 'steps': 1074, 'loss/train': 3.6695070266723633} -09/20/2021 18:12:33 - INFO - __main__ - Step 17186: {'lr': 0.00019997864341338213, 'samples': 549952, 'steps': 1074, 'loss/train': 3.3379273414611816} -09/20/2021 18:12:33 - INFO - __main__ - Step 17187: {'lr': 0.00019997864341338213, 'samples': 549984, 'steps': 1074, 'loss/train': 3.3063251972198486} -09/20/2021 18:12:34 - INFO - __main__ - Step 17188: {'lr': 0.00019997864341338213, 'samples': 550016, 'steps': 1074, 'loss/train': 4.176483154296875} -09/20/2021 18:12:35 - INFO - __main__ - Step 17189: {'lr': 0.00019997864341338213, 'samples': 550048, 'steps': 1074, 'loss/train': 0.4653934836387634} -09/20/2021 18:12:36 - INFO - __main__ - Step 17190: {'lr': 0.00019997864341338213, 'samples': 550080, 'steps': 1074, 'loss/train': 3.726519823074341} -09/20/2021 18:12:37 - INFO - __main__ - Step 17191: {'lr': 0.00019997864341338213, 'samples': 550112, 'steps': 1074, 'loss/train': 5.515739440917969} -09/20/2021 18:12:38 - INFO - __main__ - Step 17192: {'lr': 0.00019997864341338213, 'samples': 550144, 'steps': 1074, 'loss/train': 3.4703304767608643} -09/20/2021 18:12:38 - INFO - __main__ - Step 17193: {'lr': 0.00019997864341338213, 'samples': 550176, 'steps': 1074, 'loss/train': 3.6160528659820557} -09/20/2021 18:12:39 - INFO - __main__ - Step 17194: {'lr': 0.00019997864341338213, 'samples': 550208, 'steps': 1074, 'loss/train': 3.363262414932251} -09/20/2021 18:12:40 - INFO - __main__ - Step 17195: {'lr': 0.00019997864341338213, 'samples': 550240, 'steps': 1074, 'loss/train': 1.843247890472412} -09/20/2021 18:12:41 - INFO - __main__ - Step 17196: {'lr': 0.00019997864341338213, 'samples': 550272, 'steps': 1074, 'loss/train': 3.5838680267333984} -09/20/2021 18:12:41 - INFO - __main__ - Step 17197: {'lr': 0.00019997864341338213, 'samples': 550304, 'steps': 1074, 'loss/train': 4.225194931030273} -09/20/2021 18:12:42 - INFO - __main__ - Step 17198: {'lr': 0.00019997864341338213, 'samples': 550336, 'steps': 1074, 'loss/train': 3.823025703430176} -09/20/2021 18:12:43 - INFO - __main__ - Step 17199: {'lr': 0.00019997864341338213, 'samples': 550368, 'steps': 1074, 'loss/train': 3.9434635639190674} -09/20/2021 18:12:44 - INFO - __main__ - Step 17200: {'lr': 0.00019997864341338213, 'samples': 550400, 'steps': 1074, 'loss/train': 4.22455358505249} -09/20/2021 18:12:44 - INFO - __main__ - Step 17201: {'lr': 0.0001999785113838869, 'samples': 550432, 'steps': 1075, 'loss/train': 3.1824915409088135} -09/20/2021 18:12:45 - INFO - __main__ - Step 17202: {'lr': 0.0001999785113838869, 'samples': 550464, 'steps': 1075, 'loss/train': 3.843271255493164} -09/20/2021 18:12:46 - INFO - __main__ - Step 17203: {'lr': 0.0001999785113838869, 'samples': 550496, 'steps': 1075, 'loss/train': 2.7203941345214844} -09/20/2021 18:12:47 - INFO - __main__ - Step 17204: {'lr': 0.0001999785113838869, 'samples': 550528, 'steps': 1075, 'loss/train': 3.7674062252044678} -09/20/2021 18:12:47 - INFO - __main__ - Step 17205: {'lr': 0.0001999785113838869, 'samples': 550560, 'steps': 1075, 'loss/train': 4.818446636199951} -09/20/2021 18:12:48 - INFO - __main__ - Step 17206: {'lr': 0.0001999785113838869, 'samples': 550592, 'steps': 1075, 'loss/train': 3.7430925369262695} -09/20/2021 18:12:49 - INFO - __main__ - Step 17207: {'lr': 0.0001999785113838869, 'samples': 550624, 'steps': 1075, 'loss/train': 2.687547445297241} -09/20/2021 18:12:50 - INFO - __main__ - Step 17208: {'lr': 0.0001999785113838869, 'samples': 550656, 'steps': 1075, 'loss/train': 3.1781558990478516} -09/20/2021 18:12:50 - INFO - __main__ - Step 17209: {'lr': 0.0001999785113838869, 'samples': 550688, 'steps': 1075, 'loss/train': 3.903934955596924} -09/20/2021 18:12:51 - INFO - __main__ - Step 17210: {'lr': 0.0001999785113838869, 'samples': 550720, 'steps': 1075, 'loss/train': 3.171560049057007} -09/20/2021 18:12:52 - INFO - __main__ - Step 17211: {'lr': 0.0001999785113838869, 'samples': 550752, 'steps': 1075, 'loss/train': 3.284358024597168} -09/20/2021 18:12:53 - INFO - __main__ - Step 17212: {'lr': 0.0001999785113838869, 'samples': 550784, 'steps': 1075, 'loss/train': 3.97530198097229} -09/20/2021 18:12:53 - INFO - __main__ - Step 17213: {'lr': 0.0001999785113838869, 'samples': 550816, 'steps': 1075, 'loss/train': 4.449843883514404} -09/20/2021 18:12:54 - INFO - __main__ - Step 17214: {'lr': 0.0001999785113838869, 'samples': 550848, 'steps': 1075, 'loss/train': 3.375138282775879} -09/20/2021 18:12:55 - INFO - __main__ - Step 17215: {'lr': 0.0001999785113838869, 'samples': 550880, 'steps': 1075, 'loss/train': 3.4917430877685547} -09/20/2021 18:12:56 - INFO - __main__ - Step 17216: {'lr': 0.0001999785113838869, 'samples': 550912, 'steps': 1075, 'loss/train': 4.049396991729736} -09/20/2021 18:12:57 - INFO - __main__ - Step 17217: {'lr': 0.0001999783789475795, 'samples': 550944, 'steps': 1076, 'loss/train': 3.0158705711364746} -09/20/2021 18:12:57 - INFO - __main__ - Step 17218: {'lr': 0.0001999783789475795, 'samples': 550976, 'steps': 1076, 'loss/train': 3.4819493293762207} -09/20/2021 18:12:58 - INFO - __main__ - Step 17219: {'lr': 0.0001999783789475795, 'samples': 551008, 'steps': 1076, 'loss/train': 4.271842002868652} -09/20/2021 18:12:59 - INFO - __main__ - Step 17220: {'lr': 0.0001999783789475795, 'samples': 551040, 'steps': 1076, 'loss/train': 3.599203586578369} -09/20/2021 18:13:00 - INFO - __main__ - Step 17221: {'lr': 0.0001999783789475795, 'samples': 551072, 'steps': 1076, 'loss/train': 2.274944305419922} -09/20/2021 18:13:01 - INFO - __main__ - Step 17222: {'lr': 0.0001999783789475795, 'samples': 551104, 'steps': 1076, 'loss/train': 4.115616798400879} -09/20/2021 18:13:02 - INFO - __main__ - Step 17223: {'lr': 0.0001999783789475795, 'samples': 551136, 'steps': 1076, 'loss/train': 3.4487392902374268} -09/20/2021 18:13:02 - INFO - __main__ - Step 17224: {'lr': 0.0001999783789475795, 'samples': 551168, 'steps': 1076, 'loss/train': 4.241994857788086} -09/20/2021 18:13:03 - INFO - __main__ - Step 17225: {'lr': 0.0001999783789475795, 'samples': 551200, 'steps': 1076, 'loss/train': 3.5523595809936523} -09/20/2021 18:13:04 - INFO - __main__ - Step 17226: {'lr': 0.0001999783789475795, 'samples': 551232, 'steps': 1076, 'loss/train': 3.510739326477051} -09/20/2021 18:13:05 - INFO - __main__ - Step 17227: {'lr': 0.0001999783789475795, 'samples': 551264, 'steps': 1076, 'loss/train': 4.792020320892334} -09/20/2021 18:13:05 - INFO - __main__ - Step 17228: {'lr': 0.0001999783789475795, 'samples': 551296, 'steps': 1076, 'loss/train': 3.109077215194702} -09/20/2021 18:13:06 - INFO - __main__ - Step 17229: {'lr': 0.0001999783789475795, 'samples': 551328, 'steps': 1076, 'loss/train': 4.047001838684082} -09/20/2021 18:13:07 - INFO - __main__ - Step 17230: {'lr': 0.0001999783789475795, 'samples': 551360, 'steps': 1076, 'loss/train': 3.9986588954925537} -09/20/2021 18:13:08 - INFO - __main__ - Step 17231: {'lr': 0.0001999783789475795, 'samples': 551392, 'steps': 1076, 'loss/train': 3.553767204284668} -09/20/2021 18:13:08 - INFO - __main__ - Step 17232: {'lr': 0.0001999783789475795, 'samples': 551424, 'steps': 1076, 'loss/train': 3.4775052070617676} -09/20/2021 18:13:09 - INFO - __main__ - Step 17233: {'lr': 0.00019997824610446045, 'samples': 551456, 'steps': 1077, 'loss/train': 3.115368366241455} -09/20/2021 18:13:10 - INFO - __main__ - Step 17234: {'lr': 0.00019997824610446045, 'samples': 551488, 'steps': 1077, 'loss/train': 6.045587062835693} -09/20/2021 18:13:11 - INFO - __main__ - Step 17235: {'lr': 0.00019997824610446045, 'samples': 551520, 'steps': 1077, 'loss/train': 3.4542815685272217} -09/20/2021 18:13:11 - INFO - __main__ - Step 17236: {'lr': 0.00019997824610446045, 'samples': 551552, 'steps': 1077, 'loss/train': 4.014052867889404} -09/20/2021 18:13:12 - INFO - __main__ - Step 17237: {'lr': 0.00019997824610446045, 'samples': 551584, 'steps': 1077, 'loss/train': 1.2119519710540771} -09/20/2021 18:13:13 - INFO - __main__ - Step 17238: {'lr': 0.00019997824610446045, 'samples': 551616, 'steps': 1077, 'loss/train': 3.013481616973877} -09/20/2021 18:13:14 - INFO - __main__ - Step 17239: {'lr': 0.00019997824610446045, 'samples': 551648, 'steps': 1077, 'loss/train': 3.383739471435547} -09/20/2021 18:13:14 - INFO - __main__ - Step 17240: {'lr': 0.00019997824610446045, 'samples': 551680, 'steps': 1077, 'loss/train': 3.7874157428741455} -09/20/2021 18:13:15 - INFO - __main__ - Step 17241: {'lr': 0.00019997824610446045, 'samples': 551712, 'steps': 1077, 'loss/train': 2.9616880416870117} -09/20/2021 18:13:16 - INFO - __main__ - Step 17242: {'lr': 0.00019997824610446045, 'samples': 551744, 'steps': 1077, 'loss/train': 3.7374215126037598} -09/20/2021 18:13:17 - INFO - __main__ - Step 17243: {'lr': 0.00019997824610446045, 'samples': 551776, 'steps': 1077, 'loss/train': 3.300936222076416} -09/20/2021 18:13:17 - INFO - __main__ - Step 17244: {'lr': 0.00019997824610446045, 'samples': 551808, 'steps': 1077, 'loss/train': 3.6235036849975586} -09/20/2021 18:13:18 - INFO - __main__ - Step 17245: {'lr': 0.00019997824610446045, 'samples': 551840, 'steps': 1077, 'loss/train': 3.4168245792388916} -09/20/2021 18:13:19 - INFO - __main__ - Step 17246: {'lr': 0.00019997824610446045, 'samples': 551872, 'steps': 1077, 'loss/train': 3.857501983642578} -09/20/2021 18:13:20 - INFO - __main__ - Step 17247: {'lr': 0.00019997824610446045, 'samples': 551904, 'steps': 1077, 'loss/train': 3.729872941970825} -09/20/2021 18:13:20 - INFO - __main__ - Step 17248: {'lr': 0.00019997824610446045, 'samples': 551936, 'steps': 1077, 'loss/train': 3.1500911712646484} -09/20/2021 18:13:21 - INFO - __main__ - Step 17249: {'lr': 0.0001999781128545303, 'samples': 551968, 'steps': 1078, 'loss/train': 3.0575003623962402} -09/20/2021 18:13:22 - INFO - __main__ - Step 17250: {'lr': 0.0001999781128545303, 'samples': 552000, 'steps': 1078, 'loss/train': 3.354943037033081} -09/20/2021 18:13:23 - INFO - __main__ - Step 17251: {'lr': 0.0001999781128545303, 'samples': 552032, 'steps': 1078, 'loss/train': 3.4807515144348145} -09/20/2021 18:13:24 - INFO - __main__ - Step 17252: {'lr': 0.0001999781128545303, 'samples': 552064, 'steps': 1078, 'loss/train': 1.6302075386047363} -09/20/2021 18:13:25 - INFO - __main__ - Step 17253: {'lr': 0.0001999781128545303, 'samples': 552096, 'steps': 1078, 'loss/train': 3.372840404510498} -09/20/2021 18:13:26 - INFO - __main__ - Step 17254: {'lr': 0.0001999781128545303, 'samples': 552128, 'steps': 1078, 'loss/train': 3.2832696437835693} -09/20/2021 18:13:26 - INFO - __main__ - Step 17255: {'lr': 0.0001999781128545303, 'samples': 552160, 'steps': 1078, 'loss/train': 1.7562037706375122} -09/20/2021 18:13:27 - INFO - __main__ - Step 17256: {'lr': 0.0001999781128545303, 'samples': 552192, 'steps': 1078, 'loss/train': 2.065349578857422} -09/20/2021 18:13:28 - INFO - __main__ - Step 17257: {'lr': 0.0001999781128545303, 'samples': 552224, 'steps': 1078, 'loss/train': 2.4661197662353516} -09/20/2021 18:13:29 - INFO - __main__ - Step 17258: {'lr': 0.0001999781128545303, 'samples': 552256, 'steps': 1078, 'loss/train': 1.22596275806427} -09/20/2021 18:13:29 - INFO - __main__ - Step 17259: {'lr': 0.0001999781128545303, 'samples': 552288, 'steps': 1078, 'loss/train': 4.157184600830078} -09/20/2021 18:13:30 - INFO - __main__ - Step 17260: {'lr': 0.0001999781128545303, 'samples': 552320, 'steps': 1078, 'loss/train': 3.6175835132598877} -09/20/2021 18:13:31 - INFO - __main__ - Step 17261: {'lr': 0.0001999781128545303, 'samples': 552352, 'steps': 1078, 'loss/train': 4.193106651306152} -09/20/2021 18:13:32 - INFO - __main__ - Step 17262: {'lr': 0.0001999781128545303, 'samples': 552384, 'steps': 1078, 'loss/train': 3.2066352367401123} -09/20/2021 18:13:32 - INFO - __main__ - Step 17263: {'lr': 0.0001999781128545303, 'samples': 552416, 'steps': 1078, 'loss/train': 4.116421222686768} -09/20/2021 18:13:33 - INFO - __main__ - Step 17264: {'lr': 0.0001999781128545303, 'samples': 552448, 'steps': 1078, 'loss/train': 3.213528871536255} -09/20/2021 18:13:34 - INFO - __main__ - Step 17265: {'lr': 0.0001999779791977896, 'samples': 552480, 'steps': 1079, 'loss/train': 3.5437238216400146} -09/20/2021 18:13:35 - INFO - __main__ - Step 17266: {'lr': 0.0001999779791977896, 'samples': 552512, 'steps': 1079, 'loss/train': 3.000222682952881} -09/20/2021 18:13:36 - INFO - __main__ - Step 17267: {'lr': 0.0001999779791977896, 'samples': 552544, 'steps': 1079, 'loss/train': 3.580598831176758} -09/20/2021 18:13:36 - INFO - __main__ - Step 17268: {'lr': 0.0001999779791977896, 'samples': 552576, 'steps': 1079, 'loss/train': 2.534168243408203} -09/20/2021 18:13:37 - INFO - __main__ - Step 17269: {'lr': 0.0001999779791977896, 'samples': 552608, 'steps': 1079, 'loss/train': 2.965141773223877} -09/20/2021 18:13:38 - INFO - __main__ - Step 17270: {'lr': 0.0001999779791977896, 'samples': 552640, 'steps': 1079, 'loss/train': 3.0807955265045166} -09/20/2021 18:13:39 - INFO - __main__ - Step 17271: {'lr': 0.0001999779791977896, 'samples': 552672, 'steps': 1079, 'loss/train': 3.970074415206909} -09/20/2021 18:13:39 - INFO - __main__ - Step 17272: {'lr': 0.0001999779791977896, 'samples': 552704, 'steps': 1079, 'loss/train': 2.974522829055786} -09/20/2021 18:13:40 - INFO - __main__ - Step 17273: {'lr': 0.0001999779791977896, 'samples': 552736, 'steps': 1079, 'loss/train': 3.9226255416870117} -09/20/2021 18:13:41 - INFO - __main__ - Step 17274: {'lr': 0.0001999779791977896, 'samples': 552768, 'steps': 1079, 'loss/train': 2.6714625358581543} -09/20/2021 18:13:42 - INFO - __main__ - Step 17275: {'lr': 0.0001999779791977896, 'samples': 552800, 'steps': 1079, 'loss/train': 4.1675944328308105} -09/20/2021 18:13:42 - INFO - __main__ - Step 17276: {'lr': 0.0001999779791977896, 'samples': 552832, 'steps': 1079, 'loss/train': 3.922881603240967} -09/20/2021 18:13:43 - INFO - __main__ - Step 17277: {'lr': 0.0001999779791977896, 'samples': 552864, 'steps': 1079, 'loss/train': 3.484362840652466} -09/20/2021 18:13:44 - INFO - __main__ - Step 17278: {'lr': 0.0001999779791977896, 'samples': 552896, 'steps': 1079, 'loss/train': 3.183614730834961} -09/20/2021 18:13:45 - INFO - __main__ - Step 17279: {'lr': 0.0001999779791977896, 'samples': 552928, 'steps': 1079, 'loss/train': 4.802748203277588} -09/20/2021 18:13:45 - INFO - __main__ - Step 17280: {'lr': 0.0001999779791977896, 'samples': 552960, 'steps': 1079, 'loss/train': 4.695954322814941} -09/20/2021 18:13:46 - INFO - __main__ - Step 17281: {'lr': 0.0001999778451342389, 'samples': 552992, 'steps': 1080, 'loss/train': 3.1695117950439453} -09/20/2021 18:13:47 - INFO - __main__ - Step 17282: {'lr': 0.0001999778451342389, 'samples': 553024, 'steps': 1080, 'loss/train': 3.4740474224090576} -09/20/2021 18:13:48 - INFO - __main__ - Step 17283: {'lr': 0.0001999778451342389, 'samples': 553056, 'steps': 1080, 'loss/train': 3.1007604598999023} -09/20/2021 18:13:49 - INFO - __main__ - Step 17284: {'lr': 0.0001999778451342389, 'samples': 553088, 'steps': 1080, 'loss/train': 3.645718574523926} -09/20/2021 18:13:50 - INFO - __main__ - Step 17285: {'lr': 0.0001999778451342389, 'samples': 553120, 'steps': 1080, 'loss/train': 3.8651607036590576} -09/20/2021 18:13:51 - INFO - __main__ - Step 17286: {'lr': 0.0001999778451342389, 'samples': 553152, 'steps': 1080, 'loss/train': 2.3706769943237305} -09/20/2021 18:13:51 - INFO - __main__ - Step 17287: {'lr': 0.0001999778451342389, 'samples': 553184, 'steps': 1080, 'loss/train': 3.2916066646575928} -09/20/2021 18:13:52 - INFO - __main__ - Step 17288: {'lr': 0.0001999778451342389, 'samples': 553216, 'steps': 1080, 'loss/train': 3.6265246868133545} -09/20/2021 18:13:53 - INFO - __main__ - Step 17289: {'lr': 0.0001999778451342389, 'samples': 553248, 'steps': 1080, 'loss/train': 2.3924877643585205} -09/20/2021 18:13:54 - INFO - __main__ - Step 17290: {'lr': 0.0001999778451342389, 'samples': 553280, 'steps': 1080, 'loss/train': 3.0398590564727783} -09/20/2021 18:13:54 - INFO - __main__ - Step 17291: {'lr': 0.0001999778451342389, 'samples': 553312, 'steps': 1080, 'loss/train': 1.3145853281021118} -09/20/2021 18:13:55 - INFO - __main__ - Step 17292: {'lr': 0.0001999778451342389, 'samples': 553344, 'steps': 1080, 'loss/train': 3.5126538276672363} -09/20/2021 18:13:56 - INFO - __main__ - Step 17293: {'lr': 0.0001999778451342389, 'samples': 553376, 'steps': 1080, 'loss/train': 2.6456329822540283} -09/20/2021 18:13:57 - INFO - __main__ - Step 17294: {'lr': 0.0001999778451342389, 'samples': 553408, 'steps': 1080, 'loss/train': 3.3628921508789062} -09/20/2021 18:13:57 - INFO - __main__ - Step 17295: {'lr': 0.0001999778451342389, 'samples': 553440, 'steps': 1080, 'loss/train': 3.7785160541534424} -09/20/2021 18:13:58 - INFO - __main__ - Step 17296: {'lr': 0.0001999778451342389, 'samples': 553472, 'steps': 1080, 'loss/train': 3.700786590576172} -09/20/2021 18:13:59 - INFO - __main__ - Step 17297: {'lr': 0.00019997771066387876, 'samples': 553504, 'steps': 1081, 'loss/train': 3.6300721168518066} -09/20/2021 18:14:00 - INFO - __main__ - Step 17298: {'lr': 0.00019997771066387876, 'samples': 553536, 'steps': 1081, 'loss/train': 4.253223419189453} -09/20/2021 18:14:00 - INFO - __main__ - Step 17299: {'lr': 0.00019997771066387876, 'samples': 553568, 'steps': 1081, 'loss/train': 4.165747165679932} -09/20/2021 18:14:01 - INFO - __main__ - Step 17300: {'lr': 0.00019997771066387876, 'samples': 553600, 'steps': 1081, 'loss/train': 2.0628762245178223} -09/20/2021 18:14:02 - INFO - __main__ - Step 17301: {'lr': 0.00019997771066387876, 'samples': 553632, 'steps': 1081, 'loss/train': 4.341353893280029} -09/20/2021 18:14:03 - INFO - __main__ - Step 17302: {'lr': 0.00019997771066387876, 'samples': 553664, 'steps': 1081, 'loss/train': 3.20650315284729} -09/20/2021 18:14:03 - INFO - __main__ - Step 17303: {'lr': 0.00019997771066387876, 'samples': 553696, 'steps': 1081, 'loss/train': 3.247551202774048} -09/20/2021 18:14:04 - INFO - __main__ - Step 17304: {'lr': 0.00019997771066387876, 'samples': 553728, 'steps': 1081, 'loss/train': 3.1765925884246826} -09/20/2021 18:14:05 - INFO - __main__ - Step 17305: {'lr': 0.00019997771066387876, 'samples': 553760, 'steps': 1081, 'loss/train': 3.022085666656494} -09/20/2021 18:14:06 - INFO - __main__ - Step 17306: {'lr': 0.00019997771066387876, 'samples': 553792, 'steps': 1081, 'loss/train': 2.9378437995910645} -09/20/2021 18:14:06 - INFO - __main__ - Step 17307: {'lr': 0.00019997771066387876, 'samples': 553824, 'steps': 1081, 'loss/train': 2.1212217807769775} -09/20/2021 18:14:07 - INFO - __main__ - Step 17308: {'lr': 0.00019997771066387876, 'samples': 553856, 'steps': 1081, 'loss/train': 3.0599770545959473} -09/20/2021 18:14:08 - INFO - __main__ - Step 17309: {'lr': 0.00019997771066387876, 'samples': 553888, 'steps': 1081, 'loss/train': 3.4028749465942383} -09/20/2021 18:14:09 - INFO - __main__ - Step 17310: {'lr': 0.00019997771066387876, 'samples': 553920, 'steps': 1081, 'loss/train': 3.6231279373168945} -09/20/2021 18:14:09 - INFO - __main__ - Step 17311: {'lr': 0.00019997771066387876, 'samples': 553952, 'steps': 1081, 'loss/train': 2.9035110473632812} -09/20/2021 18:14:10 - INFO - __main__ - Step 17312: {'lr': 0.00019997771066387876, 'samples': 553984, 'steps': 1081, 'loss/train': 4.058413505554199} -09/20/2021 18:14:11 - INFO - __main__ - Step 17313: {'lr': 0.00019997757578670968, 'samples': 554016, 'steps': 1082, 'loss/train': 3.243314027786255} -09/20/2021 18:14:12 - INFO - __main__ - Step 17314: {'lr': 0.00019997757578670968, 'samples': 554048, 'steps': 1082, 'loss/train': 6.335949897766113} -09/20/2021 18:14:13 - INFO - __main__ - Step 17315: {'lr': 0.00019997757578670968, 'samples': 554080, 'steps': 1082, 'loss/train': 6.419511318206787} -09/20/2021 18:14:13 - INFO - __main__ - Step 17316: {'lr': 0.00019997757578670968, 'samples': 554112, 'steps': 1082, 'loss/train': 6.444015979766846} -09/20/2021 18:14:14 - INFO - __main__ - Step 17317: {'lr': 0.00019997757578670968, 'samples': 554144, 'steps': 1082, 'loss/train': 6.329763889312744} -09/20/2021 18:14:15 - INFO - __main__ - Step 17318: {'lr': 0.00019997757578670968, 'samples': 554176, 'steps': 1082, 'loss/train': 6.443069934844971} -09/20/2021 18:14:16 - INFO - __main__ - Step 17319: {'lr': 0.00019997757578670968, 'samples': 554208, 'steps': 1082, 'loss/train': 2.4276797771453857} -09/20/2021 18:14:17 - INFO - __main__ - Step 17320: {'lr': 0.00019997757578670968, 'samples': 554240, 'steps': 1082, 'loss/train': 4.056859970092773} -09/20/2021 18:14:18 - INFO - __main__ - Step 17321: {'lr': 0.00019997757578670968, 'samples': 554272, 'steps': 1082, 'loss/train': 3.451674461364746} -09/20/2021 18:14:18 - INFO - __main__ - Step 17322: {'lr': 0.00019997757578670968, 'samples': 554304, 'steps': 1082, 'loss/train': 3.624833583831787} -09/20/2021 18:14:19 - INFO - __main__ - Step 17323: {'lr': 0.00019997757578670968, 'samples': 554336, 'steps': 1082, 'loss/train': 5.024956703186035} -09/20/2021 18:14:20 - INFO - __main__ - Step 17324: {'lr': 0.00019997757578670968, 'samples': 554368, 'steps': 1082, 'loss/train': 2.888972520828247} -09/20/2021 18:14:21 - INFO - __main__ - Step 17325: {'lr': 0.00019997757578670968, 'samples': 554400, 'steps': 1082, 'loss/train': 3.2686972618103027} -09/20/2021 18:14:21 - INFO - __main__ - Step 17326: {'lr': 0.00019997757578670968, 'samples': 554432, 'steps': 1082, 'loss/train': 3.111321449279785} -09/20/2021 18:14:22 - INFO - __main__ - Step 17327: {'lr': 0.00019997757578670968, 'samples': 554464, 'steps': 1082, 'loss/train': 2.659526824951172} -09/20/2021 18:14:23 - INFO - __main__ - Step 17328: {'lr': 0.00019997757578670968, 'samples': 554496, 'steps': 1082, 'loss/train': 4.739696025848389} -09/20/2021 18:14:24 - INFO - __main__ - Step 17329: {'lr': 0.00019997744050273225, 'samples': 554528, 'steps': 1083, 'loss/train': 3.6389007568359375} -09/20/2021 18:14:25 - INFO - __main__ - Step 17330: {'lr': 0.00019997744050273225, 'samples': 554560, 'steps': 1083, 'loss/train': 2.176802158355713} -09/20/2021 18:14:25 - INFO - __main__ - Step 17331: {'lr': 0.00019997744050273225, 'samples': 554592, 'steps': 1083, 'loss/train': 4.480079650878906} -09/20/2021 18:14:26 - INFO - __main__ - Step 17332: {'lr': 0.00019997744050273225, 'samples': 554624, 'steps': 1083, 'loss/train': 3.772294521331787} -09/20/2021 18:14:27 - INFO - __main__ - Step 17333: {'lr': 0.00019997744050273225, 'samples': 554656, 'steps': 1083, 'loss/train': 4.042701721191406} -09/20/2021 18:14:28 - INFO - __main__ - Step 17334: {'lr': 0.00019997744050273225, 'samples': 554688, 'steps': 1083, 'loss/train': 3.5933995246887207} -09/20/2021 18:14:28 - INFO - __main__ - Step 17335: {'lr': 0.00019997744050273225, 'samples': 554720, 'steps': 1083, 'loss/train': 4.158318519592285} -09/20/2021 18:14:29 - INFO - __main__ - Step 17336: {'lr': 0.00019997744050273225, 'samples': 554752, 'steps': 1083, 'loss/train': 3.6707332134246826} -09/20/2021 18:14:30 - INFO - __main__ - Step 17337: {'lr': 0.00019997744050273225, 'samples': 554784, 'steps': 1083, 'loss/train': 4.299688339233398} -09/20/2021 18:14:31 - INFO - __main__ - Step 17338: {'lr': 0.00019997744050273225, 'samples': 554816, 'steps': 1083, 'loss/train': 4.292297840118408} -09/20/2021 18:14:31 - INFO - __main__ - Step 17339: {'lr': 0.00019997744050273225, 'samples': 554848, 'steps': 1083, 'loss/train': 4.1201276779174805} -09/20/2021 18:14:32 - INFO - __main__ - Step 17340: {'lr': 0.00019997744050273225, 'samples': 554880, 'steps': 1083, 'loss/train': 3.662412405014038} -09/20/2021 18:14:33 - INFO - __main__ - Step 17341: {'lr': 0.00019997744050273225, 'samples': 554912, 'steps': 1083, 'loss/train': 2.764019727706909} -09/20/2021 18:14:34 - INFO - __main__ - Step 17342: {'lr': 0.00019997744050273225, 'samples': 554944, 'steps': 1083, 'loss/train': 2.886154890060425} -09/20/2021 18:14:34 - INFO - __main__ - Step 17343: {'lr': 0.00019997744050273225, 'samples': 554976, 'steps': 1083, 'loss/train': 5.735564708709717} -09/20/2021 18:14:35 - INFO - __main__ - Step 17344: {'lr': 0.00019997744050273225, 'samples': 555008, 'steps': 1083, 'loss/train': 4.20249605178833} -09/20/2021 18:14:36 - INFO - __main__ - Step 17345: {'lr': 0.00019997730481194698, 'samples': 555040, 'steps': 1084, 'loss/train': 3.8588826656341553} -09/20/2021 18:14:37 - INFO - __main__ - Step 17346: {'lr': 0.00019997730481194698, 'samples': 555072, 'steps': 1084, 'loss/train': 3.8148796558380127} -09/20/2021 18:14:37 - INFO - __main__ - Step 17347: {'lr': 0.00019997730481194698, 'samples': 555104, 'steps': 1084, 'loss/train': 3.9674553871154785} -09/20/2021 18:14:38 - INFO - __main__ - Step 17348: {'lr': 0.00019997730481194698, 'samples': 555136, 'steps': 1084, 'loss/train': 4.751868724822998} -09/20/2021 18:14:39 - INFO - __main__ - Step 17349: {'lr': 0.00019997730481194698, 'samples': 555168, 'steps': 1084, 'loss/train': 4.548879146575928} -09/20/2021 18:14:40 - INFO - __main__ - Step 17350: {'lr': 0.00019997730481194698, 'samples': 555200, 'steps': 1084, 'loss/train': 4.01193904876709} -09/20/2021 18:14:41 - INFO - __main__ - Step 17351: {'lr': 0.00019997730481194698, 'samples': 555232, 'steps': 1084, 'loss/train': 3.999786376953125} -09/20/2021 18:14:42 - INFO - __main__ - Step 17352: {'lr': 0.00019997730481194698, 'samples': 555264, 'steps': 1084, 'loss/train': 2.8569955825805664} -09/20/2021 18:14:42 - INFO - __main__ - Step 17353: {'lr': 0.00019997730481194698, 'samples': 555296, 'steps': 1084, 'loss/train': 3.4280872344970703} -09/20/2021 18:14:43 - INFO - __main__ - Step 17354: {'lr': 0.00019997730481194698, 'samples': 555328, 'steps': 1084, 'loss/train': 3.47715163230896} -09/20/2021 18:14:44 - INFO - __main__ - Step 17355: {'lr': 0.00019997730481194698, 'samples': 555360, 'steps': 1084, 'loss/train': 4.591850757598877} -09/20/2021 18:14:45 - INFO - __main__ - Step 17356: {'lr': 0.00019997730481194698, 'samples': 555392, 'steps': 1084, 'loss/train': 3.441814422607422} -09/20/2021 18:14:45 - INFO - __main__ - Step 17357: {'lr': 0.00019997730481194698, 'samples': 555424, 'steps': 1084, 'loss/train': 3.185606002807617} -09/20/2021 18:14:46 - INFO - __main__ - Step 17358: {'lr': 0.00019997730481194698, 'samples': 555456, 'steps': 1084, 'loss/train': 2.9487760066986084} -09/20/2021 18:14:47 - INFO - __main__ - Step 17359: {'lr': 0.00019997730481194698, 'samples': 555488, 'steps': 1084, 'loss/train': 3.9466984272003174} -09/20/2021 18:14:48 - INFO - __main__ - Step 17360: {'lr': 0.00019997730481194698, 'samples': 555520, 'steps': 1084, 'loss/train': 3.33854603767395} -09/20/2021 18:14:49 - INFO - __main__ - Step 17361: {'lr': 0.00019997716871435444, 'samples': 555552, 'steps': 1085, 'loss/train': 3.309770107269287} -09/20/2021 18:14:49 - INFO - __main__ - Step 17362: {'lr': 0.00019997716871435444, 'samples': 555584, 'steps': 1085, 'loss/train': 3.0455920696258545} -09/20/2021 18:14:50 - INFO - __main__ - Step 17363: {'lr': 0.00019997716871435444, 'samples': 555616, 'steps': 1085, 'loss/train': 3.2253217697143555} -09/20/2021 18:14:51 - INFO - __main__ - Step 17364: {'lr': 0.00019997716871435444, 'samples': 555648, 'steps': 1085, 'loss/train': 3.1960768699645996} -09/20/2021 18:14:52 - INFO - __main__ - Step 17365: {'lr': 0.00019997716871435444, 'samples': 555680, 'steps': 1085, 'loss/train': 3.1506543159484863} -09/20/2021 18:14:52 - INFO - __main__ - Step 17366: {'lr': 0.00019997716871435444, 'samples': 555712, 'steps': 1085, 'loss/train': 2.75689435005188} -09/20/2021 18:14:53 - INFO - __main__ - Step 17367: {'lr': 0.00019997716871435444, 'samples': 555744, 'steps': 1085, 'loss/train': 4.438930988311768} -09/20/2021 18:14:54 - INFO - __main__ - Step 17368: {'lr': 0.00019997716871435444, 'samples': 555776, 'steps': 1085, 'loss/train': 4.324954986572266} -09/20/2021 18:14:55 - INFO - __main__ - Step 17369: {'lr': 0.00019997716871435444, 'samples': 555808, 'steps': 1085, 'loss/train': 3.0891945362091064} -09/20/2021 18:14:55 - INFO - __main__ - Step 17370: {'lr': 0.00019997716871435444, 'samples': 555840, 'steps': 1085, 'loss/train': 2.8333451747894287} -09/20/2021 18:14:56 - INFO - __main__ - Step 17371: {'lr': 0.00019997716871435444, 'samples': 555872, 'steps': 1085, 'loss/train': 0.9414406418800354} -09/20/2021 18:14:57 - INFO - __main__ - Step 17372: {'lr': 0.00019997716871435444, 'samples': 555904, 'steps': 1085, 'loss/train': 3.2821240425109863} -09/20/2021 18:14:58 - INFO - __main__ - Step 17373: {'lr': 0.00019997716871435444, 'samples': 555936, 'steps': 1085, 'loss/train': 3.9406092166900635} -09/20/2021 18:14:58 - INFO - __main__ - Step 17374: {'lr': 0.00019997716871435444, 'samples': 555968, 'steps': 1085, 'loss/train': 4.015717506408691} -09/20/2021 18:14:59 - INFO - __main__ - Step 17375: {'lr': 0.00019997716871435444, 'samples': 556000, 'steps': 1085, 'loss/train': 3.3188157081604004} -09/20/2021 18:15:00 - INFO - __main__ - Step 17376: {'lr': 0.00019997716871435444, 'samples': 556032, 'steps': 1085, 'loss/train': 3.17309832572937} -09/20/2021 18:15:01 - INFO - __main__ - Step 17377: {'lr': 0.0001999770322099552, 'samples': 556064, 'steps': 1086, 'loss/train': 4.225960731506348} -09/20/2021 18:15:01 - INFO - __main__ - Step 17378: {'lr': 0.0001999770322099552, 'samples': 556096, 'steps': 1086, 'loss/train': 3.072463274002075} -09/20/2021 18:15:02 - INFO - __main__ - Step 17379: {'lr': 0.0001999770322099552, 'samples': 556128, 'steps': 1086, 'loss/train': 3.6693525314331055} -09/20/2021 18:15:03 - INFO - __main__ - Step 17380: {'lr': 0.0001999770322099552, 'samples': 556160, 'steps': 1086, 'loss/train': 3.7888433933258057} -09/20/2021 18:15:04 - INFO - __main__ - Step 17381: {'lr': 0.0001999770322099552, 'samples': 556192, 'steps': 1086, 'loss/train': 3.6266117095947266} -09/20/2021 18:15:05 - INFO - __main__ - Step 17382: {'lr': 0.0001999770322099552, 'samples': 556224, 'steps': 1086, 'loss/train': 2.7436397075653076} -09/20/2021 18:15:06 - INFO - __main__ - Step 17383: {'lr': 0.0001999770322099552, 'samples': 556256, 'steps': 1086, 'loss/train': 3.1349236965179443} -09/20/2021 18:15:06 - INFO - __main__ - Step 17384: {'lr': 0.0001999770322099552, 'samples': 556288, 'steps': 1086, 'loss/train': 2.7277183532714844} -09/20/2021 18:15:07 - INFO - __main__ - Step 17385: {'lr': 0.0001999770322099552, 'samples': 556320, 'steps': 1086, 'loss/train': 4.234513759613037} -09/20/2021 18:15:08 - INFO - __main__ - Step 17386: {'lr': 0.0001999770322099552, 'samples': 556352, 'steps': 1086, 'loss/train': 4.557701587677002} -09/20/2021 18:15:09 - INFO - __main__ - Step 17387: {'lr': 0.0001999770322099552, 'samples': 556384, 'steps': 1086, 'loss/train': 3.8776135444641113} -09/20/2021 18:15:09 - INFO - __main__ - Step 17388: {'lr': 0.0001999770322099552, 'samples': 556416, 'steps': 1086, 'loss/train': 4.1421284675598145} -09/20/2021 18:15:10 - INFO - __main__ - Step 17389: {'lr': 0.0001999770322099552, 'samples': 556448, 'steps': 1086, 'loss/train': 4.1930155754089355} -09/20/2021 18:15:11 - INFO - __main__ - Step 17390: {'lr': 0.0001999770322099552, 'samples': 556480, 'steps': 1086, 'loss/train': 8.098244667053223} -09/20/2021 18:15:12 - INFO - __main__ - Step 17391: {'lr': 0.0001999770322099552, 'samples': 556512, 'steps': 1086, 'loss/train': 3.451740026473999} -09/20/2021 18:15:12 - INFO - __main__ - Step 17392: {'lr': 0.0001999770322099552, 'samples': 556544, 'steps': 1086, 'loss/train': 2.8272483348846436} -09/20/2021 18:15:13 - INFO - __main__ - Step 17393: {'lr': 0.00019997689529874978, 'samples': 556576, 'steps': 1087, 'loss/train': 4.559908866882324} -09/20/2021 18:15:14 - INFO - __main__ - Step 17394: {'lr': 0.00019997689529874978, 'samples': 556608, 'steps': 1087, 'loss/train': 2.7462542057037354} -09/20/2021 18:15:15 - INFO - __main__ - Step 17395: {'lr': 0.00019997689529874978, 'samples': 556640, 'steps': 1087, 'loss/train': 0.9281111359596252} -09/20/2021 18:15:16 - INFO - __main__ - Step 17396: {'lr': 0.00019997689529874978, 'samples': 556672, 'steps': 1087, 'loss/train': 3.6847965717315674} -09/20/2021 18:15:16 - INFO - __main__ - Step 17397: {'lr': 0.00019997689529874978, 'samples': 556704, 'steps': 1087, 'loss/train': 3.6572158336639404} -09/20/2021 18:15:17 - INFO - __main__ - Step 17398: {'lr': 0.00019997689529874978, 'samples': 556736, 'steps': 1087, 'loss/train': 3.759816884994507} -09/20/2021 18:15:18 - INFO - __main__ - Step 17399: {'lr': 0.00019997689529874978, 'samples': 556768, 'steps': 1087, 'loss/train': 3.5543577671051025} -09/20/2021 18:15:19 - INFO - __main__ - Step 17400: {'lr': 0.00019997689529874978, 'samples': 556800, 'steps': 1087, 'loss/train': 3.5017943382263184} -09/20/2021 18:15:19 - INFO - __main__ - Step 17401: {'lr': 0.00019997689529874978, 'samples': 556832, 'steps': 1087, 'loss/train': 4.706949234008789} -09/20/2021 18:15:20 - INFO - __main__ - Step 17402: {'lr': 0.00019997689529874978, 'samples': 556864, 'steps': 1087, 'loss/train': 3.5968289375305176} -09/20/2021 18:15:21 - INFO - __main__ - Step 17403: {'lr': 0.00019997689529874978, 'samples': 556896, 'steps': 1087, 'loss/train': 3.953418254852295} -09/20/2021 18:15:22 - INFO - __main__ - Step 17404: {'lr': 0.00019997689529874978, 'samples': 556928, 'steps': 1087, 'loss/train': 2.6574366092681885} -09/20/2021 18:15:22 - INFO - __main__ - Step 17405: {'lr': 0.00019997689529874978, 'samples': 556960, 'steps': 1087, 'loss/train': 3.8399229049682617} -09/20/2021 18:15:23 - INFO - __main__ - Step 17406: {'lr': 0.00019997689529874978, 'samples': 556992, 'steps': 1087, 'loss/train': 3.340949058532715} -09/20/2021 18:15:24 - INFO - __main__ - Step 17407: {'lr': 0.00019997689529874978, 'samples': 557024, 'steps': 1087, 'loss/train': 3.5448246002197266} -09/20/2021 18:15:25 - INFO - __main__ - Step 17408: {'lr': 0.00019997689529874978, 'samples': 557056, 'steps': 1087, 'loss/train': 3.744896173477173} -09/20/2021 18:15:25 - INFO - __main__ - Step 17409: {'lr': 0.0001999767579807388, 'samples': 557088, 'steps': 1088, 'loss/train': 4.632606029510498} -09/20/2021 18:15:26 - INFO - __main__ - Step 17410: {'lr': 0.0001999767579807388, 'samples': 557120, 'steps': 1088, 'loss/train': 2.2137057781219482} -09/20/2021 18:15:27 - INFO - __main__ - Step 17411: {'lr': 0.0001999767579807388, 'samples': 557152, 'steps': 1088, 'loss/train': 4.606679916381836} -09/20/2021 18:15:29 - INFO - __main__ - Step 17412: {'lr': 0.0001999767579807388, 'samples': 557184, 'steps': 1088, 'loss/train': 3.2653920650482178} -09/20/2021 18:15:30 - INFO - __main__ - Step 17413: {'lr': 0.0001999767579807388, 'samples': 557216, 'steps': 1088, 'loss/train': 2.667881727218628} -09/20/2021 18:15:30 - INFO - __main__ - Step 17414: {'lr': 0.0001999767579807388, 'samples': 557248, 'steps': 1088, 'loss/train': 3.6007556915283203} -09/20/2021 18:15:31 - INFO - __main__ - Step 17415: {'lr': 0.0001999767579807388, 'samples': 557280, 'steps': 1088, 'loss/train': 3.696354627609253} -09/20/2021 18:15:32 - INFO - __main__ - Step 17416: {'lr': 0.0001999767579807388, 'samples': 557312, 'steps': 1088, 'loss/train': 3.2011330127716064} -09/20/2021 18:15:33 - INFO - __main__ - Step 17417: {'lr': 0.0001999767579807388, 'samples': 557344, 'steps': 1088, 'loss/train': 3.9941916465759277} -09/20/2021 18:15:33 - INFO - __main__ - Step 17418: {'lr': 0.0001999767579807388, 'samples': 557376, 'steps': 1088, 'loss/train': 4.999292373657227} -09/20/2021 18:15:34 - INFO - __main__ - Step 17419: {'lr': 0.0001999767579807388, 'samples': 557408, 'steps': 1088, 'loss/train': 3.6382412910461426} -09/20/2021 18:15:35 - INFO - __main__ - Step 17420: {'lr': 0.0001999767579807388, 'samples': 557440, 'steps': 1088, 'loss/train': 3.5148589611053467} -09/20/2021 18:15:36 - INFO - __main__ - Step 17421: {'lr': 0.0001999767579807388, 'samples': 557472, 'steps': 1088, 'loss/train': 3.5155751705169678} -09/20/2021 18:15:36 - INFO - __main__ - Step 17422: {'lr': 0.0001999767579807388, 'samples': 557504, 'steps': 1088, 'loss/train': 3.7412264347076416} -09/20/2021 18:15:37 - INFO - __main__ - Step 17423: {'lr': 0.0001999767579807388, 'samples': 557536, 'steps': 1088, 'loss/train': 3.7898178100585938} -09/20/2021 18:15:38 - INFO - __main__ - Step 17424: {'lr': 0.0001999767579807388, 'samples': 557568, 'steps': 1088, 'loss/train': 4.182319641113281} -09/20/2021 18:15:39 - INFO - __main__ - Step 17425: {'lr': 0.00019997662025592275, 'samples': 557600, 'steps': 1089, 'loss/train': 2.57472825050354} -09/20/2021 18:15:39 - INFO - __main__ - Step 17426: {'lr': 0.00019997662025592275, 'samples': 557632, 'steps': 1089, 'loss/train': 3.9295573234558105} -09/20/2021 18:15:40 - INFO - __main__ - Step 17427: {'lr': 0.00019997662025592275, 'samples': 557664, 'steps': 1089, 'loss/train': 3.781606912612915} -09/20/2021 18:15:41 - INFO - __main__ - Step 17428: {'lr': 0.00019997662025592275, 'samples': 557696, 'steps': 1089, 'loss/train': 3.2483603954315186} -09/20/2021 18:15:42 - INFO - __main__ - Step 17429: {'lr': 0.00019997662025592275, 'samples': 557728, 'steps': 1089, 'loss/train': 3.9165396690368652} -09/20/2021 18:15:42 - INFO - __main__ - Step 17430: {'lr': 0.00019997662025592275, 'samples': 557760, 'steps': 1089, 'loss/train': 3.919023036956787} -09/20/2021 18:15:43 - INFO - __main__ - Step 17431: {'lr': 0.00019997662025592275, 'samples': 557792, 'steps': 1089, 'loss/train': 2.84513258934021} -09/20/2021 18:15:44 - INFO - __main__ - Step 17432: {'lr': 0.00019997662025592275, 'samples': 557824, 'steps': 1089, 'loss/train': 0.7767029404640198} -09/20/2021 18:15:45 - INFO - __main__ - Step 17433: {'lr': 0.00019997662025592275, 'samples': 557856, 'steps': 1089, 'loss/train': 4.678984642028809} -09/20/2021 18:15:45 - INFO - __main__ - Step 17434: {'lr': 0.00019997662025592275, 'samples': 557888, 'steps': 1089, 'loss/train': 3.0002760887145996} -09/20/2021 18:15:46 - INFO - __main__ - Step 17435: {'lr': 0.00019997662025592275, 'samples': 557920, 'steps': 1089, 'loss/train': 2.567697048187256} -09/20/2021 18:15:47 - INFO - __main__ - Step 17436: {'lr': 0.00019997662025592275, 'samples': 557952, 'steps': 1089, 'loss/train': 5.537823677062988} -09/20/2021 18:15:48 - INFO - __main__ - Step 17437: {'lr': 0.00019997662025592275, 'samples': 557984, 'steps': 1089, 'loss/train': 4.122821807861328} -09/20/2021 18:15:48 - INFO - __main__ - Step 17438: {'lr': 0.00019997662025592275, 'samples': 558016, 'steps': 1089, 'loss/train': 3.052654266357422} -09/20/2021 18:15:49 - INFO - __main__ - Step 17439: {'lr': 0.00019997662025592275, 'samples': 558048, 'steps': 1089, 'loss/train': 3.450178861618042} -09/20/2021 18:15:50 - INFO - __main__ - Step 17440: {'lr': 0.00019997662025592275, 'samples': 558080, 'steps': 1089, 'loss/train': 2.8021323680877686} -09/20/2021 18:15:51 - INFO - __main__ - Step 17441: {'lr': 0.00019997648212430224, 'samples': 558112, 'steps': 1090, 'loss/train': 5.767229080200195} -09/20/2021 18:15:52 - INFO - __main__ - Step 17442: {'lr': 0.00019997648212430224, 'samples': 558144, 'steps': 1090, 'loss/train': 4.638725280761719} -09/20/2021 18:15:53 - INFO - __main__ - Step 17443: {'lr': 0.00019997648212430224, 'samples': 558176, 'steps': 1090, 'loss/train': 4.52488899230957} -09/20/2021 18:15:54 - INFO - __main__ - Step 17444: {'lr': 0.00019997648212430224, 'samples': 558208, 'steps': 1090, 'loss/train': 3.7585227489471436} -09/20/2021 18:15:54 - INFO - __main__ - Step 17445: {'lr': 0.00019997648212430224, 'samples': 558240, 'steps': 1090, 'loss/train': 2.718601942062378} -09/20/2021 18:15:55 - INFO - __main__ - Step 17446: {'lr': 0.00019997648212430224, 'samples': 558272, 'steps': 1090, 'loss/train': 3.777850866317749} -09/20/2021 18:15:56 - INFO - __main__ - Step 17447: {'lr': 0.00019997648212430224, 'samples': 558304, 'steps': 1090, 'loss/train': 3.0826971530914307} -09/20/2021 18:15:57 - INFO - __main__ - Step 17448: {'lr': 0.00019997648212430224, 'samples': 558336, 'steps': 1090, 'loss/train': 3.7414519786834717} -09/20/2021 18:15:57 - INFO - __main__ - Step 17449: {'lr': 0.00019997648212430224, 'samples': 558368, 'steps': 1090, 'loss/train': 4.219871520996094} -09/20/2021 18:15:58 - INFO - __main__ - Step 17450: {'lr': 0.00019997648212430224, 'samples': 558400, 'steps': 1090, 'loss/train': 1.212180256843567} -09/20/2021 18:15:59 - INFO - __main__ - Step 17451: {'lr': 0.00019997648212430224, 'samples': 558432, 'steps': 1090, 'loss/train': 4.212900638580322} -09/20/2021 18:16:00 - INFO - __main__ - Step 17452: {'lr': 0.00019997648212430224, 'samples': 558464, 'steps': 1090, 'loss/train': 4.122873306274414} -09/20/2021 18:16:00 - INFO - __main__ - Step 17453: {'lr': 0.00019997648212430224, 'samples': 558496, 'steps': 1090, 'loss/train': 3.115152359008789} -09/20/2021 18:16:01 - INFO - __main__ - Step 17454: {'lr': 0.00019997648212430224, 'samples': 558528, 'steps': 1090, 'loss/train': 3.291045904159546} -09/20/2021 18:16:02 - INFO - __main__ - Step 17455: {'lr': 0.00019997648212430224, 'samples': 558560, 'steps': 1090, 'loss/train': 5.385772228240967} -09/20/2021 18:16:03 - INFO - __main__ - Step 17456: {'lr': 0.00019997648212430224, 'samples': 558592, 'steps': 1090, 'loss/train': 3.6478328704833984} -09/20/2021 18:16:04 - INFO - __main__ - Step 17457: {'lr': 0.0001999763435858778, 'samples': 558624, 'steps': 1091, 'loss/train': 3.1719603538513184} -09/20/2021 18:16:04 - INFO - __main__ - Step 17458: {'lr': 0.0001999763435858778, 'samples': 558656, 'steps': 1091, 'loss/train': 3.81624174118042} -09/20/2021 18:16:05 - INFO - __main__ - Step 17459: {'lr': 0.0001999763435858778, 'samples': 558688, 'steps': 1091, 'loss/train': 3.5013084411621094} -09/20/2021 18:16:06 - INFO - __main__ - Step 17460: {'lr': 0.0001999763435858778, 'samples': 558720, 'steps': 1091, 'loss/train': 3.3782122135162354} -09/20/2021 18:16:07 - INFO - __main__ - Step 17461: {'lr': 0.0001999763435858778, 'samples': 558752, 'steps': 1091, 'loss/train': 3.7251617908477783} -09/20/2021 18:16:07 - INFO - __main__ - Step 17462: {'lr': 0.0001999763435858778, 'samples': 558784, 'steps': 1091, 'loss/train': 3.5647430419921875} -09/20/2021 18:16:08 - INFO - __main__ - Step 17463: {'lr': 0.0001999763435858778, 'samples': 558816, 'steps': 1091, 'loss/train': 3.56943941116333} -09/20/2021 18:16:09 - INFO - __main__ - Step 17464: {'lr': 0.0001999763435858778, 'samples': 558848, 'steps': 1091, 'loss/train': 2.9577271938323975} -09/20/2021 18:16:10 - INFO - __main__ - Step 17465: {'lr': 0.0001999763435858778, 'samples': 558880, 'steps': 1091, 'loss/train': 3.120424509048462} -09/20/2021 18:16:10 - INFO - __main__ - Step 17466: {'lr': 0.0001999763435858778, 'samples': 558912, 'steps': 1091, 'loss/train': 4.708489894866943} -09/20/2021 18:16:11 - INFO - __main__ - Step 17467: {'lr': 0.0001999763435858778, 'samples': 558944, 'steps': 1091, 'loss/train': 3.2325220108032227} -09/20/2021 18:16:12 - INFO - __main__ - Step 17468: {'lr': 0.0001999763435858778, 'samples': 558976, 'steps': 1091, 'loss/train': 3.447066307067871} -09/20/2021 18:16:13 - INFO - __main__ - Step 17469: {'lr': 0.0001999763435858778, 'samples': 559008, 'steps': 1091, 'loss/train': 3.0226452350616455} -09/20/2021 18:16:13 - INFO - __main__ - Step 17470: {'lr': 0.0001999763435858778, 'samples': 559040, 'steps': 1091, 'loss/train': 4.089224338531494} -09/20/2021 18:16:14 - INFO - __main__ - Step 17471: {'lr': 0.0001999763435858778, 'samples': 559072, 'steps': 1091, 'loss/train': 4.699869632720947} -09/20/2021 18:16:15 - INFO - __main__ - Step 17472: {'lr': 0.0001999763435858778, 'samples': 559104, 'steps': 1091, 'loss/train': 1.3904486894607544} -09/20/2021 18:16:16 - INFO - __main__ - Step 17473: {'lr': 0.00019997620464065, 'samples': 559136, 'steps': 1092, 'loss/train': 3.6706671714782715} -09/20/2021 18:16:16 - INFO - __main__ - Step 17474: {'lr': 0.00019997620464065, 'samples': 559168, 'steps': 1092, 'loss/train': 3.570430278778076} -09/20/2021 18:16:17 - INFO - __main__ - Step 17475: {'lr': 0.00019997620464065, 'samples': 559200, 'steps': 1092, 'loss/train': 3.4659268856048584} -09/20/2021 18:16:19 - INFO - __main__ - Step 17476: {'lr': 0.00019997620464065, 'samples': 559232, 'steps': 1092, 'loss/train': 4.573116779327393} -09/20/2021 18:16:19 - INFO - __main__ - Step 17477: {'lr': 0.00019997620464065, 'samples': 559264, 'steps': 1092, 'loss/train': 4.184083938598633} -09/20/2021 18:16:20 - INFO - __main__ - Step 17478: {'lr': 0.00019997620464065, 'samples': 559296, 'steps': 1092, 'loss/train': 4.600339412689209} -09/20/2021 18:16:21 - INFO - __main__ - Step 17479: {'lr': 0.00019997620464065, 'samples': 559328, 'steps': 1092, 'loss/train': 3.5763227939605713} -09/20/2021 18:16:22 - INFO - __main__ - Step 17480: {'lr': 0.00019997620464065, 'samples': 559360, 'steps': 1092, 'loss/train': 3.354405403137207} -09/20/2021 18:16:22 - INFO - __main__ - Step 17481: {'lr': 0.00019997620464065, 'samples': 559392, 'steps': 1092, 'loss/train': 3.6894164085388184} -09/20/2021 18:16:23 - INFO - __main__ - Step 17482: {'lr': 0.00019997620464065, 'samples': 559424, 'steps': 1092, 'loss/train': 3.769721031188965} -09/20/2021 18:16:24 - INFO - __main__ - Step 17483: {'lr': 0.00019997620464065, 'samples': 559456, 'steps': 1092, 'loss/train': 4.322051048278809} -09/20/2021 18:16:25 - INFO - __main__ - Step 17484: {'lr': 0.00019997620464065, 'samples': 559488, 'steps': 1092, 'loss/train': 3.796814203262329} -09/20/2021 18:16:25 - INFO - __main__ - Step 17485: {'lr': 0.00019997620464065, 'samples': 559520, 'steps': 1092, 'loss/train': 3.446749210357666} -09/20/2021 18:16:26 - INFO - __main__ - Step 17486: {'lr': 0.00019997620464065, 'samples': 559552, 'steps': 1092, 'loss/train': 4.046967029571533} -09/20/2021 18:16:27 - INFO - __main__ - Step 17487: {'lr': 0.00019997620464065, 'samples': 559584, 'steps': 1092, 'loss/train': 4.030688762664795} -09/20/2021 18:16:28 - INFO - __main__ - Step 17488: {'lr': 0.00019997620464065, 'samples': 559616, 'steps': 1092, 'loss/train': 3.688570499420166} -09/20/2021 18:16:29 - INFO - __main__ - Step 17489: {'lr': 0.00019997606528861944, 'samples': 559648, 'steps': 1093, 'loss/train': 4.058945178985596} -09/20/2021 18:16:29 - INFO - __main__ - Step 17490: {'lr': 0.00019997606528861944, 'samples': 559680, 'steps': 1093, 'loss/train': 4.236232280731201} -09/20/2021 18:16:30 - INFO - __main__ - Step 17491: {'lr': 0.00019997606528861944, 'samples': 559712, 'steps': 1093, 'loss/train': 3.1457366943359375} -09/20/2021 18:16:31 - INFO - __main__ - Step 17492: {'lr': 0.00019997606528861944, 'samples': 559744, 'steps': 1093, 'loss/train': 3.7167627811431885} -09/20/2021 18:16:32 - INFO - __main__ - Step 17493: {'lr': 0.00019997606528861944, 'samples': 559776, 'steps': 1093, 'loss/train': 2.9712207317352295} -09/20/2021 18:16:32 - INFO - __main__ - Step 17494: {'lr': 0.00019997606528861944, 'samples': 559808, 'steps': 1093, 'loss/train': 3.9020841121673584} -09/20/2021 18:16:33 - INFO - __main__ - Step 17495: {'lr': 0.00019997606528861944, 'samples': 559840, 'steps': 1093, 'loss/train': 3.5186233520507812} -09/20/2021 18:16:34 - INFO - __main__ - Step 17496: {'lr': 0.00019997606528861944, 'samples': 559872, 'steps': 1093, 'loss/train': 3.6957130432128906} -09/20/2021 18:16:35 - INFO - __main__ - Step 17497: {'lr': 0.00019997606528861944, 'samples': 559904, 'steps': 1093, 'loss/train': 3.1707305908203125} -09/20/2021 18:16:35 - INFO - __main__ - Step 17498: {'lr': 0.00019997606528861944, 'samples': 559936, 'steps': 1093, 'loss/train': 3.827637195587158} -09/20/2021 18:16:36 - INFO - __main__ - Step 17499: {'lr': 0.00019997606528861944, 'samples': 559968, 'steps': 1093, 'loss/train': 3.0933618545532227} -09/20/2021 18:16:37 - INFO - __main__ - Step 17500: {'lr': 0.00019997606528861944, 'samples': 560000, 'steps': 1093, 'loss/train': 3.278996467590332} -09/20/2021 18:16:38 - INFO - __main__ - Step 17501: {'lr': 0.00019997606528861944, 'samples': 560032, 'steps': 1093, 'loss/train': 3.6090734004974365} -09/20/2021 18:16:38 - INFO - __main__ - Step 17502: {'lr': 0.00019997606528861944, 'samples': 560064, 'steps': 1093, 'loss/train': 4.293115615844727} -09/20/2021 18:16:39 - INFO - __main__ - Step 17503: {'lr': 0.00019997606528861944, 'samples': 560096, 'steps': 1093, 'loss/train': 1.856313705444336} -09/20/2021 18:16:40 - INFO - __main__ - Step 17504: {'lr': 0.00019997606528861944, 'samples': 560128, 'steps': 1093, 'loss/train': 2.82138729095459} -09/20/2021 18:16:41 - INFO - __main__ - Step 17505: {'lr': 0.00019997592552978662, 'samples': 560160, 'steps': 1094, 'loss/train': 1.1791927814483643} -09/20/2021 18:16:41 - INFO - __main__ - Step 17506: {'lr': 0.00019997592552978662, 'samples': 560192, 'steps': 1094, 'loss/train': 1.0010429620742798} -09/20/2021 18:16:43 - INFO - __main__ - Step 17507: {'lr': 0.00019997592552978662, 'samples': 560224, 'steps': 1094, 'loss/train': 4.120267868041992} -09/20/2021 18:16:43 - INFO - __main__ - Step 17508: {'lr': 0.00019997592552978662, 'samples': 560256, 'steps': 1094, 'loss/train': 3.8449668884277344} -09/20/2021 18:16:44 - INFO - __main__ - Step 17509: {'lr': 0.00019997592552978662, 'samples': 560288, 'steps': 1094, 'loss/train': 4.921204566955566} -09/20/2021 18:16:45 - INFO - __main__ - Step 17510: {'lr': 0.00019997592552978662, 'samples': 560320, 'steps': 1094, 'loss/train': 3.412729024887085} -09/20/2021 18:16:46 - INFO - __main__ - Step 17511: {'lr': 0.00019997592552978662, 'samples': 560352, 'steps': 1094, 'loss/train': 4.461093902587891} -09/20/2021 18:16:46 - INFO - __main__ - Step 17512: {'lr': 0.00019997592552978662, 'samples': 560384, 'steps': 1094, 'loss/train': 3.010896921157837} -09/20/2021 18:16:47 - INFO - __main__ - Step 17513: {'lr': 0.00019997592552978662, 'samples': 560416, 'steps': 1094, 'loss/train': 3.376739263534546} -09/20/2021 18:16:48 - INFO - __main__ - Step 17514: {'lr': 0.00019997592552978662, 'samples': 560448, 'steps': 1094, 'loss/train': 3.7387053966522217} -09/20/2021 18:16:49 - INFO - __main__ - Step 17515: {'lr': 0.00019997592552978662, 'samples': 560480, 'steps': 1094, 'loss/train': 3.8004069328308105} -09/20/2021 18:16:49 - INFO - __main__ - Step 17516: {'lr': 0.00019997592552978662, 'samples': 560512, 'steps': 1094, 'loss/train': 4.883747100830078} -09/20/2021 18:16:50 - INFO - __main__ - Step 17517: {'lr': 0.00019997592552978662, 'samples': 560544, 'steps': 1094, 'loss/train': 3.9712133407592773} -09/20/2021 18:16:51 - INFO - __main__ - Step 17518: {'lr': 0.00019997592552978662, 'samples': 560576, 'steps': 1094, 'loss/train': 3.5303151607513428} -09/20/2021 18:16:52 - INFO - __main__ - Step 17519: {'lr': 0.00019997592552978662, 'samples': 560608, 'steps': 1094, 'loss/train': 4.516822814941406} -09/20/2021 18:16:52 - INFO - __main__ - Step 17520: {'lr': 0.00019997592552978662, 'samples': 560640, 'steps': 1094, 'loss/train': 3.1484813690185547} -09/20/2021 18:16:53 - INFO - __main__ - Step 17521: {'lr': 0.00019997578536415218, 'samples': 560672, 'steps': 1095, 'loss/train': 3.2627670764923096} -09/20/2021 18:16:54 - INFO - __main__ - Step 17522: {'lr': 0.00019997578536415218, 'samples': 560704, 'steps': 1095, 'loss/train': 3.889630079269409} -09/20/2021 18:16:55 - INFO - __main__ - Step 17523: {'lr': 0.00019997578536415218, 'samples': 560736, 'steps': 1095, 'loss/train': 4.530357837677002} -09/20/2021 18:16:56 - INFO - __main__ - Step 17524: {'lr': 0.00019997578536415218, 'samples': 560768, 'steps': 1095, 'loss/train': 3.4761369228363037} -09/20/2021 18:16:56 - INFO - __main__ - Step 17525: {'lr': 0.00019997578536415218, 'samples': 560800, 'steps': 1095, 'loss/train': 3.9237327575683594} -09/20/2021 18:16:57 - INFO - __main__ - Step 17526: {'lr': 0.00019997578536415218, 'samples': 560832, 'steps': 1095, 'loss/train': 4.419175148010254} -09/20/2021 18:16:58 - INFO - __main__ - Step 17527: {'lr': 0.00019997578536415218, 'samples': 560864, 'steps': 1095, 'loss/train': 3.8097083568573} -09/20/2021 18:16:59 - INFO - __main__ - Step 17528: {'lr': 0.00019997578536415218, 'samples': 560896, 'steps': 1095, 'loss/train': 3.726947784423828} -09/20/2021 18:16:59 - INFO - __main__ - Step 17529: {'lr': 0.00019997578536415218, 'samples': 560928, 'steps': 1095, 'loss/train': 4.154123306274414} -09/20/2021 18:17:00 - INFO - __main__ - Step 17530: {'lr': 0.00019997578536415218, 'samples': 560960, 'steps': 1095, 'loss/train': 3.534273862838745} -09/20/2021 18:17:01 - INFO - __main__ - Step 17531: {'lr': 0.00019997578536415218, 'samples': 560992, 'steps': 1095, 'loss/train': 3.42641544342041} -09/20/2021 18:17:02 - INFO - __main__ - Step 17532: {'lr': 0.00019997578536415218, 'samples': 561024, 'steps': 1095, 'loss/train': 5.023990154266357} -09/20/2021 18:17:02 - INFO - __main__ - Step 17533: {'lr': 0.00019997578536415218, 'samples': 561056, 'steps': 1095, 'loss/train': 3.7097086906433105} -09/20/2021 18:17:03 - INFO - __main__ - Step 17534: {'lr': 0.00019997578536415218, 'samples': 561088, 'steps': 1095, 'loss/train': 3.065767765045166} -09/20/2021 18:17:04 - INFO - __main__ - Step 17535: {'lr': 0.00019997578536415218, 'samples': 561120, 'steps': 1095, 'loss/train': 3.7548489570617676} -09/20/2021 18:17:05 - INFO - __main__ - Step 17536: {'lr': 0.00019997578536415218, 'samples': 561152, 'steps': 1095, 'loss/train': 3.84403395652771} -09/20/2021 18:17:05 - INFO - __main__ - Step 17537: {'lr': 0.00019997564479171665, 'samples': 561184, 'steps': 1096, 'loss/train': 3.566920042037964} -09/20/2021 18:17:07 - INFO - __main__ - Step 17538: {'lr': 0.00019997564479171665, 'samples': 561216, 'steps': 1096, 'loss/train': 1.8798654079437256} -09/20/2021 18:17:07 - INFO - __main__ - Step 17539: {'lr': 0.00019997564479171665, 'samples': 561248, 'steps': 1096, 'loss/train': 3.6524319648742676} -09/20/2021 18:17:08 - INFO - __main__ - Step 17540: {'lr': 0.00019997564479171665, 'samples': 561280, 'steps': 1096, 'loss/train': 3.5134518146514893} -09/20/2021 18:17:09 - INFO - __main__ - Step 17541: {'lr': 0.00019997564479171665, 'samples': 561312, 'steps': 1096, 'loss/train': 3.701474189758301} -09/20/2021 18:17:10 - INFO - __main__ - Step 17542: {'lr': 0.00019997564479171665, 'samples': 561344, 'steps': 1096, 'loss/train': 3.1714398860931396} -09/20/2021 18:17:10 - INFO - __main__ - Step 17543: {'lr': 0.00019997564479171665, 'samples': 561376, 'steps': 1096, 'loss/train': 2.74648380279541} -09/20/2021 18:17:11 - INFO - __main__ - Step 17544: {'lr': 0.00019997564479171665, 'samples': 561408, 'steps': 1096, 'loss/train': 3.186347246170044} -09/20/2021 18:17:12 - INFO - __main__ - Step 17545: {'lr': 0.00019997564479171665, 'samples': 561440, 'steps': 1096, 'loss/train': 4.520573139190674} -09/20/2021 18:17:13 - INFO - __main__ - Step 17546: {'lr': 0.00019997564479171665, 'samples': 561472, 'steps': 1096, 'loss/train': 3.2689521312713623} -09/20/2021 18:17:13 - INFO - __main__ - Step 17547: {'lr': 0.00019997564479171665, 'samples': 561504, 'steps': 1096, 'loss/train': 5.16433048248291} -09/20/2021 18:17:14 - INFO - __main__ - Step 17548: {'lr': 0.00019997564479171665, 'samples': 561536, 'steps': 1096, 'loss/train': 3.1172423362731934} -09/20/2021 18:17:15 - INFO - __main__ - Step 17549: {'lr': 0.00019997564479171665, 'samples': 561568, 'steps': 1096, 'loss/train': 4.380976676940918} -09/20/2021 18:17:16 - INFO - __main__ - Step 17550: {'lr': 0.00019997564479171665, 'samples': 561600, 'steps': 1096, 'loss/train': 3.330030679702759} -09/20/2021 18:17:16 - INFO - __main__ - Step 17551: {'lr': 0.00019997564479171665, 'samples': 561632, 'steps': 1096, 'loss/train': 2.7792375087738037} -09/20/2021 18:17:17 - INFO - __main__ - Step 17552: {'lr': 0.00019997564479171665, 'samples': 561664, 'steps': 1096, 'loss/train': 3.57987904548645} -09/20/2021 18:17:18 - INFO - __main__ - Step 17553: {'lr': 0.0001999755038124806, 'samples': 561696, 'steps': 1097, 'loss/train': 3.8345859050750732} -09/20/2021 18:17:19 - INFO - __main__ - Step 17554: {'lr': 0.0001999755038124806, 'samples': 561728, 'steps': 1097, 'loss/train': 4.346800804138184} -09/20/2021 18:17:20 - INFO - __main__ - Step 17555: {'lr': 0.0001999755038124806, 'samples': 561760, 'steps': 1097, 'loss/train': 3.1068055629730225} -09/20/2021 18:17:20 - INFO - __main__ - Step 17556: {'lr': 0.0001999755038124806, 'samples': 561792, 'steps': 1097, 'loss/train': 3.7237820625305176} -09/20/2021 18:17:21 - INFO - __main__ - Step 17557: {'lr': 0.0001999755038124806, 'samples': 561824, 'steps': 1097, 'loss/train': 2.48429274559021} -09/20/2021 18:17:22 - INFO - __main__ - Step 17558: {'lr': 0.0001999755038124806, 'samples': 561856, 'steps': 1097, 'loss/train': 5.244954586029053} -09/20/2021 18:17:23 - INFO - __main__ - Step 17559: {'lr': 0.0001999755038124806, 'samples': 561888, 'steps': 1097, 'loss/train': 3.2144088745117188} -09/20/2021 18:17:23 - INFO - __main__ - Step 17560: {'lr': 0.0001999755038124806, 'samples': 561920, 'steps': 1097, 'loss/train': 4.073087215423584} -09/20/2021 18:17:24 - INFO - __main__ - Step 17561: {'lr': 0.0001999755038124806, 'samples': 561952, 'steps': 1097, 'loss/train': 3.9140450954437256} -09/20/2021 18:17:25 - INFO - __main__ - Step 17562: {'lr': 0.0001999755038124806, 'samples': 561984, 'steps': 1097, 'loss/train': 4.10908842086792} -09/20/2021 18:17:26 - INFO - __main__ - Step 17563: {'lr': 0.0001999755038124806, 'samples': 562016, 'steps': 1097, 'loss/train': 3.6262381076812744} -09/20/2021 18:17:26 - INFO - __main__ - Step 17564: {'lr': 0.0001999755038124806, 'samples': 562048, 'steps': 1097, 'loss/train': 1.2178127765655518} -09/20/2021 18:17:27 - INFO - __main__ - Step 17565: {'lr': 0.0001999755038124806, 'samples': 562080, 'steps': 1097, 'loss/train': 0.7584733366966248} -09/20/2021 18:17:28 - INFO - __main__ - Step 17566: {'lr': 0.0001999755038124806, 'samples': 562112, 'steps': 1097, 'loss/train': 4.5146403312683105} -09/20/2021 18:17:29 - INFO - __main__ - Step 17567: {'lr': 0.0001999755038124806, 'samples': 562144, 'steps': 1097, 'loss/train': 3.9559309482574463} -09/20/2021 18:17:29 - INFO - __main__ - Step 17568: {'lr': 0.0001999755038124806, 'samples': 562176, 'steps': 1097, 'loss/train': 3.771735429763794} -09/20/2021 18:17:30 - INFO - __main__ - Step 17569: {'lr': 0.00019997536242644462, 'samples': 562208, 'steps': 1098, 'loss/train': 3.4534847736358643} -09/20/2021 18:17:32 - INFO - __main__ - Step 17570: {'lr': 0.00019997536242644462, 'samples': 562240, 'steps': 1098, 'loss/train': 2.4887847900390625} -09/20/2021 18:17:32 - INFO - __main__ - Step 17571: {'lr': 0.00019997536242644462, 'samples': 562272, 'steps': 1098, 'loss/train': 3.605548858642578} -09/20/2021 18:17:33 - INFO - __main__ - Step 17572: {'lr': 0.00019997536242644462, 'samples': 562304, 'steps': 1098, 'loss/train': 0.964585542678833} -09/20/2021 18:17:34 - INFO - __main__ - Step 17573: {'lr': 0.00019997536242644462, 'samples': 562336, 'steps': 1098, 'loss/train': 3.4336819648742676} -09/20/2021 18:17:35 - INFO - __main__ - Step 17574: {'lr': 0.00019997536242644462, 'samples': 562368, 'steps': 1098, 'loss/train': 2.829979419708252} -09/20/2021 18:17:35 - INFO - __main__ - Step 17575: {'lr': 0.00019997536242644462, 'samples': 562400, 'steps': 1098, 'loss/train': 3.643955707550049} -09/20/2021 18:17:36 - INFO - __main__ - Step 17576: {'lr': 0.00019997536242644462, 'samples': 562432, 'steps': 1098, 'loss/train': 4.13287878036499} -09/20/2021 18:17:37 - INFO - __main__ - Step 17577: {'lr': 0.00019997536242644462, 'samples': 562464, 'steps': 1098, 'loss/train': 3.830228805541992} -09/20/2021 18:17:38 - INFO - __main__ - Step 17578: {'lr': 0.00019997536242644462, 'samples': 562496, 'steps': 1098, 'loss/train': 3.5521087646484375} -09/20/2021 18:17:38 - INFO - __main__ - Step 17579: {'lr': 0.00019997536242644462, 'samples': 562528, 'steps': 1098, 'loss/train': 3.7090959548950195} -09/20/2021 18:17:39 - INFO - __main__ - Step 17580: {'lr': 0.00019997536242644462, 'samples': 562560, 'steps': 1098, 'loss/train': 3.752631425857544} -09/20/2021 18:17:40 - INFO - __main__ - Step 17581: {'lr': 0.00019997536242644462, 'samples': 562592, 'steps': 1098, 'loss/train': 3.404451847076416} -09/20/2021 18:17:41 - INFO - __main__ - Step 17582: {'lr': 0.00019997536242644462, 'samples': 562624, 'steps': 1098, 'loss/train': 2.6354928016662598} -09/20/2021 18:17:41 - INFO - __main__ - Step 17583: {'lr': 0.00019997536242644462, 'samples': 562656, 'steps': 1098, 'loss/train': 3.5139334201812744} -09/20/2021 18:17:42 - INFO - __main__ - Step 17584: {'lr': 0.00019997536242644462, 'samples': 562688, 'steps': 1098, 'loss/train': 3.8381400108337402} -09/20/2021 18:17:43 - INFO - __main__ - Step 17585: {'lr': 0.00019997522063360928, 'samples': 562720, 'steps': 1099, 'loss/train': 5.242280960083008} -09/20/2021 18:17:44 - INFO - __main__ - Step 17586: {'lr': 0.00019997522063360928, 'samples': 562752, 'steps': 1099, 'loss/train': 1.8553142547607422} -09/20/2021 18:17:44 - INFO - __main__ - Step 17587: {'lr': 0.00019997522063360928, 'samples': 562784, 'steps': 1099, 'loss/train': 0.7585399746894836} -09/20/2021 18:17:45 - INFO - __main__ - Step 17588: {'lr': 0.00019997522063360928, 'samples': 562816, 'steps': 1099, 'loss/train': 0.6772764921188354} -09/20/2021 18:17:46 - INFO - __main__ - Step 17589: {'lr': 0.00019997522063360928, 'samples': 562848, 'steps': 1099, 'loss/train': 3.412358045578003} -09/20/2021 18:17:47 - INFO - __main__ - Step 17590: {'lr': 0.00019997522063360928, 'samples': 562880, 'steps': 1099, 'loss/train': 3.4789116382598877} -09/20/2021 18:17:47 - INFO - __main__ - Step 17591: {'lr': 0.00019997522063360928, 'samples': 562912, 'steps': 1099, 'loss/train': 4.282179832458496} -09/20/2021 18:17:48 - INFO - __main__ - Step 17592: {'lr': 0.00019997522063360928, 'samples': 562944, 'steps': 1099, 'loss/train': 3.4588446617126465} -09/20/2021 18:17:49 - INFO - __main__ - Step 17593: {'lr': 0.00019997522063360928, 'samples': 562976, 'steps': 1099, 'loss/train': 2.8378384113311768} -09/20/2021 18:17:50 - INFO - __main__ - Step 17594: {'lr': 0.00019997522063360928, 'samples': 563008, 'steps': 1099, 'loss/train': 4.152557849884033} -09/20/2021 18:17:50 - INFO - __main__ - Step 17595: {'lr': 0.00019997522063360928, 'samples': 563040, 'steps': 1099, 'loss/train': 3.2850732803344727} -09/20/2021 18:17:51 - INFO - __main__ - Step 17596: {'lr': 0.00019997522063360928, 'samples': 563072, 'steps': 1099, 'loss/train': 5.9065704345703125} -09/20/2021 18:17:52 - INFO - __main__ - Step 17597: {'lr': 0.00019997522063360928, 'samples': 563104, 'steps': 1099, 'loss/train': 3.3236522674560547} -09/20/2021 18:17:53 - INFO - __main__ - Step 17598: {'lr': 0.00019997522063360928, 'samples': 563136, 'steps': 1099, 'loss/train': 2.956244707107544} -09/20/2021 18:17:53 - INFO - __main__ - Step 17599: {'lr': 0.00019997522063360928, 'samples': 563168, 'steps': 1099, 'loss/train': 3.8312199115753174} -09/20/2021 18:17:55 - INFO - __main__ - Step 17600: {'lr': 0.00019997522063360928, 'samples': 563200, 'steps': 1099, 'loss/train': 5.646371841430664} -09/20/2021 18:17:56 - INFO - __main__ - Step 17601: {'lr': 0.00019997507843397513, 'samples': 563232, 'steps': 1100, 'loss/train': 4.929378986358643} -09/20/2021 18:17:56 - INFO - __main__ - Step 17602: {'lr': 0.00019997507843397513, 'samples': 563264, 'steps': 1100, 'loss/train': 3.792506694793701} -09/20/2021 18:17:57 - INFO - __main__ - Step 17603: {'lr': 0.00019997507843397513, 'samples': 563296, 'steps': 1100, 'loss/train': 3.279555320739746} -09/20/2021 18:17:58 - INFO - __main__ - Step 17604: {'lr': 0.00019997507843397513, 'samples': 563328, 'steps': 1100, 'loss/train': 3.4599990844726562} -09/20/2021 18:17:59 - INFO - __main__ - Step 17605: {'lr': 0.00019997507843397513, 'samples': 563360, 'steps': 1100, 'loss/train': 4.037339687347412} -09/20/2021 18:17:59 - INFO - __main__ - Step 17606: {'lr': 0.00019997507843397513, 'samples': 563392, 'steps': 1100, 'loss/train': 3.804150342941284} -09/20/2021 18:18:00 - INFO - __main__ - Step 17607: {'lr': 0.00019997507843397513, 'samples': 563424, 'steps': 1100, 'loss/train': 4.263143539428711} -09/20/2021 18:18:01 - INFO - __main__ - Step 17608: {'lr': 0.00019997507843397513, 'samples': 563456, 'steps': 1100, 'loss/train': 3.7393319606781006} -09/20/2021 18:18:02 - INFO - __main__ - Step 17609: {'lr': 0.00019997507843397513, 'samples': 563488, 'steps': 1100, 'loss/train': 3.400831460952759} -09/20/2021 18:18:02 - INFO - __main__ - Step 17610: {'lr': 0.00019997507843397513, 'samples': 563520, 'steps': 1100, 'loss/train': 3.72876238822937} -09/20/2021 18:18:03 - INFO - __main__ - Step 17611: {'lr': 0.00019997507843397513, 'samples': 563552, 'steps': 1100, 'loss/train': 3.380934238433838} -09/20/2021 18:18:04 - INFO - __main__ - Step 17612: {'lr': 0.00019997507843397513, 'samples': 563584, 'steps': 1100, 'loss/train': 3.425039529800415} -09/20/2021 18:18:05 - INFO - __main__ - Step 17613: {'lr': 0.00019997507843397513, 'samples': 563616, 'steps': 1100, 'loss/train': 4.053210258483887} -09/20/2021 18:18:05 - INFO - __main__ - Step 17614: {'lr': 0.00019997507843397513, 'samples': 563648, 'steps': 1100, 'loss/train': 3.699765205383301} -09/20/2021 18:18:06 - INFO - __main__ - Step 17615: {'lr': 0.00019997507843397513, 'samples': 563680, 'steps': 1100, 'loss/train': 4.095494747161865} -09/20/2021 18:18:07 - INFO - __main__ - Step 17616: {'lr': 0.00019997507843397513, 'samples': 563712, 'steps': 1100, 'loss/train': 3.397202253341675} -09/20/2021 18:18:08 - INFO - __main__ - Step 17617: {'lr': 0.0001999749358275428, 'samples': 563744, 'steps': 1101, 'loss/train': 3.4482998847961426} -09/20/2021 18:18:09 - INFO - __main__ - Step 17618: {'lr': 0.0001999749358275428, 'samples': 563776, 'steps': 1101, 'loss/train': 0.7302063703536987} -09/20/2021 18:18:09 - INFO - __main__ - Step 17619: {'lr': 0.0001999749358275428, 'samples': 563808, 'steps': 1101, 'loss/train': 3.1619489192962646} -09/20/2021 18:18:10 - INFO - __main__ - Step 17620: {'lr': 0.0001999749358275428, 'samples': 563840, 'steps': 1101, 'loss/train': 3.4115493297576904} -09/20/2021 18:18:11 - INFO - __main__ - Step 17621: {'lr': 0.0001999749358275428, 'samples': 563872, 'steps': 1101, 'loss/train': 4.112274169921875} -09/20/2021 18:18:12 - INFO - __main__ - Step 17622: {'lr': 0.0001999749358275428, 'samples': 563904, 'steps': 1101, 'loss/train': 3.6436824798583984} -09/20/2021 18:18:12 - INFO - __main__ - Step 17623: {'lr': 0.0001999749358275428, 'samples': 563936, 'steps': 1101, 'loss/train': 4.402100563049316} -09/20/2021 18:18:13 - INFO - __main__ - Step 17624: {'lr': 0.0001999749358275428, 'samples': 563968, 'steps': 1101, 'loss/train': 3.223247528076172} -09/20/2021 18:18:14 - INFO - __main__ - Step 17625: {'lr': 0.0001999749358275428, 'samples': 564000, 'steps': 1101, 'loss/train': 1.2153465747833252} -09/20/2021 18:18:15 - INFO - __main__ - Step 17626: {'lr': 0.0001999749358275428, 'samples': 564032, 'steps': 1101, 'loss/train': 4.46165132522583} -09/20/2021 18:18:15 - INFO - __main__ - Step 17627: {'lr': 0.0001999749358275428, 'samples': 564064, 'steps': 1101, 'loss/train': 2.216264247894287} -09/20/2021 18:18:16 - INFO - __main__ - Step 17628: {'lr': 0.0001999749358275428, 'samples': 564096, 'steps': 1101, 'loss/train': 3.338136911392212} -09/20/2021 18:18:17 - INFO - __main__ - Step 17629: {'lr': 0.0001999749358275428, 'samples': 564128, 'steps': 1101, 'loss/train': 3.3715126514434814} -09/20/2021 18:18:18 - INFO - __main__ - Step 17630: {'lr': 0.0001999749358275428, 'samples': 564160, 'steps': 1101, 'loss/train': 3.294051170349121} -09/20/2021 18:18:18 - INFO - __main__ - Step 17631: {'lr': 0.0001999749358275428, 'samples': 564192, 'steps': 1101, 'loss/train': 0.8630937933921814} -09/20/2021 18:18:20 - INFO - __main__ - Step 17632: {'lr': 0.0001999749358275428, 'samples': 564224, 'steps': 1101, 'loss/train': 1.8599920272827148} -09/20/2021 18:18:21 - INFO - __main__ - Step 17633: {'lr': 0.00019997479281431285, 'samples': 564256, 'steps': 1102, 'loss/train': 3.3375139236450195} -09/20/2021 18:18:21 - INFO - __main__ - Step 17634: {'lr': 0.00019997479281431285, 'samples': 564288, 'steps': 1102, 'loss/train': 3.128464698791504} -09/20/2021 18:18:22 - INFO - __main__ - Step 17635: {'lr': 0.00019997479281431285, 'samples': 564320, 'steps': 1102, 'loss/train': 0.8243982791900635} -09/20/2021 18:18:23 - INFO - __main__ - Step 17636: {'lr': 0.00019997479281431285, 'samples': 564352, 'steps': 1102, 'loss/train': 0.6344307661056519} -09/20/2021 18:18:24 - INFO - __main__ - Step 17637: {'lr': 0.00019997479281431285, 'samples': 564384, 'steps': 1102, 'loss/train': 0.41869404911994934} -09/20/2021 18:18:24 - INFO - __main__ - Step 17638: {'lr': 0.00019997479281431285, 'samples': 564416, 'steps': 1102, 'loss/train': 3.137112617492676} -09/20/2021 18:18:25 - INFO - __main__ - Step 17639: {'lr': 0.00019997479281431285, 'samples': 564448, 'steps': 1102, 'loss/train': 3.165626287460327} -09/20/2021 18:18:26 - INFO - __main__ - Step 17640: {'lr': 0.00019997479281431285, 'samples': 564480, 'steps': 1102, 'loss/train': 3.3104913234710693} -09/20/2021 18:18:27 - INFO - __main__ - Step 17641: {'lr': 0.00019997479281431285, 'samples': 564512, 'steps': 1102, 'loss/train': 4.411685466766357} -09/20/2021 18:18:27 - INFO - __main__ - Step 17642: {'lr': 0.00019997479281431285, 'samples': 564544, 'steps': 1102, 'loss/train': 3.6278252601623535} -09/20/2021 18:18:28 - INFO - __main__ - Step 17643: {'lr': 0.00019997479281431285, 'samples': 564576, 'steps': 1102, 'loss/train': 3.7716522216796875} -09/20/2021 18:18:29 - INFO - __main__ - Step 17644: {'lr': 0.00019997479281431285, 'samples': 564608, 'steps': 1102, 'loss/train': 2.79186749458313} -09/20/2021 18:18:30 - INFO - __main__ - Step 17645: {'lr': 0.00019997479281431285, 'samples': 564640, 'steps': 1102, 'loss/train': 3.399505376815796} -09/20/2021 18:18:30 - INFO - __main__ - Step 17646: {'lr': 0.00019997479281431285, 'samples': 564672, 'steps': 1102, 'loss/train': 3.8208112716674805} -09/20/2021 18:18:31 - INFO - __main__ - Step 17647: {'lr': 0.00019997479281431285, 'samples': 564704, 'steps': 1102, 'loss/train': 3.6722700595855713} -09/20/2021 18:18:32 - INFO - __main__ - Step 17648: {'lr': 0.00019997479281431285, 'samples': 564736, 'steps': 1102, 'loss/train': 4.981867790222168} -09/20/2021 18:18:33 - INFO - __main__ - Step 17649: {'lr': 0.00019997464939428583, 'samples': 564768, 'steps': 1103, 'loss/train': 3.6880745887756348} -09/20/2021 18:18:33 - INFO - __main__ - Step 17650: {'lr': 0.00019997464939428583, 'samples': 564800, 'steps': 1103, 'loss/train': 4.882482051849365} -09/20/2021 18:18:34 - INFO - __main__ - Step 17651: {'lr': 0.00019997464939428583, 'samples': 564832, 'steps': 1103, 'loss/train': 3.507995367050171} -09/20/2021 18:18:35 - INFO - __main__ - Step 17652: {'lr': 0.00019997464939428583, 'samples': 564864, 'steps': 1103, 'loss/train': 3.901358127593994} -09/20/2021 18:18:36 - INFO - __main__ - Step 17653: {'lr': 0.00019997464939428583, 'samples': 564896, 'steps': 1103, 'loss/train': 3.914255142211914} -09/20/2021 18:18:36 - INFO - __main__ - Step 17654: {'lr': 0.00019997464939428583, 'samples': 564928, 'steps': 1103, 'loss/train': 4.085308074951172} -09/20/2021 18:18:37 - INFO - __main__ - Step 17655: {'lr': 0.00019997464939428583, 'samples': 564960, 'steps': 1103, 'loss/train': 3.7698252201080322} -09/20/2021 18:18:38 - INFO - __main__ - Step 17656: {'lr': 0.00019997464939428583, 'samples': 564992, 'steps': 1103, 'loss/train': 3.832876682281494} -09/20/2021 18:18:39 - INFO - __main__ - Step 17657: {'lr': 0.00019997464939428583, 'samples': 565024, 'steps': 1103, 'loss/train': 3.297182321548462} -09/20/2021 18:18:39 - INFO - __main__ - Step 17658: {'lr': 0.00019997464939428583, 'samples': 565056, 'steps': 1103, 'loss/train': 3.459866523742676} -09/20/2021 18:18:40 - INFO - __main__ - Step 17659: {'lr': 0.00019997464939428583, 'samples': 565088, 'steps': 1103, 'loss/train': 3.0702266693115234} -09/20/2021 18:18:41 - INFO - __main__ - Step 17660: {'lr': 0.00019997464939428583, 'samples': 565120, 'steps': 1103, 'loss/train': 3.720303535461426} -09/20/2021 18:18:42 - INFO - __main__ - Step 17661: {'lr': 0.00019997464939428583, 'samples': 565152, 'steps': 1103, 'loss/train': 4.3037943840026855} -09/20/2021 18:18:43 - INFO - __main__ - Step 17662: {'lr': 0.00019997464939428583, 'samples': 565184, 'steps': 1103, 'loss/train': 2.109732151031494} -09/20/2021 18:18:44 - INFO - __main__ - Step 17663: {'lr': 0.00019997464939428583, 'samples': 565216, 'steps': 1103, 'loss/train': 3.9725215435028076} -09/20/2021 18:18:44 - INFO - __main__ - Step 17664: {'lr': 0.00019997464939428583, 'samples': 565248, 'steps': 1103, 'loss/train': 3.5211360454559326} -09/20/2021 18:18:45 - INFO - __main__ - Step 17665: {'lr': 0.00019997450556746239, 'samples': 565280, 'steps': 1104, 'loss/train': 4.494734287261963} -09/20/2021 18:18:46 - INFO - __main__ - Step 17666: {'lr': 0.00019997450556746239, 'samples': 565312, 'steps': 1104, 'loss/train': 3.5984714031219482} -09/20/2021 18:18:47 - INFO - __main__ - Step 17667: {'lr': 0.00019997450556746239, 'samples': 565344, 'steps': 1104, 'loss/train': 3.603599786758423} -09/20/2021 18:18:48 - INFO - __main__ - Step 17668: {'lr': 0.00019997450556746239, 'samples': 565376, 'steps': 1104, 'loss/train': 3.922145128250122} -09/20/2021 18:18:48 - INFO - __main__ - Step 17669: {'lr': 0.00019997450556746239, 'samples': 565408, 'steps': 1104, 'loss/train': 2.508526086807251} -09/20/2021 18:18:49 - INFO - __main__ - Step 17670: {'lr': 0.00019997450556746239, 'samples': 565440, 'steps': 1104, 'loss/train': 3.786189556121826} -09/20/2021 18:18:50 - INFO - __main__ - Step 17671: {'lr': 0.00019997450556746239, 'samples': 565472, 'steps': 1104, 'loss/train': 3.6321053504943848} -09/20/2021 18:18:51 - INFO - __main__ - Step 17672: {'lr': 0.00019997450556746239, 'samples': 565504, 'steps': 1104, 'loss/train': 4.030109882354736} -09/20/2021 18:18:51 - INFO - __main__ - Step 17673: {'lr': 0.00019997450556746239, 'samples': 565536, 'steps': 1104, 'loss/train': 3.531310558319092} -09/20/2021 18:18:52 - INFO - __main__ - Step 17674: {'lr': 0.00019997450556746239, 'samples': 565568, 'steps': 1104, 'loss/train': 3.750467538833618} -09/20/2021 18:18:53 - INFO - __main__ - Step 17675: {'lr': 0.00019997450556746239, 'samples': 565600, 'steps': 1104, 'loss/train': 3.2873408794403076} -09/20/2021 18:18:54 - INFO - __main__ - Step 17676: {'lr': 0.00019997450556746239, 'samples': 565632, 'steps': 1104, 'loss/train': 2.958845853805542} -09/20/2021 18:18:54 - INFO - __main__ - Step 17677: {'lr': 0.00019997450556746239, 'samples': 565664, 'steps': 1104, 'loss/train': 4.265876293182373} -09/20/2021 18:18:55 - INFO - __main__ - Step 17678: {'lr': 0.00019997450556746239, 'samples': 565696, 'steps': 1104, 'loss/train': 4.353448390960693} -09/20/2021 18:18:56 - INFO - __main__ - Step 17679: {'lr': 0.00019997450556746239, 'samples': 565728, 'steps': 1104, 'loss/train': 3.7225091457366943} -09/20/2021 18:18:57 - INFO - __main__ - Step 17680: {'lr': 0.00019997450556746239, 'samples': 565760, 'steps': 1104, 'loss/train': 3.3673741817474365} -09/20/2021 18:18:57 - INFO - __main__ - Step 17681: {'lr': 0.00019997436133384303, 'samples': 565792, 'steps': 1105, 'loss/train': 3.2574052810668945} -09/20/2021 18:18:58 - INFO - __main__ - Step 17682: {'lr': 0.00019997436133384303, 'samples': 565824, 'steps': 1105, 'loss/train': 3.1795120239257812} -09/20/2021 18:18:59 - INFO - __main__ - Step 17683: {'lr': 0.00019997436133384303, 'samples': 565856, 'steps': 1105, 'loss/train': 3.5540356636047363} -09/20/2021 18:19:00 - INFO - __main__ - Step 17684: {'lr': 0.00019997436133384303, 'samples': 565888, 'steps': 1105, 'loss/train': 3.6151249408721924} -09/20/2021 18:19:00 - INFO - __main__ - Step 17685: {'lr': 0.00019997436133384303, 'samples': 565920, 'steps': 1105, 'loss/train': 4.185362815856934} -09/20/2021 18:19:01 - INFO - __main__ - Step 17686: {'lr': 0.00019997436133384303, 'samples': 565952, 'steps': 1105, 'loss/train': 4.275386333465576} -09/20/2021 18:19:02 - INFO - __main__ - Step 17687: {'lr': 0.00019997436133384303, 'samples': 565984, 'steps': 1105, 'loss/train': 3.692857265472412} -09/20/2021 18:19:03 - INFO - __main__ - Step 17688: {'lr': 0.00019997436133384303, 'samples': 566016, 'steps': 1105, 'loss/train': 4.749524116516113} -09/20/2021 18:19:03 - INFO - __main__ - Step 17689: {'lr': 0.00019997436133384303, 'samples': 566048, 'steps': 1105, 'loss/train': 3.1059064865112305} -09/20/2021 18:19:04 - INFO - __main__ - Step 17690: {'lr': 0.00019997436133384303, 'samples': 566080, 'steps': 1105, 'loss/train': 3.4071507453918457} -09/20/2021 18:19:05 - INFO - __main__ - Step 17691: {'lr': 0.00019997436133384303, 'samples': 566112, 'steps': 1105, 'loss/train': 3.790972948074341} -09/20/2021 18:19:06 - INFO - __main__ - Step 17692: {'lr': 0.00019997436133384303, 'samples': 566144, 'steps': 1105, 'loss/train': 3.7137279510498047} -09/20/2021 18:19:07 - INFO - __main__ - Step 17693: {'lr': 0.00019997436133384303, 'samples': 566176, 'steps': 1105, 'loss/train': 3.6530206203460693} -09/20/2021 18:19:08 - INFO - __main__ - Step 17694: {'lr': 0.00019997436133384303, 'samples': 566208, 'steps': 1105, 'loss/train': 3.4625296592712402} -09/20/2021 18:19:09 - INFO - __main__ - Step 17695: {'lr': 0.00019997436133384303, 'samples': 566240, 'steps': 1105, 'loss/train': 4.596475124359131} -09/20/2021 18:19:09 - INFO - __main__ - Step 17696: {'lr': 0.00019997436133384303, 'samples': 566272, 'steps': 1105, 'loss/train': 2.876271963119507} -09/20/2021 18:19:10 - INFO - __main__ - Step 17697: {'lr': 0.00019997421669342843, 'samples': 566304, 'steps': 1106, 'loss/train': 3.3969626426696777} -09/20/2021 18:19:11 - INFO - __main__ - Step 17698: {'lr': 0.00019997421669342843, 'samples': 566336, 'steps': 1106, 'loss/train': 2.927900791168213} -09/20/2021 18:19:12 - INFO - __main__ - Step 17699: {'lr': 0.00019997421669342843, 'samples': 566368, 'steps': 1106, 'loss/train': 4.170243740081787} -09/20/2021 18:19:12 - INFO - __main__ - Step 17700: {'lr': 0.00019997421669342843, 'samples': 566400, 'steps': 1106, 'loss/train': 4.429274559020996} -09/20/2021 18:19:13 - INFO - __main__ - Step 17701: {'lr': 0.00019997421669342843, 'samples': 566432, 'steps': 1106, 'loss/train': 2.6922385692596436} -09/20/2021 18:19:14 - INFO - __main__ - Step 17702: {'lr': 0.00019997421669342843, 'samples': 566464, 'steps': 1106, 'loss/train': 4.877591609954834} -09/20/2021 18:19:15 - INFO - __main__ - Step 17703: {'lr': 0.00019997421669342843, 'samples': 566496, 'steps': 1106, 'loss/train': 4.196936130523682} -09/20/2021 18:19:15 - INFO - __main__ - Step 17704: {'lr': 0.00019997421669342843, 'samples': 566528, 'steps': 1106, 'loss/train': 3.8149707317352295} -09/20/2021 18:19:16 - INFO - __main__ - Step 17705: {'lr': 0.00019997421669342843, 'samples': 566560, 'steps': 1106, 'loss/train': 4.0096588134765625} -09/20/2021 18:19:17 - INFO - __main__ - Step 17706: {'lr': 0.00019997421669342843, 'samples': 566592, 'steps': 1106, 'loss/train': 2.570256233215332} -09/20/2021 18:19:18 - INFO - __main__ - Step 17707: {'lr': 0.00019997421669342843, 'samples': 566624, 'steps': 1106, 'loss/train': 1.91389799118042} -09/20/2021 18:19:18 - INFO - __main__ - Step 17708: {'lr': 0.00019997421669342843, 'samples': 566656, 'steps': 1106, 'loss/train': 2.494835376739502} -09/20/2021 18:19:19 - INFO - __main__ - Step 17709: {'lr': 0.00019997421669342843, 'samples': 566688, 'steps': 1106, 'loss/train': 5.224238872528076} -09/20/2021 18:19:20 - INFO - __main__ - Step 17710: {'lr': 0.00019997421669342843, 'samples': 566720, 'steps': 1106, 'loss/train': 5.04617977142334} -09/20/2021 18:19:21 - INFO - __main__ - Step 17711: {'lr': 0.00019997421669342843, 'samples': 566752, 'steps': 1106, 'loss/train': 3.4952189922332764} -09/20/2021 18:19:21 - INFO - __main__ - Step 17712: {'lr': 0.00019997421669342843, 'samples': 566784, 'steps': 1106, 'loss/train': 3.1331846714019775} -09/20/2021 18:19:22 - INFO - __main__ - Step 17713: {'lr': 0.00019997407164621907, 'samples': 566816, 'steps': 1107, 'loss/train': 3.9341225624084473} -09/20/2021 18:19:23 - INFO - __main__ - Step 17714: {'lr': 0.00019997407164621907, 'samples': 566848, 'steps': 1107, 'loss/train': 4.905085563659668} -09/20/2021 18:19:24 - INFO - __main__ - Step 17715: {'lr': 0.00019997407164621907, 'samples': 566880, 'steps': 1107, 'loss/train': 4.623324394226074} -09/20/2021 18:19:25 - INFO - __main__ - Step 17716: {'lr': 0.00019997407164621907, 'samples': 566912, 'steps': 1107, 'loss/train': 4.758481502532959} -09/20/2021 18:19:25 - INFO - __main__ - Step 17717: {'lr': 0.00019997407164621907, 'samples': 566944, 'steps': 1107, 'loss/train': 3.2927780151367188} -09/20/2021 18:19:26 - INFO - __main__ - Step 17718: {'lr': 0.00019997407164621907, 'samples': 566976, 'steps': 1107, 'loss/train': 4.208250522613525} -09/20/2021 18:19:27 - INFO - __main__ - Step 17719: {'lr': 0.00019997407164621907, 'samples': 567008, 'steps': 1107, 'loss/train': 3.65452241897583} -09/20/2021 18:19:28 - INFO - __main__ - Step 17720: {'lr': 0.00019997407164621907, 'samples': 567040, 'steps': 1107, 'loss/train': 4.191433429718018} -09/20/2021 18:19:28 - INFO - __main__ - Step 17721: {'lr': 0.00019997407164621907, 'samples': 567072, 'steps': 1107, 'loss/train': 3.803457498550415} -09/20/2021 18:19:29 - INFO - __main__ - Step 17722: {'lr': 0.00019997407164621907, 'samples': 567104, 'steps': 1107, 'loss/train': 2.6983046531677246} -09/20/2021 18:19:30 - INFO - __main__ - Step 17723: {'lr': 0.00019997407164621907, 'samples': 567136, 'steps': 1107, 'loss/train': 3.3800275325775146} -09/20/2021 18:19:32 - INFO - __main__ - Step 17724: {'lr': 0.00019997407164621907, 'samples': 567168, 'steps': 1107, 'loss/train': 4.013407230377197} -09/20/2021 18:19:33 - INFO - __main__ - Step 17725: {'lr': 0.00019997407164621907, 'samples': 567200, 'steps': 1107, 'loss/train': 3.697390556335449} -09/20/2021 18:19:33 - INFO - __main__ - Step 17726: {'lr': 0.00019997407164621907, 'samples': 567232, 'steps': 1107, 'loss/train': 1.7782386541366577} -09/20/2021 18:19:34 - INFO - __main__ - Step 17727: {'lr': 0.00019997407164621907, 'samples': 567264, 'steps': 1107, 'loss/train': 2.9758710861206055} -09/20/2021 18:19:35 - INFO - __main__ - Step 17728: {'lr': 0.00019997407164621907, 'samples': 567296, 'steps': 1107, 'loss/train': 1.896484136581421} -09/20/2021 18:19:36 - INFO - __main__ - Step 17729: {'lr': 0.00019997392619221563, 'samples': 567328, 'steps': 1108, 'loss/train': 2.0073487758636475} -09/20/2021 18:19:37 - INFO - __main__ - Step 17730: {'lr': 0.00019997392619221563, 'samples': 567360, 'steps': 1108, 'loss/train': 2.456695318222046} -09/20/2021 18:19:37 - INFO - __main__ - Step 17731: {'lr': 0.00019997392619221563, 'samples': 567392, 'steps': 1108, 'loss/train': 2.336609125137329} -09/20/2021 18:19:38 - INFO - __main__ - Step 17732: {'lr': 0.00019997392619221563, 'samples': 567424, 'steps': 1108, 'loss/train': 4.350268363952637} -09/20/2021 18:19:39 - INFO - __main__ - Step 17733: {'lr': 0.00019997392619221563, 'samples': 567456, 'steps': 1108, 'loss/train': 2.7884457111358643} -09/20/2021 18:19:40 - INFO - __main__ - Step 17734: {'lr': 0.00019997392619221563, 'samples': 567488, 'steps': 1108, 'loss/train': 3.5748181343078613} -09/20/2021 18:19:40 - INFO - __main__ - Step 17735: {'lr': 0.00019997392619221563, 'samples': 567520, 'steps': 1108, 'loss/train': 4.763692378997803} -09/20/2021 18:19:41 - INFO - __main__ - Step 17736: {'lr': 0.00019997392619221563, 'samples': 567552, 'steps': 1108, 'loss/train': 4.463405609130859} -09/20/2021 18:19:42 - INFO - __main__ - Step 17737: {'lr': 0.00019997392619221563, 'samples': 567584, 'steps': 1108, 'loss/train': 3.4792308807373047} -09/20/2021 18:19:43 - INFO - __main__ - Step 17738: {'lr': 0.00019997392619221563, 'samples': 567616, 'steps': 1108, 'loss/train': 1.2242945432662964} -09/20/2021 18:19:43 - INFO - __main__ - Step 17739: {'lr': 0.00019997392619221563, 'samples': 567648, 'steps': 1108, 'loss/train': 4.298001766204834} -09/20/2021 18:19:44 - INFO - __main__ - Step 17740: {'lr': 0.00019997392619221563, 'samples': 567680, 'steps': 1108, 'loss/train': 2.2542545795440674} -09/20/2021 18:19:45 - INFO - __main__ - Step 17741: {'lr': 0.00019997392619221563, 'samples': 567712, 'steps': 1108, 'loss/train': 3.9170422554016113} -09/20/2021 18:19:46 - INFO - __main__ - Step 17742: {'lr': 0.00019997392619221563, 'samples': 567744, 'steps': 1108, 'loss/train': 3.216339111328125} -09/20/2021 18:19:46 - INFO - __main__ - Step 17743: {'lr': 0.00019997392619221563, 'samples': 567776, 'steps': 1108, 'loss/train': 2.9325709342956543} -09/20/2021 18:19:47 - INFO - __main__ - Step 17744: {'lr': 0.00019997392619221563, 'samples': 567808, 'steps': 1108, 'loss/train': 3.9589855670928955} -09/20/2021 18:19:48 - INFO - __main__ - Step 17745: {'lr': 0.0001999737803314187, 'samples': 567840, 'steps': 1109, 'loss/train': 3.768962860107422} -09/20/2021 18:19:49 - INFO - __main__ - Step 17746: {'lr': 0.0001999737803314187, 'samples': 567872, 'steps': 1109, 'loss/train': 4.276936054229736} -09/20/2021 18:19:49 - INFO - __main__ - Step 17747: {'lr': 0.0001999737803314187, 'samples': 567904, 'steps': 1109, 'loss/train': 3.474196434020996} -09/20/2021 18:19:50 - INFO - __main__ - Step 17748: {'lr': 0.0001999737803314187, 'samples': 567936, 'steps': 1109, 'loss/train': 4.096036911010742} -09/20/2021 18:19:51 - INFO - __main__ - Step 17749: {'lr': 0.0001999737803314187, 'samples': 567968, 'steps': 1109, 'loss/train': 3.4570772647857666} -09/20/2021 18:19:52 - INFO - __main__ - Step 17750: {'lr': 0.0001999737803314187, 'samples': 568000, 'steps': 1109, 'loss/train': 2.5114941596984863} -09/20/2021 18:19:52 - INFO - __main__ - Step 17751: {'lr': 0.0001999737803314187, 'samples': 568032, 'steps': 1109, 'loss/train': 4.639925956726074} -09/20/2021 18:19:53 - INFO - __main__ - Step 17752: {'lr': 0.0001999737803314187, 'samples': 568064, 'steps': 1109, 'loss/train': 3.6967875957489014} -09/20/2021 18:19:54 - INFO - __main__ - Step 17753: {'lr': 0.0001999737803314187, 'samples': 568096, 'steps': 1109, 'loss/train': 4.13278865814209} -09/20/2021 18:19:55 - INFO - __main__ - Step 17754: {'lr': 0.0001999737803314187, 'samples': 568128, 'steps': 1109, 'loss/train': 3.9847190380096436} -09/20/2021 18:19:55 - INFO - __main__ - Step 17755: {'lr': 0.0001999737803314187, 'samples': 568160, 'steps': 1109, 'loss/train': 3.677455425262451} -09/20/2021 18:19:57 - INFO - __main__ - Step 17756: {'lr': 0.0001999737803314187, 'samples': 568192, 'steps': 1109, 'loss/train': 4.061310768127441} -09/20/2021 18:19:58 - INFO - __main__ - Step 17757: {'lr': 0.0001999737803314187, 'samples': 568224, 'steps': 1109, 'loss/train': 3.7461588382720947} -09/20/2021 18:19:59 - INFO - __main__ - Step 17758: {'lr': 0.0001999737803314187, 'samples': 568256, 'steps': 1109, 'loss/train': 1.6188331842422485} -09/20/2021 18:20:00 - INFO - __main__ - Step 17759: {'lr': 0.0001999737803314187, 'samples': 568288, 'steps': 1109, 'loss/train': 3.897399663925171} -09/20/2021 18:20:00 - INFO - __main__ - Step 17760: {'lr': 0.0001999737803314187, 'samples': 568320, 'steps': 1109, 'loss/train': 3.6999151706695557} -09/20/2021 18:20:01 - INFO - __main__ - Step 17761: {'lr': 0.0001999736340638288, 'samples': 568352, 'steps': 1110, 'loss/train': 3.8561758995056152} -09/20/2021 18:20:02 - INFO - __main__ - Step 17762: {'lr': 0.0001999736340638288, 'samples': 568384, 'steps': 1110, 'loss/train': 0.7670493721961975} -09/20/2021 18:20:03 - INFO - __main__ - Step 17763: {'lr': 0.0001999736340638288, 'samples': 568416, 'steps': 1110, 'loss/train': 3.6711411476135254} -09/20/2021 18:20:03 - INFO - __main__ - Step 17764: {'lr': 0.0001999736340638288, 'samples': 568448, 'steps': 1110, 'loss/train': 4.089969635009766} -09/20/2021 18:20:04 - INFO - __main__ - Step 17765: {'lr': 0.0001999736340638288, 'samples': 568480, 'steps': 1110, 'loss/train': 3.3468751907348633} -09/20/2021 18:20:05 - INFO - __main__ - Step 17766: {'lr': 0.0001999736340638288, 'samples': 568512, 'steps': 1110, 'loss/train': 4.016305446624756} -09/20/2021 18:20:06 - INFO - __main__ - Step 17767: {'lr': 0.0001999736340638288, 'samples': 568544, 'steps': 1110, 'loss/train': 4.134451866149902} -09/20/2021 18:20:06 - INFO - __main__ - Step 17768: {'lr': 0.0001999736340638288, 'samples': 568576, 'steps': 1110, 'loss/train': 2.5933353900909424} -09/20/2021 18:20:07 - INFO - __main__ - Step 17769: {'lr': 0.0001999736340638288, 'samples': 568608, 'steps': 1110, 'loss/train': 3.4824485778808594} -09/20/2021 18:20:08 - INFO - __main__ - Step 17770: {'lr': 0.0001999736340638288, 'samples': 568640, 'steps': 1110, 'loss/train': 3.8743321895599365} -09/20/2021 18:20:09 - INFO - __main__ - Step 17771: {'lr': 0.0001999736340638288, 'samples': 568672, 'steps': 1110, 'loss/train': 3.9716689586639404} -09/20/2021 18:20:09 - INFO - __main__ - Step 17772: {'lr': 0.0001999736340638288, 'samples': 568704, 'steps': 1110, 'loss/train': 3.3713796138763428} -09/20/2021 18:20:10 - INFO - __main__ - Step 17773: {'lr': 0.0001999736340638288, 'samples': 568736, 'steps': 1110, 'loss/train': 2.6306216716766357} -09/20/2021 18:20:11 - INFO - __main__ - Step 17774: {'lr': 0.0001999736340638288, 'samples': 568768, 'steps': 1110, 'loss/train': 3.0997607707977295} -09/20/2021 18:20:12 - INFO - __main__ - Step 17775: {'lr': 0.0001999736340638288, 'samples': 568800, 'steps': 1110, 'loss/train': 3.4885621070861816} -09/20/2021 18:20:12 - INFO - __main__ - Step 17776: {'lr': 0.0001999736340638288, 'samples': 568832, 'steps': 1110, 'loss/train': 3.4147939682006836} -09/20/2021 18:20:13 - INFO - __main__ - Step 17777: {'lr': 0.00019997348738944658, 'samples': 568864, 'steps': 1111, 'loss/train': 3.7286264896392822} -09/20/2021 18:20:14 - INFO - __main__ - Step 17778: {'lr': 0.00019997348738944658, 'samples': 568896, 'steps': 1111, 'loss/train': 2.139417886734009} -09/20/2021 18:20:15 - INFO - __main__ - Step 17779: {'lr': 0.00019997348738944658, 'samples': 568928, 'steps': 1111, 'loss/train': 1.4831385612487793} -09/20/2021 18:20:16 - INFO - __main__ - Step 17780: {'lr': 0.00019997348738944658, 'samples': 568960, 'steps': 1111, 'loss/train': 1.4525445699691772} -09/20/2021 18:20:16 - INFO - __main__ - Step 17781: {'lr': 0.00019997348738944658, 'samples': 568992, 'steps': 1111, 'loss/train': 0.9339725971221924} -09/20/2021 18:20:17 - INFO - __main__ - Step 17782: {'lr': 0.00019997348738944658, 'samples': 569024, 'steps': 1111, 'loss/train': 2.1031763553619385} -09/20/2021 18:20:18 - INFO - __main__ - Step 17783: {'lr': 0.00019997348738944658, 'samples': 569056, 'steps': 1111, 'loss/train': 1.672336220741272} -09/20/2021 18:20:19 - INFO - __main__ - Step 17784: {'lr': 0.00019997348738944658, 'samples': 569088, 'steps': 1111, 'loss/train': 2.0797834396362305} -09/20/2021 18:20:19 - INFO - __main__ - Step 17785: {'lr': 0.00019997348738944658, 'samples': 569120, 'steps': 1111, 'loss/train': 1.0187418460845947} -09/20/2021 18:20:21 - INFO - __main__ - Step 17786: {'lr': 0.00019997348738944658, 'samples': 569152, 'steps': 1111, 'loss/train': 3.9952945709228516} -09/20/2021 18:20:22 - INFO - __main__ - Step 17787: {'lr': 0.00019997348738944658, 'samples': 569184, 'steps': 1111, 'loss/train': 3.129784107208252} -09/20/2021 18:20:22 - INFO - __main__ - Step 17788: {'lr': 0.00019997348738944658, 'samples': 569216, 'steps': 1111, 'loss/train': 3.7903175354003906} -09/20/2021 18:20:23 - INFO - __main__ - Step 17789: {'lr': 0.00019997348738944658, 'samples': 569248, 'steps': 1111, 'loss/train': 3.2952194213867188} -09/20/2021 18:20:24 - INFO - __main__ - Step 17790: {'lr': 0.00019997348738944658, 'samples': 569280, 'steps': 1111, 'loss/train': 3.4764018058776855} -09/20/2021 18:20:25 - INFO - __main__ - Step 17791: {'lr': 0.00019997348738944658, 'samples': 569312, 'steps': 1111, 'loss/train': 4.5250563621521} -09/20/2021 18:20:25 - INFO - __main__ - Step 17792: {'lr': 0.00019997348738944658, 'samples': 569344, 'steps': 1111, 'loss/train': 3.600796937942505} -09/20/2021 18:20:26 - INFO - __main__ - Step 17793: {'lr': 0.00019997334030827263, 'samples': 569376, 'steps': 1112, 'loss/train': 3.626150608062744} -09/20/2021 18:20:27 - INFO - __main__ - Step 17794: {'lr': 0.00019997334030827263, 'samples': 569408, 'steps': 1112, 'loss/train': 4.280995845794678} -09/20/2021 18:20:28 - INFO - __main__ - Step 17795: {'lr': 0.00019997334030827263, 'samples': 569440, 'steps': 1112, 'loss/train': 3.786827802658081} -09/20/2021 18:20:28 - INFO - __main__ - Step 17796: {'lr': 0.00019997334030827263, 'samples': 569472, 'steps': 1112, 'loss/train': 2.491504192352295} -09/20/2021 18:20:29 - INFO - __main__ - Step 17797: {'lr': 0.00019997334030827263, 'samples': 569504, 'steps': 1112, 'loss/train': 4.727794647216797} -09/20/2021 18:20:30 - INFO - __main__ - Step 17798: {'lr': 0.00019997334030827263, 'samples': 569536, 'steps': 1112, 'loss/train': 0.6196144819259644} -09/20/2021 18:20:31 - INFO - __main__ - Step 17799: {'lr': 0.00019997334030827263, 'samples': 569568, 'steps': 1112, 'loss/train': 0.5341588854789734} -09/20/2021 18:20:31 - INFO - __main__ - Step 17800: {'lr': 0.00019997334030827263, 'samples': 569600, 'steps': 1112, 'loss/train': 3.1471641063690186} -09/20/2021 18:20:32 - INFO - __main__ - Step 17801: {'lr': 0.00019997334030827263, 'samples': 569632, 'steps': 1112, 'loss/train': 8.77700424194336} -09/20/2021 18:20:33 - INFO - __main__ - Step 17802: {'lr': 0.00019997334030827263, 'samples': 569664, 'steps': 1112, 'loss/train': 4.963926315307617} -09/20/2021 18:20:34 - INFO - __main__ - Step 17803: {'lr': 0.00019997334030827263, 'samples': 569696, 'steps': 1112, 'loss/train': 2.277273178100586} -09/20/2021 18:20:34 - INFO - __main__ - Step 17804: {'lr': 0.00019997334030827263, 'samples': 569728, 'steps': 1112, 'loss/train': 5.111617088317871} -09/20/2021 18:20:35 - INFO - __main__ - Step 17805: {'lr': 0.00019997334030827263, 'samples': 569760, 'steps': 1112, 'loss/train': 1.361990213394165} -09/20/2021 18:20:36 - INFO - __main__ - Step 17806: {'lr': 0.00019997334030827263, 'samples': 569792, 'steps': 1112, 'loss/train': 3.82271409034729} -09/20/2021 18:20:37 - INFO - __main__ - Step 17807: {'lr': 0.00019997334030827263, 'samples': 569824, 'steps': 1112, 'loss/train': 3.7863545417785645} -09/20/2021 18:20:37 - INFO - __main__ - Step 17808: {'lr': 0.00019997334030827263, 'samples': 569856, 'steps': 1112, 'loss/train': 3.982813835144043} -09/20/2021 18:20:38 - INFO - __main__ - Step 17809: {'lr': 0.00019997319282030756, 'samples': 569888, 'steps': 1113, 'loss/train': 3.2834198474884033} -09/20/2021 18:20:39 - INFO - __main__ - Step 17810: {'lr': 0.00019997319282030756, 'samples': 569920, 'steps': 1113, 'loss/train': 3.097074031829834} -09/20/2021 18:20:40 - INFO - __main__ - Step 17811: {'lr': 0.00019997319282030756, 'samples': 569952, 'steps': 1113, 'loss/train': 3.5463619232177734} -09/20/2021 18:20:41 - INFO - __main__ - Step 17812: {'lr': 0.00019997319282030756, 'samples': 569984, 'steps': 1113, 'loss/train': 3.424610137939453} -09/20/2021 18:20:41 - INFO - __main__ - Step 17813: {'lr': 0.00019997319282030756, 'samples': 570016, 'steps': 1113, 'loss/train': 4.298182010650635} -09/20/2021 18:20:42 - INFO - __main__ - Step 17814: {'lr': 0.00019997319282030756, 'samples': 570048, 'steps': 1113, 'loss/train': 2.3565902709960938} -09/20/2021 18:20:43 - INFO - __main__ - Step 17815: {'lr': 0.00019997319282030756, 'samples': 570080, 'steps': 1113, 'loss/train': 2.3385579586029053} -09/20/2021 18:20:44 - INFO - __main__ - Step 17816: {'lr': 0.00019997319282030756, 'samples': 570112, 'steps': 1113, 'loss/train': 3.7465462684631348} -09/20/2021 18:20:44 - INFO - __main__ - Step 17817: {'lr': 0.00019997319282030756, 'samples': 570144, 'steps': 1113, 'loss/train': 4.0547895431518555} -09/20/2021 18:20:45 - INFO - __main__ - Step 17818: {'lr': 0.00019997319282030756, 'samples': 570176, 'steps': 1113, 'loss/train': 4.263222694396973} -09/20/2021 18:20:46 - INFO - __main__ - Step 17819: {'lr': 0.00019997319282030756, 'samples': 570208, 'steps': 1113, 'loss/train': 3.94441556930542} -09/20/2021 18:20:47 - INFO - __main__ - Step 17820: {'lr': 0.00019997319282030756, 'samples': 570240, 'steps': 1113, 'loss/train': 4.531480312347412} -09/20/2021 18:20:48 - INFO - __main__ - Step 17821: {'lr': 0.00019997319282030756, 'samples': 570272, 'steps': 1113, 'loss/train': 3.7235448360443115} -09/20/2021 18:20:49 - INFO - __main__ - Step 17822: {'lr': 0.00019997319282030756, 'samples': 570304, 'steps': 1113, 'loss/train': 3.886488676071167} -09/20/2021 18:20:49 - INFO - __main__ - Step 17823: {'lr': 0.00019997319282030756, 'samples': 570336, 'steps': 1113, 'loss/train': 4.406656742095947} -09/20/2021 18:20:50 - INFO - __main__ - Step 17824: {'lr': 0.00019997319282030756, 'samples': 570368, 'steps': 1113, 'loss/train': 3.706315040588379} -09/20/2021 18:20:51 - INFO - __main__ - Step 17825: {'lr': 0.00019997304492555198, 'samples': 570400, 'steps': 1114, 'loss/train': 3.315105676651001} -09/20/2021 18:20:52 - INFO - __main__ - Step 17826: {'lr': 0.00019997304492555198, 'samples': 570432, 'steps': 1114, 'loss/train': 3.8431384563446045} -09/20/2021 18:20:52 - INFO - __main__ - Step 17827: {'lr': 0.00019997304492555198, 'samples': 570464, 'steps': 1114, 'loss/train': 3.0070669651031494} -09/20/2021 18:20:53 - INFO - __main__ - Step 17828: {'lr': 0.00019997304492555198, 'samples': 570496, 'steps': 1114, 'loss/train': 3.5803592205047607} -09/20/2021 18:20:54 - INFO - __main__ - Step 17829: {'lr': 0.00019997304492555198, 'samples': 570528, 'steps': 1114, 'loss/train': 4.140687942504883} -09/20/2021 18:20:55 - INFO - __main__ - Step 17830: {'lr': 0.00019997304492555198, 'samples': 570560, 'steps': 1114, 'loss/train': 3.920421838760376} -09/20/2021 18:20:55 - INFO - __main__ - Step 17831: {'lr': 0.00019997304492555198, 'samples': 570592, 'steps': 1114, 'loss/train': 2.2787561416625977} -09/20/2021 18:20:56 - INFO - __main__ - Step 17832: {'lr': 0.00019997304492555198, 'samples': 570624, 'steps': 1114, 'loss/train': 2.016998767852783} -09/20/2021 18:20:57 - INFO - __main__ - Step 17833: {'lr': 0.00019997304492555198, 'samples': 570656, 'steps': 1114, 'loss/train': 3.567563056945801} -09/20/2021 18:20:58 - INFO - __main__ - Step 17834: {'lr': 0.00019997304492555198, 'samples': 570688, 'steps': 1114, 'loss/train': 5.747125625610352} -09/20/2021 18:20:58 - INFO - __main__ - Step 17835: {'lr': 0.00019997304492555198, 'samples': 570720, 'steps': 1114, 'loss/train': 3.7486531734466553} -09/20/2021 18:20:59 - INFO - __main__ - Step 17836: {'lr': 0.00019997304492555198, 'samples': 570752, 'steps': 1114, 'loss/train': 3.42132830619812} -09/20/2021 18:21:00 - INFO - __main__ - Step 17837: {'lr': 0.00019997304492555198, 'samples': 570784, 'steps': 1114, 'loss/train': 4.809272766113281} -09/20/2021 18:21:01 - INFO - __main__ - Step 17838: {'lr': 0.00019997304492555198, 'samples': 570816, 'steps': 1114, 'loss/train': 3.3819239139556885} -09/20/2021 18:21:01 - INFO - __main__ - Step 17839: {'lr': 0.00019997304492555198, 'samples': 570848, 'steps': 1114, 'loss/train': 3.693877696990967} -09/20/2021 18:21:02 - INFO - __main__ - Step 17840: {'lr': 0.00019997304492555198, 'samples': 570880, 'steps': 1114, 'loss/train': 3.464543342590332} -09/20/2021 18:21:03 - INFO - __main__ - Step 17841: {'lr': 0.00019997289662400643, 'samples': 570912, 'steps': 1115, 'loss/train': 3.996840000152588} -09/20/2021 18:21:04 - INFO - __main__ - Step 17842: {'lr': 0.00019997289662400643, 'samples': 570944, 'steps': 1115, 'loss/train': 4.226809024810791} -09/20/2021 18:21:05 - INFO - __main__ - Step 17843: {'lr': 0.00019997289662400643, 'samples': 570976, 'steps': 1115, 'loss/train': 3.830129623413086} -09/20/2021 18:21:05 - INFO - __main__ - Step 17844: {'lr': 0.00019997289662400643, 'samples': 571008, 'steps': 1115, 'loss/train': 1.1297942399978638} -09/20/2021 18:21:06 - INFO - __main__ - Step 17845: {'lr': 0.00019997289662400643, 'samples': 571040, 'steps': 1115, 'loss/train': 1.631278157234192} -09/20/2021 18:21:07 - INFO - __main__ - Step 17846: {'lr': 0.00019997289662400643, 'samples': 571072, 'steps': 1115, 'loss/train': 3.386540651321411} -09/20/2021 18:21:08 - INFO - __main__ - Step 17847: {'lr': 0.00019997289662400643, 'samples': 571104, 'steps': 1115, 'loss/train': 4.359369277954102} -09/20/2021 18:21:08 - INFO - __main__ - Step 17848: {'lr': 0.00019997289662400643, 'samples': 571136, 'steps': 1115, 'loss/train': 3.9979419708251953} -09/20/2021 18:21:09 - INFO - __main__ - Step 17849: {'lr': 0.00019997289662400643, 'samples': 571168, 'steps': 1115, 'loss/train': 2.30068302154541} -09/20/2021 18:21:10 - INFO - __main__ - Step 17850: {'lr': 0.00019997289662400643, 'samples': 571200, 'steps': 1115, 'loss/train': 3.7019126415252686} -09/20/2021 18:21:11 - INFO - __main__ - Step 17851: {'lr': 0.00019997289662400643, 'samples': 571232, 'steps': 1115, 'loss/train': 3.0154309272766113} -09/20/2021 18:21:12 - INFO - __main__ - Step 17852: {'lr': 0.00019997289662400643, 'samples': 571264, 'steps': 1115, 'loss/train': 0.8962176442146301} -09/20/2021 18:21:13 - INFO - __main__ - Step 17853: {'lr': 0.00019997289662400643, 'samples': 571296, 'steps': 1115, 'loss/train': 4.362915992736816} -09/20/2021 18:21:13 - INFO - __main__ - Step 17854: {'lr': 0.00019997289662400643, 'samples': 571328, 'steps': 1115, 'loss/train': 3.6980679035186768} -09/20/2021 18:21:14 - INFO - __main__ - Step 17855: {'lr': 0.00019997289662400643, 'samples': 571360, 'steps': 1115, 'loss/train': 3.4582481384277344} -09/20/2021 18:21:15 - INFO - __main__ - Step 17856: {'lr': 0.00019997289662400643, 'samples': 571392, 'steps': 1115, 'loss/train': 0.4578513205051422} -09/20/2021 18:21:16 - INFO - __main__ - Step 17857: {'lr': 0.00019997274791567156, 'samples': 571424, 'steps': 1116, 'loss/train': 3.0717692375183105} -09/20/2021 18:21:16 - INFO - __main__ - Step 17858: {'lr': 0.00019997274791567156, 'samples': 571456, 'steps': 1116, 'loss/train': 2.8814282417297363} -09/20/2021 18:21:17 - INFO - __main__ - Step 17859: {'lr': 0.00019997274791567156, 'samples': 571488, 'steps': 1116, 'loss/train': 3.8231818675994873} -09/20/2021 18:21:18 - INFO - __main__ - Step 17860: {'lr': 0.00019997274791567156, 'samples': 571520, 'steps': 1116, 'loss/train': 3.621339797973633} -09/20/2021 18:21:19 - INFO - __main__ - Step 17861: {'lr': 0.00019997274791567156, 'samples': 571552, 'steps': 1116, 'loss/train': 3.9080898761749268} -09/20/2021 18:21:19 - INFO - __main__ - Step 17862: {'lr': 0.00019997274791567156, 'samples': 571584, 'steps': 1116, 'loss/train': 2.8232829570770264} -09/20/2021 18:21:20 - INFO - __main__ - Step 17863: {'lr': 0.00019997274791567156, 'samples': 571616, 'steps': 1116, 'loss/train': 2.535048246383667} -09/20/2021 18:21:21 - INFO - __main__ - Step 17864: {'lr': 0.00019997274791567156, 'samples': 571648, 'steps': 1116, 'loss/train': 4.543722629547119} -09/20/2021 18:21:22 - INFO - __main__ - Step 17865: {'lr': 0.00019997274791567156, 'samples': 571680, 'steps': 1116, 'loss/train': 3.9346373081207275} -09/20/2021 18:21:22 - INFO - __main__ - Step 17866: {'lr': 0.00019997274791567156, 'samples': 571712, 'steps': 1116, 'loss/train': 3.505530834197998} -09/20/2021 18:21:23 - INFO - __main__ - Step 17867: {'lr': 0.00019997274791567156, 'samples': 571744, 'steps': 1116, 'loss/train': 5.114176273345947} -09/20/2021 18:21:24 - INFO - __main__ - Step 17868: {'lr': 0.00019997274791567156, 'samples': 571776, 'steps': 1116, 'loss/train': 3.486957550048828} -09/20/2021 18:21:25 - INFO - __main__ - Step 17869: {'lr': 0.00019997274791567156, 'samples': 571808, 'steps': 1116, 'loss/train': 4.1252007484436035} -09/20/2021 18:21:25 - INFO - __main__ - Step 17870: {'lr': 0.00019997274791567156, 'samples': 571840, 'steps': 1116, 'loss/train': 3.457226037979126} -09/20/2021 18:21:26 - INFO - __main__ - Step 17871: {'lr': 0.00019997274791567156, 'samples': 571872, 'steps': 1116, 'loss/train': 3.305485725402832} -09/20/2021 18:21:27 - INFO - __main__ - Step 17872: {'lr': 0.00019997274791567156, 'samples': 571904, 'steps': 1116, 'loss/train': 3.701021909713745} -09/20/2021 18:21:28 - INFO - __main__ - Step 17873: {'lr': 0.00019997259880054797, 'samples': 571936, 'steps': 1117, 'loss/train': 3.6452176570892334} -09/20/2021 18:21:29 - INFO - __main__ - Step 17874: {'lr': 0.00019997259880054797, 'samples': 571968, 'steps': 1117, 'loss/train': 3.380316734313965} -09/20/2021 18:21:29 - INFO - __main__ - Step 17875: {'lr': 0.00019997259880054797, 'samples': 572000, 'steps': 1117, 'loss/train': 3.723048210144043} -09/20/2021 18:21:30 - INFO - __main__ - Step 17876: {'lr': 0.00019997259880054797, 'samples': 572032, 'steps': 1117, 'loss/train': 3.295436143875122} -09/20/2021 18:21:31 - INFO - __main__ - Step 17877: {'lr': 0.00019997259880054797, 'samples': 572064, 'steps': 1117, 'loss/train': 3.1946983337402344} -09/20/2021 18:21:32 - INFO - __main__ - Step 17878: {'lr': 0.00019997259880054797, 'samples': 572096, 'steps': 1117, 'loss/train': 2.9206769466400146} -09/20/2021 18:21:32 - INFO - __main__ - Step 17879: {'lr': 0.00019997259880054797, 'samples': 572128, 'steps': 1117, 'loss/train': 2.878980875015259} -09/20/2021 18:21:33 - INFO - __main__ - Step 17880: {'lr': 0.00019997259880054797, 'samples': 572160, 'steps': 1117, 'loss/train': 3.3860082626342773} -09/20/2021 18:21:34 - INFO - __main__ - Step 17881: {'lr': 0.00019997259880054797, 'samples': 572192, 'steps': 1117, 'loss/train': 3.0759799480438232} -09/20/2021 18:21:35 - INFO - __main__ - Step 17882: {'lr': 0.00019997259880054797, 'samples': 572224, 'steps': 1117, 'loss/train': 3.558184862136841} -09/20/2021 18:21:36 - INFO - __main__ - Step 17883: {'lr': 0.00019997259880054797, 'samples': 572256, 'steps': 1117, 'loss/train': 3.602665901184082} -09/20/2021 18:21:37 - INFO - __main__ - Step 17884: {'lr': 0.00019997259880054797, 'samples': 572288, 'steps': 1117, 'loss/train': 3.0288009643554688} -09/20/2021 18:21:37 - INFO - __main__ - Step 17885: {'lr': 0.00019997259880054797, 'samples': 572320, 'steps': 1117, 'loss/train': 3.103376865386963} -09/20/2021 18:21:38 - INFO - __main__ - Step 17886: {'lr': 0.00019997259880054797, 'samples': 572352, 'steps': 1117, 'loss/train': 3.545381546020508} -09/20/2021 18:21:39 - INFO - __main__ - Step 17887: {'lr': 0.00019997259880054797, 'samples': 572384, 'steps': 1117, 'loss/train': 2.6730659008026123} -09/20/2021 18:21:40 - INFO - __main__ - Step 17888: {'lr': 0.00019997259880054797, 'samples': 572416, 'steps': 1117, 'loss/train': 3.183039903640747} -09/20/2021 18:21:41 - INFO - __main__ - Step 17889: {'lr': 0.00019997244927863624, 'samples': 572448, 'steps': 1118, 'loss/train': 3.777111291885376} -09/20/2021 18:21:41 - INFO - __main__ - Step 17890: {'lr': 0.00019997244927863624, 'samples': 572480, 'steps': 1118, 'loss/train': 4.088316917419434} -09/20/2021 18:21:42 - INFO - __main__ - Step 17891: {'lr': 0.00019997244927863624, 'samples': 572512, 'steps': 1118, 'loss/train': 3.5617949962615967} -09/20/2021 18:21:43 - INFO - __main__ - Step 17892: {'lr': 0.00019997244927863624, 'samples': 572544, 'steps': 1118, 'loss/train': 3.3455464839935303} -09/20/2021 18:21:44 - INFO - __main__ - Step 17893: {'lr': 0.00019997244927863624, 'samples': 572576, 'steps': 1118, 'loss/train': 3.9816668033599854} -09/20/2021 18:21:44 - INFO - __main__ - Step 17894: {'lr': 0.00019997244927863624, 'samples': 572608, 'steps': 1118, 'loss/train': 4.047341346740723} -09/20/2021 18:21:45 - INFO - __main__ - Step 17895: {'lr': 0.00019997244927863624, 'samples': 572640, 'steps': 1118, 'loss/train': 3.6858248710632324} -09/20/2021 18:21:46 - INFO - __main__ - Step 17896: {'lr': 0.00019997244927863624, 'samples': 572672, 'steps': 1118, 'loss/train': 3.36238431930542} -09/20/2021 18:21:47 - INFO - __main__ - Step 17897: {'lr': 0.00019997244927863624, 'samples': 572704, 'steps': 1118, 'loss/train': 3.631150722503662} -09/20/2021 18:21:47 - INFO - __main__ - Step 17898: {'lr': 0.00019997244927863624, 'samples': 572736, 'steps': 1118, 'loss/train': 2.787127733230591} -09/20/2021 18:21:48 - INFO - __main__ - Step 17899: {'lr': 0.00019997244927863624, 'samples': 572768, 'steps': 1118, 'loss/train': 2.7464065551757812} -09/20/2021 18:21:49 - INFO - __main__ - Step 17900: {'lr': 0.00019997244927863624, 'samples': 572800, 'steps': 1118, 'loss/train': 3.5355935096740723} -09/20/2021 18:21:50 - INFO - __main__ - Step 17901: {'lr': 0.00019997244927863624, 'samples': 572832, 'steps': 1118, 'loss/train': 3.9047563076019287} -09/20/2021 18:21:50 - INFO - __main__ - Step 17902: {'lr': 0.00019997244927863624, 'samples': 572864, 'steps': 1118, 'loss/train': 4.036379337310791} -09/20/2021 18:21:51 - INFO - __main__ - Step 17903: {'lr': 0.00019997244927863624, 'samples': 572896, 'steps': 1118, 'loss/train': 3.8536410331726074} -09/20/2021 18:21:52 - INFO - __main__ - Step 17904: {'lr': 0.00019997244927863624, 'samples': 572928, 'steps': 1118, 'loss/train': 3.9820990562438965} -09/20/2021 18:21:53 - INFO - __main__ - Step 17905: {'lr': 0.00019997229934993707, 'samples': 572960, 'steps': 1119, 'loss/train': 3.1519131660461426} -09/20/2021 18:21:53 - INFO - __main__ - Step 17906: {'lr': 0.00019997229934993707, 'samples': 572992, 'steps': 1119, 'loss/train': 3.7884304523468018} -09/20/2021 18:21:54 - INFO - __main__ - Step 17907: {'lr': 0.00019997229934993707, 'samples': 573024, 'steps': 1119, 'loss/train': 3.4779229164123535} -09/20/2021 18:21:55 - INFO - __main__ - Step 17908: {'lr': 0.00019997229934993707, 'samples': 573056, 'steps': 1119, 'loss/train': 3.692138671875} -09/20/2021 18:21:56 - INFO - __main__ - Step 17909: {'lr': 0.00019997229934993707, 'samples': 573088, 'steps': 1119, 'loss/train': 3.2881665229797363} -09/20/2021 18:21:57 - INFO - __main__ - Step 17910: {'lr': 0.00019997229934993707, 'samples': 573120, 'steps': 1119, 'loss/train': 2.8788065910339355} -09/20/2021 18:21:57 - INFO - __main__ - Step 17911: {'lr': 0.00019997229934993707, 'samples': 573152, 'steps': 1119, 'loss/train': 0.8950377702713013} -09/20/2021 18:21:59 - INFO - __main__ - Step 17912: {'lr': 0.00019997229934993707, 'samples': 573184, 'steps': 1119, 'loss/train': 0.9531705975532532} -09/20/2021 18:21:59 - INFO - __main__ - Step 17913: {'lr': 0.00019997229934993707, 'samples': 573216, 'steps': 1119, 'loss/train': 2.2856991291046143} -09/20/2021 18:22:00 - INFO - __main__ - Step 17914: {'lr': 0.00019997229934993707, 'samples': 573248, 'steps': 1119, 'loss/train': 4.110971450805664} -09/20/2021 18:22:01 - INFO - __main__ - Step 17915: {'lr': 0.00019997229934993707, 'samples': 573280, 'steps': 1119, 'loss/train': 3.618900775909424} -09/20/2021 18:22:02 - INFO - __main__ - Step 17916: {'lr': 0.00019997229934993707, 'samples': 573312, 'steps': 1119, 'loss/train': 3.0446279048919678} -09/20/2021 18:22:02 - INFO - __main__ - Step 17917: {'lr': 0.00019997229934993707, 'samples': 573344, 'steps': 1119, 'loss/train': 3.4894027709960938} -09/20/2021 18:22:03 - INFO - __main__ - Step 17918: {'lr': 0.00019997229934993707, 'samples': 573376, 'steps': 1119, 'loss/train': 2.8785645961761475} -09/20/2021 18:22:04 - INFO - __main__ - Step 17919: {'lr': 0.00019997229934993707, 'samples': 573408, 'steps': 1119, 'loss/train': 4.214817047119141} -09/20/2021 18:22:05 - INFO - __main__ - Step 17920: {'lr': 0.00019997229934993707, 'samples': 573440, 'steps': 1119, 'loss/train': 4.116289138793945} -09/20/2021 18:22:06 - INFO - __main__ - Step 17921: {'lr': 0.00019997214901445093, 'samples': 573472, 'steps': 1120, 'loss/train': 4.922204971313477} -09/20/2021 18:22:06 - INFO - __main__ - Step 17922: {'lr': 0.00019997214901445093, 'samples': 573504, 'steps': 1120, 'loss/train': 2.8595499992370605} -09/20/2021 18:22:07 - INFO - __main__ - Step 17923: {'lr': 0.00019997214901445093, 'samples': 573536, 'steps': 1120, 'loss/train': 3.4082119464874268} -09/20/2021 18:22:08 - INFO - __main__ - Step 17924: {'lr': 0.00019997214901445093, 'samples': 573568, 'steps': 1120, 'loss/train': 3.9014828205108643} -09/20/2021 18:22:08 - INFO - __main__ - Step 17925: {'lr': 0.00019997214901445093, 'samples': 573600, 'steps': 1120, 'loss/train': 5.764349460601807} -09/20/2021 18:22:09 - INFO - __main__ - Step 17926: {'lr': 0.00019997214901445093, 'samples': 573632, 'steps': 1120, 'loss/train': 5.9617156982421875} -09/20/2021 18:22:10 - INFO - __main__ - Step 17927: {'lr': 0.00019997214901445093, 'samples': 573664, 'steps': 1120, 'loss/train': 6.250477313995361} -09/20/2021 18:22:11 - INFO - __main__ - Step 17928: {'lr': 0.00019997214901445093, 'samples': 573696, 'steps': 1120, 'loss/train': 3.117630958557129} -09/20/2021 18:22:11 - INFO - __main__ - Step 17929: {'lr': 0.00019997214901445093, 'samples': 573728, 'steps': 1120, 'loss/train': 0.9599183201789856} -09/20/2021 18:22:12 - INFO - __main__ - Step 17930: {'lr': 0.00019997214901445093, 'samples': 573760, 'steps': 1120, 'loss/train': 4.738114833831787} -09/20/2021 18:22:13 - INFO - __main__ - Step 17931: {'lr': 0.00019997214901445093, 'samples': 573792, 'steps': 1120, 'loss/train': 3.3567452430725098} -09/20/2021 18:22:14 - INFO - __main__ - Step 17932: {'lr': 0.00019997214901445093, 'samples': 573824, 'steps': 1120, 'loss/train': 3.179300546646118} -09/20/2021 18:22:15 - INFO - __main__ - Step 17933: {'lr': 0.00019997214901445093, 'samples': 573856, 'steps': 1120, 'loss/train': 3.841063976287842} -09/20/2021 18:22:15 - INFO - __main__ - Step 17934: {'lr': 0.00019997214901445093, 'samples': 573888, 'steps': 1120, 'loss/train': 2.482279062271118} -09/20/2021 18:22:16 - INFO - __main__ - Step 17935: {'lr': 0.00019997214901445093, 'samples': 573920, 'steps': 1120, 'loss/train': 3.6593992710113525} -09/20/2021 18:22:17 - INFO - __main__ - Step 17936: {'lr': 0.00019997214901445093, 'samples': 573952, 'steps': 1120, 'loss/train': 3.114201307296753} -09/20/2021 18:22:18 - INFO - __main__ - Step 17937: {'lr': 0.00019997199827217853, 'samples': 573984, 'steps': 1121, 'loss/train': 3.8552350997924805} -09/20/2021 18:22:18 - INFO - __main__ - Step 17938: {'lr': 0.00019997199827217853, 'samples': 574016, 'steps': 1121, 'loss/train': 3.2929582595825195} -09/20/2021 18:22:19 - INFO - __main__ - Step 17939: {'lr': 0.00019997199827217853, 'samples': 574048, 'steps': 1121, 'loss/train': 4.25098991394043} -09/20/2021 18:22:20 - INFO - __main__ - Step 17940: {'lr': 0.00019997199827217853, 'samples': 574080, 'steps': 1121, 'loss/train': 3.4169440269470215} -09/20/2021 18:22:21 - INFO - __main__ - Step 17941: {'lr': 0.00019997199827217853, 'samples': 574112, 'steps': 1121, 'loss/train': 3.0969862937927246} -09/20/2021 18:22:21 - INFO - __main__ - Step 17942: {'lr': 0.00019997199827217853, 'samples': 574144, 'steps': 1121, 'loss/train': 4.052520751953125} -09/20/2021 18:22:22 - INFO - __main__ - Step 17943: {'lr': 0.00019997199827217853, 'samples': 574176, 'steps': 1121, 'loss/train': 3.4468955993652344} -09/20/2021 18:22:24 - INFO - __main__ - Step 17944: {'lr': 0.00019997199827217853, 'samples': 574208, 'steps': 1121, 'loss/train': 4.371500492095947} -09/20/2021 18:22:24 - INFO - __main__ - Step 17945: {'lr': 0.00019997199827217853, 'samples': 574240, 'steps': 1121, 'loss/train': 4.154690742492676} -09/20/2021 18:22:25 - INFO - __main__ - Step 17946: {'lr': 0.00019997199827217853, 'samples': 574272, 'steps': 1121, 'loss/train': 3.9583871364593506} -09/20/2021 18:22:26 - INFO - __main__ - Step 17947: {'lr': 0.00019997199827217853, 'samples': 574304, 'steps': 1121, 'loss/train': 4.20875883102417} -09/20/2021 18:22:27 - INFO - __main__ - Step 17948: {'lr': 0.00019997199827217853, 'samples': 574336, 'steps': 1121, 'loss/train': 3.0269250869750977} -09/20/2021 18:22:27 - INFO - __main__ - Step 17949: {'lr': 0.00019997199827217853, 'samples': 574368, 'steps': 1121, 'loss/train': 2.786686658859253} -09/20/2021 18:22:28 - INFO - __main__ - Step 17950: {'lr': 0.00019997199827217853, 'samples': 574400, 'steps': 1121, 'loss/train': 3.7958874702453613} -09/20/2021 18:22:29 - INFO - __main__ - Step 17951: {'lr': 0.00019997199827217853, 'samples': 574432, 'steps': 1121, 'loss/train': 3.9201488494873047} -09/20/2021 18:22:30 - INFO - __main__ - Step 17952: {'lr': 0.00019997199827217853, 'samples': 574464, 'steps': 1121, 'loss/train': 4.4682793617248535} -09/20/2021 18:22:31 - INFO - __main__ - Step 17953: {'lr': 0.00019997184712312044, 'samples': 574496, 'steps': 1122, 'loss/train': 2.9896044731140137} -09/20/2021 18:22:31 - INFO - __main__ - Step 17954: {'lr': 0.00019997184712312044, 'samples': 574528, 'steps': 1122, 'loss/train': 3.46168851852417} -09/20/2021 18:22:32 - INFO - __main__ - Step 17955: {'lr': 0.00019997184712312044, 'samples': 574560, 'steps': 1122, 'loss/train': 0.8006415963172913} -09/20/2021 18:22:33 - INFO - __main__ - Step 17956: {'lr': 0.00019997184712312044, 'samples': 574592, 'steps': 1122, 'loss/train': 0.6645923256874084} -09/20/2021 18:22:34 - INFO - __main__ - Step 17957: {'lr': 0.00019997184712312044, 'samples': 574624, 'steps': 1122, 'loss/train': 1.1439181566238403} -09/20/2021 18:22:34 - INFO - __main__ - Step 17958: {'lr': 0.00019997184712312044, 'samples': 574656, 'steps': 1122, 'loss/train': 0.9118069410324097} -09/20/2021 18:22:35 - INFO - __main__ - Step 17959: {'lr': 0.00019997184712312044, 'samples': 574688, 'steps': 1122, 'loss/train': 1.0099085569381714} -09/20/2021 18:22:36 - INFO - __main__ - Step 17960: {'lr': 0.00019997184712312044, 'samples': 574720, 'steps': 1122, 'loss/train': 3.146599769592285} -09/20/2021 18:22:37 - INFO - __main__ - Step 17961: {'lr': 0.00019997184712312044, 'samples': 574752, 'steps': 1122, 'loss/train': 3.839505434036255} -09/20/2021 18:22:37 - INFO - __main__ - Step 17962: {'lr': 0.00019997184712312044, 'samples': 574784, 'steps': 1122, 'loss/train': 2.5981996059417725} -09/20/2021 18:22:38 - INFO - __main__ - Step 17963: {'lr': 0.00019997184712312044, 'samples': 574816, 'steps': 1122, 'loss/train': 4.712751388549805} -09/20/2021 18:22:39 - INFO - __main__ - Step 17964: {'lr': 0.00019997184712312044, 'samples': 574848, 'steps': 1122, 'loss/train': 4.728726387023926} -09/20/2021 18:22:40 - INFO - __main__ - Step 17965: {'lr': 0.00019997184712312044, 'samples': 574880, 'steps': 1122, 'loss/train': 3.974647283554077} -09/20/2021 18:22:40 - INFO - __main__ - Step 17966: {'lr': 0.00019997184712312044, 'samples': 574912, 'steps': 1122, 'loss/train': 3.449275255203247} -09/20/2021 18:22:41 - INFO - __main__ - Step 17967: {'lr': 0.00019997184712312044, 'samples': 574944, 'steps': 1122, 'loss/train': 3.3651468753814697} -09/20/2021 18:22:42 - INFO - __main__ - Step 17968: {'lr': 0.00019997184712312044, 'samples': 574976, 'steps': 1122, 'loss/train': 2.9984920024871826} -09/20/2021 18:22:43 - INFO - __main__ - Step 17969: {'lr': 0.00019997169556727732, 'samples': 575008, 'steps': 1123, 'loss/train': 4.106540203094482} -09/20/2021 18:22:43 - INFO - __main__ - Step 17970: {'lr': 0.00019997169556727732, 'samples': 575040, 'steps': 1123, 'loss/train': 3.5202877521514893} -09/20/2021 18:22:44 - INFO - __main__ - Step 17971: {'lr': 0.00019997169556727732, 'samples': 575072, 'steps': 1123, 'loss/train': 3.2405030727386475} -09/20/2021 18:22:45 - INFO - __main__ - Step 17972: {'lr': 0.00019997169556727732, 'samples': 575104, 'steps': 1123, 'loss/train': 3.0178847312927246} -09/20/2021 18:22:46 - INFO - __main__ - Step 17973: {'lr': 0.00019997169556727732, 'samples': 575136, 'steps': 1123, 'loss/train': 6.121467590332031} -09/20/2021 18:22:46 - INFO - __main__ - Step 17974: {'lr': 0.00019997169556727732, 'samples': 575168, 'steps': 1123, 'loss/train': 5.9843645095825195} -09/20/2021 18:22:48 - INFO - __main__ - Step 17975: {'lr': 0.00019997169556727732, 'samples': 575200, 'steps': 1123, 'loss/train': 3.6464972496032715} -09/20/2021 18:22:48 - INFO - __main__ - Step 17976: {'lr': 0.00019997169556727732, 'samples': 575232, 'steps': 1123, 'loss/train': 3.8398311138153076} -09/20/2021 18:22:49 - INFO - __main__ - Step 17977: {'lr': 0.00019997169556727732, 'samples': 575264, 'steps': 1123, 'loss/train': 6.367511749267578} -09/20/2021 18:22:50 - INFO - __main__ - Step 17978: {'lr': 0.00019997169556727732, 'samples': 575296, 'steps': 1123, 'loss/train': 3.237147808074951} -09/20/2021 18:22:51 - INFO - __main__ - Step 17979: {'lr': 0.00019997169556727732, 'samples': 575328, 'steps': 1123, 'loss/train': 2.941789150238037} -09/20/2021 18:22:51 - INFO - __main__ - Step 17980: {'lr': 0.00019997169556727732, 'samples': 575360, 'steps': 1123, 'loss/train': 3.770294666290283} -09/20/2021 18:22:52 - INFO - __main__ - Step 17981: {'lr': 0.00019997169556727732, 'samples': 575392, 'steps': 1123, 'loss/train': 3.0886058807373047} -09/20/2021 18:22:53 - INFO - __main__ - Step 17982: {'lr': 0.00019997169556727732, 'samples': 575424, 'steps': 1123, 'loss/train': 3.790165662765503} -09/20/2021 18:22:54 - INFO - __main__ - Step 17983: {'lr': 0.00019997169556727732, 'samples': 575456, 'steps': 1123, 'loss/train': 3.4574227333068848} -09/20/2021 18:22:54 - INFO - __main__ - Step 17984: {'lr': 0.00019997169556727732, 'samples': 575488, 'steps': 1123, 'loss/train': 3.534557819366455} -09/20/2021 18:22:55 - INFO - __main__ - Step 17985: {'lr': 0.00019997154360464975, 'samples': 575520, 'steps': 1124, 'loss/train': 4.003354549407959} -09/20/2021 18:22:56 - INFO - __main__ - Step 17986: {'lr': 0.00019997154360464975, 'samples': 575552, 'steps': 1124, 'loss/train': 3.6089701652526855} -09/20/2021 18:22:57 - INFO - __main__ - Step 17987: {'lr': 0.00019997154360464975, 'samples': 575584, 'steps': 1124, 'loss/train': 3.356564998626709} -09/20/2021 18:22:58 - INFO - __main__ - Step 17988: {'lr': 0.00019997154360464975, 'samples': 575616, 'steps': 1124, 'loss/train': 3.1518654823303223} -09/20/2021 18:22:58 - INFO - __main__ - Step 17989: {'lr': 0.00019997154360464975, 'samples': 575648, 'steps': 1124, 'loss/train': 3.9229178428649902} -09/20/2021 18:22:59 - INFO - __main__ - Step 17990: {'lr': 0.00019997154360464975, 'samples': 575680, 'steps': 1124, 'loss/train': 3.89969801902771} -09/20/2021 18:23:00 - INFO - __main__ - Step 17991: {'lr': 0.00019997154360464975, 'samples': 575712, 'steps': 1124, 'loss/train': 2.734109401702881} -09/20/2021 18:23:01 - INFO - __main__ - Step 17992: {'lr': 0.00019997154360464975, 'samples': 575744, 'steps': 1124, 'loss/train': 3.3035407066345215} -09/20/2021 18:23:01 - INFO - __main__ - Step 17993: {'lr': 0.00019997154360464975, 'samples': 575776, 'steps': 1124, 'loss/train': 4.399262428283691} -09/20/2021 18:23:02 - INFO - __main__ - Step 17994: {'lr': 0.00019997154360464975, 'samples': 575808, 'steps': 1124, 'loss/train': 3.890737295150757} -09/20/2021 18:23:03 - INFO - __main__ - Step 17995: {'lr': 0.00019997154360464975, 'samples': 575840, 'steps': 1124, 'loss/train': 3.7596468925476074} -09/20/2021 18:23:04 - INFO - __main__ - Step 17996: {'lr': 0.00019997154360464975, 'samples': 575872, 'steps': 1124, 'loss/train': 4.187273025512695} -09/20/2021 18:23:04 - INFO - __main__ - Step 17997: {'lr': 0.00019997154360464975, 'samples': 575904, 'steps': 1124, 'loss/train': 3.433159351348877} -09/20/2021 18:23:05 - INFO - __main__ - Step 17998: {'lr': 0.00019997154360464975, 'samples': 575936, 'steps': 1124, 'loss/train': 3.3707242012023926} -09/20/2021 18:23:06 - INFO - __main__ - Step 17999: {'lr': 0.00019997154360464975, 'samples': 575968, 'steps': 1124, 'loss/train': 4.209785461425781} -09/20/2021 18:23:07 - INFO - __main__ - Step 18000: {'lr': 0.00019997154360464975, 'samples': 576000, 'steps': 1124, 'loss/train': 4.908490180969238} -09/20/2021 18:23:07 - INFO - __main__ - Step 18001: {'lr': 0.0001999713912352384, 'samples': 576032, 'steps': 1125, 'loss/train': 1.4072668552398682} -09/20/2021 18:23:08 - INFO - __main__ - Step 18002: {'lr': 0.0001999713912352384, 'samples': 576064, 'steps': 1125, 'loss/train': 3.2426652908325195} -09/20/2021 18:23:09 - INFO - __main__ - Step 18003: {'lr': 0.0001999713912352384, 'samples': 576096, 'steps': 1125, 'loss/train': 3.7069811820983887} -09/20/2021 18:23:10 - INFO - __main__ - Step 18004: {'lr': 0.0001999713912352384, 'samples': 576128, 'steps': 1125, 'loss/train': 2.9574880599975586} -09/20/2021 18:23:10 - INFO - __main__ - Step 18005: {'lr': 0.0001999713912352384, 'samples': 576160, 'steps': 1125, 'loss/train': 4.408470153808594} -09/20/2021 18:23:12 - INFO - __main__ - Step 18006: {'lr': 0.0001999713912352384, 'samples': 576192, 'steps': 1125, 'loss/train': 3.964606523513794} -09/20/2021 18:23:13 - INFO - __main__ - Step 18007: {'lr': 0.0001999713912352384, 'samples': 576224, 'steps': 1125, 'loss/train': 3.727908134460449} -09/20/2021 18:23:13 - INFO - __main__ - Step 18008: {'lr': 0.0001999713912352384, 'samples': 576256, 'steps': 1125, 'loss/train': 4.642321586608887} -09/20/2021 18:23:14 - INFO - __main__ - Step 18009: {'lr': 0.0001999713912352384, 'samples': 576288, 'steps': 1125, 'loss/train': 6.410741329193115} -09/20/2021 18:23:15 - INFO - __main__ - Step 18010: {'lr': 0.0001999713912352384, 'samples': 576320, 'steps': 1125, 'loss/train': 4.16213321685791} -09/20/2021 18:23:16 - INFO - __main__ - Step 18011: {'lr': 0.0001999713912352384, 'samples': 576352, 'steps': 1125, 'loss/train': 3.386199712753296} -09/20/2021 18:23:16 - INFO - __main__ - Step 18012: {'lr': 0.0001999713912352384, 'samples': 576384, 'steps': 1125, 'loss/train': 3.8892345428466797} -09/20/2021 18:23:17 - INFO - __main__ - Step 18013: {'lr': 0.0001999713912352384, 'samples': 576416, 'steps': 1125, 'loss/train': 2.948331594467163} -09/20/2021 18:23:18 - INFO - __main__ - Step 18014: {'lr': 0.0001999713912352384, 'samples': 576448, 'steps': 1125, 'loss/train': 3.813380002975464} -09/20/2021 18:23:19 - INFO - __main__ - Step 18015: {'lr': 0.0001999713912352384, 'samples': 576480, 'steps': 1125, 'loss/train': 3.2978296279907227} -09/20/2021 18:23:19 - INFO - __main__ - Step 18016: {'lr': 0.0001999713912352384, 'samples': 576512, 'steps': 1125, 'loss/train': 3.523676633834839} -09/20/2021 18:23:20 - INFO - __main__ - Step 18017: {'lr': 0.00019997123845904376, 'samples': 576544, 'steps': 1126, 'loss/train': 3.1108171939849854} -09/20/2021 18:23:21 - INFO - __main__ - Step 18018: {'lr': 0.00019997123845904376, 'samples': 576576, 'steps': 1126, 'loss/train': 4.279716491699219} -09/20/2021 18:23:22 - INFO - __main__ - Step 18019: {'lr': 0.00019997123845904376, 'samples': 576608, 'steps': 1126, 'loss/train': 3.99536395072937} -09/20/2021 18:23:22 - INFO - __main__ - Step 18020: {'lr': 0.00019997123845904376, 'samples': 576640, 'steps': 1126, 'loss/train': 3.144747495651245} -09/20/2021 18:23:23 - INFO - __main__ - Step 18021: {'lr': 0.00019997123845904376, 'samples': 576672, 'steps': 1126, 'loss/train': 3.2935400009155273} -09/20/2021 18:23:24 - INFO - __main__ - Step 18022: {'lr': 0.00019997123845904376, 'samples': 576704, 'steps': 1126, 'loss/train': 3.785230875015259} -09/20/2021 18:23:25 - INFO - __main__ - Step 18023: {'lr': 0.00019997123845904376, 'samples': 576736, 'steps': 1126, 'loss/train': 3.151695489883423} -09/20/2021 18:23:25 - INFO - __main__ - Step 18024: {'lr': 0.00019997123845904376, 'samples': 576768, 'steps': 1126, 'loss/train': 4.694543838500977} -09/20/2021 18:23:26 - INFO - __main__ - Step 18025: {'lr': 0.00019997123845904376, 'samples': 576800, 'steps': 1126, 'loss/train': 4.495944976806641} -09/20/2021 18:23:27 - INFO - __main__ - Step 18026: {'lr': 0.00019997123845904376, 'samples': 576832, 'steps': 1126, 'loss/train': 3.5882134437561035} -09/20/2021 18:23:28 - INFO - __main__ - Step 18027: {'lr': 0.00019997123845904376, 'samples': 576864, 'steps': 1126, 'loss/train': 5.592360019683838} -09/20/2021 18:23:28 - INFO - __main__ - Step 18028: {'lr': 0.00019997123845904376, 'samples': 576896, 'steps': 1126, 'loss/train': 3.271146297454834} -09/20/2021 18:23:29 - INFO - __main__ - Step 18029: {'lr': 0.00019997123845904376, 'samples': 576928, 'steps': 1126, 'loss/train': 2.9768552780151367} -09/20/2021 18:23:30 - INFO - __main__ - Step 18030: {'lr': 0.00019997123845904376, 'samples': 576960, 'steps': 1126, 'loss/train': 3.321089506149292} -09/20/2021 18:23:31 - INFO - __main__ - Step 18031: {'lr': 0.00019997123845904376, 'samples': 576992, 'steps': 1126, 'loss/train': 3.4938933849334717} -09/20/2021 18:23:31 - INFO - __main__ - Step 18032: {'lr': 0.00019997123845904376, 'samples': 577024, 'steps': 1126, 'loss/train': 4.221555233001709} -09/20/2021 18:23:32 - INFO - __main__ - Step 18033: {'lr': 0.0001999710852760666, 'samples': 577056, 'steps': 1127, 'loss/train': 4.015760898590088} -09/20/2021 18:23:33 - INFO - __main__ - Step 18034: {'lr': 0.0001999710852760666, 'samples': 577088, 'steps': 1127, 'loss/train': 4.197253704071045} -09/20/2021 18:23:34 - INFO - __main__ - Step 18035: {'lr': 0.0001999710852760666, 'samples': 577120, 'steps': 1127, 'loss/train': 4.123558044433594} -09/20/2021 18:23:35 - INFO - __main__ - Step 18036: {'lr': 0.0001999710852760666, 'samples': 577152, 'steps': 1127, 'loss/train': 3.3264193534851074} -09/20/2021 18:23:35 - INFO - __main__ - Step 18037: {'lr': 0.0001999710852760666, 'samples': 577184, 'steps': 1127, 'loss/train': 3.6587753295898438} -09/20/2021 18:23:37 - INFO - __main__ - Step 18038: {'lr': 0.0001999710852760666, 'samples': 577216, 'steps': 1127, 'loss/train': 3.3863425254821777} -09/20/2021 18:23:38 - INFO - __main__ - Step 18039: {'lr': 0.0001999710852760666, 'samples': 577248, 'steps': 1127, 'loss/train': 1.0768654346466064} -09/20/2021 18:23:38 - INFO - __main__ - Step 18040: {'lr': 0.0001999710852760666, 'samples': 577280, 'steps': 1127, 'loss/train': 3.2702488899230957} -09/20/2021 18:23:39 - INFO - __main__ - Step 18041: {'lr': 0.0001999710852760666, 'samples': 577312, 'steps': 1127, 'loss/train': 3.9351162910461426} -09/20/2021 18:23:40 - INFO - __main__ - Step 18042: {'lr': 0.0001999710852760666, 'samples': 577344, 'steps': 1127, 'loss/train': 4.603641033172607} -09/20/2021 18:23:41 - INFO - __main__ - Step 18043: {'lr': 0.0001999710852760666, 'samples': 577376, 'steps': 1127, 'loss/train': 3.6308257579803467} -09/20/2021 18:23:41 - INFO - __main__ - Step 18044: {'lr': 0.0001999710852760666, 'samples': 577408, 'steps': 1127, 'loss/train': 2.314939260482788} -09/20/2021 18:23:42 - INFO - __main__ - Step 18045: {'lr': 0.0001999710852760666, 'samples': 577440, 'steps': 1127, 'loss/train': 3.3758132457733154} -09/20/2021 18:23:43 - INFO - __main__ - Step 18046: {'lr': 0.0001999710852760666, 'samples': 577472, 'steps': 1127, 'loss/train': 4.427611827850342} -09/20/2021 18:23:44 - INFO - __main__ - Step 18047: {'lr': 0.0001999710852760666, 'samples': 577504, 'steps': 1127, 'loss/train': 4.388099193572998} -09/20/2021 18:23:44 - INFO - __main__ - Step 18048: {'lr': 0.0001999710852760666, 'samples': 577536, 'steps': 1127, 'loss/train': 3.343231439590454} -09/20/2021 18:23:45 - INFO - __main__ - Step 18049: {'lr': 0.00019997093168630745, 'samples': 577568, 'steps': 1128, 'loss/train': 3.5095632076263428} -09/20/2021 18:23:46 - INFO - __main__ - Step 18050: {'lr': 0.00019997093168630745, 'samples': 577600, 'steps': 1128, 'loss/train': 2.9042677879333496} -09/20/2021 18:23:47 - INFO - __main__ - Step 18051: {'lr': 0.00019997093168630745, 'samples': 577632, 'steps': 1128, 'loss/train': 4.455772399902344} -09/20/2021 18:23:47 - INFO - __main__ - Step 18052: {'lr': 0.00019997093168630745, 'samples': 577664, 'steps': 1128, 'loss/train': 4.567256927490234} -09/20/2021 18:23:48 - INFO - __main__ - Step 18053: {'lr': 0.00019997093168630745, 'samples': 577696, 'steps': 1128, 'loss/train': 3.1079490184783936} -09/20/2021 18:23:49 - INFO - __main__ - Step 18054: {'lr': 0.00019997093168630745, 'samples': 577728, 'steps': 1128, 'loss/train': 2.7648189067840576} -09/20/2021 18:23:50 - INFO - __main__ - Step 18055: {'lr': 0.00019997093168630745, 'samples': 577760, 'steps': 1128, 'loss/train': 3.2129688262939453} -09/20/2021 18:23:50 - INFO - __main__ - Step 18056: {'lr': 0.00019997093168630745, 'samples': 577792, 'steps': 1128, 'loss/train': 2.3263940811157227} -09/20/2021 18:23:51 - INFO - __main__ - Step 18057: {'lr': 0.00019997093168630745, 'samples': 577824, 'steps': 1128, 'loss/train': 4.237430572509766} -09/20/2021 18:23:52 - INFO - __main__ - Step 18058: {'lr': 0.00019997093168630745, 'samples': 577856, 'steps': 1128, 'loss/train': 3.5791571140289307} -09/20/2021 18:23:53 - INFO - __main__ - Step 18059: {'lr': 0.00019997093168630745, 'samples': 577888, 'steps': 1128, 'loss/train': 3.5177483558654785} -09/20/2021 18:23:53 - INFO - __main__ - Step 18060: {'lr': 0.00019997093168630745, 'samples': 577920, 'steps': 1128, 'loss/train': 2.8950583934783936} -09/20/2021 18:23:54 - INFO - __main__ - Step 18061: {'lr': 0.00019997093168630745, 'samples': 577952, 'steps': 1128, 'loss/train': 3.915825843811035} -09/20/2021 18:23:55 - INFO - __main__ - Step 18062: {'lr': 0.00019997093168630745, 'samples': 577984, 'steps': 1128, 'loss/train': 3.1348273754119873} -09/20/2021 18:23:56 - INFO - __main__ - Step 18063: {'lr': 0.00019997093168630745, 'samples': 578016, 'steps': 1128, 'loss/train': 0.5843266844749451} -09/20/2021 18:23:56 - INFO - __main__ - Step 18064: {'lr': 0.00019997093168630745, 'samples': 578048, 'steps': 1128, 'loss/train': 0.6026598215103149} -09/20/2021 18:23:57 - INFO - __main__ - Step 18065: {'lr': 0.00019997077768976697, 'samples': 578080, 'steps': 1129, 'loss/train': 1.3634485006332397} -09/20/2021 18:23:58 - INFO - __main__ - Step 18066: {'lr': 0.00019997077768976697, 'samples': 578112, 'steps': 1129, 'loss/train': 1.4983340501785278} -09/20/2021 18:23:59 - INFO - __main__ - Step 18067: {'lr': 0.00019997077768976697, 'samples': 578144, 'steps': 1129, 'loss/train': 4.154818534851074} -09/20/2021 18:24:00 - INFO - __main__ - Step 18068: {'lr': 0.00019997077768976697, 'samples': 578176, 'steps': 1129, 'loss/train': 3.95662784576416} -09/20/2021 18:24:00 - INFO - __main__ - Step 18069: {'lr': 0.00019997077768976697, 'samples': 578208, 'steps': 1129, 'loss/train': 3.149620532989502} -09/20/2021 18:24:02 - INFO - __main__ - Step 18070: {'lr': 0.00019997077768976697, 'samples': 578240, 'steps': 1129, 'loss/train': 2.848015546798706} -09/20/2021 18:24:03 - INFO - __main__ - Step 18071: {'lr': 0.00019997077768976697, 'samples': 578272, 'steps': 1129, 'loss/train': 3.556879758834839} -09/20/2021 18:24:04 - INFO - __main__ - Step 18072: {'lr': 0.00019997077768976697, 'samples': 578304, 'steps': 1129, 'loss/train': 3.5466082096099854} -09/20/2021 18:24:04 - INFO - __main__ - Step 18073: {'lr': 0.00019997077768976697, 'samples': 578336, 'steps': 1129, 'loss/train': 3.440603017807007} -09/20/2021 18:24:05 - INFO - __main__ - Step 18074: {'lr': 0.00019997077768976697, 'samples': 578368, 'steps': 1129, 'loss/train': 3.1957173347473145} -09/20/2021 18:24:06 - INFO - __main__ - Step 18075: {'lr': 0.00019997077768976697, 'samples': 578400, 'steps': 1129, 'loss/train': 3.867309808731079} -09/20/2021 18:24:07 - INFO - __main__ - Step 18076: {'lr': 0.00019997077768976697, 'samples': 578432, 'steps': 1129, 'loss/train': 3.1925415992736816} -09/20/2021 18:24:07 - INFO - __main__ - Step 18077: {'lr': 0.00019997077768976697, 'samples': 578464, 'steps': 1129, 'loss/train': 2.9448599815368652} -09/20/2021 18:24:08 - INFO - __main__ - Step 18078: {'lr': 0.00019997077768976697, 'samples': 578496, 'steps': 1129, 'loss/train': 3.9643542766571045} -09/20/2021 18:24:09 - INFO - __main__ - Step 18079: {'lr': 0.00019997077768976697, 'samples': 578528, 'steps': 1129, 'loss/train': 5.616942882537842} -09/20/2021 18:24:10 - INFO - __main__ - Step 18080: {'lr': 0.00019997077768976697, 'samples': 578560, 'steps': 1129, 'loss/train': 4.089360237121582} -09/20/2021 18:24:10 - INFO - __main__ - Step 18081: {'lr': 0.0001999706232864458, 'samples': 578592, 'steps': 1130, 'loss/train': 3.2731094360351562} -09/20/2021 18:24:11 - INFO - __main__ - Step 18082: {'lr': 0.0001999706232864458, 'samples': 578624, 'steps': 1130, 'loss/train': 4.007223606109619} -09/20/2021 18:24:12 - INFO - __main__ - Step 18083: {'lr': 0.0001999706232864458, 'samples': 578656, 'steps': 1130, 'loss/train': 3.354304075241089} -09/20/2021 18:24:13 - INFO - __main__ - Step 18084: {'lr': 0.0001999706232864458, 'samples': 578688, 'steps': 1130, 'loss/train': 4.443170547485352} -09/20/2021 18:24:13 - INFO - __main__ - Step 18085: {'lr': 0.0001999706232864458, 'samples': 578720, 'steps': 1130, 'loss/train': 3.59483003616333} -09/20/2021 18:24:14 - INFO - __main__ - Step 18086: {'lr': 0.0001999706232864458, 'samples': 578752, 'steps': 1130, 'loss/train': 3.9757001399993896} -09/20/2021 18:24:15 - INFO - __main__ - Step 18087: {'lr': 0.0001999706232864458, 'samples': 578784, 'steps': 1130, 'loss/train': 2.946504592895508} -09/20/2021 18:24:16 - INFO - __main__ - Step 18088: {'lr': 0.0001999706232864458, 'samples': 578816, 'steps': 1130, 'loss/train': 3.591033697128296} -09/20/2021 18:24:16 - INFO - __main__ - Step 18089: {'lr': 0.0001999706232864458, 'samples': 578848, 'steps': 1130, 'loss/train': 4.296442985534668} -09/20/2021 18:24:17 - INFO - __main__ - Step 18090: {'lr': 0.0001999706232864458, 'samples': 578880, 'steps': 1130, 'loss/train': 3.168945550918579} -09/20/2021 18:24:18 - INFO - __main__ - Step 18091: {'lr': 0.0001999706232864458, 'samples': 578912, 'steps': 1130, 'loss/train': 3.1205787658691406} -09/20/2021 18:24:19 - INFO - __main__ - Step 18092: {'lr': 0.0001999706232864458, 'samples': 578944, 'steps': 1130, 'loss/train': 2.817486524581909} -09/20/2021 18:24:19 - INFO - __main__ - Step 18093: {'lr': 0.0001999706232864458, 'samples': 578976, 'steps': 1130, 'loss/train': 3.2749693393707275} -09/20/2021 18:24:20 - INFO - __main__ - Step 18094: {'lr': 0.0001999706232864458, 'samples': 579008, 'steps': 1130, 'loss/train': 2.9209015369415283} -09/20/2021 18:24:21 - INFO - __main__ - Step 18095: {'lr': 0.0001999706232864458, 'samples': 579040, 'steps': 1130, 'loss/train': 3.789884090423584} -09/20/2021 18:24:22 - INFO - __main__ - Step 18096: {'lr': 0.0001999706232864458, 'samples': 579072, 'steps': 1130, 'loss/train': 3.0560286045074463} -09/20/2021 18:24:23 - INFO - __main__ - Step 18097: {'lr': 0.00019997046847634455, 'samples': 579104, 'steps': 1131, 'loss/train': 1.708000898361206} -09/20/2021 18:24:23 - INFO - __main__ - Step 18098: {'lr': 0.00019997046847634455, 'samples': 579136, 'steps': 1131, 'loss/train': 4.997897624969482} -09/20/2021 18:24:24 - INFO - __main__ - Step 18099: {'lr': 0.00019997046847634455, 'samples': 579168, 'steps': 1131, 'loss/train': 3.421671152114868} -09/20/2021 18:24:25 - INFO - __main__ - Step 18100: {'lr': 0.00019997046847634455, 'samples': 579200, 'steps': 1131, 'loss/train': 2.9886772632598877} -09/20/2021 18:24:26 - INFO - __main__ - Step 18101: {'lr': 0.00019997046847634455, 'samples': 579232, 'steps': 1131, 'loss/train': 3.7084059715270996} -09/20/2021 18:24:27 - INFO - __main__ - Step 18102: {'lr': 0.00019997046847634455, 'samples': 579264, 'steps': 1131, 'loss/train': 3.554434061050415} -09/20/2021 18:24:28 - INFO - __main__ - Step 18103: {'lr': 0.00019997046847634455, 'samples': 579296, 'steps': 1131, 'loss/train': 3.380385398864746} -09/20/2021 18:24:28 - INFO - __main__ - Step 18104: {'lr': 0.00019997046847634455, 'samples': 579328, 'steps': 1131, 'loss/train': 3.155059576034546} -09/20/2021 18:24:29 - INFO - __main__ - Step 18105: {'lr': 0.00019997046847634455, 'samples': 579360, 'steps': 1131, 'loss/train': 3.1959986686706543} -09/20/2021 18:24:30 - INFO - __main__ - Step 18106: {'lr': 0.00019997046847634455, 'samples': 579392, 'steps': 1131, 'loss/train': 3.4176254272460938} -09/20/2021 18:24:31 - INFO - __main__ - Step 18107: {'lr': 0.00019997046847634455, 'samples': 579424, 'steps': 1131, 'loss/train': 3.1768174171447754} -09/20/2021 18:24:31 - INFO - __main__ - Step 18108: {'lr': 0.00019997046847634455, 'samples': 579456, 'steps': 1131, 'loss/train': 3.9967739582061768} -09/20/2021 18:24:32 - INFO - __main__ - Step 18109: {'lr': 0.00019997046847634455, 'samples': 579488, 'steps': 1131, 'loss/train': 3.554915428161621} -09/20/2021 18:24:33 - INFO - __main__ - Step 18110: {'lr': 0.00019997046847634455, 'samples': 579520, 'steps': 1131, 'loss/train': 4.263247013092041} -09/20/2021 18:24:34 - INFO - __main__ - Step 18111: {'lr': 0.00019997046847634455, 'samples': 579552, 'steps': 1131, 'loss/train': 3.166232109069824} -09/20/2021 18:24:34 - INFO - __main__ - Step 18112: {'lr': 0.00019997046847634455, 'samples': 579584, 'steps': 1131, 'loss/train': 1.1690293550491333} -09/20/2021 18:24:35 - INFO - __main__ - Step 18113: {'lr': 0.00019997031325946386, 'samples': 579616, 'steps': 1132, 'loss/train': 3.497148036956787} -09/20/2021 18:24:36 - INFO - __main__ - Step 18114: {'lr': 0.00019997031325946386, 'samples': 579648, 'steps': 1132, 'loss/train': 3.437009811401367} -09/20/2021 18:24:37 - INFO - __main__ - Step 18115: {'lr': 0.00019997031325946386, 'samples': 579680, 'steps': 1132, 'loss/train': 3.891615152359009} -09/20/2021 18:24:38 - INFO - __main__ - Step 18116: {'lr': 0.00019997031325946386, 'samples': 579712, 'steps': 1132, 'loss/train': 2.606003761291504} -09/20/2021 18:24:38 - INFO - __main__ - Step 18117: {'lr': 0.00019997031325946386, 'samples': 579744, 'steps': 1132, 'loss/train': 3.8388121128082275} -09/20/2021 18:24:39 - INFO - __main__ - Step 18118: {'lr': 0.00019997031325946386, 'samples': 579776, 'steps': 1132, 'loss/train': 4.345019340515137} -09/20/2021 18:24:40 - INFO - __main__ - Step 18119: {'lr': 0.00019997031325946386, 'samples': 579808, 'steps': 1132, 'loss/train': 4.9762043952941895} -09/20/2021 18:24:41 - INFO - __main__ - Step 18120: {'lr': 0.00019997031325946386, 'samples': 579840, 'steps': 1132, 'loss/train': 5.359877109527588} -09/20/2021 18:24:41 - INFO - __main__ - Step 18121: {'lr': 0.00019997031325946386, 'samples': 579872, 'steps': 1132, 'loss/train': 4.546535015106201} -09/20/2021 18:24:42 - INFO - __main__ - Step 18122: {'lr': 0.00019997031325946386, 'samples': 579904, 'steps': 1132, 'loss/train': 3.6290712356567383} -09/20/2021 18:24:43 - INFO - __main__ - Step 18123: {'lr': 0.00019997031325946386, 'samples': 579936, 'steps': 1132, 'loss/train': 4.346781253814697} -09/20/2021 18:24:44 - INFO - __main__ - Step 18124: {'lr': 0.00019997031325946386, 'samples': 579968, 'steps': 1132, 'loss/train': 3.1478216648101807} -09/20/2021 18:24:44 - INFO - __main__ - Step 18125: {'lr': 0.00019997031325946386, 'samples': 580000, 'steps': 1132, 'loss/train': 0.5125660300254822} -09/20/2021 18:24:45 - INFO - __main__ - Step 18126: {'lr': 0.00019997031325946386, 'samples': 580032, 'steps': 1132, 'loss/train': 3.5615527629852295} -09/20/2021 18:24:46 - INFO - __main__ - Step 18127: {'lr': 0.00019997031325946386, 'samples': 580064, 'steps': 1132, 'loss/train': 3.717074155807495} -09/20/2021 18:24:47 - INFO - __main__ - Step 18128: {'lr': 0.00019997031325946386, 'samples': 580096, 'steps': 1132, 'loss/train': 4.4343791007995605} -09/20/2021 18:24:47 - INFO - __main__ - Step 18129: {'lr': 0.00019997015763580434, 'samples': 580128, 'steps': 1133, 'loss/train': 3.096259832382202} -09/20/2021 18:24:48 - INFO - __main__ - Step 18130: {'lr': 0.00019997015763580434, 'samples': 580160, 'steps': 1133, 'loss/train': 2.8499324321746826} -09/20/2021 18:24:49 - INFO - __main__ - Step 18131: {'lr': 0.00019997015763580434, 'samples': 580192, 'steps': 1133, 'loss/train': 3.896933078765869} -09/20/2021 18:24:50 - INFO - __main__ - Step 18132: {'lr': 0.00019997015763580434, 'samples': 580224, 'steps': 1133, 'loss/train': 2.5719892978668213} -09/20/2021 18:24:51 - INFO - __main__ - Step 18133: {'lr': 0.00019997015763580434, 'samples': 580256, 'steps': 1133, 'loss/train': 3.7797658443450928} -09/20/2021 18:24:52 - INFO - __main__ - Step 18134: {'lr': 0.00019997015763580434, 'samples': 580288, 'steps': 1133, 'loss/train': 3.11961030960083} -09/20/2021 18:24:52 - INFO - __main__ - Step 18135: {'lr': 0.00019997015763580434, 'samples': 580320, 'steps': 1133, 'loss/train': 2.9023971557617188} -09/20/2021 18:24:53 - INFO - __main__ - Step 18136: {'lr': 0.00019997015763580434, 'samples': 580352, 'steps': 1133, 'loss/train': 3.9783051013946533} -09/20/2021 18:24:54 - INFO - __main__ - Step 18137: {'lr': 0.00019997015763580434, 'samples': 580384, 'steps': 1133, 'loss/train': 4.5638532638549805} -09/20/2021 18:24:55 - INFO - __main__ - Step 18138: {'lr': 0.00019997015763580434, 'samples': 580416, 'steps': 1133, 'loss/train': 3.674978256225586} -09/20/2021 18:24:55 - INFO - __main__ - Step 18139: {'lr': 0.00019997015763580434, 'samples': 580448, 'steps': 1133, 'loss/train': 2.9608407020568848} -09/20/2021 18:24:56 - INFO - __main__ - Step 18140: {'lr': 0.00019997015763580434, 'samples': 580480, 'steps': 1133, 'loss/train': 3.584956169128418} -09/20/2021 18:24:57 - INFO - __main__ - Step 18141: {'lr': 0.00019997015763580434, 'samples': 580512, 'steps': 1133, 'loss/train': 4.660501956939697} -09/20/2021 18:24:58 - INFO - __main__ - Step 18142: {'lr': 0.00019997015763580434, 'samples': 580544, 'steps': 1133, 'loss/train': 4.4108476638793945} -09/20/2021 18:24:58 - INFO - __main__ - Step 18143: {'lr': 0.00019997015763580434, 'samples': 580576, 'steps': 1133, 'loss/train': 4.535069465637207} -09/20/2021 18:24:59 - INFO - __main__ - Step 18144: {'lr': 0.00019997015763580434, 'samples': 580608, 'steps': 1133, 'loss/train': 3.828845262527466} -09/20/2021 18:25:00 - INFO - __main__ - Step 18145: {'lr': 0.00019997000160536664, 'samples': 580640, 'steps': 1134, 'loss/train': 3.747758150100708} -09/20/2021 18:25:01 - INFO - __main__ - Step 18146: {'lr': 0.00019997000160536664, 'samples': 580672, 'steps': 1134, 'loss/train': 3.3505043983459473} -09/20/2021 18:25:02 - INFO - __main__ - Step 18147: {'lr': 0.00019997000160536664, 'samples': 580704, 'steps': 1134, 'loss/train': 3.8576436042785645} -09/20/2021 18:25:02 - INFO - __main__ - Step 18148: {'lr': 0.00019997000160536664, 'samples': 580736, 'steps': 1134, 'loss/train': 4.643186092376709} -09/20/2021 18:25:03 - INFO - __main__ - Step 18149: {'lr': 0.00019997000160536664, 'samples': 580768, 'steps': 1134, 'loss/train': 3.0477986335754395} -09/20/2021 18:25:04 - INFO - __main__ - Step 18150: {'lr': 0.00019997000160536664, 'samples': 580800, 'steps': 1134, 'loss/train': 3.6384098529815674} -09/20/2021 18:25:05 - INFO - __main__ - Step 18151: {'lr': 0.00019997000160536664, 'samples': 580832, 'steps': 1134, 'loss/train': 3.1692698001861572} -09/20/2021 18:25:05 - INFO - __main__ - Step 18152: {'lr': 0.00019997000160536664, 'samples': 580864, 'steps': 1134, 'loss/train': 3.9906208515167236} -09/20/2021 18:25:06 - INFO - __main__ - Step 18153: {'lr': 0.00019997000160536664, 'samples': 580896, 'steps': 1134, 'loss/train': 3.4362049102783203} -09/20/2021 18:25:07 - INFO - __main__ - Step 18154: {'lr': 0.00019997000160536664, 'samples': 580928, 'steps': 1134, 'loss/train': 2.8870527744293213} -09/20/2021 18:25:08 - INFO - __main__ - Step 18155: {'lr': 0.00019997000160536664, 'samples': 580960, 'steps': 1134, 'loss/train': 3.1829636096954346} -09/20/2021 18:25:08 - INFO - __main__ - Step 18156: {'lr': 0.00019997000160536664, 'samples': 580992, 'steps': 1134, 'loss/train': 3.648777484893799} -09/20/2021 18:25:09 - INFO - __main__ - Step 18157: {'lr': 0.00019997000160536664, 'samples': 581024, 'steps': 1134, 'loss/train': 3.838862895965576} -09/20/2021 18:25:10 - INFO - __main__ - Step 18158: {'lr': 0.00019997000160536664, 'samples': 581056, 'steps': 1134, 'loss/train': 4.3454203605651855} -09/20/2021 18:25:11 - INFO - __main__ - Step 18159: {'lr': 0.00019997000160536664, 'samples': 581088, 'steps': 1134, 'loss/train': 4.026724338531494} -09/20/2021 18:25:11 - INFO - __main__ - Step 18160: {'lr': 0.00019997000160536664, 'samples': 581120, 'steps': 1134, 'loss/train': 3.5238921642303467} -09/20/2021 18:25:12 - INFO - __main__ - Step 18161: {'lr': 0.00019996984516815135, 'samples': 581152, 'steps': 1135, 'loss/train': 3.4047322273254395} -09/20/2021 18:25:13 - INFO - __main__ - Step 18162: {'lr': 0.00019996984516815135, 'samples': 581184, 'steps': 1135, 'loss/train': 3.5549066066741943} -09/20/2021 18:25:15 - INFO - __main__ - Step 18163: {'lr': 0.00019996984516815135, 'samples': 581216, 'steps': 1135, 'loss/train': 4.39235782623291} -09/20/2021 18:25:15 - INFO - __main__ - Step 18164: {'lr': 0.00019996984516815135, 'samples': 581248, 'steps': 1135, 'loss/train': 3.9399573802948} -09/20/2021 18:25:16 - INFO - __main__ - Step 18165: {'lr': 0.00019996984516815135, 'samples': 581280, 'steps': 1135, 'loss/train': 2.84484601020813} -09/20/2021 18:25:17 - INFO - __main__ - Step 18166: {'lr': 0.00019996984516815135, 'samples': 581312, 'steps': 1135, 'loss/train': 3.4979331493377686} -09/20/2021 18:25:18 - INFO - __main__ - Step 18167: {'lr': 0.00019996984516815135, 'samples': 581344, 'steps': 1135, 'loss/train': 3.3097941875457764} -09/20/2021 18:25:18 - INFO - __main__ - Step 18168: {'lr': 0.00019996984516815135, 'samples': 581376, 'steps': 1135, 'loss/train': 3.5275931358337402} -09/20/2021 18:25:19 - INFO - __main__ - Step 18169: {'lr': 0.00019996984516815135, 'samples': 581408, 'steps': 1135, 'loss/train': 3.2664356231689453} -09/20/2021 18:25:20 - INFO - __main__ - Step 18170: {'lr': 0.00019996984516815135, 'samples': 581440, 'steps': 1135, 'loss/train': 4.47611141204834} -09/20/2021 18:25:21 - INFO - __main__ - Step 18171: {'lr': 0.00019996984516815135, 'samples': 581472, 'steps': 1135, 'loss/train': 3.865158796310425} -09/20/2021 18:25:21 - INFO - __main__ - Step 18172: {'lr': 0.00019996984516815135, 'samples': 581504, 'steps': 1135, 'loss/train': 4.704089164733887} -09/20/2021 18:25:22 - INFO - __main__ - Step 18173: {'lr': 0.00019996984516815135, 'samples': 581536, 'steps': 1135, 'loss/train': 4.672869682312012} -09/20/2021 18:25:23 - INFO - __main__ - Step 18174: {'lr': 0.00019996984516815135, 'samples': 581568, 'steps': 1135, 'loss/train': 4.941596984863281} -09/20/2021 18:25:24 - INFO - __main__ - Step 18175: {'lr': 0.00019996984516815135, 'samples': 581600, 'steps': 1135, 'loss/train': 3.3697054386138916} -09/20/2021 18:25:24 - INFO - __main__ - Step 18176: {'lr': 0.00019996984516815135, 'samples': 581632, 'steps': 1135, 'loss/train': 4.390895366668701} -09/20/2021 18:25:25 - INFO - __main__ - Step 18177: {'lr': 0.0001999696883241592, 'samples': 581664, 'steps': 1136, 'loss/train': 3.420240879058838} -09/20/2021 18:25:26 - INFO - __main__ - Step 18178: {'lr': 0.0001999696883241592, 'samples': 581696, 'steps': 1136, 'loss/train': 3.0631985664367676} -09/20/2021 18:25:27 - INFO - __main__ - Step 18179: {'lr': 0.0001999696883241592, 'samples': 581728, 'steps': 1136, 'loss/train': 1.165460228919983} -09/20/2021 18:25:27 - INFO - __main__ - Step 18180: {'lr': 0.0001999696883241592, 'samples': 581760, 'steps': 1136, 'loss/train': 0.5678395628929138} -09/20/2021 18:25:28 - INFO - __main__ - Step 18181: {'lr': 0.0001999696883241592, 'samples': 581792, 'steps': 1136, 'loss/train': 2.1077115535736084} -09/20/2021 18:25:29 - INFO - __main__ - Step 18182: {'lr': 0.0001999696883241592, 'samples': 581824, 'steps': 1136, 'loss/train': 0.9767134785652161} -09/20/2021 18:25:30 - INFO - __main__ - Step 18183: {'lr': 0.0001999696883241592, 'samples': 581856, 'steps': 1136, 'loss/train': 1.2752254009246826} -09/20/2021 18:25:30 - INFO - __main__ - Step 18184: {'lr': 0.0001999696883241592, 'samples': 581888, 'steps': 1136, 'loss/train': 3.0985007286071777} -09/20/2021 18:25:31 - INFO - __main__ - Step 18185: {'lr': 0.0001999696883241592, 'samples': 581920, 'steps': 1136, 'loss/train': 3.938950538635254} -09/20/2021 18:25:32 - INFO - __main__ - Step 18186: {'lr': 0.0001999696883241592, 'samples': 581952, 'steps': 1136, 'loss/train': 3.0495247840881348} -09/20/2021 18:25:33 - INFO - __main__ - Step 18187: {'lr': 0.0001999696883241592, 'samples': 581984, 'steps': 1136, 'loss/train': 3.495312452316284} -09/20/2021 18:25:33 - INFO - __main__ - Step 18188: {'lr': 0.0001999696883241592, 'samples': 582016, 'steps': 1136, 'loss/train': 3.202213764190674} -09/20/2021 18:25:34 - INFO - __main__ - Step 18189: {'lr': 0.0001999696883241592, 'samples': 582048, 'steps': 1136, 'loss/train': 4.733370780944824} -09/20/2021 18:25:35 - INFO - __main__ - Step 18190: {'lr': 0.0001999696883241592, 'samples': 582080, 'steps': 1136, 'loss/train': 2.8304126262664795} -09/20/2021 18:25:36 - INFO - __main__ - Step 18191: {'lr': 0.0001999696883241592, 'samples': 582112, 'steps': 1136, 'loss/train': 2.5571582317352295} -09/20/2021 18:25:36 - INFO - __main__ - Step 18192: {'lr': 0.0001999696883241592, 'samples': 582144, 'steps': 1136, 'loss/train': 3.3800575733184814} -09/20/2021 18:25:38 - INFO - __main__ - Step 18193: {'lr': 0.00019996953107339079, 'samples': 582176, 'steps': 1137, 'loss/train': 4.887996673583984} -09/20/2021 18:25:39 - INFO - __main__ - Step 18194: {'lr': 0.00019996953107339079, 'samples': 582208, 'steps': 1137, 'loss/train': 3.9982900619506836} -09/20/2021 18:25:40 - INFO - __main__ - Step 18195: {'lr': 0.00019996953107339079, 'samples': 582240, 'steps': 1137, 'loss/train': 4.364871501922607} -09/20/2021 18:25:41 - INFO - __main__ - Step 18196: {'lr': 0.00019996953107339079, 'samples': 582272, 'steps': 1137, 'loss/train': 3.966430902481079} -09/20/2021 18:25:41 - INFO - __main__ - Step 18197: {'lr': 0.00019996953107339079, 'samples': 582304, 'steps': 1137, 'loss/train': 4.040099620819092} -09/20/2021 18:25:42 - INFO - __main__ - Step 18198: {'lr': 0.00019996953107339079, 'samples': 582336, 'steps': 1137, 'loss/train': 3.96125864982605} -09/20/2021 18:25:43 - INFO - __main__ - Step 18199: {'lr': 0.00019996953107339079, 'samples': 582368, 'steps': 1137, 'loss/train': 3.6005287170410156} -09/20/2021 18:25:44 - INFO - __main__ - Step 18200: {'lr': 0.00019996953107339079, 'samples': 582400, 'steps': 1137, 'loss/train': 4.334300994873047} -09/20/2021 18:25:44 - INFO - __main__ - Step 18201: {'lr': 0.00019996953107339079, 'samples': 582432, 'steps': 1137, 'loss/train': 3.3094661235809326} -09/20/2021 18:25:45 - INFO - __main__ - Step 18202: {'lr': 0.00019996953107339079, 'samples': 582464, 'steps': 1137, 'loss/train': 4.0485124588012695} -09/20/2021 18:25:46 - INFO - __main__ - Step 18203: {'lr': 0.00019996953107339079, 'samples': 582496, 'steps': 1137, 'loss/train': 3.2454891204833984} -09/20/2021 18:25:47 - INFO - __main__ - Step 18204: {'lr': 0.00019996953107339079, 'samples': 582528, 'steps': 1137, 'loss/train': 2.7661430835723877} -09/20/2021 18:25:47 - INFO - __main__ - Step 18205: {'lr': 0.00019996953107339079, 'samples': 582560, 'steps': 1137, 'loss/train': 4.147496700286865} -09/20/2021 18:25:48 - INFO - __main__ - Step 18206: {'lr': 0.00019996953107339079, 'samples': 582592, 'steps': 1137, 'loss/train': 4.09138822555542} -09/20/2021 18:25:49 - INFO - __main__ - Step 18207: {'lr': 0.00019996953107339079, 'samples': 582624, 'steps': 1137, 'loss/train': 4.453566551208496} -09/20/2021 18:25:50 - INFO - __main__ - Step 18208: {'lr': 0.00019996953107339079, 'samples': 582656, 'steps': 1137, 'loss/train': 4.8990797996521} -09/20/2021 18:25:50 - INFO - __main__ - Step 18209: {'lr': 0.00019996937341584673, 'samples': 582688, 'steps': 1138, 'loss/train': 2.8152077198028564} -09/20/2021 18:25:51 - INFO - __main__ - Step 18210: {'lr': 0.00019996937341584673, 'samples': 582720, 'steps': 1138, 'loss/train': 3.4166173934936523} -09/20/2021 18:25:52 - INFO - __main__ - Step 18211: {'lr': 0.00019996937341584673, 'samples': 582752, 'steps': 1138, 'loss/train': 3.95670485496521} -09/20/2021 18:25:53 - INFO - __main__ - Step 18212: {'lr': 0.00019996937341584673, 'samples': 582784, 'steps': 1138, 'loss/train': 4.305505752563477} -09/20/2021 18:25:53 - INFO - __main__ - Step 18213: {'lr': 0.00019996937341584673, 'samples': 582816, 'steps': 1138, 'loss/train': 3.141031503677368} -09/20/2021 18:25:54 - INFO - __main__ - Step 18214: {'lr': 0.00019996937341584673, 'samples': 582848, 'steps': 1138, 'loss/train': 3.233959197998047} -09/20/2021 18:25:55 - INFO - __main__ - Step 18215: {'lr': 0.00019996937341584673, 'samples': 582880, 'steps': 1138, 'loss/train': 3.8131918907165527} -09/20/2021 18:25:56 - INFO - __main__ - Step 18216: {'lr': 0.00019996937341584673, 'samples': 582912, 'steps': 1138, 'loss/train': 3.7162675857543945} -09/20/2021 18:25:56 - INFO - __main__ - Step 18217: {'lr': 0.00019996937341584673, 'samples': 582944, 'steps': 1138, 'loss/train': 3.7133796215057373} -09/20/2021 18:25:57 - INFO - __main__ - Step 18218: {'lr': 0.00019996937341584673, 'samples': 582976, 'steps': 1138, 'loss/train': 4.045193195343018} -09/20/2021 18:25:58 - INFO - __main__ - Step 18219: {'lr': 0.00019996937341584673, 'samples': 583008, 'steps': 1138, 'loss/train': 4.532642841339111} -09/20/2021 18:25:59 - INFO - __main__ - Step 18220: {'lr': 0.00019996937341584673, 'samples': 583040, 'steps': 1138, 'loss/train': 1.1809364557266235} -09/20/2021 18:25:59 - INFO - __main__ - Step 18221: {'lr': 0.00019996937341584673, 'samples': 583072, 'steps': 1138, 'loss/train': 3.2143006324768066} -09/20/2021 18:26:00 - INFO - __main__ - Step 18222: {'lr': 0.00019996937341584673, 'samples': 583104, 'steps': 1138, 'loss/train': 1.2119324207305908} -09/20/2021 18:26:01 - INFO - __main__ - Step 18223: {'lr': 0.00019996937341584673, 'samples': 583136, 'steps': 1138, 'loss/train': 0.9347920417785645} -09/20/2021 18:26:02 - INFO - __main__ - Step 18224: {'lr': 0.00019996937341584673, 'samples': 583168, 'steps': 1138, 'loss/train': 1.1333179473876953} -09/20/2021 18:26:03 - INFO - __main__ - Step 18225: {'lr': 0.00019996921535152764, 'samples': 583200, 'steps': 1139, 'loss/train': 1.0644779205322266} -09/20/2021 18:26:04 - INFO - __main__ - Step 18226: {'lr': 0.00019996921535152764, 'samples': 583232, 'steps': 1139, 'loss/train': 2.2699484825134277} -09/20/2021 18:26:05 - INFO - __main__ - Step 18227: {'lr': 0.00019996921535152764, 'samples': 583264, 'steps': 1139, 'loss/train': 3.753230571746826} -09/20/2021 18:26:05 - INFO - __main__ - Step 18228: {'lr': 0.00019996921535152764, 'samples': 583296, 'steps': 1139, 'loss/train': 3.591425895690918} -09/20/2021 18:26:06 - INFO - __main__ - Step 18229: {'lr': 0.00019996921535152764, 'samples': 583328, 'steps': 1139, 'loss/train': 3.183948516845703} -09/20/2021 18:26:07 - INFO - __main__ - Step 18230: {'lr': 0.00019996921535152764, 'samples': 583360, 'steps': 1139, 'loss/train': 3.909675121307373} -09/20/2021 18:26:08 - INFO - __main__ - Step 18231: {'lr': 0.00019996921535152764, 'samples': 583392, 'steps': 1139, 'loss/train': 2.956606149673462} -09/20/2021 18:26:08 - INFO - __main__ - Step 18232: {'lr': 0.00019996921535152764, 'samples': 583424, 'steps': 1139, 'loss/train': 3.7856969833374023} -09/20/2021 18:26:09 - INFO - __main__ - Step 18233: {'lr': 0.00019996921535152764, 'samples': 583456, 'steps': 1139, 'loss/train': 3.7890851497650146} -09/20/2021 18:26:10 - INFO - __main__ - Step 18234: {'lr': 0.00019996921535152764, 'samples': 583488, 'steps': 1139, 'loss/train': 4.268918037414551} -09/20/2021 18:26:11 - INFO - __main__ - Step 18235: {'lr': 0.00019996921535152764, 'samples': 583520, 'steps': 1139, 'loss/train': 3.720686912536621} -09/20/2021 18:26:11 - INFO - __main__ - Step 18236: {'lr': 0.00019996921535152764, 'samples': 583552, 'steps': 1139, 'loss/train': 2.9800643920898438} -09/20/2021 18:26:12 - INFO - __main__ - Step 18237: {'lr': 0.00019996921535152764, 'samples': 583584, 'steps': 1139, 'loss/train': 3.158439874649048} -09/20/2021 18:26:13 - INFO - __main__ - Step 18238: {'lr': 0.00019996921535152764, 'samples': 583616, 'steps': 1139, 'loss/train': 2.732804775238037} -09/20/2021 18:26:14 - INFO - __main__ - Step 18239: {'lr': 0.00019996921535152764, 'samples': 583648, 'steps': 1139, 'loss/train': 3.0937716960906982} -09/20/2021 18:26:14 - INFO - __main__ - Step 18240: {'lr': 0.00019996921535152764, 'samples': 583680, 'steps': 1139, 'loss/train': 3.6674911975860596} -09/20/2021 18:26:15 - INFO - __main__ - Step 18241: {'lr': 0.0001999690568804342, 'samples': 583712, 'steps': 1140, 'loss/train': 3.0778086185455322} -09/20/2021 18:26:16 - INFO - __main__ - Step 18242: {'lr': 0.0001999690568804342, 'samples': 583744, 'steps': 1140, 'loss/train': 2.423322916030884} -09/20/2021 18:26:17 - INFO - __main__ - Step 18243: {'lr': 0.0001999690568804342, 'samples': 583776, 'steps': 1140, 'loss/train': 3.676361322402954} -09/20/2021 18:26:18 - INFO - __main__ - Step 18244: {'lr': 0.0001999690568804342, 'samples': 583808, 'steps': 1140, 'loss/train': 3.701625347137451} -09/20/2021 18:26:18 - INFO - __main__ - Step 18245: {'lr': 0.0001999690568804342, 'samples': 583840, 'steps': 1140, 'loss/train': 3.1058149337768555} -09/20/2021 18:26:19 - INFO - __main__ - Step 18246: {'lr': 0.0001999690568804342, 'samples': 583872, 'steps': 1140, 'loss/train': 2.760921001434326} -09/20/2021 18:26:20 - INFO - __main__ - Step 18247: {'lr': 0.0001999690568804342, 'samples': 583904, 'steps': 1140, 'loss/train': 4.667999267578125} -09/20/2021 18:26:21 - INFO - __main__ - Step 18248: {'lr': 0.0001999690568804342, 'samples': 583936, 'steps': 1140, 'loss/train': 4.588489055633545} -09/20/2021 18:26:21 - INFO - __main__ - Step 18249: {'lr': 0.0001999690568804342, 'samples': 583968, 'steps': 1140, 'loss/train': 4.581266403198242} -09/20/2021 18:26:22 - INFO - __main__ - Step 18250: {'lr': 0.0001999690568804342, 'samples': 584000, 'steps': 1140, 'loss/train': 3.457658052444458} -09/20/2021 18:26:23 - INFO - __main__ - Step 18251: {'lr': 0.0001999690568804342, 'samples': 584032, 'steps': 1140, 'loss/train': 2.6005446910858154} -09/20/2021 18:26:24 - INFO - __main__ - Step 18252: {'lr': 0.0001999690568804342, 'samples': 584064, 'steps': 1140, 'loss/train': 3.503633737564087} -09/20/2021 18:26:24 - INFO - __main__ - Step 18253: {'lr': 0.0001999690568804342, 'samples': 584096, 'steps': 1140, 'loss/train': 4.3013410568237305} -09/20/2021 18:26:25 - INFO - __main__ - Step 18254: {'lr': 0.0001999690568804342, 'samples': 584128, 'steps': 1140, 'loss/train': 3.82314395904541} -09/20/2021 18:26:26 - INFO - __main__ - Step 18255: {'lr': 0.0001999690568804342, 'samples': 584160, 'steps': 1140, 'loss/train': 4.653661251068115} -09/20/2021 18:26:27 - INFO - __main__ - Step 18256: {'lr': 0.0001999690568804342, 'samples': 584192, 'steps': 1140, 'loss/train': 3.0781562328338623} -09/20/2021 18:26:27 - INFO - __main__ - Step 18257: {'lr': 0.0001999688980025671, 'samples': 584224, 'steps': 1141, 'loss/train': 2.9493656158447266} -09/20/2021 18:26:29 - INFO - __main__ - Step 18258: {'lr': 0.0001999688980025671, 'samples': 584256, 'steps': 1141, 'loss/train': 3.855924129486084} -09/20/2021 18:26:30 - INFO - __main__ - Step 18259: {'lr': 0.0001999688980025671, 'samples': 584288, 'steps': 1141, 'loss/train': 4.026285171508789} -09/20/2021 18:26:30 - INFO - __main__ - Step 18260: {'lr': 0.0001999688980025671, 'samples': 584320, 'steps': 1141, 'loss/train': 4.432528972625732} -09/20/2021 18:26:31 - INFO - __main__ - Step 18261: {'lr': 0.0001999688980025671, 'samples': 584352, 'steps': 1141, 'loss/train': 3.415708303451538} -09/20/2021 18:26:32 - INFO - __main__ - Step 18262: {'lr': 0.0001999688980025671, 'samples': 584384, 'steps': 1141, 'loss/train': 3.6864726543426514} -09/20/2021 18:26:33 - INFO - __main__ - Step 18263: {'lr': 0.0001999688980025671, 'samples': 584416, 'steps': 1141, 'loss/train': 4.719151020050049} -09/20/2021 18:26:33 - INFO - __main__ - Step 18264: {'lr': 0.0001999688980025671, 'samples': 584448, 'steps': 1141, 'loss/train': 3.3741097450256348} -09/20/2021 18:26:34 - INFO - __main__ - Step 18265: {'lr': 0.0001999688980025671, 'samples': 584480, 'steps': 1141, 'loss/train': 3.129784345626831} -09/20/2021 18:26:35 - INFO - __main__ - Step 18266: {'lr': 0.0001999688980025671, 'samples': 584512, 'steps': 1141, 'loss/train': 3.8885915279388428} -09/20/2021 18:26:36 - INFO - __main__ - Step 18267: {'lr': 0.0001999688980025671, 'samples': 584544, 'steps': 1141, 'loss/train': 3.2400405406951904} -09/20/2021 18:26:36 - INFO - __main__ - Step 18268: {'lr': 0.0001999688980025671, 'samples': 584576, 'steps': 1141, 'loss/train': 2.716251850128174} -09/20/2021 18:26:37 - INFO - __main__ - Step 18269: {'lr': 0.0001999688980025671, 'samples': 584608, 'steps': 1141, 'loss/train': 2.9762043952941895} -09/20/2021 18:26:38 - INFO - __main__ - Step 18270: {'lr': 0.0001999688980025671, 'samples': 584640, 'steps': 1141, 'loss/train': 3.007208824157715} -09/20/2021 18:26:39 - INFO - __main__ - Step 18271: {'lr': 0.0001999688980025671, 'samples': 584672, 'steps': 1141, 'loss/train': 4.915513515472412} -09/20/2021 18:26:39 - INFO - __main__ - Step 18272: {'lr': 0.0001999688980025671, 'samples': 584704, 'steps': 1141, 'loss/train': 2.6709775924682617} -09/20/2021 18:26:40 - INFO - __main__ - Step 18273: {'lr': 0.00019996873871792694, 'samples': 584736, 'steps': 1142, 'loss/train': 4.2316789627075195} -09/20/2021 18:26:41 - INFO - __main__ - Step 18274: {'lr': 0.00019996873871792694, 'samples': 584768, 'steps': 1142, 'loss/train': 4.248139381408691} -09/20/2021 18:26:42 - INFO - __main__ - Step 18275: {'lr': 0.00019996873871792694, 'samples': 584800, 'steps': 1142, 'loss/train': 2.9320411682128906} -09/20/2021 18:26:42 - INFO - __main__ - Step 18276: {'lr': 0.00019996873871792694, 'samples': 584832, 'steps': 1142, 'loss/train': 2.983511209487915} -09/20/2021 18:26:43 - INFO - __main__ - Step 18277: {'lr': 0.00019996873871792694, 'samples': 584864, 'steps': 1142, 'loss/train': 3.583860158920288} -09/20/2021 18:26:44 - INFO - __main__ - Step 18278: {'lr': 0.00019996873871792694, 'samples': 584896, 'steps': 1142, 'loss/train': 3.1155941486358643} -09/20/2021 18:26:45 - INFO - __main__ - Step 18279: {'lr': 0.00019996873871792694, 'samples': 584928, 'steps': 1142, 'loss/train': 2.8393309116363525} -09/20/2021 18:26:45 - INFO - __main__ - Step 18280: {'lr': 0.00019996873871792694, 'samples': 584960, 'steps': 1142, 'loss/train': 3.15490460395813} -09/20/2021 18:26:46 - INFO - __main__ - Step 18281: {'lr': 0.00019996873871792694, 'samples': 584992, 'steps': 1142, 'loss/train': 3.1071319580078125} -09/20/2021 18:26:47 - INFO - __main__ - Step 18282: {'lr': 0.00019996873871792694, 'samples': 585024, 'steps': 1142, 'loss/train': 3.5012567043304443} -09/20/2021 18:26:48 - INFO - __main__ - Step 18283: {'lr': 0.00019996873871792694, 'samples': 585056, 'steps': 1142, 'loss/train': 4.204848766326904} -09/20/2021 18:26:48 - INFO - __main__ - Step 18284: {'lr': 0.00019996873871792694, 'samples': 585088, 'steps': 1142, 'loss/train': 3.1873626708984375} -09/20/2021 18:26:49 - INFO - __main__ - Step 18285: {'lr': 0.00019996873871792694, 'samples': 585120, 'steps': 1142, 'loss/train': 3.4581339359283447} -09/20/2021 18:26:50 - INFO - __main__ - Step 18286: {'lr': 0.00019996873871792694, 'samples': 585152, 'steps': 1142, 'loss/train': 3.9673871994018555} -09/20/2021 18:26:51 - INFO - __main__ - Step 18287: {'lr': 0.00019996873871792694, 'samples': 585184, 'steps': 1142, 'loss/train': 4.01353645324707} -09/20/2021 18:26:51 - INFO - __main__ - Step 18288: {'lr': 0.00019996873871792694, 'samples': 585216, 'steps': 1142, 'loss/train': 3.4503326416015625} -09/20/2021 18:26:53 - INFO - __main__ - Step 18289: {'lr': 0.00019996857902651436, 'samples': 585248, 'steps': 1143, 'loss/train': 2.404924154281616} -09/20/2021 18:26:54 - INFO - __main__ - Step 18290: {'lr': 0.00019996857902651436, 'samples': 585280, 'steps': 1143, 'loss/train': 2.33760929107666} -09/20/2021 18:26:55 - INFO - __main__ - Step 18291: {'lr': 0.00019996857902651436, 'samples': 585312, 'steps': 1143, 'loss/train': 2.8135454654693604} -09/20/2021 18:26:55 - INFO - __main__ - Step 18292: {'lr': 0.00019996857902651436, 'samples': 585344, 'steps': 1143, 'loss/train': 5.614107608795166} -09/20/2021 18:26:56 - INFO - __main__ - Step 18293: {'lr': 0.00019996857902651436, 'samples': 585376, 'steps': 1143, 'loss/train': 6.159210681915283} -09/20/2021 18:26:57 - INFO - __main__ - Step 18294: {'lr': 0.00019996857902651436, 'samples': 585408, 'steps': 1143, 'loss/train': 3.4904606342315674} -09/20/2021 18:26:58 - INFO - __main__ - Step 18295: {'lr': 0.00019996857902651436, 'samples': 585440, 'steps': 1143, 'loss/train': 3.4447879791259766} -09/20/2021 18:26:58 - INFO - __main__ - Step 18296: {'lr': 0.00019996857902651436, 'samples': 585472, 'steps': 1143, 'loss/train': 3.6319572925567627} -09/20/2021 18:26:59 - INFO - __main__ - Step 18297: {'lr': 0.00019996857902651436, 'samples': 585504, 'steps': 1143, 'loss/train': 2.182379722595215} -09/20/2021 18:27:00 - INFO - __main__ - Step 18298: {'lr': 0.00019996857902651436, 'samples': 585536, 'steps': 1143, 'loss/train': 3.1796817779541016} -09/20/2021 18:27:01 - INFO - __main__ - Step 18299: {'lr': 0.00019996857902651436, 'samples': 585568, 'steps': 1143, 'loss/train': 3.801314353942871} -09/20/2021 18:27:01 - INFO - __main__ - Step 18300: {'lr': 0.00019996857902651436, 'samples': 585600, 'steps': 1143, 'loss/train': 4.191883563995361} -09/20/2021 18:27:02 - INFO - __main__ - Step 18301: {'lr': 0.00019996857902651436, 'samples': 585632, 'steps': 1143, 'loss/train': 3.145419120788574} -09/20/2021 18:27:03 - INFO - __main__ - Step 18302: {'lr': 0.00019996857902651436, 'samples': 585664, 'steps': 1143, 'loss/train': 3.2686007022857666} -09/20/2021 18:27:04 - INFO - __main__ - Step 18303: {'lr': 0.00019996857902651436, 'samples': 585696, 'steps': 1143, 'loss/train': 2.50223708152771} -09/20/2021 18:27:04 - INFO - __main__ - Step 18304: {'lr': 0.00019996857902651436, 'samples': 585728, 'steps': 1143, 'loss/train': 3.3676846027374268} -09/20/2021 18:27:05 - INFO - __main__ - Step 18305: {'lr': 0.00019996841892833, 'samples': 585760, 'steps': 1144, 'loss/train': 3.1497013568878174} -09/20/2021 18:27:06 - INFO - __main__ - Step 18306: {'lr': 0.00019996841892833, 'samples': 585792, 'steps': 1144, 'loss/train': 4.124988555908203} -09/20/2021 18:27:07 - INFO - __main__ - Step 18307: {'lr': 0.00019996841892833, 'samples': 585824, 'steps': 1144, 'loss/train': 4.96575927734375} -09/20/2021 18:27:07 - INFO - __main__ - Step 18308: {'lr': 0.00019996841892833, 'samples': 585856, 'steps': 1144, 'loss/train': 4.176600456237793} -09/20/2021 18:27:08 - INFO - __main__ - Step 18309: {'lr': 0.00019996841892833, 'samples': 585888, 'steps': 1144, 'loss/train': 2.7304911613464355} -09/20/2021 18:27:09 - INFO - __main__ - Step 18310: {'lr': 0.00019996841892833, 'samples': 585920, 'steps': 1144, 'loss/train': 3.3112258911132812} -09/20/2021 18:27:10 - INFO - __main__ - Step 18311: {'lr': 0.00019996841892833, 'samples': 585952, 'steps': 1144, 'loss/train': 2.9059934616088867} -09/20/2021 18:27:10 - INFO - __main__ - Step 18312: {'lr': 0.00019996841892833, 'samples': 585984, 'steps': 1144, 'loss/train': 3.6030209064483643} -09/20/2021 18:27:11 - INFO - __main__ - Step 18313: {'lr': 0.00019996841892833, 'samples': 586016, 'steps': 1144, 'loss/train': 4.444982051849365} -09/20/2021 18:27:12 - INFO - __main__ - Step 18314: {'lr': 0.00019996841892833, 'samples': 586048, 'steps': 1144, 'loss/train': 4.1723785400390625} -09/20/2021 18:27:13 - INFO - __main__ - Step 18315: {'lr': 0.00019996841892833, 'samples': 586080, 'steps': 1144, 'loss/train': 4.013613224029541} -09/20/2021 18:27:13 - INFO - __main__ - Step 18316: {'lr': 0.00019996841892833, 'samples': 586112, 'steps': 1144, 'loss/train': 3.2985477447509766} -09/20/2021 18:27:14 - INFO - __main__ - Step 18317: {'lr': 0.00019996841892833, 'samples': 586144, 'steps': 1144, 'loss/train': 3.2331318855285645} -09/20/2021 18:27:15 - INFO - __main__ - Step 18318: {'lr': 0.00019996841892833, 'samples': 586176, 'steps': 1144, 'loss/train': 3.6723785400390625} -09/20/2021 18:27:16 - INFO - __main__ - Step 18319: {'lr': 0.00019996841892833, 'samples': 586208, 'steps': 1144, 'loss/train': 0.5811808705329895} -09/20/2021 18:27:16 - INFO - __main__ - Step 18320: {'lr': 0.00019996841892833, 'samples': 586240, 'steps': 1144, 'loss/train': 3.4935874938964844} -09/20/2021 18:27:17 - INFO - __main__ - Step 18321: {'lr': 0.00019996825842337454, 'samples': 586272, 'steps': 1145, 'loss/train': 4.724615573883057} -09/20/2021 18:27:18 - INFO - __main__ - Step 18322: {'lr': 0.00019996825842337454, 'samples': 586304, 'steps': 1145, 'loss/train': 4.522485733032227} -09/20/2021 18:27:19 - INFO - __main__ - Step 18323: {'lr': 0.00019996825842337454, 'samples': 586336, 'steps': 1145, 'loss/train': 4.605083465576172} -09/20/2021 18:27:20 - INFO - __main__ - Step 18324: {'lr': 0.00019996825842337454, 'samples': 586368, 'steps': 1145, 'loss/train': 4.035343170166016} -09/20/2021 18:27:21 - INFO - __main__ - Step 18325: {'lr': 0.00019996825842337454, 'samples': 586400, 'steps': 1145, 'loss/train': 3.787627935409546} -09/20/2021 18:27:22 - INFO - __main__ - Step 18326: {'lr': 0.00019996825842337454, 'samples': 586432, 'steps': 1145, 'loss/train': 2.6041676998138428} -09/20/2021 18:27:22 - INFO - __main__ - Step 18327: {'lr': 0.00019996825842337454, 'samples': 586464, 'steps': 1145, 'loss/train': 2.6792216300964355} -09/20/2021 18:27:23 - INFO - __main__ - Step 18328: {'lr': 0.00019996825842337454, 'samples': 586496, 'steps': 1145, 'loss/train': 3.823465347290039} -09/20/2021 18:27:24 - INFO - __main__ - Step 18329: {'lr': 0.00019996825842337454, 'samples': 586528, 'steps': 1145, 'loss/train': 2.815711259841919} -09/20/2021 18:27:25 - INFO - __main__ - Step 18330: {'lr': 0.00019996825842337454, 'samples': 586560, 'steps': 1145, 'loss/train': 2.8490092754364014} -09/20/2021 18:27:25 - INFO - __main__ - Step 18331: {'lr': 0.00019996825842337454, 'samples': 586592, 'steps': 1145, 'loss/train': 3.069453477859497} -09/20/2021 18:27:26 - INFO - __main__ - Step 18332: {'lr': 0.00019996825842337454, 'samples': 586624, 'steps': 1145, 'loss/train': 2.5991241931915283} -09/20/2021 18:27:27 - INFO - __main__ - Step 18333: {'lr': 0.00019996825842337454, 'samples': 586656, 'steps': 1145, 'loss/train': 3.563870668411255} -09/20/2021 18:27:28 - INFO - __main__ - Step 18334: {'lr': 0.00019996825842337454, 'samples': 586688, 'steps': 1145, 'loss/train': 3.828256368637085} -09/20/2021 18:27:28 - INFO - __main__ - Step 18335: {'lr': 0.00019996825842337454, 'samples': 586720, 'steps': 1145, 'loss/train': 2.9165616035461426} -09/20/2021 18:27:29 - INFO - __main__ - Step 18336: {'lr': 0.00019996825842337454, 'samples': 586752, 'steps': 1145, 'loss/train': 2.820204496383667} -09/20/2021 18:27:30 - INFO - __main__ - Step 18337: {'lr': 0.00019996809751164865, 'samples': 586784, 'steps': 1146, 'loss/train': 3.8400790691375732} -09/20/2021 18:27:31 - INFO - __main__ - Step 18338: {'lr': 0.00019996809751164865, 'samples': 586816, 'steps': 1146, 'loss/train': 6.487607002258301} -09/20/2021 18:27:32 - INFO - __main__ - Step 18339: {'lr': 0.00019996809751164865, 'samples': 586848, 'steps': 1146, 'loss/train': 3.4426560401916504} -09/20/2021 18:27:32 - INFO - __main__ - Step 18340: {'lr': 0.00019996809751164865, 'samples': 586880, 'steps': 1146, 'loss/train': 4.095435619354248} -09/20/2021 18:27:33 - INFO - __main__ - Step 18341: {'lr': 0.00019996809751164865, 'samples': 586912, 'steps': 1146, 'loss/train': 5.487399578094482} -09/20/2021 18:27:34 - INFO - __main__ - Step 18342: {'lr': 0.00019996809751164865, 'samples': 586944, 'steps': 1146, 'loss/train': 4.519649505615234} -09/20/2021 18:27:35 - INFO - __main__ - Step 18343: {'lr': 0.00019996809751164865, 'samples': 586976, 'steps': 1146, 'loss/train': 3.5444424152374268} -09/20/2021 18:27:35 - INFO - __main__ - Step 18344: {'lr': 0.00019996809751164865, 'samples': 587008, 'steps': 1146, 'loss/train': 3.0278244018554688} -09/20/2021 18:27:36 - INFO - __main__ - Step 18345: {'lr': 0.00019996809751164865, 'samples': 587040, 'steps': 1146, 'loss/train': 3.799809455871582} -09/20/2021 18:27:37 - INFO - __main__ - Step 18346: {'lr': 0.00019996809751164865, 'samples': 587072, 'steps': 1146, 'loss/train': 5.169220447540283} -09/20/2021 18:27:38 - INFO - __main__ - Step 18347: {'lr': 0.00019996809751164865, 'samples': 587104, 'steps': 1146, 'loss/train': 5.723618030548096} -09/20/2021 18:27:38 - INFO - __main__ - Step 18348: {'lr': 0.00019996809751164865, 'samples': 587136, 'steps': 1146, 'loss/train': 5.666236877441406} -09/20/2021 18:27:39 - INFO - __main__ - Step 18349: {'lr': 0.00019996809751164865, 'samples': 587168, 'steps': 1146, 'loss/train': 4.52955961227417} -09/20/2021 18:27:40 - INFO - __main__ - Step 18350: {'lr': 0.00019996809751164865, 'samples': 587200, 'steps': 1146, 'loss/train': 3.1414618492126465} -09/20/2021 18:27:41 - INFO - __main__ - Step 18351: {'lr': 0.00019996809751164865, 'samples': 587232, 'steps': 1146, 'loss/train': 2.7185070514678955} -09/20/2021 18:27:41 - INFO - __main__ - Step 18352: {'lr': 0.00019996809751164865, 'samples': 587264, 'steps': 1146, 'loss/train': 3.105191469192505} -09/20/2021 18:27:42 - INFO - __main__ - Step 18353: {'lr': 0.00019996793619315293, 'samples': 587296, 'steps': 1147, 'loss/train': 4.165614604949951} -09/20/2021 18:27:43 - INFO - __main__ - Step 18354: {'lr': 0.00019996793619315293, 'samples': 587328, 'steps': 1147, 'loss/train': 1.4377647638320923} -09/20/2021 18:27:44 - INFO - __main__ - Step 18355: {'lr': 0.00019996793619315293, 'samples': 587360, 'steps': 1147, 'loss/train': 4.366908550262451} -09/20/2021 18:27:45 - INFO - __main__ - Step 18356: {'lr': 0.00019996793619315293, 'samples': 587392, 'steps': 1147, 'loss/train': 3.0274808406829834} -09/20/2021 18:27:46 - INFO - __main__ - Step 18357: {'lr': 0.00019996793619315293, 'samples': 587424, 'steps': 1147, 'loss/train': 3.7131669521331787} -09/20/2021 18:27:46 - INFO - __main__ - Step 18358: {'lr': 0.00019996793619315293, 'samples': 587456, 'steps': 1147, 'loss/train': 3.6344196796417236} -09/20/2021 18:27:47 - INFO - __main__ - Step 18359: {'lr': 0.00019996793619315293, 'samples': 587488, 'steps': 1147, 'loss/train': 3.614849090576172} -09/20/2021 18:27:48 - INFO - __main__ - Step 18360: {'lr': 0.00019996793619315293, 'samples': 587520, 'steps': 1147, 'loss/train': 3.909310817718506} -09/20/2021 18:27:49 - INFO - __main__ - Step 18361: {'lr': 0.00019996793619315293, 'samples': 587552, 'steps': 1147, 'loss/train': 3.4909064769744873} -09/20/2021 18:27:49 - INFO - __main__ - Step 18362: {'lr': 0.00019996793619315293, 'samples': 587584, 'steps': 1147, 'loss/train': 3.296910047531128} -09/20/2021 18:27:50 - INFO - __main__ - Step 18363: {'lr': 0.00019996793619315293, 'samples': 587616, 'steps': 1147, 'loss/train': 3.295309066772461} -09/20/2021 18:27:51 - INFO - __main__ - Step 18364: {'lr': 0.00019996793619315293, 'samples': 587648, 'steps': 1147, 'loss/train': 3.532355785369873} -09/20/2021 18:27:52 - INFO - __main__ - Step 18365: {'lr': 0.00019996793619315293, 'samples': 587680, 'steps': 1147, 'loss/train': 3.383064031600952} -09/20/2021 18:27:52 - INFO - __main__ - Step 18366: {'lr': 0.00019996793619315293, 'samples': 587712, 'steps': 1147, 'loss/train': 3.2203867435455322} -09/20/2021 18:27:53 - INFO - __main__ - Step 18367: {'lr': 0.00019996793619315293, 'samples': 587744, 'steps': 1147, 'loss/train': 2.8564453125} -09/20/2021 18:27:54 - INFO - __main__ - Step 18368: {'lr': 0.00019996793619315293, 'samples': 587776, 'steps': 1147, 'loss/train': 3.812594175338745} -09/20/2021 18:27:55 - INFO - __main__ - Step 18369: {'lr': 0.00019996777446788807, 'samples': 587808, 'steps': 1148, 'loss/train': 3.2221028804779053} -09/20/2021 18:27:56 - INFO - __main__ - Step 18370: {'lr': 0.00019996777446788807, 'samples': 587840, 'steps': 1148, 'loss/train': 3.237929344177246} -09/20/2021 18:27:56 - INFO - __main__ - Step 18371: {'lr': 0.00019996777446788807, 'samples': 587872, 'steps': 1148, 'loss/train': 4.043534755706787} -09/20/2021 18:27:57 - INFO - __main__ - Step 18372: {'lr': 0.00019996777446788807, 'samples': 587904, 'steps': 1148, 'loss/train': 3.145009994506836} -09/20/2021 18:27:58 - INFO - __main__ - Step 18373: {'lr': 0.00019996777446788807, 'samples': 587936, 'steps': 1148, 'loss/train': 4.096659183502197} -09/20/2021 18:27:59 - INFO - __main__ - Step 18374: {'lr': 0.00019996777446788807, 'samples': 587968, 'steps': 1148, 'loss/train': 3.1836330890655518} -09/20/2021 18:27:59 - INFO - __main__ - Step 18375: {'lr': 0.00019996777446788807, 'samples': 588000, 'steps': 1148, 'loss/train': 3.720832109451294} -09/20/2021 18:28:00 - INFO - __main__ - Step 18376: {'lr': 0.00019996777446788807, 'samples': 588032, 'steps': 1148, 'loss/train': 3.6894001960754395} -09/20/2021 18:28:01 - INFO - __main__ - Step 18377: {'lr': 0.00019996777446788807, 'samples': 588064, 'steps': 1148, 'loss/train': 3.557692289352417} -09/20/2021 18:28:02 - INFO - __main__ - Step 18378: {'lr': 0.00019996777446788807, 'samples': 588096, 'steps': 1148, 'loss/train': 3.826233148574829} -09/20/2021 18:28:02 - INFO - __main__ - Step 18379: {'lr': 0.00019996777446788807, 'samples': 588128, 'steps': 1148, 'loss/train': 3.3309929370880127} -09/20/2021 18:28:03 - INFO - __main__ - Step 18380: {'lr': 0.00019996777446788807, 'samples': 588160, 'steps': 1148, 'loss/train': 4.7592644691467285} -09/20/2021 18:28:04 - INFO - __main__ - Step 18381: {'lr': 0.00019996777446788807, 'samples': 588192, 'steps': 1148, 'loss/train': 5.7361836433410645} -09/20/2021 18:28:05 - INFO - __main__ - Step 18382: {'lr': 0.00019996777446788807, 'samples': 588224, 'steps': 1148, 'loss/train': 4.089536190032959} -09/20/2021 18:28:05 - INFO - __main__ - Step 18383: {'lr': 0.00019996777446788807, 'samples': 588256, 'steps': 1148, 'loss/train': 4.0830607414245605} -09/20/2021 18:28:06 - INFO - __main__ - Step 18384: {'lr': 0.00019996777446788807, 'samples': 588288, 'steps': 1148, 'loss/train': 3.8402817249298096} -09/20/2021 18:28:08 - INFO - __main__ - Step 18385: {'lr': 0.00019996761233585474, 'samples': 588320, 'steps': 1149, 'loss/train': 3.3393735885620117} -09/20/2021 18:28:09 - INFO - __main__ - Step 18386: {'lr': 0.00019996761233585474, 'samples': 588352, 'steps': 1149, 'loss/train': 3.0898783206939697} -09/20/2021 18:28:10 - INFO - __main__ - Step 18387: {'lr': 0.00019996761233585474, 'samples': 588384, 'steps': 1149, 'loss/train': 3.7475223541259766} -09/20/2021 18:28:11 - INFO - __main__ - Step 18388: {'lr': 0.00019996761233585474, 'samples': 588416, 'steps': 1149, 'loss/train': 5.1907958984375} -09/20/2021 18:28:11 - INFO - __main__ - Step 18389: {'lr': 0.00019996761233585474, 'samples': 588448, 'steps': 1149, 'loss/train': 4.518326282501221} -09/20/2021 18:28:12 - INFO - __main__ - Step 18390: {'lr': 0.00019996761233585474, 'samples': 588480, 'steps': 1149, 'loss/train': 4.846612930297852} -09/20/2021 18:28:13 - INFO - __main__ - Step 18391: {'lr': 0.00019996761233585474, 'samples': 588512, 'steps': 1149, 'loss/train': 4.210780143737793} -09/20/2021 18:28:14 - INFO - __main__ - Step 18392: {'lr': 0.00019996761233585474, 'samples': 588544, 'steps': 1149, 'loss/train': 2.3165714740753174} -09/20/2021 18:28:14 - INFO - __main__ - Step 18393: {'lr': 0.00019996761233585474, 'samples': 588576, 'steps': 1149, 'loss/train': 4.519874572753906} -09/20/2021 18:28:15 - INFO - __main__ - Step 18394: {'lr': 0.00019996761233585474, 'samples': 588608, 'steps': 1149, 'loss/train': 2.783212900161743} -09/20/2021 18:28:16 - INFO - __main__ - Step 18395: {'lr': 0.00019996761233585474, 'samples': 588640, 'steps': 1149, 'loss/train': 3.739854574203491} -09/20/2021 18:28:17 - INFO - __main__ - Step 18396: {'lr': 0.00019996761233585474, 'samples': 588672, 'steps': 1149, 'loss/train': 2.4550392627716064} -09/20/2021 18:28:17 - INFO - __main__ - Step 18397: {'lr': 0.00019996761233585474, 'samples': 588704, 'steps': 1149, 'loss/train': 1.838032841682434} -09/20/2021 18:28:18 - INFO - __main__ - Step 18398: {'lr': 0.00019996761233585474, 'samples': 588736, 'steps': 1149, 'loss/train': 3.7350757122039795} -09/20/2021 18:28:19 - INFO - __main__ - Step 18399: {'lr': 0.00019996761233585474, 'samples': 588768, 'steps': 1149, 'loss/train': 2.6292288303375244} -09/20/2021 18:28:20 - INFO - __main__ - Step 18400: {'lr': 0.00019996761233585474, 'samples': 588800, 'steps': 1149, 'loss/train': 3.4132239818573} -09/20/2021 18:28:20 - INFO - __main__ - Step 18401: {'lr': 0.00019996744979705359, 'samples': 588832, 'steps': 1150, 'loss/train': 3.5192368030548096} -09/20/2021 18:28:21 - INFO - __main__ - Step 18402: {'lr': 0.00019996744979705359, 'samples': 588864, 'steps': 1150, 'loss/train': 4.111118793487549} -09/20/2021 18:28:22 - INFO - __main__ - Step 18403: {'lr': 0.00019996744979705359, 'samples': 588896, 'steps': 1150, 'loss/train': 3.169206380844116} -09/20/2021 18:28:23 - INFO - __main__ - Step 18404: {'lr': 0.00019996744979705359, 'samples': 588928, 'steps': 1150, 'loss/train': 4.43811559677124} -09/20/2021 18:28:23 - INFO - __main__ - Step 18405: {'lr': 0.00019996744979705359, 'samples': 588960, 'steps': 1150, 'loss/train': 3.855879068374634} -09/20/2021 18:28:24 - INFO - __main__ - Step 18406: {'lr': 0.00019996744979705359, 'samples': 588992, 'steps': 1150, 'loss/train': 3.3085098266601562} -09/20/2021 18:28:25 - INFO - __main__ - Step 18407: {'lr': 0.00019996744979705359, 'samples': 589024, 'steps': 1150, 'loss/train': 4.661348342895508} -09/20/2021 18:28:26 - INFO - __main__ - Step 18408: {'lr': 0.00019996744979705359, 'samples': 589056, 'steps': 1150, 'loss/train': 3.4540910720825195} -09/20/2021 18:28:26 - INFO - __main__ - Step 18409: {'lr': 0.00019996744979705359, 'samples': 589088, 'steps': 1150, 'loss/train': 3.302685499191284} -09/20/2021 18:28:27 - INFO - __main__ - Step 18410: {'lr': 0.00019996744979705359, 'samples': 589120, 'steps': 1150, 'loss/train': 3.6784794330596924} -09/20/2021 18:28:28 - INFO - __main__ - Step 18411: {'lr': 0.00019996744979705359, 'samples': 589152, 'steps': 1150, 'loss/train': 2.8895039558410645} -09/20/2021 18:28:29 - INFO - __main__ - Step 18412: {'lr': 0.00019996744979705359, 'samples': 589184, 'steps': 1150, 'loss/train': 3.365527391433716} -09/20/2021 18:28:29 - INFO - __main__ - Step 18413: {'lr': 0.00019996744979705359, 'samples': 589216, 'steps': 1150, 'loss/train': 2.7427115440368652} -09/20/2021 18:28:30 - INFO - __main__ - Step 18414: {'lr': 0.00019996744979705359, 'samples': 589248, 'steps': 1150, 'loss/train': 3.694776773452759} -09/20/2021 18:28:31 - INFO - __main__ - Step 18415: {'lr': 0.00019996744979705359, 'samples': 589280, 'steps': 1150, 'loss/train': 2.998936414718628} -09/20/2021 18:28:32 - INFO - __main__ - Step 18416: {'lr': 0.00019996744979705359, 'samples': 589312, 'steps': 1150, 'loss/train': 3.3434793949127197} -09/20/2021 18:28:33 - INFO - __main__ - Step 18417: {'lr': 0.00019996728685148525, 'samples': 589344, 'steps': 1151, 'loss/train': 2.9803543090820312} -09/20/2021 18:28:34 - INFO - __main__ - Step 18418: {'lr': 0.00019996728685148525, 'samples': 589376, 'steps': 1151, 'loss/train': 4.02128267288208} -09/20/2021 18:28:35 - INFO - __main__ - Step 18419: {'lr': 0.00019996728685148525, 'samples': 589408, 'steps': 1151, 'loss/train': 0.93584144115448} -09/20/2021 18:28:35 - INFO - __main__ - Step 18420: {'lr': 0.00019996728685148525, 'samples': 589440, 'steps': 1151, 'loss/train': 3.6501007080078125} -09/20/2021 18:28:36 - INFO - __main__ - Step 18421: {'lr': 0.00019996728685148525, 'samples': 589472, 'steps': 1151, 'loss/train': 3.2238869667053223} -09/20/2021 18:28:37 - INFO - __main__ - Step 18422: {'lr': 0.00019996728685148525, 'samples': 589504, 'steps': 1151, 'loss/train': 3.8729026317596436} -09/20/2021 18:28:38 - INFO - __main__ - Step 18423: {'lr': 0.00019996728685148525, 'samples': 589536, 'steps': 1151, 'loss/train': 4.620339393615723} -09/20/2021 18:28:38 - INFO - __main__ - Step 18424: {'lr': 0.00019996728685148525, 'samples': 589568, 'steps': 1151, 'loss/train': 3.603522300720215} -09/20/2021 18:28:39 - INFO - __main__ - Step 18425: {'lr': 0.00019996728685148525, 'samples': 589600, 'steps': 1151, 'loss/train': 3.233053207397461} -09/20/2021 18:28:40 - INFO - __main__ - Step 18426: {'lr': 0.00019996728685148525, 'samples': 589632, 'steps': 1151, 'loss/train': 3.171964645385742} -09/20/2021 18:28:41 - INFO - __main__ - Step 18427: {'lr': 0.00019996728685148525, 'samples': 589664, 'steps': 1151, 'loss/train': 3.841637134552002} -09/20/2021 18:28:41 - INFO - __main__ - Step 18428: {'lr': 0.00019996728685148525, 'samples': 589696, 'steps': 1151, 'loss/train': 3.9686763286590576} -09/20/2021 18:28:42 - INFO - __main__ - Step 18429: {'lr': 0.00019996728685148525, 'samples': 589728, 'steps': 1151, 'loss/train': 3.4457788467407227} -09/20/2021 18:28:43 - INFO - __main__ - Step 18430: {'lr': 0.00019996728685148525, 'samples': 589760, 'steps': 1151, 'loss/train': 4.190609455108643} -09/20/2021 18:28:44 - INFO - __main__ - Step 18431: {'lr': 0.00019996728685148525, 'samples': 589792, 'steps': 1151, 'loss/train': 5.0703935623168945} -09/20/2021 18:28:44 - INFO - __main__ - Step 18432: {'lr': 0.00019996728685148525, 'samples': 589824, 'steps': 1151, 'loss/train': 3.338040828704834} -09/20/2021 18:28:45 - INFO - __main__ - Step 18433: {'lr': 0.00019996712349915042, 'samples': 589856, 'steps': 1152, 'loss/train': 2.981430768966675} -09/20/2021 18:28:46 - INFO - __main__ - Step 18434: {'lr': 0.00019996712349915042, 'samples': 589888, 'steps': 1152, 'loss/train': 4.293620586395264} -09/20/2021 18:28:47 - INFO - __main__ - Step 18435: {'lr': 0.00019996712349915042, 'samples': 589920, 'steps': 1152, 'loss/train': 5.260980129241943} -09/20/2021 18:28:47 - INFO - __main__ - Step 18436: {'lr': 0.00019996712349915042, 'samples': 589952, 'steps': 1152, 'loss/train': 3.410430431365967} -09/20/2021 18:28:48 - INFO - __main__ - Step 18437: {'lr': 0.00019996712349915042, 'samples': 589984, 'steps': 1152, 'loss/train': 3.8099167346954346} -09/20/2021 18:28:49 - INFO - __main__ - Step 18438: {'lr': 0.00019996712349915042, 'samples': 590016, 'steps': 1152, 'loss/train': 3.394270896911621} -09/20/2021 18:28:50 - INFO - __main__ - Step 18439: {'lr': 0.00019996712349915042, 'samples': 590048, 'steps': 1152, 'loss/train': 3.284526824951172} -09/20/2021 18:28:50 - INFO - __main__ - Step 18440: {'lr': 0.00019996712349915042, 'samples': 590080, 'steps': 1152, 'loss/train': 3.603569984436035} -09/20/2021 18:28:51 - INFO - __main__ - Step 18441: {'lr': 0.00019996712349915042, 'samples': 590112, 'steps': 1152, 'loss/train': 4.2821946144104} -09/20/2021 18:28:52 - INFO - __main__ - Step 18442: {'lr': 0.00019996712349915042, 'samples': 590144, 'steps': 1152, 'loss/train': 3.9751217365264893} -09/20/2021 18:28:53 - INFO - __main__ - Step 18443: {'lr': 0.00019996712349915042, 'samples': 590176, 'steps': 1152, 'loss/train': 3.618475914001465} -09/20/2021 18:28:53 - INFO - __main__ - Step 18444: {'lr': 0.00019996712349915042, 'samples': 590208, 'steps': 1152, 'loss/train': 3.164395570755005} -09/20/2021 18:28:54 - INFO - __main__ - Step 18445: {'lr': 0.00019996712349915042, 'samples': 590240, 'steps': 1152, 'loss/train': 3.222933053970337} -09/20/2021 18:28:55 - INFO - __main__ - Step 18446: {'lr': 0.00019996712349915042, 'samples': 590272, 'steps': 1152, 'loss/train': 6.3909831047058105} -09/20/2021 18:28:56 - INFO - __main__ - Step 18447: {'lr': 0.00019996712349915042, 'samples': 590304, 'steps': 1152, 'loss/train': 4.085574626922607} -09/20/2021 18:28:57 - INFO - __main__ - Step 18448: {'lr': 0.00019996712349915042, 'samples': 590336, 'steps': 1152, 'loss/train': 3.4577155113220215} -09/20/2021 18:28:58 - INFO - __main__ - Step 18449: {'lr': 0.00019996695974004976, 'samples': 590368, 'steps': 1153, 'loss/train': 3.3736202716827393} -09/20/2021 18:28:59 - INFO - __main__ - Step 18450: {'lr': 0.00019996695974004976, 'samples': 590400, 'steps': 1153, 'loss/train': 4.488822937011719} -09/20/2021 18:29:00 - INFO - __main__ - Step 18451: {'lr': 0.00019996695974004976, 'samples': 590432, 'steps': 1153, 'loss/train': 3.1110002994537354} -09/20/2021 18:29:00 - INFO - __main__ - Step 18452: {'lr': 0.00019996695974004976, 'samples': 590464, 'steps': 1153, 'loss/train': 3.196200132369995} -09/20/2021 18:29:01 - INFO - __main__ - Step 18453: {'lr': 0.00019996695974004976, 'samples': 590496, 'steps': 1153, 'loss/train': 3.6725809574127197} -09/20/2021 18:29:02 - INFO - __main__ - Step 18454: {'lr': 0.00019996695974004976, 'samples': 590528, 'steps': 1153, 'loss/train': 1.229838252067566} -09/20/2021 18:29:03 - INFO - __main__ - Step 18455: {'lr': 0.00019996695974004976, 'samples': 590560, 'steps': 1153, 'loss/train': 1.0923305749893188} -09/20/2021 18:29:03 - INFO - __main__ - Step 18456: {'lr': 0.00019996695974004976, 'samples': 590592, 'steps': 1153, 'loss/train': 0.6989896297454834} -09/20/2021 18:29:04 - INFO - __main__ - Step 18457: {'lr': 0.00019996695974004976, 'samples': 590624, 'steps': 1153, 'loss/train': 4.267725944519043} -09/20/2021 18:29:05 - INFO - __main__ - Step 18458: {'lr': 0.00019996695974004976, 'samples': 590656, 'steps': 1153, 'loss/train': 3.6273834705352783} -09/20/2021 18:29:06 - INFO - __main__ - Step 18459: {'lr': 0.00019996695974004976, 'samples': 590688, 'steps': 1153, 'loss/train': 2.8559107780456543} -09/20/2021 18:29:06 - INFO - __main__ - Step 18460: {'lr': 0.00019996695974004976, 'samples': 590720, 'steps': 1153, 'loss/train': 2.693218946456909} -09/20/2021 18:29:07 - INFO - __main__ - Step 18461: {'lr': 0.00019996695974004976, 'samples': 590752, 'steps': 1153, 'loss/train': 3.3945391178131104} -09/20/2021 18:29:08 - INFO - __main__ - Step 18462: {'lr': 0.00019996695974004976, 'samples': 590784, 'steps': 1153, 'loss/train': 5.089469909667969} -09/20/2021 18:29:09 - INFO - __main__ - Step 18463: {'lr': 0.00019996695974004976, 'samples': 590816, 'steps': 1153, 'loss/train': 4.420598983764648} -09/20/2021 18:29:09 - INFO - __main__ - Step 18464: {'lr': 0.00019996695974004976, 'samples': 590848, 'steps': 1153, 'loss/train': 4.527469158172607} -09/20/2021 18:29:10 - INFO - __main__ - Step 18465: {'lr': 0.00019996679557418389, 'samples': 590880, 'steps': 1154, 'loss/train': 3.9820985794067383} -09/20/2021 18:29:11 - INFO - __main__ - Step 18466: {'lr': 0.00019996679557418389, 'samples': 590912, 'steps': 1154, 'loss/train': 3.2256217002868652} -09/20/2021 18:29:12 - INFO - __main__ - Step 18467: {'lr': 0.00019996679557418389, 'samples': 590944, 'steps': 1154, 'loss/train': 4.027629852294922} -09/20/2021 18:29:12 - INFO - __main__ - Step 18468: {'lr': 0.00019996679557418389, 'samples': 590976, 'steps': 1154, 'loss/train': 4.133683204650879} -09/20/2021 18:29:13 - INFO - __main__ - Step 18469: {'lr': 0.00019996679557418389, 'samples': 591008, 'steps': 1154, 'loss/train': 3.8432676792144775} -09/20/2021 18:29:14 - INFO - __main__ - Step 18470: {'lr': 0.00019996679557418389, 'samples': 591040, 'steps': 1154, 'loss/train': 5.199997425079346} -09/20/2021 18:29:15 - INFO - __main__ - Step 18471: {'lr': 0.00019996679557418389, 'samples': 591072, 'steps': 1154, 'loss/train': 4.387959957122803} -09/20/2021 18:29:15 - INFO - __main__ - Step 18472: {'lr': 0.00019996679557418389, 'samples': 591104, 'steps': 1154, 'loss/train': 3.7934439182281494} -09/20/2021 18:29:16 - INFO - __main__ - Step 18473: {'lr': 0.00019996679557418389, 'samples': 591136, 'steps': 1154, 'loss/train': 4.58779764175415} -09/20/2021 18:29:17 - INFO - __main__ - Step 18474: {'lr': 0.00019996679557418389, 'samples': 591168, 'steps': 1154, 'loss/train': 3.8204586505889893} -09/20/2021 18:29:18 - INFO - __main__ - Step 18475: {'lr': 0.00019996679557418389, 'samples': 591200, 'steps': 1154, 'loss/train': 3.777127265930176} -09/20/2021 18:29:18 - INFO - __main__ - Step 18476: {'lr': 0.00019996679557418389, 'samples': 591232, 'steps': 1154, 'loss/train': 2.9560763835906982} -09/20/2021 18:29:19 - INFO - __main__ - Step 18477: {'lr': 0.00019996679557418389, 'samples': 591264, 'steps': 1154, 'loss/train': 2.95621919631958} -09/20/2021 18:29:20 - INFO - __main__ - Step 18478: {'lr': 0.00019996679557418389, 'samples': 591296, 'steps': 1154, 'loss/train': 2.981111764907837} -09/20/2021 18:29:21 - INFO - __main__ - Step 18479: {'lr': 0.00019996679557418389, 'samples': 591328, 'steps': 1154, 'loss/train': 3.391630172729492} -09/20/2021 18:29:21 - INFO - __main__ - Step 18480: {'lr': 0.00019996679557418389, 'samples': 591360, 'steps': 1154, 'loss/train': 3.4792211055755615} -09/20/2021 18:29:22 - INFO - __main__ - Step 18481: {'lr': 0.00019996663100155354, 'samples': 591392, 'steps': 1155, 'loss/train': 5.287483215332031} -09/20/2021 18:29:24 - INFO - __main__ - Step 18482: {'lr': 0.00019996663100155354, 'samples': 591424, 'steps': 1155, 'loss/train': 2.8727829456329346} -09/20/2021 18:29:24 - INFO - __main__ - Step 18483: {'lr': 0.00019996663100155354, 'samples': 591456, 'steps': 1155, 'loss/train': 3.87906551361084} -09/20/2021 18:29:25 - INFO - __main__ - Step 18484: {'lr': 0.00019996663100155354, 'samples': 591488, 'steps': 1155, 'loss/train': 3.736055374145508} -09/20/2021 18:29:26 - INFO - __main__ - Step 18485: {'lr': 0.00019996663100155354, 'samples': 591520, 'steps': 1155, 'loss/train': 3.148317575454712} -09/20/2021 18:29:27 - INFO - __main__ - Step 18486: {'lr': 0.00019996663100155354, 'samples': 591552, 'steps': 1155, 'loss/train': 4.0009965896606445} -09/20/2021 18:29:27 - INFO - __main__ - Step 18487: {'lr': 0.00019996663100155354, 'samples': 591584, 'steps': 1155, 'loss/train': 2.927666664123535} -09/20/2021 18:29:28 - INFO - __main__ - Step 18488: {'lr': 0.00019996663100155354, 'samples': 591616, 'steps': 1155, 'loss/train': 6.416672229766846} -09/20/2021 18:29:29 - INFO - __main__ - Step 18489: {'lr': 0.00019996663100155354, 'samples': 591648, 'steps': 1155, 'loss/train': 2.56744647026062} -09/20/2021 18:29:30 - INFO - __main__ - Step 18490: {'lr': 0.00019996663100155354, 'samples': 591680, 'steps': 1155, 'loss/train': 3.207505941390991} -09/20/2021 18:29:30 - INFO - __main__ - Step 18491: {'lr': 0.00019996663100155354, 'samples': 591712, 'steps': 1155, 'loss/train': 2.839341878890991} -09/20/2021 18:29:31 - INFO - __main__ - Step 18492: {'lr': 0.00019996663100155354, 'samples': 591744, 'steps': 1155, 'loss/train': 3.368231773376465} -09/20/2021 18:29:32 - INFO - __main__ - Step 18493: {'lr': 0.00019996663100155354, 'samples': 591776, 'steps': 1155, 'loss/train': 3.5130090713500977} -09/20/2021 18:29:33 - INFO - __main__ - Step 18494: {'lr': 0.00019996663100155354, 'samples': 591808, 'steps': 1155, 'loss/train': 3.9668807983398438} -09/20/2021 18:29:33 - INFO - __main__ - Step 18495: {'lr': 0.00019996663100155354, 'samples': 591840, 'steps': 1155, 'loss/train': 3.4576802253723145} -09/20/2021 18:29:34 - INFO - __main__ - Step 18496: {'lr': 0.00019996663100155354, 'samples': 591872, 'steps': 1155, 'loss/train': 4.4434943199157715} -09/20/2021 18:29:35 - INFO - __main__ - Step 18497: {'lr': 0.00019996646602215936, 'samples': 591904, 'steps': 1156, 'loss/train': 3.7169106006622314} -09/20/2021 18:29:36 - INFO - __main__ - Step 18498: {'lr': 0.00019996646602215936, 'samples': 591936, 'steps': 1156, 'loss/train': 2.980928659439087} -09/20/2021 18:29:36 - INFO - __main__ - Step 18499: {'lr': 0.00019996646602215936, 'samples': 591968, 'steps': 1156, 'loss/train': 3.6150498390197754} -09/20/2021 18:29:37 - INFO - __main__ - Step 18500: {'lr': 0.00019996646602215936, 'samples': 592000, 'steps': 1156, 'loss/train': 3.177990436553955} -09/20/2021 18:29:38 - INFO - __main__ - Step 18501: {'lr': 0.00019996646602215936, 'samples': 592032, 'steps': 1156, 'loss/train': 3.9358599185943604} -09/20/2021 18:29:39 - INFO - __main__ - Step 18502: {'lr': 0.00019996646602215936, 'samples': 592064, 'steps': 1156, 'loss/train': 3.313739538192749} -09/20/2021 18:29:39 - INFO - __main__ - Step 18503: {'lr': 0.00019996646602215936, 'samples': 592096, 'steps': 1156, 'loss/train': 3.175783157348633} -09/20/2021 18:29:40 - INFO - __main__ - Step 18504: {'lr': 0.00019996646602215936, 'samples': 592128, 'steps': 1156, 'loss/train': 3.5438990592956543} -09/20/2021 18:29:41 - INFO - __main__ - Step 18505: {'lr': 0.00019996646602215936, 'samples': 592160, 'steps': 1156, 'loss/train': 2.897888422012329} -09/20/2021 18:29:42 - INFO - __main__ - Step 18506: {'lr': 0.00019996646602215936, 'samples': 592192, 'steps': 1156, 'loss/train': 4.335313320159912} -09/20/2021 18:29:42 - INFO - __main__ - Step 18507: {'lr': 0.00019996646602215936, 'samples': 592224, 'steps': 1156, 'loss/train': 4.588051795959473} -09/20/2021 18:29:43 - INFO - __main__ - Step 18508: {'lr': 0.00019996646602215936, 'samples': 592256, 'steps': 1156, 'loss/train': 3.9132165908813477} -09/20/2021 18:29:44 - INFO - __main__ - Step 18509: {'lr': 0.00019996646602215936, 'samples': 592288, 'steps': 1156, 'loss/train': 3.7932944297790527} -09/20/2021 18:29:45 - INFO - __main__ - Step 18510: {'lr': 0.00019996646602215936, 'samples': 592320, 'steps': 1156, 'loss/train': 3.2975480556488037} -09/20/2021 18:29:45 - INFO - __main__ - Step 18511: {'lr': 0.00019996646602215936, 'samples': 592352, 'steps': 1156, 'loss/train': 3.5770022869110107} -09/20/2021 18:29:46 - INFO - __main__ - Step 18512: {'lr': 0.00019996646602215936, 'samples': 592384, 'steps': 1156, 'loss/train': 3.3502721786499023} -09/20/2021 18:29:48 - INFO - __main__ - Step 18513: {'lr': 0.000199966300636002, 'samples': 592416, 'steps': 1157, 'loss/train': 3.973088264465332} -09/20/2021 18:29:48 - INFO - __main__ - Step 18514: {'lr': 0.000199966300636002, 'samples': 592448, 'steps': 1157, 'loss/train': 3.0993294715881348} -09/20/2021 18:29:49 - INFO - __main__ - Step 18515: {'lr': 0.000199966300636002, 'samples': 592480, 'steps': 1157, 'loss/train': 3.9324474334716797} -09/20/2021 18:29:50 - INFO - __main__ - Step 18516: {'lr': 0.000199966300636002, 'samples': 592512, 'steps': 1157, 'loss/train': 3.5313124656677246} -09/20/2021 18:29:51 - INFO - __main__ - Step 18517: {'lr': 0.000199966300636002, 'samples': 592544, 'steps': 1157, 'loss/train': 4.150820732116699} -09/20/2021 18:29:51 - INFO - __main__ - Step 18518: {'lr': 0.000199966300636002, 'samples': 592576, 'steps': 1157, 'loss/train': 3.5943663120269775} -09/20/2021 18:29:52 - INFO - __main__ - Step 18519: {'lr': 0.000199966300636002, 'samples': 592608, 'steps': 1157, 'loss/train': 4.379824161529541} -09/20/2021 18:29:53 - INFO - __main__ - Step 18520: {'lr': 0.000199966300636002, 'samples': 592640, 'steps': 1157, 'loss/train': 3.4072213172912598} -09/20/2021 18:29:54 - INFO - __main__ - Step 18521: {'lr': 0.000199966300636002, 'samples': 592672, 'steps': 1157, 'loss/train': 3.22731876373291} -09/20/2021 18:29:54 - INFO - __main__ - Step 18522: {'lr': 0.000199966300636002, 'samples': 592704, 'steps': 1157, 'loss/train': 1.5676709413528442} -09/20/2021 18:29:55 - INFO - __main__ - Step 18523: {'lr': 0.000199966300636002, 'samples': 592736, 'steps': 1157, 'loss/train': 4.264307498931885} -09/20/2021 18:29:56 - INFO - __main__ - Step 18524: {'lr': 0.000199966300636002, 'samples': 592768, 'steps': 1157, 'loss/train': 3.993363380432129} -09/20/2021 18:29:57 - INFO - __main__ - Step 18525: {'lr': 0.000199966300636002, 'samples': 592800, 'steps': 1157, 'loss/train': 1.1972403526306152} -09/20/2021 18:29:57 - INFO - __main__ - Step 18526: {'lr': 0.000199966300636002, 'samples': 592832, 'steps': 1157, 'loss/train': 0.7209340929985046} -09/20/2021 18:29:58 - INFO - __main__ - Step 18527: {'lr': 0.000199966300636002, 'samples': 592864, 'steps': 1157, 'loss/train': 2.072188377380371} -09/20/2021 18:29:59 - INFO - __main__ - Step 18528: {'lr': 0.000199966300636002, 'samples': 592896, 'steps': 1157, 'loss/train': 2.950120687484741} -09/20/2021 18:30:00 - INFO - __main__ - Step 18529: {'lr': 0.0001999661348430822, 'samples': 592928, 'steps': 1158, 'loss/train': 3.8668503761291504} -09/20/2021 18:30:01 - INFO - __main__ - Step 18530: {'lr': 0.0001999661348430822, 'samples': 592960, 'steps': 1158, 'loss/train': 3.241535186767578} -09/20/2021 18:30:01 - INFO - __main__ - Step 18531: {'lr': 0.0001999661348430822, 'samples': 592992, 'steps': 1158, 'loss/train': 2.503786563873291} -09/20/2021 18:30:02 - INFO - __main__ - Step 18532: {'lr': 0.0001999661348430822, 'samples': 593024, 'steps': 1158, 'loss/train': 3.271251678466797} -09/20/2021 18:30:03 - INFO - __main__ - Step 18533: {'lr': 0.0001999661348430822, 'samples': 593056, 'steps': 1158, 'loss/train': 4.19276762008667} -09/20/2021 18:30:04 - INFO - __main__ - Step 18534: {'lr': 0.0001999661348430822, 'samples': 593088, 'steps': 1158, 'loss/train': 4.014648914337158} -09/20/2021 18:30:04 - INFO - __main__ - Step 18535: {'lr': 0.0001999661348430822, 'samples': 593120, 'steps': 1158, 'loss/train': 3.531628370285034} -09/20/2021 18:30:05 - INFO - __main__ - Step 18536: {'lr': 0.0001999661348430822, 'samples': 593152, 'steps': 1158, 'loss/train': 2.626142978668213} -09/20/2021 18:30:06 - INFO - __main__ - Step 18537: {'lr': 0.0001999661348430822, 'samples': 593184, 'steps': 1158, 'loss/train': 1.466296911239624} -09/20/2021 18:30:07 - INFO - __main__ - Step 18538: {'lr': 0.0001999661348430822, 'samples': 593216, 'steps': 1158, 'loss/train': 3.02177357673645} -09/20/2021 18:30:07 - INFO - __main__ - Step 18539: {'lr': 0.0001999661348430822, 'samples': 593248, 'steps': 1158, 'loss/train': 2.839354991912842} -09/20/2021 18:30:08 - INFO - __main__ - Step 18540: {'lr': 0.0001999661348430822, 'samples': 593280, 'steps': 1158, 'loss/train': 3.074922800064087} -09/20/2021 18:30:09 - INFO - __main__ - Step 18541: {'lr': 0.0001999661348430822, 'samples': 593312, 'steps': 1158, 'loss/train': 4.17515754699707} -09/20/2021 18:30:10 - INFO - __main__ - Step 18542: {'lr': 0.0001999661348430822, 'samples': 593344, 'steps': 1158, 'loss/train': 2.5118465423583984} -09/20/2021 18:30:11 - INFO - __main__ - Step 18543: {'lr': 0.0001999661348430822, 'samples': 593376, 'steps': 1158, 'loss/train': 3.8660695552825928} -09/20/2021 18:30:12 - INFO - __main__ - Step 18544: {'lr': 0.0001999661348430822, 'samples': 593408, 'steps': 1158, 'loss/train': 3.1912524700164795} -09/20/2021 18:30:13 - INFO - __main__ - Step 18545: {'lr': 0.00019996596864340057, 'samples': 593440, 'steps': 1159, 'loss/train': 4.210961818695068} -09/20/2021 18:30:13 - INFO - __main__ - Step 18546: {'lr': 0.00019996596864340057, 'samples': 593472, 'steps': 1159, 'loss/train': 3.7860398292541504} -09/20/2021 18:30:14 - INFO - __main__ - Step 18547: {'lr': 0.00019996596864340057, 'samples': 593504, 'steps': 1159, 'loss/train': 3.3061978816986084} -09/20/2021 18:30:15 - INFO - __main__ - Step 18548: {'lr': 0.00019996596864340057, 'samples': 593536, 'steps': 1159, 'loss/train': 4.10439920425415} -09/20/2021 18:30:16 - INFO - __main__ - Step 18549: {'lr': 0.00019996596864340057, 'samples': 593568, 'steps': 1159, 'loss/train': 4.001542568206787} -09/20/2021 18:30:16 - INFO - __main__ - Step 18550: {'lr': 0.00019996596864340057, 'samples': 593600, 'steps': 1159, 'loss/train': 2.497584581375122} -09/20/2021 18:30:17 - INFO - __main__ - Step 18551: {'lr': 0.00019996596864340057, 'samples': 593632, 'steps': 1159, 'loss/train': 3.5240137577056885} -09/20/2021 18:30:18 - INFO - __main__ - Step 18552: {'lr': 0.00019996596864340057, 'samples': 593664, 'steps': 1159, 'loss/train': 5.083647727966309} -09/20/2021 18:30:19 - INFO - __main__ - Step 18553: {'lr': 0.00019996596864340057, 'samples': 593696, 'steps': 1159, 'loss/train': 3.8577654361724854} -09/20/2021 18:30:19 - INFO - __main__ - Step 18554: {'lr': 0.00019996596864340057, 'samples': 593728, 'steps': 1159, 'loss/train': 3.5251903533935547} -09/20/2021 18:30:20 - INFO - __main__ - Step 18555: {'lr': 0.00019996596864340057, 'samples': 593760, 'steps': 1159, 'loss/train': 4.066348075866699} -09/20/2021 18:30:21 - INFO - __main__ - Step 18556: {'lr': 0.00019996596864340057, 'samples': 593792, 'steps': 1159, 'loss/train': 3.47861385345459} -09/20/2021 18:30:22 - INFO - __main__ - Step 18557: {'lr': 0.00019996596864340057, 'samples': 593824, 'steps': 1159, 'loss/train': 3.6331193447113037} -09/20/2021 18:30:22 - INFO - __main__ - Step 18558: {'lr': 0.00019996596864340057, 'samples': 593856, 'steps': 1159, 'loss/train': 3.174726963043213} -09/20/2021 18:30:23 - INFO - __main__ - Step 18559: {'lr': 0.00019996596864340057, 'samples': 593888, 'steps': 1159, 'loss/train': 3.1469223499298096} -09/20/2021 18:30:24 - INFO - __main__ - Step 18560: {'lr': 0.00019996596864340057, 'samples': 593920, 'steps': 1159, 'loss/train': 2.6643967628479004} -09/20/2021 18:30:25 - INFO - __main__ - Step 18561: {'lr': 0.0001999658020369578, 'samples': 593952, 'steps': 1160, 'loss/train': 4.037891387939453} -09/20/2021 18:30:25 - INFO - __main__ - Step 18562: {'lr': 0.0001999658020369578, 'samples': 593984, 'steps': 1160, 'loss/train': 3.473358154296875} -09/20/2021 18:30:26 - INFO - __main__ - Step 18563: {'lr': 0.0001999658020369578, 'samples': 594016, 'steps': 1160, 'loss/train': 3.4503419399261475} -09/20/2021 18:30:27 - INFO - __main__ - Step 18564: {'lr': 0.0001999658020369578, 'samples': 594048, 'steps': 1160, 'loss/train': 1.7801823616027832} -09/20/2021 18:30:28 - INFO - __main__ - Step 18565: {'lr': 0.0001999658020369578, 'samples': 594080, 'steps': 1160, 'loss/train': 3.361532688140869} -09/20/2021 18:30:28 - INFO - __main__ - Step 18566: {'lr': 0.0001999658020369578, 'samples': 594112, 'steps': 1160, 'loss/train': 4.238938808441162} -09/20/2021 18:30:29 - INFO - __main__ - Step 18567: {'lr': 0.0001999658020369578, 'samples': 594144, 'steps': 1160, 'loss/train': 3.3510143756866455} -09/20/2021 18:30:30 - INFO - __main__ - Step 18568: {'lr': 0.0001999658020369578, 'samples': 594176, 'steps': 1160, 'loss/train': 2.9811127185821533} -09/20/2021 18:30:31 - INFO - __main__ - Step 18569: {'lr': 0.0001999658020369578, 'samples': 594208, 'steps': 1160, 'loss/train': 3.0485966205596924} -09/20/2021 18:30:31 - INFO - __main__ - Step 18570: {'lr': 0.0001999658020369578, 'samples': 594240, 'steps': 1160, 'loss/train': 3.5584707260131836} -09/20/2021 18:30:32 - INFO - __main__ - Step 18571: {'lr': 0.0001999658020369578, 'samples': 594272, 'steps': 1160, 'loss/train': 3.3330636024475098} -09/20/2021 18:30:33 - INFO - __main__ - Step 18572: {'lr': 0.0001999658020369578, 'samples': 594304, 'steps': 1160, 'loss/train': 3.173550844192505} -09/20/2021 18:30:34 - INFO - __main__ - Step 18573: {'lr': 0.0001999658020369578, 'samples': 594336, 'steps': 1160, 'loss/train': 4.285415172576904} -09/20/2021 18:30:35 - INFO - __main__ - Step 18574: {'lr': 0.0001999658020369578, 'samples': 594368, 'steps': 1160, 'loss/train': 3.897481679916382} -09/20/2021 18:30:36 - INFO - __main__ - Step 18575: {'lr': 0.0001999658020369578, 'samples': 594400, 'steps': 1160, 'loss/train': 3.7737338542938232} -09/20/2021 18:30:37 - INFO - __main__ - Step 18576: {'lr': 0.0001999658020369578, 'samples': 594432, 'steps': 1160, 'loss/train': 3.1547625064849854} -09/20/2021 18:30:37 - INFO - __main__ - Step 18577: {'lr': 0.00019996563502375453, 'samples': 594464, 'steps': 1161, 'loss/train': 3.9324164390563965} -09/20/2021 18:30:38 - INFO - __main__ - Step 18578: {'lr': 0.00019996563502375453, 'samples': 594496, 'steps': 1161, 'loss/train': 4.1918182373046875} -09/20/2021 18:30:39 - INFO - __main__ - Step 18579: {'lr': 0.00019996563502375453, 'samples': 594528, 'steps': 1161, 'loss/train': 4.553349494934082} -09/20/2021 18:30:40 - INFO - __main__ - Step 18580: {'lr': 0.00019996563502375453, 'samples': 594560, 'steps': 1161, 'loss/train': 3.9406769275665283} -09/20/2021 18:30:40 - INFO - __main__ - Step 18581: {'lr': 0.00019996563502375453, 'samples': 594592, 'steps': 1161, 'loss/train': 3.0588746070861816} -09/20/2021 18:30:41 - INFO - __main__ - Step 18582: {'lr': 0.00019996563502375453, 'samples': 594624, 'steps': 1161, 'loss/train': 3.2645275592803955} -09/20/2021 18:30:42 - INFO - __main__ - Step 18583: {'lr': 0.00019996563502375453, 'samples': 594656, 'steps': 1161, 'loss/train': 3.389859914779663} -09/20/2021 18:30:43 - INFO - __main__ - Step 18584: {'lr': 0.00019996563502375453, 'samples': 594688, 'steps': 1161, 'loss/train': 2.3208014965057373} -09/20/2021 18:30:43 - INFO - __main__ - Step 18585: {'lr': 0.00019996563502375453, 'samples': 594720, 'steps': 1161, 'loss/train': 2.945779800415039} -09/20/2021 18:30:44 - INFO - __main__ - Step 18586: {'lr': 0.00019996563502375453, 'samples': 594752, 'steps': 1161, 'loss/train': 2.033367872238159} -09/20/2021 18:30:45 - INFO - __main__ - Step 18587: {'lr': 0.00019996563502375453, 'samples': 594784, 'steps': 1161, 'loss/train': 2.084428310394287} -09/20/2021 18:30:46 - INFO - __main__ - Step 18588: {'lr': 0.00019996563502375453, 'samples': 594816, 'steps': 1161, 'loss/train': 3.0694541931152344} -09/20/2021 18:30:46 - INFO - __main__ - Step 18589: {'lr': 0.00019996563502375453, 'samples': 594848, 'steps': 1161, 'loss/train': 3.658730983734131} -09/20/2021 18:30:47 - INFO - __main__ - Step 18590: {'lr': 0.00019996563502375453, 'samples': 594880, 'steps': 1161, 'loss/train': 1.0901384353637695} -09/20/2021 18:30:48 - INFO - __main__ - Step 18591: {'lr': 0.00019996563502375453, 'samples': 594912, 'steps': 1161, 'loss/train': 3.624016284942627} -09/20/2021 18:30:49 - INFO - __main__ - Step 18592: {'lr': 0.00019996563502375453, 'samples': 594944, 'steps': 1161, 'loss/train': 3.792804479598999} -09/20/2021 18:30:50 - INFO - __main__ - Step 18593: {'lr': 0.00019996546760379152, 'samples': 594976, 'steps': 1162, 'loss/train': 2.733832359313965} -09/20/2021 18:30:50 - INFO - __main__ - Step 18594: {'lr': 0.00019996546760379152, 'samples': 595008, 'steps': 1162, 'loss/train': 4.30032205581665} -09/20/2021 18:30:51 - INFO - __main__ - Step 18595: {'lr': 0.00019996546760379152, 'samples': 595040, 'steps': 1162, 'loss/train': 3.124224901199341} -09/20/2021 18:30:52 - INFO - __main__ - Step 18596: {'lr': 0.00019996546760379152, 'samples': 595072, 'steps': 1162, 'loss/train': 3.3471529483795166} -09/20/2021 18:30:53 - INFO - __main__ - Step 18597: {'lr': 0.00019996546760379152, 'samples': 595104, 'steps': 1162, 'loss/train': 4.104918479919434} -09/20/2021 18:30:53 - INFO - __main__ - Step 18598: {'lr': 0.00019996546760379152, 'samples': 595136, 'steps': 1162, 'loss/train': 3.5278234481811523} -09/20/2021 18:30:54 - INFO - __main__ - Step 18599: {'lr': 0.00019996546760379152, 'samples': 595168, 'steps': 1162, 'loss/train': 3.4928510189056396} -09/20/2021 18:30:55 - INFO - __main__ - Step 18600: {'lr': 0.00019996546760379152, 'samples': 595200, 'steps': 1162, 'loss/train': 3.0978338718414307} -09/20/2021 18:30:56 - INFO - __main__ - Step 18601: {'lr': 0.00019996546760379152, 'samples': 595232, 'steps': 1162, 'loss/train': 4.044213771820068} -09/20/2021 18:30:56 - INFO - __main__ - Step 18602: {'lr': 0.00019996546760379152, 'samples': 595264, 'steps': 1162, 'loss/train': 2.97098445892334} -09/20/2021 18:30:57 - INFO - __main__ - Step 18603: {'lr': 0.00019996546760379152, 'samples': 595296, 'steps': 1162, 'loss/train': 4.986639976501465} -09/20/2021 18:30:58 - INFO - __main__ - Step 18604: {'lr': 0.00019996546760379152, 'samples': 595328, 'steps': 1162, 'loss/train': 3.691101312637329} -09/20/2021 18:30:59 - INFO - __main__ - Step 18605: {'lr': 0.00019996546760379152, 'samples': 595360, 'steps': 1162, 'loss/train': 0.8895689845085144} -09/20/2021 18:31:00 - INFO - __main__ - Step 18606: {'lr': 0.00019996546760379152, 'samples': 595392, 'steps': 1162, 'loss/train': 0.8422407507896423} -09/20/2021 18:31:01 - INFO - __main__ - Step 18607: {'lr': 0.00019996546760379152, 'samples': 595424, 'steps': 1162, 'loss/train': 3.7313311100006104} -09/20/2021 18:31:01 - INFO - __main__ - Step 18608: {'lr': 0.00019996546760379152, 'samples': 595456, 'steps': 1162, 'loss/train': 3.8779168128967285} -09/20/2021 18:31:02 - INFO - __main__ - Step 18609: {'lr': 0.00019996529977706938, 'samples': 595488, 'steps': 1163, 'loss/train': 3.1717700958251953} -09/20/2021 18:31:03 - INFO - __main__ - Step 18610: {'lr': 0.00019996529977706938, 'samples': 595520, 'steps': 1163, 'loss/train': 3.571399688720703} -09/20/2021 18:31:04 - INFO - __main__ - Step 18611: {'lr': 0.00019996529977706938, 'samples': 595552, 'steps': 1163, 'loss/train': 2.7684268951416016} -09/20/2021 18:31:04 - INFO - __main__ - Step 18612: {'lr': 0.00019996529977706938, 'samples': 595584, 'steps': 1163, 'loss/train': 3.5696887969970703} -09/20/2021 18:31:05 - INFO - __main__ - Step 18613: {'lr': 0.00019996529977706938, 'samples': 595616, 'steps': 1163, 'loss/train': 3.8695108890533447} -09/20/2021 18:31:06 - INFO - __main__ - Step 18614: {'lr': 0.00019996529977706938, 'samples': 595648, 'steps': 1163, 'loss/train': 2.6892058849334717} -09/20/2021 18:31:07 - INFO - __main__ - Step 18615: {'lr': 0.00019996529977706938, 'samples': 595680, 'steps': 1163, 'loss/train': 3.969377040863037} -09/20/2021 18:31:07 - INFO - __main__ - Step 18616: {'lr': 0.00019996529977706938, 'samples': 595712, 'steps': 1163, 'loss/train': 3.4669430255889893} -09/20/2021 18:31:08 - INFO - __main__ - Step 18617: {'lr': 0.00019996529977706938, 'samples': 595744, 'steps': 1163, 'loss/train': 4.16294527053833} -09/20/2021 18:31:09 - INFO - __main__ - Step 18618: {'lr': 0.00019996529977706938, 'samples': 595776, 'steps': 1163, 'loss/train': 4.005825519561768} -09/20/2021 18:31:10 - INFO - __main__ - Step 18619: {'lr': 0.00019996529977706938, 'samples': 595808, 'steps': 1163, 'loss/train': 5.3734354972839355} -09/20/2021 18:31:10 - INFO - __main__ - Step 18620: {'lr': 0.00019996529977706938, 'samples': 595840, 'steps': 1163, 'loss/train': 4.259251594543457} -09/20/2021 18:31:11 - INFO - __main__ - Step 18621: {'lr': 0.00019996529977706938, 'samples': 595872, 'steps': 1163, 'loss/train': 4.160429000854492} -09/20/2021 18:31:12 - INFO - __main__ - Step 18622: {'lr': 0.00019996529977706938, 'samples': 595904, 'steps': 1163, 'loss/train': 3.35807728767395} -09/20/2021 18:31:13 - INFO - __main__ - Step 18623: {'lr': 0.00019996529977706938, 'samples': 595936, 'steps': 1163, 'loss/train': 3.132861614227295} -09/20/2021 18:31:13 - INFO - __main__ - Step 18624: {'lr': 0.00019996529977706938, 'samples': 595968, 'steps': 1163, 'loss/train': 4.481943607330322} -09/20/2021 18:31:14 - INFO - __main__ - Step 18625: {'lr': 0.00019996513154358882, 'samples': 596000, 'steps': 1164, 'loss/train': 4.575099468231201} -09/20/2021 18:31:15 - INFO - __main__ - Step 18626: {'lr': 0.00019996513154358882, 'samples': 596032, 'steps': 1164, 'loss/train': 3.3168890476226807} -09/20/2021 18:31:16 - INFO - __main__ - Step 18627: {'lr': 0.00019996513154358882, 'samples': 596064, 'steps': 1164, 'loss/train': 4.500604629516602} -09/20/2021 18:31:17 - INFO - __main__ - Step 18628: {'lr': 0.00019996513154358882, 'samples': 596096, 'steps': 1164, 'loss/train': 3.2307240962982178} -09/20/2021 18:31:17 - INFO - __main__ - Step 18629: {'lr': 0.00019996513154358882, 'samples': 596128, 'steps': 1164, 'loss/train': 2.8832132816314697} -09/20/2021 18:31:18 - INFO - __main__ - Step 18630: {'lr': 0.00019996513154358882, 'samples': 596160, 'steps': 1164, 'loss/train': 3.3781886100769043} -09/20/2021 18:31:19 - INFO - __main__ - Step 18631: {'lr': 0.00019996513154358882, 'samples': 596192, 'steps': 1164, 'loss/train': 2.354097843170166} -09/20/2021 18:31:20 - INFO - __main__ - Step 18632: {'lr': 0.00019996513154358882, 'samples': 596224, 'steps': 1164, 'loss/train': 3.502568244934082} -09/20/2021 18:31:20 - INFO - __main__ - Step 18633: {'lr': 0.00019996513154358882, 'samples': 596256, 'steps': 1164, 'loss/train': 3.8865764141082764} -09/20/2021 18:31:21 - INFO - __main__ - Step 18634: {'lr': 0.00019996513154358882, 'samples': 596288, 'steps': 1164, 'loss/train': 3.1455445289611816} -09/20/2021 18:31:22 - INFO - __main__ - Step 18635: {'lr': 0.00019996513154358882, 'samples': 596320, 'steps': 1164, 'loss/train': 3.4812569618225098} -09/20/2021 18:31:23 - INFO - __main__ - Step 18636: {'lr': 0.00019996513154358882, 'samples': 596352, 'steps': 1164, 'loss/train': 3.038668394088745} -09/20/2021 18:31:24 - INFO - __main__ - Step 18637: {'lr': 0.00019996513154358882, 'samples': 596384, 'steps': 1164, 'loss/train': 0.6145526170730591} -09/20/2021 18:31:25 - INFO - __main__ - Step 18638: {'lr': 0.00019996513154358882, 'samples': 596416, 'steps': 1164, 'loss/train': 3.7330212593078613} -09/20/2021 18:31:25 - INFO - __main__ - Step 18639: {'lr': 0.00019996513154358882, 'samples': 596448, 'steps': 1164, 'loss/train': 4.064582824707031} -09/20/2021 18:31:26 - INFO - __main__ - Step 18640: {'lr': 0.00019996513154358882, 'samples': 596480, 'steps': 1164, 'loss/train': 2.933173894882202} -09/20/2021 18:31:27 - INFO - __main__ - Step 18641: {'lr': 0.00019996496290335057, 'samples': 596512, 'steps': 1165, 'loss/train': 3.4097814559936523} -09/20/2021 18:31:28 - INFO - __main__ - Step 18642: {'lr': 0.00019996496290335057, 'samples': 596544, 'steps': 1165, 'loss/train': 2.932750701904297} -09/20/2021 18:31:28 - INFO - __main__ - Step 18643: {'lr': 0.00019996496290335057, 'samples': 596576, 'steps': 1165, 'loss/train': 3.3203208446502686} -09/20/2021 18:31:29 - INFO - __main__ - Step 18644: {'lr': 0.00019996496290335057, 'samples': 596608, 'steps': 1165, 'loss/train': 3.4324851036071777} -09/20/2021 18:31:30 - INFO - __main__ - Step 18645: {'lr': 0.00019996496290335057, 'samples': 596640, 'steps': 1165, 'loss/train': 3.3173110485076904} -09/20/2021 18:31:31 - INFO - __main__ - Step 18646: {'lr': 0.00019996496290335057, 'samples': 596672, 'steps': 1165, 'loss/train': 1.5596323013305664} -09/20/2021 18:31:31 - INFO - __main__ - Step 18647: {'lr': 0.00019996496290335057, 'samples': 596704, 'steps': 1165, 'loss/train': 3.7997870445251465} -09/20/2021 18:31:32 - INFO - __main__ - Step 18648: {'lr': 0.00019996496290335057, 'samples': 596736, 'steps': 1165, 'loss/train': 3.2150020599365234} -09/20/2021 18:31:33 - INFO - __main__ - Step 18649: {'lr': 0.00019996496290335057, 'samples': 596768, 'steps': 1165, 'loss/train': 4.7397074699401855} -09/20/2021 18:31:34 - INFO - __main__ - Step 18650: {'lr': 0.00019996496290335057, 'samples': 596800, 'steps': 1165, 'loss/train': 3.2599613666534424} -09/20/2021 18:31:34 - INFO - __main__ - Step 18651: {'lr': 0.00019996496290335057, 'samples': 596832, 'steps': 1165, 'loss/train': 1.7271337509155273} -09/20/2021 18:31:35 - INFO - __main__ - Step 18652: {'lr': 0.00019996496290335057, 'samples': 596864, 'steps': 1165, 'loss/train': 3.5806949138641357} -09/20/2021 18:31:36 - INFO - __main__ - Step 18653: {'lr': 0.00019996496290335057, 'samples': 596896, 'steps': 1165, 'loss/train': 2.9912116527557373} -09/20/2021 18:31:37 - INFO - __main__ - Step 18654: {'lr': 0.00019996496290335057, 'samples': 596928, 'steps': 1165, 'loss/train': 3.4115219116210938} -09/20/2021 18:31:37 - INFO - __main__ - Step 18655: {'lr': 0.00019996496290335057, 'samples': 596960, 'steps': 1165, 'loss/train': 3.6916072368621826} -09/20/2021 18:31:38 - INFO - __main__ - Step 18656: {'lr': 0.00019996496290335057, 'samples': 596992, 'steps': 1165, 'loss/train': 3.0863211154937744} -09/20/2021 18:31:39 - INFO - __main__ - Step 18657: {'lr': 0.00019996479385635523, 'samples': 597024, 'steps': 1166, 'loss/train': 3.2168211936950684} -09/20/2021 18:31:40 - INFO - __main__ - Step 18658: {'lr': 0.00019996479385635523, 'samples': 597056, 'steps': 1166, 'loss/train': 3.812976121902466} -09/20/2021 18:31:41 - INFO - __main__ - Step 18659: {'lr': 0.00019996479385635523, 'samples': 597088, 'steps': 1166, 'loss/train': 3.2322964668273926} -09/20/2021 18:31:41 - INFO - __main__ - Step 18660: {'lr': 0.00019996479385635523, 'samples': 597120, 'steps': 1166, 'loss/train': 4.503227710723877} -09/20/2021 18:31:42 - INFO - __main__ - Step 18661: {'lr': 0.00019996479385635523, 'samples': 597152, 'steps': 1166, 'loss/train': 4.5320820808410645} -09/20/2021 18:31:43 - INFO - __main__ - Step 18662: {'lr': 0.00019996479385635523, 'samples': 597184, 'steps': 1166, 'loss/train': 3.9957282543182373} -09/20/2021 18:31:44 - INFO - __main__ - Step 18663: {'lr': 0.00019996479385635523, 'samples': 597216, 'steps': 1166, 'loss/train': 2.5970914363861084} -09/20/2021 18:31:44 - INFO - __main__ - Step 18664: {'lr': 0.00019996479385635523, 'samples': 597248, 'steps': 1166, 'loss/train': 3.887108087539673} -09/20/2021 18:31:45 - INFO - __main__ - Step 18665: {'lr': 0.00019996479385635523, 'samples': 597280, 'steps': 1166, 'loss/train': 3.7264578342437744} -09/20/2021 18:31:46 - INFO - __main__ - Step 18666: {'lr': 0.00019996479385635523, 'samples': 597312, 'steps': 1166, 'loss/train': 3.5088236331939697} -09/20/2021 18:31:47 - INFO - __main__ - Step 18667: {'lr': 0.00019996479385635523, 'samples': 597344, 'steps': 1166, 'loss/train': 3.897576093673706} -09/20/2021 18:31:48 - INFO - __main__ - Step 18668: {'lr': 0.00019996479385635523, 'samples': 597376, 'steps': 1166, 'loss/train': 3.628641366958618} -09/20/2021 18:31:49 - INFO - __main__ - Step 18669: {'lr': 0.00019996479385635523, 'samples': 597408, 'steps': 1166, 'loss/train': 2.9258031845092773} -09/20/2021 18:31:49 - INFO - __main__ - Step 18670: {'lr': 0.00019996479385635523, 'samples': 597440, 'steps': 1166, 'loss/train': 3.0457324981689453} -09/20/2021 18:31:50 - INFO - __main__ - Step 18671: {'lr': 0.00019996479385635523, 'samples': 597472, 'steps': 1166, 'loss/train': 4.718111038208008} -09/20/2021 18:31:51 - INFO - __main__ - Step 18672: {'lr': 0.00019996479385635523, 'samples': 597504, 'steps': 1166, 'loss/train': 3.744478464126587} -09/20/2021 18:31:52 - INFO - __main__ - Step 18673: {'lr': 0.00019996462440260358, 'samples': 597536, 'steps': 1167, 'loss/train': 3.807709217071533} -09/20/2021 18:31:53 - INFO - __main__ - Step 18674: {'lr': 0.00019996462440260358, 'samples': 597568, 'steps': 1167, 'loss/train': 4.650198459625244} -09/20/2021 18:31:53 - INFO - __main__ - Step 18675: {'lr': 0.00019996462440260358, 'samples': 597600, 'steps': 1167, 'loss/train': 3.1766786575317383} -09/20/2021 18:31:54 - INFO - __main__ - Step 18676: {'lr': 0.00019996462440260358, 'samples': 597632, 'steps': 1167, 'loss/train': 3.2395286560058594} -09/20/2021 18:31:55 - INFO - __main__ - Step 18677: {'lr': 0.00019996462440260358, 'samples': 597664, 'steps': 1167, 'loss/train': 4.049782752990723} -09/20/2021 18:31:56 - INFO - __main__ - Step 18678: {'lr': 0.00019996462440260358, 'samples': 597696, 'steps': 1167, 'loss/train': 3.436171531677246} -09/20/2021 18:31:56 - INFO - __main__ - Step 18679: {'lr': 0.00019996462440260358, 'samples': 597728, 'steps': 1167, 'loss/train': 3.867793083190918} -09/20/2021 18:31:57 - INFO - __main__ - Step 18680: {'lr': 0.00019996462440260358, 'samples': 597760, 'steps': 1167, 'loss/train': 3.6331634521484375} -09/20/2021 18:31:58 - INFO - __main__ - Step 18681: {'lr': 0.00019996462440260358, 'samples': 597792, 'steps': 1167, 'loss/train': 3.7871100902557373} -09/20/2021 18:31:59 - INFO - __main__ - Step 18682: {'lr': 0.00019996462440260358, 'samples': 597824, 'steps': 1167, 'loss/train': 3.4900386333465576} -09/20/2021 18:31:59 - INFO - __main__ - Step 18683: {'lr': 0.00019996462440260358, 'samples': 597856, 'steps': 1167, 'loss/train': 4.181649208068848} -09/20/2021 18:32:00 - INFO - __main__ - Step 18684: {'lr': 0.00019996462440260358, 'samples': 597888, 'steps': 1167, 'loss/train': 3.6538643836975098} -09/20/2021 18:32:01 - INFO - __main__ - Step 18685: {'lr': 0.00019996462440260358, 'samples': 597920, 'steps': 1167, 'loss/train': 3.730112075805664} -09/20/2021 18:32:02 - INFO - __main__ - Step 18686: {'lr': 0.00019996462440260358, 'samples': 597952, 'steps': 1167, 'loss/train': 3.8313114643096924} -09/20/2021 18:32:02 - INFO - __main__ - Step 18687: {'lr': 0.00019996462440260358, 'samples': 597984, 'steps': 1167, 'loss/train': 3.747828245162964} -09/20/2021 18:32:03 - INFO - __main__ - Step 18688: {'lr': 0.00019996462440260358, 'samples': 598016, 'steps': 1167, 'loss/train': 3.9819109439849854} -09/20/2021 18:32:04 - INFO - __main__ - Step 18689: {'lr': 0.00019996445454209622, 'samples': 598048, 'steps': 1168, 'loss/train': 2.2788143157958984} -09/20/2021 18:32:05 - INFO - __main__ - Step 18690: {'lr': 0.00019996445454209622, 'samples': 598080, 'steps': 1168, 'loss/train': 4.246940612792969} -09/20/2021 18:32:05 - INFO - __main__ - Step 18691: {'lr': 0.00019996445454209622, 'samples': 598112, 'steps': 1168, 'loss/train': 2.629528760910034} -09/20/2021 18:32:06 - INFO - __main__ - Step 18692: {'lr': 0.00019996445454209622, 'samples': 598144, 'steps': 1168, 'loss/train': 3.549570322036743} -09/20/2021 18:32:07 - INFO - __main__ - Step 18693: {'lr': 0.00019996445454209622, 'samples': 598176, 'steps': 1168, 'loss/train': 2.561924457550049} -09/20/2021 18:32:08 - INFO - __main__ - Step 18694: {'lr': 0.00019996445454209622, 'samples': 598208, 'steps': 1168, 'loss/train': 3.560969352722168} -09/20/2021 18:32:08 - INFO - __main__ - Step 18695: {'lr': 0.00019996445454209622, 'samples': 598240, 'steps': 1168, 'loss/train': 3.4127869606018066} -09/20/2021 18:32:09 - INFO - __main__ - Step 18696: {'lr': 0.00019996445454209622, 'samples': 598272, 'steps': 1168, 'loss/train': 3.192911148071289} -09/20/2021 18:32:10 - INFO - __main__ - Step 18697: {'lr': 0.00019996445454209622, 'samples': 598304, 'steps': 1168, 'loss/train': 3.753267526626587} -09/20/2021 18:32:11 - INFO - __main__ - Step 18698: {'lr': 0.00019996445454209622, 'samples': 598336, 'steps': 1168, 'loss/train': 3.4053521156311035} -09/20/2021 18:32:12 - INFO - __main__ - Step 18699: {'lr': 0.00019996445454209622, 'samples': 598368, 'steps': 1168, 'loss/train': 4.199446678161621} -09/20/2021 18:32:13 - INFO - __main__ - Step 18700: {'lr': 0.00019996445454209622, 'samples': 598400, 'steps': 1168, 'loss/train': 4.400890350341797} -09/20/2021 18:32:14 - INFO - __main__ - Step 18701: {'lr': 0.00019996445454209622, 'samples': 598432, 'steps': 1168, 'loss/train': 2.710970878601074} -09/20/2021 18:32:14 - INFO - __main__ - Step 18702: {'lr': 0.00019996445454209622, 'samples': 598464, 'steps': 1168, 'loss/train': 4.762862205505371} -09/20/2021 18:32:15 - INFO - __main__ - Step 18703: {'lr': 0.00019996445454209622, 'samples': 598496, 'steps': 1168, 'loss/train': 3.2013986110687256} -09/20/2021 18:32:16 - INFO - __main__ - Step 18704: {'lr': 0.00019996445454209622, 'samples': 598528, 'steps': 1168, 'loss/train': 3.452465534210205} -09/20/2021 18:32:17 - INFO - __main__ - Step 18705: {'lr': 0.00019996428427483388, 'samples': 598560, 'steps': 1169, 'loss/train': 3.2585408687591553} -09/20/2021 18:32:17 - INFO - __main__ - Step 18706: {'lr': 0.00019996428427483388, 'samples': 598592, 'steps': 1169, 'loss/train': 3.611987590789795} -09/20/2021 18:32:18 - INFO - __main__ - Step 18707: {'lr': 0.00019996428427483388, 'samples': 598624, 'steps': 1169, 'loss/train': 1.2307021617889404} -09/20/2021 18:32:19 - INFO - __main__ - Step 18708: {'lr': 0.00019996428427483388, 'samples': 598656, 'steps': 1169, 'loss/train': 2.6723155975341797} -09/20/2021 18:32:20 - INFO - __main__ - Step 18709: {'lr': 0.00019996428427483388, 'samples': 598688, 'steps': 1169, 'loss/train': 3.75335955619812} -09/20/2021 18:32:20 - INFO - __main__ - Step 18710: {'lr': 0.00019996428427483388, 'samples': 598720, 'steps': 1169, 'loss/train': 4.206615447998047} -09/20/2021 18:32:21 - INFO - __main__ - Step 18711: {'lr': 0.00019996428427483388, 'samples': 598752, 'steps': 1169, 'loss/train': 4.359938144683838} -09/20/2021 18:32:22 - INFO - __main__ - Step 18712: {'lr': 0.00019996428427483388, 'samples': 598784, 'steps': 1169, 'loss/train': 3.3649652004241943} -09/20/2021 18:32:23 - INFO - __main__ - Step 18713: {'lr': 0.00019996428427483388, 'samples': 598816, 'steps': 1169, 'loss/train': 2.7120275497436523} -09/20/2021 18:32:23 - INFO - __main__ - Step 18714: {'lr': 0.00019996428427483388, 'samples': 598848, 'steps': 1169, 'loss/train': 3.5412211418151855} -09/20/2021 18:32:24 - INFO - __main__ - Step 18715: {'lr': 0.00019996428427483388, 'samples': 598880, 'steps': 1169, 'loss/train': 2.5646979808807373} -09/20/2021 18:32:25 - INFO - __main__ - Step 18716: {'lr': 0.00019996428427483388, 'samples': 598912, 'steps': 1169, 'loss/train': 4.313615322113037} -09/20/2021 18:32:26 - INFO - __main__ - Step 18717: {'lr': 0.00019996428427483388, 'samples': 598944, 'steps': 1169, 'loss/train': 4.84904146194458} -09/20/2021 18:32:26 - INFO - __main__ - Step 18718: {'lr': 0.00019996428427483388, 'samples': 598976, 'steps': 1169, 'loss/train': 4.479498386383057} -09/20/2021 18:32:27 - INFO - __main__ - Step 18719: {'lr': 0.00019996428427483388, 'samples': 599008, 'steps': 1169, 'loss/train': 3.2450897693634033} -09/20/2021 18:32:28 - INFO - __main__ - Step 18720: {'lr': 0.00019996428427483388, 'samples': 599040, 'steps': 1169, 'loss/train': 3.4209015369415283} -09/20/2021 18:32:29 - INFO - __main__ - Step 18721: {'lr': 0.00019996411360081727, 'samples': 599072, 'steps': 1170, 'loss/train': 2.9183883666992188} -09/20/2021 18:32:30 - INFO - __main__ - Step 18722: {'lr': 0.00019996411360081727, 'samples': 599104, 'steps': 1170, 'loss/train': 3.58132266998291} -09/20/2021 18:32:30 - INFO - __main__ - Step 18723: {'lr': 0.00019996411360081727, 'samples': 599136, 'steps': 1170, 'loss/train': 2.7706472873687744} -09/20/2021 18:32:31 - INFO - __main__ - Step 18724: {'lr': 0.00019996411360081727, 'samples': 599168, 'steps': 1170, 'loss/train': 4.268226623535156} -09/20/2021 18:32:32 - INFO - __main__ - Step 18725: {'lr': 0.00019996411360081727, 'samples': 599200, 'steps': 1170, 'loss/train': 3.652421712875366} -09/20/2021 18:32:33 - INFO - __main__ - Step 18726: {'lr': 0.00019996411360081727, 'samples': 599232, 'steps': 1170, 'loss/train': 0.9601603746414185} -09/20/2021 18:32:33 - INFO - __main__ - Step 18727: {'lr': 0.00019996411360081727, 'samples': 599264, 'steps': 1170, 'loss/train': 0.6169868111610413} -09/20/2021 18:32:34 - INFO - __main__ - Step 18728: {'lr': 0.00019996411360081727, 'samples': 599296, 'steps': 1170, 'loss/train': 0.9949146509170532} -09/20/2021 18:32:36 - INFO - __main__ - Step 18729: {'lr': 0.00019996411360081727, 'samples': 599328, 'steps': 1170, 'loss/train': 4.379327774047852} -09/20/2021 18:32:37 - INFO - __main__ - Step 18730: {'lr': 0.00019996411360081727, 'samples': 599360, 'steps': 1170, 'loss/train': 3.454422950744629} -09/20/2021 18:32:38 - INFO - __main__ - Step 18731: {'lr': 0.00019996411360081727, 'samples': 599392, 'steps': 1170, 'loss/train': 3.4805243015289307} -09/20/2021 18:32:38 - INFO - __main__ - Step 18732: {'lr': 0.00019996411360081727, 'samples': 599424, 'steps': 1170, 'loss/train': 2.6774346828460693} -09/20/2021 18:32:39 - INFO - __main__ - Step 18733: {'lr': 0.00019996411360081727, 'samples': 599456, 'steps': 1170, 'loss/train': 0.885400116443634} -09/20/2021 18:32:40 - INFO - __main__ - Step 18734: {'lr': 0.00019996411360081727, 'samples': 599488, 'steps': 1170, 'loss/train': 3.552746534347534} -09/20/2021 18:32:41 - INFO - __main__ - Step 18735: {'lr': 0.00019996411360081727, 'samples': 599520, 'steps': 1170, 'loss/train': 3.272135019302368} -09/20/2021 18:32:41 - INFO - __main__ - Step 18736: {'lr': 0.00019996411360081727, 'samples': 599552, 'steps': 1170, 'loss/train': 2.8659770488739014} -09/20/2021 18:32:42 - INFO - __main__ - Step 18737: {'lr': 0.00019996394252004706, 'samples': 599584, 'steps': 1171, 'loss/train': 3.1126468181610107} -09/20/2021 18:32:43 - INFO - __main__ - Step 18738: {'lr': 0.00019996394252004706, 'samples': 599616, 'steps': 1171, 'loss/train': 3.260712146759033} -09/20/2021 18:32:44 - INFO - __main__ - Step 18739: {'lr': 0.00019996394252004706, 'samples': 599648, 'steps': 1171, 'loss/train': 3.5201590061187744} -09/20/2021 18:32:44 - INFO - __main__ - Step 18740: {'lr': 0.00019996394252004706, 'samples': 599680, 'steps': 1171, 'loss/train': 3.571906089782715} -09/20/2021 18:32:45 - INFO - __main__ - Step 18741: {'lr': 0.00019996394252004706, 'samples': 599712, 'steps': 1171, 'loss/train': 3.4452266693115234} -09/20/2021 18:32:46 - INFO - __main__ - Step 18742: {'lr': 0.00019996394252004706, 'samples': 599744, 'steps': 1171, 'loss/train': 3.5067687034606934} -09/20/2021 18:32:47 - INFO - __main__ - Step 18743: {'lr': 0.00019996394252004706, 'samples': 599776, 'steps': 1171, 'loss/train': 3.8312103748321533} -09/20/2021 18:32:47 - INFO - __main__ - Step 18744: {'lr': 0.00019996394252004706, 'samples': 599808, 'steps': 1171, 'loss/train': 3.0214126110076904} -09/20/2021 18:32:48 - INFO - __main__ - Step 18745: {'lr': 0.00019996394252004706, 'samples': 599840, 'steps': 1171, 'loss/train': 4.063092231750488} -09/20/2021 18:32:49 - INFO - __main__ - Step 18746: {'lr': 0.00019996394252004706, 'samples': 599872, 'steps': 1171, 'loss/train': 4.178299427032471} -09/20/2021 18:32:50 - INFO - __main__ - Step 18747: {'lr': 0.00019996394252004706, 'samples': 599904, 'steps': 1171, 'loss/train': 2.847238302230835} -09/20/2021 18:32:50 - INFO - __main__ - Step 18748: {'lr': 0.00019996394252004706, 'samples': 599936, 'steps': 1171, 'loss/train': 2.9589827060699463} -09/20/2021 18:32:51 - INFO - __main__ - Step 18749: {'lr': 0.00019996394252004706, 'samples': 599968, 'steps': 1171, 'loss/train': 3.519554376602173} -09/20/2021 18:32:52 - INFO - __main__ - Step 18750: {'lr': 0.00019996394252004706, 'samples': 600000, 'steps': 1171, 'loss/train': 3.518031120300293} -09/20/2021 18:32:53 - INFO - __main__ - Step 18751: {'lr': 0.00019996394252004706, 'samples': 600032, 'steps': 1171, 'loss/train': 2.9645869731903076} -09/20/2021 18:32:53 - INFO - __main__ - Step 18752: {'lr': 0.00019996394252004706, 'samples': 600064, 'steps': 1171, 'loss/train': 2.5986013412475586} -09/20/2021 18:32:54 - INFO - __main__ - Step 18753: {'lr': 0.00019996377103252398, 'samples': 600096, 'steps': 1172, 'loss/train': 2.89416766166687} -09/20/2021 18:32:55 - INFO - __main__ - Step 18754: {'lr': 0.00019996377103252398, 'samples': 600128, 'steps': 1172, 'loss/train': 4.161194324493408} -09/20/2021 18:32:56 - INFO - __main__ - Step 18755: {'lr': 0.00019996377103252398, 'samples': 600160, 'steps': 1172, 'loss/train': 3.9865968227386475} -09/20/2021 18:32:57 - INFO - __main__ - Step 18756: {'lr': 0.00019996377103252398, 'samples': 600192, 'steps': 1172, 'loss/train': 3.1440272331237793} -09/20/2021 18:32:57 - INFO - __main__ - Step 18757: {'lr': 0.00019996377103252398, 'samples': 600224, 'steps': 1172, 'loss/train': 3.2444283962249756} -09/20/2021 18:32:58 - INFO - __main__ - Step 18758: {'lr': 0.00019996377103252398, 'samples': 600256, 'steps': 1172, 'loss/train': 4.485649585723877} -09/20/2021 18:32:59 - INFO - __main__ - Step 18759: {'lr': 0.00019996377103252398, 'samples': 600288, 'steps': 1172, 'loss/train': 4.773986339569092} -09/20/2021 18:33:00 - INFO - __main__ - Step 18760: {'lr': 0.00019996377103252398, 'samples': 600320, 'steps': 1172, 'loss/train': 4.630414962768555} -09/20/2021 18:33:00 - INFO - __main__ - Step 18761: {'lr': 0.00019996377103252398, 'samples': 600352, 'steps': 1172, 'loss/train': 4.790334224700928} -09/20/2021 18:33:02 - INFO - __main__ - Step 18762: {'lr': 0.00019996377103252398, 'samples': 600384, 'steps': 1172, 'loss/train': 4.475866317749023} -09/20/2021 18:33:02 - INFO - __main__ - Step 18763: {'lr': 0.00019996377103252398, 'samples': 600416, 'steps': 1172, 'loss/train': 3.8545773029327393} -09/20/2021 18:33:03 - INFO - __main__ - Step 18764: {'lr': 0.00019996377103252398, 'samples': 600448, 'steps': 1172, 'loss/train': 4.031198024749756} -09/20/2021 18:33:04 - INFO - __main__ - Step 18765: {'lr': 0.00019996377103252398, 'samples': 600480, 'steps': 1172, 'loss/train': 3.139664649963379} -09/20/2021 18:33:05 - INFO - __main__ - Step 18766: {'lr': 0.00019996377103252398, 'samples': 600512, 'steps': 1172, 'loss/train': 3.3783857822418213} -09/20/2021 18:33:05 - INFO - __main__ - Step 18767: {'lr': 0.00019996377103252398, 'samples': 600544, 'steps': 1172, 'loss/train': 3.6143136024475098} -09/20/2021 18:33:06 - INFO - __main__ - Step 18768: {'lr': 0.00019996377103252398, 'samples': 600576, 'steps': 1172, 'loss/train': 3.2621681690216064} -09/20/2021 18:33:07 - INFO - __main__ - Step 18769: {'lr': 0.0001999635991382487, 'samples': 600608, 'steps': 1173, 'loss/train': 3.5337138175964355} -09/20/2021 18:33:08 - INFO - __main__ - Step 18770: {'lr': 0.0001999635991382487, 'samples': 600640, 'steps': 1173, 'loss/train': 3.3409647941589355} -09/20/2021 18:33:09 - INFO - __main__ - Step 18771: {'lr': 0.0001999635991382487, 'samples': 600672, 'steps': 1173, 'loss/train': 2.2358148097991943} -09/20/2021 18:33:09 - INFO - __main__ - Step 18772: {'lr': 0.0001999635991382487, 'samples': 600704, 'steps': 1173, 'loss/train': 2.2552499771118164} -09/20/2021 18:33:10 - INFO - __main__ - Step 18773: {'lr': 0.0001999635991382487, 'samples': 600736, 'steps': 1173, 'loss/train': 3.44159197807312} -09/20/2021 18:33:11 - INFO - __main__ - Step 18774: {'lr': 0.0001999635991382487, 'samples': 600768, 'steps': 1173, 'loss/train': 3.1825709342956543} -09/20/2021 18:33:12 - INFO - __main__ - Step 18775: {'lr': 0.0001999635991382487, 'samples': 600800, 'steps': 1173, 'loss/train': 4.339505672454834} -09/20/2021 18:33:12 - INFO - __main__ - Step 18776: {'lr': 0.0001999635991382487, 'samples': 600832, 'steps': 1173, 'loss/train': 3.1851158142089844} -09/20/2021 18:33:13 - INFO - __main__ - Step 18777: {'lr': 0.0001999635991382487, 'samples': 600864, 'steps': 1173, 'loss/train': 2.8313887119293213} -09/20/2021 18:33:14 - INFO - __main__ - Step 18778: {'lr': 0.0001999635991382487, 'samples': 600896, 'steps': 1173, 'loss/train': 3.16694712638855} -09/20/2021 18:33:15 - INFO - __main__ - Step 18779: {'lr': 0.0001999635991382487, 'samples': 600928, 'steps': 1173, 'loss/train': 4.480741500854492} -09/20/2021 18:33:15 - INFO - __main__ - Step 18780: {'lr': 0.0001999635991382487, 'samples': 600960, 'steps': 1173, 'loss/train': 2.9883480072021484} -09/20/2021 18:33:16 - INFO - __main__ - Step 18781: {'lr': 0.0001999635991382487, 'samples': 600992, 'steps': 1173, 'loss/train': 3.504054069519043} -09/20/2021 18:33:17 - INFO - __main__ - Step 18782: {'lr': 0.0001999635991382487, 'samples': 601024, 'steps': 1173, 'loss/train': 2.7762610912323} -09/20/2021 18:33:18 - INFO - __main__ - Step 18783: {'lr': 0.0001999635991382487, 'samples': 601056, 'steps': 1173, 'loss/train': 2.7793779373168945} -09/20/2021 18:33:18 - INFO - __main__ - Step 18784: {'lr': 0.0001999635991382487, 'samples': 601088, 'steps': 1173, 'loss/train': 3.4901082515716553} -09/20/2021 18:33:19 - INFO - __main__ - Step 18785: {'lr': 0.00019996342683722192, 'samples': 601120, 'steps': 1174, 'loss/train': 4.3316731452941895} -09/20/2021 18:33:20 - INFO - __main__ - Step 18786: {'lr': 0.00019996342683722192, 'samples': 601152, 'steps': 1174, 'loss/train': 3.315609931945801} -09/20/2021 18:33:21 - INFO - __main__ - Step 18787: {'lr': 0.00019996342683722192, 'samples': 601184, 'steps': 1174, 'loss/train': 2.991361141204834} -09/20/2021 18:33:21 - INFO - __main__ - Step 18788: {'lr': 0.00019996342683722192, 'samples': 601216, 'steps': 1174, 'loss/train': 4.112417221069336} -09/20/2021 18:33:22 - INFO - __main__ - Step 18789: {'lr': 0.00019996342683722192, 'samples': 601248, 'steps': 1174, 'loss/train': 4.201086521148682} -09/20/2021 18:33:23 - INFO - __main__ - Step 18790: {'lr': 0.00019996342683722192, 'samples': 601280, 'steps': 1174, 'loss/train': 2.126112461090088} -09/20/2021 18:33:24 - INFO - __main__ - Step 18791: {'lr': 0.00019996342683722192, 'samples': 601312, 'steps': 1174, 'loss/train': 2.9322707653045654} -09/20/2021 18:33:24 - INFO - __main__ - Step 18792: {'lr': 0.00019996342683722192, 'samples': 601344, 'steps': 1174, 'loss/train': 2.9595601558685303} -09/20/2021 18:33:26 - INFO - __main__ - Step 18793: {'lr': 0.00019996342683722192, 'samples': 601376, 'steps': 1174, 'loss/train': 3.2427306175231934} -09/20/2021 18:33:27 - INFO - __main__ - Step 18794: {'lr': 0.00019996342683722192, 'samples': 601408, 'steps': 1174, 'loss/train': 3.0290541648864746} -09/20/2021 18:33:28 - INFO - __main__ - Step 18795: {'lr': 0.00019996342683722192, 'samples': 601440, 'steps': 1174, 'loss/train': 3.591491937637329} -09/20/2021 18:33:28 - INFO - __main__ - Step 18796: {'lr': 0.00019996342683722192, 'samples': 601472, 'steps': 1174, 'loss/train': 3.464843511581421} -09/20/2021 18:33:29 - INFO - __main__ - Step 18797: {'lr': 0.00019996342683722192, 'samples': 601504, 'steps': 1174, 'loss/train': 3.9700307846069336} -09/20/2021 18:33:30 - INFO - __main__ - Step 18798: {'lr': 0.00019996342683722192, 'samples': 601536, 'steps': 1174, 'loss/train': 3.2055583000183105} -09/20/2021 18:33:31 - INFO - __main__ - Step 18799: {'lr': 0.00019996342683722192, 'samples': 601568, 'steps': 1174, 'loss/train': 4.175554275512695} -09/20/2021 18:33:31 - INFO - __main__ - Step 18800: {'lr': 0.00019996342683722192, 'samples': 601600, 'steps': 1174, 'loss/train': 2.766148090362549} -09/20/2021 18:33:32 - INFO - __main__ - Step 18801: {'lr': 0.00019996325412944432, 'samples': 601632, 'steps': 1175, 'loss/train': 5.310338497161865} -09/20/2021 18:33:33 - INFO - __main__ - Step 18802: {'lr': 0.00019996325412944432, 'samples': 601664, 'steps': 1175, 'loss/train': 4.700557231903076} -09/20/2021 18:33:34 - INFO - __main__ - Step 18803: {'lr': 0.00019996325412944432, 'samples': 601696, 'steps': 1175, 'loss/train': 5.182682991027832} -09/20/2021 18:33:34 - INFO - __main__ - Step 18804: {'lr': 0.00019996325412944432, 'samples': 601728, 'steps': 1175, 'loss/train': 5.580437660217285} -09/20/2021 18:33:35 - INFO - __main__ - Step 18805: {'lr': 0.00019996325412944432, 'samples': 601760, 'steps': 1175, 'loss/train': 4.69720983505249} -09/20/2021 18:33:36 - INFO - __main__ - Step 18806: {'lr': 0.00019996325412944432, 'samples': 601792, 'steps': 1175, 'loss/train': 2.824892282485962} -09/20/2021 18:33:37 - INFO - __main__ - Step 18807: {'lr': 0.00019996325412944432, 'samples': 601824, 'steps': 1175, 'loss/train': 3.196463108062744} -09/20/2021 18:33:37 - INFO - __main__ - Step 18808: {'lr': 0.00019996325412944432, 'samples': 601856, 'steps': 1175, 'loss/train': 2.8143739700317383} -09/20/2021 18:33:38 - INFO - __main__ - Step 18809: {'lr': 0.00019996325412944432, 'samples': 601888, 'steps': 1175, 'loss/train': 2.5047879219055176} -09/20/2021 18:33:39 - INFO - __main__ - Step 18810: {'lr': 0.00019996325412944432, 'samples': 601920, 'steps': 1175, 'loss/train': 3.962664842605591} -09/20/2021 18:33:40 - INFO - __main__ - Step 18811: {'lr': 0.00019996325412944432, 'samples': 601952, 'steps': 1175, 'loss/train': 2.9517054557800293} -09/20/2021 18:33:40 - INFO - __main__ - Step 18812: {'lr': 0.00019996325412944432, 'samples': 601984, 'steps': 1175, 'loss/train': 4.439876556396484} -09/20/2021 18:33:41 - INFO - __main__ - Step 18813: {'lr': 0.00019996325412944432, 'samples': 602016, 'steps': 1175, 'loss/train': 3.712092876434326} -09/20/2021 18:33:42 - INFO - __main__ - Step 18814: {'lr': 0.00019996325412944432, 'samples': 602048, 'steps': 1175, 'loss/train': 3.331648588180542} -09/20/2021 18:33:43 - INFO - __main__ - Step 18815: {'lr': 0.00019996325412944432, 'samples': 602080, 'steps': 1175, 'loss/train': 3.23825740814209} -09/20/2021 18:33:43 - INFO - __main__ - Step 18816: {'lr': 0.00019996325412944432, 'samples': 602112, 'steps': 1175, 'loss/train': 2.953277111053467} -09/20/2021 18:33:44 - INFO - __main__ - Step 18817: {'lr': 0.00019996308101491664, 'samples': 602144, 'steps': 1176, 'loss/train': 4.070038318634033} -09/20/2021 18:33:45 - INFO - __main__ - Step 18818: {'lr': 0.00019996308101491664, 'samples': 602176, 'steps': 1176, 'loss/train': 3.523677349090576} -09/20/2021 18:33:46 - INFO - __main__ - Step 18819: {'lr': 0.00019996308101491664, 'samples': 602208, 'steps': 1176, 'loss/train': 3.671041250228882} -09/20/2021 18:33:47 - INFO - __main__ - Step 18820: {'lr': 0.00019996308101491664, 'samples': 602240, 'steps': 1176, 'loss/train': 3.425499200820923} -09/20/2021 18:33:47 - INFO - __main__ - Step 18821: {'lr': 0.00019996308101491664, 'samples': 602272, 'steps': 1176, 'loss/train': 2.8455874919891357} -09/20/2021 18:33:48 - INFO - __main__ - Step 18822: {'lr': 0.00019996308101491664, 'samples': 602304, 'steps': 1176, 'loss/train': 3.2007524967193604} -09/20/2021 18:33:49 - INFO - __main__ - Step 18823: {'lr': 0.00019996308101491664, 'samples': 602336, 'steps': 1176, 'loss/train': 5.940363883972168} -09/20/2021 18:33:50 - INFO - __main__ - Step 18824: {'lr': 0.00019996308101491664, 'samples': 602368, 'steps': 1176, 'loss/train': 3.3029067516326904} -09/20/2021 18:33:51 - INFO - __main__ - Step 18825: {'lr': 0.00019996308101491664, 'samples': 602400, 'steps': 1176, 'loss/train': 4.147463321685791} -09/20/2021 18:33:52 - INFO - __main__ - Step 18826: {'lr': 0.00019996308101491664, 'samples': 602432, 'steps': 1176, 'loss/train': 3.858484983444214} -09/20/2021 18:33:52 - INFO - __main__ - Step 18827: {'lr': 0.00019996308101491664, 'samples': 602464, 'steps': 1176, 'loss/train': 3.059391498565674} -09/20/2021 18:33:53 - INFO - __main__ - Step 18828: {'lr': 0.00019996308101491664, 'samples': 602496, 'steps': 1176, 'loss/train': 3.4801700115203857} -09/20/2021 18:33:54 - INFO - __main__ - Step 18829: {'lr': 0.00019996308101491664, 'samples': 602528, 'steps': 1176, 'loss/train': 3.310706377029419} -09/20/2021 18:33:55 - INFO - __main__ - Step 18830: {'lr': 0.00019996308101491664, 'samples': 602560, 'steps': 1176, 'loss/train': 4.822046279907227} -09/20/2021 18:33:55 - INFO - __main__ - Step 18831: {'lr': 0.00019996308101491664, 'samples': 602592, 'steps': 1176, 'loss/train': 2.903658866882324} -09/20/2021 18:33:56 - INFO - __main__ - Step 18832: {'lr': 0.00019996308101491664, 'samples': 602624, 'steps': 1176, 'loss/train': 3.621795177459717} -09/20/2021 18:33:57 - INFO - __main__ - Step 18833: {'lr': 0.0001999629074936396, 'samples': 602656, 'steps': 1177, 'loss/train': 4.12860107421875} -09/20/2021 18:33:58 - INFO - __main__ - Step 18834: {'lr': 0.0001999629074936396, 'samples': 602688, 'steps': 1177, 'loss/train': 1.617169976234436} -09/20/2021 18:33:59 - INFO - __main__ - Step 18835: {'lr': 0.0001999629074936396, 'samples': 602720, 'steps': 1177, 'loss/train': 4.0979743003845215} -09/20/2021 18:33:59 - INFO - __main__ - Step 18836: {'lr': 0.0001999629074936396, 'samples': 602752, 'steps': 1177, 'loss/train': 4.164889335632324} -09/20/2021 18:34:00 - INFO - __main__ - Step 18837: {'lr': 0.0001999629074936396, 'samples': 602784, 'steps': 1177, 'loss/train': 4.045492172241211} -09/20/2021 18:34:01 - INFO - __main__ - Step 18838: {'lr': 0.0001999629074936396, 'samples': 602816, 'steps': 1177, 'loss/train': 4.718043804168701} -09/20/2021 18:34:02 - INFO - __main__ - Step 18839: {'lr': 0.0001999629074936396, 'samples': 602848, 'steps': 1177, 'loss/train': 4.5661444664001465} -09/20/2021 18:34:02 - INFO - __main__ - Step 18840: {'lr': 0.0001999629074936396, 'samples': 602880, 'steps': 1177, 'loss/train': 3.265266180038452} -09/20/2021 18:34:03 - INFO - __main__ - Step 18841: {'lr': 0.0001999629074936396, 'samples': 602912, 'steps': 1177, 'loss/train': 2.80619215965271} -09/20/2021 18:34:04 - INFO - __main__ - Step 18842: {'lr': 0.0001999629074936396, 'samples': 602944, 'steps': 1177, 'loss/train': 4.018521785736084} -09/20/2021 18:34:05 - INFO - __main__ - Step 18843: {'lr': 0.0001999629074936396, 'samples': 602976, 'steps': 1177, 'loss/train': 4.7103681564331055} -09/20/2021 18:34:05 - INFO - __main__ - Step 18844: {'lr': 0.0001999629074936396, 'samples': 603008, 'steps': 1177, 'loss/train': 3.8664629459381104} -09/20/2021 18:34:06 - INFO - __main__ - Step 18845: {'lr': 0.0001999629074936396, 'samples': 603040, 'steps': 1177, 'loss/train': 3.6879239082336426} -09/20/2021 18:34:07 - INFO - __main__ - Step 18846: {'lr': 0.0001999629074936396, 'samples': 603072, 'steps': 1177, 'loss/train': 4.401261806488037} -09/20/2021 18:34:08 - INFO - __main__ - Step 18847: {'lr': 0.0001999629074936396, 'samples': 603104, 'steps': 1177, 'loss/train': 3.1856400966644287} -09/20/2021 18:34:08 - INFO - __main__ - Step 18848: {'lr': 0.0001999629074936396, 'samples': 603136, 'steps': 1177, 'loss/train': 3.654682159423828} -09/20/2021 18:34:09 - INFO - __main__ - Step 18849: {'lr': 0.00019996273356561383, 'samples': 603168, 'steps': 1178, 'loss/train': 4.020884037017822} -09/20/2021 18:34:10 - INFO - __main__ - Step 18850: {'lr': 0.00019996273356561383, 'samples': 603200, 'steps': 1178, 'loss/train': 3.358772039413452} -09/20/2021 18:34:11 - INFO - __main__ - Step 18851: {'lr': 0.00019996273356561383, 'samples': 603232, 'steps': 1178, 'loss/train': 4.488504886627197} -09/20/2021 18:34:11 - INFO - __main__ - Step 18852: {'lr': 0.00019996273356561383, 'samples': 603264, 'steps': 1178, 'loss/train': 2.0298497676849365} -09/20/2021 18:34:12 - INFO - __main__ - Step 18853: {'lr': 0.00019996273356561383, 'samples': 603296, 'steps': 1178, 'loss/train': 1.448029637336731} -09/20/2021 18:34:13 - INFO - __main__ - Step 18854: {'lr': 0.00019996273356561383, 'samples': 603328, 'steps': 1178, 'loss/train': 3.8341119289398193} -09/20/2021 18:34:14 - INFO - __main__ - Step 18855: {'lr': 0.00019996273356561383, 'samples': 603360, 'steps': 1178, 'loss/train': 3.916118860244751} -09/20/2021 18:34:15 - INFO - __main__ - Step 18856: {'lr': 0.00019996273356561383, 'samples': 603392, 'steps': 1178, 'loss/train': 3.0104267597198486} -09/20/2021 18:34:16 - INFO - __main__ - Step 18857: {'lr': 0.00019996273356561383, 'samples': 603424, 'steps': 1178, 'loss/train': 3.778437614440918} -09/20/2021 18:34:16 - INFO - __main__ - Step 18858: {'lr': 0.00019996273356561383, 'samples': 603456, 'steps': 1178, 'loss/train': 3.238225221633911} -09/20/2021 18:34:17 - INFO - __main__ - Step 18859: {'lr': 0.00019996273356561383, 'samples': 603488, 'steps': 1178, 'loss/train': 2.542360782623291} -09/20/2021 18:34:18 - INFO - __main__ - Step 18860: {'lr': 0.00019996273356561383, 'samples': 603520, 'steps': 1178, 'loss/train': 3.9050188064575195} -09/20/2021 18:34:19 - INFO - __main__ - Step 18861: {'lr': 0.00019996273356561383, 'samples': 603552, 'steps': 1178, 'loss/train': 3.874650001525879} -09/20/2021 18:34:19 - INFO - __main__ - Step 18862: {'lr': 0.00019996273356561383, 'samples': 603584, 'steps': 1178, 'loss/train': 3.855339527130127} -09/20/2021 18:34:20 - INFO - __main__ - Step 18863: {'lr': 0.00019996273356561383, 'samples': 603616, 'steps': 1178, 'loss/train': 3.3050620555877686} -09/20/2021 18:34:21 - INFO - __main__ - Step 18864: {'lr': 0.00019996273356561383, 'samples': 603648, 'steps': 1178, 'loss/train': 3.5153274536132812} -09/20/2021 18:34:22 - INFO - __main__ - Step 18865: {'lr': 0.0001999625592308401, 'samples': 603680, 'steps': 1179, 'loss/train': 4.062264442443848} -09/20/2021 18:34:23 - INFO - __main__ - Step 18866: {'lr': 0.0001999625592308401, 'samples': 603712, 'steps': 1179, 'loss/train': 3.016930103302002} -09/20/2021 18:34:23 - INFO - __main__ - Step 18867: {'lr': 0.0001999625592308401, 'samples': 603744, 'steps': 1179, 'loss/train': 3.604884386062622} -09/20/2021 18:34:24 - INFO - __main__ - Step 18868: {'lr': 0.0001999625592308401, 'samples': 603776, 'steps': 1179, 'loss/train': 4.083329677581787} -09/20/2021 18:34:25 - INFO - __main__ - Step 18869: {'lr': 0.0001999625592308401, 'samples': 603808, 'steps': 1179, 'loss/train': 3.5889554023742676} -09/20/2021 18:34:26 - INFO - __main__ - Step 18870: {'lr': 0.0001999625592308401, 'samples': 603840, 'steps': 1179, 'loss/train': 3.404343366622925} -09/20/2021 18:34:26 - INFO - __main__ - Step 18871: {'lr': 0.0001999625592308401, 'samples': 603872, 'steps': 1179, 'loss/train': 2.403360605239868} -09/20/2021 18:34:27 - INFO - __main__ - Step 18872: {'lr': 0.0001999625592308401, 'samples': 603904, 'steps': 1179, 'loss/train': 3.702655792236328} -09/20/2021 18:34:28 - INFO - __main__ - Step 18873: {'lr': 0.0001999625592308401, 'samples': 603936, 'steps': 1179, 'loss/train': 3.837470293045044} -09/20/2021 18:34:29 - INFO - __main__ - Step 18874: {'lr': 0.0001999625592308401, 'samples': 603968, 'steps': 1179, 'loss/train': 3.975229501724243} -09/20/2021 18:34:29 - INFO - __main__ - Step 18875: {'lr': 0.0001999625592308401, 'samples': 604000, 'steps': 1179, 'loss/train': 3.144740343093872} -09/20/2021 18:34:30 - INFO - __main__ - Step 18876: {'lr': 0.0001999625592308401, 'samples': 604032, 'steps': 1179, 'loss/train': 3.3107616901397705} -09/20/2021 18:34:31 - INFO - __main__ - Step 18877: {'lr': 0.0001999625592308401, 'samples': 604064, 'steps': 1179, 'loss/train': 3.6540141105651855} -09/20/2021 18:34:32 - INFO - __main__ - Step 18878: {'lr': 0.0001999625592308401, 'samples': 604096, 'steps': 1179, 'loss/train': 1.922249436378479} -09/20/2021 18:34:32 - INFO - __main__ - Step 18879: {'lr': 0.0001999625592308401, 'samples': 604128, 'steps': 1179, 'loss/train': 3.5143685340881348} -09/20/2021 18:34:33 - INFO - __main__ - Step 18880: {'lr': 0.0001999625592308401, 'samples': 604160, 'steps': 1179, 'loss/train': 5.005918979644775} -09/20/2021 18:34:34 - INFO - __main__ - Step 18881: {'lr': 0.00019996238448931913, 'samples': 604192, 'steps': 1180, 'loss/train': 0.91562420129776} -09/20/2021 18:34:35 - INFO - __main__ - Step 18882: {'lr': 0.00019996238448931913, 'samples': 604224, 'steps': 1180, 'loss/train': 3.6784486770629883} -09/20/2021 18:34:35 - INFO - __main__ - Step 18883: {'lr': 0.00019996238448931913, 'samples': 604256, 'steps': 1180, 'loss/train': 3.579963445663452} -09/20/2021 18:34:36 - INFO - __main__ - Step 18884: {'lr': 0.00019996238448931913, 'samples': 604288, 'steps': 1180, 'loss/train': 3.138275623321533} -09/20/2021 18:34:37 - INFO - __main__ - Step 18885: {'lr': 0.00019996238448931913, 'samples': 604320, 'steps': 1180, 'loss/train': 3.463484048843384} -09/20/2021 18:34:38 - INFO - __main__ - Step 18886: {'lr': 0.00019996238448931913, 'samples': 604352, 'steps': 1180, 'loss/train': 4.6526689529418945} -09/20/2021 18:34:39 - INFO - __main__ - Step 18887: {'lr': 0.00019996238448931913, 'samples': 604384, 'steps': 1180, 'loss/train': 3.3253626823425293} -09/20/2021 18:34:40 - INFO - __main__ - Step 18888: {'lr': 0.00019996238448931913, 'samples': 604416, 'steps': 1180, 'loss/train': 3.0629007816314697} -09/20/2021 18:34:41 - INFO - __main__ - Step 18889: {'lr': 0.00019996238448931913, 'samples': 604448, 'steps': 1180, 'loss/train': 3.460552215576172} -09/20/2021 18:34:41 - INFO - __main__ - Step 18890: {'lr': 0.00019996238448931913, 'samples': 604480, 'steps': 1180, 'loss/train': 5.760092258453369} -09/20/2021 18:34:42 - INFO - __main__ - Step 18891: {'lr': 0.00019996238448931913, 'samples': 604512, 'steps': 1180, 'loss/train': 3.0276753902435303} -09/20/2021 18:34:43 - INFO - __main__ - Step 18892: {'lr': 0.00019996238448931913, 'samples': 604544, 'steps': 1180, 'loss/train': 4.581168174743652} -09/20/2021 18:34:44 - INFO - __main__ - Step 18893: {'lr': 0.00019996238448931913, 'samples': 604576, 'steps': 1180, 'loss/train': 3.2921276092529297} -09/20/2021 18:34:44 - INFO - __main__ - Step 18894: {'lr': 0.00019996238448931913, 'samples': 604608, 'steps': 1180, 'loss/train': 3.3627607822418213} -09/20/2021 18:34:45 - INFO - __main__ - Step 18895: {'lr': 0.00019996238448931913, 'samples': 604640, 'steps': 1180, 'loss/train': 6.378471851348877} -09/20/2021 18:34:46 - INFO - __main__ - Step 18896: {'lr': 0.00019996238448931913, 'samples': 604672, 'steps': 1180, 'loss/train': 4.238912582397461} -09/20/2021 18:34:47 - INFO - __main__ - Step 18897: {'lr': 0.00019996220934105158, 'samples': 604704, 'steps': 1181, 'loss/train': 2.7318813800811768} -09/20/2021 18:34:47 - INFO - __main__ - Step 18898: {'lr': 0.00019996220934105158, 'samples': 604736, 'steps': 1181, 'loss/train': 3.601822853088379} -09/20/2021 18:34:48 - INFO - __main__ - Step 18899: {'lr': 0.00019996220934105158, 'samples': 604768, 'steps': 1181, 'loss/train': 1.4648892879486084} -09/20/2021 18:34:49 - INFO - __main__ - Step 18900: {'lr': 0.00019996220934105158, 'samples': 604800, 'steps': 1181, 'loss/train': 3.089585065841675} -09/20/2021 18:34:50 - INFO - __main__ - Step 18901: {'lr': 0.00019996220934105158, 'samples': 604832, 'steps': 1181, 'loss/train': 4.4645771980285645} -09/20/2021 18:34:50 - INFO - __main__ - Step 18902: {'lr': 0.00019996220934105158, 'samples': 604864, 'steps': 1181, 'loss/train': 1.2194067239761353} -09/20/2021 18:34:51 - INFO - __main__ - Step 18903: {'lr': 0.00019996220934105158, 'samples': 604896, 'steps': 1181, 'loss/train': 2.9813125133514404} -09/20/2021 18:34:52 - INFO - __main__ - Step 18904: {'lr': 0.00019996220934105158, 'samples': 604928, 'steps': 1181, 'loss/train': 4.229942321777344} -09/20/2021 18:34:53 - INFO - __main__ - Step 18905: {'lr': 0.00019996220934105158, 'samples': 604960, 'steps': 1181, 'loss/train': 1.4055763483047485} -09/20/2021 18:34:53 - INFO - __main__ - Step 18906: {'lr': 0.00019996220934105158, 'samples': 604992, 'steps': 1181, 'loss/train': 3.459592819213867} -09/20/2021 18:34:54 - INFO - __main__ - Step 18907: {'lr': 0.00019996220934105158, 'samples': 605024, 'steps': 1181, 'loss/train': 2.164374828338623} -09/20/2021 18:34:55 - INFO - __main__ - Step 18908: {'lr': 0.00019996220934105158, 'samples': 605056, 'steps': 1181, 'loss/train': 3.5530812740325928} -09/20/2021 18:34:56 - INFO - __main__ - Step 18909: {'lr': 0.00019996220934105158, 'samples': 605088, 'steps': 1181, 'loss/train': 3.4817442893981934} -09/20/2021 18:34:56 - INFO - __main__ - Step 18910: {'lr': 0.00019996220934105158, 'samples': 605120, 'steps': 1181, 'loss/train': 2.971407175064087} -09/20/2021 18:34:57 - INFO - __main__ - Step 18911: {'lr': 0.00019996220934105158, 'samples': 605152, 'steps': 1181, 'loss/train': 3.509204149246216} -09/20/2021 18:34:58 - INFO - __main__ - Step 18912: {'lr': 0.00019996220934105158, 'samples': 605184, 'steps': 1181, 'loss/train': 3.488433361053467} -09/20/2021 18:34:59 - INFO - __main__ - Step 18913: {'lr': 0.0001999620337860382, 'samples': 605216, 'steps': 1182, 'loss/train': 4.327686309814453} -09/20/2021 18:35:00 - INFO - __main__ - Step 18914: {'lr': 0.0001999620337860382, 'samples': 605248, 'steps': 1182, 'loss/train': 3.0171642303466797} -09/20/2021 18:35:00 - INFO - __main__ - Step 18915: {'lr': 0.0001999620337860382, 'samples': 605280, 'steps': 1182, 'loss/train': 4.783084869384766} -09/20/2021 18:35:01 - INFO - __main__ - Step 18916: {'lr': 0.0001999620337860382, 'samples': 605312, 'steps': 1182, 'loss/train': 1.2833892107009888} -09/20/2021 18:35:02 - INFO - __main__ - Step 18917: {'lr': 0.0001999620337860382, 'samples': 605344, 'steps': 1182, 'loss/train': 3.1486356258392334} -09/20/2021 18:35:03 - INFO - __main__ - Step 18918: {'lr': 0.0001999620337860382, 'samples': 605376, 'steps': 1182, 'loss/train': 3.62812876701355} -09/20/2021 18:35:04 - INFO - __main__ - Step 18919: {'lr': 0.0001999620337860382, 'samples': 605408, 'steps': 1182, 'loss/train': 3.9382643699645996} -09/20/2021 18:35:05 - INFO - __main__ - Step 18920: {'lr': 0.0001999620337860382, 'samples': 605440, 'steps': 1182, 'loss/train': 4.41104793548584} -09/20/2021 18:35:05 - INFO - __main__ - Step 18921: {'lr': 0.0001999620337860382, 'samples': 605472, 'steps': 1182, 'loss/train': 2.6460394859313965} -09/20/2021 18:35:06 - INFO - __main__ - Step 18922: {'lr': 0.0001999620337860382, 'samples': 605504, 'steps': 1182, 'loss/train': 3.932750701904297} -09/20/2021 18:35:07 - INFO - __main__ - Step 18923: {'lr': 0.0001999620337860382, 'samples': 605536, 'steps': 1182, 'loss/train': 3.2599496841430664} -09/20/2021 18:35:08 - INFO - __main__ - Step 18924: {'lr': 0.0001999620337860382, 'samples': 605568, 'steps': 1182, 'loss/train': 3.91213321685791} -09/20/2021 18:35:08 - INFO - __main__ - Step 18925: {'lr': 0.0001999620337860382, 'samples': 605600, 'steps': 1182, 'loss/train': 3.013498306274414} -09/20/2021 18:35:09 - INFO - __main__ - Step 18926: {'lr': 0.0001999620337860382, 'samples': 605632, 'steps': 1182, 'loss/train': 2.5322139263153076} -09/20/2021 18:35:10 - INFO - __main__ - Step 18927: {'lr': 0.0001999620337860382, 'samples': 605664, 'steps': 1182, 'loss/train': 4.211157321929932} -09/20/2021 18:35:11 - INFO - __main__ - Step 18928: {'lr': 0.0001999620337860382, 'samples': 605696, 'steps': 1182, 'loss/train': 4.514791011810303} -09/20/2021 18:35:11 - INFO - __main__ - Step 18929: {'lr': 0.0001999618578242797, 'samples': 605728, 'steps': 1183, 'loss/train': 3.568020820617676} -09/20/2021 18:35:12 - INFO - __main__ - Step 18930: {'lr': 0.0001999618578242797, 'samples': 605760, 'steps': 1183, 'loss/train': 3.1201820373535156} -09/20/2021 18:35:13 - INFO - __main__ - Step 18931: {'lr': 0.0001999618578242797, 'samples': 605792, 'steps': 1183, 'loss/train': 3.5900826454162598} -09/20/2021 18:35:14 - INFO - __main__ - Step 18932: {'lr': 0.0001999618578242797, 'samples': 605824, 'steps': 1183, 'loss/train': 3.072491407394409} -09/20/2021 18:35:14 - INFO - __main__ - Step 18933: {'lr': 0.0001999618578242797, 'samples': 605856, 'steps': 1183, 'loss/train': 3.298274278640747} -09/20/2021 18:35:15 - INFO - __main__ - Step 18934: {'lr': 0.0001999618578242797, 'samples': 605888, 'steps': 1183, 'loss/train': 3.5910146236419678} -09/20/2021 18:35:16 - INFO - __main__ - Step 18935: {'lr': 0.0001999618578242797, 'samples': 605920, 'steps': 1183, 'loss/train': 3.55230975151062} -09/20/2021 18:35:17 - INFO - __main__ - Step 18936: {'lr': 0.0001999618578242797, 'samples': 605952, 'steps': 1183, 'loss/train': 4.287363529205322} -09/20/2021 18:35:17 - INFO - __main__ - Step 18937: {'lr': 0.0001999618578242797, 'samples': 605984, 'steps': 1183, 'loss/train': 3.383272171020508} -09/20/2021 18:35:18 - INFO - __main__ - Step 18938: {'lr': 0.0001999618578242797, 'samples': 606016, 'steps': 1183, 'loss/train': 3.1824758052825928} -09/20/2021 18:35:19 - INFO - __main__ - Step 18939: {'lr': 0.0001999618578242797, 'samples': 606048, 'steps': 1183, 'loss/train': 1.134689211845398} -09/20/2021 18:35:20 - INFO - __main__ - Step 18940: {'lr': 0.0001999618578242797, 'samples': 606080, 'steps': 1183, 'loss/train': 2.9977571964263916} -09/20/2021 18:35:20 - INFO - __main__ - Step 18941: {'lr': 0.0001999618578242797, 'samples': 606112, 'steps': 1183, 'loss/train': 4.182376384735107} -09/20/2021 18:35:21 - INFO - __main__ - Step 18942: {'lr': 0.0001999618578242797, 'samples': 606144, 'steps': 1183, 'loss/train': 3.1237943172454834} -09/20/2021 18:35:22 - INFO - __main__ - Step 18943: {'lr': 0.0001999618578242797, 'samples': 606176, 'steps': 1183, 'loss/train': 5.642698764801025} -09/20/2021 18:35:23 - INFO - __main__ - Step 18944: {'lr': 0.0001999618578242797, 'samples': 606208, 'steps': 1183, 'loss/train': 4.118870258331299} -09/20/2021 18:35:24 - INFO - __main__ - Step 18945: {'lr': 0.00019996168145577675, 'samples': 606240, 'steps': 1184, 'loss/train': 4.194174766540527} -09/20/2021 18:35:24 - INFO - __main__ - Step 18946: {'lr': 0.00019996168145577675, 'samples': 606272, 'steps': 1184, 'loss/train': 0.6023010611534119} -09/20/2021 18:35:25 - INFO - __main__ - Step 18947: {'lr': 0.00019996168145577675, 'samples': 606304, 'steps': 1184, 'loss/train': 3.4493937492370605} -09/20/2021 18:35:26 - INFO - __main__ - Step 18948: {'lr': 0.00019996168145577675, 'samples': 606336, 'steps': 1184, 'loss/train': 4.179231643676758} -09/20/2021 18:35:27 - INFO - __main__ - Step 18949: {'lr': 0.00019996168145577675, 'samples': 606368, 'steps': 1184, 'loss/train': 2.986191987991333} -09/20/2021 18:35:28 - INFO - __main__ - Step 18950: {'lr': 0.00019996168145577675, 'samples': 606400, 'steps': 1184, 'loss/train': 4.222993850708008} -09/20/2021 18:35:29 - INFO - __main__ - Step 18951: {'lr': 0.00019996168145577675, 'samples': 606432, 'steps': 1184, 'loss/train': 3.0158772468566895} -09/20/2021 18:35:29 - INFO - __main__ - Step 18952: {'lr': 0.00019996168145577675, 'samples': 606464, 'steps': 1184, 'loss/train': 3.085052728652954} -09/20/2021 18:35:30 - INFO - __main__ - Step 18953: {'lr': 0.00019996168145577675, 'samples': 606496, 'steps': 1184, 'loss/train': 3.266456127166748} -09/20/2021 18:35:31 - INFO - __main__ - Step 18954: {'lr': 0.00019996168145577675, 'samples': 606528, 'steps': 1184, 'loss/train': 4.096757888793945} -09/20/2021 18:35:32 - INFO - __main__ - Step 18955: {'lr': 0.00019996168145577675, 'samples': 606560, 'steps': 1184, 'loss/train': 3.3377583026885986} -09/20/2021 18:35:32 - INFO - __main__ - Step 18956: {'lr': 0.00019996168145577675, 'samples': 606592, 'steps': 1184, 'loss/train': 3.9072353839874268} -09/20/2021 18:35:33 - INFO - __main__ - Step 18957: {'lr': 0.00019996168145577675, 'samples': 606624, 'steps': 1184, 'loss/train': 1.1571887731552124} -09/20/2021 18:35:34 - INFO - __main__ - Step 18958: {'lr': 0.00019996168145577675, 'samples': 606656, 'steps': 1184, 'loss/train': 3.8248696327209473} -09/20/2021 18:35:35 - INFO - __main__ - Step 18959: {'lr': 0.00019996168145577675, 'samples': 606688, 'steps': 1184, 'loss/train': 4.47501802444458} -09/20/2021 18:35:35 - INFO - __main__ - Step 18960: {'lr': 0.00019996168145577675, 'samples': 606720, 'steps': 1184, 'loss/train': 2.8672521114349365} -09/20/2021 18:35:36 - INFO - __main__ - Step 18961: {'lr': 0.00019996150468053013, 'samples': 606752, 'steps': 1185, 'loss/train': 3.8781704902648926} -09/20/2021 18:35:37 - INFO - __main__ - Step 18962: {'lr': 0.00019996150468053013, 'samples': 606784, 'steps': 1185, 'loss/train': 3.7993390560150146} -09/20/2021 18:35:38 - INFO - __main__ - Step 18963: {'lr': 0.00019996150468053013, 'samples': 606816, 'steps': 1185, 'loss/train': 5.34214448928833} -09/20/2021 18:35:38 - INFO - __main__ - Step 18964: {'lr': 0.00019996150468053013, 'samples': 606848, 'steps': 1185, 'loss/train': 4.25607442855835} -09/20/2021 18:35:39 - INFO - __main__ - Step 18965: {'lr': 0.00019996150468053013, 'samples': 606880, 'steps': 1185, 'loss/train': 3.249282121658325} -09/20/2021 18:35:40 - INFO - __main__ - Step 18966: {'lr': 0.00019996150468053013, 'samples': 606912, 'steps': 1185, 'loss/train': 2.1035096645355225} -09/20/2021 18:35:41 - INFO - __main__ - Step 18967: {'lr': 0.00019996150468053013, 'samples': 606944, 'steps': 1185, 'loss/train': 2.3813202381134033} -09/20/2021 18:35:41 - INFO - __main__ - Step 18968: {'lr': 0.00019996150468053013, 'samples': 606976, 'steps': 1185, 'loss/train': 4.820702075958252} -09/20/2021 18:35:42 - INFO - __main__ - Step 18969: {'lr': 0.00019996150468053013, 'samples': 607008, 'steps': 1185, 'loss/train': 3.8203279972076416} -09/20/2021 18:35:43 - INFO - __main__ - Step 18970: {'lr': 0.00019996150468053013, 'samples': 607040, 'steps': 1185, 'loss/train': 2.9663753509521484} -09/20/2021 18:35:44 - INFO - __main__ - Step 18971: {'lr': 0.00019996150468053013, 'samples': 607072, 'steps': 1185, 'loss/train': 3.2153446674346924} -09/20/2021 18:35:44 - INFO - __main__ - Step 18972: {'lr': 0.00019996150468053013, 'samples': 607104, 'steps': 1185, 'loss/train': 2.780630111694336} -09/20/2021 18:35:45 - INFO - __main__ - Step 18973: {'lr': 0.00019996150468053013, 'samples': 607136, 'steps': 1185, 'loss/train': 2.549586057662964} -09/20/2021 18:35:46 - INFO - __main__ - Step 18974: {'lr': 0.00019996150468053013, 'samples': 607168, 'steps': 1185, 'loss/train': 3.4058358669281006} -09/20/2021 18:35:47 - INFO - __main__ - Step 18975: {'lr': 0.00019996150468053013, 'samples': 607200, 'steps': 1185, 'loss/train': 3.568582773208618} -09/20/2021 18:35:48 - INFO - __main__ - Step 18976: {'lr': 0.00019996150468053013, 'samples': 607232, 'steps': 1185, 'loss/train': 3.8888142108917236} -09/20/2021 18:35:48 - INFO - __main__ - Step 18977: {'lr': 0.00019996132749854057, 'samples': 607264, 'steps': 1186, 'loss/train': 3.6290740966796875} -09/20/2021 18:35:49 - INFO - __main__ - Step 18978: {'lr': 0.00019996132749854057, 'samples': 607296, 'steps': 1186, 'loss/train': 3.628674030303955} -09/20/2021 18:35:50 - INFO - __main__ - Step 18979: {'lr': 0.00019996132749854057, 'samples': 607328, 'steps': 1186, 'loss/train': 3.0827085971832275} -09/20/2021 18:35:51 - INFO - __main__ - Step 18980: {'lr': 0.00019996132749854057, 'samples': 607360, 'steps': 1186, 'loss/train': 5.1057024002075195} -09/20/2021 18:35:51 - INFO - __main__ - Step 18981: {'lr': 0.00019996132749854057, 'samples': 607392, 'steps': 1186, 'loss/train': 4.083496570587158} -09/20/2021 18:35:53 - INFO - __main__ - Step 18982: {'lr': 0.00019996132749854057, 'samples': 607424, 'steps': 1186, 'loss/train': 3.0328574180603027} -09/20/2021 18:35:54 - INFO - __main__ - Step 18983: {'lr': 0.00019996132749854057, 'samples': 607456, 'steps': 1186, 'loss/train': 4.822084426879883} -09/20/2021 18:35:54 - INFO - __main__ - Step 18984: {'lr': 0.00019996132749854057, 'samples': 607488, 'steps': 1186, 'loss/train': 2.6418628692626953} -09/20/2021 18:35:55 - INFO - __main__ - Step 18985: {'lr': 0.00019996132749854057, 'samples': 607520, 'steps': 1186, 'loss/train': 3.3308472633361816} -09/20/2021 18:35:56 - INFO - __main__ - Step 18986: {'lr': 0.00019996132749854057, 'samples': 607552, 'steps': 1186, 'loss/train': 2.4151504039764404} -09/20/2021 18:35:57 - INFO - __main__ - Step 18987: {'lr': 0.00019996132749854057, 'samples': 607584, 'steps': 1186, 'loss/train': 2.9512641429901123} -09/20/2021 18:35:57 - INFO - __main__ - Step 18988: {'lr': 0.00019996132749854057, 'samples': 607616, 'steps': 1186, 'loss/train': 3.8576927185058594} -09/20/2021 18:35:58 - INFO - __main__ - Step 18989: {'lr': 0.00019996132749854057, 'samples': 607648, 'steps': 1186, 'loss/train': 3.2030768394470215} -09/20/2021 18:35:59 - INFO - __main__ - Step 18990: {'lr': 0.00019996132749854057, 'samples': 607680, 'steps': 1186, 'loss/train': 2.997591495513916} -09/20/2021 18:36:00 - INFO - __main__ - Step 18991: {'lr': 0.00019996132749854057, 'samples': 607712, 'steps': 1186, 'loss/train': 6.239045143127441} -09/20/2021 18:36:00 - INFO - __main__ - Step 18992: {'lr': 0.00019996132749854057, 'samples': 607744, 'steps': 1186, 'loss/train': 6.169841766357422} -09/20/2021 18:36:01 - INFO - __main__ - Step 18993: {'lr': 0.00019996114990980873, 'samples': 607776, 'steps': 1187, 'loss/train': 6.172210216522217} -09/20/2021 18:36:02 - INFO - __main__ - Step 18994: {'lr': 0.00019996114990980873, 'samples': 607808, 'steps': 1187, 'loss/train': 6.119989395141602} -09/20/2021 18:36:03 - INFO - __main__ - Step 18995: {'lr': 0.00019996114990980873, 'samples': 607840, 'steps': 1187, 'loss/train': 6.040223121643066} -09/20/2021 18:36:03 - INFO - __main__ - Step 18996: {'lr': 0.00019996114990980873, 'samples': 607872, 'steps': 1187, 'loss/train': 6.089966773986816} -09/20/2021 18:36:04 - INFO - __main__ - Step 18997: {'lr': 0.00019996114990980873, 'samples': 607904, 'steps': 1187, 'loss/train': 4.439070224761963} -09/20/2021 18:36:05 - INFO - __main__ - Step 18998: {'lr': 0.00019996114990980873, 'samples': 607936, 'steps': 1187, 'loss/train': 3.827878952026367} -09/20/2021 18:36:06 - INFO - __main__ - Step 18999: {'lr': 0.00019996114990980873, 'samples': 607968, 'steps': 1187, 'loss/train': 3.786752223968506} -09/20/2021 18:36:06 - INFO - __main__ - Step 19000: {'lr': 0.00019996114990980873, 'samples': 608000, 'steps': 1187, 'loss/train': 3.8229949474334717} -09/20/2021 18:36:07 - INFO - __main__ - Step 19001: {'lr': 0.00019996114990980873, 'samples': 608032, 'steps': 1187, 'loss/train': 3.010519504547119} -09/20/2021 18:36:08 - INFO - __main__ - Step 19002: {'lr': 0.00019996114990980873, 'samples': 608064, 'steps': 1187, 'loss/train': 3.5837759971618652} -09/20/2021 18:36:09 - INFO - __main__ - Step 19003: {'lr': 0.00019996114990980873, 'samples': 608096, 'steps': 1187, 'loss/train': 3.5242552757263184} -09/20/2021 18:36:09 - INFO - __main__ - Step 19004: {'lr': 0.00019996114990980873, 'samples': 608128, 'steps': 1187, 'loss/train': 4.807629585266113} -09/20/2021 18:36:10 - INFO - __main__ - Step 19005: {'lr': 0.00019996114990980873, 'samples': 608160, 'steps': 1187, 'loss/train': 4.818900108337402} -09/20/2021 18:36:11 - INFO - __main__ - Step 19006: {'lr': 0.00019996114990980873, 'samples': 608192, 'steps': 1187, 'loss/train': 2.786079168319702} -09/20/2021 18:36:12 - INFO - __main__ - Step 19007: {'lr': 0.00019996114990980873, 'samples': 608224, 'steps': 1187, 'loss/train': 3.539224863052368} -09/20/2021 18:36:12 - INFO - __main__ - Step 19008: {'lr': 0.00019996114990980873, 'samples': 608256, 'steps': 1187, 'loss/train': 3.9040939807891846} -09/20/2021 18:36:13 - INFO - __main__ - Step 19009: {'lr': 0.00019996097191433534, 'samples': 608288, 'steps': 1188, 'loss/train': 2.8527638912200928} -09/20/2021 18:36:14 - INFO - __main__ - Step 19010: {'lr': 0.00019996097191433534, 'samples': 608320, 'steps': 1188, 'loss/train': 2.9481892585754395} -09/20/2021 18:36:15 - INFO - __main__ - Step 19011: {'lr': 0.00019996097191433534, 'samples': 608352, 'steps': 1188, 'loss/train': 3.3310232162475586} -09/20/2021 18:36:16 - INFO - __main__ - Step 19012: {'lr': 0.00019996097191433534, 'samples': 608384, 'steps': 1188, 'loss/train': 2.926535129547119} -09/20/2021 18:36:16 - INFO - __main__ - Step 19013: {'lr': 0.00019996097191433534, 'samples': 608416, 'steps': 1188, 'loss/train': 1.5948610305786133} -09/20/2021 18:36:17 - INFO - __main__ - Step 19014: {'lr': 0.00019996097191433534, 'samples': 608448, 'steps': 1188, 'loss/train': 4.143723011016846} -09/20/2021 18:36:18 - INFO - __main__ - Step 19015: {'lr': 0.00019996097191433534, 'samples': 608480, 'steps': 1188, 'loss/train': 3.201181650161743} -09/20/2021 18:36:19 - INFO - __main__ - Step 19016: {'lr': 0.00019996097191433534, 'samples': 608512, 'steps': 1188, 'loss/train': 3.1190338134765625} -09/20/2021 18:36:21 - INFO - __main__ - Step 19017: {'lr': 0.00019996097191433534, 'samples': 608544, 'steps': 1188, 'loss/train': 3.5505049228668213} -09/20/2021 18:36:22 - INFO - __main__ - Step 19018: {'lr': 0.00019996097191433534, 'samples': 608576, 'steps': 1188, 'loss/train': 3.46150803565979} -09/20/2021 18:36:22 - INFO - __main__ - Step 19019: {'lr': 0.00019996097191433534, 'samples': 608608, 'steps': 1188, 'loss/train': 3.069859504699707} -09/20/2021 18:36:23 - INFO - __main__ - Step 19020: {'lr': 0.00019996097191433534, 'samples': 608640, 'steps': 1188, 'loss/train': 4.748352527618408} -09/20/2021 18:36:24 - INFO - __main__ - Step 19021: {'lr': 0.00019996097191433534, 'samples': 608672, 'steps': 1188, 'loss/train': 3.297081708908081} -09/20/2021 18:36:25 - INFO - __main__ - Step 19022: {'lr': 0.00019996097191433534, 'samples': 608704, 'steps': 1188, 'loss/train': 4.368194580078125} -09/20/2021 18:36:25 - INFO - __main__ - Step 19023: {'lr': 0.00019996097191433534, 'samples': 608736, 'steps': 1188, 'loss/train': 2.597449779510498} -09/20/2021 18:36:26 - INFO - __main__ - Step 19024: {'lr': 0.00019996097191433534, 'samples': 608768, 'steps': 1188, 'loss/train': 3.5149173736572266} -09/20/2021 18:36:27 - INFO - __main__ - Step 19025: {'lr': 0.00019996079351212117, 'samples': 608800, 'steps': 1189, 'loss/train': 3.8789894580841064} -09/20/2021 18:36:28 - INFO - __main__ - Step 19026: {'lr': 0.00019996079351212117, 'samples': 608832, 'steps': 1189, 'loss/train': 2.9916627407073975} -09/20/2021 18:36:28 - INFO - __main__ - Step 19027: {'lr': 0.00019996079351212117, 'samples': 608864, 'steps': 1189, 'loss/train': 3.288177251815796} -09/20/2021 18:36:29 - INFO - __main__ - Step 19028: {'lr': 0.00019996079351212117, 'samples': 608896, 'steps': 1189, 'loss/train': 4.428001403808594} -09/20/2021 18:36:30 - INFO - __main__ - Step 19029: {'lr': 0.00019996079351212117, 'samples': 608928, 'steps': 1189, 'loss/train': 3.1937835216522217} -09/20/2021 18:36:31 - INFO - __main__ - Step 19030: {'lr': 0.00019996079351212117, 'samples': 608960, 'steps': 1189, 'loss/train': 4.289855480194092} -09/20/2021 18:36:31 - INFO - __main__ - Step 19031: {'lr': 0.00019996079351212117, 'samples': 608992, 'steps': 1189, 'loss/train': 3.902430534362793} -09/20/2021 18:36:32 - INFO - __main__ - Step 19032: {'lr': 0.00019996079351212117, 'samples': 609024, 'steps': 1189, 'loss/train': 4.864051342010498} -09/20/2021 18:36:33 - INFO - __main__ - Step 19033: {'lr': 0.00019996079351212117, 'samples': 609056, 'steps': 1189, 'loss/train': 4.99590539932251} -09/20/2021 18:36:34 - INFO - __main__ - Step 19034: {'lr': 0.00019996079351212117, 'samples': 609088, 'steps': 1189, 'loss/train': 5.042384147644043} -09/20/2021 18:36:34 - INFO - __main__ - Step 19035: {'lr': 0.00019996079351212117, 'samples': 609120, 'steps': 1189, 'loss/train': 4.828624725341797} -09/20/2021 18:36:35 - INFO - __main__ - Step 19036: {'lr': 0.00019996079351212117, 'samples': 609152, 'steps': 1189, 'loss/train': 4.87543249130249} -09/20/2021 18:36:36 - INFO - __main__ - Step 19037: {'lr': 0.00019996079351212117, 'samples': 609184, 'steps': 1189, 'loss/train': 5.061764717102051} -09/20/2021 18:36:37 - INFO - __main__ - Step 19038: {'lr': 0.00019996079351212117, 'samples': 609216, 'steps': 1189, 'loss/train': 4.837109088897705} -09/20/2021 18:36:37 - INFO - __main__ - Step 19039: {'lr': 0.00019996079351212117, 'samples': 609248, 'steps': 1189, 'loss/train': 4.990221977233887} -09/20/2021 18:36:38 - INFO - __main__ - Step 19040: {'lr': 0.00019996079351212117, 'samples': 609280, 'steps': 1189, 'loss/train': 4.977963924407959} -09/20/2021 18:36:39 - INFO - __main__ - Step 19041: {'lr': 0.0001999606147031669, 'samples': 609312, 'steps': 1190, 'loss/train': 4.072629928588867} -09/20/2021 18:36:40 - INFO - __main__ - Step 19042: {'lr': 0.0001999606147031669, 'samples': 609344, 'steps': 1190, 'loss/train': 3.9556543827056885} -09/20/2021 18:36:41 - INFO - __main__ - Step 19043: {'lr': 0.0001999606147031669, 'samples': 609376, 'steps': 1190, 'loss/train': 4.0537800788879395} -09/20/2021 18:36:41 - INFO - __main__ - Step 19044: {'lr': 0.0001999606147031669, 'samples': 609408, 'steps': 1190, 'loss/train': 4.162479877471924} -09/20/2021 18:36:42 - INFO - __main__ - Step 19045: {'lr': 0.0001999606147031669, 'samples': 609440, 'steps': 1190, 'loss/train': 4.132359504699707} -09/20/2021 18:36:43 - INFO - __main__ - Step 19046: {'lr': 0.0001999606147031669, 'samples': 609472, 'steps': 1190, 'loss/train': 3.332016944885254} -09/20/2021 18:36:44 - INFO - __main__ - Step 19047: {'lr': 0.0001999606147031669, 'samples': 609504, 'steps': 1190, 'loss/train': 3.8444664478302} -09/20/2021 18:36:44 - INFO - __main__ - Step 19048: {'lr': 0.0001999606147031669, 'samples': 609536, 'steps': 1190, 'loss/train': 3.805543899536133} -09/20/2021 18:36:45 - INFO - __main__ - Step 19049: {'lr': 0.0001999606147031669, 'samples': 609568, 'steps': 1190, 'loss/train': 3.6361241340637207} -09/20/2021 18:36:46 - INFO - __main__ - Step 19050: {'lr': 0.0001999606147031669, 'samples': 609600, 'steps': 1190, 'loss/train': 3.8359410762786865} -09/20/2021 18:36:47 - INFO - __main__ - Step 19051: {'lr': 0.0001999606147031669, 'samples': 609632, 'steps': 1190, 'loss/train': 4.8846354484558105} -09/20/2021 18:36:47 - INFO - __main__ - Step 19052: {'lr': 0.0001999606147031669, 'samples': 609664, 'steps': 1190, 'loss/train': 3.7638113498687744} -09/20/2021 18:36:48 - INFO - __main__ - Step 19053: {'lr': 0.0001999606147031669, 'samples': 609696, 'steps': 1190, 'loss/train': 3.7245562076568604} -09/20/2021 18:36:49 - INFO - __main__ - Step 19054: {'lr': 0.0001999606147031669, 'samples': 609728, 'steps': 1190, 'loss/train': 3.7835614681243896} -09/20/2021 18:36:51 - INFO - __main__ - Step 19055: {'lr': 0.0001999606147031669, 'samples': 609760, 'steps': 1190, 'loss/train': 3.4523751735687256} -09/20/2021 18:36:52 - INFO - __main__ - Step 19056: {'lr': 0.0001999606147031669, 'samples': 609792, 'steps': 1190, 'loss/train': 4.195865154266357} -09/20/2021 18:36:53 - INFO - __main__ - Step 19057: {'lr': 0.0001999604354874733, 'samples': 609824, 'steps': 1191, 'loss/train': 3.7966372966766357} -09/20/2021 18:36:53 - INFO - __main__ - Step 19058: {'lr': 0.0001999604354874733, 'samples': 609856, 'steps': 1191, 'loss/train': 2.5802361965179443} -09/20/2021 18:36:54 - INFO - __main__ - Step 19059: {'lr': 0.0001999604354874733, 'samples': 609888, 'steps': 1191, 'loss/train': 3.501713991165161} -09/20/2021 18:36:55 - INFO - __main__ - Step 19060: {'lr': 0.0001999604354874733, 'samples': 609920, 'steps': 1191, 'loss/train': 4.254627704620361} -09/20/2021 18:36:56 - INFO - __main__ - Step 19061: {'lr': 0.0001999604354874733, 'samples': 609952, 'steps': 1191, 'loss/train': 3.9817440509796143} -09/20/2021 18:36:56 - INFO - __main__ - Step 19062: {'lr': 0.0001999604354874733, 'samples': 609984, 'steps': 1191, 'loss/train': 3.4796154499053955} -09/20/2021 18:36:57 - INFO - __main__ - Step 19063: {'lr': 0.0001999604354874733, 'samples': 610016, 'steps': 1191, 'loss/train': 3.8038835525512695} -09/20/2021 18:36:58 - INFO - __main__ - Step 19064: {'lr': 0.0001999604354874733, 'samples': 610048, 'steps': 1191, 'loss/train': 3.5540390014648438} -09/20/2021 18:36:59 - INFO - __main__ - Step 19065: {'lr': 0.0001999604354874733, 'samples': 610080, 'steps': 1191, 'loss/train': 3.7653582096099854} -09/20/2021 18:36:59 - INFO - __main__ - Step 19066: {'lr': 0.0001999604354874733, 'samples': 610112, 'steps': 1191, 'loss/train': 3.02947735786438} -09/20/2021 18:37:00 - INFO - __main__ - Step 19067: {'lr': 0.0001999604354874733, 'samples': 610144, 'steps': 1191, 'loss/train': 4.395866870880127} -09/20/2021 18:37:01 - INFO - __main__ - Step 19068: {'lr': 0.0001999604354874733, 'samples': 610176, 'steps': 1191, 'loss/train': 2.563795804977417} -09/20/2021 18:37:02 - INFO - __main__ - Step 19069: {'lr': 0.0001999604354874733, 'samples': 610208, 'steps': 1191, 'loss/train': 2.5887653827667236} -09/20/2021 18:37:02 - INFO - __main__ - Step 19070: {'lr': 0.0001999604354874733, 'samples': 610240, 'steps': 1191, 'loss/train': 2.327157974243164} -09/20/2021 18:37:03 - INFO - __main__ - Step 19071: {'lr': 0.0001999604354874733, 'samples': 610272, 'steps': 1191, 'loss/train': 2.3678767681121826} -09/20/2021 18:37:04 - INFO - __main__ - Step 19072: {'lr': 0.0001999604354874733, 'samples': 610304, 'steps': 1191, 'loss/train': 2.349076271057129} -09/20/2021 18:37:05 - INFO - __main__ - Step 19073: {'lr': 0.00019996025586504104, 'samples': 610336, 'steps': 1192, 'loss/train': 2.699310779571533} -09/20/2021 18:37:05 - INFO - __main__ - Step 19074: {'lr': 0.00019996025586504104, 'samples': 610368, 'steps': 1192, 'loss/train': 2.019325017929077} -09/20/2021 18:37:06 - INFO - __main__ - Step 19075: {'lr': 0.00019996025586504104, 'samples': 610400, 'steps': 1192, 'loss/train': 2.8768742084503174} -09/20/2021 18:37:07 - INFO - __main__ - Step 19076: {'lr': 0.00019996025586504104, 'samples': 610432, 'steps': 1192, 'loss/train': 2.0692598819732666} -09/20/2021 18:37:08 - INFO - __main__ - Step 19077: {'lr': 0.00019996025586504104, 'samples': 610464, 'steps': 1192, 'loss/train': 2.535762071609497} -09/20/2021 18:37:08 - INFO - __main__ - Step 19078: {'lr': 0.00019996025586504104, 'samples': 610496, 'steps': 1192, 'loss/train': 3.465489387512207} -09/20/2021 18:37:09 - INFO - __main__ - Step 19079: {'lr': 0.00019996025586504104, 'samples': 610528, 'steps': 1192, 'loss/train': 3.080934762954712} -09/20/2021 18:37:10 - INFO - __main__ - Step 19080: {'lr': 0.00019996025586504104, 'samples': 610560, 'steps': 1192, 'loss/train': 3.5745997428894043} -09/20/2021 18:37:11 - INFO - __main__ - Step 19081: {'lr': 0.00019996025586504104, 'samples': 610592, 'steps': 1192, 'loss/train': 3.7538628578186035} -09/20/2021 18:37:11 - INFO - __main__ - Step 19082: {'lr': 0.00019996025586504104, 'samples': 610624, 'steps': 1192, 'loss/train': 3.6636908054351807} -09/20/2021 18:37:12 - INFO - __main__ - Step 19083: {'lr': 0.00019996025586504104, 'samples': 610656, 'steps': 1192, 'loss/train': 2.0260698795318604} -09/20/2021 18:37:13 - INFO - __main__ - Step 19084: {'lr': 0.00019996025586504104, 'samples': 610688, 'steps': 1192, 'loss/train': 3.1678762435913086} -09/20/2021 18:37:14 - INFO - __main__ - Step 19085: {'lr': 0.00019996025586504104, 'samples': 610720, 'steps': 1192, 'loss/train': 5.14288330078125} -09/20/2021 18:37:14 - INFO - __main__ - Step 19086: {'lr': 0.00019996025586504104, 'samples': 610752, 'steps': 1192, 'loss/train': 3.9685299396514893} -09/20/2021 18:37:15 - INFO - __main__ - Step 19087: {'lr': 0.00019996025586504104, 'samples': 610784, 'steps': 1192, 'loss/train': 4.017305374145508} -09/20/2021 18:37:16 - INFO - __main__ - Step 19088: {'lr': 0.00019996025586504104, 'samples': 610816, 'steps': 1192, 'loss/train': 3.2864768505096436} -09/20/2021 18:37:17 - INFO - __main__ - Step 19089: {'lr': 0.0001999600758358709, 'samples': 610848, 'steps': 1193, 'loss/train': 4.33745813369751} -09/20/2021 18:37:18 - INFO - __main__ - Step 19090: {'lr': 0.0001999600758358709, 'samples': 610880, 'steps': 1193, 'loss/train': 3.5942955017089844} -09/20/2021 18:37:19 - INFO - __main__ - Step 19091: {'lr': 0.0001999600758358709, 'samples': 610912, 'steps': 1193, 'loss/train': 3.631129503250122} -09/20/2021 18:37:20 - INFO - __main__ - Step 19092: {'lr': 0.0001999600758358709, 'samples': 610944, 'steps': 1193, 'loss/train': 3.244305372238159} -09/20/2021 18:37:20 - INFO - __main__ - Step 19093: {'lr': 0.0001999600758358709, 'samples': 610976, 'steps': 1193, 'loss/train': 3.5742011070251465} -09/20/2021 18:37:21 - INFO - __main__ - Step 19094: {'lr': 0.0001999600758358709, 'samples': 611008, 'steps': 1193, 'loss/train': 3.446303129196167} -09/20/2021 18:37:22 - INFO - __main__ - Step 19095: {'lr': 0.0001999600758358709, 'samples': 611040, 'steps': 1193, 'loss/train': 3.3510570526123047} -09/20/2021 18:37:23 - INFO - __main__ - Step 19096: {'lr': 0.0001999600758358709, 'samples': 611072, 'steps': 1193, 'loss/train': 4.020874977111816} -09/20/2021 18:37:23 - INFO - __main__ - Step 19097: {'lr': 0.0001999600758358709, 'samples': 611104, 'steps': 1193, 'loss/train': 3.613814353942871} -09/20/2021 18:37:24 - INFO - __main__ - Step 19098: {'lr': 0.0001999600758358709, 'samples': 611136, 'steps': 1193, 'loss/train': 4.347945213317871} -09/20/2021 18:37:25 - INFO - __main__ - Step 19099: {'lr': 0.0001999600758358709, 'samples': 611168, 'steps': 1193, 'loss/train': 3.5623953342437744} -09/20/2021 18:37:26 - INFO - __main__ - Step 19100: {'lr': 0.0001999600758358709, 'samples': 611200, 'steps': 1193, 'loss/train': 1.842421531677246} -09/20/2021 18:37:26 - INFO - __main__ - Step 19101: {'lr': 0.0001999600758358709, 'samples': 611232, 'steps': 1193, 'loss/train': 3.009383201599121} -09/20/2021 18:37:27 - INFO - __main__ - Step 19102: {'lr': 0.0001999600758358709, 'samples': 611264, 'steps': 1193, 'loss/train': 3.2641751766204834} -09/20/2021 18:37:28 - INFO - __main__ - Step 19103: {'lr': 0.0001999600758358709, 'samples': 611296, 'steps': 1193, 'loss/train': 3.6714110374450684} -09/20/2021 18:37:29 - INFO - __main__ - Step 19104: {'lr': 0.0001999600758358709, 'samples': 611328, 'steps': 1193, 'loss/train': 3.6073522567749023} -09/20/2021 18:37:30 - INFO - __main__ - Step 19105: {'lr': 0.0001999598953999636, 'samples': 611360, 'steps': 1194, 'loss/train': 4.970515251159668} -09/20/2021 18:37:30 - INFO - __main__ - Step 19106: {'lr': 0.0001999598953999636, 'samples': 611392, 'steps': 1194, 'loss/train': 3.308155059814453} -09/20/2021 18:37:31 - INFO - __main__ - Step 19107: {'lr': 0.0001999598953999636, 'samples': 611424, 'steps': 1194, 'loss/train': 3.4095497131347656} -09/20/2021 18:37:32 - INFO - __main__ - Step 19108: {'lr': 0.0001999598953999636, 'samples': 611456, 'steps': 1194, 'loss/train': 3.486515998840332} -09/20/2021 18:37:33 - INFO - __main__ - Step 19109: {'lr': 0.0001999598953999636, 'samples': 611488, 'steps': 1194, 'loss/train': 4.09287166595459} -09/20/2021 18:37:33 - INFO - __main__ - Step 19110: {'lr': 0.0001999598953999636, 'samples': 611520, 'steps': 1194, 'loss/train': 6.275753498077393} -09/20/2021 18:37:34 - INFO - __main__ - Step 19111: {'lr': 0.0001999598953999636, 'samples': 611552, 'steps': 1194, 'loss/train': 3.4629313945770264} -09/20/2021 18:37:35 - INFO - __main__ - Step 19112: {'lr': 0.0001999598953999636, 'samples': 611584, 'steps': 1194, 'loss/train': 3.507892370223999} -09/20/2021 18:37:36 - INFO - __main__ - Step 19113: {'lr': 0.0001999598953999636, 'samples': 611616, 'steps': 1194, 'loss/train': 3.6643996238708496} -09/20/2021 18:37:36 - INFO - __main__ - Step 19114: {'lr': 0.0001999598953999636, 'samples': 611648, 'steps': 1194, 'loss/train': 4.857094764709473} -09/20/2021 18:37:37 - INFO - __main__ - Step 19115: {'lr': 0.0001999598953999636, 'samples': 611680, 'steps': 1194, 'loss/train': 4.401925086975098} -09/20/2021 18:37:38 - INFO - __main__ - Step 19116: {'lr': 0.0001999598953999636, 'samples': 611712, 'steps': 1194, 'loss/train': 3.1438591480255127} -09/20/2021 18:37:39 - INFO - __main__ - Step 19117: {'lr': 0.0001999598953999636, 'samples': 611744, 'steps': 1194, 'loss/train': 3.6435601711273193} -09/20/2021 18:37:39 - INFO - __main__ - Step 19118: {'lr': 0.0001999598953999636, 'samples': 611776, 'steps': 1194, 'loss/train': 3.262477159500122} -09/20/2021 18:37:40 - INFO - __main__ - Step 19119: {'lr': 0.0001999598953999636, 'samples': 611808, 'steps': 1194, 'loss/train': 2.65578031539917} -09/20/2021 18:37:41 - INFO - __main__ - Step 19120: {'lr': 0.0001999598953999636, 'samples': 611840, 'steps': 1194, 'loss/train': 4.163980484008789} -09/20/2021 18:37:43 - INFO - __main__ - Step 19121: {'lr': 0.0001999597145573199, 'samples': 611872, 'steps': 1195, 'loss/train': 3.2983014583587646} -09/20/2021 18:37:43 - INFO - __main__ - Step 19122: {'lr': 0.0001999597145573199, 'samples': 611904, 'steps': 1195, 'loss/train': 0.602772057056427} -09/20/2021 18:37:44 - INFO - __main__ - Step 19123: {'lr': 0.0001999597145573199, 'samples': 611936, 'steps': 1195, 'loss/train': 0.606619119644165} -09/20/2021 18:37:45 - INFO - __main__ - Step 19124: {'lr': 0.0001999597145573199, 'samples': 611968, 'steps': 1195, 'loss/train': 2.9139864444732666} -09/20/2021 18:37:46 - INFO - __main__ - Step 19125: {'lr': 0.0001999597145573199, 'samples': 612000, 'steps': 1195, 'loss/train': 3.352121591567993} -09/20/2021 18:37:46 - INFO - __main__ - Step 19126: {'lr': 0.0001999597145573199, 'samples': 612032, 'steps': 1195, 'loss/train': 3.3677210807800293} -09/20/2021 18:37:47 - INFO - __main__ - Step 19127: {'lr': 0.0001999597145573199, 'samples': 612064, 'steps': 1195, 'loss/train': 3.910414934158325} -09/20/2021 18:37:48 - INFO - __main__ - Step 19128: {'lr': 0.0001999597145573199, 'samples': 612096, 'steps': 1195, 'loss/train': 3.343578815460205} -09/20/2021 18:37:49 - INFO - __main__ - Step 19129: {'lr': 0.0001999597145573199, 'samples': 612128, 'steps': 1195, 'loss/train': 2.8524138927459717} -09/20/2021 18:37:49 - INFO - __main__ - Step 19130: {'lr': 0.0001999597145573199, 'samples': 612160, 'steps': 1195, 'loss/train': 3.3696939945220947} -09/20/2021 18:37:50 - INFO - __main__ - Step 19131: {'lr': 0.0001999597145573199, 'samples': 612192, 'steps': 1195, 'loss/train': 2.8972301483154297} -09/20/2021 18:37:51 - INFO - __main__ - Step 19132: {'lr': 0.0001999597145573199, 'samples': 612224, 'steps': 1195, 'loss/train': 2.9164271354675293} -09/20/2021 18:37:52 - INFO - __main__ - Step 19133: {'lr': 0.0001999597145573199, 'samples': 612256, 'steps': 1195, 'loss/train': 3.2598254680633545} -09/20/2021 18:37:52 - INFO - __main__ - Step 19134: {'lr': 0.0001999597145573199, 'samples': 612288, 'steps': 1195, 'loss/train': 3.5868215560913086} -09/20/2021 18:37:53 - INFO - __main__ - Step 19135: {'lr': 0.0001999597145573199, 'samples': 612320, 'steps': 1195, 'loss/train': 3.465998888015747} -09/20/2021 18:37:54 - INFO - __main__ - Step 19136: {'lr': 0.0001999597145573199, 'samples': 612352, 'steps': 1195, 'loss/train': 3.11142635345459} -09/20/2021 18:37:55 - INFO - __main__ - Step 19137: {'lr': 0.0001999595333079405, 'samples': 612384, 'steps': 1196, 'loss/train': 4.135087013244629} -09/20/2021 18:37:55 - INFO - __main__ - Step 19138: {'lr': 0.0001999595333079405, 'samples': 612416, 'steps': 1196, 'loss/train': 3.457090377807617} -09/20/2021 18:37:56 - INFO - __main__ - Step 19139: {'lr': 0.0001999595333079405, 'samples': 612448, 'steps': 1196, 'loss/train': 3.3947255611419678} -09/20/2021 18:37:57 - INFO - __main__ - Step 19140: {'lr': 0.0001999595333079405, 'samples': 612480, 'steps': 1196, 'loss/train': 3.030759572982788} -09/20/2021 18:37:58 - INFO - __main__ - Step 19141: {'lr': 0.0001999595333079405, 'samples': 612512, 'steps': 1196, 'loss/train': 3.5815417766571045} -09/20/2021 18:37:58 - INFO - __main__ - Step 19142: {'lr': 0.0001999595333079405, 'samples': 612544, 'steps': 1196, 'loss/train': 3.7855112552642822} -09/20/2021 18:37:59 - INFO - __main__ - Step 19143: {'lr': 0.0001999595333079405, 'samples': 612576, 'steps': 1196, 'loss/train': 5.329689979553223} -09/20/2021 18:38:00 - INFO - __main__ - Step 19144: {'lr': 0.0001999595333079405, 'samples': 612608, 'steps': 1196, 'loss/train': 3.9516918659210205} -09/20/2021 18:38:01 - INFO - __main__ - Step 19145: {'lr': 0.0001999595333079405, 'samples': 612640, 'steps': 1196, 'loss/train': 3.2326345443725586} -09/20/2021 18:38:01 - INFO - __main__ - Step 19146: {'lr': 0.0001999595333079405, 'samples': 612672, 'steps': 1196, 'loss/train': 3.5753469467163086} -09/20/2021 18:38:02 - INFO - __main__ - Step 19147: {'lr': 0.0001999595333079405, 'samples': 612704, 'steps': 1196, 'loss/train': 3.156254529953003} -09/20/2021 18:38:03 - INFO - __main__ - Step 19148: {'lr': 0.0001999595333079405, 'samples': 612736, 'steps': 1196, 'loss/train': 4.028494358062744} -09/20/2021 18:38:04 - INFO - __main__ - Step 19149: {'lr': 0.0001999595333079405, 'samples': 612768, 'steps': 1196, 'loss/train': 3.409052848815918} -09/20/2021 18:38:04 - INFO - __main__ - Step 19150: {'lr': 0.0001999595333079405, 'samples': 612800, 'steps': 1196, 'loss/train': 3.8634417057037354} -09/20/2021 18:38:05 - INFO - __main__ - Step 19151: {'lr': 0.0001999595333079405, 'samples': 612832, 'steps': 1196, 'loss/train': 3.332430601119995} -09/20/2021 18:38:06 - INFO - __main__ - Step 19152: {'lr': 0.0001999595333079405, 'samples': 612864, 'steps': 1196, 'loss/train': 3.263824701309204} -09/20/2021 18:38:07 - INFO - __main__ - Step 19153: {'lr': 0.0001999593516518261, 'samples': 612896, 'steps': 1197, 'loss/train': 2.9956626892089844} -09/20/2021 18:38:08 - INFO - __main__ - Step 19154: {'lr': 0.0001999593516518261, 'samples': 612928, 'steps': 1197, 'loss/train': 0.5312394499778748} -09/20/2021 18:38:08 - INFO - __main__ - Step 19155: {'lr': 0.0001999593516518261, 'samples': 612960, 'steps': 1197, 'loss/train': 0.4889414608478546} -09/20/2021 18:38:09 - INFO - __main__ - Step 19156: {'lr': 0.0001999593516518261, 'samples': 612992, 'steps': 1197, 'loss/train': 3.364866256713867} -09/20/2021 18:38:10 - INFO - __main__ - Step 19157: {'lr': 0.0001999593516518261, 'samples': 613024, 'steps': 1197, 'loss/train': 3.4568428993225098} -09/20/2021 18:38:11 - INFO - __main__ - Step 19158: {'lr': 0.0001999593516518261, 'samples': 613056, 'steps': 1197, 'loss/train': 3.4141340255737305} -09/20/2021 18:38:12 - INFO - __main__ - Step 19159: {'lr': 0.0001999593516518261, 'samples': 613088, 'steps': 1197, 'loss/train': 4.1227335929870605} -09/20/2021 18:38:13 - INFO - __main__ - Step 19160: {'lr': 0.0001999593516518261, 'samples': 613120, 'steps': 1197, 'loss/train': 4.4154510498046875} -09/20/2021 18:38:13 - INFO - __main__ - Step 19161: {'lr': 0.0001999593516518261, 'samples': 613152, 'steps': 1197, 'loss/train': 2.581958055496216} -09/20/2021 18:38:14 - INFO - __main__ - Step 19162: {'lr': 0.0001999593516518261, 'samples': 613184, 'steps': 1197, 'loss/train': 3.6763479709625244} -09/20/2021 18:38:15 - INFO - __main__ - Step 19163: {'lr': 0.0001999593516518261, 'samples': 613216, 'steps': 1197, 'loss/train': 2.8598814010620117} -09/20/2021 18:38:16 - INFO - __main__ - Step 19164: {'lr': 0.0001999593516518261, 'samples': 613248, 'steps': 1197, 'loss/train': 3.7867250442504883} -09/20/2021 18:38:16 - INFO - __main__ - Step 19165: {'lr': 0.0001999593516518261, 'samples': 613280, 'steps': 1197, 'loss/train': 2.9453132152557373} -09/20/2021 18:38:17 - INFO - __main__ - Step 19166: {'lr': 0.0001999593516518261, 'samples': 613312, 'steps': 1197, 'loss/train': 2.6567695140838623} -09/20/2021 18:38:18 - INFO - __main__ - Step 19167: {'lr': 0.0001999593516518261, 'samples': 613344, 'steps': 1197, 'loss/train': 3.2889907360076904} -09/20/2021 18:38:19 - INFO - __main__ - Step 19168: {'lr': 0.0001999593516518261, 'samples': 613376, 'steps': 1197, 'loss/train': 2.8789710998535156} -09/20/2021 18:38:20 - INFO - __main__ - Step 19169: {'lr': 0.00019995916958897753, 'samples': 613408, 'steps': 1198, 'loss/train': 3.957953453063965} -09/20/2021 18:38:20 - INFO - __main__ - Step 19170: {'lr': 0.00019995916958897753, 'samples': 613440, 'steps': 1198, 'loss/train': 3.079423666000366} -09/20/2021 18:38:21 - INFO - __main__ - Step 19171: {'lr': 0.00019995916958897753, 'samples': 613472, 'steps': 1198, 'loss/train': 4.559813976287842} -09/20/2021 18:38:22 - INFO - __main__ - Step 19172: {'lr': 0.00019995916958897753, 'samples': 613504, 'steps': 1198, 'loss/train': 3.431095838546753} -09/20/2021 18:38:23 - INFO - __main__ - Step 19173: {'lr': 0.00019995916958897753, 'samples': 613536, 'steps': 1198, 'loss/train': 3.262009620666504} -09/20/2021 18:38:23 - INFO - __main__ - Step 19174: {'lr': 0.00019995916958897753, 'samples': 613568, 'steps': 1198, 'loss/train': 4.813011169433594} -09/20/2021 18:38:24 - INFO - __main__ - Step 19175: {'lr': 0.00019995916958897753, 'samples': 613600, 'steps': 1198, 'loss/train': 4.1044511795043945} -09/20/2021 18:38:25 - INFO - __main__ - Step 19176: {'lr': 0.00019995916958897753, 'samples': 613632, 'steps': 1198, 'loss/train': 3.345332384109497} -09/20/2021 18:38:26 - INFO - __main__ - Step 19177: {'lr': 0.00019995916958897753, 'samples': 613664, 'steps': 1198, 'loss/train': 3.702016592025757} -09/20/2021 18:38:26 - INFO - __main__ - Step 19178: {'lr': 0.00019995916958897753, 'samples': 613696, 'steps': 1198, 'loss/train': 3.9946422576904297} -09/20/2021 18:38:27 - INFO - __main__ - Step 19179: {'lr': 0.00019995916958897753, 'samples': 613728, 'steps': 1198, 'loss/train': 3.229782819747925} -09/20/2021 18:38:28 - INFO - __main__ - Step 19180: {'lr': 0.00019995916958897753, 'samples': 613760, 'steps': 1198, 'loss/train': 3.0886483192443848} -09/20/2021 18:38:29 - INFO - __main__ - Step 19181: {'lr': 0.00019995916958897753, 'samples': 613792, 'steps': 1198, 'loss/train': 3.4789202213287354} -09/20/2021 18:38:29 - INFO - __main__ - Step 19182: {'lr': 0.00019995916958897753, 'samples': 613824, 'steps': 1198, 'loss/train': 3.4508323669433594} -09/20/2021 18:38:30 - INFO - __main__ - Step 19183: {'lr': 0.00019995916958897753, 'samples': 613856, 'steps': 1198, 'loss/train': 3.7695350646972656} -09/20/2021 18:38:31 - INFO - __main__ - Step 19184: {'lr': 0.00019995916958897753, 'samples': 613888, 'steps': 1198, 'loss/train': 3.9574649333953857} -09/20/2021 18:38:32 - INFO - __main__ - Step 19185: {'lr': 0.0001999589871193955, 'samples': 613920, 'steps': 1199, 'loss/train': 2.4167513847351074} -09/20/2021 18:38:32 - INFO - __main__ - Step 19186: {'lr': 0.0001999589871193955, 'samples': 613952, 'steps': 1199, 'loss/train': 3.6882197856903076} -09/20/2021 18:38:33 - INFO - __main__ - Step 19187: {'lr': 0.0001999589871193955, 'samples': 613984, 'steps': 1199, 'loss/train': 3.2069857120513916} -09/20/2021 18:38:35 - INFO - __main__ - Step 19188: {'lr': 0.0001999589871193955, 'samples': 614016, 'steps': 1199, 'loss/train': 3.539499282836914} -09/20/2021 18:38:35 - INFO - __main__ - Step 19189: {'lr': 0.0001999589871193955, 'samples': 614048, 'steps': 1199, 'loss/train': 5.241335868835449} -09/20/2021 18:38:36 - INFO - __main__ - Step 19190: {'lr': 0.0001999589871193955, 'samples': 614080, 'steps': 1199, 'loss/train': 5.064855575561523} -09/20/2021 18:38:37 - INFO - __main__ - Step 19191: {'lr': 0.0001999589871193955, 'samples': 614112, 'steps': 1199, 'loss/train': 3.168834924697876} -09/20/2021 18:38:38 - INFO - __main__ - Step 19192: {'lr': 0.0001999589871193955, 'samples': 614144, 'steps': 1199, 'loss/train': 5.5842671394348145} -09/20/2021 18:38:38 - INFO - __main__ - Step 19193: {'lr': 0.0001999589871193955, 'samples': 614176, 'steps': 1199, 'loss/train': 3.9817452430725098} -09/20/2021 18:38:39 - INFO - __main__ - Step 19194: {'lr': 0.0001999589871193955, 'samples': 614208, 'steps': 1199, 'loss/train': 4.033526420593262} -09/20/2021 18:38:40 - INFO - __main__ - Step 19195: {'lr': 0.0001999589871193955, 'samples': 614240, 'steps': 1199, 'loss/train': 3.0566177368164062} -09/20/2021 18:38:41 - INFO - __main__ - Step 19196: {'lr': 0.0001999589871193955, 'samples': 614272, 'steps': 1199, 'loss/train': 4.531709671020508} -09/20/2021 18:38:41 - INFO - __main__ - Step 19197: {'lr': 0.0001999589871193955, 'samples': 614304, 'steps': 1199, 'loss/train': 4.6003618240356445} -09/20/2021 18:38:42 - INFO - __main__ - Step 19198: {'lr': 0.0001999589871193955, 'samples': 614336, 'steps': 1199, 'loss/train': 3.806781053543091} -09/20/2021 18:38:43 - INFO - __main__ - Step 19199: {'lr': 0.0001999589871193955, 'samples': 614368, 'steps': 1199, 'loss/train': 2.956047296524048} -09/20/2021 18:38:44 - INFO - __main__ - Step 19200: {'lr': 0.0001999589871193955, 'samples': 614400, 'steps': 1199, 'loss/train': 3.7693073749542236} -09/20/2021 18:38:44 - INFO - __main__ - Step 19201: {'lr': 0.00019995880424308071, 'samples': 614432, 'steps': 1200, 'loss/train': 0.7607395648956299} -09/20/2021 18:38:45 - INFO - __main__ - Step 19202: {'lr': 0.00019995880424308071, 'samples': 614464, 'steps': 1200, 'loss/train': 3.6651434898376465} -09/20/2021 18:38:46 - INFO - __main__ - Step 19203: {'lr': 0.00019995880424308071, 'samples': 614496, 'steps': 1200, 'loss/train': 2.7604386806488037} -09/20/2021 18:38:47 - INFO - __main__ - Step 19204: {'lr': 0.00019995880424308071, 'samples': 614528, 'steps': 1200, 'loss/train': 5.463493824005127} -09/20/2021 18:38:47 - INFO - __main__ - Step 19205: {'lr': 0.00019995880424308071, 'samples': 614560, 'steps': 1200, 'loss/train': 5.777066707611084} -09/20/2021 18:38:48 - INFO - __main__ - Step 19206: {'lr': 0.00019995880424308071, 'samples': 614592, 'steps': 1200, 'loss/train': 2.6836142539978027} -09/20/2021 18:38:49 - INFO - __main__ - Step 19207: {'lr': 0.00019995880424308071, 'samples': 614624, 'steps': 1200, 'loss/train': 3.903914451599121} -09/20/2021 18:38:50 - INFO - __main__ - Step 19208: {'lr': 0.00019995880424308071, 'samples': 614656, 'steps': 1200, 'loss/train': 3.0247902870178223} -09/20/2021 18:38:50 - INFO - __main__ - Step 19209: {'lr': 0.00019995880424308071, 'samples': 614688, 'steps': 1200, 'loss/train': 3.6992673873901367} -09/20/2021 18:38:51 - INFO - __main__ - Step 19210: {'lr': 0.00019995880424308071, 'samples': 614720, 'steps': 1200, 'loss/train': 5.22991418838501} -09/20/2021 18:38:52 - INFO - __main__ - Step 19211: {'lr': 0.00019995880424308071, 'samples': 614752, 'steps': 1200, 'loss/train': 4.194723129272461} -09/20/2021 18:38:53 - INFO - __main__ - Step 19212: {'lr': 0.00019995880424308071, 'samples': 614784, 'steps': 1200, 'loss/train': 3.439162492752075} -09/20/2021 18:38:53 - INFO - __main__ - Step 19213: {'lr': 0.00019995880424308071, 'samples': 614816, 'steps': 1200, 'loss/train': 2.958280563354492} -09/20/2021 18:38:54 - INFO - __main__ - Step 19214: {'lr': 0.00019995880424308071, 'samples': 614848, 'steps': 1200, 'loss/train': 3.645613670349121} -09/20/2021 18:38:55 - INFO - __main__ - Step 19215: {'lr': 0.00019995880424308071, 'samples': 614880, 'steps': 1200, 'loss/train': 2.9533884525299072} -09/20/2021 18:38:56 - INFO - __main__ - Step 19216: {'lr': 0.00019995880424308071, 'samples': 614912, 'steps': 1200, 'loss/train': 0.43332064151763916} -09/20/2021 18:38:57 - INFO - __main__ - Step 19217: {'lr': 0.00019995862096003393, 'samples': 614944, 'steps': 1201, 'loss/train': 0.7646106481552124} -09/20/2021 18:38:58 - INFO - __main__ - Step 19218: {'lr': 0.00019995862096003393, 'samples': 614976, 'steps': 1201, 'loss/train': 0.5429400205612183} -09/20/2021 18:38:59 - INFO - __main__ - Step 19219: {'lr': 0.00019995862096003393, 'samples': 615008, 'steps': 1201, 'loss/train': 0.503043532371521} -09/20/2021 18:39:00 - INFO - __main__ - Step 19220: {'lr': 0.00019995862096003393, 'samples': 615040, 'steps': 1201, 'loss/train': 4.23723030090332} -09/20/2021 18:39:00 - INFO - __main__ - Step 19221: {'lr': 0.00019995862096003393, 'samples': 615072, 'steps': 1201, 'loss/train': 3.1006550788879395} -09/20/2021 18:39:01 - INFO - __main__ - Step 19222: {'lr': 0.00019995862096003393, 'samples': 615104, 'steps': 1201, 'loss/train': 2.7428457736968994} -09/20/2021 18:39:02 - INFO - __main__ - Step 19223: {'lr': 0.00019995862096003393, 'samples': 615136, 'steps': 1201, 'loss/train': 3.1006126403808594} -09/20/2021 18:39:03 - INFO - __main__ - Step 19224: {'lr': 0.00019995862096003393, 'samples': 615168, 'steps': 1201, 'loss/train': 3.3382678031921387} -09/20/2021 18:39:03 - INFO - __main__ - Step 19225: {'lr': 0.00019995862096003393, 'samples': 615200, 'steps': 1201, 'loss/train': 3.7517247200012207} -09/20/2021 18:39:04 - INFO - __main__ - Step 19226: {'lr': 0.00019995862096003393, 'samples': 615232, 'steps': 1201, 'loss/train': 3.9543747901916504} -09/20/2021 18:39:05 - INFO - __main__ - Step 19227: {'lr': 0.00019995862096003393, 'samples': 615264, 'steps': 1201, 'loss/train': 4.0394697189331055} -09/20/2021 18:39:06 - INFO - __main__ - Step 19228: {'lr': 0.00019995862096003393, 'samples': 615296, 'steps': 1201, 'loss/train': 3.832472324371338} -09/20/2021 18:39:06 - INFO - __main__ - Step 19229: {'lr': 0.00019995862096003393, 'samples': 615328, 'steps': 1201, 'loss/train': 3.896848201751709} -09/20/2021 18:39:07 - INFO - __main__ - Step 19230: {'lr': 0.00019995862096003393, 'samples': 615360, 'steps': 1201, 'loss/train': 4.48006010055542} -09/20/2021 18:39:08 - INFO - __main__ - Step 19231: {'lr': 0.00019995862096003393, 'samples': 615392, 'steps': 1201, 'loss/train': 1.57671058177948} -09/20/2021 18:39:09 - INFO - __main__ - Step 19232: {'lr': 0.00019995862096003393, 'samples': 615424, 'steps': 1201, 'loss/train': 3.3769943714141846} -09/20/2021 18:39:09 - INFO - __main__ - Step 19233: {'lr': 0.00019995843727025592, 'samples': 615456, 'steps': 1202, 'loss/train': 3.8376779556274414} -09/20/2021 18:39:10 - INFO - __main__ - Step 19234: {'lr': 0.00019995843727025592, 'samples': 615488, 'steps': 1202, 'loss/train': 3.189504861831665} -09/20/2021 18:39:11 - INFO - __main__ - Step 19235: {'lr': 0.00019995843727025592, 'samples': 615520, 'steps': 1202, 'loss/train': 3.41841197013855} -09/20/2021 18:39:12 - INFO - __main__ - Step 19236: {'lr': 0.00019995843727025592, 'samples': 615552, 'steps': 1202, 'loss/train': 3.9330410957336426} -09/20/2021 18:39:12 - INFO - __main__ - Step 19237: {'lr': 0.00019995843727025592, 'samples': 615584, 'steps': 1202, 'loss/train': 3.667433977127075} -09/20/2021 18:39:13 - INFO - __main__ - Step 19238: {'lr': 0.00019995843727025592, 'samples': 615616, 'steps': 1202, 'loss/train': 2.8731470108032227} -09/20/2021 18:39:14 - INFO - __main__ - Step 19239: {'lr': 0.00019995843727025592, 'samples': 615648, 'steps': 1202, 'loss/train': 3.1378629207611084} -09/20/2021 18:39:15 - INFO - __main__ - Step 19240: {'lr': 0.00019995843727025592, 'samples': 615680, 'steps': 1202, 'loss/train': 3.109947919845581} -09/20/2021 18:39:15 - INFO - __main__ - Step 19241: {'lr': 0.00019995843727025592, 'samples': 615712, 'steps': 1202, 'loss/train': 4.444720268249512} -09/20/2021 18:39:16 - INFO - __main__ - Step 19242: {'lr': 0.00019995843727025592, 'samples': 615744, 'steps': 1202, 'loss/train': 3.150928258895874} -09/20/2021 18:39:17 - INFO - __main__ - Step 19243: {'lr': 0.00019995843727025592, 'samples': 615776, 'steps': 1202, 'loss/train': 3.6190433502197266} -09/20/2021 18:39:18 - INFO - __main__ - Step 19244: {'lr': 0.00019995843727025592, 'samples': 615808, 'steps': 1202, 'loss/train': 3.4565889835357666} -09/20/2021 18:39:18 - INFO - __main__ - Step 19245: {'lr': 0.00019995843727025592, 'samples': 615840, 'steps': 1202, 'loss/train': 3.6791181564331055} -09/20/2021 18:39:19 - INFO - __main__ - Step 19246: {'lr': 0.00019995843727025592, 'samples': 615872, 'steps': 1202, 'loss/train': 3.5493392944335938} -09/20/2021 18:39:20 - INFO - __main__ - Step 19247: {'lr': 0.00019995843727025592, 'samples': 615904, 'steps': 1202, 'loss/train': 3.318140983581543} -09/20/2021 18:39:22 - INFO - __main__ - Step 19248: {'lr': 0.00019995843727025592, 'samples': 615936, 'steps': 1202, 'loss/train': 4.067049503326416} -09/20/2021 18:39:23 - INFO - __main__ - Step 19249: {'lr': 0.00019995825317374743, 'samples': 615968, 'steps': 1203, 'loss/train': 2.934216260910034} -09/20/2021 18:39:23 - INFO - __main__ - Step 19250: {'lr': 0.00019995825317374743, 'samples': 616000, 'steps': 1203, 'loss/train': 3.538107395172119} -09/20/2021 18:39:24 - INFO - __main__ - Step 19251: {'lr': 0.00019995825317374743, 'samples': 616032, 'steps': 1203, 'loss/train': 3.7584073543548584} -09/20/2021 18:39:25 - INFO - __main__ - Step 19252: {'lr': 0.00019995825317374743, 'samples': 616064, 'steps': 1203, 'loss/train': 3.5215845108032227} -09/20/2021 18:39:26 - INFO - __main__ - Step 19253: {'lr': 0.00019995825317374743, 'samples': 616096, 'steps': 1203, 'loss/train': 2.693204641342163} -09/20/2021 18:39:26 - INFO - __main__ - Step 19254: {'lr': 0.00019995825317374743, 'samples': 616128, 'steps': 1203, 'loss/train': 2.673039197921753} -09/20/2021 18:39:27 - INFO - __main__ - Step 19255: {'lr': 0.00019995825317374743, 'samples': 616160, 'steps': 1203, 'loss/train': 3.8801798820495605} -09/20/2021 18:39:28 - INFO - __main__ - Step 19256: {'lr': 0.00019995825317374743, 'samples': 616192, 'steps': 1203, 'loss/train': 3.5925114154815674} -09/20/2021 18:39:29 - INFO - __main__ - Step 19257: {'lr': 0.00019995825317374743, 'samples': 616224, 'steps': 1203, 'loss/train': 5.431737899780273} -09/20/2021 18:39:29 - INFO - __main__ - Step 19258: {'lr': 0.00019995825317374743, 'samples': 616256, 'steps': 1203, 'loss/train': 4.141469478607178} -09/20/2021 18:39:30 - INFO - __main__ - Step 19259: {'lr': 0.00019995825317374743, 'samples': 616288, 'steps': 1203, 'loss/train': 4.78580379486084} -09/20/2021 18:39:31 - INFO - __main__ - Step 19260: {'lr': 0.00019995825317374743, 'samples': 616320, 'steps': 1203, 'loss/train': 4.171452045440674} -09/20/2021 18:39:32 - INFO - __main__ - Step 19261: {'lr': 0.00019995825317374743, 'samples': 616352, 'steps': 1203, 'loss/train': 3.4763691425323486} -09/20/2021 18:39:32 - INFO - __main__ - Step 19262: {'lr': 0.00019995825317374743, 'samples': 616384, 'steps': 1203, 'loss/train': 3.1263980865478516} -09/20/2021 18:39:33 - INFO - __main__ - Step 19263: {'lr': 0.00019995825317374743, 'samples': 616416, 'steps': 1203, 'loss/train': 3.6663331985473633} -09/20/2021 18:39:34 - INFO - __main__ - Step 19264: {'lr': 0.00019995825317374743, 'samples': 616448, 'steps': 1203, 'loss/train': 1.7464592456817627} -09/20/2021 18:39:35 - INFO - __main__ - Step 19265: {'lr': 0.0001999580686705092, 'samples': 616480, 'steps': 1204, 'loss/train': 3.31533145904541} -09/20/2021 18:39:35 - INFO - __main__ - Step 19266: {'lr': 0.0001999580686705092, 'samples': 616512, 'steps': 1204, 'loss/train': 3.284966230392456} -09/20/2021 18:39:36 - INFO - __main__ - Step 19267: {'lr': 0.0001999580686705092, 'samples': 616544, 'steps': 1204, 'loss/train': 3.045804738998413} -09/20/2021 18:39:37 - INFO - __main__ - Step 19268: {'lr': 0.0001999580686705092, 'samples': 616576, 'steps': 1204, 'loss/train': 4.004737377166748} -09/20/2021 18:39:38 - INFO - __main__ - Step 19269: {'lr': 0.0001999580686705092, 'samples': 616608, 'steps': 1204, 'loss/train': 3.5882554054260254} -09/20/2021 18:39:38 - INFO - __main__ - Step 19270: {'lr': 0.0001999580686705092, 'samples': 616640, 'steps': 1204, 'loss/train': 3.2684662342071533} -09/20/2021 18:39:39 - INFO - __main__ - Step 19271: {'lr': 0.0001999580686705092, 'samples': 616672, 'steps': 1204, 'loss/train': 3.189980983734131} -09/20/2021 18:39:40 - INFO - __main__ - Step 19272: {'lr': 0.0001999580686705092, 'samples': 616704, 'steps': 1204, 'loss/train': 3.6922566890716553} -09/20/2021 18:39:41 - INFO - __main__ - Step 19273: {'lr': 0.0001999580686705092, 'samples': 616736, 'steps': 1204, 'loss/train': 4.348923683166504} -09/20/2021 18:39:41 - INFO - __main__ - Step 19274: {'lr': 0.0001999580686705092, 'samples': 616768, 'steps': 1204, 'loss/train': 3.5284311771392822} -09/20/2021 18:39:42 - INFO - __main__ - Step 19275: {'lr': 0.0001999580686705092, 'samples': 616800, 'steps': 1204, 'loss/train': 2.795091390609741} -09/20/2021 18:39:43 - INFO - __main__ - Step 19276: {'lr': 0.0001999580686705092, 'samples': 616832, 'steps': 1204, 'loss/train': 3.687103748321533} -09/20/2021 18:39:44 - INFO - __main__ - Step 19277: {'lr': 0.0001999580686705092, 'samples': 616864, 'steps': 1204, 'loss/train': 1.2849993705749512} -09/20/2021 18:39:44 - INFO - __main__ - Step 19278: {'lr': 0.0001999580686705092, 'samples': 616896, 'steps': 1204, 'loss/train': 0.897167444229126} -09/20/2021 18:39:45 - INFO - __main__ - Step 19279: {'lr': 0.0001999580686705092, 'samples': 616928, 'steps': 1204, 'loss/train': 0.9117071032524109} -09/20/2021 18:39:46 - INFO - __main__ - Step 19280: {'lr': 0.0001999580686705092, 'samples': 616960, 'steps': 1204, 'loss/train': 1.5061529874801636} -09/20/2021 18:39:47 - INFO - __main__ - Step 19281: {'lr': 0.00019995788376054194, 'samples': 616992, 'steps': 1205, 'loss/train': 0.7716450691223145} -09/20/2021 18:39:48 - INFO - __main__ - Step 19282: {'lr': 0.00019995788376054194, 'samples': 617024, 'steps': 1205, 'loss/train': 1.6208844184875488} -09/20/2021 18:39:49 - INFO - __main__ - Step 19283: {'lr': 0.00019995788376054194, 'samples': 617056, 'steps': 1205, 'loss/train': 3.8333237171173096} -09/20/2021 18:39:50 - INFO - __main__ - Step 19284: {'lr': 0.00019995788376054194, 'samples': 617088, 'steps': 1205, 'loss/train': 3.5316762924194336} -09/20/2021 18:39:50 - INFO - __main__ - Step 19285: {'lr': 0.00019995788376054194, 'samples': 617120, 'steps': 1205, 'loss/train': 3.49997878074646} -09/20/2021 18:39:51 - INFO - __main__ - Step 19286: {'lr': 0.00019995788376054194, 'samples': 617152, 'steps': 1205, 'loss/train': 4.469489097595215} -09/20/2021 18:39:52 - INFO - __main__ - Step 19287: {'lr': 0.00019995788376054194, 'samples': 617184, 'steps': 1205, 'loss/train': 3.460822582244873} -09/20/2021 18:39:53 - INFO - __main__ - Step 19288: {'lr': 0.00019995788376054194, 'samples': 617216, 'steps': 1205, 'loss/train': 2.6301326751708984} -09/20/2021 18:39:53 - INFO - __main__ - Step 19289: {'lr': 0.00019995788376054194, 'samples': 617248, 'steps': 1205, 'loss/train': 3.1393487453460693} -09/20/2021 18:39:54 - INFO - __main__ - Step 19290: {'lr': 0.00019995788376054194, 'samples': 617280, 'steps': 1205, 'loss/train': 4.388119220733643} -09/20/2021 18:39:55 - INFO - __main__ - Step 19291: {'lr': 0.00019995788376054194, 'samples': 617312, 'steps': 1205, 'loss/train': 1.505531668663025} -09/20/2021 18:39:56 - INFO - __main__ - Step 19292: {'lr': 0.00019995788376054194, 'samples': 617344, 'steps': 1205, 'loss/train': 3.5756194591522217} -09/20/2021 18:39:56 - INFO - __main__ - Step 19293: {'lr': 0.00019995788376054194, 'samples': 617376, 'steps': 1205, 'loss/train': 3.7053987979888916} -09/20/2021 18:39:57 - INFO - __main__ - Step 19294: {'lr': 0.00019995788376054194, 'samples': 617408, 'steps': 1205, 'loss/train': 3.336925745010376} -09/20/2021 18:39:58 - INFO - __main__ - Step 19295: {'lr': 0.00019995788376054194, 'samples': 617440, 'steps': 1205, 'loss/train': 2.911398410797119} -09/20/2021 18:39:59 - INFO - __main__ - Step 19296: {'lr': 0.00019995788376054194, 'samples': 617472, 'steps': 1205, 'loss/train': 3.80790114402771} -09/20/2021 18:40:00 - INFO - __main__ - Step 19297: {'lr': 0.00019995769844384647, 'samples': 617504, 'steps': 1206, 'loss/train': 3.3524093627929688} -09/20/2021 18:40:00 - INFO - __main__ - Step 19298: {'lr': 0.00019995769844384647, 'samples': 617536, 'steps': 1206, 'loss/train': 3.539560556411743} -09/20/2021 18:40:01 - INFO - __main__ - Step 19299: {'lr': 0.00019995769844384647, 'samples': 617568, 'steps': 1206, 'loss/train': 3.6217639446258545} -09/20/2021 18:40:02 - INFO - __main__ - Step 19300: {'lr': 0.00019995769844384647, 'samples': 617600, 'steps': 1206, 'loss/train': 3.5620768070220947} -09/20/2021 18:40:03 - INFO - __main__ - Step 19301: {'lr': 0.00019995769844384647, 'samples': 617632, 'steps': 1206, 'loss/train': 5.015135288238525} -09/20/2021 18:40:03 - INFO - __main__ - Step 19302: {'lr': 0.00019995769844384647, 'samples': 617664, 'steps': 1206, 'loss/train': 3.79295015335083} -09/20/2021 18:40:04 - INFO - __main__ - Step 19303: {'lr': 0.00019995769844384647, 'samples': 617696, 'steps': 1206, 'loss/train': 3.215890645980835} -09/20/2021 18:40:05 - INFO - __main__ - Step 19304: {'lr': 0.00019995769844384647, 'samples': 617728, 'steps': 1206, 'loss/train': 3.401362657546997} -09/20/2021 18:40:06 - INFO - __main__ - Step 19305: {'lr': 0.00019995769844384647, 'samples': 617760, 'steps': 1206, 'loss/train': 4.036839008331299} -09/20/2021 18:40:06 - INFO - __main__ - Step 19306: {'lr': 0.00019995769844384647, 'samples': 617792, 'steps': 1206, 'loss/train': 4.295060157775879} -09/20/2021 18:40:07 - INFO - __main__ - Step 19307: {'lr': 0.00019995769844384647, 'samples': 617824, 'steps': 1206, 'loss/train': 3.2673707008361816} -09/20/2021 18:40:08 - INFO - __main__ - Step 19308: {'lr': 0.00019995769844384647, 'samples': 617856, 'steps': 1206, 'loss/train': 2.6704485416412354} -09/20/2021 18:40:09 - INFO - __main__ - Step 19309: {'lr': 0.00019995769844384647, 'samples': 617888, 'steps': 1206, 'loss/train': 2.9416000843048096} -09/20/2021 18:40:09 - INFO - __main__ - Step 19310: {'lr': 0.00019995769844384647, 'samples': 617920, 'steps': 1206, 'loss/train': 3.2374136447906494} -09/20/2021 18:40:10 - INFO - __main__ - Step 19311: {'lr': 0.00019995769844384647, 'samples': 617952, 'steps': 1206, 'loss/train': 4.598605155944824} -09/20/2021 18:40:12 - INFO - __main__ - Step 19312: {'lr': 0.00019995769844384647, 'samples': 617984, 'steps': 1206, 'loss/train': 3.616225004196167} -09/20/2021 18:40:13 - INFO - __main__ - Step 19313: {'lr': 0.0001999575127204235, 'samples': 618016, 'steps': 1207, 'loss/train': 3.208240032196045} -09/20/2021 18:40:13 - INFO - __main__ - Step 19314: {'lr': 0.0001999575127204235, 'samples': 618048, 'steps': 1207, 'loss/train': 3.422605037689209} -09/20/2021 18:40:14 - INFO - __main__ - Step 19315: {'lr': 0.0001999575127204235, 'samples': 618080, 'steps': 1207, 'loss/train': 3.424189329147339} -09/20/2021 18:40:15 - INFO - __main__ - Step 19316: {'lr': 0.0001999575127204235, 'samples': 618112, 'steps': 1207, 'loss/train': 2.9701836109161377} -09/20/2021 18:40:16 - INFO - __main__ - Step 19317: {'lr': 0.0001999575127204235, 'samples': 618144, 'steps': 1207, 'loss/train': 3.7895681858062744} -09/20/2021 18:40:16 - INFO - __main__ - Step 19318: {'lr': 0.0001999575127204235, 'samples': 618176, 'steps': 1207, 'loss/train': 3.4495432376861572} -09/20/2021 18:40:17 - INFO - __main__ - Step 19319: {'lr': 0.0001999575127204235, 'samples': 618208, 'steps': 1207, 'loss/train': 2.818782091140747} -09/20/2021 18:40:18 - INFO - __main__ - Step 19320: {'lr': 0.0001999575127204235, 'samples': 618240, 'steps': 1207, 'loss/train': 3.8825769424438477} -09/20/2021 18:40:19 - INFO - __main__ - Step 19321: {'lr': 0.0001999575127204235, 'samples': 618272, 'steps': 1207, 'loss/train': 3.5413644313812256} -09/20/2021 18:40:19 - INFO - __main__ - Step 19322: {'lr': 0.0001999575127204235, 'samples': 618304, 'steps': 1207, 'loss/train': 3.0251240730285645} -09/20/2021 18:40:20 - INFO - __main__ - Step 19323: {'lr': 0.0001999575127204235, 'samples': 618336, 'steps': 1207, 'loss/train': 3.6391818523406982} -09/20/2021 18:40:21 - INFO - __main__ - Step 19324: {'lr': 0.0001999575127204235, 'samples': 618368, 'steps': 1207, 'loss/train': 2.7912168502807617} -09/20/2021 18:40:22 - INFO - __main__ - Step 19325: {'lr': 0.0001999575127204235, 'samples': 618400, 'steps': 1207, 'loss/train': 3.795342445373535} -09/20/2021 18:40:22 - INFO - __main__ - Step 19326: {'lr': 0.0001999575127204235, 'samples': 618432, 'steps': 1207, 'loss/train': 3.510495185852051} -09/20/2021 18:40:23 - INFO - __main__ - Step 19327: {'lr': 0.0001999575127204235, 'samples': 618464, 'steps': 1207, 'loss/train': 3.505739450454712} -09/20/2021 18:40:24 - INFO - __main__ - Step 19328: {'lr': 0.0001999575127204235, 'samples': 618496, 'steps': 1207, 'loss/train': 2.706498384475708} -09/20/2021 18:40:25 - INFO - __main__ - Step 19329: {'lr': 0.0001999573265902738, 'samples': 618528, 'steps': 1208, 'loss/train': 3.280104875564575} -09/20/2021 18:40:25 - INFO - __main__ - Step 19330: {'lr': 0.0001999573265902738, 'samples': 618560, 'steps': 1208, 'loss/train': 3.352085828781128} -09/20/2021 18:40:26 - INFO - __main__ - Step 19331: {'lr': 0.0001999573265902738, 'samples': 618592, 'steps': 1208, 'loss/train': 3.128291368484497} -09/20/2021 18:40:27 - INFO - __main__ - Step 19332: {'lr': 0.0001999573265902738, 'samples': 618624, 'steps': 1208, 'loss/train': 3.731247663497925} -09/20/2021 18:40:28 - INFO - __main__ - Step 19333: {'lr': 0.0001999573265902738, 'samples': 618656, 'steps': 1208, 'loss/train': 4.4071245193481445} -09/20/2021 18:40:28 - INFO - __main__ - Step 19334: {'lr': 0.0001999573265902738, 'samples': 618688, 'steps': 1208, 'loss/train': 2.0505053997039795} -09/20/2021 18:40:29 - INFO - __main__ - Step 19335: {'lr': 0.0001999573265902738, 'samples': 618720, 'steps': 1208, 'loss/train': 1.140313744544983} -09/20/2021 18:40:30 - INFO - __main__ - Step 19336: {'lr': 0.0001999573265902738, 'samples': 618752, 'steps': 1208, 'loss/train': 0.8834025859832764} -09/20/2021 18:40:31 - INFO - __main__ - Step 19337: {'lr': 0.0001999573265902738, 'samples': 618784, 'steps': 1208, 'loss/train': 0.9618616700172424} -09/20/2021 18:40:31 - INFO - __main__ - Step 19338: {'lr': 0.0001999573265902738, 'samples': 618816, 'steps': 1208, 'loss/train': 2.3856210708618164} -09/20/2021 18:40:32 - INFO - __main__ - Step 19339: {'lr': 0.0001999573265902738, 'samples': 618848, 'steps': 1208, 'loss/train': 2.5404040813446045} -09/20/2021 18:40:33 - INFO - __main__ - Step 19340: {'lr': 0.0001999573265902738, 'samples': 618880, 'steps': 1208, 'loss/train': 3.9328689575195312} -09/20/2021 18:40:34 - INFO - __main__ - Step 19341: {'lr': 0.0001999573265902738, 'samples': 618912, 'steps': 1208, 'loss/train': 3.4893853664398193} -09/20/2021 18:40:34 - INFO - __main__ - Step 19342: {'lr': 0.0001999573265902738, 'samples': 618944, 'steps': 1208, 'loss/train': 4.296652317047119} -09/20/2021 18:40:36 - INFO - __main__ - Step 19343: {'lr': 0.0001999573265902738, 'samples': 618976, 'steps': 1208, 'loss/train': 3.410564422607422} -09/20/2021 18:40:36 - INFO - __main__ - Step 19344: {'lr': 0.0001999573265902738, 'samples': 619008, 'steps': 1208, 'loss/train': 4.148472309112549} -09/20/2021 18:40:37 - INFO - __main__ - Step 19345: {'lr': 0.00019995714005339812, 'samples': 619040, 'steps': 1209, 'loss/train': 3.42145037651062} -09/20/2021 18:40:38 - INFO - __main__ - Step 19346: {'lr': 0.00019995714005339812, 'samples': 619072, 'steps': 1209, 'loss/train': 4.1564130783081055} -09/20/2021 18:40:39 - INFO - __main__ - Step 19347: {'lr': 0.00019995714005339812, 'samples': 619104, 'steps': 1209, 'loss/train': 3.7690675258636475} -09/20/2021 18:40:40 - INFO - __main__ - Step 19348: {'lr': 0.00019995714005339812, 'samples': 619136, 'steps': 1209, 'loss/train': 2.8783175945281982} -09/20/2021 18:40:40 - INFO - __main__ - Step 19349: {'lr': 0.00019995714005339812, 'samples': 619168, 'steps': 1209, 'loss/train': 3.6911942958831787} -09/20/2021 18:40:41 - INFO - __main__ - Step 19350: {'lr': 0.00019995714005339812, 'samples': 619200, 'steps': 1209, 'loss/train': 3.774163007736206} -09/20/2021 18:40:42 - INFO - __main__ - Step 19351: {'lr': 0.00019995714005339812, 'samples': 619232, 'steps': 1209, 'loss/train': 4.023324012756348} -09/20/2021 18:40:43 - INFO - __main__ - Step 19352: {'lr': 0.00019995714005339812, 'samples': 619264, 'steps': 1209, 'loss/train': 3.895198345184326} -09/20/2021 18:40:43 - INFO - __main__ - Step 19353: {'lr': 0.00019995714005339812, 'samples': 619296, 'steps': 1209, 'loss/train': 3.5897512435913086} -09/20/2021 18:40:44 - INFO - __main__ - Step 19354: {'lr': 0.00019995714005339812, 'samples': 619328, 'steps': 1209, 'loss/train': 3.351050615310669} -09/20/2021 18:40:45 - INFO - __main__ - Step 19355: {'lr': 0.00019995714005339812, 'samples': 619360, 'steps': 1209, 'loss/train': 3.8877344131469727} -09/20/2021 18:40:46 - INFO - __main__ - Step 19356: {'lr': 0.00019995714005339812, 'samples': 619392, 'steps': 1209, 'loss/train': 1.133805513381958} -09/20/2021 18:40:46 - INFO - __main__ - Step 19357: {'lr': 0.00019995714005339812, 'samples': 619424, 'steps': 1209, 'loss/train': 3.806764841079712} -09/20/2021 18:40:47 - INFO - __main__ - Step 19358: {'lr': 0.00019995714005339812, 'samples': 619456, 'steps': 1209, 'loss/train': 5.5457282066345215} -09/20/2021 18:40:48 - INFO - __main__ - Step 19359: {'lr': 0.00019995714005339812, 'samples': 619488, 'steps': 1209, 'loss/train': 3.807964563369751} -09/20/2021 18:40:49 - INFO - __main__ - Step 19360: {'lr': 0.00019995714005339812, 'samples': 619520, 'steps': 1209, 'loss/train': 3.121629476547241} -09/20/2021 18:40:50 - INFO - __main__ - Step 19361: {'lr': 0.00019995695310979724, 'samples': 619552, 'steps': 1210, 'loss/train': 4.396684169769287} -09/20/2021 18:40:50 - INFO - __main__ - Step 19362: {'lr': 0.00019995695310979724, 'samples': 619584, 'steps': 1210, 'loss/train': 3.87687611579895} -09/20/2021 18:40:51 - INFO - __main__ - Step 19363: {'lr': 0.00019995695310979724, 'samples': 619616, 'steps': 1210, 'loss/train': 3.575978994369507} -09/20/2021 18:40:52 - INFO - __main__ - Step 19364: {'lr': 0.00019995695310979724, 'samples': 619648, 'steps': 1210, 'loss/train': 3.2875163555145264} -09/20/2021 18:40:53 - INFO - __main__ - Step 19365: {'lr': 0.00019995695310979724, 'samples': 619680, 'steps': 1210, 'loss/train': 3.558877468109131} -09/20/2021 18:40:53 - INFO - __main__ - Step 19366: {'lr': 0.00019995695310979724, 'samples': 619712, 'steps': 1210, 'loss/train': 3.9527814388275146} -09/20/2021 18:40:54 - INFO - __main__ - Step 19367: {'lr': 0.00019995695310979724, 'samples': 619744, 'steps': 1210, 'loss/train': 3.769646406173706} -09/20/2021 18:40:55 - INFO - __main__ - Step 19368: {'lr': 0.00019995695310979724, 'samples': 619776, 'steps': 1210, 'loss/train': 4.421748638153076} -09/20/2021 18:40:56 - INFO - __main__ - Step 19369: {'lr': 0.00019995695310979724, 'samples': 619808, 'steps': 1210, 'loss/train': 3.0766100883483887} -09/20/2021 18:40:56 - INFO - __main__ - Step 19370: {'lr': 0.00019995695310979724, 'samples': 619840, 'steps': 1210, 'loss/train': 3.6813113689422607} -09/20/2021 18:40:57 - INFO - __main__ - Step 19371: {'lr': 0.00019995695310979724, 'samples': 619872, 'steps': 1210, 'loss/train': 2.699268102645874} -09/20/2021 18:40:58 - INFO - __main__ - Step 19372: {'lr': 0.00019995695310979724, 'samples': 619904, 'steps': 1210, 'loss/train': 3.7048213481903076} -09/20/2021 18:40:59 - INFO - __main__ - Step 19373: {'lr': 0.00019995695310979724, 'samples': 619936, 'steps': 1210, 'loss/train': 1.4472627639770508} -09/20/2021 18:40:59 - INFO - __main__ - Step 19374: {'lr': 0.00019995695310979724, 'samples': 619968, 'steps': 1210, 'loss/train': 4.899121284484863} -09/20/2021 18:41:01 - INFO - __main__ - Step 19375: {'lr': 0.00019995695310979724, 'samples': 620000, 'steps': 1210, 'loss/train': 4.358102321624756} -09/20/2021 18:41:02 - INFO - __main__ - Step 19376: {'lr': 0.00019995695310979724, 'samples': 620032, 'steps': 1210, 'loss/train': 3.591108798980713} -09/20/2021 18:41:03 - INFO - __main__ - Step 19377: {'lr': 0.0001999567657594719, 'samples': 620064, 'steps': 1211, 'loss/train': 4.858688831329346} -09/20/2021 18:41:03 - INFO - __main__ - Step 19378: {'lr': 0.0001999567657594719, 'samples': 620096, 'steps': 1211, 'loss/train': 3.1679484844207764} -09/20/2021 18:41:04 - INFO - __main__ - Step 19379: {'lr': 0.0001999567657594719, 'samples': 620128, 'steps': 1211, 'loss/train': 4.354768753051758} -09/20/2021 18:41:05 - INFO - __main__ - Step 19380: {'lr': 0.0001999567657594719, 'samples': 620160, 'steps': 1211, 'loss/train': 3.2756705284118652} -09/20/2021 18:41:06 - INFO - __main__ - Step 19381: {'lr': 0.0001999567657594719, 'samples': 620192, 'steps': 1211, 'loss/train': 3.2962887287139893} -09/20/2021 18:41:06 - INFO - __main__ - Step 19382: {'lr': 0.0001999567657594719, 'samples': 620224, 'steps': 1211, 'loss/train': 3.7041358947753906} -09/20/2021 18:41:07 - INFO - __main__ - Step 19383: {'lr': 0.0001999567657594719, 'samples': 620256, 'steps': 1211, 'loss/train': 3.8130478858947754} -09/20/2021 18:41:08 - INFO - __main__ - Step 19384: {'lr': 0.0001999567657594719, 'samples': 620288, 'steps': 1211, 'loss/train': 1.5050427913665771} -09/20/2021 18:41:09 - INFO - __main__ - Step 19385: {'lr': 0.0001999567657594719, 'samples': 620320, 'steps': 1211, 'loss/train': 3.3412208557128906} -09/20/2021 18:41:09 - INFO - __main__ - Step 19386: {'lr': 0.0001999567657594719, 'samples': 620352, 'steps': 1211, 'loss/train': 3.0537548065185547} -09/20/2021 18:41:10 - INFO - __main__ - Step 19387: {'lr': 0.0001999567657594719, 'samples': 620384, 'steps': 1211, 'loss/train': 2.68107271194458} -09/20/2021 18:41:11 - INFO - __main__ - Step 19388: {'lr': 0.0001999567657594719, 'samples': 620416, 'steps': 1211, 'loss/train': 2.2238800525665283} -09/20/2021 18:41:12 - INFO - __main__ - Step 19389: {'lr': 0.0001999567657594719, 'samples': 620448, 'steps': 1211, 'loss/train': 2.2549853324890137} -09/20/2021 18:41:12 - INFO - __main__ - Step 19390: {'lr': 0.0001999567657594719, 'samples': 620480, 'steps': 1211, 'loss/train': 2.814368724822998} -09/20/2021 18:41:13 - INFO - __main__ - Step 19391: {'lr': 0.0001999567657594719, 'samples': 620512, 'steps': 1211, 'loss/train': 5.1987457275390625} -09/20/2021 18:41:14 - INFO - __main__ - Step 19392: {'lr': 0.0001999567657594719, 'samples': 620544, 'steps': 1211, 'loss/train': 3.6684343814849854} -09/20/2021 18:41:15 - INFO - __main__ - Step 19393: {'lr': 0.00019995657800242286, 'samples': 620576, 'steps': 1212, 'loss/train': 3.459460735321045} -09/20/2021 18:41:16 - INFO - __main__ - Step 19394: {'lr': 0.00019995657800242286, 'samples': 620608, 'steps': 1212, 'loss/train': 3.055262565612793} -09/20/2021 18:41:16 - INFO - __main__ - Step 19395: {'lr': 0.00019995657800242286, 'samples': 620640, 'steps': 1212, 'loss/train': 3.1919362545013428} -09/20/2021 18:41:17 - INFO - __main__ - Step 19396: {'lr': 0.00019995657800242286, 'samples': 620672, 'steps': 1212, 'loss/train': 4.279895782470703} -09/20/2021 18:41:18 - INFO - __main__ - Step 19397: {'lr': 0.00019995657800242286, 'samples': 620704, 'steps': 1212, 'loss/train': 2.1110517978668213} -09/20/2021 18:41:19 - INFO - __main__ - Step 19398: {'lr': 0.00019995657800242286, 'samples': 620736, 'steps': 1212, 'loss/train': 3.458268880844116} -09/20/2021 18:41:19 - INFO - __main__ - Step 19399: {'lr': 0.00019995657800242286, 'samples': 620768, 'steps': 1212, 'loss/train': 2.264845609664917} -09/20/2021 18:41:20 - INFO - __main__ - Step 19400: {'lr': 0.00019995657800242286, 'samples': 620800, 'steps': 1212, 'loss/train': 4.232837677001953} -09/20/2021 18:41:21 - INFO - __main__ - Step 19401: {'lr': 0.00019995657800242286, 'samples': 620832, 'steps': 1212, 'loss/train': 3.769648790359497} -09/20/2021 18:41:22 - INFO - __main__ - Step 19402: {'lr': 0.00019995657800242286, 'samples': 620864, 'steps': 1212, 'loss/train': 3.3565433025360107} -09/20/2021 18:41:22 - INFO - __main__ - Step 19403: {'lr': 0.00019995657800242286, 'samples': 620896, 'steps': 1212, 'loss/train': 3.760244846343994} -09/20/2021 18:41:23 - INFO - __main__ - Step 19404: {'lr': 0.00019995657800242286, 'samples': 620928, 'steps': 1212, 'loss/train': 3.507167339324951} -09/20/2021 18:41:24 - INFO - __main__ - Step 19405: {'lr': 0.00019995657800242286, 'samples': 620960, 'steps': 1212, 'loss/train': 3.6607296466827393} -09/20/2021 18:41:25 - INFO - __main__ - Step 19406: {'lr': 0.00019995657800242286, 'samples': 620992, 'steps': 1212, 'loss/train': 2.546060562133789} -09/20/2021 18:41:26 - INFO - __main__ - Step 19407: {'lr': 0.00019995657800242286, 'samples': 621024, 'steps': 1212, 'loss/train': 3.7515687942504883} -09/20/2021 18:41:27 - INFO - __main__ - Step 19408: {'lr': 0.00019995657800242286, 'samples': 621056, 'steps': 1212, 'loss/train': 0.8902287483215332} -09/20/2021 18:41:28 - INFO - __main__ - Step 19409: {'lr': 0.0001999563898386509, 'samples': 621088, 'steps': 1213, 'loss/train': 3.9989352226257324} -09/20/2021 18:41:29 - INFO - __main__ - Step 19410: {'lr': 0.0001999563898386509, 'samples': 621120, 'steps': 1213, 'loss/train': 3.636244297027588} -09/20/2021 18:41:29 - INFO - __main__ - Step 19411: {'lr': 0.0001999563898386509, 'samples': 621152, 'steps': 1213, 'loss/train': 0.46618878841400146} -09/20/2021 18:41:30 - INFO - __main__ - Step 19412: {'lr': 0.0001999563898386509, 'samples': 621184, 'steps': 1213, 'loss/train': 4.014666557312012} -09/20/2021 18:41:31 - INFO - __main__ - Step 19413: {'lr': 0.0001999563898386509, 'samples': 621216, 'steps': 1213, 'loss/train': 2.8548552989959717} -09/20/2021 18:41:32 - INFO - __main__ - Step 19414: {'lr': 0.0001999563898386509, 'samples': 621248, 'steps': 1213, 'loss/train': 4.3287529945373535} -09/20/2021 18:41:32 - INFO - __main__ - Step 19415: {'lr': 0.0001999563898386509, 'samples': 621280, 'steps': 1213, 'loss/train': 2.79512882232666} -09/20/2021 18:41:33 - INFO - __main__ - Step 19416: {'lr': 0.0001999563898386509, 'samples': 621312, 'steps': 1213, 'loss/train': 2.874993324279785} -09/20/2021 18:41:34 - INFO - __main__ - Step 19417: {'lr': 0.0001999563898386509, 'samples': 621344, 'steps': 1213, 'loss/train': 4.5770263671875} -09/20/2021 18:41:35 - INFO - __main__ - Step 19418: {'lr': 0.0001999563898386509, 'samples': 621376, 'steps': 1213, 'loss/train': 3.68253231048584} -09/20/2021 18:41:35 - INFO - __main__ - Step 19419: {'lr': 0.0001999563898386509, 'samples': 621408, 'steps': 1213, 'loss/train': 3.3674817085266113} -09/20/2021 18:41:36 - INFO - __main__ - Step 19420: {'lr': 0.0001999563898386509, 'samples': 621440, 'steps': 1213, 'loss/train': 2.9327569007873535} -09/20/2021 18:41:37 - INFO - __main__ - Step 19421: {'lr': 0.0001999563898386509, 'samples': 621472, 'steps': 1213, 'loss/train': 3.6908562183380127} -09/20/2021 18:41:38 - INFO - __main__ - Step 19422: {'lr': 0.0001999563898386509, 'samples': 621504, 'steps': 1213, 'loss/train': 3.8758928775787354} -09/20/2021 18:41:38 - INFO - __main__ - Step 19423: {'lr': 0.0001999563898386509, 'samples': 621536, 'steps': 1213, 'loss/train': 2.819366455078125} -09/20/2021 18:41:39 - INFO - __main__ - Step 19424: {'lr': 0.0001999563898386509, 'samples': 621568, 'steps': 1213, 'loss/train': 2.956035614013672} -09/20/2021 18:41:40 - INFO - __main__ - Step 19425: {'lr': 0.00019995620126815678, 'samples': 621600, 'steps': 1214, 'loss/train': 3.4014692306518555} -09/20/2021 18:41:41 - INFO - __main__ - Step 19426: {'lr': 0.00019995620126815678, 'samples': 621632, 'steps': 1214, 'loss/train': 4.166517734527588} -09/20/2021 18:41:41 - INFO - __main__ - Step 19427: {'lr': 0.00019995620126815678, 'samples': 621664, 'steps': 1214, 'loss/train': 3.2175452709198} -09/20/2021 18:41:42 - INFO - __main__ - Step 19428: {'lr': 0.00019995620126815678, 'samples': 621696, 'steps': 1214, 'loss/train': 1.1772043704986572} -09/20/2021 18:41:43 - INFO - __main__ - Step 19429: {'lr': 0.00019995620126815678, 'samples': 621728, 'steps': 1214, 'loss/train': 0.9483647346496582} -09/20/2021 18:41:44 - INFO - __main__ - Step 19430: {'lr': 0.00019995620126815678, 'samples': 621760, 'steps': 1214, 'loss/train': 0.9208406805992126} -09/20/2021 18:41:44 - INFO - __main__ - Step 19431: {'lr': 0.00019995620126815678, 'samples': 621792, 'steps': 1214, 'loss/train': 0.5946465730667114} -09/20/2021 18:41:45 - INFO - __main__ - Step 19432: {'lr': 0.00019995620126815678, 'samples': 621824, 'steps': 1214, 'loss/train': 3.263775110244751} -09/20/2021 18:41:46 - INFO - __main__ - Step 19433: {'lr': 0.00019995620126815678, 'samples': 621856, 'steps': 1214, 'loss/train': 3.777312755584717} -09/20/2021 18:41:47 - INFO - __main__ - Step 19434: {'lr': 0.00019995620126815678, 'samples': 621888, 'steps': 1214, 'loss/train': 4.499849796295166} -09/20/2021 18:41:47 - INFO - __main__ - Step 19435: {'lr': 0.00019995620126815678, 'samples': 621920, 'steps': 1214, 'loss/train': 3.5600483417510986} -09/20/2021 18:41:48 - INFO - __main__ - Step 19436: {'lr': 0.00019995620126815678, 'samples': 621952, 'steps': 1214, 'loss/train': 3.9451181888580322} -09/20/2021 18:41:49 - INFO - __main__ - Step 19437: {'lr': 0.00019995620126815678, 'samples': 621984, 'steps': 1214, 'loss/train': 3.0868146419525146} -09/20/2021 18:41:50 - INFO - __main__ - Step 19438: {'lr': 0.00019995620126815678, 'samples': 622016, 'steps': 1214, 'loss/train': 3.2316293716430664} -09/20/2021 18:41:51 - INFO - __main__ - Step 19439: {'lr': 0.00019995620126815678, 'samples': 622048, 'steps': 1214, 'loss/train': 4.1063551902771} -09/20/2021 18:41:52 - INFO - __main__ - Step 19440: {'lr': 0.00019995620126815678, 'samples': 622080, 'steps': 1214, 'loss/train': 3.594794273376465} -09/20/2021 18:41:53 - INFO - __main__ - Step 19441: {'lr': 0.00019995601229094126, 'samples': 622112, 'steps': 1215, 'loss/train': 3.8448598384857178} -09/20/2021 18:41:53 - INFO - __main__ - Step 19442: {'lr': 0.00019995601229094126, 'samples': 622144, 'steps': 1215, 'loss/train': 3.893604278564453} -09/20/2021 18:41:54 - INFO - __main__ - Step 19443: {'lr': 0.00019995601229094126, 'samples': 622176, 'steps': 1215, 'loss/train': 4.378646373748779} -09/20/2021 18:41:55 - INFO - __main__ - Step 19444: {'lr': 0.00019995601229094126, 'samples': 622208, 'steps': 1215, 'loss/train': 3.583569288253784} -09/20/2021 18:41:56 - INFO - __main__ - Step 19445: {'lr': 0.00019995601229094126, 'samples': 622240, 'steps': 1215, 'loss/train': 3.0547845363616943} -09/20/2021 18:41:56 - INFO - __main__ - Step 19446: {'lr': 0.00019995601229094126, 'samples': 622272, 'steps': 1215, 'loss/train': 3.674098491668701} -09/20/2021 18:41:57 - INFO - __main__ - Step 19447: {'lr': 0.00019995601229094126, 'samples': 622304, 'steps': 1215, 'loss/train': 4.868091106414795} -09/20/2021 18:41:58 - INFO - __main__ - Step 19448: {'lr': 0.00019995601229094126, 'samples': 622336, 'steps': 1215, 'loss/train': 3.2282466888427734} -09/20/2021 18:41:59 - INFO - __main__ - Step 19449: {'lr': 0.00019995601229094126, 'samples': 622368, 'steps': 1215, 'loss/train': 3.775150775909424} -09/20/2021 18:41:59 - INFO - __main__ - Step 19450: {'lr': 0.00019995601229094126, 'samples': 622400, 'steps': 1215, 'loss/train': 3.0965001583099365} -09/20/2021 18:42:00 - INFO - __main__ - Step 19451: {'lr': 0.00019995601229094126, 'samples': 622432, 'steps': 1215, 'loss/train': 2.975123882293701} -09/20/2021 18:42:01 - INFO - __main__ - Step 19452: {'lr': 0.00019995601229094126, 'samples': 622464, 'steps': 1215, 'loss/train': 2.6964049339294434} -09/20/2021 18:42:02 - INFO - __main__ - Step 19453: {'lr': 0.00019995601229094126, 'samples': 622496, 'steps': 1215, 'loss/train': 3.422734260559082} -09/20/2021 18:42:02 - INFO - __main__ - Step 19454: {'lr': 0.00019995601229094126, 'samples': 622528, 'steps': 1215, 'loss/train': 3.501631498336792} -09/20/2021 18:42:03 - INFO - __main__ - Step 19455: {'lr': 0.00019995601229094126, 'samples': 622560, 'steps': 1215, 'loss/train': 3.0726890563964844} -09/20/2021 18:42:04 - INFO - __main__ - Step 19456: {'lr': 0.00019995601229094126, 'samples': 622592, 'steps': 1215, 'loss/train': 3.854308843612671} -09/20/2021 18:42:05 - INFO - __main__ - Step 19457: {'lr': 0.0001999558229070051, 'samples': 622624, 'steps': 1216, 'loss/train': 3.661381244659424} -09/20/2021 18:42:05 - INFO - __main__ - Step 19458: {'lr': 0.0001999558229070051, 'samples': 622656, 'steps': 1216, 'loss/train': 3.112353563308716} -09/20/2021 18:42:06 - INFO - __main__ - Step 19459: {'lr': 0.0001999558229070051, 'samples': 622688, 'steps': 1216, 'loss/train': 3.911149024963379} -09/20/2021 18:42:07 - INFO - __main__ - Step 19460: {'lr': 0.0001999558229070051, 'samples': 622720, 'steps': 1216, 'loss/train': 3.6220502853393555} -09/20/2021 18:42:08 - INFO - __main__ - Step 19461: {'lr': 0.0001999558229070051, 'samples': 622752, 'steps': 1216, 'loss/train': 2.6168296337127686} -09/20/2021 18:42:08 - INFO - __main__ - Step 19462: {'lr': 0.0001999558229070051, 'samples': 622784, 'steps': 1216, 'loss/train': 3.4992165565490723} -09/20/2021 18:42:09 - INFO - __main__ - Step 19463: {'lr': 0.0001999558229070051, 'samples': 622816, 'steps': 1216, 'loss/train': 2.4567673206329346} -09/20/2021 18:42:10 - INFO - __main__ - Step 19464: {'lr': 0.0001999558229070051, 'samples': 622848, 'steps': 1216, 'loss/train': 4.490163803100586} -09/20/2021 18:42:11 - INFO - __main__ - Step 19465: {'lr': 0.0001999558229070051, 'samples': 622880, 'steps': 1216, 'loss/train': 0.8692592978477478} -09/20/2021 18:42:11 - INFO - __main__ - Step 19466: {'lr': 0.0001999558229070051, 'samples': 622912, 'steps': 1216, 'loss/train': 3.42106556892395} -09/20/2021 18:42:12 - INFO - __main__ - Step 19467: {'lr': 0.0001999558229070051, 'samples': 622944, 'steps': 1216, 'loss/train': 3.9342408180236816} -09/20/2021 18:42:13 - INFO - __main__ - Step 19468: {'lr': 0.0001999558229070051, 'samples': 622976, 'steps': 1216, 'loss/train': 3.712110757827759} -09/20/2021 18:42:14 - INFO - __main__ - Step 19469: {'lr': 0.0001999558229070051, 'samples': 623008, 'steps': 1216, 'loss/train': 4.357521057128906} -09/20/2021 18:42:15 - INFO - __main__ - Step 19470: {'lr': 0.0001999558229070051, 'samples': 623040, 'steps': 1216, 'loss/train': 5.094313144683838} -09/20/2021 18:42:16 - INFO - __main__ - Step 19471: {'lr': 0.0001999558229070051, 'samples': 623072, 'steps': 1216, 'loss/train': 3.160503387451172} -09/20/2021 18:42:16 - INFO - __main__ - Step 19472: {'lr': 0.0001999558229070051, 'samples': 623104, 'steps': 1216, 'loss/train': 3.012829542160034} -09/20/2021 18:42:17 - INFO - __main__ - Step 19473: {'lr': 0.0001999556331163491, 'samples': 623136, 'steps': 1217, 'loss/train': 2.766449451446533} -09/20/2021 18:42:18 - INFO - __main__ - Step 19474: {'lr': 0.0001999556331163491, 'samples': 623168, 'steps': 1217, 'loss/train': 5.4100823402404785} -09/20/2021 18:42:19 - INFO - __main__ - Step 19475: {'lr': 0.0001999556331163491, 'samples': 623200, 'steps': 1217, 'loss/train': 3.734790086746216} -09/20/2021 18:42:20 - INFO - __main__ - Step 19476: {'lr': 0.0001999556331163491, 'samples': 623232, 'steps': 1217, 'loss/train': 2.661348819732666} -09/20/2021 18:42:20 - INFO - __main__ - Step 19477: {'lr': 0.0001999556331163491, 'samples': 623264, 'steps': 1217, 'loss/train': 2.7126450538635254} -09/20/2021 18:42:21 - INFO - __main__ - Step 19478: {'lr': 0.0001999556331163491, 'samples': 623296, 'steps': 1217, 'loss/train': 3.868973970413208} -09/20/2021 18:42:22 - INFO - __main__ - Step 19479: {'lr': 0.0001999556331163491, 'samples': 623328, 'steps': 1217, 'loss/train': 2.717278242111206} -09/20/2021 18:42:23 - INFO - __main__ - Step 19480: {'lr': 0.0001999556331163491, 'samples': 623360, 'steps': 1217, 'loss/train': 2.963040828704834} -09/20/2021 18:42:23 - INFO - __main__ - Step 19481: {'lr': 0.0001999556331163491, 'samples': 623392, 'steps': 1217, 'loss/train': 3.809170961380005} -09/20/2021 18:42:24 - INFO - __main__ - Step 19482: {'lr': 0.0001999556331163491, 'samples': 623424, 'steps': 1217, 'loss/train': 2.9340157508850098} -09/20/2021 18:42:25 - INFO - __main__ - Step 19483: {'lr': 0.0001999556331163491, 'samples': 623456, 'steps': 1217, 'loss/train': 4.6134114265441895} -09/20/2021 18:42:26 - INFO - __main__ - Step 19484: {'lr': 0.0001999556331163491, 'samples': 623488, 'steps': 1217, 'loss/train': 3.610217571258545} -09/20/2021 18:42:26 - INFO - __main__ - Step 19485: {'lr': 0.0001999556331163491, 'samples': 623520, 'steps': 1217, 'loss/train': 2.946408987045288} -09/20/2021 18:42:27 - INFO - __main__ - Step 19486: {'lr': 0.0001999556331163491, 'samples': 623552, 'steps': 1217, 'loss/train': 3.417724609375} -09/20/2021 18:42:28 - INFO - __main__ - Step 19487: {'lr': 0.0001999556331163491, 'samples': 623584, 'steps': 1217, 'loss/train': 3.4175827503204346} -09/20/2021 18:42:29 - INFO - __main__ - Step 19488: {'lr': 0.0001999556331163491, 'samples': 623616, 'steps': 1217, 'loss/train': 3.839351177215576} -09/20/2021 18:42:29 - INFO - __main__ - Step 19489: {'lr': 0.00019995544291897402, 'samples': 623648, 'steps': 1218, 'loss/train': 3.349919319152832} -09/20/2021 18:42:30 - INFO - __main__ - Step 19490: {'lr': 0.00019995544291897402, 'samples': 623680, 'steps': 1218, 'loss/train': 2.243344783782959} -09/20/2021 18:42:31 - INFO - __main__ - Step 19491: {'lr': 0.00019995544291897402, 'samples': 623712, 'steps': 1218, 'loss/train': 3.2969210147857666} -09/20/2021 18:42:32 - INFO - __main__ - Step 19492: {'lr': 0.00019995544291897402, 'samples': 623744, 'steps': 1218, 'loss/train': 3.474977731704712} -09/20/2021 18:42:32 - INFO - __main__ - Step 19493: {'lr': 0.00019995544291897402, 'samples': 623776, 'steps': 1218, 'loss/train': 3.4589998722076416} -09/20/2021 18:42:33 - INFO - __main__ - Step 19494: {'lr': 0.00019995544291897402, 'samples': 623808, 'steps': 1218, 'loss/train': 3.2676782608032227} -09/20/2021 18:42:34 - INFO - __main__ - Step 19495: {'lr': 0.00019995544291897402, 'samples': 623840, 'steps': 1218, 'loss/train': 4.278071880340576} -09/20/2021 18:42:35 - INFO - __main__ - Step 19496: {'lr': 0.00019995544291897402, 'samples': 623872, 'steps': 1218, 'loss/train': 1.588039755821228} -09/20/2021 18:42:35 - INFO - __main__ - Step 19497: {'lr': 0.00019995544291897402, 'samples': 623904, 'steps': 1218, 'loss/train': 3.6125986576080322} -09/20/2021 18:42:36 - INFO - __main__ - Step 19498: {'lr': 0.00019995544291897402, 'samples': 623936, 'steps': 1218, 'loss/train': 2.23600435256958} -09/20/2021 18:42:38 - INFO - __main__ - Step 19499: {'lr': 0.00019995544291897402, 'samples': 623968, 'steps': 1218, 'loss/train': 3.8830816745758057} -09/20/2021 18:42:38 - INFO - __main__ - Step 19500: {'lr': 0.00019995544291897402, 'samples': 624000, 'steps': 1218, 'loss/train': 2.789881467819214} -09/20/2021 18:42:39 - INFO - __main__ - Step 19501: {'lr': 0.00019995544291897402, 'samples': 624032, 'steps': 1218, 'loss/train': 3.3415894508361816} -09/20/2021 18:42:40 - INFO - __main__ - Step 19502: {'lr': 0.00019995544291897402, 'samples': 624064, 'steps': 1218, 'loss/train': 4.996649742126465} -09/20/2021 18:42:41 - INFO - __main__ - Step 19503: {'lr': 0.00019995544291897402, 'samples': 624096, 'steps': 1218, 'loss/train': 2.4078726768493652} -09/20/2021 18:42:41 - INFO - __main__ - Step 19504: {'lr': 0.00019995544291897402, 'samples': 624128, 'steps': 1218, 'loss/train': 3.716783285140991} -09/20/2021 18:42:42 - INFO - __main__ - Step 19505: {'lr': 0.00019995525231488064, 'samples': 624160, 'steps': 1219, 'loss/train': 3.579174518585205} -09/20/2021 18:42:43 - INFO - __main__ - Step 19506: {'lr': 0.00019995525231488064, 'samples': 624192, 'steps': 1219, 'loss/train': 3.6964855194091797} -09/20/2021 18:42:44 - INFO - __main__ - Step 19507: {'lr': 0.00019995525231488064, 'samples': 624224, 'steps': 1219, 'loss/train': 3.99749493598938} -09/20/2021 18:42:44 - INFO - __main__ - Step 19508: {'lr': 0.00019995525231488064, 'samples': 624256, 'steps': 1219, 'loss/train': 3.558077812194824} -09/20/2021 18:42:45 - INFO - __main__ - Step 19509: {'lr': 0.00019995525231488064, 'samples': 624288, 'steps': 1219, 'loss/train': 2.986067771911621} -09/20/2021 18:42:46 - INFO - __main__ - Step 19510: {'lr': 0.00019995525231488064, 'samples': 624320, 'steps': 1219, 'loss/train': 4.04404878616333} -09/20/2021 18:42:47 - INFO - __main__ - Step 19511: {'lr': 0.00019995525231488064, 'samples': 624352, 'steps': 1219, 'loss/train': 3.4200081825256348} -09/20/2021 18:42:47 - INFO - __main__ - Step 19512: {'lr': 0.00019995525231488064, 'samples': 624384, 'steps': 1219, 'loss/train': 2.9286420345306396} -09/20/2021 18:42:48 - INFO - __main__ - Step 19513: {'lr': 0.00019995525231488064, 'samples': 624416, 'steps': 1219, 'loss/train': 2.681788921356201} -09/20/2021 18:42:49 - INFO - __main__ - Step 19514: {'lr': 0.00019995525231488064, 'samples': 624448, 'steps': 1219, 'loss/train': 3.591670513153076} -09/20/2021 18:42:50 - INFO - __main__ - Step 19515: {'lr': 0.00019995525231488064, 'samples': 624480, 'steps': 1219, 'loss/train': 2.73603892326355} -09/20/2021 18:42:50 - INFO - __main__ - Step 19516: {'lr': 0.00019995525231488064, 'samples': 624512, 'steps': 1219, 'loss/train': 2.5903079509735107} -09/20/2021 18:42:51 - INFO - __main__ - Step 19517: {'lr': 0.00019995525231488064, 'samples': 624544, 'steps': 1219, 'loss/train': 2.537144899368286} -09/20/2021 18:42:52 - INFO - __main__ - Step 19518: {'lr': 0.00019995525231488064, 'samples': 624576, 'steps': 1219, 'loss/train': 4.312484264373779} -09/20/2021 18:42:53 - INFO - __main__ - Step 19519: {'lr': 0.00019995525231488064, 'samples': 624608, 'steps': 1219, 'loss/train': 4.267457962036133} -09/20/2021 18:42:53 - INFO - __main__ - Step 19520: {'lr': 0.00019995525231488064, 'samples': 624640, 'steps': 1219, 'loss/train': 2.935166120529175} -09/20/2021 18:42:54 - INFO - __main__ - Step 19521: {'lr': 0.0001999550613040697, 'samples': 624672, 'steps': 1220, 'loss/train': 4.4982099533081055} -09/20/2021 18:42:55 - INFO - __main__ - Step 19522: {'lr': 0.0001999550613040697, 'samples': 624704, 'steps': 1220, 'loss/train': 3.907426118850708} -09/20/2021 18:42:56 - INFO - __main__ - Step 19523: {'lr': 0.0001999550613040697, 'samples': 624736, 'steps': 1220, 'loss/train': 3.768761396408081} -09/20/2021 18:42:57 - INFO - __main__ - Step 19524: {'lr': 0.0001999550613040697, 'samples': 624768, 'steps': 1220, 'loss/train': 3.321042776107788} -09/20/2021 18:42:57 - INFO - __main__ - Step 19525: {'lr': 0.0001999550613040697, 'samples': 624800, 'steps': 1220, 'loss/train': 3.647573471069336} -09/20/2021 18:42:58 - INFO - __main__ - Step 19526: {'lr': 0.0001999550613040697, 'samples': 624832, 'steps': 1220, 'loss/train': 2.3636207580566406} -09/20/2021 18:42:59 - INFO - __main__ - Step 19527: {'lr': 0.0001999550613040697, 'samples': 624864, 'steps': 1220, 'loss/train': 3.162649154663086} -09/20/2021 18:43:00 - INFO - __main__ - Step 19528: {'lr': 0.0001999550613040697, 'samples': 624896, 'steps': 1220, 'loss/train': 4.372494220733643} -09/20/2021 18:43:01 - INFO - __main__ - Step 19529: {'lr': 0.0001999550613040697, 'samples': 624928, 'steps': 1220, 'loss/train': 3.735001802444458} -09/20/2021 18:43:02 - INFO - __main__ - Step 19530: {'lr': 0.0001999550613040697, 'samples': 624960, 'steps': 1220, 'loss/train': 3.8939154148101807} -09/20/2021 18:43:03 - INFO - __main__ - Step 19531: {'lr': 0.0001999550613040697, 'samples': 624992, 'steps': 1220, 'loss/train': 4.038029670715332} -09/20/2021 18:43:03 - INFO - __main__ - Step 19532: {'lr': 0.0001999550613040697, 'samples': 625024, 'steps': 1220, 'loss/train': 2.8840978145599365} -09/20/2021 18:43:04 - INFO - __main__ - Step 19533: {'lr': 0.0001999550613040697, 'samples': 625056, 'steps': 1220, 'loss/train': 3.1118927001953125} -09/20/2021 18:43:05 - INFO - __main__ - Step 19534: {'lr': 0.0001999550613040697, 'samples': 625088, 'steps': 1220, 'loss/train': 3.6691067218780518} -09/20/2021 18:43:06 - INFO - __main__ - Step 19535: {'lr': 0.0001999550613040697, 'samples': 625120, 'steps': 1220, 'loss/train': 3.800143003463745} -09/20/2021 18:43:06 - INFO - __main__ - Step 19536: {'lr': 0.0001999550613040697, 'samples': 625152, 'steps': 1220, 'loss/train': 1.1580079793930054} -09/20/2021 18:43:07 - INFO - __main__ - Step 19537: {'lr': 0.00019995486988654202, 'samples': 625184, 'steps': 1221, 'loss/train': 3.5286474227905273} -09/20/2021 18:43:08 - INFO - __main__ - Step 19538: {'lr': 0.00019995486988654202, 'samples': 625216, 'steps': 1221, 'loss/train': 3.6108052730560303} -09/20/2021 18:43:09 - INFO - __main__ - Step 19539: {'lr': 0.00019995486988654202, 'samples': 625248, 'steps': 1221, 'loss/train': 4.748880863189697} -09/20/2021 18:43:09 - INFO - __main__ - Step 19540: {'lr': 0.00019995486988654202, 'samples': 625280, 'steps': 1221, 'loss/train': 3.1163904666900635} -09/20/2021 18:43:10 - INFO - __main__ - Step 19541: {'lr': 0.00019995486988654202, 'samples': 625312, 'steps': 1221, 'loss/train': 2.9361395835876465} -09/20/2021 18:43:11 - INFO - __main__ - Step 19542: {'lr': 0.00019995486988654202, 'samples': 625344, 'steps': 1221, 'loss/train': 3.457167387008667} -09/20/2021 18:43:12 - INFO - __main__ - Step 19543: {'lr': 0.00019995486988654202, 'samples': 625376, 'steps': 1221, 'loss/train': 3.2533164024353027} -09/20/2021 18:43:12 - INFO - __main__ - Step 19544: {'lr': 0.00019995486988654202, 'samples': 625408, 'steps': 1221, 'loss/train': 3.259366750717163} -09/20/2021 18:43:13 - INFO - __main__ - Step 19545: {'lr': 0.00019995486988654202, 'samples': 625440, 'steps': 1221, 'loss/train': 3.9500787258148193} -09/20/2021 18:43:14 - INFO - __main__ - Step 19546: {'lr': 0.00019995486988654202, 'samples': 625472, 'steps': 1221, 'loss/train': 3.0024592876434326} -09/20/2021 18:43:15 - INFO - __main__ - Step 19547: {'lr': 0.00019995486988654202, 'samples': 625504, 'steps': 1221, 'loss/train': 3.9001591205596924} -09/20/2021 18:43:15 - INFO - __main__ - Step 19548: {'lr': 0.00019995486988654202, 'samples': 625536, 'steps': 1221, 'loss/train': 2.3912508487701416} -09/20/2021 18:43:16 - INFO - __main__ - Step 19549: {'lr': 0.00019995486988654202, 'samples': 625568, 'steps': 1221, 'loss/train': 0.8379008173942566} -09/20/2021 18:43:17 - INFO - __main__ - Step 19550: {'lr': 0.00019995486988654202, 'samples': 625600, 'steps': 1221, 'loss/train': 0.5300782322883606} -09/20/2021 18:43:18 - INFO - __main__ - Step 19551: {'lr': 0.00019995486988654202, 'samples': 625632, 'steps': 1221, 'loss/train': 2.2612221240997314} -09/20/2021 18:43:18 - INFO - __main__ - Step 19552: {'lr': 0.00019995486988654202, 'samples': 625664, 'steps': 1221, 'loss/train': 3.480090379714966} -09/20/2021 18:43:19 - INFO - __main__ - Step 19553: {'lr': 0.00019995467806229838, 'samples': 625696, 'steps': 1222, 'loss/train': 3.0931055545806885} -09/20/2021 18:43:20 - INFO - __main__ - Step 19554: {'lr': 0.00019995467806229838, 'samples': 625728, 'steps': 1222, 'loss/train': 2.1936662197113037} -09/20/2021 18:43:21 - INFO - __main__ - Step 19555: {'lr': 0.00019995467806229838, 'samples': 625760, 'steps': 1222, 'loss/train': 3.195770263671875} -09/20/2021 18:43:22 - INFO - __main__ - Step 19556: {'lr': 0.00019995467806229838, 'samples': 625792, 'steps': 1222, 'loss/train': 3.226412296295166} -09/20/2021 18:43:22 - INFO - __main__ - Step 19557: {'lr': 0.00019995467806229838, 'samples': 625824, 'steps': 1222, 'loss/train': 3.5433943271636963} -09/20/2021 18:43:23 - INFO - __main__ - Step 19558: {'lr': 0.00019995467806229838, 'samples': 625856, 'steps': 1222, 'loss/train': 3.4706342220306396} -09/20/2021 18:43:24 - INFO - __main__ - Step 19559: {'lr': 0.00019995467806229838, 'samples': 625888, 'steps': 1222, 'loss/train': 3.5862977504730225} -09/20/2021 18:43:25 - INFO - __main__ - Step 19560: {'lr': 0.00019995467806229838, 'samples': 625920, 'steps': 1222, 'loss/train': 4.10203742980957} -09/20/2021 18:43:26 - INFO - __main__ - Step 19561: {'lr': 0.00019995467806229838, 'samples': 625952, 'steps': 1222, 'loss/train': 3.0271003246307373} -09/20/2021 18:43:27 - INFO - __main__ - Step 19562: {'lr': 0.00019995467806229838, 'samples': 625984, 'steps': 1222, 'loss/train': 3.028878927230835} -09/20/2021 18:43:27 - INFO - __main__ - Step 19563: {'lr': 0.00019995467806229838, 'samples': 626016, 'steps': 1222, 'loss/train': 3.688851833343506} -09/20/2021 18:43:28 - INFO - __main__ - Step 19564: {'lr': 0.00019995467806229838, 'samples': 626048, 'steps': 1222, 'loss/train': 3.289156913757324} -09/20/2021 18:43:29 - INFO - __main__ - Step 19565: {'lr': 0.00019995467806229838, 'samples': 626080, 'steps': 1222, 'loss/train': 3.471903085708618} -09/20/2021 18:43:30 - INFO - __main__ - Step 19566: {'lr': 0.00019995467806229838, 'samples': 626112, 'steps': 1222, 'loss/train': 2.4175727367401123} -09/20/2021 18:43:30 - INFO - __main__ - Step 19567: {'lr': 0.00019995467806229838, 'samples': 626144, 'steps': 1222, 'loss/train': 3.288316249847412} -09/20/2021 18:43:31 - INFO - __main__ - Step 19568: {'lr': 0.00019995467806229838, 'samples': 626176, 'steps': 1222, 'loss/train': 2.432422161102295} -09/20/2021 18:43:32 - INFO - __main__ - Step 19569: {'lr': 0.0001999544858313395, 'samples': 626208, 'steps': 1223, 'loss/train': 3.58838152885437} -09/20/2021 18:43:33 - INFO - __main__ - Step 19570: {'lr': 0.0001999544858313395, 'samples': 626240, 'steps': 1223, 'loss/train': 3.2152624130249023} -09/20/2021 18:43:34 - INFO - __main__ - Step 19571: {'lr': 0.0001999544858313395, 'samples': 626272, 'steps': 1223, 'loss/train': 3.4648549556732178} -09/20/2021 18:43:34 - INFO - __main__ - Step 19572: {'lr': 0.0001999544858313395, 'samples': 626304, 'steps': 1223, 'loss/train': 3.366271734237671} -09/20/2021 18:43:35 - INFO - __main__ - Step 19573: {'lr': 0.0001999544858313395, 'samples': 626336, 'steps': 1223, 'loss/train': 2.7354846000671387} -09/20/2021 18:43:36 - INFO - __main__ - Step 19574: {'lr': 0.0001999544858313395, 'samples': 626368, 'steps': 1223, 'loss/train': 3.501734972000122} -09/20/2021 18:43:37 - INFO - __main__ - Step 19575: {'lr': 0.0001999544858313395, 'samples': 626400, 'steps': 1223, 'loss/train': 4.894068241119385} -09/20/2021 18:43:37 - INFO - __main__ - Step 19576: {'lr': 0.0001999544858313395, 'samples': 626432, 'steps': 1223, 'loss/train': 3.627528429031372} -09/20/2021 18:43:38 - INFO - __main__ - Step 19577: {'lr': 0.0001999544858313395, 'samples': 626464, 'steps': 1223, 'loss/train': 4.018716812133789} -09/20/2021 18:43:39 - INFO - __main__ - Step 19578: {'lr': 0.0001999544858313395, 'samples': 626496, 'steps': 1223, 'loss/train': 3.693922519683838} -09/20/2021 18:43:40 - INFO - __main__ - Step 19579: {'lr': 0.0001999544858313395, 'samples': 626528, 'steps': 1223, 'loss/train': 3.7834532260894775} -09/20/2021 18:43:40 - INFO - __main__ - Step 19580: {'lr': 0.0001999544858313395, 'samples': 626560, 'steps': 1223, 'loss/train': 3.913832902908325} -09/20/2021 18:43:41 - INFO - __main__ - Step 19581: {'lr': 0.0001999544858313395, 'samples': 626592, 'steps': 1223, 'loss/train': 4.479452133178711} -09/20/2021 18:43:42 - INFO - __main__ - Step 19582: {'lr': 0.0001999544858313395, 'samples': 626624, 'steps': 1223, 'loss/train': 3.2341089248657227} -09/20/2021 18:43:43 - INFO - __main__ - Step 19583: {'lr': 0.0001999544858313395, 'samples': 626656, 'steps': 1223, 'loss/train': 3.6186752319335938} -09/20/2021 18:43:43 - INFO - __main__ - Step 19584: {'lr': 0.0001999544858313395, 'samples': 626688, 'steps': 1223, 'loss/train': 4.207374572753906} -09/20/2021 18:43:44 - INFO - __main__ - Step 19585: {'lr': 0.00019995429319366622, 'samples': 626720, 'steps': 1224, 'loss/train': 3.8663747310638428} -09/20/2021 18:43:45 - INFO - __main__ - Step 19586: {'lr': 0.00019995429319366622, 'samples': 626752, 'steps': 1224, 'loss/train': 2.766646146774292} -09/20/2021 18:43:46 - INFO - __main__ - Step 19587: {'lr': 0.00019995429319366622, 'samples': 626784, 'steps': 1224, 'loss/train': 3.2996206283569336} -09/20/2021 18:43:46 - INFO - __main__ - Step 19588: {'lr': 0.00019995429319366622, 'samples': 626816, 'steps': 1224, 'loss/train': 4.04330587387085} -09/20/2021 18:43:47 - INFO - __main__ - Step 19589: {'lr': 0.00019995429319366622, 'samples': 626848, 'steps': 1224, 'loss/train': 3.9400806427001953} -09/20/2021 18:43:48 - INFO - __main__ - Step 19590: {'lr': 0.00019995429319366622, 'samples': 626880, 'steps': 1224, 'loss/train': 3.824267625808716} -09/20/2021 18:43:49 - INFO - __main__ - Step 19591: {'lr': 0.00019995429319366622, 'samples': 626912, 'steps': 1224, 'loss/train': 3.4186291694641113} -09/20/2021 18:43:50 - INFO - __main__ - Step 19592: {'lr': 0.00019995429319366622, 'samples': 626944, 'steps': 1224, 'loss/train': 3.4590883255004883} -09/20/2021 18:43:51 - INFO - __main__ - Step 19593: {'lr': 0.00019995429319366622, 'samples': 626976, 'steps': 1224, 'loss/train': 3.4996156692504883} -09/20/2021 18:43:51 - INFO - __main__ - Step 19594: {'lr': 0.00019995429319366622, 'samples': 627008, 'steps': 1224, 'loss/train': 2.9777719974517822} -09/20/2021 18:43:52 - INFO - __main__ - Step 19595: {'lr': 0.00019995429319366622, 'samples': 627040, 'steps': 1224, 'loss/train': 3.2152788639068604} -09/20/2021 18:43:53 - INFO - __main__ - Step 19596: {'lr': 0.00019995429319366622, 'samples': 627072, 'steps': 1224, 'loss/train': 4.271734237670898} -09/20/2021 18:43:54 - INFO - __main__ - Step 19597: {'lr': 0.00019995429319366622, 'samples': 627104, 'steps': 1224, 'loss/train': 3.023707866668701} -09/20/2021 18:43:54 - INFO - __main__ - Step 19598: {'lr': 0.00019995429319366622, 'samples': 627136, 'steps': 1224, 'loss/train': 3.7605090141296387} -09/20/2021 18:43:55 - INFO - __main__ - Step 19599: {'lr': 0.00019995429319366622, 'samples': 627168, 'steps': 1224, 'loss/train': 2.625727415084839} -09/20/2021 18:43:56 - INFO - __main__ - Step 19600: {'lr': 0.00019995429319366622, 'samples': 627200, 'steps': 1224, 'loss/train': 3.6886751651763916} -09/20/2021 18:43:57 - INFO - __main__ - Step 19601: {'lr': 0.00019995410014927932, 'samples': 627232, 'steps': 1225, 'loss/train': 5.0152106285095215} -09/20/2021 18:43:58 - INFO - __main__ - Step 19602: {'lr': 0.00019995410014927932, 'samples': 627264, 'steps': 1225, 'loss/train': 3.1506712436676025} -09/20/2021 18:43:58 - INFO - __main__ - Step 19603: {'lr': 0.00019995410014927932, 'samples': 627296, 'steps': 1225, 'loss/train': 3.031625509262085} -09/20/2021 18:43:59 - INFO - __main__ - Step 19604: {'lr': 0.00019995410014927932, 'samples': 627328, 'steps': 1225, 'loss/train': 3.088881015777588} -09/20/2021 18:44:00 - INFO - __main__ - Step 19605: {'lr': 0.00019995410014927932, 'samples': 627360, 'steps': 1225, 'loss/train': 5.008078575134277} -09/20/2021 18:44:01 - INFO - __main__ - Step 19606: {'lr': 0.00019995410014927932, 'samples': 627392, 'steps': 1225, 'loss/train': 2.340399742126465} -09/20/2021 18:44:01 - INFO - __main__ - Step 19607: {'lr': 0.00019995410014927932, 'samples': 627424, 'steps': 1225, 'loss/train': 3.1820356845855713} -09/20/2021 18:44:02 - INFO - __main__ - Step 19608: {'lr': 0.00019995410014927932, 'samples': 627456, 'steps': 1225, 'loss/train': 5.583129405975342} -09/20/2021 18:44:03 - INFO - __main__ - Step 19609: {'lr': 0.00019995410014927932, 'samples': 627488, 'steps': 1225, 'loss/train': 4.668895244598389} -09/20/2021 18:44:04 - INFO - __main__ - Step 19610: {'lr': 0.00019995410014927932, 'samples': 627520, 'steps': 1225, 'loss/train': 3.0695600509643555} -09/20/2021 18:44:04 - INFO - __main__ - Step 19611: {'lr': 0.00019995410014927932, 'samples': 627552, 'steps': 1225, 'loss/train': 3.174057960510254} -09/20/2021 18:44:05 - INFO - __main__ - Step 19612: {'lr': 0.00019995410014927932, 'samples': 627584, 'steps': 1225, 'loss/train': 2.5218403339385986} -09/20/2021 18:44:06 - INFO - __main__ - Step 19613: {'lr': 0.00019995410014927932, 'samples': 627616, 'steps': 1225, 'loss/train': 3.854156732559204} -09/20/2021 18:44:07 - INFO - __main__ - Step 19614: {'lr': 0.00019995410014927932, 'samples': 627648, 'steps': 1225, 'loss/train': 3.0875298976898193} -09/20/2021 18:44:07 - INFO - __main__ - Step 19615: {'lr': 0.00019995410014927932, 'samples': 627680, 'steps': 1225, 'loss/train': 4.143641471862793} -09/20/2021 18:44:08 - INFO - __main__ - Step 19616: {'lr': 0.00019995410014927932, 'samples': 627712, 'steps': 1225, 'loss/train': 2.7372519969940186} -09/20/2021 18:44:09 - INFO - __main__ - Step 19617: {'lr': 0.00019995390669817956, 'samples': 627744, 'steps': 1226, 'loss/train': 3.579479932785034} -09/20/2021 18:44:10 - INFO - __main__ - Step 19618: {'lr': 0.00019995390669817956, 'samples': 627776, 'steps': 1226, 'loss/train': 3.2313179969787598} -09/20/2021 18:44:11 - INFO - __main__ - Step 19619: {'lr': 0.00019995390669817956, 'samples': 627808, 'steps': 1226, 'loss/train': 3.435698986053467} -09/20/2021 18:44:11 - INFO - __main__ - Step 19620: {'lr': 0.00019995390669817956, 'samples': 627840, 'steps': 1226, 'loss/train': 3.3042654991149902} -09/20/2021 18:44:13 - INFO - __main__ - Step 19621: {'lr': 0.00019995390669817956, 'samples': 627872, 'steps': 1226, 'loss/train': 3.8312699794769287} -09/20/2021 18:44:13 - INFO - __main__ - Step 19622: {'lr': 0.00019995390669817956, 'samples': 627904, 'steps': 1226, 'loss/train': 5.316561222076416} -09/20/2021 18:44:14 - INFO - __main__ - Step 19623: {'lr': 0.00019995390669817956, 'samples': 627936, 'steps': 1226, 'loss/train': 3.2145910263061523} -09/20/2021 18:44:15 - INFO - __main__ - Step 19624: {'lr': 0.00019995390669817956, 'samples': 627968, 'steps': 1226, 'loss/train': 3.3630096912384033} -09/20/2021 18:44:16 - INFO - __main__ - Step 19625: {'lr': 0.00019995390669817956, 'samples': 628000, 'steps': 1226, 'loss/train': 3.286113739013672} -09/20/2021 18:44:16 - INFO - __main__ - Step 19626: {'lr': 0.00019995390669817956, 'samples': 628032, 'steps': 1226, 'loss/train': 2.955294609069824} -09/20/2021 18:44:17 - INFO - __main__ - Step 19627: {'lr': 0.00019995390669817956, 'samples': 628064, 'steps': 1226, 'loss/train': 3.069927930831909} -09/20/2021 18:44:18 - INFO - __main__ - Step 19628: {'lr': 0.00019995390669817956, 'samples': 628096, 'steps': 1226, 'loss/train': 3.788247585296631} -09/20/2021 18:44:19 - INFO - __main__ - Step 19629: {'lr': 0.00019995390669817956, 'samples': 628128, 'steps': 1226, 'loss/train': 2.213803291320801} -09/20/2021 18:44:19 - INFO - __main__ - Step 19630: {'lr': 0.00019995390669817956, 'samples': 628160, 'steps': 1226, 'loss/train': 3.185724973678589} -09/20/2021 18:44:20 - INFO - __main__ - Step 19631: {'lr': 0.00019995390669817956, 'samples': 628192, 'steps': 1226, 'loss/train': 3.2626402378082275} -09/20/2021 18:44:21 - INFO - __main__ - Step 19632: {'lr': 0.00019995390669817956, 'samples': 628224, 'steps': 1226, 'loss/train': 4.599477767944336} -09/20/2021 18:44:22 - INFO - __main__ - Step 19633: {'lr': 0.00019995371284036776, 'samples': 628256, 'steps': 1227, 'loss/train': 2.8692946434020996} -09/20/2021 18:44:22 - INFO - __main__ - Step 19634: {'lr': 0.00019995371284036776, 'samples': 628288, 'steps': 1227, 'loss/train': 3.3452694416046143} -09/20/2021 18:44:23 - INFO - __main__ - Step 19635: {'lr': 0.00019995371284036776, 'samples': 628320, 'steps': 1227, 'loss/train': 2.9429385662078857} -09/20/2021 18:44:24 - INFO - __main__ - Step 19636: {'lr': 0.00019995371284036776, 'samples': 628352, 'steps': 1227, 'loss/train': 4.688744068145752} -09/20/2021 18:44:25 - INFO - __main__ - Step 19637: {'lr': 0.00019995371284036776, 'samples': 628384, 'steps': 1227, 'loss/train': 4.26693868637085} -09/20/2021 18:44:25 - INFO - __main__ - Step 19638: {'lr': 0.00019995371284036776, 'samples': 628416, 'steps': 1227, 'loss/train': 4.081348896026611} -09/20/2021 18:44:26 - INFO - __main__ - Step 19639: {'lr': 0.00019995371284036776, 'samples': 628448, 'steps': 1227, 'loss/train': 3.4465725421905518} -09/20/2021 18:44:27 - INFO - __main__ - Step 19640: {'lr': 0.00019995371284036776, 'samples': 628480, 'steps': 1227, 'loss/train': 4.074034690856934} -09/20/2021 18:44:28 - INFO - __main__ - Step 19641: {'lr': 0.00019995371284036776, 'samples': 628512, 'steps': 1227, 'loss/train': 3.9250128269195557} -09/20/2021 18:44:28 - INFO - __main__ - Step 19642: {'lr': 0.00019995371284036776, 'samples': 628544, 'steps': 1227, 'loss/train': 3.3612968921661377} -09/20/2021 18:44:29 - INFO - __main__ - Step 19643: {'lr': 0.00019995371284036776, 'samples': 628576, 'steps': 1227, 'loss/train': 3.848378896713257} -09/20/2021 18:44:30 - INFO - __main__ - Step 19644: {'lr': 0.00019995371284036776, 'samples': 628608, 'steps': 1227, 'loss/train': 3.4145729541778564} -09/20/2021 18:44:31 - INFO - __main__ - Step 19645: {'lr': 0.00019995371284036776, 'samples': 628640, 'steps': 1227, 'loss/train': 3.686127185821533} -09/20/2021 18:44:31 - INFO - __main__ - Step 19646: {'lr': 0.00019995371284036776, 'samples': 628672, 'steps': 1227, 'loss/train': 3.734618663787842} -09/20/2021 18:44:32 - INFO - __main__ - Step 19647: {'lr': 0.00019995371284036776, 'samples': 628704, 'steps': 1227, 'loss/train': 4.716165065765381} -09/20/2021 18:44:33 - INFO - __main__ - Step 19648: {'lr': 0.00019995371284036776, 'samples': 628736, 'steps': 1227, 'loss/train': 3.633207082748413} -09/20/2021 18:44:34 - INFO - __main__ - Step 19649: {'lr': 0.0001999535185758447, 'samples': 628768, 'steps': 1228, 'loss/train': 2.3212995529174805} -09/20/2021 18:44:35 - INFO - __main__ - Step 19650: {'lr': 0.0001999535185758447, 'samples': 628800, 'steps': 1228, 'loss/train': 3.6433823108673096} -09/20/2021 18:44:35 - INFO - __main__ - Step 19651: {'lr': 0.0001999535185758447, 'samples': 628832, 'steps': 1228, 'loss/train': 3.7011680603027344} -09/20/2021 18:44:36 - INFO - __main__ - Step 19652: {'lr': 0.0001999535185758447, 'samples': 628864, 'steps': 1228, 'loss/train': 3.367793083190918} -09/20/2021 18:44:37 - INFO - __main__ - Step 19653: {'lr': 0.0001999535185758447, 'samples': 628896, 'steps': 1228, 'loss/train': 2.526578426361084} -09/20/2021 18:44:38 - INFO - __main__ - Step 19654: {'lr': 0.0001999535185758447, 'samples': 628928, 'steps': 1228, 'loss/train': 1.1281112432479858} -09/20/2021 18:44:39 - INFO - __main__ - Step 19655: {'lr': 0.0001999535185758447, 'samples': 628960, 'steps': 1228, 'loss/train': 0.9469600915908813} -09/20/2021 18:44:40 - INFO - __main__ - Step 19656: {'lr': 0.0001999535185758447, 'samples': 628992, 'steps': 1228, 'loss/train': 0.7195940017700195} -09/20/2021 18:44:40 - INFO - __main__ - Step 19657: {'lr': 0.0001999535185758447, 'samples': 629024, 'steps': 1228, 'loss/train': 3.049297571182251} -09/20/2021 18:44:41 - INFO - __main__ - Step 19658: {'lr': 0.0001999535185758447, 'samples': 629056, 'steps': 1228, 'loss/train': 3.499939203262329} -09/20/2021 18:44:42 - INFO - __main__ - Step 19659: {'lr': 0.0001999535185758447, 'samples': 629088, 'steps': 1228, 'loss/train': 3.533686637878418} -09/20/2021 18:44:43 - INFO - __main__ - Step 19660: {'lr': 0.0001999535185758447, 'samples': 629120, 'steps': 1228, 'loss/train': 4.438022136688232} -09/20/2021 18:44:43 - INFO - __main__ - Step 19661: {'lr': 0.0001999535185758447, 'samples': 629152, 'steps': 1228, 'loss/train': 4.016423225402832} -09/20/2021 18:44:44 - INFO - __main__ - Step 19662: {'lr': 0.0001999535185758447, 'samples': 629184, 'steps': 1228, 'loss/train': 0.8540397882461548} -09/20/2021 18:44:45 - INFO - __main__ - Step 19663: {'lr': 0.0001999535185758447, 'samples': 629216, 'steps': 1228, 'loss/train': 3.694592237472534} -09/20/2021 18:44:46 - INFO - __main__ - Step 19664: {'lr': 0.0001999535185758447, 'samples': 629248, 'steps': 1228, 'loss/train': 3.6624813079833984} -09/20/2021 18:44:47 - INFO - __main__ - Step 19665: {'lr': 0.00019995332390461114, 'samples': 629280, 'steps': 1229, 'loss/train': 2.766144275665283} -09/20/2021 18:44:47 - INFO - __main__ - Step 19666: {'lr': 0.00019995332390461114, 'samples': 629312, 'steps': 1229, 'loss/train': 2.9121060371398926} -09/20/2021 18:44:48 - INFO - __main__ - Step 19667: {'lr': 0.00019995332390461114, 'samples': 629344, 'steps': 1229, 'loss/train': 3.124105215072632} -09/20/2021 18:44:49 - INFO - __main__ - Step 19668: {'lr': 0.00019995332390461114, 'samples': 629376, 'steps': 1229, 'loss/train': 3.3605875968933105} -09/20/2021 18:44:50 - INFO - __main__ - Step 19669: {'lr': 0.00019995332390461114, 'samples': 629408, 'steps': 1229, 'loss/train': 3.3228864669799805} -09/20/2021 18:44:50 - INFO - __main__ - Step 19670: {'lr': 0.00019995332390461114, 'samples': 629440, 'steps': 1229, 'loss/train': 4.092309951782227} -09/20/2021 18:44:51 - INFO - __main__ - Step 19671: {'lr': 0.00019995332390461114, 'samples': 629472, 'steps': 1229, 'loss/train': 2.5696418285369873} -09/20/2021 18:44:52 - INFO - __main__ - Step 19672: {'lr': 0.00019995332390461114, 'samples': 629504, 'steps': 1229, 'loss/train': 5.302872180938721} -09/20/2021 18:44:53 - INFO - __main__ - Step 19673: {'lr': 0.00019995332390461114, 'samples': 629536, 'steps': 1229, 'loss/train': 2.7251100540161133} -09/20/2021 18:44:53 - INFO - __main__ - Step 19674: {'lr': 0.00019995332390461114, 'samples': 629568, 'steps': 1229, 'loss/train': 3.5201303958892822} -09/20/2021 18:44:54 - INFO - __main__ - Step 19675: {'lr': 0.00019995332390461114, 'samples': 629600, 'steps': 1229, 'loss/train': 2.8768579959869385} -09/20/2021 18:44:55 - INFO - __main__ - Step 19676: {'lr': 0.00019995332390461114, 'samples': 629632, 'steps': 1229, 'loss/train': 2.4812636375427246} -09/20/2021 18:44:56 - INFO - __main__ - Step 19677: {'lr': 0.00019995332390461114, 'samples': 629664, 'steps': 1229, 'loss/train': 3.0473387241363525} -09/20/2021 18:44:56 - INFO - __main__ - Step 19678: {'lr': 0.00019995332390461114, 'samples': 629696, 'steps': 1229, 'loss/train': 5.371128082275391} -09/20/2021 18:44:57 - INFO - __main__ - Step 19679: {'lr': 0.00019995332390461114, 'samples': 629728, 'steps': 1229, 'loss/train': 2.5194919109344482} -09/20/2021 18:44:58 - INFO - __main__ - Step 19680: {'lr': 0.00019995332390461114, 'samples': 629760, 'steps': 1229, 'loss/train': 3.8425004482269287} -09/20/2021 18:44:59 - INFO - __main__ - Step 19681: {'lr': 0.0001999531288266679, 'samples': 629792, 'steps': 1230, 'loss/train': 2.839589834213257} -09/20/2021 18:45:00 - INFO - __main__ - Step 19682: {'lr': 0.0001999531288266679, 'samples': 629824, 'steps': 1230, 'loss/train': 3.648496627807617} -09/20/2021 18:45:00 - INFO - __main__ - Step 19683: {'lr': 0.0001999531288266679, 'samples': 629856, 'steps': 1230, 'loss/train': 3.0917952060699463} -09/20/2021 18:45:01 - INFO - __main__ - Step 19684: {'lr': 0.0001999531288266679, 'samples': 629888, 'steps': 1230, 'loss/train': 3.6010279655456543} -09/20/2021 18:45:02 - INFO - __main__ - Step 19685: {'lr': 0.0001999531288266679, 'samples': 629920, 'steps': 1230, 'loss/train': 3.2745683193206787} -09/20/2021 18:45:03 - INFO - __main__ - Step 19686: {'lr': 0.0001999531288266679, 'samples': 629952, 'steps': 1230, 'loss/train': 3.952789545059204} -09/20/2021 18:45:04 - INFO - __main__ - Step 19687: {'lr': 0.0001999531288266679, 'samples': 629984, 'steps': 1230, 'loss/train': 3.603076934814453} -09/20/2021 18:45:05 - INFO - __main__ - Step 19688: {'lr': 0.0001999531288266679, 'samples': 630016, 'steps': 1230, 'loss/train': 3.822641372680664} -09/20/2021 18:45:05 - INFO - __main__ - Step 19689: {'lr': 0.0001999531288266679, 'samples': 630048, 'steps': 1230, 'loss/train': 3.4475040435791016} -09/20/2021 18:45:06 - INFO - __main__ - Step 19690: {'lr': 0.0001999531288266679, 'samples': 630080, 'steps': 1230, 'loss/train': 2.9775283336639404} -09/20/2021 18:45:07 - INFO - __main__ - Step 19691: {'lr': 0.0001999531288266679, 'samples': 630112, 'steps': 1230, 'loss/train': 3.409372329711914} -09/20/2021 18:45:08 - INFO - __main__ - Step 19692: {'lr': 0.0001999531288266679, 'samples': 630144, 'steps': 1230, 'loss/train': 3.3778786659240723} -09/20/2021 18:45:08 - INFO - __main__ - Step 19693: {'lr': 0.0001999531288266679, 'samples': 630176, 'steps': 1230, 'loss/train': 3.193864583969116} -09/20/2021 18:45:09 - INFO - __main__ - Step 19694: {'lr': 0.0001999531288266679, 'samples': 630208, 'steps': 1230, 'loss/train': 2.953162431716919} -09/20/2021 18:45:10 - INFO - __main__ - Step 19695: {'lr': 0.0001999531288266679, 'samples': 630240, 'steps': 1230, 'loss/train': 4.046079635620117} -09/20/2021 18:45:11 - INFO - __main__ - Step 19696: {'lr': 0.0001999531288266679, 'samples': 630272, 'steps': 1230, 'loss/train': 0.5232084393501282} -09/20/2021 18:45:11 - INFO - __main__ - Step 19697: {'lr': 0.00019995293334201577, 'samples': 630304, 'steps': 1231, 'loss/train': 3.585862159729004} -09/20/2021 18:45:12 - INFO - __main__ - Step 19698: {'lr': 0.00019995293334201577, 'samples': 630336, 'steps': 1231, 'loss/train': 2.790835380554199} -09/20/2021 18:45:13 - INFO - __main__ - Step 19699: {'lr': 0.00019995293334201577, 'samples': 630368, 'steps': 1231, 'loss/train': 4.138234615325928} -09/20/2021 18:45:14 - INFO - __main__ - Step 19700: {'lr': 0.00019995293334201577, 'samples': 630400, 'steps': 1231, 'loss/train': 3.397693157196045} -09/20/2021 18:45:14 - INFO - __main__ - Step 19701: {'lr': 0.00019995293334201577, 'samples': 630432, 'steps': 1231, 'loss/train': 3.3815224170684814} -09/20/2021 18:45:15 - INFO - __main__ - Step 19702: {'lr': 0.00019995293334201577, 'samples': 630464, 'steps': 1231, 'loss/train': 4.354177474975586} -09/20/2021 18:45:16 - INFO - __main__ - Step 19703: {'lr': 0.00019995293334201577, 'samples': 630496, 'steps': 1231, 'loss/train': 4.037302494049072} -09/20/2021 18:45:17 - INFO - __main__ - Step 19704: {'lr': 0.00019995293334201577, 'samples': 630528, 'steps': 1231, 'loss/train': 3.415451765060425} -09/20/2021 18:45:17 - INFO - __main__ - Step 19705: {'lr': 0.00019995293334201577, 'samples': 630560, 'steps': 1231, 'loss/train': 4.356948375701904} -09/20/2021 18:45:18 - INFO - __main__ - Step 19706: {'lr': 0.00019995293334201577, 'samples': 630592, 'steps': 1231, 'loss/train': 4.361517906188965} -09/20/2021 18:45:19 - INFO - __main__ - Step 19707: {'lr': 0.00019995293334201577, 'samples': 630624, 'steps': 1231, 'loss/train': 1.0224087238311768} -09/20/2021 18:45:20 - INFO - __main__ - Step 19708: {'lr': 0.00019995293334201577, 'samples': 630656, 'steps': 1231, 'loss/train': 3.412712574005127} -09/20/2021 18:45:20 - INFO - __main__ - Step 19709: {'lr': 0.00019995293334201577, 'samples': 630688, 'steps': 1231, 'loss/train': 3.132312536239624} -09/20/2021 18:45:21 - INFO - __main__ - Step 19710: {'lr': 0.00019995293334201577, 'samples': 630720, 'steps': 1231, 'loss/train': 3.136950731277466} -09/20/2021 18:45:22 - INFO - __main__ - Step 19711: {'lr': 0.00019995293334201577, 'samples': 630752, 'steps': 1231, 'loss/train': 2.9420506954193115} -09/20/2021 18:45:23 - INFO - __main__ - Step 19712: {'lr': 0.00019995293334201577, 'samples': 630784, 'steps': 1231, 'loss/train': 3.247748851776123} -09/20/2021 18:45:24 - INFO - __main__ - Step 19713: {'lr': 0.0001999527374506555, 'samples': 630816, 'steps': 1232, 'loss/train': 4.223080158233643} -09/20/2021 18:45:24 - INFO - __main__ - Step 19714: {'lr': 0.0001999527374506555, 'samples': 630848, 'steps': 1232, 'loss/train': 3.6248159408569336} -09/20/2021 18:45:25 - INFO - __main__ - Step 19715: {'lr': 0.0001999527374506555, 'samples': 630880, 'steps': 1232, 'loss/train': 4.4014081954956055} -09/20/2021 18:45:26 - INFO - __main__ - Step 19716: {'lr': 0.0001999527374506555, 'samples': 630912, 'steps': 1232, 'loss/train': 3.3766238689422607} -09/20/2021 18:45:27 - INFO - __main__ - Step 19717: {'lr': 0.0001999527374506555, 'samples': 630944, 'steps': 1232, 'loss/train': 3.3824400901794434} -09/20/2021 18:45:29 - INFO - __main__ - Step 19718: {'lr': 0.0001999527374506555, 'samples': 630976, 'steps': 1232, 'loss/train': 4.3169050216674805} -09/20/2021 18:45:29 - INFO - __main__ - Step 19719: {'lr': 0.0001999527374506555, 'samples': 631008, 'steps': 1232, 'loss/train': 3.019719123840332} -09/20/2021 18:45:30 - INFO - __main__ - Step 19720: {'lr': 0.0001999527374506555, 'samples': 631040, 'steps': 1232, 'loss/train': 2.9193899631500244} -09/20/2021 18:45:31 - INFO - __main__ - Step 19721: {'lr': 0.0001999527374506555, 'samples': 631072, 'steps': 1232, 'loss/train': 3.68617582321167} -09/20/2021 18:45:32 - INFO - __main__ - Step 19722: {'lr': 0.0001999527374506555, 'samples': 631104, 'steps': 1232, 'loss/train': 2.4803659915924072} -09/20/2021 18:45:32 - INFO - __main__ - Step 19723: {'lr': 0.0001999527374506555, 'samples': 631136, 'steps': 1232, 'loss/train': 3.278815507888794} -09/20/2021 18:45:33 - INFO - __main__ - Step 19724: {'lr': 0.0001999527374506555, 'samples': 631168, 'steps': 1232, 'loss/train': 2.8672127723693848} -09/20/2021 18:45:34 - INFO - __main__ - Step 19725: {'lr': 0.0001999527374506555, 'samples': 631200, 'steps': 1232, 'loss/train': 5.536528587341309} -09/20/2021 18:45:35 - INFO - __main__ - Step 19726: {'lr': 0.0001999527374506555, 'samples': 631232, 'steps': 1232, 'loss/train': 3.485694169998169} -09/20/2021 18:45:35 - INFO - __main__ - Step 19727: {'lr': 0.0001999527374506555, 'samples': 631264, 'steps': 1232, 'loss/train': 0.5371040105819702} -09/20/2021 18:45:36 - INFO - __main__ - Step 19728: {'lr': 0.0001999527374506555, 'samples': 631296, 'steps': 1232, 'loss/train': 0.8414491415023804} -09/20/2021 18:45:37 - INFO - __main__ - Step 19729: {'lr': 0.000199952541152588, 'samples': 631328, 'steps': 1233, 'loss/train': 0.7075017690658569} -09/20/2021 18:45:38 - INFO - __main__ - Step 19730: {'lr': 0.000199952541152588, 'samples': 631360, 'steps': 1233, 'loss/train': 1.508592128753662} -09/20/2021 18:45:38 - INFO - __main__ - Step 19731: {'lr': 0.000199952541152588, 'samples': 631392, 'steps': 1233, 'loss/train': 2.9425342082977295} -09/20/2021 18:45:39 - INFO - __main__ - Step 19732: {'lr': 0.000199952541152588, 'samples': 631424, 'steps': 1233, 'loss/train': 3.337822914123535} -09/20/2021 18:45:40 - INFO - __main__ - Step 19733: {'lr': 0.000199952541152588, 'samples': 631456, 'steps': 1233, 'loss/train': 3.0726449489593506} -09/20/2021 18:45:41 - INFO - __main__ - Step 19734: {'lr': 0.000199952541152588, 'samples': 631488, 'steps': 1233, 'loss/train': 4.53873872756958} -09/20/2021 18:45:41 - INFO - __main__ - Step 19735: {'lr': 0.000199952541152588, 'samples': 631520, 'steps': 1233, 'loss/train': 3.279761791229248} -09/20/2021 18:45:42 - INFO - __main__ - Step 19736: {'lr': 0.000199952541152588, 'samples': 631552, 'steps': 1233, 'loss/train': 3.121643543243408} -09/20/2021 18:45:43 - INFO - __main__ - Step 19737: {'lr': 0.000199952541152588, 'samples': 631584, 'steps': 1233, 'loss/train': 3.2913968563079834} -09/20/2021 18:45:44 - INFO - __main__ - Step 19738: {'lr': 0.000199952541152588, 'samples': 631616, 'steps': 1233, 'loss/train': 5.327988624572754} -09/20/2021 18:45:44 - INFO - __main__ - Step 19739: {'lr': 0.000199952541152588, 'samples': 631648, 'steps': 1233, 'loss/train': 6.629642963409424} -09/20/2021 18:45:45 - INFO - __main__ - Step 19740: {'lr': 0.000199952541152588, 'samples': 631680, 'steps': 1233, 'loss/train': 3.210787534713745} -09/20/2021 18:45:46 - INFO - __main__ - Step 19741: {'lr': 0.000199952541152588, 'samples': 631712, 'steps': 1233, 'loss/train': 3.447678804397583} -09/20/2021 18:45:47 - INFO - __main__ - Step 19742: {'lr': 0.000199952541152588, 'samples': 631744, 'steps': 1233, 'loss/train': 3.3246405124664307} -09/20/2021 18:45:47 - INFO - __main__ - Step 19743: {'lr': 0.000199952541152588, 'samples': 631776, 'steps': 1233, 'loss/train': 3.6139135360717773} -09/20/2021 18:45:48 - INFO - __main__ - Step 19744: {'lr': 0.000199952541152588, 'samples': 631808, 'steps': 1233, 'loss/train': 3.4591972827911377} -09/20/2021 18:45:49 - INFO - __main__ - Step 19745: {'lr': 0.00019995234444781395, 'samples': 631840, 'steps': 1234, 'loss/train': 2.726424217224121} -09/20/2021 18:45:50 - INFO - __main__ - Step 19746: {'lr': 0.00019995234444781395, 'samples': 631872, 'steps': 1234, 'loss/train': 3.1957528591156006} -09/20/2021 18:45:51 - INFO - __main__ - Step 19747: {'lr': 0.00019995234444781395, 'samples': 631904, 'steps': 1234, 'loss/train': 3.288159132003784} -09/20/2021 18:45:51 - INFO - __main__ - Step 19748: {'lr': 0.00019995234444781395, 'samples': 631936, 'steps': 1234, 'loss/train': 2.9055323600769043} -09/20/2021 18:45:53 - INFO - __main__ - Step 19749: {'lr': 0.00019995234444781395, 'samples': 631968, 'steps': 1234, 'loss/train': 3.854843854904175} -09/20/2021 18:45:53 - INFO - __main__ - Step 19750: {'lr': 0.00019995234444781395, 'samples': 632000, 'steps': 1234, 'loss/train': 3.8355979919433594} -09/20/2021 18:45:54 - INFO - __main__ - Step 19751: {'lr': 0.00019995234444781395, 'samples': 632032, 'steps': 1234, 'loss/train': 2.9837019443511963} -09/20/2021 18:45:55 - INFO - __main__ - Step 19752: {'lr': 0.00019995234444781395, 'samples': 632064, 'steps': 1234, 'loss/train': 4.0325212478637695} -09/20/2021 18:45:56 - INFO - __main__ - Step 19753: {'lr': 0.00019995234444781395, 'samples': 632096, 'steps': 1234, 'loss/train': 3.7606122493743896} -09/20/2021 18:45:56 - INFO - __main__ - Step 19754: {'lr': 0.00019995234444781395, 'samples': 632128, 'steps': 1234, 'loss/train': 3.668792486190796} -09/20/2021 18:45:57 - INFO - __main__ - Step 19755: {'lr': 0.00019995234444781395, 'samples': 632160, 'steps': 1234, 'loss/train': 0.7504382133483887} -09/20/2021 18:45:58 - INFO - __main__ - Step 19756: {'lr': 0.00019995234444781395, 'samples': 632192, 'steps': 1234, 'loss/train': 4.730857849121094} -09/20/2021 18:45:59 - INFO - __main__ - Step 19757: {'lr': 0.00019995234444781395, 'samples': 632224, 'steps': 1234, 'loss/train': 0.9728838205337524} -09/20/2021 18:45:59 - INFO - __main__ - Step 19758: {'lr': 0.00019995234444781395, 'samples': 632256, 'steps': 1234, 'loss/train': 4.173002243041992} -09/20/2021 18:46:00 - INFO - __main__ - Step 19759: {'lr': 0.00019995234444781395, 'samples': 632288, 'steps': 1234, 'loss/train': 3.2826266288757324} -09/20/2021 18:46:01 - INFO - __main__ - Step 19760: {'lr': 0.00019995234444781395, 'samples': 632320, 'steps': 1234, 'loss/train': 3.729961395263672} -09/20/2021 18:46:02 - INFO - __main__ - Step 19761: {'lr': 0.0001999521473363342, 'samples': 632352, 'steps': 1235, 'loss/train': 3.0081405639648438} -09/20/2021 18:46:02 - INFO - __main__ - Step 19762: {'lr': 0.0001999521473363342, 'samples': 632384, 'steps': 1235, 'loss/train': 3.1398236751556396} -09/20/2021 18:46:03 - INFO - __main__ - Step 19763: {'lr': 0.0001999521473363342, 'samples': 632416, 'steps': 1235, 'loss/train': 3.3862242698669434} -09/20/2021 18:46:04 - INFO - __main__ - Step 19764: {'lr': 0.0001999521473363342, 'samples': 632448, 'steps': 1235, 'loss/train': 3.8450772762298584} -09/20/2021 18:46:05 - INFO - __main__ - Step 19765: {'lr': 0.0001999521473363342, 'samples': 632480, 'steps': 1235, 'loss/train': 3.334287643432617} -09/20/2021 18:46:05 - INFO - __main__ - Step 19766: {'lr': 0.0001999521473363342, 'samples': 632512, 'steps': 1235, 'loss/train': 3.4210898876190186} -09/20/2021 18:46:06 - INFO - __main__ - Step 19767: {'lr': 0.0001999521473363342, 'samples': 632544, 'steps': 1235, 'loss/train': 3.679797649383545} -09/20/2021 18:46:07 - INFO - __main__ - Step 19768: {'lr': 0.0001999521473363342, 'samples': 632576, 'steps': 1235, 'loss/train': 3.3179972171783447} -09/20/2021 18:46:08 - INFO - __main__ - Step 19769: {'lr': 0.0001999521473363342, 'samples': 632608, 'steps': 1235, 'loss/train': 3.612802743911743} -09/20/2021 18:46:08 - INFO - __main__ - Step 19770: {'lr': 0.0001999521473363342, 'samples': 632640, 'steps': 1235, 'loss/train': 3.4884109497070312} -09/20/2021 18:46:09 - INFO - __main__ - Step 19771: {'lr': 0.0001999521473363342, 'samples': 632672, 'steps': 1235, 'loss/train': 3.7748913764953613} -09/20/2021 18:46:10 - INFO - __main__ - Step 19772: {'lr': 0.0001999521473363342, 'samples': 632704, 'steps': 1235, 'loss/train': 4.055521488189697} -09/20/2021 18:46:11 - INFO - __main__ - Step 19773: {'lr': 0.0001999521473363342, 'samples': 632736, 'steps': 1235, 'loss/train': 3.7231717109680176} -09/20/2021 18:46:11 - INFO - __main__ - Step 19774: {'lr': 0.0001999521473363342, 'samples': 632768, 'steps': 1235, 'loss/train': 2.8726606369018555} -09/20/2021 18:46:12 - INFO - __main__ - Step 19775: {'lr': 0.0001999521473363342, 'samples': 632800, 'steps': 1235, 'loss/train': 3.5255954265594482} -09/20/2021 18:46:13 - INFO - __main__ - Step 19776: {'lr': 0.0001999521473363342, 'samples': 632832, 'steps': 1235, 'loss/train': 3.1983368396759033} -09/20/2021 18:46:14 - INFO - __main__ - Step 19777: {'lr': 0.00019995194981814958, 'samples': 632864, 'steps': 1236, 'loss/train': 3.6597328186035156} -09/20/2021 18:46:15 - INFO - __main__ - Step 19778: {'lr': 0.00019995194981814958, 'samples': 632896, 'steps': 1236, 'loss/train': 3.2400920391082764} -09/20/2021 18:46:15 - INFO - __main__ - Step 19779: {'lr': 0.00019995194981814958, 'samples': 632928, 'steps': 1236, 'loss/train': 2.74672794342041} -09/20/2021 18:46:17 - INFO - __main__ - Step 19780: {'lr': 0.00019995194981814958, 'samples': 632960, 'steps': 1236, 'loss/train': 3.6964316368103027} -09/20/2021 18:46:17 - INFO - __main__ - Step 19781: {'lr': 0.00019995194981814958, 'samples': 632992, 'steps': 1236, 'loss/train': 3.8424770832061768} -09/20/2021 18:46:18 - INFO - __main__ - Step 19782: {'lr': 0.00019995194981814958, 'samples': 633024, 'steps': 1236, 'loss/train': 3.9182560443878174} -09/20/2021 18:46:19 - INFO - __main__ - Step 19783: {'lr': 0.00019995194981814958, 'samples': 633056, 'steps': 1236, 'loss/train': 3.3866097927093506} -09/20/2021 18:46:20 - INFO - __main__ - Step 19784: {'lr': 0.00019995194981814958, 'samples': 633088, 'steps': 1236, 'loss/train': 3.6269593238830566} -09/20/2021 18:46:20 - INFO - __main__ - Step 19785: {'lr': 0.00019995194981814958, 'samples': 633120, 'steps': 1236, 'loss/train': 2.941723346710205} -09/20/2021 18:46:21 - INFO - __main__ - Step 19786: {'lr': 0.00019995194981814958, 'samples': 633152, 'steps': 1236, 'loss/train': 4.262610912322998} -09/20/2021 18:46:22 - INFO - __main__ - Step 19787: {'lr': 0.00019995194981814958, 'samples': 633184, 'steps': 1236, 'loss/train': 2.7206344604492188} -09/20/2021 18:46:23 - INFO - __main__ - Step 19788: {'lr': 0.00019995194981814958, 'samples': 633216, 'steps': 1236, 'loss/train': 3.5529873371124268} -09/20/2021 18:46:23 - INFO - __main__ - Step 19789: {'lr': 0.00019995194981814958, 'samples': 633248, 'steps': 1236, 'loss/train': 3.0121090412139893} -09/20/2021 18:46:24 - INFO - __main__ - Step 19790: {'lr': 0.00019995194981814958, 'samples': 633280, 'steps': 1236, 'loss/train': 4.129044532775879} -09/20/2021 18:46:25 - INFO - __main__ - Step 19791: {'lr': 0.00019995194981814958, 'samples': 633312, 'steps': 1236, 'loss/train': 2.916843891143799} -09/20/2021 18:46:26 - INFO - __main__ - Step 19792: {'lr': 0.00019995194981814958, 'samples': 633344, 'steps': 1236, 'loss/train': 3.6118600368499756} -09/20/2021 18:46:27 - INFO - __main__ - Step 19793: {'lr': 0.00019995175189326084, 'samples': 633376, 'steps': 1237, 'loss/train': 2.908818006515503} -09/20/2021 18:46:27 - INFO - __main__ - Step 19794: {'lr': 0.00019995175189326084, 'samples': 633408, 'steps': 1237, 'loss/train': 3.133284091949463} -09/20/2021 18:46:28 - INFO - __main__ - Step 19795: {'lr': 0.00019995175189326084, 'samples': 633440, 'steps': 1237, 'loss/train': 3.032539129257202} -09/20/2021 18:46:29 - INFO - __main__ - Step 19796: {'lr': 0.00019995175189326084, 'samples': 633472, 'steps': 1237, 'loss/train': 3.2683069705963135} -09/20/2021 18:46:30 - INFO - __main__ - Step 19797: {'lr': 0.00019995175189326084, 'samples': 633504, 'steps': 1237, 'loss/train': 4.743157386779785} -09/20/2021 18:46:30 - INFO - __main__ - Step 19798: {'lr': 0.00019995175189326084, 'samples': 633536, 'steps': 1237, 'loss/train': 3.835299491882324} -09/20/2021 18:46:31 - INFO - __main__ - Step 19799: {'lr': 0.00019995175189326084, 'samples': 633568, 'steps': 1237, 'loss/train': 3.807398796081543} -09/20/2021 18:46:32 - INFO - __main__ - Step 19800: {'lr': 0.00019995175189326084, 'samples': 633600, 'steps': 1237, 'loss/train': 3.362941265106201} -09/20/2021 18:46:33 - INFO - __main__ - Step 19801: {'lr': 0.00019995175189326084, 'samples': 633632, 'steps': 1237, 'loss/train': 3.345440626144409} -09/20/2021 18:46:33 - INFO - __main__ - Step 19802: {'lr': 0.00019995175189326084, 'samples': 633664, 'steps': 1237, 'loss/train': 2.7933478355407715} -09/20/2021 18:46:34 - INFO - __main__ - Step 19803: {'lr': 0.00019995175189326084, 'samples': 633696, 'steps': 1237, 'loss/train': 3.2466914653778076} -09/20/2021 18:46:35 - INFO - __main__ - Step 19804: {'lr': 0.00019995175189326084, 'samples': 633728, 'steps': 1237, 'loss/train': 3.1132655143737793} -09/20/2021 18:46:36 - INFO - __main__ - Step 19805: {'lr': 0.00019995175189326084, 'samples': 633760, 'steps': 1237, 'loss/train': 2.979024648666382} -09/20/2021 18:46:36 - INFO - __main__ - Step 19806: {'lr': 0.00019995175189326084, 'samples': 633792, 'steps': 1237, 'loss/train': 3.5776357650756836} -09/20/2021 18:46:37 - INFO - __main__ - Step 19807: {'lr': 0.00019995175189326084, 'samples': 633824, 'steps': 1237, 'loss/train': 3.6771352291107178} -09/20/2021 18:46:38 - INFO - __main__ - Step 19808: {'lr': 0.00019995175189326084, 'samples': 633856, 'steps': 1237, 'loss/train': 3.115971088409424} -09/20/2021 18:46:39 - INFO - __main__ - Step 19809: {'lr': 0.0001999515535616688, 'samples': 633888, 'steps': 1238, 'loss/train': 3.7521257400512695} -09/20/2021 18:46:39 - INFO - __main__ - Step 19810: {'lr': 0.0001999515535616688, 'samples': 633920, 'steps': 1238, 'loss/train': 3.5305073261260986} -09/20/2021 18:46:40 - INFO - __main__ - Step 19811: {'lr': 0.0001999515535616688, 'samples': 633952, 'steps': 1238, 'loss/train': 4.028987407684326} -09/20/2021 18:46:41 - INFO - __main__ - Step 19812: {'lr': 0.0001999515535616688, 'samples': 633984, 'steps': 1238, 'loss/train': 2.3397834300994873} -09/20/2021 18:46:42 - INFO - __main__ - Step 19813: {'lr': 0.0001999515535616688, 'samples': 634016, 'steps': 1238, 'loss/train': 3.50351619720459} -09/20/2021 18:46:43 - INFO - __main__ - Step 19814: {'lr': 0.0001999515535616688, 'samples': 634048, 'steps': 1238, 'loss/train': 3.9384193420410156} -09/20/2021 18:46:44 - INFO - __main__ - Step 19815: {'lr': 0.0001999515535616688, 'samples': 634080, 'steps': 1238, 'loss/train': 2.552701711654663} -09/20/2021 18:46:44 - INFO - __main__ - Step 19816: {'lr': 0.0001999515535616688, 'samples': 634112, 'steps': 1238, 'loss/train': 3.4068543910980225} -09/20/2021 18:46:45 - INFO - __main__ - Step 19817: {'lr': 0.0001999515535616688, 'samples': 634144, 'steps': 1238, 'loss/train': 3.4675662517547607} -09/20/2021 18:46:46 - INFO - __main__ - Step 19818: {'lr': 0.0001999515535616688, 'samples': 634176, 'steps': 1238, 'loss/train': 4.155468940734863} -09/20/2021 18:46:47 - INFO - __main__ - Step 19819: {'lr': 0.0001999515535616688, 'samples': 634208, 'steps': 1238, 'loss/train': 3.7580296993255615} -09/20/2021 18:46:47 - INFO - __main__ - Step 19820: {'lr': 0.0001999515535616688, 'samples': 634240, 'steps': 1238, 'loss/train': 2.962817668914795} -09/20/2021 18:46:48 - INFO - __main__ - Step 19821: {'lr': 0.0001999515535616688, 'samples': 634272, 'steps': 1238, 'loss/train': 3.3759684562683105} -09/20/2021 18:46:49 - INFO - __main__ - Step 19822: {'lr': 0.0001999515535616688, 'samples': 634304, 'steps': 1238, 'loss/train': 3.8508007526397705} -09/20/2021 18:46:50 - INFO - __main__ - Step 19823: {'lr': 0.0001999515535616688, 'samples': 634336, 'steps': 1238, 'loss/train': 3.0875656604766846} -09/20/2021 18:46:50 - INFO - __main__ - Step 19824: {'lr': 0.0001999515535616688, 'samples': 634368, 'steps': 1238, 'loss/train': 3.278319835662842} -09/20/2021 18:46:51 - INFO - __main__ - Step 19825: {'lr': 0.00019995135482337432, 'samples': 634400, 'steps': 1239, 'loss/train': 3.6793153285980225} -09/20/2021 18:46:52 - INFO - __main__ - Step 19826: {'lr': 0.00019995135482337432, 'samples': 634432, 'steps': 1239, 'loss/train': 4.103488445281982} -09/20/2021 18:46:53 - INFO - __main__ - Step 19827: {'lr': 0.00019995135482337432, 'samples': 634464, 'steps': 1239, 'loss/train': 1.5591660737991333} -09/20/2021 18:46:54 - INFO - __main__ - Step 19828: {'lr': 0.00019995135482337432, 'samples': 634496, 'steps': 1239, 'loss/train': 3.2743115425109863} -09/20/2021 18:46:54 - INFO - __main__ - Step 19829: {'lr': 0.00019995135482337432, 'samples': 634528, 'steps': 1239, 'loss/train': 3.698310136795044} -09/20/2021 18:46:55 - INFO - __main__ - Step 19830: {'lr': 0.00019995135482337432, 'samples': 634560, 'steps': 1239, 'loss/train': 1.7479346990585327} -09/20/2021 18:46:56 - INFO - __main__ - Step 19831: {'lr': 0.00019995135482337432, 'samples': 634592, 'steps': 1239, 'loss/train': 3.6762962341308594} -09/20/2021 18:46:57 - INFO - __main__ - Step 19832: {'lr': 0.00019995135482337432, 'samples': 634624, 'steps': 1239, 'loss/train': 3.5563650131225586} -09/20/2021 18:46:57 - INFO - __main__ - Step 19833: {'lr': 0.00019995135482337432, 'samples': 634656, 'steps': 1239, 'loss/train': 3.0615732669830322} -09/20/2021 18:46:58 - INFO - __main__ - Step 19834: {'lr': 0.00019995135482337432, 'samples': 634688, 'steps': 1239, 'loss/train': 3.6478123664855957} -09/20/2021 18:46:59 - INFO - __main__ - Step 19835: {'lr': 0.00019995135482337432, 'samples': 634720, 'steps': 1239, 'loss/train': 3.792910575866699} -09/20/2021 18:47:00 - INFO - __main__ - Step 19836: {'lr': 0.00019995135482337432, 'samples': 634752, 'steps': 1239, 'loss/train': 2.674755096435547} -09/20/2021 18:47:00 - INFO - __main__ - Step 19837: {'lr': 0.00019995135482337432, 'samples': 634784, 'steps': 1239, 'loss/train': 3.1063730716705322} -09/20/2021 18:47:01 - INFO - __main__ - Step 19838: {'lr': 0.00019995135482337432, 'samples': 634816, 'steps': 1239, 'loss/train': 3.5572991371154785} -09/20/2021 18:47:02 - INFO - __main__ - Step 19839: {'lr': 0.00019995135482337432, 'samples': 634848, 'steps': 1239, 'loss/train': 3.2132420539855957} -09/20/2021 18:47:03 - INFO - __main__ - Step 19840: {'lr': 0.00019995135482337432, 'samples': 634880, 'steps': 1239, 'loss/train': 3.2320921421051025} -09/20/2021 18:47:03 - INFO - __main__ - Step 19841: {'lr': 0.00019995115567837814, 'samples': 634912, 'steps': 1240, 'loss/train': 3.342949390411377} -09/20/2021 18:47:04 - INFO - __main__ - Step 19842: {'lr': 0.00019995115567837814, 'samples': 634944, 'steps': 1240, 'loss/train': 3.200878858566284} -09/20/2021 18:47:06 - INFO - __main__ - Step 19843: {'lr': 0.00019995115567837814, 'samples': 634976, 'steps': 1240, 'loss/train': 3.320463180541992} -09/20/2021 18:47:06 - INFO - __main__ - Step 19844: {'lr': 0.00019995115567837814, 'samples': 635008, 'steps': 1240, 'loss/train': 3.213512659072876} -09/20/2021 18:47:07 - INFO - __main__ - Step 19845: {'lr': 0.00019995115567837814, 'samples': 635040, 'steps': 1240, 'loss/train': 2.743471622467041} -09/20/2021 18:47:08 - INFO - __main__ - Step 19846: {'lr': 0.00019995115567837814, 'samples': 635072, 'steps': 1240, 'loss/train': 3.581164836883545} -09/20/2021 18:47:09 - INFO - __main__ - Step 19847: {'lr': 0.00019995115567837814, 'samples': 635104, 'steps': 1240, 'loss/train': 3.4780750274658203} -09/20/2021 18:47:09 - INFO - __main__ - Step 19848: {'lr': 0.00019995115567837814, 'samples': 635136, 'steps': 1240, 'loss/train': 3.9640979766845703} -09/20/2021 18:47:10 - INFO - __main__ - Step 19849: {'lr': 0.00019995115567837814, 'samples': 635168, 'steps': 1240, 'loss/train': 3.6680593490600586} -09/20/2021 18:47:11 - INFO - __main__ - Step 19850: {'lr': 0.00019995115567837814, 'samples': 635200, 'steps': 1240, 'loss/train': 3.501051664352417} -09/20/2021 18:47:12 - INFO - __main__ - Step 19851: {'lr': 0.00019995115567837814, 'samples': 635232, 'steps': 1240, 'loss/train': 3.1086511611938477} -09/20/2021 18:47:12 - INFO - __main__ - Step 19852: {'lr': 0.00019995115567837814, 'samples': 635264, 'steps': 1240, 'loss/train': 3.5658364295959473} -09/20/2021 18:47:13 - INFO - __main__ - Step 19853: {'lr': 0.00019995115567837814, 'samples': 635296, 'steps': 1240, 'loss/train': 3.066410541534424} -09/20/2021 18:47:14 - INFO - __main__ - Step 19854: {'lr': 0.00019995115567837814, 'samples': 635328, 'steps': 1240, 'loss/train': 2.970987319946289} -09/20/2021 18:47:15 - INFO - __main__ - Step 19855: {'lr': 0.00019995115567837814, 'samples': 635360, 'steps': 1240, 'loss/train': 3.73370099067688} -09/20/2021 18:47:15 - INFO - __main__ - Step 19856: {'lr': 0.00019995115567837814, 'samples': 635392, 'steps': 1240, 'loss/train': 2.5081117153167725} -09/20/2021 18:47:16 - INFO - __main__ - Step 19857: {'lr': 0.00019995095612668107, 'samples': 635424, 'steps': 1241, 'loss/train': 2.5386643409729004} -09/20/2021 18:47:17 - INFO - __main__ - Step 19858: {'lr': 0.00019995095612668107, 'samples': 635456, 'steps': 1241, 'loss/train': 2.6431775093078613} -09/20/2021 18:47:18 - INFO - __main__ - Step 19859: {'lr': 0.00019995095612668107, 'samples': 635488, 'steps': 1241, 'loss/train': 3.5347177982330322} -09/20/2021 18:47:19 - INFO - __main__ - Step 19860: {'lr': 0.00019995095612668107, 'samples': 635520, 'steps': 1241, 'loss/train': 4.377525806427002} -09/20/2021 18:47:19 - INFO - __main__ - Step 19861: {'lr': 0.00019995095612668107, 'samples': 635552, 'steps': 1241, 'loss/train': 0.9502304792404175} -09/20/2021 18:47:20 - INFO - __main__ - Step 19862: {'lr': 0.00019995095612668107, 'samples': 635584, 'steps': 1241, 'loss/train': 1.1868449449539185} -09/20/2021 18:47:21 - INFO - __main__ - Step 19863: {'lr': 0.00019995095612668107, 'samples': 635616, 'steps': 1241, 'loss/train': 0.6097865104675293} -09/20/2021 18:47:22 - INFO - __main__ - Step 19864: {'lr': 0.00019995095612668107, 'samples': 635648, 'steps': 1241, 'loss/train': 1.0675921440124512} -09/20/2021 18:47:22 - INFO - __main__ - Step 19865: {'lr': 0.00019995095612668107, 'samples': 635680, 'steps': 1241, 'loss/train': 4.688595294952393} -09/20/2021 18:47:23 - INFO - __main__ - Step 19866: {'lr': 0.00019995095612668107, 'samples': 635712, 'steps': 1241, 'loss/train': 3.104755163192749} -09/20/2021 18:47:24 - INFO - __main__ - Step 19867: {'lr': 0.00019995095612668107, 'samples': 635744, 'steps': 1241, 'loss/train': 3.3346376419067383} -09/20/2021 18:47:25 - INFO - __main__ - Step 19868: {'lr': 0.00019995095612668107, 'samples': 635776, 'steps': 1241, 'loss/train': 3.185696840286255} -09/20/2021 18:47:25 - INFO - __main__ - Step 19869: {'lr': 0.00019995095612668107, 'samples': 635808, 'steps': 1241, 'loss/train': 2.9577674865722656} -09/20/2021 18:47:26 - INFO - __main__ - Step 19870: {'lr': 0.00019995095612668107, 'samples': 635840, 'steps': 1241, 'loss/train': 3.1013059616088867} -09/20/2021 18:47:27 - INFO - __main__ - Step 19871: {'lr': 0.00019995095612668107, 'samples': 635872, 'steps': 1241, 'loss/train': 2.5364925861358643} -09/20/2021 18:47:28 - INFO - __main__ - Step 19872: {'lr': 0.00019995095612668107, 'samples': 635904, 'steps': 1241, 'loss/train': 3.1519391536712646} -09/20/2021 18:47:28 - INFO - __main__ - Step 19873: {'lr': 0.00019995075616828398, 'samples': 635936, 'steps': 1242, 'loss/train': 3.032320261001587} -09/20/2021 18:47:30 - INFO - __main__ - Step 19874: {'lr': 0.00019995075616828398, 'samples': 635968, 'steps': 1242, 'loss/train': 2.7529988288879395} -09/20/2021 18:47:31 - INFO - __main__ - Step 19875: {'lr': 0.00019995075616828398, 'samples': 636000, 'steps': 1242, 'loss/train': 2.9851694107055664} -09/20/2021 18:47:31 - INFO - __main__ - Step 19876: {'lr': 0.00019995075616828398, 'samples': 636032, 'steps': 1242, 'loss/train': 3.940152168273926} -09/20/2021 18:47:32 - INFO - __main__ - Step 19877: {'lr': 0.00019995075616828398, 'samples': 636064, 'steps': 1242, 'loss/train': 2.8606789112091064} -09/20/2021 18:47:33 - INFO - __main__ - Step 19878: {'lr': 0.00019995075616828398, 'samples': 636096, 'steps': 1242, 'loss/train': 3.306532621383667} -09/20/2021 18:47:34 - INFO - __main__ - Step 19879: {'lr': 0.00019995075616828398, 'samples': 636128, 'steps': 1242, 'loss/train': 4.095481872558594} -09/20/2021 18:47:34 - INFO - __main__ - Step 19880: {'lr': 0.00019995075616828398, 'samples': 636160, 'steps': 1242, 'loss/train': 3.788623809814453} -09/20/2021 18:47:35 - INFO - __main__ - Step 19881: {'lr': 0.00019995075616828398, 'samples': 636192, 'steps': 1242, 'loss/train': 4.584547996520996} -09/20/2021 18:47:36 - INFO - __main__ - Step 19882: {'lr': 0.00019995075616828398, 'samples': 636224, 'steps': 1242, 'loss/train': 3.0785207748413086} -09/20/2021 18:47:37 - INFO - __main__ - Step 19883: {'lr': 0.00019995075616828398, 'samples': 636256, 'steps': 1242, 'loss/train': 3.7505314350128174} -09/20/2021 18:47:37 - INFO - __main__ - Step 19884: {'lr': 0.00019995075616828398, 'samples': 636288, 'steps': 1242, 'loss/train': 2.590454578399658} -09/20/2021 18:47:38 - INFO - __main__ - Step 19885: {'lr': 0.00019995075616828398, 'samples': 636320, 'steps': 1242, 'loss/train': 3.829773187637329} -09/20/2021 18:47:39 - INFO - __main__ - Step 19886: {'lr': 0.00019995075616828398, 'samples': 636352, 'steps': 1242, 'loss/train': 3.1722910404205322} -09/20/2021 18:47:40 - INFO - __main__ - Step 19887: {'lr': 0.00019995075616828398, 'samples': 636384, 'steps': 1242, 'loss/train': 4.252623081207275} -09/20/2021 18:47:40 - INFO - __main__ - Step 19888: {'lr': 0.00019995075616828398, 'samples': 636416, 'steps': 1242, 'loss/train': 2.758573055267334} -09/20/2021 18:47:41 - INFO - __main__ - Step 19889: {'lr': 0.00019995055580318763, 'samples': 636448, 'steps': 1243, 'loss/train': 3.474177598953247} -09/20/2021 18:47:42 - INFO - __main__ - Step 19890: {'lr': 0.00019995055580318763, 'samples': 636480, 'steps': 1243, 'loss/train': 3.369778871536255} -09/20/2021 18:47:43 - INFO - __main__ - Step 19891: {'lr': 0.00019995055580318763, 'samples': 636512, 'steps': 1243, 'loss/train': 3.4805240631103516} -09/20/2021 18:47:43 - INFO - __main__ - Step 19892: {'lr': 0.00019995055580318763, 'samples': 636544, 'steps': 1243, 'loss/train': 6.056352138519287} -09/20/2021 18:47:44 - INFO - __main__ - Step 19893: {'lr': 0.00019995055580318763, 'samples': 636576, 'steps': 1243, 'loss/train': 3.958432197570801} -09/20/2021 18:47:45 - INFO - __main__ - Step 19894: {'lr': 0.00019995055580318763, 'samples': 636608, 'steps': 1243, 'loss/train': 3.4962522983551025} -09/20/2021 18:47:46 - INFO - __main__ - Step 19895: {'lr': 0.00019995055580318763, 'samples': 636640, 'steps': 1243, 'loss/train': 2.9896810054779053} -09/20/2021 18:47:46 - INFO - __main__ - Step 19896: {'lr': 0.00019995055580318763, 'samples': 636672, 'steps': 1243, 'loss/train': 4.6613945960998535} -09/20/2021 18:47:47 - INFO - __main__ - Step 19897: {'lr': 0.00019995055580318763, 'samples': 636704, 'steps': 1243, 'loss/train': 3.9213085174560547} -09/20/2021 18:47:48 - INFO - __main__ - Step 19898: {'lr': 0.00019995055580318763, 'samples': 636736, 'steps': 1243, 'loss/train': 2.7678329944610596} -09/20/2021 18:47:49 - INFO - __main__ - Step 19899: {'lr': 0.00019995055580318763, 'samples': 636768, 'steps': 1243, 'loss/train': 6.441843509674072} -09/20/2021 18:47:49 - INFO - __main__ - Step 19900: {'lr': 0.00019995055580318763, 'samples': 636800, 'steps': 1243, 'loss/train': 4.132567882537842} -09/20/2021 18:47:50 - INFO - __main__ - Step 19901: {'lr': 0.00019995055580318763, 'samples': 636832, 'steps': 1243, 'loss/train': 2.645975351333618} -09/20/2021 18:47:51 - INFO - __main__ - Step 19902: {'lr': 0.00019995055580318763, 'samples': 636864, 'steps': 1243, 'loss/train': 4.512783050537109} -09/20/2021 18:47:52 - INFO - __main__ - Step 19903: {'lr': 0.00019995055580318763, 'samples': 636896, 'steps': 1243, 'loss/train': 3.6842164993286133} -09/20/2021 18:47:52 - INFO - __main__ - Step 19904: {'lr': 0.00019995055580318763, 'samples': 636928, 'steps': 1243, 'loss/train': 3.2319202423095703} -09/20/2021 18:47:53 - INFO - __main__ - Step 19905: {'lr': 0.00019995035503139288, 'samples': 636960, 'steps': 1244, 'loss/train': 3.8410093784332275} -09/20/2021 18:47:55 - INFO - __main__ - Step 19906: {'lr': 0.00019995035503139288, 'samples': 636992, 'steps': 1244, 'loss/train': 3.774308204650879} -09/20/2021 18:47:55 - INFO - __main__ - Step 19907: {'lr': 0.00019995035503139288, 'samples': 637024, 'steps': 1244, 'loss/train': 0.5420698523521423} -09/20/2021 18:47:56 - INFO - __main__ - Step 19908: {'lr': 0.00019995035503139288, 'samples': 637056, 'steps': 1244, 'loss/train': 4.7046074867248535} -09/20/2021 18:47:57 - INFO - __main__ - Step 19909: {'lr': 0.00019995035503139288, 'samples': 637088, 'steps': 1244, 'loss/train': 4.0493340492248535} -09/20/2021 18:47:58 - INFO - __main__ - Step 19910: {'lr': 0.00019995035503139288, 'samples': 637120, 'steps': 1244, 'loss/train': 3.1258885860443115} -09/20/2021 18:47:58 - INFO - __main__ - Step 19911: {'lr': 0.00019995035503139288, 'samples': 637152, 'steps': 1244, 'loss/train': 4.137821197509766} -09/20/2021 18:47:59 - INFO - __main__ - Step 19912: {'lr': 0.00019995035503139288, 'samples': 637184, 'steps': 1244, 'loss/train': 3.834972381591797} -09/20/2021 18:48:00 - INFO - __main__ - Step 19913: {'lr': 0.00019995035503139288, 'samples': 637216, 'steps': 1244, 'loss/train': 4.873311519622803} -09/20/2021 18:48:01 - INFO - __main__ - Step 19914: {'lr': 0.00019995035503139288, 'samples': 637248, 'steps': 1244, 'loss/train': 2.7032792568206787} -09/20/2021 18:48:01 - INFO - __main__ - Step 19915: {'lr': 0.00019995035503139288, 'samples': 637280, 'steps': 1244, 'loss/train': 3.6187803745269775} -09/20/2021 18:48:02 - INFO - __main__ - Step 19916: {'lr': 0.00019995035503139288, 'samples': 637312, 'steps': 1244, 'loss/train': 3.370252847671509} -09/20/2021 18:48:03 - INFO - __main__ - Step 19917: {'lr': 0.00019995035503139288, 'samples': 637344, 'steps': 1244, 'loss/train': 2.7558846473693848} -09/20/2021 18:48:04 - INFO - __main__ - Step 19918: {'lr': 0.00019995035503139288, 'samples': 637376, 'steps': 1244, 'loss/train': 3.2330894470214844} -09/20/2021 18:48:04 - INFO - __main__ - Step 19919: {'lr': 0.00019995035503139288, 'samples': 637408, 'steps': 1244, 'loss/train': 3.6638920307159424} -09/20/2021 18:48:05 - INFO - __main__ - Step 19920: {'lr': 0.00019995035503139288, 'samples': 637440, 'steps': 1244, 'loss/train': 2.7818028926849365} -09/20/2021 18:48:06 - INFO - __main__ - Step 19921: {'lr': 0.0001999501538529005, 'samples': 637472, 'steps': 1245, 'loss/train': 4.746285915374756} -09/20/2021 18:48:07 - INFO - __main__ - Step 19922: {'lr': 0.0001999501538529005, 'samples': 637504, 'steps': 1245, 'loss/train': 3.893120288848877} -09/20/2021 18:48:08 - INFO - __main__ - Step 19923: {'lr': 0.0001999501538529005, 'samples': 637536, 'steps': 1245, 'loss/train': 3.277883291244507} -09/20/2021 18:48:08 - INFO - __main__ - Step 19924: {'lr': 0.0001999501538529005, 'samples': 637568, 'steps': 1245, 'loss/train': 3.379354238510132} -09/20/2021 18:48:09 - INFO - __main__ - Step 19925: {'lr': 0.0001999501538529005, 'samples': 637600, 'steps': 1245, 'loss/train': 3.8924472332000732} -09/20/2021 18:48:10 - INFO - __main__ - Step 19926: {'lr': 0.0001999501538529005, 'samples': 637632, 'steps': 1245, 'loss/train': 4.036213397979736} -09/20/2021 18:48:11 - INFO - __main__ - Step 19927: {'lr': 0.0001999501538529005, 'samples': 637664, 'steps': 1245, 'loss/train': 4.157353401184082} -09/20/2021 18:48:11 - INFO - __main__ - Step 19928: {'lr': 0.0001999501538529005, 'samples': 637696, 'steps': 1245, 'loss/train': 3.7457261085510254} -09/20/2021 18:48:12 - INFO - __main__ - Step 19929: {'lr': 0.0001999501538529005, 'samples': 637728, 'steps': 1245, 'loss/train': 3.4361801147460938} -09/20/2021 18:48:13 - INFO - __main__ - Step 19930: {'lr': 0.0001999501538529005, 'samples': 637760, 'steps': 1245, 'loss/train': 2.934180736541748} -09/20/2021 18:48:14 - INFO - __main__ - Step 19931: {'lr': 0.0001999501538529005, 'samples': 637792, 'steps': 1245, 'loss/train': 3.3522727489471436} -09/20/2021 18:48:14 - INFO - __main__ - Step 19932: {'lr': 0.0001999501538529005, 'samples': 637824, 'steps': 1245, 'loss/train': 3.202908992767334} -09/20/2021 18:48:15 - INFO - __main__ - Step 19933: {'lr': 0.0001999501538529005, 'samples': 637856, 'steps': 1245, 'loss/train': 3.524195432662964} -09/20/2021 18:48:16 - INFO - __main__ - Step 19934: {'lr': 0.0001999501538529005, 'samples': 637888, 'steps': 1245, 'loss/train': 3.602447271347046} -09/20/2021 18:48:17 - INFO - __main__ - Step 19935: {'lr': 0.0001999501538529005, 'samples': 637920, 'steps': 1245, 'loss/train': 2.662672281265259} -09/20/2021 18:48:17 - INFO - __main__ - Step 19936: {'lr': 0.0001999501538529005, 'samples': 637952, 'steps': 1245, 'loss/train': 2.795898914337158} -09/20/2021 18:48:19 - INFO - __main__ - Step 19937: {'lr': 0.00019994995226771135, 'samples': 637984, 'steps': 1246, 'loss/train': 3.355755090713501} -09/20/2021 18:48:20 - INFO - __main__ - Step 19938: {'lr': 0.00019994995226771135, 'samples': 638016, 'steps': 1246, 'loss/train': 3.2485005855560303} -09/20/2021 18:48:20 - INFO - __main__ - Step 19939: {'lr': 0.00019994995226771135, 'samples': 638048, 'steps': 1246, 'loss/train': 4.429391384124756} -09/20/2021 18:48:21 - INFO - __main__ - Step 19940: {'lr': 0.00019994995226771135, 'samples': 638080, 'steps': 1246, 'loss/train': 1.839850664138794} -09/20/2021 18:48:22 - INFO - __main__ - Step 19941: {'lr': 0.00019994995226771135, 'samples': 638112, 'steps': 1246, 'loss/train': 3.743441343307495} -09/20/2021 18:48:23 - INFO - __main__ - Step 19942: {'lr': 0.00019994995226771135, 'samples': 638144, 'steps': 1246, 'loss/train': 3.6969311237335205} -09/20/2021 18:48:23 - INFO - __main__ - Step 19943: {'lr': 0.00019994995226771135, 'samples': 638176, 'steps': 1246, 'loss/train': 3.095745086669922} -09/20/2021 18:48:24 - INFO - __main__ - Step 19944: {'lr': 0.00019994995226771135, 'samples': 638208, 'steps': 1246, 'loss/train': 3.444490432739258} -09/20/2021 18:48:25 - INFO - __main__ - Step 19945: {'lr': 0.00019994995226771135, 'samples': 638240, 'steps': 1246, 'loss/train': 3.092743396759033} -09/20/2021 18:48:26 - INFO - __main__ - Step 19946: {'lr': 0.00019994995226771135, 'samples': 638272, 'steps': 1246, 'loss/train': 4.211426734924316} -09/20/2021 18:48:26 - INFO - __main__ - Step 19947: {'lr': 0.00019994995226771135, 'samples': 638304, 'steps': 1246, 'loss/train': 4.192225456237793} -09/20/2021 18:48:27 - INFO - __main__ - Step 19948: {'lr': 0.00019994995226771135, 'samples': 638336, 'steps': 1246, 'loss/train': 3.4791901111602783} -09/20/2021 18:48:28 - INFO - __main__ - Step 19949: {'lr': 0.00019994995226771135, 'samples': 638368, 'steps': 1246, 'loss/train': 3.4351329803466797} -09/20/2021 18:48:29 - INFO - __main__ - Step 19950: {'lr': 0.00019994995226771135, 'samples': 638400, 'steps': 1246, 'loss/train': 2.8326778411865234} -09/20/2021 18:48:29 - INFO - __main__ - Step 19951: {'lr': 0.00019994995226771135, 'samples': 638432, 'steps': 1246, 'loss/train': 3.9163036346435547} -09/20/2021 18:48:30 - INFO - __main__ - Step 19952: {'lr': 0.00019994995226771135, 'samples': 638464, 'steps': 1246, 'loss/train': 3.532607078552246} -09/20/2021 18:48:31 - INFO - __main__ - Step 19953: {'lr': 0.00019994975027582624, 'samples': 638496, 'steps': 1247, 'loss/train': 3.1962873935699463} -09/20/2021 18:48:32 - INFO - __main__ - Step 19954: {'lr': 0.00019994975027582624, 'samples': 638528, 'steps': 1247, 'loss/train': 3.1591663360595703} -09/20/2021 18:48:32 - INFO - __main__ - Step 19955: {'lr': 0.00019994975027582624, 'samples': 638560, 'steps': 1247, 'loss/train': 2.7816081047058105} -09/20/2021 18:48:33 - INFO - __main__ - Step 19956: {'lr': 0.00019994975027582624, 'samples': 638592, 'steps': 1247, 'loss/train': 4.2058234214782715} -09/20/2021 18:48:34 - INFO - __main__ - Step 19957: {'lr': 0.00019994975027582624, 'samples': 638624, 'steps': 1247, 'loss/train': 5.044713020324707} -09/20/2021 18:48:35 - INFO - __main__ - Step 19958: {'lr': 0.00019994975027582624, 'samples': 638656, 'steps': 1247, 'loss/train': 3.6409213542938232} -09/20/2021 18:48:35 - INFO - __main__ - Step 19959: {'lr': 0.00019994975027582624, 'samples': 638688, 'steps': 1247, 'loss/train': 3.0199787616729736} -09/20/2021 18:48:36 - INFO - __main__ - Step 19960: {'lr': 0.00019994975027582624, 'samples': 638720, 'steps': 1247, 'loss/train': 3.1583361625671387} -09/20/2021 18:48:37 - INFO - __main__ - Step 19961: {'lr': 0.00019994975027582624, 'samples': 638752, 'steps': 1247, 'loss/train': 4.415980815887451} -09/20/2021 18:48:38 - INFO - __main__ - Step 19962: {'lr': 0.00019994975027582624, 'samples': 638784, 'steps': 1247, 'loss/train': 4.678310394287109} -09/20/2021 18:48:38 - INFO - __main__ - Step 19963: {'lr': 0.00019994975027582624, 'samples': 638816, 'steps': 1247, 'loss/train': 3.440255641937256} -09/20/2021 18:48:39 - INFO - __main__ - Step 19964: {'lr': 0.00019994975027582624, 'samples': 638848, 'steps': 1247, 'loss/train': 2.6166865825653076} -09/20/2021 18:48:40 - INFO - __main__ - Step 19965: {'lr': 0.00019994975027582624, 'samples': 638880, 'steps': 1247, 'loss/train': 3.611346483230591} -09/20/2021 18:48:41 - INFO - __main__ - Step 19966: {'lr': 0.00019994975027582624, 'samples': 638912, 'steps': 1247, 'loss/train': 1.815905213356018} -09/20/2021 18:48:42 - INFO - __main__ - Step 19967: {'lr': 0.00019994975027582624, 'samples': 638944, 'steps': 1247, 'loss/train': 5.439666748046875} -09/20/2021 18:48:43 - INFO - __main__ - Step 19968: {'lr': 0.00019994975027582624, 'samples': 638976, 'steps': 1247, 'loss/train': 3.4435501098632812} -09/20/2021 18:48:44 - INFO - __main__ - Step 19969: {'lr': 0.00019994954787724595, 'samples': 639008, 'steps': 1248, 'loss/train': 3.2700493335723877} -09/20/2021 18:48:44 - INFO - __main__ - Step 19970: {'lr': 0.00019994954787724595, 'samples': 639040, 'steps': 1248, 'loss/train': 3.4532761573791504} -09/20/2021 18:48:45 - INFO - __main__ - Step 19971: {'lr': 0.00019994954787724595, 'samples': 639072, 'steps': 1248, 'loss/train': 2.7307846546173096} -09/20/2021 18:48:46 - INFO - __main__ - Step 19972: {'lr': 0.00019994954787724595, 'samples': 639104, 'steps': 1248, 'loss/train': 3.3709285259246826} -09/20/2021 18:48:47 - INFO - __main__ - Step 19973: {'lr': 0.00019994954787724595, 'samples': 639136, 'steps': 1248, 'loss/train': 3.8897881507873535} -09/20/2021 18:48:47 - INFO - __main__ - Step 19974: {'lr': 0.00019994954787724595, 'samples': 639168, 'steps': 1248, 'loss/train': 0.9697397947311401} -09/20/2021 18:48:48 - INFO - __main__ - Step 19975: {'lr': 0.00019994954787724595, 'samples': 639200, 'steps': 1248, 'loss/train': 3.0410594940185547} -09/20/2021 18:48:49 - INFO - __main__ - Step 19976: {'lr': 0.00019994954787724595, 'samples': 639232, 'steps': 1248, 'loss/train': 2.9788947105407715} -09/20/2021 18:48:50 - INFO - __main__ - Step 19977: {'lr': 0.00019994954787724595, 'samples': 639264, 'steps': 1248, 'loss/train': 2.8589510917663574} -09/20/2021 18:48:50 - INFO - __main__ - Step 19978: {'lr': 0.00019994954787724595, 'samples': 639296, 'steps': 1248, 'loss/train': 2.7815792560577393} -09/20/2021 18:48:51 - INFO - __main__ - Step 19979: {'lr': 0.00019994954787724595, 'samples': 639328, 'steps': 1248, 'loss/train': 3.79895281791687} -09/20/2021 18:48:52 - INFO - __main__ - Step 19980: {'lr': 0.00019994954787724595, 'samples': 639360, 'steps': 1248, 'loss/train': 4.278707504272461} -09/20/2021 18:48:53 - INFO - __main__ - Step 19981: {'lr': 0.00019994954787724595, 'samples': 639392, 'steps': 1248, 'loss/train': 3.509920597076416} -09/20/2021 18:48:53 - INFO - __main__ - Step 19982: {'lr': 0.00019994954787724595, 'samples': 639424, 'steps': 1248, 'loss/train': 2.6509175300598145} -09/20/2021 18:48:54 - INFO - __main__ - Step 19983: {'lr': 0.00019994954787724595, 'samples': 639456, 'steps': 1248, 'loss/train': 2.9314677715301514} -09/20/2021 18:48:55 - INFO - __main__ - Step 19984: {'lr': 0.00019994954787724595, 'samples': 639488, 'steps': 1248, 'loss/train': 3.335400104522705} -09/20/2021 18:48:56 - INFO - __main__ - Step 19985: {'lr': 0.00019994934507197137, 'samples': 639520, 'steps': 1249, 'loss/train': 3.1607859134674072} -09/20/2021 18:48:56 - INFO - __main__ - Step 19986: {'lr': 0.00019994934507197137, 'samples': 639552, 'steps': 1249, 'loss/train': 0.9460300207138062} -09/20/2021 18:48:57 - INFO - __main__ - Step 19987: {'lr': 0.00019994934507197137, 'samples': 639584, 'steps': 1249, 'loss/train': 2.9898183345794678} -09/20/2021 18:48:58 - INFO - __main__ - Step 19988: {'lr': 0.00019994934507197137, 'samples': 639616, 'steps': 1249, 'loss/train': 3.426914930343628} -09/20/2021 18:48:59 - INFO - __main__ - Step 19989: {'lr': 0.00019994934507197137, 'samples': 639648, 'steps': 1249, 'loss/train': 3.13081693649292} -09/20/2021 18:48:59 - INFO - __main__ - Step 19990: {'lr': 0.00019994934507197137, 'samples': 639680, 'steps': 1249, 'loss/train': 3.1178083419799805} -09/20/2021 18:49:00 - INFO - __main__ - Step 19991: {'lr': 0.00019994934507197137, 'samples': 639712, 'steps': 1249, 'loss/train': 3.9114508628845215} -09/20/2021 18:49:01 - INFO - __main__ - Step 19992: {'lr': 0.00019994934507197137, 'samples': 639744, 'steps': 1249, 'loss/train': 3.5308172702789307} -09/20/2021 18:49:02 - INFO - __main__ - Step 19993: {'lr': 0.00019994934507197137, 'samples': 639776, 'steps': 1249, 'loss/train': 3.955244302749634} -09/20/2021 18:49:02 - INFO - __main__ - Step 19994: {'lr': 0.00019994934507197137, 'samples': 639808, 'steps': 1249, 'loss/train': 2.300835609436035} -09/20/2021 18:49:03 - INFO - __main__ - Step 19995: {'lr': 0.00019994934507197137, 'samples': 639840, 'steps': 1249, 'loss/train': 4.287653923034668} -09/20/2021 18:49:04 - INFO - __main__ - Step 19996: {'lr': 0.00019994934507197137, 'samples': 639872, 'steps': 1249, 'loss/train': 2.845902681350708} -09/20/2021 18:49:05 - INFO - __main__ - Step 19997: {'lr': 0.00019994934507197137, 'samples': 639904, 'steps': 1249, 'loss/train': 3.293545961380005} -09/20/2021 18:49:06 - INFO - __main__ - Step 19998: {'lr': 0.00019994934507197137, 'samples': 639936, 'steps': 1249, 'loss/train': 3.7890048027038574} -09/20/2021 18:49:07 - INFO - __main__ - Step 19999: {'lr': 0.00019994934507197137, 'samples': 639968, 'steps': 1249, 'loss/train': 3.1318986415863037} -09/20/2021 18:49:07 - INFO - __main__ - Step 20000: {'lr': 0.00019994934507197137, 'samples': 640000, 'steps': 1249, 'loss/train': 3.595933437347412} -09/20/2021 18:49:08 - INFO - __main__ - Step 20001: {'lr': 0.00019994914186000328, 'samples': 640032, 'steps': 1250, 'loss/train': 4.106491565704346} -09/20/2021 18:49:09 - INFO - __main__ - Step 20002: {'lr': 0.00019994914186000328, 'samples': 640064, 'steps': 1250, 'loss/train': 2.878351926803589} -09/20/2021 18:49:10 - INFO - __main__ - Step 20003: {'lr': 0.00019994914186000328, 'samples': 640096, 'steps': 1250, 'loss/train': 3.375885248184204} -09/20/2021 18:49:11 - INFO - __main__ - Step 20004: {'lr': 0.00019994914186000328, 'samples': 640128, 'steps': 1250, 'loss/train': 3.776451826095581} -09/20/2021 18:49:11 - INFO - __main__ - Step 20005: {'lr': 0.00019994914186000328, 'samples': 640160, 'steps': 1250, 'loss/train': 3.4409916400909424} -09/20/2021 18:49:12 - INFO - __main__ - Step 20006: {'lr': 0.00019994914186000328, 'samples': 640192, 'steps': 1250, 'loss/train': 3.525740385055542} -09/20/2021 18:49:13 - INFO - __main__ - Step 20007: {'lr': 0.00019994914186000328, 'samples': 640224, 'steps': 1250, 'loss/train': 3.121873140335083} -09/20/2021 18:49:14 - INFO - __main__ - Step 20008: {'lr': 0.00019994914186000328, 'samples': 640256, 'steps': 1250, 'loss/train': 3.320974826812744} -09/20/2021 18:49:14 - INFO - __main__ - Step 20009: {'lr': 0.00019994914186000328, 'samples': 640288, 'steps': 1250, 'loss/train': 3.0011098384857178} -09/20/2021 18:49:15 - INFO - __main__ - Step 20010: {'lr': 0.00019994914186000328, 'samples': 640320, 'steps': 1250, 'loss/train': 2.8355507850646973} -09/20/2021 18:49:16 - INFO - __main__ - Step 20011: {'lr': 0.00019994914186000328, 'samples': 640352, 'steps': 1250, 'loss/train': 3.228675365447998} -09/20/2021 18:49:17 - INFO - __main__ - Step 20012: {'lr': 0.00019994914186000328, 'samples': 640384, 'steps': 1250, 'loss/train': 0.8079175353050232} -09/20/2021 18:49:17 - INFO - __main__ - Step 20013: {'lr': 0.00019994914186000328, 'samples': 640416, 'steps': 1250, 'loss/train': 3.4020891189575195} -09/20/2021 18:49:18 - INFO - __main__ - Step 20014: {'lr': 0.00019994914186000328, 'samples': 640448, 'steps': 1250, 'loss/train': 3.0108275413513184} -09/20/2021 18:49:19 - INFO - __main__ - Step 20015: {'lr': 0.00019994914186000328, 'samples': 640480, 'steps': 1250, 'loss/train': 3.8263156414031982} -09/20/2021 18:49:20 - INFO - __main__ - Step 20016: {'lr': 0.00019994914186000328, 'samples': 640512, 'steps': 1250, 'loss/train': 3.580648899078369} -09/20/2021 18:49:20 - INFO - __main__ - Step 20017: {'lr': 0.0001999489382413425, 'samples': 640544, 'steps': 1251, 'loss/train': 3.4128518104553223} -09/20/2021 18:49:21 - INFO - __main__ - Step 20018: {'lr': 0.0001999489382413425, 'samples': 640576, 'steps': 1251, 'loss/train': 3.262648344039917} -09/20/2021 18:49:22 - INFO - __main__ - Step 20019: {'lr': 0.0001999489382413425, 'samples': 640608, 'steps': 1251, 'loss/train': 4.004827499389648} -09/20/2021 18:49:23 - INFO - __main__ - Step 20020: {'lr': 0.0001999489382413425, 'samples': 640640, 'steps': 1251, 'loss/train': 3.2990829944610596} -09/20/2021 18:49:23 - INFO - __main__ - Step 20021: {'lr': 0.0001999489382413425, 'samples': 640672, 'steps': 1251, 'loss/train': 3.2645838260650635} -09/20/2021 18:49:24 - INFO - __main__ - Step 20022: {'lr': 0.0001999489382413425, 'samples': 640704, 'steps': 1251, 'loss/train': 2.672611713409424} -09/20/2021 18:49:25 - INFO - __main__ - Step 20023: {'lr': 0.0001999489382413425, 'samples': 640736, 'steps': 1251, 'loss/train': 3.171907424926758} -09/20/2021 18:49:26 - INFO - __main__ - Step 20024: {'lr': 0.0001999489382413425, 'samples': 640768, 'steps': 1251, 'loss/train': 3.425504207611084} -09/20/2021 18:49:26 - INFO - __main__ - Step 20025: {'lr': 0.0001999489382413425, 'samples': 640800, 'steps': 1251, 'loss/train': 3.1468491554260254} -09/20/2021 18:49:27 - INFO - __main__ - Step 20026: {'lr': 0.0001999489382413425, 'samples': 640832, 'steps': 1251, 'loss/train': 3.273155927658081} -09/20/2021 18:49:28 - INFO - __main__ - Step 20027: {'lr': 0.0001999489382413425, 'samples': 640864, 'steps': 1251, 'loss/train': 3.5450022220611572} -09/20/2021 18:49:30 - INFO - __main__ - Step 20028: {'lr': 0.0001999489382413425, 'samples': 640896, 'steps': 1251, 'loss/train': 2.6536011695861816} -09/20/2021 18:49:31 - INFO - __main__ - Step 20029: {'lr': 0.0001999489382413425, 'samples': 640928, 'steps': 1251, 'loss/train': 2.6485846042633057} -09/20/2021 18:49:31 - INFO - __main__ - Step 20030: {'lr': 0.0001999489382413425, 'samples': 640960, 'steps': 1251, 'loss/train': 3.049558639526367} -09/20/2021 18:49:32 - INFO - __main__ - Step 20031: {'lr': 0.0001999489382413425, 'samples': 640992, 'steps': 1251, 'loss/train': 3.8381683826446533} -09/20/2021 18:49:33 - INFO - __main__ - Step 20032: {'lr': 0.0001999489382413425, 'samples': 641024, 'steps': 1251, 'loss/train': 3.3199048042297363} -09/20/2021 18:49:34 - INFO - __main__ - Step 20033: {'lr': 0.0001999487342159899, 'samples': 641056, 'steps': 1252, 'loss/train': 4.732179641723633} -09/20/2021 18:49:34 - INFO - __main__ - Step 20034: {'lr': 0.0001999487342159899, 'samples': 641088, 'steps': 1252, 'loss/train': 3.2933218479156494} -09/20/2021 18:49:35 - INFO - __main__ - Step 20035: {'lr': 0.0001999487342159899, 'samples': 641120, 'steps': 1252, 'loss/train': 2.9793429374694824} -09/20/2021 18:49:36 - INFO - __main__ - Step 20036: {'lr': 0.0001999487342159899, 'samples': 641152, 'steps': 1252, 'loss/train': 2.594827175140381} -09/20/2021 18:49:37 - INFO - __main__ - Step 20037: {'lr': 0.0001999487342159899, 'samples': 641184, 'steps': 1252, 'loss/train': 3.9160962104797363} -09/20/2021 18:49:37 - INFO - __main__ - Step 20038: {'lr': 0.0001999487342159899, 'samples': 641216, 'steps': 1252, 'loss/train': 3.0307161808013916} -09/20/2021 18:49:38 - INFO - __main__ - Step 20039: {'lr': 0.0001999487342159899, 'samples': 641248, 'steps': 1252, 'loss/train': 3.9585940837860107} -09/20/2021 18:49:39 - INFO - __main__ - Step 20040: {'lr': 0.0001999487342159899, 'samples': 641280, 'steps': 1252, 'loss/train': 3.284968376159668} -09/20/2021 18:49:40 - INFO - __main__ - Step 20041: {'lr': 0.0001999487342159899, 'samples': 641312, 'steps': 1252, 'loss/train': 2.7453739643096924} -09/20/2021 18:49:40 - INFO - __main__ - Step 20042: {'lr': 0.0001999487342159899, 'samples': 641344, 'steps': 1252, 'loss/train': 3.101668119430542} -09/20/2021 18:49:41 - INFO - __main__ - Step 20043: {'lr': 0.0001999487342159899, 'samples': 641376, 'steps': 1252, 'loss/train': 2.556060791015625} -09/20/2021 18:49:42 - INFO - __main__ - Step 20044: {'lr': 0.0001999487342159899, 'samples': 641408, 'steps': 1252, 'loss/train': 5.04020881652832} -09/20/2021 18:49:43 - INFO - __main__ - Step 20045: {'lr': 0.0001999487342159899, 'samples': 641440, 'steps': 1252, 'loss/train': 3.5980470180511475} -09/20/2021 18:49:43 - INFO - __main__ - Step 20046: {'lr': 0.0001999487342159899, 'samples': 641472, 'steps': 1252, 'loss/train': 3.201488494873047} -09/20/2021 18:49:44 - INFO - __main__ - Step 20047: {'lr': 0.0001999487342159899, 'samples': 641504, 'steps': 1252, 'loss/train': 3.0090322494506836} -09/20/2021 18:49:45 - INFO - __main__ - Step 20048: {'lr': 0.0001999487342159899, 'samples': 641536, 'steps': 1252, 'loss/train': 4.604773998260498} -09/20/2021 18:49:46 - INFO - __main__ - Step 20049: {'lr': 0.0001999485297839463, 'samples': 641568, 'steps': 1253, 'loss/train': 2.869213104248047} -09/20/2021 18:49:47 - INFO - __main__ - Step 20050: {'lr': 0.0001999485297839463, 'samples': 641600, 'steps': 1253, 'loss/train': 4.172992706298828} -09/20/2021 18:49:47 - INFO - __main__ - Step 20051: {'lr': 0.0001999485297839463, 'samples': 641632, 'steps': 1253, 'loss/train': 4.56029748916626} -09/20/2021 18:49:48 - INFO - __main__ - Step 20052: {'lr': 0.0001999485297839463, 'samples': 641664, 'steps': 1253, 'loss/train': 3.222170829772949} -09/20/2021 18:49:49 - INFO - __main__ - Step 20053: {'lr': 0.0001999485297839463, 'samples': 641696, 'steps': 1253, 'loss/train': 3.710451364517212} -09/20/2021 18:49:50 - INFO - __main__ - Step 20054: {'lr': 0.0001999485297839463, 'samples': 641728, 'steps': 1253, 'loss/train': 4.376646995544434} -09/20/2021 18:49:50 - INFO - __main__ - Step 20055: {'lr': 0.0001999485297839463, 'samples': 641760, 'steps': 1253, 'loss/train': 4.4904327392578125} -09/20/2021 18:49:51 - INFO - __main__ - Step 20056: {'lr': 0.0001999485297839463, 'samples': 641792, 'steps': 1253, 'loss/train': 2.371089458465576} -09/20/2021 18:49:52 - INFO - __main__ - Step 20057: {'lr': 0.0001999485297839463, 'samples': 641824, 'steps': 1253, 'loss/train': 3.3634274005889893} -09/20/2021 18:49:53 - INFO - __main__ - Step 20058: {'lr': 0.0001999485297839463, 'samples': 641856, 'steps': 1253, 'loss/train': 2.4711673259735107} -09/20/2021 18:49:54 - INFO - __main__ - Step 20059: {'lr': 0.0001999485297839463, 'samples': 641888, 'steps': 1253, 'loss/train': 3.044699192047119} -09/20/2021 18:49:55 - INFO - __main__ - Step 20060: {'lr': 0.0001999485297839463, 'samples': 641920, 'steps': 1253, 'loss/train': 3.693547487258911} -09/20/2021 18:49:55 - INFO - __main__ - Step 20061: {'lr': 0.0001999485297839463, 'samples': 641952, 'steps': 1253, 'loss/train': 4.312484264373779} -09/20/2021 18:49:56 - INFO - __main__ - Step 20062: {'lr': 0.0001999485297839463, 'samples': 641984, 'steps': 1253, 'loss/train': 2.696897506713867} -09/20/2021 18:49:57 - INFO - __main__ - Step 20063: {'lr': 0.0001999485297839463, 'samples': 642016, 'steps': 1253, 'loss/train': 3.5521538257598877} -09/20/2021 18:49:58 - INFO - __main__ - Step 20064: {'lr': 0.0001999485297839463, 'samples': 642048, 'steps': 1253, 'loss/train': 3.052347421646118} -09/20/2021 18:49:59 - INFO - __main__ - Step 20065: {'lr': 0.0001999483249452125, 'samples': 642080, 'steps': 1254, 'loss/train': 3.1667683124542236} -09/20/2021 18:49:59 - INFO - __main__ - Step 20066: {'lr': 0.0001999483249452125, 'samples': 642112, 'steps': 1254, 'loss/train': 2.9212095737457275} -09/20/2021 18:50:00 - INFO - __main__ - Step 20067: {'lr': 0.0001999483249452125, 'samples': 642144, 'steps': 1254, 'loss/train': 3.9306204319000244} -09/20/2021 18:50:01 - INFO - __main__ - Step 20068: {'lr': 0.0001999483249452125, 'samples': 642176, 'steps': 1254, 'loss/train': 3.575608491897583} -09/20/2021 18:50:02 - INFO - __main__ - Step 20069: {'lr': 0.0001999483249452125, 'samples': 642208, 'steps': 1254, 'loss/train': 4.100803852081299} -09/20/2021 18:50:02 - INFO - __main__ - Step 20070: {'lr': 0.0001999483249452125, 'samples': 642240, 'steps': 1254, 'loss/train': 4.265020847320557} -09/20/2021 18:50:03 - INFO - __main__ - Step 20071: {'lr': 0.0001999483249452125, 'samples': 642272, 'steps': 1254, 'loss/train': 5.047383785247803} -09/20/2021 18:50:04 - INFO - __main__ - Step 20072: {'lr': 0.0001999483249452125, 'samples': 642304, 'steps': 1254, 'loss/train': 3.98667049407959} -09/20/2021 18:50:05 - INFO - __main__ - Step 20073: {'lr': 0.0001999483249452125, 'samples': 642336, 'steps': 1254, 'loss/train': 4.368325233459473} -09/20/2021 18:50:05 - INFO - __main__ - Step 20074: {'lr': 0.0001999483249452125, 'samples': 642368, 'steps': 1254, 'loss/train': 3.8027734756469727} -09/20/2021 18:50:06 - INFO - __main__ - Step 20075: {'lr': 0.0001999483249452125, 'samples': 642400, 'steps': 1254, 'loss/train': 1.0595219135284424} -09/20/2021 18:50:07 - INFO - __main__ - Step 20076: {'lr': 0.0001999483249452125, 'samples': 642432, 'steps': 1254, 'loss/train': 3.381906509399414} -09/20/2021 18:50:08 - INFO - __main__ - Step 20077: {'lr': 0.0001999483249452125, 'samples': 642464, 'steps': 1254, 'loss/train': 3.09847092628479} -09/20/2021 18:50:08 - INFO - __main__ - Step 20078: {'lr': 0.0001999483249452125, 'samples': 642496, 'steps': 1254, 'loss/train': 3.633878707885742} -09/20/2021 18:50:09 - INFO - __main__ - Step 20079: {'lr': 0.0001999483249452125, 'samples': 642528, 'steps': 1254, 'loss/train': 3.6998507976531982} -09/20/2021 18:50:10 - INFO - __main__ - Step 20080: {'lr': 0.0001999483249452125, 'samples': 642560, 'steps': 1254, 'loss/train': 2.943190574645996} -09/20/2021 18:50:11 - INFO - __main__ - Step 20081: {'lr': 0.00019994811969978934, 'samples': 642592, 'steps': 1255, 'loss/train': 3.3210248947143555} -09/20/2021 18:50:12 - INFO - __main__ - Step 20082: {'lr': 0.00019994811969978934, 'samples': 642624, 'steps': 1255, 'loss/train': 4.228944778442383} -09/20/2021 18:50:12 - INFO - __main__ - Step 20083: {'lr': 0.00019994811969978934, 'samples': 642656, 'steps': 1255, 'loss/train': 3.4565513134002686} -09/20/2021 18:50:13 - INFO - __main__ - Step 20084: {'lr': 0.00019994811969978934, 'samples': 642688, 'steps': 1255, 'loss/train': 3.3282322883605957} -09/20/2021 18:50:14 - INFO - __main__ - Step 20085: {'lr': 0.00019994811969978934, 'samples': 642720, 'steps': 1255, 'loss/train': 2.7754006385803223} -09/20/2021 18:50:15 - INFO - __main__ - Step 20086: {'lr': 0.00019994811969978934, 'samples': 642752, 'steps': 1255, 'loss/train': 3.9093923568725586} -09/20/2021 18:50:15 - INFO - __main__ - Step 20087: {'lr': 0.00019994811969978934, 'samples': 642784, 'steps': 1255, 'loss/train': 3.236377477645874} -09/20/2021 18:50:16 - INFO - __main__ - Step 20088: {'lr': 0.00019994811969978934, 'samples': 642816, 'steps': 1255, 'loss/train': 2.373016834259033} -09/20/2021 18:50:17 - INFO - __main__ - Step 20089: {'lr': 0.00019994811969978934, 'samples': 642848, 'steps': 1255, 'loss/train': 3.9744584560394287} -09/20/2021 18:50:18 - INFO - __main__ - Step 20090: {'lr': 0.00019994811969978934, 'samples': 642880, 'steps': 1255, 'loss/train': 2.8684873580932617} -09/20/2021 18:50:19 - INFO - __main__ - Step 20091: {'lr': 0.00019994811969978934, 'samples': 642912, 'steps': 1255, 'loss/train': 2.775238513946533} -09/20/2021 18:50:20 - INFO - __main__ - Step 20092: {'lr': 0.00019994811969978934, 'samples': 642944, 'steps': 1255, 'loss/train': 3.3484058380126953} -09/20/2021 18:50:20 - INFO - __main__ - Step 20093: {'lr': 0.00019994811969978934, 'samples': 642976, 'steps': 1255, 'loss/train': 3.7269766330718994} -09/20/2021 18:50:21 - INFO - __main__ - Step 20094: {'lr': 0.00019994811969978934, 'samples': 643008, 'steps': 1255, 'loss/train': 3.278705358505249} -09/20/2021 18:50:22 - INFO - __main__ - Step 20095: {'lr': 0.00019994811969978934, 'samples': 643040, 'steps': 1255, 'loss/train': 3.0430681705474854} -09/20/2021 18:50:23 - INFO - __main__ - Step 20096: {'lr': 0.00019994811969978934, 'samples': 643072, 'steps': 1255, 'loss/train': 2.166013479232788} -09/20/2021 18:50:23 - INFO - __main__ - Step 20097: {'lr': 0.0001999479140476777, 'samples': 643104, 'steps': 1256, 'loss/train': 3.8747732639312744} -09/20/2021 18:50:24 - INFO - __main__ - Step 20098: {'lr': 0.0001999479140476777, 'samples': 643136, 'steps': 1256, 'loss/train': 4.270869255065918} -09/20/2021 18:50:25 - INFO - __main__ - Step 20099: {'lr': 0.0001999479140476777, 'samples': 643168, 'steps': 1256, 'loss/train': 3.003828763961792} -09/20/2021 18:50:26 - INFO - __main__ - Step 20100: {'lr': 0.0001999479140476777, 'samples': 643200, 'steps': 1256, 'loss/train': 3.2799031734466553} -09/20/2021 18:50:26 - INFO - __main__ - Step 20101: {'lr': 0.0001999479140476777, 'samples': 643232, 'steps': 1256, 'loss/train': 2.3893015384674072} -09/20/2021 18:50:27 - INFO - __main__ - Step 20102: {'lr': 0.0001999479140476777, 'samples': 643264, 'steps': 1256, 'loss/train': 3.9812302589416504} -09/20/2021 18:50:28 - INFO - __main__ - Step 20103: {'lr': 0.0001999479140476777, 'samples': 643296, 'steps': 1256, 'loss/train': 3.7456068992614746} -09/20/2021 18:50:29 - INFO - __main__ - Step 20104: {'lr': 0.0001999479140476777, 'samples': 643328, 'steps': 1256, 'loss/train': 2.9340569972991943} -09/20/2021 18:50:29 - INFO - __main__ - Step 20105: {'lr': 0.0001999479140476777, 'samples': 643360, 'steps': 1256, 'loss/train': 2.9409661293029785} -09/20/2021 18:50:30 - INFO - __main__ - Step 20106: {'lr': 0.0001999479140476777, 'samples': 643392, 'steps': 1256, 'loss/train': 4.026904106140137} -09/20/2021 18:50:31 - INFO - __main__ - Step 20107: {'lr': 0.0001999479140476777, 'samples': 643424, 'steps': 1256, 'loss/train': 3.7752504348754883} -09/20/2021 18:50:32 - INFO - __main__ - Step 20108: {'lr': 0.0001999479140476777, 'samples': 643456, 'steps': 1256, 'loss/train': 3.5870578289031982} -09/20/2021 18:50:32 - INFO - __main__ - Step 20109: {'lr': 0.0001999479140476777, 'samples': 643488, 'steps': 1256, 'loss/train': 3.1251120567321777} -09/20/2021 18:50:33 - INFO - __main__ - Step 20110: {'lr': 0.0001999479140476777, 'samples': 643520, 'steps': 1256, 'loss/train': 4.158053874969482} -09/20/2021 18:50:34 - INFO - __main__ - Step 20111: {'lr': 0.0001999479140476777, 'samples': 643552, 'steps': 1256, 'loss/train': 3.760091543197632} -09/20/2021 18:50:35 - INFO - __main__ - Step 20112: {'lr': 0.0001999479140476777, 'samples': 643584, 'steps': 1256, 'loss/train': 4.076850891113281} -09/20/2021 18:50:36 - INFO - __main__ - Step 20113: {'lr': 0.0001999477079888784, 'samples': 643616, 'steps': 1257, 'loss/train': 4.063701629638672} -09/20/2021 18:50:36 - INFO - __main__ - Step 20114: {'lr': 0.0001999477079888784, 'samples': 643648, 'steps': 1257, 'loss/train': 3.3065383434295654} -09/20/2021 18:50:37 - INFO - __main__ - Step 20115: {'lr': 0.0001999477079888784, 'samples': 643680, 'steps': 1257, 'loss/train': 3.1881558895111084} -09/20/2021 18:50:38 - INFO - __main__ - Step 20116: {'lr': 0.0001999477079888784, 'samples': 643712, 'steps': 1257, 'loss/train': 3.382279634475708} -09/20/2021 18:50:39 - INFO - __main__ - Step 20117: {'lr': 0.0001999477079888784, 'samples': 643744, 'steps': 1257, 'loss/train': 3.2898027896881104} -09/20/2021 18:50:39 - INFO - __main__ - Step 20118: {'lr': 0.0001999477079888784, 'samples': 643776, 'steps': 1257, 'loss/train': 4.23769998550415} -09/20/2021 18:50:40 - INFO - __main__ - Step 20119: {'lr': 0.0001999477079888784, 'samples': 643808, 'steps': 1257, 'loss/train': 3.7088797092437744} -09/20/2021 18:50:41 - INFO - __main__ - Step 20120: {'lr': 0.0001999477079888784, 'samples': 643840, 'steps': 1257, 'loss/train': 3.428150177001953} -09/20/2021 18:50:42 - INFO - __main__ - Step 20121: {'lr': 0.0001999477079888784, 'samples': 643872, 'steps': 1257, 'loss/train': 3.591965675354004} -09/20/2021 18:50:43 - INFO - __main__ - Step 20122: {'lr': 0.0001999477079888784, 'samples': 643904, 'steps': 1257, 'loss/train': 3.347541570663452} -09/20/2021 18:50:44 - INFO - __main__ - Step 20123: {'lr': 0.0001999477079888784, 'samples': 643936, 'steps': 1257, 'loss/train': 3.1875176429748535} -09/20/2021 18:50:45 - INFO - __main__ - Step 20124: {'lr': 0.0001999477079888784, 'samples': 643968, 'steps': 1257, 'loss/train': 3.275601387023926} -09/20/2021 18:50:46 - INFO - __main__ - Step 20125: {'lr': 0.0001999477079888784, 'samples': 644000, 'steps': 1257, 'loss/train': 3.267542839050293} -09/20/2021 18:50:46 - INFO - __main__ - Step 20126: {'lr': 0.0001999477079888784, 'samples': 644032, 'steps': 1257, 'loss/train': 3.461749792098999} -09/20/2021 18:50:47 - INFO - __main__ - Step 20127: {'lr': 0.0001999477079888784, 'samples': 644064, 'steps': 1257, 'loss/train': 3.1830198764801025} -09/20/2021 18:50:48 - INFO - __main__ - Step 20128: {'lr': 0.0001999477079888784, 'samples': 644096, 'steps': 1257, 'loss/train': 3.9421801567077637} -09/20/2021 18:50:49 - INFO - __main__ - Step 20129: {'lr': 0.00019994750152339222, 'samples': 644128, 'steps': 1258, 'loss/train': 4.1539812088012695} -09/20/2021 18:50:49 - INFO - __main__ - Step 20130: {'lr': 0.00019994750152339222, 'samples': 644160, 'steps': 1258, 'loss/train': 3.339444398880005} -09/20/2021 18:50:50 - INFO - __main__ - Step 20131: {'lr': 0.00019994750152339222, 'samples': 644192, 'steps': 1258, 'loss/train': 3.5061089992523193} -09/20/2021 18:50:51 - INFO - __main__ - Step 20132: {'lr': 0.00019994750152339222, 'samples': 644224, 'steps': 1258, 'loss/train': 3.1715011596679688} -09/20/2021 18:50:52 - INFO - __main__ - Step 20133: {'lr': 0.00019994750152339222, 'samples': 644256, 'steps': 1258, 'loss/train': 0.8995027542114258} -09/20/2021 18:50:52 - INFO - __main__ - Step 20134: {'lr': 0.00019994750152339222, 'samples': 644288, 'steps': 1258, 'loss/train': 5.042392253875732} -09/20/2021 18:50:53 - INFO - __main__ - Step 20135: {'lr': 0.00019994750152339222, 'samples': 644320, 'steps': 1258, 'loss/train': 4.151401996612549} -09/20/2021 18:50:54 - INFO - __main__ - Step 20136: {'lr': 0.00019994750152339222, 'samples': 644352, 'steps': 1258, 'loss/train': 3.318127393722534} -09/20/2021 18:50:55 - INFO - __main__ - Step 20137: {'lr': 0.00019994750152339222, 'samples': 644384, 'steps': 1258, 'loss/train': 2.6064140796661377} -09/20/2021 18:50:55 - INFO - __main__ - Step 20138: {'lr': 0.00019994750152339222, 'samples': 644416, 'steps': 1258, 'loss/train': 0.7816022634506226} -09/20/2021 18:50:56 - INFO - __main__ - Step 20139: {'lr': 0.00019994750152339222, 'samples': 644448, 'steps': 1258, 'loss/train': 3.943673849105835} -09/20/2021 18:50:57 - INFO - __main__ - Step 20140: {'lr': 0.00019994750152339222, 'samples': 644480, 'steps': 1258, 'loss/train': 3.3444371223449707} -09/20/2021 18:50:58 - INFO - __main__ - Step 20141: {'lr': 0.00019994750152339222, 'samples': 644512, 'steps': 1258, 'loss/train': 2.131378412246704} -09/20/2021 18:50:58 - INFO - __main__ - Step 20142: {'lr': 0.00019994750152339222, 'samples': 644544, 'steps': 1258, 'loss/train': 2.594444513320923} -09/20/2021 18:50:59 - INFO - __main__ - Step 20143: {'lr': 0.00019994750152339222, 'samples': 644576, 'steps': 1258, 'loss/train': 2.4578874111175537} -09/20/2021 18:51:00 - INFO - __main__ - Step 20144: {'lr': 0.00019994750152339222, 'samples': 644608, 'steps': 1258, 'loss/train': 2.0750110149383545} -09/20/2021 18:51:01 - INFO - __main__ - Step 20145: {'lr': 0.00019994729465122005, 'samples': 644640, 'steps': 1259, 'loss/train': 2.5826306343078613} -09/20/2021 18:51:02 - INFO - __main__ - Step 20146: {'lr': 0.00019994729465122005, 'samples': 644672, 'steps': 1259, 'loss/train': 2.6492857933044434} -09/20/2021 18:51:02 - INFO - __main__ - Step 20147: {'lr': 0.00019994729465122005, 'samples': 644704, 'steps': 1259, 'loss/train': 2.2275187969207764} -09/20/2021 18:51:03 - INFO - __main__ - Step 20148: {'lr': 0.00019994729465122005, 'samples': 644736, 'steps': 1259, 'loss/train': 2.439603090286255} -09/20/2021 18:51:04 - INFO - __main__ - Step 20149: {'lr': 0.00019994729465122005, 'samples': 644768, 'steps': 1259, 'loss/train': 2.368546724319458} -09/20/2021 18:51:05 - INFO - __main__ - Step 20150: {'lr': 0.00019994729465122005, 'samples': 644800, 'steps': 1259, 'loss/train': 4.3916802406311035} -09/20/2021 18:51:05 - INFO - __main__ - Step 20151: {'lr': 0.00019994729465122005, 'samples': 644832, 'steps': 1259, 'loss/train': 3.457024335861206} -09/20/2021 18:51:06 - INFO - __main__ - Step 20152: {'lr': 0.00019994729465122005, 'samples': 644864, 'steps': 1259, 'loss/train': 3.461188554763794} -09/20/2021 18:51:07 - INFO - __main__ - Step 20153: {'lr': 0.00019994729465122005, 'samples': 644896, 'steps': 1259, 'loss/train': 3.0111913681030273} -09/20/2021 18:51:08 - INFO - __main__ - Step 20154: {'lr': 0.00019994729465122005, 'samples': 644928, 'steps': 1259, 'loss/train': 2.674837112426758} -09/20/2021 18:51:08 - INFO - __main__ - Step 20155: {'lr': 0.00019994729465122005, 'samples': 644960, 'steps': 1259, 'loss/train': 4.013160705566406} -09/20/2021 18:51:09 - INFO - __main__ - Step 20156: {'lr': 0.00019994729465122005, 'samples': 644992, 'steps': 1259, 'loss/train': 3.0906894207000732} -09/20/2021 18:51:10 - INFO - __main__ - Step 20157: {'lr': 0.00019994729465122005, 'samples': 645024, 'steps': 1259, 'loss/train': 3.776590585708618} -09/20/2021 18:51:11 - INFO - __main__ - Step 20158: {'lr': 0.00019994729465122005, 'samples': 645056, 'steps': 1259, 'loss/train': 3.450911283493042} -09/20/2021 18:51:12 - INFO - __main__ - Step 20159: {'lr': 0.00019994729465122005, 'samples': 645088, 'steps': 1259, 'loss/train': 4.0281596183776855} -09/20/2021 18:51:13 - INFO - __main__ - Step 20160: {'lr': 0.00019994729465122005, 'samples': 645120, 'steps': 1259, 'loss/train': 3.0801355838775635} -09/20/2021 18:51:14 - INFO - __main__ - Step 20161: {'lr': 0.00019994708737236275, 'samples': 645152, 'steps': 1260, 'loss/train': 3.4879255294799805} -09/20/2021 18:51:15 - INFO - __main__ - Step 20162: {'lr': 0.00019994708737236275, 'samples': 645184, 'steps': 1260, 'loss/train': 3.3246519565582275} -09/20/2021 18:51:15 - INFO - __main__ - Step 20163: {'lr': 0.00019994708737236275, 'samples': 645216, 'steps': 1260, 'loss/train': 4.6636576652526855} -09/20/2021 18:51:16 - INFO - __main__ - Step 20164: {'lr': 0.00019994708737236275, 'samples': 645248, 'steps': 1260, 'loss/train': 3.175323486328125} -09/20/2021 18:51:17 - INFO - __main__ - Step 20165: {'lr': 0.00019994708737236275, 'samples': 645280, 'steps': 1260, 'loss/train': 3.931610584259033} -09/20/2021 18:51:18 - INFO - __main__ - Step 20166: {'lr': 0.00019994708737236275, 'samples': 645312, 'steps': 1260, 'loss/train': 2.7209432125091553} -09/20/2021 18:51:18 - INFO - __main__ - Step 20167: {'lr': 0.00019994708737236275, 'samples': 645344, 'steps': 1260, 'loss/train': 3.982379198074341} -09/20/2021 18:51:19 - INFO - __main__ - Step 20168: {'lr': 0.00019994708737236275, 'samples': 645376, 'steps': 1260, 'loss/train': 3.8357560634613037} -09/20/2021 18:51:20 - INFO - __main__ - Step 20169: {'lr': 0.00019994708737236275, 'samples': 645408, 'steps': 1260, 'loss/train': 3.4618778228759766} -09/20/2021 18:51:21 - INFO - __main__ - Step 20170: {'lr': 0.00019994708737236275, 'samples': 645440, 'steps': 1260, 'loss/train': 3.4181973934173584} -09/20/2021 18:51:21 - INFO - __main__ - Step 20171: {'lr': 0.00019994708737236275, 'samples': 645472, 'steps': 1260, 'loss/train': 3.1561262607574463} -09/20/2021 18:51:22 - INFO - __main__ - Step 20172: {'lr': 0.00019994708737236275, 'samples': 645504, 'steps': 1260, 'loss/train': 3.1648833751678467} -09/20/2021 18:51:23 - INFO - __main__ - Step 20173: {'lr': 0.00019994708737236275, 'samples': 645536, 'steps': 1260, 'loss/train': 2.728832244873047} -09/20/2021 18:51:24 - INFO - __main__ - Step 20174: {'lr': 0.00019994708737236275, 'samples': 645568, 'steps': 1260, 'loss/train': 2.9466969966888428} -09/20/2021 18:51:24 - INFO - __main__ - Step 20175: {'lr': 0.00019994708737236275, 'samples': 645600, 'steps': 1260, 'loss/train': 2.826531171798706} -09/20/2021 18:51:25 - INFO - __main__ - Step 20176: {'lr': 0.00019994708737236275, 'samples': 645632, 'steps': 1260, 'loss/train': 2.969305992126465} -09/20/2021 18:51:26 - INFO - __main__ - Step 20177: {'lr': 0.00019994687968682114, 'samples': 645664, 'steps': 1261, 'loss/train': 3.5676605701446533} -09/20/2021 18:51:27 - INFO - __main__ - Step 20178: {'lr': 0.00019994687968682114, 'samples': 645696, 'steps': 1261, 'loss/train': 3.9047865867614746} -09/20/2021 18:51:28 - INFO - __main__ - Step 20179: {'lr': 0.00019994687968682114, 'samples': 645728, 'steps': 1261, 'loss/train': 3.1111338138580322} -09/20/2021 18:51:28 - INFO - __main__ - Step 20180: {'lr': 0.00019994687968682114, 'samples': 645760, 'steps': 1261, 'loss/train': 2.4716219902038574} -09/20/2021 18:51:29 - INFO - __main__ - Step 20181: {'lr': 0.00019994687968682114, 'samples': 645792, 'steps': 1261, 'loss/train': 3.203110456466675} -09/20/2021 18:51:30 - INFO - __main__ - Step 20182: {'lr': 0.00019994687968682114, 'samples': 645824, 'steps': 1261, 'loss/train': 3.686838150024414} -09/20/2021 18:51:30 - INFO - __main__ - Step 20183: {'lr': 0.00019994687968682114, 'samples': 645856, 'steps': 1261, 'loss/train': 1.0229617357254028} -09/20/2021 18:51:31 - INFO - __main__ - Step 20184: {'lr': 0.00019994687968682114, 'samples': 645888, 'steps': 1261, 'loss/train': 3.6119675636291504} -09/20/2021 18:51:32 - INFO - __main__ - Step 20185: {'lr': 0.00019994687968682114, 'samples': 645920, 'steps': 1261, 'loss/train': 3.325418710708618} -09/20/2021 18:51:33 - INFO - __main__ - Step 20186: {'lr': 0.00019994687968682114, 'samples': 645952, 'steps': 1261, 'loss/train': 3.5525171756744385} -09/20/2021 18:51:33 - INFO - __main__ - Step 20187: {'lr': 0.00019994687968682114, 'samples': 645984, 'steps': 1261, 'loss/train': 2.068857192993164} -09/20/2021 18:51:34 - INFO - __main__ - Step 20188: {'lr': 0.00019994687968682114, 'samples': 646016, 'steps': 1261, 'loss/train': 1.810903549194336} -09/20/2021 18:51:35 - INFO - __main__ - Step 20189: {'lr': 0.00019994687968682114, 'samples': 646048, 'steps': 1261, 'loss/train': 2.3582499027252197} -09/20/2021 18:51:36 - INFO - __main__ - Step 20190: {'lr': 0.00019994687968682114, 'samples': 646080, 'steps': 1261, 'loss/train': 2.30104660987854} -09/20/2021 18:51:36 - INFO - __main__ - Step 20191: {'lr': 0.00019994687968682114, 'samples': 646112, 'steps': 1261, 'loss/train': 2.123084306716919} -09/20/2021 18:51:37 - INFO - __main__ - Step 20192: {'lr': 0.00019994687968682114, 'samples': 646144, 'steps': 1261, 'loss/train': 1.7961304187774658} -09/20/2021 18:51:38 - INFO - __main__ - Step 20193: {'lr': 0.00019994667159459604, 'samples': 646176, 'steps': 1262, 'loss/train': 2.331690788269043} -09/20/2021 18:51:39 - INFO - __main__ - Step 20194: {'lr': 0.00019994667159459604, 'samples': 646208, 'steps': 1262, 'loss/train': 2.5079548358917236} -09/20/2021 18:51:40 - INFO - __main__ - Step 20195: {'lr': 0.00019994667159459604, 'samples': 646240, 'steps': 1262, 'loss/train': 3.4270315170288086} -09/20/2021 18:51:41 - INFO - __main__ - Step 20196: {'lr': 0.00019994667159459604, 'samples': 646272, 'steps': 1262, 'loss/train': 3.258026123046875} -09/20/2021 18:51:42 - INFO - __main__ - Step 20197: {'lr': 0.00019994667159459604, 'samples': 646304, 'steps': 1262, 'loss/train': 3.422715663909912} -09/20/2021 18:51:42 - INFO - __main__ - Step 20198: {'lr': 0.00019994667159459604, 'samples': 646336, 'steps': 1262, 'loss/train': 3.125290632247925} -09/20/2021 18:51:43 - INFO - __main__ - Step 20199: {'lr': 0.00019994667159459604, 'samples': 646368, 'steps': 1262, 'loss/train': 3.269883871078491} -09/20/2021 18:51:44 - INFO - __main__ - Step 20200: {'lr': 0.00019994667159459604, 'samples': 646400, 'steps': 1262, 'loss/train': 3.8024284839630127} -09/20/2021 18:51:45 - INFO - __main__ - Step 20201: {'lr': 0.00019994667159459604, 'samples': 646432, 'steps': 1262, 'loss/train': 3.4997692108154297} -09/20/2021 18:51:45 - INFO - __main__ - Step 20202: {'lr': 0.00019994667159459604, 'samples': 646464, 'steps': 1262, 'loss/train': 4.241943836212158} -09/20/2021 18:51:46 - INFO - __main__ - Step 20203: {'lr': 0.00019994667159459604, 'samples': 646496, 'steps': 1262, 'loss/train': 2.7304866313934326} -09/20/2021 18:51:47 - INFO - __main__ - Step 20204: {'lr': 0.00019994667159459604, 'samples': 646528, 'steps': 1262, 'loss/train': 3.4417386054992676} -09/20/2021 18:51:48 - INFO - __main__ - Step 20205: {'lr': 0.00019994667159459604, 'samples': 646560, 'steps': 1262, 'loss/train': 4.218859672546387} -09/20/2021 18:51:48 - INFO - __main__ - Step 20206: {'lr': 0.00019994667159459604, 'samples': 646592, 'steps': 1262, 'loss/train': 2.9666452407836914} -09/20/2021 18:51:49 - INFO - __main__ - Step 20207: {'lr': 0.00019994667159459604, 'samples': 646624, 'steps': 1262, 'loss/train': 3.3759632110595703} -09/20/2021 18:51:50 - INFO - __main__ - Step 20208: {'lr': 0.00019994667159459604, 'samples': 646656, 'steps': 1262, 'loss/train': 2.391007423400879} -09/20/2021 18:51:51 - INFO - __main__ - Step 20209: {'lr': 0.00019994646309568834, 'samples': 646688, 'steps': 1263, 'loss/train': 3.3061916828155518} -09/20/2021 18:51:52 - INFO - __main__ - Step 20210: {'lr': 0.00019994646309568834, 'samples': 646720, 'steps': 1263, 'loss/train': 3.490007162094116} -09/20/2021 18:51:52 - INFO - __main__ - Step 20211: {'lr': 0.00019994646309568834, 'samples': 646752, 'steps': 1263, 'loss/train': 2.9773130416870117} -09/20/2021 18:51:53 - INFO - __main__ - Step 20212: {'lr': 0.00019994646309568834, 'samples': 646784, 'steps': 1263, 'loss/train': 3.378021478652954} -09/20/2021 18:51:54 - INFO - __main__ - Step 20213: {'lr': 0.00019994646309568834, 'samples': 646816, 'steps': 1263, 'loss/train': 2.8120310306549072} -09/20/2021 18:51:55 - INFO - __main__ - Step 20214: {'lr': 0.00019994646309568834, 'samples': 646848, 'steps': 1263, 'loss/train': 2.5689499378204346} -09/20/2021 18:51:55 - INFO - __main__ - Step 20215: {'lr': 0.00019994646309568834, 'samples': 646880, 'steps': 1263, 'loss/train': 3.786308526992798} -09/20/2021 18:51:56 - INFO - __main__ - Step 20216: {'lr': 0.00019994646309568834, 'samples': 646912, 'steps': 1263, 'loss/train': 4.103507041931152} -09/20/2021 18:51:57 - INFO - __main__ - Step 20217: {'lr': 0.00019994646309568834, 'samples': 646944, 'steps': 1263, 'loss/train': 2.6187868118286133} -09/20/2021 18:51:58 - INFO - __main__ - Step 20218: {'lr': 0.00019994646309568834, 'samples': 646976, 'steps': 1263, 'loss/train': 3.0697944164276123} -09/20/2021 18:51:58 - INFO - __main__ - Step 20219: {'lr': 0.00019994646309568834, 'samples': 647008, 'steps': 1263, 'loss/train': 3.5696499347686768} -09/20/2021 18:51:59 - INFO - __main__ - Step 20220: {'lr': 0.00019994646309568834, 'samples': 647040, 'steps': 1263, 'loss/train': 3.076288938522339} -09/20/2021 18:52:00 - INFO - __main__ - Step 20221: {'lr': 0.00019994646309568834, 'samples': 647072, 'steps': 1263, 'loss/train': 3.723463296890259} -09/20/2021 18:52:01 - INFO - __main__ - Step 20222: {'lr': 0.00019994646309568834, 'samples': 647104, 'steps': 1263, 'loss/train': 2.53759765625} -09/20/2021 18:52:01 - INFO - __main__ - Step 20223: {'lr': 0.00019994646309568834, 'samples': 647136, 'steps': 1263, 'loss/train': 2.079211473464966} -09/20/2021 18:52:02 - INFO - __main__ - Step 20224: {'lr': 0.00019994646309568834, 'samples': 647168, 'steps': 1263, 'loss/train': 3.29132342338562} -09/20/2021 18:52:03 - INFO - __main__ - Step 20225: {'lr': 0.00019994625419009887, 'samples': 647200, 'steps': 1264, 'loss/train': 3.280088186264038} -09/20/2021 18:52:04 - INFO - __main__ - Step 20226: {'lr': 0.00019994625419009887, 'samples': 647232, 'steps': 1264, 'loss/train': 1.9882153272628784} -09/20/2021 18:52:05 - INFO - __main__ - Step 20227: {'lr': 0.00019994625419009887, 'samples': 647264, 'steps': 1264, 'loss/train': 2.9145560264587402} -09/20/2021 18:52:06 - INFO - __main__ - Step 20228: {'lr': 0.00019994625419009887, 'samples': 647296, 'steps': 1264, 'loss/train': 3.9159562587738037} -09/20/2021 18:52:06 - INFO - __main__ - Step 20229: {'lr': 0.00019994625419009887, 'samples': 647328, 'steps': 1264, 'loss/train': 3.2046194076538086} -09/20/2021 18:52:07 - INFO - __main__ - Step 20230: {'lr': 0.00019994625419009887, 'samples': 647360, 'steps': 1264, 'loss/train': 4.861777305603027} -09/20/2021 18:52:08 - INFO - __main__ - Step 20231: {'lr': 0.00019994625419009887, 'samples': 647392, 'steps': 1264, 'loss/train': 3.314450979232788} -09/20/2021 18:52:09 - INFO - __main__ - Step 20232: {'lr': 0.00019994625419009887, 'samples': 647424, 'steps': 1264, 'loss/train': 2.724613666534424} -09/20/2021 18:52:09 - INFO - __main__ - Step 20233: {'lr': 0.00019994625419009887, 'samples': 647456, 'steps': 1264, 'loss/train': 3.665013074874878} -09/20/2021 18:52:10 - INFO - __main__ - Step 20234: {'lr': 0.00019994625419009887, 'samples': 647488, 'steps': 1264, 'loss/train': 3.4586610794067383} -09/20/2021 18:52:11 - INFO - __main__ - Step 20235: {'lr': 0.00019994625419009887, 'samples': 647520, 'steps': 1264, 'loss/train': 2.952375888824463} -09/20/2021 18:52:12 - INFO - __main__ - Step 20236: {'lr': 0.00019994625419009887, 'samples': 647552, 'steps': 1264, 'loss/train': 3.7549922466278076} -09/20/2021 18:52:12 - INFO - __main__ - Step 20237: {'lr': 0.00019994625419009887, 'samples': 647584, 'steps': 1264, 'loss/train': 4.373943328857422} -09/20/2021 18:52:13 - INFO - __main__ - Step 20238: {'lr': 0.00019994625419009887, 'samples': 647616, 'steps': 1264, 'loss/train': 5.477459907531738} -09/20/2021 18:52:14 - INFO - __main__ - Step 20239: {'lr': 0.00019994625419009887, 'samples': 647648, 'steps': 1264, 'loss/train': 3.8179283142089844} -09/20/2021 18:52:15 - INFO - __main__ - Step 20240: {'lr': 0.00019994625419009887, 'samples': 647680, 'steps': 1264, 'loss/train': 3.3172945976257324} -09/20/2021 18:52:16 - INFO - __main__ - Step 20241: {'lr': 0.00019994604487782848, 'samples': 647712, 'steps': 1265, 'loss/train': 3.4751954078674316} -09/20/2021 18:52:16 - INFO - __main__ - Step 20242: {'lr': 0.00019994604487782848, 'samples': 647744, 'steps': 1265, 'loss/train': 4.155224800109863} -09/20/2021 18:52:17 - INFO - __main__ - Step 20243: {'lr': 0.00019994604487782848, 'samples': 647776, 'steps': 1265, 'loss/train': 3.0189785957336426} -09/20/2021 18:52:18 - INFO - __main__ - Step 20244: {'lr': 0.00019994604487782848, 'samples': 647808, 'steps': 1265, 'loss/train': 4.330658912658691} -09/20/2021 18:52:19 - INFO - __main__ - Step 20245: {'lr': 0.00019994604487782848, 'samples': 647840, 'steps': 1265, 'loss/train': 3.0595483779907227} -09/20/2021 18:52:19 - INFO - __main__ - Step 20246: {'lr': 0.00019994604487782848, 'samples': 647872, 'steps': 1265, 'loss/train': 3.4890904426574707} -09/20/2021 18:52:20 - INFO - __main__ - Step 20247: {'lr': 0.00019994604487782848, 'samples': 647904, 'steps': 1265, 'loss/train': 2.978870153427124} -09/20/2021 18:52:21 - INFO - __main__ - Step 20248: {'lr': 0.00019994604487782848, 'samples': 647936, 'steps': 1265, 'loss/train': 2.896545171737671} -09/20/2021 18:52:22 - INFO - __main__ - Step 20249: {'lr': 0.00019994604487782848, 'samples': 647968, 'steps': 1265, 'loss/train': 3.2945406436920166} -09/20/2021 18:52:22 - INFO - __main__ - Step 20250: {'lr': 0.00019994604487782848, 'samples': 648000, 'steps': 1265, 'loss/train': 1.506229043006897} -09/20/2021 18:52:23 - INFO - __main__ - Step 20251: {'lr': 0.00019994604487782848, 'samples': 648032, 'steps': 1265, 'loss/train': 2.73343825340271} -09/20/2021 18:52:24 - INFO - __main__ - Step 20252: {'lr': 0.00019994604487782848, 'samples': 648064, 'steps': 1265, 'loss/train': 3.094147205352783} -09/20/2021 18:52:25 - INFO - __main__ - Step 20253: {'lr': 0.00019994604487782848, 'samples': 648096, 'steps': 1265, 'loss/train': 2.5547916889190674} -09/20/2021 18:52:25 - INFO - __main__ - Step 20254: {'lr': 0.00019994604487782848, 'samples': 648128, 'steps': 1265, 'loss/train': 3.045816659927368} -09/20/2021 18:52:26 - INFO - __main__ - Step 20255: {'lr': 0.00019994604487782848, 'samples': 648160, 'steps': 1265, 'loss/train': 4.001749515533447} -09/20/2021 18:52:27 - INFO - __main__ - Step 20256: {'lr': 0.00019994604487782848, 'samples': 648192, 'steps': 1265, 'loss/train': 3.5203380584716797} -09/20/2021 18:52:28 - INFO - __main__ - Step 20257: {'lr': 0.00019994583515887802, 'samples': 648224, 'steps': 1266, 'loss/train': 3.6450905799865723} -09/20/2021 18:52:29 - INFO - __main__ - Step 20258: {'lr': 0.00019994583515887802, 'samples': 648256, 'steps': 1266, 'loss/train': 4.046712875366211} -09/20/2021 18:52:30 - INFO - __main__ - Step 20259: {'lr': 0.00019994583515887802, 'samples': 648288, 'steps': 1266, 'loss/train': 3.343684196472168} -09/20/2021 18:52:31 - INFO - __main__ - Step 20260: {'lr': 0.00019994583515887802, 'samples': 648320, 'steps': 1266, 'loss/train': 2.584522247314453} -09/20/2021 18:52:31 - INFO - __main__ - Step 20261: {'lr': 0.00019994583515887802, 'samples': 648352, 'steps': 1266, 'loss/train': 3.7027084827423096} -09/20/2021 18:52:32 - INFO - __main__ - Step 20262: {'lr': 0.00019994583515887802, 'samples': 648384, 'steps': 1266, 'loss/train': 3.3034651279449463} -09/20/2021 18:52:33 - INFO - __main__ - Step 20263: {'lr': 0.00019994583515887802, 'samples': 648416, 'steps': 1266, 'loss/train': 2.3154714107513428} -09/20/2021 18:52:34 - INFO - __main__ - Step 20264: {'lr': 0.00019994583515887802, 'samples': 648448, 'steps': 1266, 'loss/train': 3.009556293487549} -09/20/2021 18:52:34 - INFO - __main__ - Step 20265: {'lr': 0.00019994583515887802, 'samples': 648480, 'steps': 1266, 'loss/train': 0.7235610485076904} -09/20/2021 18:52:35 - INFO - __main__ - Step 20266: {'lr': 0.00019994583515887802, 'samples': 648512, 'steps': 1266, 'loss/train': 2.9366848468780518} -09/20/2021 18:52:36 - INFO - __main__ - Step 20267: {'lr': 0.00019994583515887802, 'samples': 648544, 'steps': 1266, 'loss/train': 2.1583025455474854} -09/20/2021 18:52:37 - INFO - __main__ - Step 20268: {'lr': 0.00019994583515887802, 'samples': 648576, 'steps': 1266, 'loss/train': 2.727052688598633} -09/20/2021 18:52:37 - INFO - __main__ - Step 20269: {'lr': 0.00019994583515887802, 'samples': 648608, 'steps': 1266, 'loss/train': 2.577523708343506} -09/20/2021 18:52:38 - INFO - __main__ - Step 20270: {'lr': 0.00019994583515887802, 'samples': 648640, 'steps': 1266, 'loss/train': 4.562572956085205} -09/20/2021 18:52:39 - INFO - __main__ - Step 20271: {'lr': 0.00019994583515887802, 'samples': 648672, 'steps': 1266, 'loss/train': 2.971343517303467} -09/20/2021 18:52:40 - INFO - __main__ - Step 20272: {'lr': 0.00019994583515887802, 'samples': 648704, 'steps': 1266, 'loss/train': 2.8141095638275146} -09/20/2021 18:52:40 - INFO - __main__ - Step 20273: {'lr': 0.00019994562503324831, 'samples': 648736, 'steps': 1267, 'loss/train': 2.9454610347747803} -09/20/2021 18:52:41 - INFO - __main__ - Step 20274: {'lr': 0.00019994562503324831, 'samples': 648768, 'steps': 1267, 'loss/train': 4.252354621887207} -09/20/2021 18:52:42 - INFO - __main__ - Step 20275: {'lr': 0.00019994562503324831, 'samples': 648800, 'steps': 1267, 'loss/train': 2.5209999084472656} -09/20/2021 18:52:43 - INFO - __main__ - Step 20276: {'lr': 0.00019994562503324831, 'samples': 648832, 'steps': 1267, 'loss/train': 3.5462937355041504} -09/20/2021 18:52:43 - INFO - __main__ - Step 20277: {'lr': 0.00019994562503324831, 'samples': 648864, 'steps': 1267, 'loss/train': 3.599074363708496} -09/20/2021 18:52:44 - INFO - __main__ - Step 20278: {'lr': 0.00019994562503324831, 'samples': 648896, 'steps': 1267, 'loss/train': 2.63545560836792} -09/20/2021 18:52:45 - INFO - __main__ - Step 20279: {'lr': 0.00019994562503324831, 'samples': 648928, 'steps': 1267, 'loss/train': 3.7909345626831055} -09/20/2021 18:52:46 - INFO - __main__ - Step 20280: {'lr': 0.00019994562503324831, 'samples': 648960, 'steps': 1267, 'loss/train': 3.0334713459014893} -09/20/2021 18:52:46 - INFO - __main__ - Step 20281: {'lr': 0.00019994562503324831, 'samples': 648992, 'steps': 1267, 'loss/train': 3.3051464557647705} -09/20/2021 18:52:47 - INFO - __main__ - Step 20282: {'lr': 0.00019994562503324831, 'samples': 649024, 'steps': 1267, 'loss/train': 3.6699278354644775} -09/20/2021 18:52:48 - INFO - __main__ - Step 20283: {'lr': 0.00019994562503324831, 'samples': 649056, 'steps': 1267, 'loss/train': 2.0910327434539795} -09/20/2021 18:52:49 - INFO - __main__ - Step 20284: {'lr': 0.00019994562503324831, 'samples': 649088, 'steps': 1267, 'loss/train': 4.083329677581787} -09/20/2021 18:52:49 - INFO - __main__ - Step 20285: {'lr': 0.00019994562503324831, 'samples': 649120, 'steps': 1267, 'loss/train': 4.156075954437256} -09/20/2021 18:52:51 - INFO - __main__ - Step 20286: {'lr': 0.00019994562503324831, 'samples': 649152, 'steps': 1267, 'loss/train': 3.608168125152588} -09/20/2021 18:52:51 - INFO - __main__ - Step 20287: {'lr': 0.00019994562503324831, 'samples': 649184, 'steps': 1267, 'loss/train': 2.7720072269439697} -09/20/2021 18:52:52 - INFO - __main__ - Step 20288: {'lr': 0.00019994562503324831, 'samples': 649216, 'steps': 1267, 'loss/train': 3.456519603729248} -09/20/2021 18:52:53 - INFO - __main__ - Step 20289: {'lr': 0.00019994541450094028, 'samples': 649248, 'steps': 1268, 'loss/train': 3.4103498458862305} -09/20/2021 18:52:54 - INFO - __main__ - Step 20290: {'lr': 0.00019994541450094028, 'samples': 649280, 'steps': 1268, 'loss/train': 3.170264482498169} -09/20/2021 18:52:55 - INFO - __main__ - Step 20291: {'lr': 0.00019994541450094028, 'samples': 649312, 'steps': 1268, 'loss/train': 2.831188917160034} -09/20/2021 18:52:55 - INFO - __main__ - Step 20292: {'lr': 0.00019994541450094028, 'samples': 649344, 'steps': 1268, 'loss/train': 3.012230634689331} -09/20/2021 18:52:56 - INFO - __main__ - Step 20293: {'lr': 0.00019994541450094028, 'samples': 649376, 'steps': 1268, 'loss/train': 4.131987571716309} -09/20/2021 18:52:57 - INFO - __main__ - Step 20294: {'lr': 0.00019994541450094028, 'samples': 649408, 'steps': 1268, 'loss/train': 3.907261848449707} -09/20/2021 18:52:58 - INFO - __main__ - Step 20295: {'lr': 0.00019994541450094028, 'samples': 649440, 'steps': 1268, 'loss/train': 3.59690523147583} -09/20/2021 18:52:58 - INFO - __main__ - Step 20296: {'lr': 0.00019994541450094028, 'samples': 649472, 'steps': 1268, 'loss/train': 3.2542920112609863} -09/20/2021 18:52:59 - INFO - __main__ - Step 20297: {'lr': 0.00019994541450094028, 'samples': 649504, 'steps': 1268, 'loss/train': 3.4041152000427246} -09/20/2021 18:53:00 - INFO - __main__ - Step 20298: {'lr': 0.00019994541450094028, 'samples': 649536, 'steps': 1268, 'loss/train': 3.672353744506836} -09/20/2021 18:53:01 - INFO - __main__ - Step 20299: {'lr': 0.00019994541450094028, 'samples': 649568, 'steps': 1268, 'loss/train': 3.437471866607666} -09/20/2021 18:53:01 - INFO - __main__ - Step 20300: {'lr': 0.00019994541450094028, 'samples': 649600, 'steps': 1268, 'loss/train': 2.7450132369995117} -09/20/2021 18:53:02 - INFO - __main__ - Step 20301: {'lr': 0.00019994541450094028, 'samples': 649632, 'steps': 1268, 'loss/train': 2.7907001972198486} -09/20/2021 18:53:03 - INFO - __main__ - Step 20302: {'lr': 0.00019994541450094028, 'samples': 649664, 'steps': 1268, 'loss/train': 0.8594515919685364} -09/20/2021 18:53:04 - INFO - __main__ - Step 20303: {'lr': 0.00019994541450094028, 'samples': 649696, 'steps': 1268, 'loss/train': 3.7436270713806152} -09/20/2021 18:53:04 - INFO - __main__ - Step 20304: {'lr': 0.00019994541450094028, 'samples': 649728, 'steps': 1268, 'loss/train': 3.6838860511779785} -09/20/2021 18:53:05 - INFO - __main__ - Step 20305: {'lr': 0.00019994520356195474, 'samples': 649760, 'steps': 1269, 'loss/train': 2.6817331314086914} -09/20/2021 18:53:06 - INFO - __main__ - Step 20306: {'lr': 0.00019994520356195474, 'samples': 649792, 'steps': 1269, 'loss/train': 3.275275468826294} -09/20/2021 18:53:07 - INFO - __main__ - Step 20307: {'lr': 0.00019994520356195474, 'samples': 649824, 'steps': 1269, 'loss/train': 3.0657167434692383} -09/20/2021 18:53:07 - INFO - __main__ - Step 20308: {'lr': 0.00019994520356195474, 'samples': 649856, 'steps': 1269, 'loss/train': 3.7627670764923096} -09/20/2021 18:53:08 - INFO - __main__ - Step 20309: {'lr': 0.00019994520356195474, 'samples': 649888, 'steps': 1269, 'loss/train': 3.026439905166626} -09/20/2021 18:53:09 - INFO - __main__ - Step 20310: {'lr': 0.00019994520356195474, 'samples': 649920, 'steps': 1269, 'loss/train': 3.709195137023926} -09/20/2021 18:53:10 - INFO - __main__ - Step 20311: {'lr': 0.00019994520356195474, 'samples': 649952, 'steps': 1269, 'loss/train': 3.72725510597229} -09/20/2021 18:53:10 - INFO - __main__ - Step 20312: {'lr': 0.00019994520356195474, 'samples': 649984, 'steps': 1269, 'loss/train': 1.4536523818969727} -09/20/2021 18:53:11 - INFO - __main__ - Step 20313: {'lr': 0.00019994520356195474, 'samples': 650016, 'steps': 1269, 'loss/train': 3.6934468746185303} -09/20/2021 18:53:12 - INFO - __main__ - Step 20314: {'lr': 0.00019994520356195474, 'samples': 650048, 'steps': 1269, 'loss/train': 2.794896364212036} -09/20/2021 18:53:13 - INFO - __main__ - Step 20315: {'lr': 0.00019994520356195474, 'samples': 650080, 'steps': 1269, 'loss/train': 3.1950135231018066} -09/20/2021 18:53:13 - INFO - __main__ - Step 20316: {'lr': 0.00019994520356195474, 'samples': 650112, 'steps': 1269, 'loss/train': 2.915112018585205} -09/20/2021 18:53:15 - INFO - __main__ - Step 20317: {'lr': 0.00019994520356195474, 'samples': 650144, 'steps': 1269, 'loss/train': 3.371826410293579} -09/20/2021 18:53:16 - INFO - __main__ - Step 20318: {'lr': 0.00019994520356195474, 'samples': 650176, 'steps': 1269, 'loss/train': 4.347723007202148} -09/20/2021 18:53:17 - INFO - __main__ - Step 20319: {'lr': 0.00019994520356195474, 'samples': 650208, 'steps': 1269, 'loss/train': 2.3071420192718506} -09/20/2021 18:53:18 - INFO - __main__ - Step 20320: {'lr': 0.00019994520356195474, 'samples': 650240, 'steps': 1269, 'loss/train': 3.777454137802124} -09/20/2021 18:53:19 - INFO - __main__ - Step 20321: {'lr': 0.00019994499221629255, 'samples': 650272, 'steps': 1270, 'loss/train': 2.6734142303466797} -09/20/2021 18:53:19 - INFO - __main__ - Step 20322: {'lr': 0.00019994499221629255, 'samples': 650304, 'steps': 1270, 'loss/train': 3.3146677017211914} -09/20/2021 18:53:20 - INFO - __main__ - Step 20323: {'lr': 0.00019994499221629255, 'samples': 650336, 'steps': 1270, 'loss/train': 2.2870841026306152} -09/20/2021 18:53:21 - INFO - __main__ - Step 20324: {'lr': 0.00019994499221629255, 'samples': 650368, 'steps': 1270, 'loss/train': 2.7142186164855957} -09/20/2021 18:53:22 - INFO - __main__ - Step 20325: {'lr': 0.00019994499221629255, 'samples': 650400, 'steps': 1270, 'loss/train': 3.1946144104003906} -09/20/2021 18:53:22 - INFO - __main__ - Step 20326: {'lr': 0.00019994499221629255, 'samples': 650432, 'steps': 1270, 'loss/train': 0.8878626823425293} -09/20/2021 18:53:23 - INFO - __main__ - Step 20327: {'lr': 0.00019994499221629255, 'samples': 650464, 'steps': 1270, 'loss/train': 1.3953757286071777} -09/20/2021 18:53:24 - INFO - __main__ - Step 20328: {'lr': 0.00019994499221629255, 'samples': 650496, 'steps': 1270, 'loss/train': 3.2910702228546143} -09/20/2021 18:53:24 - INFO - __main__ - Step 20329: {'lr': 0.00019994499221629255, 'samples': 650528, 'steps': 1270, 'loss/train': 2.8691611289978027} -09/20/2021 18:53:25 - INFO - __main__ - Step 20330: {'lr': 0.00019994499221629255, 'samples': 650560, 'steps': 1270, 'loss/train': 3.312080144882202} -09/20/2021 18:53:26 - INFO - __main__ - Step 20331: {'lr': 0.00019994499221629255, 'samples': 650592, 'steps': 1270, 'loss/train': 2.2307229042053223} -09/20/2021 18:53:27 - INFO - __main__ - Step 20332: {'lr': 0.00019994499221629255, 'samples': 650624, 'steps': 1270, 'loss/train': 3.5733723640441895} -09/20/2021 18:53:27 - INFO - __main__ - Step 20333: {'lr': 0.00019994499221629255, 'samples': 650656, 'steps': 1270, 'loss/train': 3.1291918754577637} -09/20/2021 18:53:28 - INFO - __main__ - Step 20334: {'lr': 0.00019994499221629255, 'samples': 650688, 'steps': 1270, 'loss/train': 3.4323923587799072} -09/20/2021 18:53:29 - INFO - __main__ - Step 20335: {'lr': 0.00019994499221629255, 'samples': 650720, 'steps': 1270, 'loss/train': 3.410781145095825} -09/20/2021 18:53:30 - INFO - __main__ - Step 20336: {'lr': 0.00019994499221629255, 'samples': 650752, 'steps': 1270, 'loss/train': 4.2848429679870605} -09/20/2021 18:53:31 - INFO - __main__ - Step 20337: {'lr': 0.00019994478046395458, 'samples': 650784, 'steps': 1271, 'loss/train': 2.6861908435821533} -09/20/2021 18:53:31 - INFO - __main__ - Step 20338: {'lr': 0.00019994478046395458, 'samples': 650816, 'steps': 1271, 'loss/train': 3.256338357925415} -09/20/2021 18:53:32 - INFO - __main__ - Step 20339: {'lr': 0.00019994478046395458, 'samples': 650848, 'steps': 1271, 'loss/train': 3.5204715728759766} -09/20/2021 18:53:33 - INFO - __main__ - Step 20340: {'lr': 0.00019994478046395458, 'samples': 650880, 'steps': 1271, 'loss/train': 2.852006435394287} -09/20/2021 18:53:34 - INFO - __main__ - Step 20341: {'lr': 0.00019994478046395458, 'samples': 650912, 'steps': 1271, 'loss/train': 1.861709475517273} -09/20/2021 18:53:34 - INFO - __main__ - Step 20342: {'lr': 0.00019994478046395458, 'samples': 650944, 'steps': 1271, 'loss/train': 4.325628280639648} -09/20/2021 18:53:35 - INFO - __main__ - Step 20343: {'lr': 0.00019994478046395458, 'samples': 650976, 'steps': 1271, 'loss/train': 4.1513895988464355} -09/20/2021 18:53:36 - INFO - __main__ - Step 20344: {'lr': 0.00019994478046395458, 'samples': 651008, 'steps': 1271, 'loss/train': 4.5511603355407715} -09/20/2021 18:53:37 - INFO - __main__ - Step 20345: {'lr': 0.00019994478046395458, 'samples': 651040, 'steps': 1271, 'loss/train': 3.324207305908203} -09/20/2021 18:53:37 - INFO - __main__ - Step 20346: {'lr': 0.00019994478046395458, 'samples': 651072, 'steps': 1271, 'loss/train': 1.4789034128189087} -09/20/2021 18:53:38 - INFO - __main__ - Step 20347: {'lr': 0.00019994478046395458, 'samples': 651104, 'steps': 1271, 'loss/train': 2.5162906646728516} -09/20/2021 18:53:39 - INFO - __main__ - Step 20348: {'lr': 0.00019994478046395458, 'samples': 651136, 'steps': 1271, 'loss/train': 2.977458953857422} -09/20/2021 18:53:40 - INFO - __main__ - Step 20349: {'lr': 0.00019994478046395458, 'samples': 651168, 'steps': 1271, 'loss/train': 2.3702681064605713} -09/20/2021 18:53:40 - INFO - __main__ - Step 20350: {'lr': 0.00019994478046395458, 'samples': 651200, 'steps': 1271, 'loss/train': 2.6857388019561768} -09/20/2021 18:53:41 - INFO - __main__ - Step 20351: {'lr': 0.00019994478046395458, 'samples': 651232, 'steps': 1271, 'loss/train': 2.221261501312256} -09/20/2021 18:53:42 - INFO - __main__ - Step 20352: {'lr': 0.00019994478046395458, 'samples': 651264, 'steps': 1271, 'loss/train': 2.6816012859344482} -09/20/2021 18:53:43 - INFO - __main__ - Step 20353: {'lr': 0.00019994456830494168, 'samples': 651296, 'steps': 1272, 'loss/train': 2.4473721981048584} -09/20/2021 18:53:44 - INFO - __main__ - Step 20354: {'lr': 0.00019994456830494168, 'samples': 651328, 'steps': 1272, 'loss/train': 1.9873708486557007} -09/20/2021 18:53:44 - INFO - __main__ - Step 20355: {'lr': 0.00019994456830494168, 'samples': 651360, 'steps': 1272, 'loss/train': 2.1189143657684326} -09/20/2021 18:53:45 - INFO - __main__ - Step 20356: {'lr': 0.00019994456830494168, 'samples': 651392, 'steps': 1272, 'loss/train': 2.197783946990967} -09/20/2021 18:53:46 - INFO - __main__ - Step 20357: {'lr': 0.00019994456830494168, 'samples': 651424, 'steps': 1272, 'loss/train': 1.8584473133087158} -09/20/2021 18:53:47 - INFO - __main__ - Step 20358: {'lr': 0.00019994456830494168, 'samples': 651456, 'steps': 1272, 'loss/train': 2.0184757709503174} -09/20/2021 18:53:47 - INFO - __main__ - Step 20359: {'lr': 0.00019994456830494168, 'samples': 651488, 'steps': 1272, 'loss/train': 2.125687837600708} -09/20/2021 18:53:48 - INFO - __main__ - Step 20360: {'lr': 0.00019994456830494168, 'samples': 651520, 'steps': 1272, 'loss/train': 1.8606319427490234} -09/20/2021 18:53:50 - INFO - __main__ - Step 20361: {'lr': 0.00019994456830494168, 'samples': 651552, 'steps': 1272, 'loss/train': 1.885711908340454} -09/20/2021 18:53:51 - INFO - __main__ - Step 20362: {'lr': 0.00019994456830494168, 'samples': 651584, 'steps': 1272, 'loss/train': 3.176318883895874} -09/20/2021 18:53:52 - INFO - __main__ - Step 20363: {'lr': 0.00019994456830494168, 'samples': 651616, 'steps': 1272, 'loss/train': 3.8056271076202393} -09/20/2021 18:53:53 - INFO - __main__ - Step 20364: {'lr': 0.00019994456830494168, 'samples': 651648, 'steps': 1272, 'loss/train': 2.9511444568634033} -09/20/2021 18:53:53 - INFO - __main__ - Step 20365: {'lr': 0.00019994456830494168, 'samples': 651680, 'steps': 1272, 'loss/train': 3.264509677886963} -09/20/2021 18:53:54 - INFO - __main__ - Step 20366: {'lr': 0.00019994456830494168, 'samples': 651712, 'steps': 1272, 'loss/train': 2.955347776412964} -09/20/2021 18:53:55 - INFO - __main__ - Step 20367: {'lr': 0.00019994456830494168, 'samples': 651744, 'steps': 1272, 'loss/train': 2.7294139862060547} -09/20/2021 18:53:56 - INFO - __main__ - Step 20368: {'lr': 0.00019994456830494168, 'samples': 651776, 'steps': 1272, 'loss/train': 3.322516441345215} -09/20/2021 18:53:57 - INFO - __main__ - Step 20369: {'lr': 0.00019994435573925473, 'samples': 651808, 'steps': 1273, 'loss/train': 3.5661990642547607} -09/20/2021 18:53:57 - INFO - __main__ - Step 20370: {'lr': 0.00019994435573925473, 'samples': 651840, 'steps': 1273, 'loss/train': 5.376204013824463} -09/20/2021 18:53:58 - INFO - __main__ - Step 20371: {'lr': 0.00019994435573925473, 'samples': 651872, 'steps': 1273, 'loss/train': 3.22105073928833} -09/20/2021 18:53:59 - INFO - __main__ - Step 20372: {'lr': 0.00019994435573925473, 'samples': 651904, 'steps': 1273, 'loss/train': 3.4683518409729004} -09/20/2021 18:54:00 - INFO - __main__ - Step 20373: {'lr': 0.00019994435573925473, 'samples': 651936, 'steps': 1273, 'loss/train': 3.1327013969421387} -09/20/2021 18:54:00 - INFO - __main__ - Step 20374: {'lr': 0.00019994435573925473, 'samples': 651968, 'steps': 1273, 'loss/train': 0.7562429308891296} -09/20/2021 18:54:01 - INFO - __main__ - Step 20375: {'lr': 0.00019994435573925473, 'samples': 652000, 'steps': 1273, 'loss/train': 4.096607685089111} -09/20/2021 18:54:02 - INFO - __main__ - Step 20376: {'lr': 0.00019994435573925473, 'samples': 652032, 'steps': 1273, 'loss/train': 2.543881893157959} -09/20/2021 18:54:03 - INFO - __main__ - Step 20377: {'lr': 0.00019994435573925473, 'samples': 652064, 'steps': 1273, 'loss/train': 3.942904472351074} -09/20/2021 18:54:03 - INFO - __main__ - Step 20378: {'lr': 0.00019994435573925473, 'samples': 652096, 'steps': 1273, 'loss/train': 3.0758399963378906} -09/20/2021 18:54:04 - INFO - __main__ - Step 20379: {'lr': 0.00019994435573925473, 'samples': 652128, 'steps': 1273, 'loss/train': 2.604922294616699} -09/20/2021 18:54:05 - INFO - __main__ - Step 20380: {'lr': 0.00019994435573925473, 'samples': 652160, 'steps': 1273, 'loss/train': 2.666383743286133} -09/20/2021 18:54:06 - INFO - __main__ - Step 20381: {'lr': 0.00019994435573925473, 'samples': 652192, 'steps': 1273, 'loss/train': 2.721963882446289} -09/20/2021 18:54:06 - INFO - __main__ - Step 20382: {'lr': 0.00019994435573925473, 'samples': 652224, 'steps': 1273, 'loss/train': 3.995208501815796} -09/20/2021 18:54:07 - INFO - __main__ - Step 20383: {'lr': 0.00019994435573925473, 'samples': 652256, 'steps': 1273, 'loss/train': 3.364217519760132} -09/20/2021 18:54:08 - INFO - __main__ - Step 20384: {'lr': 0.00019994435573925473, 'samples': 652288, 'steps': 1273, 'loss/train': 2.308173656463623} -09/20/2021 18:54:09 - INFO - __main__ - Step 20385: {'lr': 0.00019994414276689457, 'samples': 652320, 'steps': 1274, 'loss/train': 2.6306886672973633} -09/20/2021 18:54:09 - INFO - __main__ - Step 20386: {'lr': 0.00019994414276689457, 'samples': 652352, 'steps': 1274, 'loss/train': 2.5141396522521973} -09/20/2021 18:54:10 - INFO - __main__ - Step 20387: {'lr': 0.00019994414276689457, 'samples': 652384, 'steps': 1274, 'loss/train': 1.0799388885498047} -09/20/2021 18:54:11 - INFO - __main__ - Step 20388: {'lr': 0.00019994414276689457, 'samples': 652416, 'steps': 1274, 'loss/train': 0.7016801834106445} -09/20/2021 18:54:12 - INFO - __main__ - Step 20389: {'lr': 0.00019994414276689457, 'samples': 652448, 'steps': 1274, 'loss/train': 1.3377816677093506} -09/20/2021 18:54:12 - INFO - __main__ - Step 20390: {'lr': 0.00019994414276689457, 'samples': 652480, 'steps': 1274, 'loss/train': 2.397772789001465} -09/20/2021 18:54:13 - INFO - __main__ - Step 20391: {'lr': 0.00019994414276689457, 'samples': 652512, 'steps': 1274, 'loss/train': 0.7287428379058838} -09/20/2021 18:54:14 - INFO - __main__ - Step 20392: {'lr': 0.00019994414276689457, 'samples': 652544, 'steps': 1274, 'loss/train': 3.2866482734680176} -09/20/2021 18:54:15 - INFO - __main__ - Step 20393: {'lr': 0.00019994414276689457, 'samples': 652576, 'steps': 1274, 'loss/train': 3.5748486518859863} -09/20/2021 18:54:16 - INFO - __main__ - Step 20394: {'lr': 0.00019994414276689457, 'samples': 652608, 'steps': 1274, 'loss/train': 3.62393856048584} -09/20/2021 18:54:17 - INFO - __main__ - Step 20395: {'lr': 0.00019994414276689457, 'samples': 652640, 'steps': 1274, 'loss/train': 2.281165838241577} -09/20/2021 18:54:17 - INFO - __main__ - Step 20396: {'lr': 0.00019994414276689457, 'samples': 652672, 'steps': 1274, 'loss/train': 3.4104526042938232} -09/20/2021 18:54:18 - INFO - __main__ - Step 20397: {'lr': 0.00019994414276689457, 'samples': 652704, 'steps': 1274, 'loss/train': 3.2467737197875977} -09/20/2021 18:54:19 - INFO - __main__ - Step 20398: {'lr': 0.00019994414276689457, 'samples': 652736, 'steps': 1274, 'loss/train': 3.8621158599853516} -09/20/2021 18:54:20 - INFO - __main__ - Step 20399: {'lr': 0.00019994414276689457, 'samples': 652768, 'steps': 1274, 'loss/train': 4.849239349365234} -09/20/2021 18:54:20 - INFO - __main__ - Step 20400: {'lr': 0.00019994414276689457, 'samples': 652800, 'steps': 1274, 'loss/train': 0.34063658118247986} -09/20/2021 18:54:21 - INFO - __main__ - Step 20401: {'lr': 0.0001999439293878621, 'samples': 652832, 'steps': 1275, 'loss/train': 2.9917683601379395} -09/20/2021 18:54:22 - INFO - __main__ - Step 20402: {'lr': 0.0001999439293878621, 'samples': 652864, 'steps': 1275, 'loss/train': 3.3528573513031006} -09/20/2021 18:54:23 - INFO - __main__ - Step 20403: {'lr': 0.0001999439293878621, 'samples': 652896, 'steps': 1275, 'loss/train': 2.9648473262786865} -09/20/2021 18:54:24 - INFO - __main__ - Step 20404: {'lr': 0.0001999439293878621, 'samples': 652928, 'steps': 1275, 'loss/train': 3.743905782699585} -09/20/2021 18:54:24 - INFO - __main__ - Step 20405: {'lr': 0.0001999439293878621, 'samples': 652960, 'steps': 1275, 'loss/train': 3.743847370147705} -09/20/2021 18:54:25 - INFO - __main__ - Step 20406: {'lr': 0.0001999439293878621, 'samples': 652992, 'steps': 1275, 'loss/train': 3.047645330429077} -09/20/2021 18:54:26 - INFO - __main__ - Step 20407: {'lr': 0.0001999439293878621, 'samples': 653024, 'steps': 1275, 'loss/train': 4.179439067840576} -09/20/2021 18:54:27 - INFO - __main__ - Step 20408: {'lr': 0.0001999439293878621, 'samples': 653056, 'steps': 1275, 'loss/train': 4.129630088806152} -09/20/2021 18:54:27 - INFO - __main__ - Step 20409: {'lr': 0.0001999439293878621, 'samples': 653088, 'steps': 1275, 'loss/train': 2.7530219554901123} -09/20/2021 18:54:28 - INFO - __main__ - Step 20410: {'lr': 0.0001999439293878621, 'samples': 653120, 'steps': 1275, 'loss/train': 3.195478677749634} -09/20/2021 18:54:29 - INFO - __main__ - Step 20411: {'lr': 0.0001999439293878621, 'samples': 653152, 'steps': 1275, 'loss/train': 3.0007965564727783} -09/20/2021 18:54:30 - INFO - __main__ - Step 20412: {'lr': 0.0001999439293878621, 'samples': 653184, 'steps': 1275, 'loss/train': 4.274219989776611} -09/20/2021 18:54:30 - INFO - __main__ - Step 20413: {'lr': 0.0001999439293878621, 'samples': 653216, 'steps': 1275, 'loss/train': 3.6915903091430664} -09/20/2021 18:54:31 - INFO - __main__ - Step 20414: {'lr': 0.0001999439293878621, 'samples': 653248, 'steps': 1275, 'loss/train': 3.638984441757202} -09/20/2021 18:54:32 - INFO - __main__ - Step 20415: {'lr': 0.0001999439293878621, 'samples': 653280, 'steps': 1275, 'loss/train': 4.146304607391357} -09/20/2021 18:54:33 - INFO - __main__ - Step 20416: {'lr': 0.0001999439293878621, 'samples': 653312, 'steps': 1275, 'loss/train': 3.2898671627044678} -09/20/2021 18:54:34 - INFO - __main__ - Step 20417: {'lr': 0.00019994371560215813, 'samples': 653344, 'steps': 1276, 'loss/train': 2.9500463008880615} -09/20/2021 18:54:34 - INFO - __main__ - Step 20418: {'lr': 0.00019994371560215813, 'samples': 653376, 'steps': 1276, 'loss/train': 3.187685012817383} -09/20/2021 18:54:35 - INFO - __main__ - Step 20419: {'lr': 0.00019994371560215813, 'samples': 653408, 'steps': 1276, 'loss/train': 2.871403455734253} -09/20/2021 18:54:36 - INFO - __main__ - Step 20420: {'lr': 0.00019994371560215813, 'samples': 653440, 'steps': 1276, 'loss/train': 3.607762098312378} -09/20/2021 18:54:37 - INFO - __main__ - Step 20421: {'lr': 0.00019994371560215813, 'samples': 653472, 'steps': 1276, 'loss/train': 2.9741528034210205} -09/20/2021 18:54:37 - INFO - __main__ - Step 20422: {'lr': 0.00019994371560215813, 'samples': 653504, 'steps': 1276, 'loss/train': 1.8765772581100464} -09/20/2021 18:54:38 - INFO - __main__ - Step 20423: {'lr': 0.00019994371560215813, 'samples': 653536, 'steps': 1276, 'loss/train': 1.5498344898223877} -09/20/2021 18:54:40 - INFO - __main__ - Step 20424: {'lr': 0.00019994371560215813, 'samples': 653568, 'steps': 1276, 'loss/train': 2.697913408279419} -09/20/2021 18:54:40 - INFO - __main__ - Step 20425: {'lr': 0.00019994371560215813, 'samples': 653600, 'steps': 1276, 'loss/train': 3.4394783973693848} -09/20/2021 18:54:41 - INFO - __main__ - Step 20426: {'lr': 0.00019994371560215813, 'samples': 653632, 'steps': 1276, 'loss/train': 3.814347267150879} -09/20/2021 18:54:42 - INFO - __main__ - Step 20427: {'lr': 0.00019994371560215813, 'samples': 653664, 'steps': 1276, 'loss/train': 3.363805055618286} -09/20/2021 18:54:43 - INFO - __main__ - Step 20428: {'lr': 0.00019994371560215813, 'samples': 653696, 'steps': 1276, 'loss/train': 2.8208940029144287} -09/20/2021 18:54:43 - INFO - __main__ - Step 20429: {'lr': 0.00019994371560215813, 'samples': 653728, 'steps': 1276, 'loss/train': 3.6470725536346436} -09/20/2021 18:54:44 - INFO - __main__ - Step 20430: {'lr': 0.00019994371560215813, 'samples': 653760, 'steps': 1276, 'loss/train': 3.0854806900024414} -09/20/2021 18:54:45 - INFO - __main__ - Step 20431: {'lr': 0.00019994371560215813, 'samples': 653792, 'steps': 1276, 'loss/train': 4.25943660736084} -09/20/2021 18:54:46 - INFO - __main__ - Step 20432: {'lr': 0.00019994371560215813, 'samples': 653824, 'steps': 1276, 'loss/train': 3.1843760013580322} -09/20/2021 18:54:46 - INFO - __main__ - Step 20433: {'lr': 0.0001999435014097836, 'samples': 653856, 'steps': 1277, 'loss/train': 2.0563337802886963} -09/20/2021 18:54:47 - INFO - __main__ - Step 20434: {'lr': 0.0001999435014097836, 'samples': 653888, 'steps': 1277, 'loss/train': 2.1308231353759766} -09/20/2021 18:54:48 - INFO - __main__ - Step 20435: {'lr': 0.0001999435014097836, 'samples': 653920, 'steps': 1277, 'loss/train': 2.2424137592315674} -09/20/2021 18:54:49 - INFO - __main__ - Step 20436: {'lr': 0.0001999435014097836, 'samples': 653952, 'steps': 1277, 'loss/train': 2.0141139030456543} -09/20/2021 18:54:49 - INFO - __main__ - Step 20437: {'lr': 0.0001999435014097836, 'samples': 653984, 'steps': 1277, 'loss/train': 2.437039852142334} -09/20/2021 18:54:50 - INFO - __main__ - Step 20438: {'lr': 0.0001999435014097836, 'samples': 654016, 'steps': 1277, 'loss/train': 4.016582012176514} -09/20/2021 18:54:51 - INFO - __main__ - Step 20439: {'lr': 0.0001999435014097836, 'samples': 654048, 'steps': 1277, 'loss/train': 3.045172691345215} -09/20/2021 18:54:52 - INFO - __main__ - Step 20440: {'lr': 0.0001999435014097836, 'samples': 654080, 'steps': 1277, 'loss/train': 3.32501482963562} -09/20/2021 18:54:52 - INFO - __main__ - Step 20441: {'lr': 0.0001999435014097836, 'samples': 654112, 'steps': 1277, 'loss/train': 3.1637370586395264} -09/20/2021 18:54:53 - INFO - __main__ - Step 20442: {'lr': 0.0001999435014097836, 'samples': 654144, 'steps': 1277, 'loss/train': 3.326603889465332} -09/20/2021 18:54:54 - INFO - __main__ - Step 20443: {'lr': 0.0001999435014097836, 'samples': 654176, 'steps': 1277, 'loss/train': 3.4132542610168457} -09/20/2021 18:54:55 - INFO - __main__ - Step 20444: {'lr': 0.0001999435014097836, 'samples': 654208, 'steps': 1277, 'loss/train': 1.7059757709503174} -09/20/2021 18:54:55 - INFO - __main__ - Step 20445: {'lr': 0.0001999435014097836, 'samples': 654240, 'steps': 1277, 'loss/train': 3.1316757202148438} -09/20/2021 18:54:56 - INFO - __main__ - Step 20446: {'lr': 0.0001999435014097836, 'samples': 654272, 'steps': 1277, 'loss/train': 3.415405035018921} -09/20/2021 18:54:57 - INFO - __main__ - Step 20447: {'lr': 0.0001999435014097836, 'samples': 654304, 'steps': 1277, 'loss/train': 4.034862041473389} -09/20/2021 18:54:58 - INFO - __main__ - Step 20448: {'lr': 0.0001999435014097836, 'samples': 654336, 'steps': 1277, 'loss/train': 3.3350393772125244} -09/20/2021 18:54:59 - INFO - __main__ - Step 20449: {'lr': 0.00019994328681073934, 'samples': 654368, 'steps': 1278, 'loss/train': 2.914928913116455} -09/20/2021 18:54:59 - INFO - __main__ - Step 20450: {'lr': 0.00019994328681073934, 'samples': 654400, 'steps': 1278, 'loss/train': 2.710008144378662} -09/20/2021 18:55:00 - INFO - __main__ - Step 20451: {'lr': 0.00019994328681073934, 'samples': 654432, 'steps': 1278, 'loss/train': 3.1597089767456055} -09/20/2021 18:55:01 - INFO - __main__ - Step 20452: {'lr': 0.00019994328681073934, 'samples': 654464, 'steps': 1278, 'loss/train': 3.3118951320648193} -09/20/2021 18:55:02 - INFO - __main__ - Step 20453: {'lr': 0.00019994328681073934, 'samples': 654496, 'steps': 1278, 'loss/train': 3.652987003326416} -09/20/2021 18:55:02 - INFO - __main__ - Step 20454: {'lr': 0.00019994328681073934, 'samples': 654528, 'steps': 1278, 'loss/train': 4.641627788543701} -09/20/2021 18:55:03 - INFO - __main__ - Step 20455: {'lr': 0.00019994328681073934, 'samples': 654560, 'steps': 1278, 'loss/train': 1.9636253118515015} -09/20/2021 18:55:04 - INFO - __main__ - Step 20456: {'lr': 0.00019994328681073934, 'samples': 654592, 'steps': 1278, 'loss/train': 3.8177952766418457} -09/20/2021 18:55:05 - INFO - __main__ - Step 20457: {'lr': 0.00019994328681073934, 'samples': 654624, 'steps': 1278, 'loss/train': 2.5658609867095947} -09/20/2021 18:55:06 - INFO - __main__ - Step 20458: {'lr': 0.00019994328681073934, 'samples': 654656, 'steps': 1278, 'loss/train': 3.4420218467712402} -09/20/2021 18:55:07 - INFO - __main__ - Step 20459: {'lr': 0.00019994328681073934, 'samples': 654688, 'steps': 1278, 'loss/train': 3.4836010932922363} -09/20/2021 18:55:07 - INFO - __main__ - Step 20460: {'lr': 0.00019994328681073934, 'samples': 654720, 'steps': 1278, 'loss/train': 2.6684951782226562} -09/20/2021 18:55:08 - INFO - __main__ - Step 20461: {'lr': 0.00019994328681073934, 'samples': 654752, 'steps': 1278, 'loss/train': 3.18229079246521} -09/20/2021 18:55:09 - INFO - __main__ - Step 20462: {'lr': 0.00019994328681073934, 'samples': 654784, 'steps': 1278, 'loss/train': 4.52994441986084} -09/20/2021 18:55:10 - INFO - __main__ - Step 20463: {'lr': 0.00019994328681073934, 'samples': 654816, 'steps': 1278, 'loss/train': 4.35183048248291} -09/20/2021 18:55:10 - INFO - __main__ - Step 20464: {'lr': 0.00019994328681073934, 'samples': 654848, 'steps': 1278, 'loss/train': 2.7708897590637207} -09/20/2021 18:55:11 - INFO - __main__ - Step 20465: {'lr': 0.00019994307180502623, 'samples': 654880, 'steps': 1279, 'loss/train': 3.3282859325408936} -09/20/2021 18:55:12 - INFO - __main__ - Step 20466: {'lr': 0.00019994307180502623, 'samples': 654912, 'steps': 1279, 'loss/train': 3.2570412158966064} -09/20/2021 18:55:13 - INFO - __main__ - Step 20467: {'lr': 0.00019994307180502623, 'samples': 654944, 'steps': 1279, 'loss/train': 3.6328136920928955} -09/20/2021 18:55:14 - INFO - __main__ - Step 20468: {'lr': 0.00019994307180502623, 'samples': 654976, 'steps': 1279, 'loss/train': 3.6911234855651855} -09/20/2021 18:55:14 - INFO - __main__ - Step 20469: {'lr': 0.00019994307180502623, 'samples': 655008, 'steps': 1279, 'loss/train': 4.099597454071045} -09/20/2021 18:55:15 - INFO - __main__ - Step 20470: {'lr': 0.00019994307180502623, 'samples': 655040, 'steps': 1279, 'loss/train': 4.0084638595581055} -09/20/2021 18:55:16 - INFO - __main__ - Step 20471: {'lr': 0.00019994307180502623, 'samples': 655072, 'steps': 1279, 'loss/train': 3.6846706867218018} -09/20/2021 18:55:17 - INFO - __main__ - Step 20472: {'lr': 0.00019994307180502623, 'samples': 655104, 'steps': 1279, 'loss/train': 2.3882558345794678} -09/20/2021 18:55:17 - INFO - __main__ - Step 20473: {'lr': 0.00019994307180502623, 'samples': 655136, 'steps': 1279, 'loss/train': 3.4135375022888184} -09/20/2021 18:55:18 - INFO - __main__ - Step 20474: {'lr': 0.00019994307180502623, 'samples': 655168, 'steps': 1279, 'loss/train': 3.7159245014190674} -09/20/2021 18:55:19 - INFO - __main__ - Step 20475: {'lr': 0.00019994307180502623, 'samples': 655200, 'steps': 1279, 'loss/train': 2.5727176666259766} -09/20/2021 18:55:20 - INFO - __main__ - Step 20476: {'lr': 0.00019994307180502623, 'samples': 655232, 'steps': 1279, 'loss/train': 2.261064291000366} -09/20/2021 18:55:20 - INFO - __main__ - Step 20477: {'lr': 0.00019994307180502623, 'samples': 655264, 'steps': 1279, 'loss/train': 3.4403977394104004} -09/20/2021 18:55:21 - INFO - __main__ - Step 20478: {'lr': 0.00019994307180502623, 'samples': 655296, 'steps': 1279, 'loss/train': 2.624427556991577} -09/20/2021 18:55:22 - INFO - __main__ - Step 20479: {'lr': 0.00019994307180502623, 'samples': 655328, 'steps': 1279, 'loss/train': 1.0776236057281494} -09/20/2021 18:55:23 - INFO - __main__ - Step 20480: {'lr': 0.00019994307180502623, 'samples': 655360, 'steps': 1279, 'loss/train': 3.162811517715454} -09/20/2021 18:55:23 - INFO - __main__ - Step 20481: {'lr': 0.00019994285639264518, 'samples': 655392, 'steps': 1280, 'loss/train': 3.056995153427124} -09/20/2021 18:55:24 - INFO - __main__ - Step 20482: {'lr': 0.00019994285639264518, 'samples': 655424, 'steps': 1280, 'loss/train': 3.369203567504883} -09/20/2021 18:55:25 - INFO - __main__ - Step 20483: {'lr': 0.00019994285639264518, 'samples': 655456, 'steps': 1280, 'loss/train': 3.5862252712249756} -09/20/2021 18:55:26 - INFO - __main__ - Step 20484: {'lr': 0.00019994285639264518, 'samples': 655488, 'steps': 1280, 'loss/train': 2.462693691253662} -09/20/2021 18:55:26 - INFO - __main__ - Step 20485: {'lr': 0.00019994285639264518, 'samples': 655520, 'steps': 1280, 'loss/train': 3.434943675994873} -09/20/2021 18:55:27 - INFO - __main__ - Step 20486: {'lr': 0.00019994285639264518, 'samples': 655552, 'steps': 1280, 'loss/train': 3.3064651489257812} -09/20/2021 18:55:28 - INFO - __main__ - Step 20487: {'lr': 0.00019994285639264518, 'samples': 655584, 'steps': 1280, 'loss/train': 3.206730365753174} -09/20/2021 18:55:29 - INFO - __main__ - Step 20488: {'lr': 0.00019994285639264518, 'samples': 655616, 'steps': 1280, 'loss/train': 3.165469169616699} -09/20/2021 18:55:30 - INFO - __main__ - Step 20489: {'lr': 0.00019994285639264518, 'samples': 655648, 'steps': 1280, 'loss/train': 3.0244343280792236} -09/20/2021 18:55:31 - INFO - __main__ - Step 20490: {'lr': 0.00019994285639264518, 'samples': 655680, 'steps': 1280, 'loss/train': 3.400182008743286} -09/20/2021 18:55:31 - INFO - __main__ - Step 20491: {'lr': 0.00019994285639264518, 'samples': 655712, 'steps': 1280, 'loss/train': 3.007606267929077} -09/20/2021 18:55:32 - INFO - __main__ - Step 20492: {'lr': 0.00019994285639264518, 'samples': 655744, 'steps': 1280, 'loss/train': 2.274521589279175} -09/20/2021 18:55:33 - INFO - __main__ - Step 20493: {'lr': 0.00019994285639264518, 'samples': 655776, 'steps': 1280, 'loss/train': 4.0125203132629395} -09/20/2021 18:55:34 - INFO - __main__ - Step 20494: {'lr': 0.00019994285639264518, 'samples': 655808, 'steps': 1280, 'loss/train': 2.8175857067108154} -09/20/2021 18:55:34 - INFO - __main__ - Step 20495: {'lr': 0.00019994285639264518, 'samples': 655840, 'steps': 1280, 'loss/train': 3.404487133026123} -09/20/2021 18:55:35 - INFO - __main__ - Step 20496: {'lr': 0.00019994285639264518, 'samples': 655872, 'steps': 1280, 'loss/train': 3.059617280960083} -09/20/2021 18:55:36 - INFO - __main__ - Step 20497: {'lr': 0.000199942640573597, 'samples': 655904, 'steps': 1281, 'loss/train': 3.5045764446258545} -09/20/2021 18:55:37 - INFO - __main__ - Step 20498: {'lr': 0.000199942640573597, 'samples': 655936, 'steps': 1281, 'loss/train': 3.6902167797088623} -09/20/2021 18:55:38 - INFO - __main__ - Step 20499: {'lr': 0.000199942640573597, 'samples': 655968, 'steps': 1281, 'loss/train': 3.3681488037109375} -09/20/2021 18:55:38 - INFO - __main__ - Step 20500: {'lr': 0.000199942640573597, 'samples': 656000, 'steps': 1281, 'loss/train': 3.0131237506866455} -09/20/2021 18:55:39 - INFO - __main__ - Step 20501: {'lr': 0.000199942640573597, 'samples': 656032, 'steps': 1281, 'loss/train': 2.6131842136383057} -09/20/2021 18:55:40 - INFO - __main__ - Step 20502: {'lr': 0.000199942640573597, 'samples': 656064, 'steps': 1281, 'loss/train': 3.6661415100097656} -09/20/2021 18:55:41 - INFO - __main__ - Step 20503: {'lr': 0.000199942640573597, 'samples': 656096, 'steps': 1281, 'loss/train': 3.882108449935913} -09/20/2021 18:55:41 - INFO - __main__ - Step 20504: {'lr': 0.000199942640573597, 'samples': 656128, 'steps': 1281, 'loss/train': 3.8879504203796387} -09/20/2021 18:55:42 - INFO - __main__ - Step 20505: {'lr': 0.000199942640573597, 'samples': 656160, 'steps': 1281, 'loss/train': 3.618072032928467} -09/20/2021 18:55:43 - INFO - __main__ - Step 20506: {'lr': 0.000199942640573597, 'samples': 656192, 'steps': 1281, 'loss/train': 3.1662375926971436} -09/20/2021 18:55:44 - INFO - __main__ - Step 20507: {'lr': 0.000199942640573597, 'samples': 656224, 'steps': 1281, 'loss/train': 4.2869415283203125} -09/20/2021 18:55:44 - INFO - __main__ - Step 20508: {'lr': 0.000199942640573597, 'samples': 656256, 'steps': 1281, 'loss/train': 2.7526609897613525} -09/20/2021 18:55:45 - INFO - __main__ - Step 20509: {'lr': 0.000199942640573597, 'samples': 656288, 'steps': 1281, 'loss/train': 4.352883338928223} -09/20/2021 18:55:46 - INFO - __main__ - Step 20510: {'lr': 0.000199942640573597, 'samples': 656320, 'steps': 1281, 'loss/train': 2.445540428161621} -09/20/2021 18:55:47 - INFO - __main__ - Step 20511: {'lr': 0.000199942640573597, 'samples': 656352, 'steps': 1281, 'loss/train': 3.7266314029693604} -09/20/2021 18:55:47 - INFO - __main__ - Step 20512: {'lr': 0.000199942640573597, 'samples': 656384, 'steps': 1281, 'loss/train': 3.8776214122772217} -09/20/2021 18:55:48 - INFO - __main__ - Step 20513: {'lr': 0.00019994242434788262, 'samples': 656416, 'steps': 1282, 'loss/train': 3.5619349479675293} -09/20/2021 18:55:49 - INFO - __main__ - Step 20514: {'lr': 0.00019994242434788262, 'samples': 656448, 'steps': 1282, 'loss/train': 3.6530919075012207} -09/20/2021 18:55:50 - INFO - __main__ - Step 20515: {'lr': 0.00019994242434788262, 'samples': 656480, 'steps': 1282, 'loss/train': 5.8643670082092285} -09/20/2021 18:55:50 - INFO - __main__ - Step 20516: {'lr': 0.00019994242434788262, 'samples': 656512, 'steps': 1282, 'loss/train': 3.8262104988098145} -09/20/2021 18:55:51 - INFO - __main__ - Step 20517: {'lr': 0.00019994242434788262, 'samples': 656544, 'steps': 1282, 'loss/train': 3.7054238319396973} -09/20/2021 18:55:53 - INFO - __main__ - Step 20518: {'lr': 0.00019994242434788262, 'samples': 656576, 'steps': 1282, 'loss/train': 3.4200260639190674} -09/20/2021 18:55:53 - INFO - __main__ - Step 20519: {'lr': 0.00019994242434788262, 'samples': 656608, 'steps': 1282, 'loss/train': 2.457956552505493} -09/20/2021 18:55:54 - INFO - __main__ - Step 20520: {'lr': 0.00019994242434788262, 'samples': 656640, 'steps': 1282, 'loss/train': 2.7871298789978027} -09/20/2021 18:55:55 - INFO - __main__ - Step 20521: {'lr': 0.00019994242434788262, 'samples': 656672, 'steps': 1282, 'loss/train': 3.1091232299804688} -09/20/2021 18:55:56 - INFO - __main__ - Step 20522: {'lr': 0.00019994242434788262, 'samples': 656704, 'steps': 1282, 'loss/train': 3.5043187141418457} -09/20/2021 18:55:56 - INFO - __main__ - Step 20523: {'lr': 0.00019994242434788262, 'samples': 656736, 'steps': 1282, 'loss/train': 3.858572244644165} -09/20/2021 18:55:57 - INFO - __main__ - Step 20524: {'lr': 0.00019994242434788262, 'samples': 656768, 'steps': 1282, 'loss/train': 4.936466693878174} -09/20/2021 18:55:58 - INFO - __main__ - Step 20525: {'lr': 0.00019994242434788262, 'samples': 656800, 'steps': 1282, 'loss/train': 2.574655771255493} -09/20/2021 18:55:59 - INFO - __main__ - Step 20526: {'lr': 0.00019994242434788262, 'samples': 656832, 'steps': 1282, 'loss/train': 3.2070884704589844} -09/20/2021 18:55:59 - INFO - __main__ - Step 20527: {'lr': 0.00019994242434788262, 'samples': 656864, 'steps': 1282, 'loss/train': 4.235174179077148} -09/20/2021 18:56:00 - INFO - __main__ - Step 20528: {'lr': 0.00019994242434788262, 'samples': 656896, 'steps': 1282, 'loss/train': 4.871456146240234} -09/20/2021 18:56:01 - INFO - __main__ - Step 20529: {'lr': 0.00019994220771550288, 'samples': 656928, 'steps': 1283, 'loss/train': 5.0291948318481445} -09/20/2021 18:56:02 - INFO - __main__ - Step 20530: {'lr': 0.00019994220771550288, 'samples': 656960, 'steps': 1283, 'loss/train': 4.922481536865234} -09/20/2021 18:56:03 - INFO - __main__ - Step 20531: {'lr': 0.00019994220771550288, 'samples': 656992, 'steps': 1283, 'loss/train': 3.58052921295166} -09/20/2021 18:56:03 - INFO - __main__ - Step 20532: {'lr': 0.00019994220771550288, 'samples': 657024, 'steps': 1283, 'loss/train': 3.430886745452881} -09/20/2021 18:56:04 - INFO - __main__ - Step 20533: {'lr': 0.00019994220771550288, 'samples': 657056, 'steps': 1283, 'loss/train': 3.8416502475738525} -09/20/2021 18:56:05 - INFO - __main__ - Step 20534: {'lr': 0.00019994220771550288, 'samples': 657088, 'steps': 1283, 'loss/train': 3.4344496726989746} -09/20/2021 18:56:06 - INFO - __main__ - Step 20535: {'lr': 0.00019994220771550288, 'samples': 657120, 'steps': 1283, 'loss/train': 4.150901794433594} -09/20/2021 18:56:06 - INFO - __main__ - Step 20536: {'lr': 0.00019994220771550288, 'samples': 657152, 'steps': 1283, 'loss/train': 4.6362810134887695} -09/20/2021 18:56:07 - INFO - __main__ - Step 20537: {'lr': 0.00019994220771550288, 'samples': 657184, 'steps': 1283, 'loss/train': 3.486339807510376} -09/20/2021 18:56:08 - INFO - __main__ - Step 20538: {'lr': 0.00019994220771550288, 'samples': 657216, 'steps': 1283, 'loss/train': 3.139449119567871} -09/20/2021 18:56:09 - INFO - __main__ - Step 20539: {'lr': 0.00019994220771550288, 'samples': 657248, 'steps': 1283, 'loss/train': 3.534567356109619} -09/20/2021 18:56:09 - INFO - __main__ - Step 20540: {'lr': 0.00019994220771550288, 'samples': 657280, 'steps': 1283, 'loss/train': 6.756768703460693} -09/20/2021 18:56:10 - INFO - __main__ - Step 20541: {'lr': 0.00019994220771550288, 'samples': 657312, 'steps': 1283, 'loss/train': 2.435582399368286} -09/20/2021 18:56:11 - INFO - __main__ - Step 20542: {'lr': 0.00019994220771550288, 'samples': 657344, 'steps': 1283, 'loss/train': 3.250126361846924} -09/20/2021 18:56:12 - INFO - __main__ - Step 20543: {'lr': 0.00019994220771550288, 'samples': 657376, 'steps': 1283, 'loss/train': 3.975971221923828} -09/20/2021 18:56:12 - INFO - __main__ - Step 20544: {'lr': 0.00019994220771550288, 'samples': 657408, 'steps': 1283, 'loss/train': 3.300255298614502} -09/20/2021 18:56:13 - INFO - __main__ - Step 20545: {'lr': 0.0001999419906764587, 'samples': 657440, 'steps': 1284, 'loss/train': 3.4281067848205566} -09/20/2021 18:56:14 - INFO - __main__ - Step 20546: {'lr': 0.0001999419906764587, 'samples': 657472, 'steps': 1284, 'loss/train': 3.336681604385376} -09/20/2021 18:56:15 - INFO - __main__ - Step 20547: {'lr': 0.0001999419906764587, 'samples': 657504, 'steps': 1284, 'loss/train': 1.8108241558074951} -09/20/2021 18:56:15 - INFO - __main__ - Step 20548: {'lr': 0.0001999419906764587, 'samples': 657536, 'steps': 1284, 'loss/train': 3.961749792098999} -09/20/2021 18:56:17 - INFO - __main__ - Step 20549: {'lr': 0.0001999419906764587, 'samples': 657568, 'steps': 1284, 'loss/train': 3.4328653812408447} -09/20/2021 18:56:17 - INFO - __main__ - Step 20550: {'lr': 0.0001999419906764587, 'samples': 657600, 'steps': 1284, 'loss/train': 3.6169795989990234} -09/20/2021 18:56:18 - INFO - __main__ - Step 20551: {'lr': 0.0001999419906764587, 'samples': 657632, 'steps': 1284, 'loss/train': 3.763690233230591} -09/20/2021 18:56:19 - INFO - __main__ - Step 20552: {'lr': 0.0001999419906764587, 'samples': 657664, 'steps': 1284, 'loss/train': 4.490593910217285} -09/20/2021 18:56:20 - INFO - __main__ - Step 20553: {'lr': 0.0001999419906764587, 'samples': 657696, 'steps': 1284, 'loss/train': 2.8279242515563965} -09/20/2021 18:56:20 - INFO - __main__ - Step 20554: {'lr': 0.0001999419906764587, 'samples': 657728, 'steps': 1284, 'loss/train': 2.74550199508667} -09/20/2021 18:56:21 - INFO - __main__ - Step 20555: {'lr': 0.0001999419906764587, 'samples': 657760, 'steps': 1284, 'loss/train': 3.004354476928711} -09/20/2021 18:56:22 - INFO - __main__ - Step 20556: {'lr': 0.0001999419906764587, 'samples': 657792, 'steps': 1284, 'loss/train': 3.502044916152954} -09/20/2021 18:56:23 - INFO - __main__ - Step 20557: {'lr': 0.0001999419906764587, 'samples': 657824, 'steps': 1284, 'loss/train': 3.3742785453796387} -09/20/2021 18:56:23 - INFO - __main__ - Step 20558: {'lr': 0.0001999419906764587, 'samples': 657856, 'steps': 1284, 'loss/train': 3.572380781173706} -09/20/2021 18:56:24 - INFO - __main__ - Step 20559: {'lr': 0.0001999419906764587, 'samples': 657888, 'steps': 1284, 'loss/train': 3.485551595687866} -09/20/2021 18:56:25 - INFO - __main__ - Step 20560: {'lr': 0.0001999419906764587, 'samples': 657920, 'steps': 1284, 'loss/train': 4.062043190002441} -09/20/2021 18:56:26 - INFO - __main__ - Step 20561: {'lr': 0.00019994177323075097, 'samples': 657952, 'steps': 1285, 'loss/train': 4.271667003631592} -09/20/2021 18:56:27 - INFO - __main__ - Step 20562: {'lr': 0.00019994177323075097, 'samples': 657984, 'steps': 1285, 'loss/train': 3.352389335632324} -09/20/2021 18:56:27 - INFO - __main__ - Step 20563: {'lr': 0.00019994177323075097, 'samples': 658016, 'steps': 1285, 'loss/train': 4.010480880737305} -09/20/2021 18:56:28 - INFO - __main__ - Step 20564: {'lr': 0.00019994177323075097, 'samples': 658048, 'steps': 1285, 'loss/train': 0.8582269549369812} -09/20/2021 18:56:29 - INFO - __main__ - Step 20565: {'lr': 0.00019994177323075097, 'samples': 658080, 'steps': 1285, 'loss/train': 2.577242374420166} -09/20/2021 18:56:30 - INFO - __main__ - Step 20566: {'lr': 0.00019994177323075097, 'samples': 658112, 'steps': 1285, 'loss/train': 1.5902386903762817} -09/20/2021 18:56:30 - INFO - __main__ - Step 20567: {'lr': 0.00019994177323075097, 'samples': 658144, 'steps': 1285, 'loss/train': 3.2278573513031006} -09/20/2021 18:56:31 - INFO - __main__ - Step 20568: {'lr': 0.00019994177323075097, 'samples': 658176, 'steps': 1285, 'loss/train': 2.726928234100342} -09/20/2021 18:56:32 - INFO - __main__ - Step 20569: {'lr': 0.00019994177323075097, 'samples': 658208, 'steps': 1285, 'loss/train': 3.262986660003662} -09/20/2021 18:56:33 - INFO - __main__ - Step 20570: {'lr': 0.00019994177323075097, 'samples': 658240, 'steps': 1285, 'loss/train': 3.87634539604187} -09/20/2021 18:56:33 - INFO - __main__ - Step 20571: {'lr': 0.00019994177323075097, 'samples': 658272, 'steps': 1285, 'loss/train': 3.448821783065796} -09/20/2021 18:56:34 - INFO - __main__ - Step 20572: {'lr': 0.00019994177323075097, 'samples': 658304, 'steps': 1285, 'loss/train': 3.167949676513672} -09/20/2021 18:56:35 - INFO - __main__ - Step 20573: {'lr': 0.00019994177323075097, 'samples': 658336, 'steps': 1285, 'loss/train': 2.4759514331817627} -09/20/2021 18:56:36 - INFO - __main__ - Step 20574: {'lr': 0.00019994177323075097, 'samples': 658368, 'steps': 1285, 'loss/train': 3.208662748336792} -09/20/2021 18:56:36 - INFO - __main__ - Step 20575: {'lr': 0.00019994177323075097, 'samples': 658400, 'steps': 1285, 'loss/train': 3.8108108043670654} -09/20/2021 18:56:37 - INFO - __main__ - Step 20576: {'lr': 0.00019994177323075097, 'samples': 658432, 'steps': 1285, 'loss/train': 3.3596715927124023} -09/20/2021 18:56:38 - INFO - __main__ - Step 20577: {'lr': 0.00019994155537838055, 'samples': 658464, 'steps': 1286, 'loss/train': 2.081648588180542} -09/20/2021 18:56:39 - INFO - __main__ - Step 20578: {'lr': 0.00019994155537838055, 'samples': 658496, 'steps': 1286, 'loss/train': 4.33118200302124} -09/20/2021 18:56:39 - INFO - __main__ - Step 20579: {'lr': 0.00019994155537838055, 'samples': 658528, 'steps': 1286, 'loss/train': 4.078864574432373} -09/20/2021 18:56:41 - INFO - __main__ - Step 20580: {'lr': 0.00019994155537838055, 'samples': 658560, 'steps': 1286, 'loss/train': 1.6233174800872803} -09/20/2021 18:56:42 - INFO - __main__ - Step 20581: {'lr': 0.00019994155537838055, 'samples': 658592, 'steps': 1286, 'loss/train': 3.8067970275878906} -09/20/2021 18:56:43 - INFO - __main__ - Step 20582: {'lr': 0.00019994155537838055, 'samples': 658624, 'steps': 1286, 'loss/train': 2.4104347229003906} -09/20/2021 18:56:43 - INFO - __main__ - Step 20583: {'lr': 0.00019994155537838055, 'samples': 658656, 'steps': 1286, 'loss/train': 3.936821699142456} -09/20/2021 18:56:44 - INFO - __main__ - Step 20584: {'lr': 0.00019994155537838055, 'samples': 658688, 'steps': 1286, 'loss/train': 3.9003665447235107} -09/20/2021 18:56:45 - INFO - __main__ - Step 20585: {'lr': 0.00019994155537838055, 'samples': 658720, 'steps': 1286, 'loss/train': 3.21815824508667} -09/20/2021 18:56:46 - INFO - __main__ - Step 20586: {'lr': 0.00019994155537838055, 'samples': 658752, 'steps': 1286, 'loss/train': 3.740614175796509} -09/20/2021 18:56:46 - INFO - __main__ - Step 20587: {'lr': 0.00019994155537838055, 'samples': 658784, 'steps': 1286, 'loss/train': 3.26572847366333} -09/20/2021 18:56:47 - INFO - __main__ - Step 20588: {'lr': 0.00019994155537838055, 'samples': 658816, 'steps': 1286, 'loss/train': 3.97477126121521} -09/20/2021 18:56:48 - INFO - __main__ - Step 20589: {'lr': 0.00019994155537838055, 'samples': 658848, 'steps': 1286, 'loss/train': 3.4417710304260254} -09/20/2021 18:56:49 - INFO - __main__ - Step 20590: {'lr': 0.00019994155537838055, 'samples': 658880, 'steps': 1286, 'loss/train': 1.2910329103469849} -09/20/2021 18:56:49 - INFO - __main__ - Step 20591: {'lr': 0.00019994155537838055, 'samples': 658912, 'steps': 1286, 'loss/train': 3.55422306060791} -09/20/2021 18:56:50 - INFO - __main__ - Step 20592: {'lr': 0.00019994155537838055, 'samples': 658944, 'steps': 1286, 'loss/train': 4.2240519523620605} -09/20/2021 18:56:51 - INFO - __main__ - Step 20593: {'lr': 0.0001999413371193483, 'samples': 658976, 'steps': 1287, 'loss/train': 3.95440936088562} -09/20/2021 18:56:52 - INFO - __main__ - Step 20594: {'lr': 0.0001999413371193483, 'samples': 659008, 'steps': 1287, 'loss/train': 3.741682767868042} -09/20/2021 18:56:52 - INFO - __main__ - Step 20595: {'lr': 0.0001999413371193483, 'samples': 659040, 'steps': 1287, 'loss/train': 3.3776867389678955} -09/20/2021 18:56:53 - INFO - __main__ - Step 20596: {'lr': 0.0001999413371193483, 'samples': 659072, 'steps': 1287, 'loss/train': 2.5426976680755615} -09/20/2021 18:56:54 - INFO - __main__ - Step 20597: {'lr': 0.0001999413371193483, 'samples': 659104, 'steps': 1287, 'loss/train': 2.554497003555298} -09/20/2021 18:56:55 - INFO - __main__ - Step 20598: {'lr': 0.0001999413371193483, 'samples': 659136, 'steps': 1287, 'loss/train': 2.3933143615722656} -09/20/2021 18:56:55 - INFO - __main__ - Step 20599: {'lr': 0.0001999413371193483, 'samples': 659168, 'steps': 1287, 'loss/train': 2.622375726699829} -09/20/2021 18:56:56 - INFO - __main__ - Step 20600: {'lr': 0.0001999413371193483, 'samples': 659200, 'steps': 1287, 'loss/train': 2.8057446479797363} -09/20/2021 18:56:57 - INFO - __main__ - Step 20601: {'lr': 0.0001999413371193483, 'samples': 659232, 'steps': 1287, 'loss/train': 1.9963188171386719} -09/20/2021 18:56:58 - INFO - __main__ - Step 20602: {'lr': 0.0001999413371193483, 'samples': 659264, 'steps': 1287, 'loss/train': 2.5854220390319824} -09/20/2021 18:56:58 - INFO - __main__ - Step 20603: {'lr': 0.0001999413371193483, 'samples': 659296, 'steps': 1287, 'loss/train': 2.8215911388397217} -09/20/2021 18:56:59 - INFO - __main__ - Step 20604: {'lr': 0.0001999413371193483, 'samples': 659328, 'steps': 1287, 'loss/train': 2.9474539756774902} -09/20/2021 18:57:00 - INFO - __main__ - Step 20605: {'lr': 0.0001999413371193483, 'samples': 659360, 'steps': 1287, 'loss/train': 3.6347270011901855} -09/20/2021 18:57:01 - INFO - __main__ - Step 20606: {'lr': 0.0001999413371193483, 'samples': 659392, 'steps': 1287, 'loss/train': 1.3204022645950317} -09/20/2021 18:57:01 - INFO - __main__ - Step 20607: {'lr': 0.0001999413371193483, 'samples': 659424, 'steps': 1287, 'loss/train': 4.536813259124756} -09/20/2021 18:57:02 - INFO - __main__ - Step 20608: {'lr': 0.0001999413371193483, 'samples': 659456, 'steps': 1287, 'loss/train': 3.1755642890930176} -09/20/2021 18:57:03 - INFO - __main__ - Step 20609: {'lr': 0.00019994111845365514, 'samples': 659488, 'steps': 1288, 'loss/train': 3.6319305896759033} -09/20/2021 18:57:04 - INFO - __main__ - Step 20610: {'lr': 0.00019994111845365514, 'samples': 659520, 'steps': 1288, 'loss/train': 3.779430866241455} -09/20/2021 18:57:05 - INFO - __main__ - Step 20611: {'lr': 0.00019994111845365514, 'samples': 659552, 'steps': 1288, 'loss/train': 3.353745937347412} -09/20/2021 18:57:05 - INFO - __main__ - Step 20612: {'lr': 0.00019994111845365514, 'samples': 659584, 'steps': 1288, 'loss/train': 3.812506914138794} -09/20/2021 18:57:06 - INFO - __main__ - Step 20613: {'lr': 0.00019994111845365514, 'samples': 659616, 'steps': 1288, 'loss/train': 2.7914609909057617} -09/20/2021 18:57:07 - INFO - __main__ - Step 20614: {'lr': 0.00019994111845365514, 'samples': 659648, 'steps': 1288, 'loss/train': 4.824706554412842} -09/20/2021 18:57:08 - INFO - __main__ - Step 20615: {'lr': 0.00019994111845365514, 'samples': 659680, 'steps': 1288, 'loss/train': 4.293356895446777} -09/20/2021 18:57:09 - INFO - __main__ - Step 20616: {'lr': 0.00019994111845365514, 'samples': 659712, 'steps': 1288, 'loss/train': 3.15804386138916} -09/20/2021 18:57:10 - INFO - __main__ - Step 20617: {'lr': 0.00019994111845365514, 'samples': 659744, 'steps': 1288, 'loss/train': 3.82509708404541} -09/20/2021 18:57:11 - INFO - __main__ - Step 20618: {'lr': 0.00019994111845365514, 'samples': 659776, 'steps': 1288, 'loss/train': 3.677279233932495} -09/20/2021 18:57:11 - INFO - __main__ - Step 20619: {'lr': 0.00019994111845365514, 'samples': 659808, 'steps': 1288, 'loss/train': 2.400951385498047} -09/20/2021 18:57:12 - INFO - __main__ - Step 20620: {'lr': 0.00019994111845365514, 'samples': 659840, 'steps': 1288, 'loss/train': 3.931608200073242} -09/20/2021 18:57:13 - INFO - __main__ - Step 20621: {'lr': 0.00019994111845365514, 'samples': 659872, 'steps': 1288, 'loss/train': 3.805753707885742} -09/20/2021 18:57:14 - INFO - __main__ - Step 20622: {'lr': 0.00019994111845365514, 'samples': 659904, 'steps': 1288, 'loss/train': 1.7902504205703735} -09/20/2021 18:57:14 - INFO - __main__ - Step 20623: {'lr': 0.00019994111845365514, 'samples': 659936, 'steps': 1288, 'loss/train': 0.6210969090461731} -09/20/2021 18:57:15 - INFO - __main__ - Step 20624: {'lr': 0.00019994111845365514, 'samples': 659968, 'steps': 1288, 'loss/train': 0.4852842688560486} -09/20/2021 18:57:16 - INFO - __main__ - Step 20625: {'lr': 0.00019994089938130198, 'samples': 660000, 'steps': 1289, 'loss/train': 0.6640685796737671} -09/20/2021 18:57:17 - INFO - __main__ - Step 20626: {'lr': 0.00019994089938130198, 'samples': 660032, 'steps': 1289, 'loss/train': 3.8410604000091553} -09/20/2021 18:57:17 - INFO - __main__ - Step 20627: {'lr': 0.00019994089938130198, 'samples': 660064, 'steps': 1289, 'loss/train': 2.6696360111236572} -09/20/2021 18:57:18 - INFO - __main__ - Step 20628: {'lr': 0.00019994089938130198, 'samples': 660096, 'steps': 1289, 'loss/train': 3.6998226642608643} -09/20/2021 18:57:19 - INFO - __main__ - Step 20629: {'lr': 0.00019994089938130198, 'samples': 660128, 'steps': 1289, 'loss/train': 4.8616766929626465} -09/20/2021 18:57:20 - INFO - __main__ - Step 20630: {'lr': 0.00019994089938130198, 'samples': 660160, 'steps': 1289, 'loss/train': 2.8661916255950928} -09/20/2021 18:57:20 - INFO - __main__ - Step 20631: {'lr': 0.00019994089938130198, 'samples': 660192, 'steps': 1289, 'loss/train': 3.6232187747955322} -09/20/2021 18:57:21 - INFO - __main__ - Step 20632: {'lr': 0.00019994089938130198, 'samples': 660224, 'steps': 1289, 'loss/train': 4.456795692443848} -09/20/2021 18:57:22 - INFO - __main__ - Step 20633: {'lr': 0.00019994089938130198, 'samples': 660256, 'steps': 1289, 'loss/train': 3.675419330596924} -09/20/2021 18:57:23 - INFO - __main__ - Step 20634: {'lr': 0.00019994089938130198, 'samples': 660288, 'steps': 1289, 'loss/train': 3.4218244552612305} -09/20/2021 18:57:23 - INFO - __main__ - Step 20635: {'lr': 0.00019994089938130198, 'samples': 660320, 'steps': 1289, 'loss/train': 3.549910545349121} -09/20/2021 18:57:24 - INFO - __main__ - Step 20636: {'lr': 0.00019994089938130198, 'samples': 660352, 'steps': 1289, 'loss/train': 4.626173496246338} -09/20/2021 18:57:25 - INFO - __main__ - Step 20637: {'lr': 0.00019994089938130198, 'samples': 660384, 'steps': 1289, 'loss/train': 3.0101757049560547} -09/20/2021 18:57:26 - INFO - __main__ - Step 20638: {'lr': 0.00019994089938130198, 'samples': 660416, 'steps': 1289, 'loss/train': 3.491706132888794} -09/20/2021 18:57:26 - INFO - __main__ - Step 20639: {'lr': 0.00019994089938130198, 'samples': 660448, 'steps': 1289, 'loss/train': 2.45827579498291} -09/20/2021 18:57:27 - INFO - __main__ - Step 20640: {'lr': 0.00019994089938130198, 'samples': 660480, 'steps': 1289, 'loss/train': 4.621006011962891} -09/20/2021 18:57:28 - INFO - __main__ - Step 20641: {'lr': 0.00019994067990228967, 'samples': 660512, 'steps': 1290, 'loss/train': 4.5325117111206055} -09/20/2021 18:57:29 - INFO - __main__ - Step 20642: {'lr': 0.00019994067990228967, 'samples': 660544, 'steps': 1290, 'loss/train': 2.953472137451172} -09/20/2021 18:57:30 - INFO - __main__ - Step 20643: {'lr': 0.00019994067990228967, 'samples': 660576, 'steps': 1290, 'loss/train': 2.560704231262207} -09/20/2021 18:57:30 - INFO - __main__ - Step 20644: {'lr': 0.00019994067990228967, 'samples': 660608, 'steps': 1290, 'loss/train': 3.2677056789398193} -09/20/2021 18:57:31 - INFO - __main__ - Step 20645: {'lr': 0.00019994067990228967, 'samples': 660640, 'steps': 1290, 'loss/train': 4.15470027923584} -09/20/2021 18:57:32 - INFO - __main__ - Step 20646: {'lr': 0.00019994067990228967, 'samples': 660672, 'steps': 1290, 'loss/train': 2.81584095954895} -09/20/2021 18:57:33 - INFO - __main__ - Step 20647: {'lr': 0.00019994067990228967, 'samples': 660704, 'steps': 1290, 'loss/train': 4.711499214172363} -09/20/2021 18:57:34 - INFO - __main__ - Step 20648: {'lr': 0.00019994067990228967, 'samples': 660736, 'steps': 1290, 'loss/train': 3.5212111473083496} -09/20/2021 18:57:35 - INFO - __main__ - Step 20649: {'lr': 0.00019994067990228967, 'samples': 660768, 'steps': 1290, 'loss/train': 1.3485828638076782} -09/20/2021 18:57:35 - INFO - __main__ - Step 20650: {'lr': 0.00019994067990228967, 'samples': 660800, 'steps': 1290, 'loss/train': 2.611532211303711} -09/20/2021 18:57:36 - INFO - __main__ - Step 20651: {'lr': 0.00019994067990228967, 'samples': 660832, 'steps': 1290, 'loss/train': 3.7097997665405273} -09/20/2021 18:57:37 - INFO - __main__ - Step 20652: {'lr': 0.00019994067990228967, 'samples': 660864, 'steps': 1290, 'loss/train': 3.3705525398254395} -09/20/2021 18:57:38 - INFO - __main__ - Step 20653: {'lr': 0.00019994067990228967, 'samples': 660896, 'steps': 1290, 'loss/train': 2.469374418258667} -09/20/2021 18:57:38 - INFO - __main__ - Step 20654: {'lr': 0.00019994067990228967, 'samples': 660928, 'steps': 1290, 'loss/train': 3.872959613800049} -09/20/2021 18:57:39 - INFO - __main__ - Step 20655: {'lr': 0.00019994067990228967, 'samples': 660960, 'steps': 1290, 'loss/train': 2.7394323348999023} -09/20/2021 18:57:40 - INFO - __main__ - Step 20656: {'lr': 0.00019994067990228967, 'samples': 660992, 'steps': 1290, 'loss/train': 3.1153624057769775} -09/20/2021 18:57:41 - INFO - __main__ - Step 20657: {'lr': 0.00019994046001661913, 'samples': 661024, 'steps': 1291, 'loss/train': 3.7251501083374023} -09/20/2021 18:57:41 - INFO - __main__ - Step 20658: {'lr': 0.00019994046001661913, 'samples': 661056, 'steps': 1291, 'loss/train': 2.80987548828125} -09/20/2021 18:57:42 - INFO - __main__ - Step 20659: {'lr': 0.00019994046001661913, 'samples': 661088, 'steps': 1291, 'loss/train': 3.716696262359619} -09/20/2021 18:57:43 - INFO - __main__ - Step 20660: {'lr': 0.00019994046001661913, 'samples': 661120, 'steps': 1291, 'loss/train': 3.2701003551483154} -09/20/2021 18:57:44 - INFO - __main__ - Step 20661: {'lr': 0.00019994046001661913, 'samples': 661152, 'steps': 1291, 'loss/train': 3.595973491668701} -09/20/2021 18:57:44 - INFO - __main__ - Step 20662: {'lr': 0.00019994046001661913, 'samples': 661184, 'steps': 1291, 'loss/train': 4.259066581726074} -09/20/2021 18:57:45 - INFO - __main__ - Step 20663: {'lr': 0.00019994046001661913, 'samples': 661216, 'steps': 1291, 'loss/train': 2.892333507537842} -09/20/2021 18:57:46 - INFO - __main__ - Step 20664: {'lr': 0.00019994046001661913, 'samples': 661248, 'steps': 1291, 'loss/train': 3.296157121658325} -09/20/2021 18:57:47 - INFO - __main__ - Step 20665: {'lr': 0.00019994046001661913, 'samples': 661280, 'steps': 1291, 'loss/train': 4.020392894744873} -09/20/2021 18:57:47 - INFO - __main__ - Step 20666: {'lr': 0.00019994046001661913, 'samples': 661312, 'steps': 1291, 'loss/train': 2.787792444229126} -09/20/2021 18:57:48 - INFO - __main__ - Step 20667: {'lr': 0.00019994046001661913, 'samples': 661344, 'steps': 1291, 'loss/train': 3.508037805557251} -09/20/2021 18:57:49 - INFO - __main__ - Step 20668: {'lr': 0.00019994046001661913, 'samples': 661376, 'steps': 1291, 'loss/train': 3.215786933898926} -09/20/2021 18:57:50 - INFO - __main__ - Step 20669: {'lr': 0.00019994046001661913, 'samples': 661408, 'steps': 1291, 'loss/train': 3.270658493041992} -09/20/2021 18:57:50 - INFO - __main__ - Step 20670: {'lr': 0.00019994046001661913, 'samples': 661440, 'steps': 1291, 'loss/train': 3.2502474784851074} -09/20/2021 18:57:51 - INFO - __main__ - Step 20671: {'lr': 0.00019994046001661913, 'samples': 661472, 'steps': 1291, 'loss/train': 3.345592737197876} -09/20/2021 18:57:52 - INFO - __main__ - Step 20672: {'lr': 0.00019994046001661913, 'samples': 661504, 'steps': 1291, 'loss/train': 3.8297948837280273} -09/20/2021 18:57:53 - INFO - __main__ - Step 20673: {'lr': 0.00019994023972429124, 'samples': 661536, 'steps': 1292, 'loss/train': 3.571092128753662} -09/20/2021 18:57:54 - INFO - __main__ - Step 20674: {'lr': 0.00019994023972429124, 'samples': 661568, 'steps': 1292, 'loss/train': 3.931936740875244} -09/20/2021 18:57:54 - INFO - __main__ - Step 20675: {'lr': 0.00019994023972429124, 'samples': 661600, 'steps': 1292, 'loss/train': 4.212733268737793} -09/20/2021 18:57:55 - INFO - __main__ - Step 20676: {'lr': 0.00019994023972429124, 'samples': 661632, 'steps': 1292, 'loss/train': 2.644327163696289} -09/20/2021 18:57:56 - INFO - __main__ - Step 20677: {'lr': 0.00019994023972429124, 'samples': 661664, 'steps': 1292, 'loss/train': 2.9938275814056396} -09/20/2021 18:57:57 - INFO - __main__ - Step 20678: {'lr': 0.00019994023972429124, 'samples': 661696, 'steps': 1292, 'loss/train': 4.611509323120117} -09/20/2021 18:57:58 - INFO - __main__ - Step 20679: {'lr': 0.00019994023972429124, 'samples': 661728, 'steps': 1292, 'loss/train': 3.792001724243164} -09/20/2021 18:57:59 - INFO - __main__ - Step 20680: {'lr': 0.00019994023972429124, 'samples': 661760, 'steps': 1292, 'loss/train': 2.7430899143218994} -09/20/2021 18:57:59 - INFO - __main__ - Step 20681: {'lr': 0.00019994023972429124, 'samples': 661792, 'steps': 1292, 'loss/train': 2.747312307357788} -09/20/2021 18:58:00 - INFO - __main__ - Step 20682: {'lr': 0.00019994023972429124, 'samples': 661824, 'steps': 1292, 'loss/train': 3.436378240585327} -09/20/2021 18:58:01 - INFO - __main__ - Step 20683: {'lr': 0.00019994023972429124, 'samples': 661856, 'steps': 1292, 'loss/train': 3.103243112564087} -09/20/2021 18:58:02 - INFO - __main__ - Step 20684: {'lr': 0.00019994023972429124, 'samples': 661888, 'steps': 1292, 'loss/train': 0.9161670804023743} -09/20/2021 18:58:02 - INFO - __main__ - Step 20685: {'lr': 0.00019994023972429124, 'samples': 661920, 'steps': 1292, 'loss/train': 0.6544938683509827} -09/20/2021 18:58:03 - INFO - __main__ - Step 20686: {'lr': 0.00019994023972429124, 'samples': 661952, 'steps': 1292, 'loss/train': 0.7104054689407349} -09/20/2021 18:58:04 - INFO - __main__ - Step 20687: {'lr': 0.00019994023972429124, 'samples': 661984, 'steps': 1292, 'loss/train': 3.0292294025421143} -09/20/2021 18:58:05 - INFO - __main__ - Step 20688: {'lr': 0.00019994023972429124, 'samples': 662016, 'steps': 1292, 'loss/train': 3.300652265548706} -09/20/2021 18:58:06 - INFO - __main__ - Step 20689: {'lr': 0.0001999400190253069, 'samples': 662048, 'steps': 1293, 'loss/train': 3.778272867202759} -09/20/2021 18:58:06 - INFO - __main__ - Step 20690: {'lr': 0.0001999400190253069, 'samples': 662080, 'steps': 1293, 'loss/train': 2.9016923904418945} -09/20/2021 18:58:07 - INFO - __main__ - Step 20691: {'lr': 0.0001999400190253069, 'samples': 662112, 'steps': 1293, 'loss/train': 4.100912094116211} -09/20/2021 18:58:08 - INFO - __main__ - Step 20692: {'lr': 0.0001999400190253069, 'samples': 662144, 'steps': 1293, 'loss/train': 3.285403251647949} -09/20/2021 18:58:09 - INFO - __main__ - Step 20693: {'lr': 0.0001999400190253069, 'samples': 662176, 'steps': 1293, 'loss/train': 3.5488600730895996} -09/20/2021 18:58:09 - INFO - __main__ - Step 20694: {'lr': 0.0001999400190253069, 'samples': 662208, 'steps': 1293, 'loss/train': 3.1444804668426514} -09/20/2021 18:58:10 - INFO - __main__ - Step 20695: {'lr': 0.0001999400190253069, 'samples': 662240, 'steps': 1293, 'loss/train': 2.684987783432007} -09/20/2021 18:58:11 - INFO - __main__ - Step 20696: {'lr': 0.0001999400190253069, 'samples': 662272, 'steps': 1293, 'loss/train': 3.226670742034912} -09/20/2021 18:58:12 - INFO - __main__ - Step 20697: {'lr': 0.0001999400190253069, 'samples': 662304, 'steps': 1293, 'loss/train': 2.430206775665283} -09/20/2021 18:58:12 - INFO - __main__ - Step 20698: {'lr': 0.0001999400190253069, 'samples': 662336, 'steps': 1293, 'loss/train': 4.836493968963623} -09/20/2021 18:58:13 - INFO - __main__ - Step 20699: {'lr': 0.0001999400190253069, 'samples': 662368, 'steps': 1293, 'loss/train': 3.605781316757202} -09/20/2021 18:58:14 - INFO - __main__ - Step 20700: {'lr': 0.0001999400190253069, 'samples': 662400, 'steps': 1293, 'loss/train': 3.2776379585266113} -09/20/2021 18:58:15 - INFO - __main__ - Step 20701: {'lr': 0.0001999400190253069, 'samples': 662432, 'steps': 1293, 'loss/train': 2.5012922286987305} -09/20/2021 18:58:15 - INFO - __main__ - Step 20702: {'lr': 0.0001999400190253069, 'samples': 662464, 'steps': 1293, 'loss/train': 2.440957546234131} -09/20/2021 18:58:16 - INFO - __main__ - Step 20703: {'lr': 0.0001999400190253069, 'samples': 662496, 'steps': 1293, 'loss/train': 2.9445579051971436} -09/20/2021 18:58:17 - INFO - __main__ - Step 20704: {'lr': 0.0001999400190253069, 'samples': 662528, 'steps': 1293, 'loss/train': 3.3900601863861084} -09/20/2021 18:58:18 - INFO - __main__ - Step 20705: {'lr': 0.00019993979791966705, 'samples': 662560, 'steps': 1294, 'loss/train': 3.347012758255005} -09/20/2021 18:58:18 - INFO - __main__ - Step 20706: {'lr': 0.00019993979791966705, 'samples': 662592, 'steps': 1294, 'loss/train': 3.453899383544922} -09/20/2021 18:58:19 - INFO - __main__ - Step 20707: {'lr': 0.00019993979791966705, 'samples': 662624, 'steps': 1294, 'loss/train': 3.405447483062744} -09/20/2021 18:58:20 - INFO - __main__ - Step 20708: {'lr': 0.00019993979791966705, 'samples': 662656, 'steps': 1294, 'loss/train': 3.4034149646759033} -09/20/2021 18:58:22 - INFO - __main__ - Step 20709: {'lr': 0.00019993979791966705, 'samples': 662688, 'steps': 1294, 'loss/train': 3.2646689414978027} -09/20/2021 18:58:22 - INFO - __main__ - Step 20710: {'lr': 0.00019993979791966705, 'samples': 662720, 'steps': 1294, 'loss/train': 3.1041529178619385} -09/20/2021 18:58:23 - INFO - __main__ - Step 20711: {'lr': 0.00019993979791966705, 'samples': 662752, 'steps': 1294, 'loss/train': 3.3515625} -09/20/2021 18:58:24 - INFO - __main__ - Step 20712: {'lr': 0.00019993979791966705, 'samples': 662784, 'steps': 1294, 'loss/train': 3.27919340133667} -09/20/2021 18:58:25 - INFO - __main__ - Step 20713: {'lr': 0.00019993979791966705, 'samples': 662816, 'steps': 1294, 'loss/train': 1.5087733268737793} -09/20/2021 18:58:25 - INFO - __main__ - Step 20714: {'lr': 0.00019993979791966705, 'samples': 662848, 'steps': 1294, 'loss/train': 3.2581026554107666} -09/20/2021 18:58:26 - INFO - __main__ - Step 20715: {'lr': 0.00019993979791966705, 'samples': 662880, 'steps': 1294, 'loss/train': 3.0570003986358643} -09/20/2021 18:58:27 - INFO - __main__ - Step 20716: {'lr': 0.00019993979791966705, 'samples': 662912, 'steps': 1294, 'loss/train': 3.2644500732421875} -09/20/2021 18:58:28 - INFO - __main__ - Step 20717: {'lr': 0.00019993979791966705, 'samples': 662944, 'steps': 1294, 'loss/train': 3.0761289596557617} -09/20/2021 18:58:28 - INFO - __main__ - Step 20718: {'lr': 0.00019993979791966705, 'samples': 662976, 'steps': 1294, 'loss/train': 3.1957218647003174} -09/20/2021 18:58:29 - INFO - __main__ - Step 20719: {'lr': 0.00019993979791966705, 'samples': 663008, 'steps': 1294, 'loss/train': 3.0950376987457275} -09/20/2021 18:58:30 - INFO - __main__ - Step 20720: {'lr': 0.00019993979791966705, 'samples': 663040, 'steps': 1294, 'loss/train': 2.176036834716797} -09/20/2021 18:58:31 - INFO - __main__ - Step 20721: {'lr': 0.00019993957640737251, 'samples': 663072, 'steps': 1295, 'loss/train': 2.6002156734466553} -09/20/2021 18:58:32 - INFO - __main__ - Step 20722: {'lr': 0.00019993957640737251, 'samples': 663104, 'steps': 1295, 'loss/train': 3.248642683029175} -09/20/2021 18:58:32 - INFO - __main__ - Step 20723: {'lr': 0.00019993957640737251, 'samples': 663136, 'steps': 1295, 'loss/train': 2.9075088500976562} -09/20/2021 18:58:33 - INFO - __main__ - Step 20724: {'lr': 0.00019993957640737251, 'samples': 663168, 'steps': 1295, 'loss/train': 2.7895121574401855} -09/20/2021 18:58:34 - INFO - __main__ - Step 20725: {'lr': 0.00019993957640737251, 'samples': 663200, 'steps': 1295, 'loss/train': 4.081056594848633} -09/20/2021 18:58:35 - INFO - __main__ - Step 20726: {'lr': 0.00019993957640737251, 'samples': 663232, 'steps': 1295, 'loss/train': 3.528836488723755} -09/20/2021 18:58:35 - INFO - __main__ - Step 20727: {'lr': 0.00019993957640737251, 'samples': 663264, 'steps': 1295, 'loss/train': 4.094258785247803} -09/20/2021 18:58:36 - INFO - __main__ - Step 20728: {'lr': 0.00019993957640737251, 'samples': 663296, 'steps': 1295, 'loss/train': 3.242802619934082} -09/20/2021 18:58:37 - INFO - __main__ - Step 20729: {'lr': 0.00019993957640737251, 'samples': 663328, 'steps': 1295, 'loss/train': 3.4399428367614746} -09/20/2021 18:58:38 - INFO - __main__ - Step 20730: {'lr': 0.00019993957640737251, 'samples': 663360, 'steps': 1295, 'loss/train': 1.4277688264846802} -09/20/2021 18:58:38 - INFO - __main__ - Step 20731: {'lr': 0.00019993957640737251, 'samples': 663392, 'steps': 1295, 'loss/train': 2.9272663593292236} -09/20/2021 18:58:39 - INFO - __main__ - Step 20732: {'lr': 0.00019993957640737251, 'samples': 663424, 'steps': 1295, 'loss/train': 4.058457374572754} -09/20/2021 18:58:40 - INFO - __main__ - Step 20733: {'lr': 0.00019993957640737251, 'samples': 663456, 'steps': 1295, 'loss/train': 2.747875928878784} -09/20/2021 18:58:41 - INFO - __main__ - Step 20734: {'lr': 0.00019993957640737251, 'samples': 663488, 'steps': 1295, 'loss/train': 2.9188473224639893} -09/20/2021 18:58:41 - INFO - __main__ - Step 20735: {'lr': 0.00019993957640737251, 'samples': 663520, 'steps': 1295, 'loss/train': 3.695941686630249} -09/20/2021 18:58:42 - INFO - __main__ - Step 20736: {'lr': 0.00019993957640737251, 'samples': 663552, 'steps': 1295, 'loss/train': 3.1815924644470215} -09/20/2021 18:58:43 - INFO - __main__ - Step 20737: {'lr': 0.00019993935448842424, 'samples': 663584, 'steps': 1296, 'loss/train': 2.6388511657714844} -09/20/2021 18:58:44 - INFO - __main__ - Step 20738: {'lr': 0.00019993935448842424, 'samples': 663616, 'steps': 1296, 'loss/train': 3.464616298675537} -09/20/2021 18:58:44 - INFO - __main__ - Step 20739: {'lr': 0.00019993935448842424, 'samples': 663648, 'steps': 1296, 'loss/train': 1.7485284805297852} -09/20/2021 18:58:46 - INFO - __main__ - Step 20740: {'lr': 0.00019993935448842424, 'samples': 663680, 'steps': 1296, 'loss/train': 3.696925401687622} -09/20/2021 18:58:46 - INFO - __main__ - Step 20741: {'lr': 0.00019993935448842424, 'samples': 663712, 'steps': 1296, 'loss/train': 3.3348588943481445} -09/20/2021 18:58:47 - INFO - __main__ - Step 20742: {'lr': 0.00019993935448842424, 'samples': 663744, 'steps': 1296, 'loss/train': 3.091799259185791} -09/20/2021 18:58:48 - INFO - __main__ - Step 20743: {'lr': 0.00019993935448842424, 'samples': 663776, 'steps': 1296, 'loss/train': 3.6759724617004395} -09/20/2021 18:58:49 - INFO - __main__ - Step 20744: {'lr': 0.00019993935448842424, 'samples': 663808, 'steps': 1296, 'loss/train': 3.2460741996765137} -09/20/2021 18:58:49 - INFO - __main__ - Step 20745: {'lr': 0.00019993935448842424, 'samples': 663840, 'steps': 1296, 'loss/train': 2.9766411781311035} -09/20/2021 18:58:50 - INFO - __main__ - Step 20746: {'lr': 0.00019993935448842424, 'samples': 663872, 'steps': 1296, 'loss/train': 2.845590829849243} -09/20/2021 18:58:51 - INFO - __main__ - Step 20747: {'lr': 0.00019993935448842424, 'samples': 663904, 'steps': 1296, 'loss/train': 2.688203811645508} -09/20/2021 18:58:52 - INFO - __main__ - Step 20748: {'lr': 0.00019993935448842424, 'samples': 663936, 'steps': 1296, 'loss/train': 3.200901746749878} -09/20/2021 18:58:52 - INFO - __main__ - Step 20749: {'lr': 0.00019993935448842424, 'samples': 663968, 'steps': 1296, 'loss/train': 3.4494431018829346} -09/20/2021 18:58:53 - INFO - __main__ - Step 20750: {'lr': 0.00019993935448842424, 'samples': 664000, 'steps': 1296, 'loss/train': 4.397042274475098} -09/20/2021 18:58:54 - INFO - __main__ - Step 20751: {'lr': 0.00019993935448842424, 'samples': 664032, 'steps': 1296, 'loss/train': 3.2339346408843994} -09/20/2021 18:58:55 - INFO - __main__ - Step 20752: {'lr': 0.00019993935448842424, 'samples': 664064, 'steps': 1296, 'loss/train': 2.9766244888305664} -09/20/2021 18:58:56 - INFO - __main__ - Step 20753: {'lr': 0.00019993913216282308, 'samples': 664096, 'steps': 1297, 'loss/train': 3.299489974975586} -09/20/2021 18:58:56 - INFO - __main__ - Step 20754: {'lr': 0.00019993913216282308, 'samples': 664128, 'steps': 1297, 'loss/train': 3.84414005279541} -09/20/2021 18:58:57 - INFO - __main__ - Step 20755: {'lr': 0.00019993913216282308, 'samples': 664160, 'steps': 1297, 'loss/train': 3.8131539821624756} -09/20/2021 18:58:58 - INFO - __main__ - Step 20756: {'lr': 0.00019993913216282308, 'samples': 664192, 'steps': 1297, 'loss/train': 1.4893158674240112} -09/20/2021 18:58:59 - INFO - __main__ - Step 20757: {'lr': 0.00019993913216282308, 'samples': 664224, 'steps': 1297, 'loss/train': 3.127715587615967} -09/20/2021 18:58:59 - INFO - __main__ - Step 20758: {'lr': 0.00019993913216282308, 'samples': 664256, 'steps': 1297, 'loss/train': 3.556148052215576} -09/20/2021 18:59:00 - INFO - __main__ - Step 20759: {'lr': 0.00019993913216282308, 'samples': 664288, 'steps': 1297, 'loss/train': 3.084033250808716} -09/20/2021 18:59:01 - INFO - __main__ - Step 20760: {'lr': 0.00019993913216282308, 'samples': 664320, 'steps': 1297, 'loss/train': 3.832521438598633} -09/20/2021 18:59:02 - INFO - __main__ - Step 20761: {'lr': 0.00019993913216282308, 'samples': 664352, 'steps': 1297, 'loss/train': 2.8476412296295166} -09/20/2021 18:59:02 - INFO - __main__ - Step 20762: {'lr': 0.00019993913216282308, 'samples': 664384, 'steps': 1297, 'loss/train': 2.933306932449341} -09/20/2021 18:59:03 - INFO - __main__ - Step 20763: {'lr': 0.00019993913216282308, 'samples': 664416, 'steps': 1297, 'loss/train': 3.461711883544922} -09/20/2021 18:59:04 - INFO - __main__ - Step 20764: {'lr': 0.00019993913216282308, 'samples': 664448, 'steps': 1297, 'loss/train': 3.8368611335754395} -09/20/2021 18:59:05 - INFO - __main__ - Step 20765: {'lr': 0.00019993913216282308, 'samples': 664480, 'steps': 1297, 'loss/train': 1.6935492753982544} -09/20/2021 18:59:05 - INFO - __main__ - Step 20766: {'lr': 0.00019993913216282308, 'samples': 664512, 'steps': 1297, 'loss/train': 2.846377372741699} -09/20/2021 18:59:06 - INFO - __main__ - Step 20767: {'lr': 0.00019993913216282308, 'samples': 664544, 'steps': 1297, 'loss/train': 4.052434921264648} -09/20/2021 18:59:07 - INFO - __main__ - Step 20768: {'lr': 0.00019993913216282308, 'samples': 664576, 'steps': 1297, 'loss/train': 2.6800873279571533} -09/20/2021 18:59:08 - INFO - __main__ - Step 20769: {'lr': 0.00019993890943057, 'samples': 664608, 'steps': 1298, 'loss/train': 3.0517194271087646} -09/20/2021 18:59:09 - INFO - __main__ - Step 20770: {'lr': 0.00019993890943057, 'samples': 664640, 'steps': 1298, 'loss/train': 3.78452730178833} -09/20/2021 18:59:10 - INFO - __main__ - Step 20771: {'lr': 0.00019993890943057, 'samples': 664672, 'steps': 1298, 'loss/train': 4.028902053833008} -09/20/2021 18:59:11 - INFO - __main__ - Step 20772: {'lr': 0.00019993890943057, 'samples': 664704, 'steps': 1298, 'loss/train': 4.230624675750732} -09/20/2021 18:59:11 - INFO - __main__ - Step 20773: {'lr': 0.00019993890943057, 'samples': 664736, 'steps': 1298, 'loss/train': 3.1846234798431396} -09/20/2021 18:59:12 - INFO - __main__ - Step 20774: {'lr': 0.00019993890943057, 'samples': 664768, 'steps': 1298, 'loss/train': 4.622291564941406} -09/20/2021 18:59:13 - INFO - __main__ - Step 20775: {'lr': 0.00019993890943057, 'samples': 664800, 'steps': 1298, 'loss/train': 2.9587690830230713} -09/20/2021 18:59:14 - INFO - __main__ - Step 20776: {'lr': 0.00019993890943057, 'samples': 664832, 'steps': 1298, 'loss/train': 1.9596562385559082} -09/20/2021 18:59:14 - INFO - __main__ - Step 20777: {'lr': 0.00019993890943057, 'samples': 664864, 'steps': 1298, 'loss/train': 2.17220139503479} -09/20/2021 18:59:15 - INFO - __main__ - Step 20778: {'lr': 0.00019993890943057, 'samples': 664896, 'steps': 1298, 'loss/train': 1.9824299812316895} -09/20/2021 18:59:16 - INFO - __main__ - Step 20779: {'lr': 0.00019993890943057, 'samples': 664928, 'steps': 1298, 'loss/train': 2.773008108139038} -09/20/2021 18:59:17 - INFO - __main__ - Step 20780: {'lr': 0.00019993890943057, 'samples': 664960, 'steps': 1298, 'loss/train': 2.986450433731079} -09/20/2021 18:59:17 - INFO - __main__ - Step 20781: {'lr': 0.00019993890943057, 'samples': 664992, 'steps': 1298, 'loss/train': 4.128208637237549} -09/20/2021 18:59:18 - INFO - __main__ - Step 20782: {'lr': 0.00019993890943057, 'samples': 665024, 'steps': 1298, 'loss/train': 3.1770241260528564} -09/20/2021 18:59:19 - INFO - __main__ - Step 20783: {'lr': 0.00019993890943057, 'samples': 665056, 'steps': 1298, 'loss/train': 3.4793622493743896} -09/20/2021 18:59:20 - INFO - __main__ - Step 20784: {'lr': 0.00019993890943057, 'samples': 665088, 'steps': 1298, 'loss/train': 3.7547802925109863} -09/20/2021 18:59:21 - INFO - __main__ - Step 20785: {'lr': 0.00019993868629166592, 'samples': 665120, 'steps': 1299, 'loss/train': 3.2117867469787598} -09/20/2021 18:59:21 - INFO - __main__ - Step 20786: {'lr': 0.00019993868629166592, 'samples': 665152, 'steps': 1299, 'loss/train': 3.4371585845947266} -09/20/2021 18:59:22 - INFO - __main__ - Step 20787: {'lr': 0.00019993868629166592, 'samples': 665184, 'steps': 1299, 'loss/train': 2.9897806644439697} -09/20/2021 18:59:23 - INFO - __main__ - Step 20788: {'lr': 0.00019993868629166592, 'samples': 665216, 'steps': 1299, 'loss/train': 2.8309218883514404} -09/20/2021 18:59:24 - INFO - __main__ - Step 20789: {'lr': 0.00019993868629166592, 'samples': 665248, 'steps': 1299, 'loss/train': 3.261939764022827} -09/20/2021 18:59:24 - INFO - __main__ - Step 20790: {'lr': 0.00019993868629166592, 'samples': 665280, 'steps': 1299, 'loss/train': 4.501554012298584} -09/20/2021 18:59:25 - INFO - __main__ - Step 20791: {'lr': 0.00019993868629166592, 'samples': 665312, 'steps': 1299, 'loss/train': 4.273571968078613} -09/20/2021 18:59:26 - INFO - __main__ - Step 20792: {'lr': 0.00019993868629166592, 'samples': 665344, 'steps': 1299, 'loss/train': 4.311137676239014} -09/20/2021 18:59:27 - INFO - __main__ - Step 20793: {'lr': 0.00019993868629166592, 'samples': 665376, 'steps': 1299, 'loss/train': 4.139038562774658} -09/20/2021 18:59:27 - INFO - __main__ - Step 20794: {'lr': 0.00019993868629166592, 'samples': 665408, 'steps': 1299, 'loss/train': 2.6051831245422363} -09/20/2021 18:59:28 - INFO - __main__ - Step 20795: {'lr': 0.00019993868629166592, 'samples': 665440, 'steps': 1299, 'loss/train': 3.718970537185669} -09/20/2021 18:59:29 - INFO - __main__ - Step 20796: {'lr': 0.00019993868629166592, 'samples': 665472, 'steps': 1299, 'loss/train': 4.174264907836914} -09/20/2021 18:59:30 - INFO - __main__ - Step 20797: {'lr': 0.00019993868629166592, 'samples': 665504, 'steps': 1299, 'loss/train': 3.6724586486816406} -09/20/2021 18:59:30 - INFO - __main__ - Step 20798: {'lr': 0.00019993868629166592, 'samples': 665536, 'steps': 1299, 'loss/train': 3.8125722408294678} -09/20/2021 18:59:31 - INFO - __main__ - Step 20799: {'lr': 0.00019993868629166592, 'samples': 665568, 'steps': 1299, 'loss/train': 3.5705454349517822} -09/20/2021 18:59:32 - INFO - __main__ - Step 20800: {'lr': 0.00019993868629166592, 'samples': 665600, 'steps': 1299, 'loss/train': 2.137866973876953} -09/20/2021 18:59:33 - INFO - __main__ - Step 20801: {'lr': 0.0001999384627461117, 'samples': 665632, 'steps': 1300, 'loss/train': 3.3562097549438477} -09/20/2021 18:59:34 - INFO - __main__ - Step 20802: {'lr': 0.0001999384627461117, 'samples': 665664, 'steps': 1300, 'loss/train': 3.209632635116577} -09/20/2021 18:59:35 - INFO - __main__ - Step 20803: {'lr': 0.0001999384627461117, 'samples': 665696, 'steps': 1300, 'loss/train': 3.4329686164855957} -09/20/2021 18:59:36 - INFO - __main__ - Step 20804: {'lr': 0.0001999384627461117, 'samples': 665728, 'steps': 1300, 'loss/train': 3.7571799755096436} -09/20/2021 18:59:36 - INFO - __main__ - Step 20805: {'lr': 0.0001999384627461117, 'samples': 665760, 'steps': 1300, 'loss/train': 2.9109084606170654} -09/20/2021 18:59:37 - INFO - __main__ - Step 20806: {'lr': 0.0001999384627461117, 'samples': 665792, 'steps': 1300, 'loss/train': 3.50338077545166} -09/20/2021 18:59:38 - INFO - __main__ - Step 20807: {'lr': 0.0001999384627461117, 'samples': 665824, 'steps': 1300, 'loss/train': 3.100682020187378} -09/20/2021 18:59:39 - INFO - __main__ - Step 20808: {'lr': 0.0001999384627461117, 'samples': 665856, 'steps': 1300, 'loss/train': 3.0387423038482666} -09/20/2021 18:59:39 - INFO - __main__ - Step 20809: {'lr': 0.0001999384627461117, 'samples': 665888, 'steps': 1300, 'loss/train': 3.534461498260498} -09/20/2021 18:59:40 - INFO - __main__ - Step 20810: {'lr': 0.0001999384627461117, 'samples': 665920, 'steps': 1300, 'loss/train': 2.980619430541992} -09/20/2021 18:59:41 - INFO - __main__ - Step 20811: {'lr': 0.0001999384627461117, 'samples': 665952, 'steps': 1300, 'loss/train': 2.7888810634613037} -09/20/2021 18:59:42 - INFO - __main__ - Step 20812: {'lr': 0.0001999384627461117, 'samples': 665984, 'steps': 1300, 'loss/train': 2.7797038555145264} -09/20/2021 18:59:42 - INFO - __main__ - Step 20813: {'lr': 0.0001999384627461117, 'samples': 666016, 'steps': 1300, 'loss/train': 3.7282445430755615} -09/20/2021 18:59:43 - INFO - __main__ - Step 20814: {'lr': 0.0001999384627461117, 'samples': 666048, 'steps': 1300, 'loss/train': 3.486619234085083} -09/20/2021 18:59:44 - INFO - __main__ - Step 20815: {'lr': 0.0001999384627461117, 'samples': 666080, 'steps': 1300, 'loss/train': 3.795217275619507} -09/20/2021 18:59:45 - INFO - __main__ - Step 20816: {'lr': 0.0001999384627461117, 'samples': 666112, 'steps': 1300, 'loss/train': 3.128039836883545} -09/20/2021 18:59:46 - INFO - __main__ - Step 20817: {'lr': 0.00019993823879390824, 'samples': 666144, 'steps': 1301, 'loss/train': 3.78134822845459} -09/20/2021 18:59:46 - INFO - __main__ - Step 20818: {'lr': 0.00019993823879390824, 'samples': 666176, 'steps': 1301, 'loss/train': 3.6962027549743652} -09/20/2021 18:59:47 - INFO - __main__ - Step 20819: {'lr': 0.00019993823879390824, 'samples': 666208, 'steps': 1301, 'loss/train': 2.6213324069976807} -09/20/2021 18:59:48 - INFO - __main__ - Step 20820: {'lr': 0.00019993823879390824, 'samples': 666240, 'steps': 1301, 'loss/train': 3.805527687072754} -09/20/2021 18:59:48 - INFO - __main__ - Step 20821: {'lr': 0.00019993823879390824, 'samples': 666272, 'steps': 1301, 'loss/train': 2.949708938598633} -09/20/2021 18:59:49 - INFO - __main__ - Step 20822: {'lr': 0.00019993823879390824, 'samples': 666304, 'steps': 1301, 'loss/train': 2.5203263759613037} -09/20/2021 18:59:50 - INFO - __main__ - Step 20823: {'lr': 0.00019993823879390824, 'samples': 666336, 'steps': 1301, 'loss/train': 4.029639720916748} -09/20/2021 18:59:51 - INFO - __main__ - Step 20824: {'lr': 0.00019993823879390824, 'samples': 666368, 'steps': 1301, 'loss/train': 4.422469615936279} -09/20/2021 18:59:52 - INFO - __main__ - Step 20825: {'lr': 0.00019993823879390824, 'samples': 666400, 'steps': 1301, 'loss/train': 3.996382236480713} -09/20/2021 18:59:52 - INFO - __main__ - Step 20826: {'lr': 0.00019993823879390824, 'samples': 666432, 'steps': 1301, 'loss/train': 4.09302282333374} -09/20/2021 18:59:53 - INFO - __main__ - Step 20827: {'lr': 0.00019993823879390824, 'samples': 666464, 'steps': 1301, 'loss/train': 4.148639678955078} -09/20/2021 18:59:54 - INFO - __main__ - Step 20828: {'lr': 0.00019993823879390824, 'samples': 666496, 'steps': 1301, 'loss/train': 3.1606671810150146} -09/20/2021 18:59:55 - INFO - __main__ - Step 20829: {'lr': 0.00019993823879390824, 'samples': 666528, 'steps': 1301, 'loss/train': 3.5097179412841797} -09/20/2021 18:59:55 - INFO - __main__ - Step 20830: {'lr': 0.00019993823879390824, 'samples': 666560, 'steps': 1301, 'loss/train': 3.3262202739715576} -09/20/2021 18:59:56 - INFO - __main__ - Step 20831: {'lr': 0.00019993823879390824, 'samples': 666592, 'steps': 1301, 'loss/train': 3.636918067932129} -09/20/2021 18:59:57 - INFO - __main__ - Step 20832: {'lr': 0.00019993823879390824, 'samples': 666624, 'steps': 1301, 'loss/train': 3.887061834335327} -09/20/2021 18:59:58 - INFO - __main__ - Step 20833: {'lr': 0.00019993801443505649, 'samples': 666656, 'steps': 1302, 'loss/train': 2.9797205924987793} -09/20/2021 18:59:59 - INFO - __main__ - Step 20834: {'lr': 0.00019993801443505649, 'samples': 666688, 'steps': 1302, 'loss/train': 2.9340569972991943} -09/20/2021 19:00:00 - INFO - __main__ - Step 20835: {'lr': 0.00019993801443505649, 'samples': 666720, 'steps': 1302, 'loss/train': 3.1719493865966797} -09/20/2021 19:00:00 - INFO - __main__ - Step 20836: {'lr': 0.00019993801443505649, 'samples': 666752, 'steps': 1302, 'loss/train': 3.2218668460845947} -09/20/2021 19:00:01 - INFO - __main__ - Step 20837: {'lr': 0.00019993801443505649, 'samples': 666784, 'steps': 1302, 'loss/train': 2.9538121223449707} -09/20/2021 19:00:02 - INFO - __main__ - Step 20838: {'lr': 0.00019993801443505649, 'samples': 666816, 'steps': 1302, 'loss/train': 3.2591986656188965} -09/20/2021 19:00:03 - INFO - __main__ - Step 20839: {'lr': 0.00019993801443505649, 'samples': 666848, 'steps': 1302, 'loss/train': 3.338367462158203} -09/20/2021 19:00:03 - INFO - __main__ - Step 20840: {'lr': 0.00019993801443505649, 'samples': 666880, 'steps': 1302, 'loss/train': 2.954267740249634} -09/20/2021 19:00:04 - INFO - __main__ - Step 20841: {'lr': 0.00019993801443505649, 'samples': 666912, 'steps': 1302, 'loss/train': 3.1584560871124268} -09/20/2021 19:00:05 - INFO - __main__ - Step 20842: {'lr': 0.00019993801443505649, 'samples': 666944, 'steps': 1302, 'loss/train': 0.7979240417480469} -09/20/2021 19:00:06 - INFO - __main__ - Step 20843: {'lr': 0.00019993801443505649, 'samples': 666976, 'steps': 1302, 'loss/train': 0.9678334593772888} -09/20/2021 19:00:06 - INFO - __main__ - Step 20844: {'lr': 0.00019993801443505649, 'samples': 667008, 'steps': 1302, 'loss/train': 2.809671401977539} -09/20/2021 19:00:07 - INFO - __main__ - Step 20845: {'lr': 0.00019993801443505649, 'samples': 667040, 'steps': 1302, 'loss/train': 3.110553741455078} -09/20/2021 19:00:08 - INFO - __main__ - Step 20846: {'lr': 0.00019993801443505649, 'samples': 667072, 'steps': 1302, 'loss/train': 3.416322708129883} -09/20/2021 19:00:09 - INFO - __main__ - Step 20847: {'lr': 0.00019993801443505649, 'samples': 667104, 'steps': 1302, 'loss/train': 3.0219101905822754} -09/20/2021 19:00:09 - INFO - __main__ - Step 20848: {'lr': 0.00019993801443505649, 'samples': 667136, 'steps': 1302, 'loss/train': 4.219687461853027} -09/20/2021 19:00:10 - INFO - __main__ - Step 20849: {'lr': 0.00019993778966955733, 'samples': 667168, 'steps': 1303, 'loss/train': 2.8694143295288086} -09/20/2021 19:00:11 - INFO - __main__ - Step 20850: {'lr': 0.00019993778966955733, 'samples': 667200, 'steps': 1303, 'loss/train': 3.9261696338653564} -09/20/2021 19:00:12 - INFO - __main__ - Step 20851: {'lr': 0.00019993778966955733, 'samples': 667232, 'steps': 1303, 'loss/train': 3.8579704761505127} -09/20/2021 19:00:13 - INFO - __main__ - Step 20852: {'lr': 0.00019993778966955733, 'samples': 667264, 'steps': 1303, 'loss/train': 2.734294891357422} -09/20/2021 19:00:13 - INFO - __main__ - Step 20853: {'lr': 0.00019993778966955733, 'samples': 667296, 'steps': 1303, 'loss/train': 3.940119981765747} -09/20/2021 19:00:14 - INFO - __main__ - Step 20854: {'lr': 0.00019993778966955733, 'samples': 667328, 'steps': 1303, 'loss/train': 4.559122085571289} -09/20/2021 19:00:15 - INFO - __main__ - Step 20855: {'lr': 0.00019993778966955733, 'samples': 667360, 'steps': 1303, 'loss/train': 4.353521347045898} -09/20/2021 19:00:16 - INFO - __main__ - Step 20856: {'lr': 0.00019993778966955733, 'samples': 667392, 'steps': 1303, 'loss/train': 4.074213981628418} -09/20/2021 19:00:16 - INFO - __main__ - Step 20857: {'lr': 0.00019993778966955733, 'samples': 667424, 'steps': 1303, 'loss/train': 3.1458070278167725} -09/20/2021 19:00:17 - INFO - __main__ - Step 20858: {'lr': 0.00019993778966955733, 'samples': 667456, 'steps': 1303, 'loss/train': 4.309872150421143} -09/20/2021 19:00:18 - INFO - __main__ - Step 20859: {'lr': 0.00019993778966955733, 'samples': 667488, 'steps': 1303, 'loss/train': 3.1104230880737305} -09/20/2021 19:00:19 - INFO - __main__ - Step 20860: {'lr': 0.00019993778966955733, 'samples': 667520, 'steps': 1303, 'loss/train': 3.048313617706299} -09/20/2021 19:00:19 - INFO - __main__ - Step 20861: {'lr': 0.00019993778966955733, 'samples': 667552, 'steps': 1303, 'loss/train': 2.9640355110168457} -09/20/2021 19:00:20 - INFO - __main__ - Step 20862: {'lr': 0.00019993778966955733, 'samples': 667584, 'steps': 1303, 'loss/train': 3.6917529106140137} -09/20/2021 19:00:21 - INFO - __main__ - Step 20863: {'lr': 0.00019993778966955733, 'samples': 667616, 'steps': 1303, 'loss/train': 3.5967774391174316} -09/20/2021 19:00:22 - INFO - __main__ - Step 20864: {'lr': 0.00019993778966955733, 'samples': 667648, 'steps': 1303, 'loss/train': 2.3164217472076416} -09/20/2021 19:00:23 - INFO - __main__ - Step 20865: {'lr': 0.00019993756449741173, 'samples': 667680, 'steps': 1304, 'loss/train': 3.1468193531036377} -09/20/2021 19:00:24 - INFO - __main__ - Step 20866: {'lr': 0.00019993756449741173, 'samples': 667712, 'steps': 1304, 'loss/train': 3.0752034187316895} -09/20/2021 19:00:24 - INFO - __main__ - Step 20867: {'lr': 0.00019993756449741173, 'samples': 667744, 'steps': 1304, 'loss/train': 3.301811933517456} -09/20/2021 19:00:25 - INFO - __main__ - Step 20868: {'lr': 0.00019993756449741173, 'samples': 667776, 'steps': 1304, 'loss/train': 3.735921859741211} -09/20/2021 19:00:26 - INFO - __main__ - Step 20869: {'lr': 0.00019993756449741173, 'samples': 667808, 'steps': 1304, 'loss/train': 2.9353203773498535} -09/20/2021 19:00:27 - INFO - __main__ - Step 20870: {'lr': 0.00019993756449741173, 'samples': 667840, 'steps': 1304, 'loss/train': 2.930079460144043} -09/20/2021 19:00:27 - INFO - __main__ - Step 20871: {'lr': 0.00019993756449741173, 'samples': 667872, 'steps': 1304, 'loss/train': 3.13472318649292} -09/20/2021 19:00:28 - INFO - __main__ - Step 20872: {'lr': 0.00019993756449741173, 'samples': 667904, 'steps': 1304, 'loss/train': 3.3342628479003906} -09/20/2021 19:00:29 - INFO - __main__ - Step 20873: {'lr': 0.00019993756449741173, 'samples': 667936, 'steps': 1304, 'loss/train': 4.0616888999938965} -09/20/2021 19:00:30 - INFO - __main__ - Step 20874: {'lr': 0.00019993756449741173, 'samples': 667968, 'steps': 1304, 'loss/train': 4.4755096435546875} -09/20/2021 19:00:30 - INFO - __main__ - Step 20875: {'lr': 0.00019993756449741173, 'samples': 668000, 'steps': 1304, 'loss/train': 3.433462619781494} -09/20/2021 19:00:31 - INFO - __main__ - Step 20876: {'lr': 0.00019993756449741173, 'samples': 668032, 'steps': 1304, 'loss/train': 3.472163438796997} -09/20/2021 19:00:32 - INFO - __main__ - Step 20877: {'lr': 0.00019993756449741173, 'samples': 668064, 'steps': 1304, 'loss/train': 3.3397161960601807} -09/20/2021 19:00:33 - INFO - __main__ - Step 20878: {'lr': 0.00019993756449741173, 'samples': 668096, 'steps': 1304, 'loss/train': 2.0762991905212402} -09/20/2021 19:00:33 - INFO - __main__ - Step 20879: {'lr': 0.00019993756449741173, 'samples': 668128, 'steps': 1304, 'loss/train': 4.230908393859863} -09/20/2021 19:00:34 - INFO - __main__ - Step 20880: {'lr': 0.00019993756449741173, 'samples': 668160, 'steps': 1304, 'loss/train': 2.713266134262085} -09/20/2021 19:00:35 - INFO - __main__ - Step 20881: {'lr': 0.00019993733891862054, 'samples': 668192, 'steps': 1305, 'loss/train': 2.630070209503174} -09/20/2021 19:00:36 - INFO - __main__ - Step 20882: {'lr': 0.00019993733891862054, 'samples': 668224, 'steps': 1305, 'loss/train': 3.638662576675415} -09/20/2021 19:00:37 - INFO - __main__ - Step 20883: {'lr': 0.00019993733891862054, 'samples': 668256, 'steps': 1305, 'loss/train': 3.201563835144043} -09/20/2021 19:00:37 - INFO - __main__ - Step 20884: {'lr': 0.00019993733891862054, 'samples': 668288, 'steps': 1305, 'loss/train': 4.178768157958984} -09/20/2021 19:00:38 - INFO - __main__ - Step 20885: {'lr': 0.00019993733891862054, 'samples': 668320, 'steps': 1305, 'loss/train': 2.702894449234009} -09/20/2021 19:00:39 - INFO - __main__ - Step 20886: {'lr': 0.00019993733891862054, 'samples': 668352, 'steps': 1305, 'loss/train': 4.435386657714844} -09/20/2021 19:00:40 - INFO - __main__ - Step 20887: {'lr': 0.00019993733891862054, 'samples': 668384, 'steps': 1305, 'loss/train': 3.775216579437256} -09/20/2021 19:00:40 - INFO - __main__ - Step 20888: {'lr': 0.00019993733891862054, 'samples': 668416, 'steps': 1305, 'loss/train': 2.7204604148864746} -09/20/2021 19:00:41 - INFO - __main__ - Step 20889: {'lr': 0.00019993733891862054, 'samples': 668448, 'steps': 1305, 'loss/train': 3.998824119567871} -09/20/2021 19:00:42 - INFO - __main__ - Step 20890: {'lr': 0.00019993733891862054, 'samples': 668480, 'steps': 1305, 'loss/train': 3.0183897018432617} -09/20/2021 19:00:43 - INFO - __main__ - Step 20891: {'lr': 0.00019993733891862054, 'samples': 668512, 'steps': 1305, 'loss/train': 2.382565975189209} -09/20/2021 19:00:43 - INFO - __main__ - Step 20892: {'lr': 0.00019993733891862054, 'samples': 668544, 'steps': 1305, 'loss/train': 2.851501703262329} -09/20/2021 19:00:45 - INFO - __main__ - Step 20893: {'lr': 0.00019993733891862054, 'samples': 668576, 'steps': 1305, 'loss/train': 3.115821123123169} -09/20/2021 19:00:45 - INFO - __main__ - Step 20894: {'lr': 0.00019993733891862054, 'samples': 668608, 'steps': 1305, 'loss/train': 3.401210069656372} -09/20/2021 19:00:46 - INFO - __main__ - Step 20895: {'lr': 0.00019993733891862054, 'samples': 668640, 'steps': 1305, 'loss/train': 2.4890096187591553} -09/20/2021 19:00:47 - INFO - __main__ - Step 20896: {'lr': 0.00019993733891862054, 'samples': 668672, 'steps': 1305, 'loss/train': 3.784902811050415} -09/20/2021 19:00:48 - INFO - __main__ - Step 20897: {'lr': 0.00019993711293318472, 'samples': 668704, 'steps': 1306, 'loss/train': 2.6090755462646484} -09/20/2021 19:00:48 - INFO - __main__ - Step 20898: {'lr': 0.00019993711293318472, 'samples': 668736, 'steps': 1306, 'loss/train': 3.0485482215881348} -09/20/2021 19:00:49 - INFO - __main__ - Step 20899: {'lr': 0.00019993711293318472, 'samples': 668768, 'steps': 1306, 'loss/train': 2.8218884468078613} -09/20/2021 19:00:50 - INFO - __main__ - Step 20900: {'lr': 0.00019993711293318472, 'samples': 668800, 'steps': 1306, 'loss/train': 2.29518723487854} -09/20/2021 19:00:51 - INFO - __main__ - Step 20901: {'lr': 0.00019993711293318472, 'samples': 668832, 'steps': 1306, 'loss/train': 2.6071696281433105} -09/20/2021 19:00:51 - INFO - __main__ - Step 20902: {'lr': 0.00019993711293318472, 'samples': 668864, 'steps': 1306, 'loss/train': 3.0523033142089844} -09/20/2021 19:00:52 - INFO - __main__ - Step 20903: {'lr': 0.00019993711293318472, 'samples': 668896, 'steps': 1306, 'loss/train': 3.469203472137451} -09/20/2021 19:00:53 - INFO - __main__ - Step 20904: {'lr': 0.00019993711293318472, 'samples': 668928, 'steps': 1306, 'loss/train': 2.8517587184906006} -09/20/2021 19:00:54 - INFO - __main__ - Step 20905: {'lr': 0.00019993711293318472, 'samples': 668960, 'steps': 1306, 'loss/train': 3.57867693901062} -09/20/2021 19:00:54 - INFO - __main__ - Step 20906: {'lr': 0.00019993711293318472, 'samples': 668992, 'steps': 1306, 'loss/train': 3.184284210205078} -09/20/2021 19:00:55 - INFO - __main__ - Step 20907: {'lr': 0.00019993711293318472, 'samples': 669024, 'steps': 1306, 'loss/train': 2.884460926055908} -09/20/2021 19:00:56 - INFO - __main__ - Step 20908: {'lr': 0.00019993711293318472, 'samples': 669056, 'steps': 1306, 'loss/train': 2.863558530807495} -09/20/2021 19:00:57 - INFO - __main__ - Step 20909: {'lr': 0.00019993711293318472, 'samples': 669088, 'steps': 1306, 'loss/train': 4.346446990966797} -09/20/2021 19:00:57 - INFO - __main__ - Step 20910: {'lr': 0.00019993711293318472, 'samples': 669120, 'steps': 1306, 'loss/train': 5.779201507568359} -09/20/2021 19:00:58 - INFO - __main__ - Step 20911: {'lr': 0.00019993711293318472, 'samples': 669152, 'steps': 1306, 'loss/train': 3.3322222232818604} -09/20/2021 19:00:59 - INFO - __main__ - Step 20912: {'lr': 0.00019993711293318472, 'samples': 669184, 'steps': 1306, 'loss/train': 3.1179587841033936} -09/20/2021 19:01:00 - INFO - __main__ - Step 20913: {'lr': 0.00019993688654110515, 'samples': 669216, 'steps': 1307, 'loss/train': 4.127814292907715} -09/20/2021 19:01:01 - INFO - __main__ - Step 20914: {'lr': 0.00019993688654110515, 'samples': 669248, 'steps': 1307, 'loss/train': 5.003244400024414} -09/20/2021 19:01:01 - INFO - __main__ - Step 20915: {'lr': 0.00019993688654110515, 'samples': 669280, 'steps': 1307, 'loss/train': 3.72694730758667} -09/20/2021 19:01:02 - INFO - __main__ - Step 20916: {'lr': 0.00019993688654110515, 'samples': 669312, 'steps': 1307, 'loss/train': 3.4438419342041016} -09/20/2021 19:01:03 - INFO - __main__ - Step 20917: {'lr': 0.00019993688654110515, 'samples': 669344, 'steps': 1307, 'loss/train': 1.670326590538025} -09/20/2021 19:01:04 - INFO - __main__ - Step 20918: {'lr': 0.00019993688654110515, 'samples': 669376, 'steps': 1307, 'loss/train': 3.208245038986206} -09/20/2021 19:01:04 - INFO - __main__ - Step 20919: {'lr': 0.00019993688654110515, 'samples': 669408, 'steps': 1307, 'loss/train': 4.8425445556640625} -09/20/2021 19:01:05 - INFO - __main__ - Step 20920: {'lr': 0.00019993688654110515, 'samples': 669440, 'steps': 1307, 'loss/train': 3.3008499145507812} -09/20/2021 19:01:06 - INFO - __main__ - Step 20921: {'lr': 0.00019993688654110515, 'samples': 669472, 'steps': 1307, 'loss/train': 4.835867404937744} -09/20/2021 19:01:07 - INFO - __main__ - Step 20922: {'lr': 0.00019993688654110515, 'samples': 669504, 'steps': 1307, 'loss/train': 2.929328680038452} -09/20/2021 19:01:07 - INFO - __main__ - Step 20923: {'lr': 0.00019993688654110515, 'samples': 669536, 'steps': 1307, 'loss/train': 2.597768545150757} -09/20/2021 19:01:09 - INFO - __main__ - Step 20924: {'lr': 0.00019993688654110515, 'samples': 669568, 'steps': 1307, 'loss/train': 3.860976219177246} -09/20/2021 19:01:09 - INFO - __main__ - Step 20925: {'lr': 0.00019993688654110515, 'samples': 669600, 'steps': 1307, 'loss/train': 0.9385666847229004} -09/20/2021 19:01:10 - INFO - __main__ - Step 20926: {'lr': 0.00019993688654110515, 'samples': 669632, 'steps': 1307, 'loss/train': 3.4326794147491455} -09/20/2021 19:01:11 - INFO - __main__ - Step 20927: {'lr': 0.00019993688654110515, 'samples': 669664, 'steps': 1307, 'loss/train': 3.6346428394317627} -09/20/2021 19:01:12 - INFO - __main__ - Step 20928: {'lr': 0.00019993688654110515, 'samples': 669696, 'steps': 1307, 'loss/train': 2.9676272869110107} -09/20/2021 19:01:12 - INFO - __main__ - Step 20929: {'lr': 0.0001999366597423828, 'samples': 669728, 'steps': 1308, 'loss/train': 3.7545619010925293} -09/20/2021 19:01:13 - INFO - __main__ - Step 20930: {'lr': 0.0001999366597423828, 'samples': 669760, 'steps': 1308, 'loss/train': 3.1256914138793945} -09/20/2021 19:01:14 - INFO - __main__ - Step 20931: {'lr': 0.0001999366597423828, 'samples': 669792, 'steps': 1308, 'loss/train': 3.4846599102020264} -09/20/2021 19:01:15 - INFO - __main__ - Step 20932: {'lr': 0.0001999366597423828, 'samples': 669824, 'steps': 1308, 'loss/train': 3.67231822013855} -09/20/2021 19:01:15 - INFO - __main__ - Step 20933: {'lr': 0.0001999366597423828, 'samples': 669856, 'steps': 1308, 'loss/train': 2.0715534687042236} -09/20/2021 19:01:16 - INFO - __main__ - Step 20934: {'lr': 0.0001999366597423828, 'samples': 669888, 'steps': 1308, 'loss/train': 2.6770291328430176} -09/20/2021 19:01:17 - INFO - __main__ - Step 20935: {'lr': 0.0001999366597423828, 'samples': 669920, 'steps': 1308, 'loss/train': 2.896286725997925} -09/20/2021 19:01:18 - INFO - __main__ - Step 20936: {'lr': 0.0001999366597423828, 'samples': 669952, 'steps': 1308, 'loss/train': 3.2026405334472656} -09/20/2021 19:01:18 - INFO - __main__ - Step 20937: {'lr': 0.0001999366597423828, 'samples': 669984, 'steps': 1308, 'loss/train': 3.4478423595428467} -09/20/2021 19:01:19 - INFO - __main__ - Step 20938: {'lr': 0.0001999366597423828, 'samples': 670016, 'steps': 1308, 'loss/train': 3.337740182876587} -09/20/2021 19:01:20 - INFO - __main__ - Step 20939: {'lr': 0.0001999366597423828, 'samples': 670048, 'steps': 1308, 'loss/train': 2.373408794403076} -09/20/2021 19:01:21 - INFO - __main__ - Step 20940: {'lr': 0.0001999366597423828, 'samples': 670080, 'steps': 1308, 'loss/train': 3.6593220233917236} -09/20/2021 19:01:21 - INFO - __main__ - Step 20941: {'lr': 0.0001999366597423828, 'samples': 670112, 'steps': 1308, 'loss/train': 2.766115665435791} -09/20/2021 19:01:22 - INFO - __main__ - Step 20942: {'lr': 0.0001999366597423828, 'samples': 670144, 'steps': 1308, 'loss/train': 2.874709129333496} -09/20/2021 19:01:23 - INFO - __main__ - Step 20943: {'lr': 0.0001999366597423828, 'samples': 670176, 'steps': 1308, 'loss/train': 3.9422295093536377} -09/20/2021 19:01:24 - INFO - __main__ - Step 20944: {'lr': 0.0001999366597423828, 'samples': 670208, 'steps': 1308, 'loss/train': 2.8130524158477783} -09/20/2021 19:01:25 - INFO - __main__ - Step 20945: {'lr': 0.00019993643253701858, 'samples': 670240, 'steps': 1309, 'loss/train': 2.6707839965820312} -09/20/2021 19:01:25 - INFO - __main__ - Step 20946: {'lr': 0.00019993643253701858, 'samples': 670272, 'steps': 1309, 'loss/train': 3.7155587673187256} -09/20/2021 19:01:26 - INFO - __main__ - Step 20947: {'lr': 0.00019993643253701858, 'samples': 670304, 'steps': 1309, 'loss/train': 4.134966850280762} -09/20/2021 19:01:27 - INFO - __main__ - Step 20948: {'lr': 0.00019993643253701858, 'samples': 670336, 'steps': 1309, 'loss/train': 2.8284270763397217} -09/20/2021 19:01:28 - INFO - __main__ - Step 20949: {'lr': 0.00019993643253701858, 'samples': 670368, 'steps': 1309, 'loss/train': 3.1679680347442627} -09/20/2021 19:01:28 - INFO - __main__ - Step 20950: {'lr': 0.00019993643253701858, 'samples': 670400, 'steps': 1309, 'loss/train': 4.211698532104492} -09/20/2021 19:01:29 - INFO - __main__ - Step 20951: {'lr': 0.00019993643253701858, 'samples': 670432, 'steps': 1309, 'loss/train': 2.6107215881347656} -09/20/2021 19:01:30 - INFO - __main__ - Step 20952: {'lr': 0.00019993643253701858, 'samples': 670464, 'steps': 1309, 'loss/train': 3.503851890563965} -09/20/2021 19:01:31 - INFO - __main__ - Step 20953: {'lr': 0.00019993643253701858, 'samples': 670496, 'steps': 1309, 'loss/train': 3.7001287937164307} -09/20/2021 19:01:31 - INFO - __main__ - Step 20954: {'lr': 0.00019993643253701858, 'samples': 670528, 'steps': 1309, 'loss/train': 3.0666003227233887} -09/20/2021 19:01:33 - INFO - __main__ - Step 20955: {'lr': 0.00019993643253701858, 'samples': 670560, 'steps': 1309, 'loss/train': 3.3514225482940674} -09/20/2021 19:01:33 - INFO - __main__ - Step 20956: {'lr': 0.00019993643253701858, 'samples': 670592, 'steps': 1309, 'loss/train': 3.5996253490448} -09/20/2021 19:01:34 - INFO - __main__ - Step 20957: {'lr': 0.00019993643253701858, 'samples': 670624, 'steps': 1309, 'loss/train': 3.29584002494812} -09/20/2021 19:01:35 - INFO - __main__ - Step 20958: {'lr': 0.00019993643253701858, 'samples': 670656, 'steps': 1309, 'loss/train': 4.595926761627197} -09/20/2021 19:01:36 - INFO - __main__ - Step 20959: {'lr': 0.00019993643253701858, 'samples': 670688, 'steps': 1309, 'loss/train': 4.863544464111328} -09/20/2021 19:01:36 - INFO - __main__ - Step 20960: {'lr': 0.00019993643253701858, 'samples': 670720, 'steps': 1309, 'loss/train': 3.429201364517212} -09/20/2021 19:01:37 - INFO - __main__ - Step 20961: {'lr': 0.00019993620492501338, 'samples': 670752, 'steps': 1310, 'loss/train': 2.645005941390991} -09/20/2021 19:01:38 - INFO - __main__ - Step 20962: {'lr': 0.00019993620492501338, 'samples': 670784, 'steps': 1310, 'loss/train': 2.6364753246307373} -09/20/2021 19:01:39 - INFO - __main__ - Step 20963: {'lr': 0.00019993620492501338, 'samples': 670816, 'steps': 1310, 'loss/train': 4.0331597328186035} -09/20/2021 19:01:40 - INFO - __main__ - Step 20964: {'lr': 0.00019993620492501338, 'samples': 670848, 'steps': 1310, 'loss/train': 2.8031044006347656} -09/20/2021 19:01:40 - INFO - __main__ - Step 20965: {'lr': 0.00019993620492501338, 'samples': 670880, 'steps': 1310, 'loss/train': 3.0496740341186523} -09/20/2021 19:01:41 - INFO - __main__ - Step 20966: {'lr': 0.00019993620492501338, 'samples': 670912, 'steps': 1310, 'loss/train': 3.6875696182250977} -09/20/2021 19:01:42 - INFO - __main__ - Step 20967: {'lr': 0.00019993620492501338, 'samples': 670944, 'steps': 1310, 'loss/train': 3.620413064956665} -09/20/2021 19:01:43 - INFO - __main__ - Step 20968: {'lr': 0.00019993620492501338, 'samples': 670976, 'steps': 1310, 'loss/train': 3.4013190269470215} -09/20/2021 19:01:43 - INFO - __main__ - Step 20969: {'lr': 0.00019993620492501338, 'samples': 671008, 'steps': 1310, 'loss/train': 3.3211286067962646} -09/20/2021 19:01:44 - INFO - __main__ - Step 20970: {'lr': 0.00019993620492501338, 'samples': 671040, 'steps': 1310, 'loss/train': 3.0261690616607666} -09/20/2021 19:01:45 - INFO - __main__ - Step 20971: {'lr': 0.00019993620492501338, 'samples': 671072, 'steps': 1310, 'loss/train': 3.9507999420166016} -09/20/2021 19:01:46 - INFO - __main__ - Step 20972: {'lr': 0.00019993620492501338, 'samples': 671104, 'steps': 1310, 'loss/train': 3.066255807876587} -09/20/2021 19:01:46 - INFO - __main__ - Step 20973: {'lr': 0.00019993620492501338, 'samples': 671136, 'steps': 1310, 'loss/train': 3.2459583282470703} -09/20/2021 19:01:47 - INFO - __main__ - Step 20974: {'lr': 0.00019993620492501338, 'samples': 671168, 'steps': 1310, 'loss/train': 3.7010133266448975} -09/20/2021 19:01:48 - INFO - __main__ - Step 20975: {'lr': 0.00019993620492501338, 'samples': 671200, 'steps': 1310, 'loss/train': 2.9565157890319824} -09/20/2021 19:01:49 - INFO - __main__ - Step 20976: {'lr': 0.00019993620492501338, 'samples': 671232, 'steps': 1310, 'loss/train': 2.086547613143921} -09/20/2021 19:01:49 - INFO - __main__ - Step 20977: {'lr': 0.00019993597690636813, 'samples': 671264, 'steps': 1311, 'loss/train': 3.394428253173828} -09/20/2021 19:01:50 - INFO - __main__ - Step 20978: {'lr': 0.00019993597690636813, 'samples': 671296, 'steps': 1311, 'loss/train': 3.3281571865081787} -09/20/2021 19:01:51 - INFO - __main__ - Step 20979: {'lr': 0.00019993597690636813, 'samples': 671328, 'steps': 1311, 'loss/train': 3.833225727081299} -09/20/2021 19:01:52 - INFO - __main__ - Step 20980: {'lr': 0.00019993597690636813, 'samples': 671360, 'steps': 1311, 'loss/train': 3.9069297313690186} -09/20/2021 19:01:52 - INFO - __main__ - Step 20981: {'lr': 0.00019993597690636813, 'samples': 671392, 'steps': 1311, 'loss/train': 3.155426502227783} -09/20/2021 19:01:53 - INFO - __main__ - Step 20982: {'lr': 0.00019993597690636813, 'samples': 671424, 'steps': 1311, 'loss/train': 3.359628915786743} -09/20/2021 19:01:54 - INFO - __main__ - Step 20983: {'lr': 0.00019993597690636813, 'samples': 671456, 'steps': 1311, 'loss/train': 3.6398940086364746} -09/20/2021 19:01:55 - INFO - __main__ - Step 20984: {'lr': 0.00019993597690636813, 'samples': 671488, 'steps': 1311, 'loss/train': 2.8305892944335938} -09/20/2021 19:01:55 - INFO - __main__ - Step 20985: {'lr': 0.00019993597690636813, 'samples': 671520, 'steps': 1311, 'loss/train': 1.9142340421676636} -09/20/2021 19:01:57 - INFO - __main__ - Step 20986: {'lr': 0.00019993597690636813, 'samples': 671552, 'steps': 1311, 'loss/train': 3.952887773513794} -09/20/2021 19:01:57 - INFO - __main__ - Step 20987: {'lr': 0.00019993597690636813, 'samples': 671584, 'steps': 1311, 'loss/train': 3.127458095550537} -09/20/2021 19:01:58 - INFO - __main__ - Step 20988: {'lr': 0.00019993597690636813, 'samples': 671616, 'steps': 1311, 'loss/train': 2.4517221450805664} -09/20/2021 19:01:59 - INFO - __main__ - Step 20989: {'lr': 0.00019993597690636813, 'samples': 671648, 'steps': 1311, 'loss/train': 3.1429953575134277} -09/20/2021 19:02:00 - INFO - __main__ - Step 20990: {'lr': 0.00019993597690636813, 'samples': 671680, 'steps': 1311, 'loss/train': 0.9309989809989929} -09/20/2021 19:02:00 - INFO - __main__ - Step 20991: {'lr': 0.00019993597690636813, 'samples': 671712, 'steps': 1311, 'loss/train': 2.577329635620117} -09/20/2021 19:02:01 - INFO - __main__ - Step 20992: {'lr': 0.00019993597690636813, 'samples': 671744, 'steps': 1311, 'loss/train': 2.55847430229187} -09/20/2021 19:02:02 - INFO - __main__ - Step 20993: {'lr': 0.0001999357484810838, 'samples': 671776, 'steps': 1312, 'loss/train': 5.2266950607299805} -09/20/2021 19:02:03 - INFO - __main__ - Step 20994: {'lr': 0.0001999357484810838, 'samples': 671808, 'steps': 1312, 'loss/train': 3.7524795532226562} -09/20/2021 19:02:04 - INFO - __main__ - Step 20995: {'lr': 0.0001999357484810838, 'samples': 671840, 'steps': 1312, 'loss/train': 3.228163003921509} -09/20/2021 19:02:04 - INFO - __main__ - Step 20996: {'lr': 0.0001999357484810838, 'samples': 671872, 'steps': 1312, 'loss/train': 3.166698455810547} -09/20/2021 19:02:05 - INFO - __main__ - Step 20997: {'lr': 0.0001999357484810838, 'samples': 671904, 'steps': 1312, 'loss/train': 2.9600257873535156} -09/20/2021 19:02:06 - INFO - __main__ - Step 20998: {'lr': 0.0001999357484810838, 'samples': 671936, 'steps': 1312, 'loss/train': 3.345292329788208} -09/20/2021 19:02:07 - INFO - __main__ - Step 20999: {'lr': 0.0001999357484810838, 'samples': 671968, 'steps': 1312, 'loss/train': 3.708357572555542} -09/20/2021 19:02:07 - INFO - __main__ - Step 21000: {'lr': 0.0001999357484810838, 'samples': 672000, 'steps': 1312, 'loss/train': 3.6290886402130127} -09/20/2021 19:02:08 - INFO - __main__ - Step 21001: {'lr': 0.0001999357484810838, 'samples': 672032, 'steps': 1312, 'loss/train': 3.0520951747894287} -09/20/2021 19:02:09 - INFO - __main__ - Step 21002: {'lr': 0.0001999357484810838, 'samples': 672064, 'steps': 1312, 'loss/train': 4.912009239196777} -09/20/2021 19:02:10 - INFO - __main__ - Step 21003: {'lr': 0.0001999357484810838, 'samples': 672096, 'steps': 1312, 'loss/train': 4.160528182983398} -09/20/2021 19:02:10 - INFO - __main__ - Step 21004: {'lr': 0.0001999357484810838, 'samples': 672128, 'steps': 1312, 'loss/train': 2.542018175125122} -09/20/2021 19:02:11 - INFO - __main__ - Step 21005: {'lr': 0.0001999357484810838, 'samples': 672160, 'steps': 1312, 'loss/train': 2.980276584625244} -09/20/2021 19:02:12 - INFO - __main__ - Step 21006: {'lr': 0.0001999357484810838, 'samples': 672192, 'steps': 1312, 'loss/train': 2.7919445037841797} -09/20/2021 19:02:13 - INFO - __main__ - Step 21007: {'lr': 0.0001999357484810838, 'samples': 672224, 'steps': 1312, 'loss/train': 3.0077033042907715} -09/20/2021 19:02:13 - INFO - __main__ - Step 21008: {'lr': 0.0001999357484810838, 'samples': 672256, 'steps': 1312, 'loss/train': 4.222569465637207} -09/20/2021 19:02:14 - INFO - __main__ - Step 21009: {'lr': 0.00019993551964916134, 'samples': 672288, 'steps': 1313, 'loss/train': 3.2441277503967285} -09/20/2021 19:02:15 - INFO - __main__ - Step 21010: {'lr': 0.00019993551964916134, 'samples': 672320, 'steps': 1313, 'loss/train': 3.0139713287353516} -09/20/2021 19:02:16 - INFO - __main__ - Step 21011: {'lr': 0.00019993551964916134, 'samples': 672352, 'steps': 1313, 'loss/train': 3.7710328102111816} -09/20/2021 19:02:16 - INFO - __main__ - Step 21012: {'lr': 0.00019993551964916134, 'samples': 672384, 'steps': 1313, 'loss/train': 4.257450580596924} -09/20/2021 19:02:17 - INFO - __main__ - Step 21013: {'lr': 0.00019993551964916134, 'samples': 672416, 'steps': 1313, 'loss/train': 3.9263033866882324} -09/20/2021 19:02:18 - INFO - __main__ - Step 21014: {'lr': 0.00019993551964916134, 'samples': 672448, 'steps': 1313, 'loss/train': 2.808729410171509} -09/20/2021 19:02:19 - INFO - __main__ - Step 21015: {'lr': 0.00019993551964916134, 'samples': 672480, 'steps': 1313, 'loss/train': 3.8835136890411377} -09/20/2021 19:02:19 - INFO - __main__ - Step 21016: {'lr': 0.00019993551964916134, 'samples': 672512, 'steps': 1313, 'loss/train': 2.3001246452331543} -09/20/2021 19:02:20 - INFO - __main__ - Step 21017: {'lr': 0.00019993551964916134, 'samples': 672544, 'steps': 1313, 'loss/train': 4.2683210372924805} -09/20/2021 19:02:22 - INFO - __main__ - Step 21018: {'lr': 0.00019993551964916134, 'samples': 672576, 'steps': 1313, 'loss/train': 3.2432172298431396} -09/20/2021 19:02:23 - INFO - __main__ - Step 21019: {'lr': 0.00019993551964916134, 'samples': 672608, 'steps': 1313, 'loss/train': 2.9253597259521484} -09/20/2021 19:02:23 - INFO - __main__ - Step 21020: {'lr': 0.00019993551964916134, 'samples': 672640, 'steps': 1313, 'loss/train': 3.245107889175415} -09/20/2021 19:02:24 - INFO - __main__ - Step 21021: {'lr': 0.00019993551964916134, 'samples': 672672, 'steps': 1313, 'loss/train': 3.4766616821289062} -09/20/2021 19:02:25 - INFO - __main__ - Step 21022: {'lr': 0.00019993551964916134, 'samples': 672704, 'steps': 1313, 'loss/train': 3.575873374938965} -09/20/2021 19:02:26 - INFO - __main__ - Step 21023: {'lr': 0.00019993551964916134, 'samples': 672736, 'steps': 1313, 'loss/train': 2.6757843494415283} -09/20/2021 19:02:26 - INFO - __main__ - Step 21024: {'lr': 0.00019993551964916134, 'samples': 672768, 'steps': 1313, 'loss/train': 4.118015289306641} -09/20/2021 19:02:27 - INFO - __main__ - Step 21025: {'lr': 0.0001999352904106016, 'samples': 672800, 'steps': 1314, 'loss/train': 3.770933151245117} -09/20/2021 19:02:28 - INFO - __main__ - Step 21026: {'lr': 0.0001999352904106016, 'samples': 672832, 'steps': 1314, 'loss/train': 3.693509340286255} -09/20/2021 19:02:29 - INFO - __main__ - Step 21027: {'lr': 0.0001999352904106016, 'samples': 672864, 'steps': 1314, 'loss/train': 2.818211793899536} -09/20/2021 19:02:30 - INFO - __main__ - Step 21028: {'lr': 0.0001999352904106016, 'samples': 672896, 'steps': 1314, 'loss/train': 1.053248643875122} -09/20/2021 19:02:30 - INFO - __main__ - Step 21029: {'lr': 0.0001999352904106016, 'samples': 672928, 'steps': 1314, 'loss/train': 4.314757347106934} -09/20/2021 19:02:31 - INFO - __main__ - Step 21030: {'lr': 0.0001999352904106016, 'samples': 672960, 'steps': 1314, 'loss/train': 2.617642879486084} -09/20/2021 19:02:32 - INFO - __main__ - Step 21031: {'lr': 0.0001999352904106016, 'samples': 672992, 'steps': 1314, 'loss/train': 2.9014604091644287} -09/20/2021 19:02:33 - INFO - __main__ - Step 21032: {'lr': 0.0001999352904106016, 'samples': 673024, 'steps': 1314, 'loss/train': 3.269657611846924} -09/20/2021 19:02:33 - INFO - __main__ - Step 21033: {'lr': 0.0001999352904106016, 'samples': 673056, 'steps': 1314, 'loss/train': 3.5315794944763184} -09/20/2021 19:02:34 - INFO - __main__ - Step 21034: {'lr': 0.0001999352904106016, 'samples': 673088, 'steps': 1314, 'loss/train': 4.314048767089844} -09/20/2021 19:02:35 - INFO - __main__ - Step 21035: {'lr': 0.0001999352904106016, 'samples': 673120, 'steps': 1314, 'loss/train': 3.2458033561706543} -09/20/2021 19:02:36 - INFO - __main__ - Step 21036: {'lr': 0.0001999352904106016, 'samples': 673152, 'steps': 1314, 'loss/train': 2.8909707069396973} -09/20/2021 19:02:36 - INFO - __main__ - Step 21037: {'lr': 0.0001999352904106016, 'samples': 673184, 'steps': 1314, 'loss/train': 3.3052926063537598} -09/20/2021 19:02:37 - INFO - __main__ - Step 21038: {'lr': 0.0001999352904106016, 'samples': 673216, 'steps': 1314, 'loss/train': 2.6486992835998535} -09/20/2021 19:02:38 - INFO - __main__ - Step 21039: {'lr': 0.0001999352904106016, 'samples': 673248, 'steps': 1314, 'loss/train': 3.098984479904175} -09/20/2021 19:02:39 - INFO - __main__ - Step 21040: {'lr': 0.0001999352904106016, 'samples': 673280, 'steps': 1314, 'loss/train': 3.573228359222412} -09/20/2021 19:02:39 - INFO - __main__ - Step 21041: {'lr': 0.00019993506076540553, 'samples': 673312, 'steps': 1315, 'loss/train': 1.0430916547775269} -09/20/2021 19:02:40 - INFO - __main__ - Step 21042: {'lr': 0.00019993506076540553, 'samples': 673344, 'steps': 1315, 'loss/train': 2.8374135494232178} -09/20/2021 19:02:41 - INFO - __main__ - Step 21043: {'lr': 0.00019993506076540553, 'samples': 673376, 'steps': 1315, 'loss/train': 4.354111194610596} -09/20/2021 19:02:42 - INFO - __main__ - Step 21044: {'lr': 0.00019993506076540553, 'samples': 673408, 'steps': 1315, 'loss/train': 3.6673998832702637} -09/20/2021 19:02:42 - INFO - __main__ - Step 21045: {'lr': 0.00019993506076540553, 'samples': 673440, 'steps': 1315, 'loss/train': 2.3637678623199463} -09/20/2021 19:02:43 - INFO - __main__ - Step 21046: {'lr': 0.00019993506076540553, 'samples': 673472, 'steps': 1315, 'loss/train': 3.1508922576904297} -09/20/2021 19:02:44 - INFO - __main__ - Step 21047: {'lr': 0.00019993506076540553, 'samples': 673504, 'steps': 1315, 'loss/train': 3.5761234760284424} -09/20/2021 19:02:45 - INFO - __main__ - Step 21048: {'lr': 0.00019993506076540553, 'samples': 673536, 'steps': 1315, 'loss/train': 3.1542861461639404} -09/20/2021 19:02:45 - INFO - __main__ - Step 21049: {'lr': 0.00019993506076540553, 'samples': 673568, 'steps': 1315, 'loss/train': 3.6911263465881348} -09/20/2021 19:02:47 - INFO - __main__ - Step 21050: {'lr': 0.00019993506076540553, 'samples': 673600, 'steps': 1315, 'loss/train': 3.8179054260253906} -09/20/2021 19:02:48 - INFO - __main__ - Step 21051: {'lr': 0.00019993506076540553, 'samples': 673632, 'steps': 1315, 'loss/train': 1.1453899145126343} -09/20/2021 19:02:48 - INFO - __main__ - Step 21052: {'lr': 0.00019993506076540553, 'samples': 673664, 'steps': 1315, 'loss/train': 3.5391485691070557} -09/20/2021 19:02:49 - INFO - __main__ - Step 21053: {'lr': 0.00019993506076540553, 'samples': 673696, 'steps': 1315, 'loss/train': 3.041938066482544} -09/20/2021 19:02:50 - INFO - __main__ - Step 21054: {'lr': 0.00019993506076540553, 'samples': 673728, 'steps': 1315, 'loss/train': 3.538865327835083} -09/20/2021 19:02:51 - INFO - __main__ - Step 21055: {'lr': 0.00019993506076540553, 'samples': 673760, 'steps': 1315, 'loss/train': 4.622311592102051} -09/20/2021 19:02:51 - INFO - __main__ - Step 21056: {'lr': 0.00019993506076540553, 'samples': 673792, 'steps': 1315, 'loss/train': 3.8800878524780273} -09/20/2021 19:02:52 - INFO - __main__ - Step 21057: {'lr': 0.0001999348307135741, 'samples': 673824, 'steps': 1316, 'loss/train': 3.174194574356079} -09/20/2021 19:02:53 - INFO - __main__ - Step 21058: {'lr': 0.0001999348307135741, 'samples': 673856, 'steps': 1316, 'loss/train': 2.357052803039551} -09/20/2021 19:02:54 - INFO - __main__ - Step 21059: {'lr': 0.0001999348307135741, 'samples': 673888, 'steps': 1316, 'loss/train': 3.671422243118286} -09/20/2021 19:02:54 - INFO - __main__ - Step 21060: {'lr': 0.0001999348307135741, 'samples': 673920, 'steps': 1316, 'loss/train': 4.079856872558594} -09/20/2021 19:02:55 - INFO - __main__ - Step 21061: {'lr': 0.0001999348307135741, 'samples': 673952, 'steps': 1316, 'loss/train': 2.433875799179077} -09/20/2021 19:02:56 - INFO - __main__ - Step 21062: {'lr': 0.0001999348307135741, 'samples': 673984, 'steps': 1316, 'loss/train': 3.081029176712036} -09/20/2021 19:02:57 - INFO - __main__ - Step 21063: {'lr': 0.0001999348307135741, 'samples': 674016, 'steps': 1316, 'loss/train': 2.9284534454345703} -09/20/2021 19:02:57 - INFO - __main__ - Step 21064: {'lr': 0.0001999348307135741, 'samples': 674048, 'steps': 1316, 'loss/train': 3.9224846363067627} -09/20/2021 19:02:58 - INFO - __main__ - Step 21065: {'lr': 0.0001999348307135741, 'samples': 674080, 'steps': 1316, 'loss/train': 1.4064542055130005} -09/20/2021 19:02:59 - INFO - __main__ - Step 21066: {'lr': 0.0001999348307135741, 'samples': 674112, 'steps': 1316, 'loss/train': 3.315134048461914} -09/20/2021 19:03:00 - INFO - __main__ - Step 21067: {'lr': 0.0001999348307135741, 'samples': 674144, 'steps': 1316, 'loss/train': 2.8480942249298096} -09/20/2021 19:03:00 - INFO - __main__ - Step 21068: {'lr': 0.0001999348307135741, 'samples': 674176, 'steps': 1316, 'loss/train': 4.3124284744262695} -09/20/2021 19:03:01 - INFO - __main__ - Step 21069: {'lr': 0.0001999348307135741, 'samples': 674208, 'steps': 1316, 'loss/train': 3.5007529258728027} -09/20/2021 19:03:02 - INFO - __main__ - Step 21070: {'lr': 0.0001999348307135741, 'samples': 674240, 'steps': 1316, 'loss/train': 3.517157554626465} -09/20/2021 19:03:03 - INFO - __main__ - Step 21071: {'lr': 0.0001999348307135741, 'samples': 674272, 'steps': 1316, 'loss/train': 3.6306142807006836} -09/20/2021 19:03:03 - INFO - __main__ - Step 21072: {'lr': 0.0001999348307135741, 'samples': 674304, 'steps': 1316, 'loss/train': 2.6703970432281494} -09/20/2021 19:03:04 - INFO - __main__ - Step 21073: {'lr': 0.00019993460025510826, 'samples': 674336, 'steps': 1317, 'loss/train': 3.9698190689086914} -09/20/2021 19:03:05 - INFO - __main__ - Step 21074: {'lr': 0.00019993460025510826, 'samples': 674368, 'steps': 1317, 'loss/train': 3.491403102874756} -09/20/2021 19:03:06 - INFO - __main__ - Step 21075: {'lr': 0.00019993460025510826, 'samples': 674400, 'steps': 1317, 'loss/train': 3.006901741027832} -09/20/2021 19:03:07 - INFO - __main__ - Step 21076: {'lr': 0.00019993460025510826, 'samples': 674432, 'steps': 1317, 'loss/train': 5.734396457672119} -09/20/2021 19:03:07 - INFO - __main__ - Step 21077: {'lr': 0.00019993460025510826, 'samples': 674464, 'steps': 1317, 'loss/train': 4.45241641998291} -09/20/2021 19:03:08 - INFO - __main__ - Step 21078: {'lr': 0.00019993460025510826, 'samples': 674496, 'steps': 1317, 'loss/train': 3.600351095199585} -09/20/2021 19:03:09 - INFO - __main__ - Step 21079: {'lr': 0.00019993460025510826, 'samples': 674528, 'steps': 1317, 'loss/train': 4.2530999183654785} -09/20/2021 19:03:10 - INFO - __main__ - Step 21080: {'lr': 0.00019993460025510826, 'samples': 674560, 'steps': 1317, 'loss/train': 3.715320587158203} -09/20/2021 19:03:11 - INFO - __main__ - Step 21081: {'lr': 0.00019993460025510826, 'samples': 674592, 'steps': 1317, 'loss/train': 3.0224907398223877} -09/20/2021 19:03:12 - INFO - __main__ - Step 21082: {'lr': 0.00019993460025510826, 'samples': 674624, 'steps': 1317, 'loss/train': 2.3231372833251953} -09/20/2021 19:03:12 - INFO - __main__ - Step 21083: {'lr': 0.00019993460025510826, 'samples': 674656, 'steps': 1317, 'loss/train': 2.902899980545044} -09/20/2021 19:03:13 - INFO - __main__ - Step 21084: {'lr': 0.00019993460025510826, 'samples': 674688, 'steps': 1317, 'loss/train': 2.889901876449585} -09/20/2021 19:03:14 - INFO - __main__ - Step 21085: {'lr': 0.00019993460025510826, 'samples': 674720, 'steps': 1317, 'loss/train': 2.913830518722534} -09/20/2021 19:03:15 - INFO - __main__ - Step 21086: {'lr': 0.00019993460025510826, 'samples': 674752, 'steps': 1317, 'loss/train': 3.888230323791504} -09/20/2021 19:03:15 - INFO - __main__ - Step 21087: {'lr': 0.00019993460025510826, 'samples': 674784, 'steps': 1317, 'loss/train': 2.925731897354126} -09/20/2021 19:03:16 - INFO - __main__ - Step 21088: {'lr': 0.00019993460025510826, 'samples': 674816, 'steps': 1317, 'loss/train': 3.007627248764038} -09/20/2021 19:03:17 - INFO - __main__ - Step 21089: {'lr': 0.0001999343693900089, 'samples': 674848, 'steps': 1318, 'loss/train': 3.097705364227295} -09/20/2021 19:03:18 - INFO - __main__ - Step 21090: {'lr': 0.0001999343693900089, 'samples': 674880, 'steps': 1318, 'loss/train': 3.559023380279541} -09/20/2021 19:03:18 - INFO - __main__ - Step 21091: {'lr': 0.0001999343693900089, 'samples': 674912, 'steps': 1318, 'loss/train': 3.2442328929901123} -09/20/2021 19:03:19 - INFO - __main__ - Step 21092: {'lr': 0.0001999343693900089, 'samples': 674944, 'steps': 1318, 'loss/train': 2.410611152648926} -09/20/2021 19:03:20 - INFO - __main__ - Step 21093: {'lr': 0.0001999343693900089, 'samples': 674976, 'steps': 1318, 'loss/train': 3.992312431335449} -09/20/2021 19:03:21 - INFO - __main__ - Step 21094: {'lr': 0.0001999343693900089, 'samples': 675008, 'steps': 1318, 'loss/train': 3.2676916122436523} -09/20/2021 19:03:21 - INFO - __main__ - Step 21095: {'lr': 0.0001999343693900089, 'samples': 675040, 'steps': 1318, 'loss/train': 2.9433679580688477} -09/20/2021 19:03:22 - INFO - __main__ - Step 21096: {'lr': 0.0001999343693900089, 'samples': 675072, 'steps': 1318, 'loss/train': 3.1514644622802734} -09/20/2021 19:03:23 - INFO - __main__ - Step 21097: {'lr': 0.0001999343693900089, 'samples': 675104, 'steps': 1318, 'loss/train': 2.193955898284912} -09/20/2021 19:03:24 - INFO - __main__ - Step 21098: {'lr': 0.0001999343693900089, 'samples': 675136, 'steps': 1318, 'loss/train': 3.150480031967163} -09/20/2021 19:03:24 - INFO - __main__ - Step 21099: {'lr': 0.0001999343693900089, 'samples': 675168, 'steps': 1318, 'loss/train': 3.8362503051757812} -09/20/2021 19:03:25 - INFO - __main__ - Step 21100: {'lr': 0.0001999343693900089, 'samples': 675200, 'steps': 1318, 'loss/train': 2.955495834350586} -09/20/2021 19:03:26 - INFO - __main__ - Step 21101: {'lr': 0.0001999343693900089, 'samples': 675232, 'steps': 1318, 'loss/train': 2.9088988304138184} -09/20/2021 19:03:27 - INFO - __main__ - Step 21102: {'lr': 0.0001999343693900089, 'samples': 675264, 'steps': 1318, 'loss/train': 3.0517590045928955} -09/20/2021 19:03:27 - INFO - __main__ - Step 21103: {'lr': 0.0001999343693900089, 'samples': 675296, 'steps': 1318, 'loss/train': 3.2555091381073} -09/20/2021 19:03:28 - INFO - __main__ - Step 21104: {'lr': 0.0001999343693900089, 'samples': 675328, 'steps': 1318, 'loss/train': 3.494170904159546} -09/20/2021 19:03:29 - INFO - __main__ - Step 21105: {'lr': 0.00019993413811827696, 'samples': 675360, 'steps': 1319, 'loss/train': 3.593341588973999} -09/20/2021 19:03:30 - INFO - __main__ - Step 21106: {'lr': 0.00019993413811827696, 'samples': 675392, 'steps': 1319, 'loss/train': 0.49456220865249634} -09/20/2021 19:03:31 - INFO - __main__ - Step 21107: {'lr': 0.00019993413811827696, 'samples': 675424, 'steps': 1319, 'loss/train': 3.5256569385528564} -09/20/2021 19:03:31 - INFO - __main__ - Step 21108: {'lr': 0.00019993413811827696, 'samples': 675456, 'steps': 1319, 'loss/train': 3.489018201828003} -09/20/2021 19:03:32 - INFO - __main__ - Step 21109: {'lr': 0.00019993413811827696, 'samples': 675488, 'steps': 1319, 'loss/train': 3.828407049179077} -09/20/2021 19:03:33 - INFO - __main__ - Step 21110: {'lr': 0.00019993413811827696, 'samples': 675520, 'steps': 1319, 'loss/train': 3.835419178009033} -09/20/2021 19:03:34 - INFO - __main__ - Step 21111: {'lr': 0.00019993413811827696, 'samples': 675552, 'steps': 1319, 'loss/train': 3.7772560119628906} -09/20/2021 19:03:35 - INFO - __main__ - Step 21112: {'lr': 0.00019993413811827696, 'samples': 675584, 'steps': 1319, 'loss/train': 2.720186471939087} -09/20/2021 19:03:36 - INFO - __main__ - Step 21113: {'lr': 0.00019993413811827696, 'samples': 675616, 'steps': 1319, 'loss/train': 3.2923059463500977} -09/20/2021 19:03:36 - INFO - __main__ - Step 21114: {'lr': 0.00019993413811827696, 'samples': 675648, 'steps': 1319, 'loss/train': 3.2602901458740234} -09/20/2021 19:03:37 - INFO - __main__ - Step 21115: {'lr': 0.00019993413811827696, 'samples': 675680, 'steps': 1319, 'loss/train': 4.032089710235596} -09/20/2021 19:03:38 - INFO - __main__ - Step 21116: {'lr': 0.00019993413811827696, 'samples': 675712, 'steps': 1319, 'loss/train': 3.3318252563476562} -09/20/2021 19:03:39 - INFO - __main__ - Step 21117: {'lr': 0.00019993413811827696, 'samples': 675744, 'steps': 1319, 'loss/train': 0.5294380187988281} -09/20/2021 19:03:39 - INFO - __main__ - Step 21118: {'lr': 0.00019993413811827696, 'samples': 675776, 'steps': 1319, 'loss/train': 2.2196671962738037} -09/20/2021 19:03:40 - INFO - __main__ - Step 21119: {'lr': 0.00019993413811827696, 'samples': 675808, 'steps': 1319, 'loss/train': 4.500833988189697} -09/20/2021 19:03:41 - INFO - __main__ - Step 21120: {'lr': 0.00019993413811827696, 'samples': 675840, 'steps': 1319, 'loss/train': 2.3423471450805664} -09/20/2021 19:03:42 - INFO - __main__ - Step 21121: {'lr': 0.0001999339064399134, 'samples': 675872, 'steps': 1320, 'loss/train': 3.260380983352661} -09/20/2021 19:03:42 - INFO - __main__ - Step 21122: {'lr': 0.0001999339064399134, 'samples': 675904, 'steps': 1320, 'loss/train': 2.9603376388549805} -09/20/2021 19:03:43 - INFO - __main__ - Step 21123: {'lr': 0.0001999339064399134, 'samples': 675936, 'steps': 1320, 'loss/train': 3.856839895248413} -09/20/2021 19:03:44 - INFO - __main__ - Step 21124: {'lr': 0.0001999339064399134, 'samples': 675968, 'steps': 1320, 'loss/train': 4.757077217102051} -09/20/2021 19:03:45 - INFO - __main__ - Step 21125: {'lr': 0.0001999339064399134, 'samples': 676000, 'steps': 1320, 'loss/train': 2.6261329650878906} -09/20/2021 19:03:45 - INFO - __main__ - Step 21126: {'lr': 0.0001999339064399134, 'samples': 676032, 'steps': 1320, 'loss/train': 3.3548777103424072} -09/20/2021 19:03:46 - INFO - __main__ - Step 21127: {'lr': 0.0001999339064399134, 'samples': 676064, 'steps': 1320, 'loss/train': 3.7352192401885986} -09/20/2021 19:03:47 - INFO - __main__ - Step 21128: {'lr': 0.0001999339064399134, 'samples': 676096, 'steps': 1320, 'loss/train': 3.363640308380127} -09/20/2021 19:03:48 - INFO - __main__ - Step 21129: {'lr': 0.0001999339064399134, 'samples': 676128, 'steps': 1320, 'loss/train': 2.9402360916137695} -09/20/2021 19:03:48 - INFO - __main__ - Step 21130: {'lr': 0.0001999339064399134, 'samples': 676160, 'steps': 1320, 'loss/train': 2.8920674324035645} -09/20/2021 19:03:49 - INFO - __main__ - Step 21131: {'lr': 0.0001999339064399134, 'samples': 676192, 'steps': 1320, 'loss/train': 3.2051472663879395} -09/20/2021 19:03:50 - INFO - __main__ - Step 21132: {'lr': 0.0001999339064399134, 'samples': 676224, 'steps': 1320, 'loss/train': 3.4117348194122314} -09/20/2021 19:03:51 - INFO - __main__ - Step 21133: {'lr': 0.0001999339064399134, 'samples': 676256, 'steps': 1320, 'loss/train': 3.678114414215088} -09/20/2021 19:03:51 - INFO - __main__ - Step 21134: {'lr': 0.0001999339064399134, 'samples': 676288, 'steps': 1320, 'loss/train': 3.433742046356201} -09/20/2021 19:03:52 - INFO - __main__ - Step 21135: {'lr': 0.0001999339064399134, 'samples': 676320, 'steps': 1320, 'loss/train': 2.65791654586792} -09/20/2021 19:03:53 - INFO - __main__ - Step 21136: {'lr': 0.0001999339064399134, 'samples': 676352, 'steps': 1320, 'loss/train': 3.8680226802825928} -09/20/2021 19:03:54 - INFO - __main__ - Step 21137: {'lr': 0.00019993367435491922, 'samples': 676384, 'steps': 1321, 'loss/train': 3.3805654048919678} -09/20/2021 19:03:55 - INFO - __main__ - Step 21138: {'lr': 0.00019993367435491922, 'samples': 676416, 'steps': 1321, 'loss/train': 6.10338830947876} -09/20/2021 19:03:55 - INFO - __main__ - Step 21139: {'lr': 0.00019993367435491922, 'samples': 676448, 'steps': 1321, 'loss/train': 2.4097282886505127} -09/20/2021 19:03:56 - INFO - __main__ - Step 21140: {'lr': 0.00019993367435491922, 'samples': 676480, 'steps': 1321, 'loss/train': 3.053380250930786} -09/20/2021 19:03:57 - INFO - __main__ - Step 21141: {'lr': 0.00019993367435491922, 'samples': 676512, 'steps': 1321, 'loss/train': 2.086285352706909} -09/20/2021 19:03:58 - INFO - __main__ - Step 21142: {'lr': 0.00019993367435491922, 'samples': 676544, 'steps': 1321, 'loss/train': 3.32291316986084} -09/20/2021 19:03:59 - INFO - __main__ - Step 21143: {'lr': 0.00019993367435491922, 'samples': 676576, 'steps': 1321, 'loss/train': 3.478917360305786} -09/20/2021 19:04:00 - INFO - __main__ - Step 21144: {'lr': 0.00019993367435491922, 'samples': 676608, 'steps': 1321, 'loss/train': 4.20797061920166} -09/20/2021 19:04:01 - INFO - __main__ - Step 21145: {'lr': 0.00019993367435491922, 'samples': 676640, 'steps': 1321, 'loss/train': 0.6083515882492065} -09/20/2021 19:04:01 - INFO - __main__ - Step 21146: {'lr': 0.00019993367435491922, 'samples': 676672, 'steps': 1321, 'loss/train': 0.8772246241569519} -09/20/2021 19:04:02 - INFO - __main__ - Step 21147: {'lr': 0.00019993367435491922, 'samples': 676704, 'steps': 1321, 'loss/train': 0.664353609085083} -09/20/2021 19:04:03 - INFO - __main__ - Step 21148: {'lr': 0.00019993367435491922, 'samples': 676736, 'steps': 1321, 'loss/train': 4.222593307495117} -09/20/2021 19:04:04 - INFO - __main__ - Step 21149: {'lr': 0.00019993367435491922, 'samples': 676768, 'steps': 1321, 'loss/train': 3.2604081630706787} -09/20/2021 19:04:04 - INFO - __main__ - Step 21150: {'lr': 0.00019993367435491922, 'samples': 676800, 'steps': 1321, 'loss/train': 3.7827281951904297} -09/20/2021 19:04:05 - INFO - __main__ - Step 21151: {'lr': 0.00019993367435491922, 'samples': 676832, 'steps': 1321, 'loss/train': 4.110716819763184} -09/20/2021 19:04:06 - INFO - __main__ - Step 21152: {'lr': 0.00019993367435491922, 'samples': 676864, 'steps': 1321, 'loss/train': 2.6353468894958496} -09/20/2021 19:04:07 - INFO - __main__ - Step 21153: {'lr': 0.00019993344186329526, 'samples': 676896, 'steps': 1322, 'loss/train': 2.7177605628967285} -09/20/2021 19:04:07 - INFO - __main__ - Step 21154: {'lr': 0.00019993344186329526, 'samples': 676928, 'steps': 1322, 'loss/train': 3.0116004943847656} -09/20/2021 19:04:08 - INFO - __main__ - Step 21155: {'lr': 0.00019993344186329526, 'samples': 676960, 'steps': 1322, 'loss/train': 3.40165114402771} -09/20/2021 19:04:09 - INFO - __main__ - Step 21156: {'lr': 0.00019993344186329526, 'samples': 676992, 'steps': 1322, 'loss/train': 3.3446624279022217} -09/20/2021 19:04:10 - INFO - __main__ - Step 21157: {'lr': 0.00019993344186329526, 'samples': 677024, 'steps': 1322, 'loss/train': 3.369525194168091} -09/20/2021 19:04:10 - INFO - __main__ - Step 21158: {'lr': 0.00019993344186329526, 'samples': 677056, 'steps': 1322, 'loss/train': 3.327331066131592} -09/20/2021 19:04:11 - INFO - __main__ - Step 21159: {'lr': 0.00019993344186329526, 'samples': 677088, 'steps': 1322, 'loss/train': 3.0215091705322266} -09/20/2021 19:04:12 - INFO - __main__ - Step 21160: {'lr': 0.00019993344186329526, 'samples': 677120, 'steps': 1322, 'loss/train': 2.313389539718628} -09/20/2021 19:04:13 - INFO - __main__ - Step 21161: {'lr': 0.00019993344186329526, 'samples': 677152, 'steps': 1322, 'loss/train': 3.271015167236328} -09/20/2021 19:04:13 - INFO - __main__ - Step 21162: {'lr': 0.00019993344186329526, 'samples': 677184, 'steps': 1322, 'loss/train': 4.0755228996276855} -09/20/2021 19:04:14 - INFO - __main__ - Step 21163: {'lr': 0.00019993344186329526, 'samples': 677216, 'steps': 1322, 'loss/train': 3.806830883026123} -09/20/2021 19:04:15 - INFO - __main__ - Step 21164: {'lr': 0.00019993344186329526, 'samples': 677248, 'steps': 1322, 'loss/train': 2.41105055809021} -09/20/2021 19:04:16 - INFO - __main__ - Step 21165: {'lr': 0.00019993344186329526, 'samples': 677280, 'steps': 1322, 'loss/train': 3.386458396911621} -09/20/2021 19:04:16 - INFO - __main__ - Step 21166: {'lr': 0.00019993344186329526, 'samples': 677312, 'steps': 1322, 'loss/train': 2.776500701904297} -09/20/2021 19:04:17 - INFO - __main__ - Step 21167: {'lr': 0.00019993344186329526, 'samples': 677344, 'steps': 1322, 'loss/train': 2.460078239440918} -09/20/2021 19:04:18 - INFO - __main__ - Step 21168: {'lr': 0.00019993344186329526, 'samples': 677376, 'steps': 1322, 'loss/train': 3.0142533779144287} -09/20/2021 19:04:19 - INFO - __main__ - Step 21169: {'lr': 0.00019993320896504252, 'samples': 677408, 'steps': 1323, 'loss/train': 3.597442626953125} -09/20/2021 19:04:20 - INFO - __main__ - Step 21170: {'lr': 0.00019993320896504252, 'samples': 677440, 'steps': 1323, 'loss/train': 4.3710761070251465} -09/20/2021 19:04:20 - INFO - __main__ - Step 21171: {'lr': 0.00019993320896504252, 'samples': 677472, 'steps': 1323, 'loss/train': 4.524550437927246} -09/20/2021 19:04:21 - INFO - __main__ - Step 21172: {'lr': 0.00019993320896504252, 'samples': 677504, 'steps': 1323, 'loss/train': 3.2515957355499268} -09/20/2021 19:04:22 - INFO - __main__ - Step 21173: {'lr': 0.00019993320896504252, 'samples': 677536, 'steps': 1323, 'loss/train': 3.194941759109497} -09/20/2021 19:04:23 - INFO - __main__ - Step 21174: {'lr': 0.00019993320896504252, 'samples': 677568, 'steps': 1323, 'loss/train': 3.1758534908294678} -09/20/2021 19:04:23 - INFO - __main__ - Step 21175: {'lr': 0.00019993320896504252, 'samples': 677600, 'steps': 1323, 'loss/train': 3.1799964904785156} -09/20/2021 19:04:24 - INFO - __main__ - Step 21176: {'lr': 0.00019993320896504252, 'samples': 677632, 'steps': 1323, 'loss/train': 3.2616798877716064} -09/20/2021 19:04:25 - INFO - __main__ - Step 21177: {'lr': 0.00019993320896504252, 'samples': 677664, 'steps': 1323, 'loss/train': 3.1577439308166504} -09/20/2021 19:04:26 - INFO - __main__ - Step 21178: {'lr': 0.00019993320896504252, 'samples': 677696, 'steps': 1323, 'loss/train': 3.542309522628784} -09/20/2021 19:04:27 - INFO - __main__ - Step 21179: {'lr': 0.00019993320896504252, 'samples': 677728, 'steps': 1323, 'loss/train': 3.75150203704834} -09/20/2021 19:04:28 - INFO - __main__ - Step 21180: {'lr': 0.00019993320896504252, 'samples': 677760, 'steps': 1323, 'loss/train': 4.135714054107666} -09/20/2021 19:04:28 - INFO - __main__ - Step 21181: {'lr': 0.00019993320896504252, 'samples': 677792, 'steps': 1323, 'loss/train': 2.383471727371216} -09/20/2021 19:04:29 - INFO - __main__ - Step 21182: {'lr': 0.00019993320896504252, 'samples': 677824, 'steps': 1323, 'loss/train': 3.366880416870117} -09/20/2021 19:04:30 - INFO - __main__ - Step 21183: {'lr': 0.00019993320896504252, 'samples': 677856, 'steps': 1323, 'loss/train': 2.5654184818267822} -09/20/2021 19:04:31 - INFO - __main__ - Step 21184: {'lr': 0.00019993320896504252, 'samples': 677888, 'steps': 1323, 'loss/train': 0.7039706707000732} -09/20/2021 19:04:31 - INFO - __main__ - Step 21185: {'lr': 0.00019993297566016192, 'samples': 677920, 'steps': 1324, 'loss/train': 4.008270263671875} -09/20/2021 19:04:32 - INFO - __main__ - Step 21186: {'lr': 0.00019993297566016192, 'samples': 677952, 'steps': 1324, 'loss/train': 5.109308242797852} -09/20/2021 19:04:33 - INFO - __main__ - Step 21187: {'lr': 0.00019993297566016192, 'samples': 677984, 'steps': 1324, 'loss/train': 3.12817120552063} -09/20/2021 19:04:34 - INFO - __main__ - Step 21188: {'lr': 0.00019993297566016192, 'samples': 678016, 'steps': 1324, 'loss/train': 3.383530616760254} -09/20/2021 19:04:34 - INFO - __main__ - Step 21189: {'lr': 0.00019993297566016192, 'samples': 678048, 'steps': 1324, 'loss/train': 2.9679477214813232} -09/20/2021 19:04:35 - INFO - __main__ - Step 21190: {'lr': 0.00019993297566016192, 'samples': 678080, 'steps': 1324, 'loss/train': 2.8573856353759766} -09/20/2021 19:04:36 - INFO - __main__ - Step 21191: {'lr': 0.00019993297566016192, 'samples': 678112, 'steps': 1324, 'loss/train': 2.910861015319824} -09/20/2021 19:04:37 - INFO - __main__ - Step 21192: {'lr': 0.00019993297566016192, 'samples': 678144, 'steps': 1324, 'loss/train': 4.022124767303467} -09/20/2021 19:04:37 - INFO - __main__ - Step 21193: {'lr': 0.00019993297566016192, 'samples': 678176, 'steps': 1324, 'loss/train': 3.136070489883423} -09/20/2021 19:04:38 - INFO - __main__ - Step 21194: {'lr': 0.00019993297566016192, 'samples': 678208, 'steps': 1324, 'loss/train': 3.118354082107544} -09/20/2021 19:04:39 - INFO - __main__ - Step 21195: {'lr': 0.00019993297566016192, 'samples': 678240, 'steps': 1324, 'loss/train': 4.2701239585876465} -09/20/2021 19:04:40 - INFO - __main__ - Step 21196: {'lr': 0.00019993297566016192, 'samples': 678272, 'steps': 1324, 'loss/train': 1.6745381355285645} -09/20/2021 19:04:40 - INFO - __main__ - Step 21197: {'lr': 0.00019993297566016192, 'samples': 678304, 'steps': 1324, 'loss/train': 2.900674343109131} -09/20/2021 19:04:41 - INFO - __main__ - Step 21198: {'lr': 0.00019993297566016192, 'samples': 678336, 'steps': 1324, 'loss/train': 3.160442352294922} -09/20/2021 19:04:42 - INFO - __main__ - Step 21199: {'lr': 0.00019993297566016192, 'samples': 678368, 'steps': 1324, 'loss/train': 3.7914390563964844} -09/20/2021 19:04:43 - INFO - __main__ - Step 21200: {'lr': 0.00019993297566016192, 'samples': 678400, 'steps': 1324, 'loss/train': 2.582261800765991} -09/20/2021 19:04:44 - INFO - __main__ - Step 21201: {'lr': 0.00019993274194865445, 'samples': 678432, 'steps': 1325, 'loss/train': 3.8353443145751953} -09/20/2021 19:04:44 - INFO - __main__ - Step 21202: {'lr': 0.00019993274194865445, 'samples': 678464, 'steps': 1325, 'loss/train': 3.4217193126678467} -09/20/2021 19:04:45 - INFO - __main__ - Step 21203: {'lr': 0.00019993274194865445, 'samples': 678496, 'steps': 1325, 'loss/train': 1.7821797132492065} -09/20/2021 19:04:46 - INFO - __main__ - Step 21204: {'lr': 0.00019993274194865445, 'samples': 678528, 'steps': 1325, 'loss/train': 3.483625650405884} -09/20/2021 19:04:47 - INFO - __main__ - Step 21205: {'lr': 0.00019993274194865445, 'samples': 678560, 'steps': 1325, 'loss/train': 2.7623512744903564} -09/20/2021 19:04:47 - INFO - __main__ - Step 21206: {'lr': 0.00019993274194865445, 'samples': 678592, 'steps': 1325, 'loss/train': 2.608449935913086} -09/20/2021 19:04:48 - INFO - __main__ - Step 21207: {'lr': 0.00019993274194865445, 'samples': 678624, 'steps': 1325, 'loss/train': 3.3523929119110107} -09/20/2021 19:04:49 - INFO - __main__ - Step 21208: {'lr': 0.00019993274194865445, 'samples': 678656, 'steps': 1325, 'loss/train': 3.933241844177246} -09/20/2021 19:04:50 - INFO - __main__ - Step 21209: {'lr': 0.00019993274194865445, 'samples': 678688, 'steps': 1325, 'loss/train': 3.001046895980835} -09/20/2021 19:04:51 - INFO - __main__ - Step 21210: {'lr': 0.00019993274194865445, 'samples': 678720, 'steps': 1325, 'loss/train': 3.145589828491211} -09/20/2021 19:04:52 - INFO - __main__ - Step 21211: {'lr': 0.00019993274194865445, 'samples': 678752, 'steps': 1325, 'loss/train': 5.441564559936523} -09/20/2021 19:04:52 - INFO - __main__ - Step 21212: {'lr': 0.00019993274194865445, 'samples': 678784, 'steps': 1325, 'loss/train': 3.4471235275268555} -09/20/2021 19:04:53 - INFO - __main__ - Step 21213: {'lr': 0.00019993274194865445, 'samples': 678816, 'steps': 1325, 'loss/train': 3.98956036567688} -09/20/2021 19:04:54 - INFO - __main__ - Step 21214: {'lr': 0.00019993274194865445, 'samples': 678848, 'steps': 1325, 'loss/train': 2.3543295860290527} -09/20/2021 19:04:55 - INFO - __main__ - Step 21215: {'lr': 0.00019993274194865445, 'samples': 678880, 'steps': 1325, 'loss/train': 3.35709810256958} -09/20/2021 19:04:55 - INFO - __main__ - Step 21216: {'lr': 0.00019993274194865445, 'samples': 678912, 'steps': 1325, 'loss/train': 3.0601861476898193} -09/20/2021 19:04:56 - INFO - __main__ - Step 21217: {'lr': 0.00019993250783052104, 'samples': 678944, 'steps': 1326, 'loss/train': 2.867882251739502} -09/20/2021 19:04:57 - INFO - __main__ - Step 21218: {'lr': 0.00019993250783052104, 'samples': 678976, 'steps': 1326, 'loss/train': 2.7701401710510254} -09/20/2021 19:04:58 - INFO - __main__ - Step 21219: {'lr': 0.00019993250783052104, 'samples': 679008, 'steps': 1326, 'loss/train': 2.8233587741851807} -09/20/2021 19:04:59 - INFO - __main__ - Step 21220: {'lr': 0.00019993250783052104, 'samples': 679040, 'steps': 1326, 'loss/train': 3.2884881496429443} -09/20/2021 19:04:59 - INFO - __main__ - Step 21221: {'lr': 0.00019993250783052104, 'samples': 679072, 'steps': 1326, 'loss/train': 2.521489143371582} -09/20/2021 19:05:00 - INFO - __main__ - Step 21222: {'lr': 0.00019993250783052104, 'samples': 679104, 'steps': 1326, 'loss/train': 3.440275192260742} -09/20/2021 19:05:01 - INFO - __main__ - Step 21223: {'lr': 0.00019993250783052104, 'samples': 679136, 'steps': 1326, 'loss/train': 3.384990930557251} -09/20/2021 19:05:02 - INFO - __main__ - Step 21224: {'lr': 0.00019993250783052104, 'samples': 679168, 'steps': 1326, 'loss/train': 2.93709397315979} -09/20/2021 19:05:02 - INFO - __main__ - Step 21225: {'lr': 0.00019993250783052104, 'samples': 679200, 'steps': 1326, 'loss/train': 3.2722644805908203} -09/20/2021 19:05:03 - INFO - __main__ - Step 21226: {'lr': 0.00019993250783052104, 'samples': 679232, 'steps': 1326, 'loss/train': 3.147143602371216} -09/20/2021 19:05:04 - INFO - __main__ - Step 21227: {'lr': 0.00019993250783052104, 'samples': 679264, 'steps': 1326, 'loss/train': 3.484943151473999} -09/20/2021 19:05:05 - INFO - __main__ - Step 21228: {'lr': 0.00019993250783052104, 'samples': 679296, 'steps': 1326, 'loss/train': 3.2014951705932617} -09/20/2021 19:05:05 - INFO - __main__ - Step 21229: {'lr': 0.00019993250783052104, 'samples': 679328, 'steps': 1326, 'loss/train': 4.575386047363281} -09/20/2021 19:05:06 - INFO - __main__ - Step 21230: {'lr': 0.00019993250783052104, 'samples': 679360, 'steps': 1326, 'loss/train': 4.646839141845703} -09/20/2021 19:05:07 - INFO - __main__ - Step 21231: {'lr': 0.00019993250783052104, 'samples': 679392, 'steps': 1326, 'loss/train': 3.504798173904419} -09/20/2021 19:05:08 - INFO - __main__ - Step 21232: {'lr': 0.00019993250783052104, 'samples': 679424, 'steps': 1326, 'loss/train': 3.3552052974700928} -09/20/2021 19:05:08 - INFO - __main__ - Step 21233: {'lr': 0.00019993227330576265, 'samples': 679456, 'steps': 1327, 'loss/train': 3.2898552417755127} -09/20/2021 19:05:09 - INFO - __main__ - Step 21234: {'lr': 0.00019993227330576265, 'samples': 679488, 'steps': 1327, 'loss/train': 4.1476240158081055} -09/20/2021 19:05:10 - INFO - __main__ - Step 21235: {'lr': 0.00019993227330576265, 'samples': 679520, 'steps': 1327, 'loss/train': 3.0598227977752686} -09/20/2021 19:05:11 - INFO - __main__ - Step 21236: {'lr': 0.00019993227330576265, 'samples': 679552, 'steps': 1327, 'loss/train': 3.760946273803711} -09/20/2021 19:05:11 - INFO - __main__ - Step 21237: {'lr': 0.00019993227330576265, 'samples': 679584, 'steps': 1327, 'loss/train': 4.233923435211182} -09/20/2021 19:05:12 - INFO - __main__ - Step 21238: {'lr': 0.00019993227330576265, 'samples': 679616, 'steps': 1327, 'loss/train': 3.8600687980651855} -09/20/2021 19:05:13 - INFO - __main__ - Step 21239: {'lr': 0.00019993227330576265, 'samples': 679648, 'steps': 1327, 'loss/train': 2.5037150382995605} -09/20/2021 19:05:14 - INFO - __main__ - Step 21240: {'lr': 0.00019993227330576265, 'samples': 679680, 'steps': 1327, 'loss/train': 2.9619834423065186} -09/20/2021 19:05:15 - INFO - __main__ - Step 21241: {'lr': 0.00019993227330576265, 'samples': 679712, 'steps': 1327, 'loss/train': 3.3767969608306885} -09/20/2021 19:05:16 - INFO - __main__ - Step 21242: {'lr': 0.00019993227330576265, 'samples': 679744, 'steps': 1327, 'loss/train': 3.772284984588623} -09/20/2021 19:05:16 - INFO - __main__ - Step 21243: {'lr': 0.00019993227330576265, 'samples': 679776, 'steps': 1327, 'loss/train': 2.7380638122558594} -09/20/2021 19:05:17 - INFO - __main__ - Step 21244: {'lr': 0.00019993227330576265, 'samples': 679808, 'steps': 1327, 'loss/train': 2.2342872619628906} -09/20/2021 19:05:18 - INFO - __main__ - Step 21245: {'lr': 0.00019993227330576265, 'samples': 679840, 'steps': 1327, 'loss/train': 3.1542298793792725} -09/20/2021 19:05:19 - INFO - __main__ - Step 21246: {'lr': 0.00019993227330576265, 'samples': 679872, 'steps': 1327, 'loss/train': 3.112305164337158} -09/20/2021 19:05:19 - INFO - __main__ - Step 21247: {'lr': 0.00019993227330576265, 'samples': 679904, 'steps': 1327, 'loss/train': 2.8715157508850098} -09/20/2021 19:05:20 - INFO - __main__ - Step 21248: {'lr': 0.00019993227330576265, 'samples': 679936, 'steps': 1327, 'loss/train': 2.770610809326172} -09/20/2021 19:05:21 - INFO - __main__ - Step 21249: {'lr': 0.00019993203837438022, 'samples': 679968, 'steps': 1328, 'loss/train': 3.779066801071167} -09/20/2021 19:05:22 - INFO - __main__ - Step 21250: {'lr': 0.00019993203837438022, 'samples': 680000, 'steps': 1328, 'loss/train': 3.670293092727661} -09/20/2021 19:05:23 - INFO - __main__ - Step 21251: {'lr': 0.00019993203837438022, 'samples': 680032, 'steps': 1328, 'loss/train': 2.6029515266418457} -09/20/2021 19:05:23 - INFO - __main__ - Step 21252: {'lr': 0.00019993203837438022, 'samples': 680064, 'steps': 1328, 'loss/train': 2.152627468109131} -09/20/2021 19:05:24 - INFO - __main__ - Step 21253: {'lr': 0.00019993203837438022, 'samples': 680096, 'steps': 1328, 'loss/train': 3.160698890686035} -09/20/2021 19:05:25 - INFO - __main__ - Step 21254: {'lr': 0.00019993203837438022, 'samples': 680128, 'steps': 1328, 'loss/train': 4.103656768798828} -09/20/2021 19:05:26 - INFO - __main__ - Step 21255: {'lr': 0.00019993203837438022, 'samples': 680160, 'steps': 1328, 'loss/train': 3.4244070053100586} -09/20/2021 19:05:26 - INFO - __main__ - Step 21256: {'lr': 0.00019993203837438022, 'samples': 680192, 'steps': 1328, 'loss/train': 3.0238046646118164} -09/20/2021 19:05:27 - INFO - __main__ - Step 21257: {'lr': 0.00019993203837438022, 'samples': 680224, 'steps': 1328, 'loss/train': 2.5776207447052} -09/20/2021 19:05:28 - INFO - __main__ - Step 21258: {'lr': 0.00019993203837438022, 'samples': 680256, 'steps': 1328, 'loss/train': 0.8845654129981995} -09/20/2021 19:05:29 - INFO - __main__ - Step 21259: {'lr': 0.00019993203837438022, 'samples': 680288, 'steps': 1328, 'loss/train': 3.3669824600219727} -09/20/2021 19:05:29 - INFO - __main__ - Step 21260: {'lr': 0.00019993203837438022, 'samples': 680320, 'steps': 1328, 'loss/train': 2.8108530044555664} -09/20/2021 19:05:30 - INFO - __main__ - Step 21261: {'lr': 0.00019993203837438022, 'samples': 680352, 'steps': 1328, 'loss/train': 3.17246675491333} -09/20/2021 19:05:31 - INFO - __main__ - Step 21262: {'lr': 0.00019993203837438022, 'samples': 680384, 'steps': 1328, 'loss/train': 3.461512804031372} -09/20/2021 19:05:32 - INFO - __main__ - Step 21263: {'lr': 0.00019993203837438022, 'samples': 680416, 'steps': 1328, 'loss/train': 3.838064432144165} -09/20/2021 19:05:32 - INFO - __main__ - Step 21264: {'lr': 0.00019993203837438022, 'samples': 680448, 'steps': 1328, 'loss/train': 1.167370080947876} -09/20/2021 19:05:33 - INFO - __main__ - Step 21265: {'lr': 0.00019993180303637474, 'samples': 680480, 'steps': 1329, 'loss/train': 3.4284555912017822} -09/20/2021 19:05:34 - INFO - __main__ - Step 21266: {'lr': 0.00019993180303637474, 'samples': 680512, 'steps': 1329, 'loss/train': 3.7398831844329834} -09/20/2021 19:05:35 - INFO - __main__ - Step 21267: {'lr': 0.00019993180303637474, 'samples': 680544, 'steps': 1329, 'loss/train': 3.865259885787964} -09/20/2021 19:05:36 - INFO - __main__ - Step 21268: {'lr': 0.00019993180303637474, 'samples': 680576, 'steps': 1329, 'loss/train': 4.323779582977295} -09/20/2021 19:05:37 - INFO - __main__ - Step 21269: {'lr': 0.00019993180303637474, 'samples': 680608, 'steps': 1329, 'loss/train': 4.012362957000732} -09/20/2021 19:05:38 - INFO - __main__ - Step 21270: {'lr': 0.00019993180303637474, 'samples': 680640, 'steps': 1329, 'loss/train': 3.4522488117218018} -09/20/2021 19:05:38 - INFO - __main__ - Step 21271: {'lr': 0.00019993180303637474, 'samples': 680672, 'steps': 1329, 'loss/train': 2.3506040573120117} -09/20/2021 19:05:39 - INFO - __main__ - Step 21272: {'lr': 0.00019993180303637474, 'samples': 680704, 'steps': 1329, 'loss/train': 2.5851709842681885} -09/20/2021 19:05:40 - INFO - __main__ - Step 21273: {'lr': 0.00019993180303637474, 'samples': 680736, 'steps': 1329, 'loss/train': 2.0988142490386963} -09/20/2021 19:05:41 - INFO - __main__ - Step 21274: {'lr': 0.00019993180303637474, 'samples': 680768, 'steps': 1329, 'loss/train': 3.1459946632385254} -09/20/2021 19:05:41 - INFO - __main__ - Step 21275: {'lr': 0.00019993180303637474, 'samples': 680800, 'steps': 1329, 'loss/train': 3.072115421295166} -09/20/2021 19:05:42 - INFO - __main__ - Step 21276: {'lr': 0.00019993180303637474, 'samples': 680832, 'steps': 1329, 'loss/train': 2.9231820106506348} -09/20/2021 19:05:43 - INFO - __main__ - Step 21277: {'lr': 0.00019993180303637474, 'samples': 680864, 'steps': 1329, 'loss/train': 4.499547004699707} -09/20/2021 19:05:44 - INFO - __main__ - Step 21278: {'lr': 0.00019993180303637474, 'samples': 680896, 'steps': 1329, 'loss/train': 3.487185001373291} -09/20/2021 19:05:44 - INFO - __main__ - Step 21279: {'lr': 0.00019993180303637474, 'samples': 680928, 'steps': 1329, 'loss/train': 3.636582136154175} -09/20/2021 19:05:45 - INFO - __main__ - Step 21280: {'lr': 0.00019993180303637474, 'samples': 680960, 'steps': 1329, 'loss/train': 4.258825778961182} -09/20/2021 19:05:46 - INFO - __main__ - Step 21281: {'lr': 0.0001999315672917471, 'samples': 680992, 'steps': 1330, 'loss/train': 0.5223383903503418} -09/20/2021 19:05:47 - INFO - __main__ - Step 21282: {'lr': 0.0001999315672917471, 'samples': 681024, 'steps': 1330, 'loss/train': 0.8229176998138428} -09/20/2021 19:05:47 - INFO - __main__ - Step 21283: {'lr': 0.0001999315672917471, 'samples': 681056, 'steps': 1330, 'loss/train': 3.8709826469421387} -09/20/2021 19:05:48 - INFO - __main__ - Step 21284: {'lr': 0.0001999315672917471, 'samples': 681088, 'steps': 1330, 'loss/train': 3.7121994495391846} -09/20/2021 19:05:49 - INFO - __main__ - Step 21285: {'lr': 0.0001999315672917471, 'samples': 681120, 'steps': 1330, 'loss/train': 2.843543291091919} -09/20/2021 19:05:50 - INFO - __main__ - Step 21286: {'lr': 0.0001999315672917471, 'samples': 681152, 'steps': 1330, 'loss/train': 2.21429181098938} -09/20/2021 19:05:50 - INFO - __main__ - Step 21287: {'lr': 0.0001999315672917471, 'samples': 681184, 'steps': 1330, 'loss/train': 0.9165077805519104} -09/20/2021 19:05:51 - INFO - __main__ - Step 21288: {'lr': 0.0001999315672917471, 'samples': 681216, 'steps': 1330, 'loss/train': 3.002760887145996} -09/20/2021 19:05:52 - INFO - __main__ - Step 21289: {'lr': 0.0001999315672917471, 'samples': 681248, 'steps': 1330, 'loss/train': 3.2234363555908203} -09/20/2021 19:05:53 - INFO - __main__ - Step 21290: {'lr': 0.0001999315672917471, 'samples': 681280, 'steps': 1330, 'loss/train': 2.9594485759735107} -09/20/2021 19:05:53 - INFO - __main__ - Step 21291: {'lr': 0.0001999315672917471, 'samples': 681312, 'steps': 1330, 'loss/train': 3.825589656829834} -09/20/2021 19:05:54 - INFO - __main__ - Step 21292: {'lr': 0.0001999315672917471, 'samples': 681344, 'steps': 1330, 'loss/train': 3.2268922328948975} -09/20/2021 19:05:55 - INFO - __main__ - Step 21293: {'lr': 0.0001999315672917471, 'samples': 681376, 'steps': 1330, 'loss/train': 4.996092796325684} -09/20/2021 19:05:56 - INFO - __main__ - Step 21294: {'lr': 0.0001999315672917471, 'samples': 681408, 'steps': 1330, 'loss/train': 2.9391415119171143} -09/20/2021 19:05:56 - INFO - __main__ - Step 21295: {'lr': 0.0001999315672917471, 'samples': 681440, 'steps': 1330, 'loss/train': 4.928879261016846} -09/20/2021 19:05:57 - INFO - __main__ - Step 21296: {'lr': 0.0001999315672917471, 'samples': 681472, 'steps': 1330, 'loss/train': 4.2656073570251465} -09/20/2021 19:05:58 - INFO - __main__ - Step 21297: {'lr': 0.0001999313311404983, 'samples': 681504, 'steps': 1331, 'loss/train': 3.3740055561065674} -09/20/2021 19:05:59 - INFO - __main__ - Step 21298: {'lr': 0.0001999313311404983, 'samples': 681536, 'steps': 1331, 'loss/train': 3.887789487838745} -09/20/2021 19:06:00 - INFO - __main__ - Step 21299: {'lr': 0.0001999313311404983, 'samples': 681568, 'steps': 1331, 'loss/train': 3.3729124069213867} -09/20/2021 19:06:01 - INFO - __main__ - Step 21300: {'lr': 0.0001999313311404983, 'samples': 681600, 'steps': 1331, 'loss/train': 2.6384973526000977} -09/20/2021 19:06:02 - INFO - __main__ - Step 21301: {'lr': 0.0001999313311404983, 'samples': 681632, 'steps': 1331, 'loss/train': 5.846560001373291} -09/20/2021 19:06:02 - INFO - __main__ - Step 21302: {'lr': 0.0001999313311404983, 'samples': 681664, 'steps': 1331, 'loss/train': 4.07410192489624} -09/20/2021 19:06:03 - INFO - __main__ - Step 21303: {'lr': 0.0001999313311404983, 'samples': 681696, 'steps': 1331, 'loss/train': 4.107045650482178} -09/20/2021 19:06:04 - INFO - __main__ - Step 21304: {'lr': 0.0001999313311404983, 'samples': 681728, 'steps': 1331, 'loss/train': 2.75291109085083} -09/20/2021 19:06:05 - INFO - __main__ - Step 21305: {'lr': 0.0001999313311404983, 'samples': 681760, 'steps': 1331, 'loss/train': 3.8637351989746094} -09/20/2021 19:06:05 - INFO - __main__ - Step 21306: {'lr': 0.0001999313311404983, 'samples': 681792, 'steps': 1331, 'loss/train': 3.9273622035980225} -09/20/2021 19:06:06 - INFO - __main__ - Step 21307: {'lr': 0.0001999313311404983, 'samples': 681824, 'steps': 1331, 'loss/train': 3.5367236137390137} -09/20/2021 19:06:07 - INFO - __main__ - Step 21308: {'lr': 0.0001999313311404983, 'samples': 681856, 'steps': 1331, 'loss/train': 3.5655264854431152} -09/20/2021 19:06:08 - INFO - __main__ - Step 21309: {'lr': 0.0001999313311404983, 'samples': 681888, 'steps': 1331, 'loss/train': 3.783776044845581} -09/20/2021 19:06:08 - INFO - __main__ - Step 21310: {'lr': 0.0001999313311404983, 'samples': 681920, 'steps': 1331, 'loss/train': 2.2597203254699707} -09/20/2021 19:06:09 - INFO - __main__ - Step 21311: {'lr': 0.0001999313311404983, 'samples': 681952, 'steps': 1331, 'loss/train': 2.9669973850250244} -09/20/2021 19:06:10 - INFO - __main__ - Step 21312: {'lr': 0.0001999313311404983, 'samples': 681984, 'steps': 1331, 'loss/train': 2.8644347190856934} -09/20/2021 19:06:11 - INFO - __main__ - Step 21313: {'lr': 0.00019993109458262933, 'samples': 682016, 'steps': 1332, 'loss/train': 2.2318310737609863} -09/20/2021 19:06:12 - INFO - __main__ - Step 21314: {'lr': 0.00019993109458262933, 'samples': 682048, 'steps': 1332, 'loss/train': 2.800283432006836} -09/20/2021 19:06:12 - INFO - __main__ - Step 21315: {'lr': 0.00019993109458262933, 'samples': 682080, 'steps': 1332, 'loss/train': 3.8294355869293213} -09/20/2021 19:06:13 - INFO - __main__ - Step 21316: {'lr': 0.00019993109458262933, 'samples': 682112, 'steps': 1332, 'loss/train': 4.222604274749756} -09/20/2021 19:06:14 - INFO - __main__ - Step 21317: {'lr': 0.00019993109458262933, 'samples': 682144, 'steps': 1332, 'loss/train': 3.8879127502441406} -09/20/2021 19:06:15 - INFO - __main__ - Step 21318: {'lr': 0.00019993109458262933, 'samples': 682176, 'steps': 1332, 'loss/train': 2.911780595779419} -09/20/2021 19:06:15 - INFO - __main__ - Step 21319: {'lr': 0.00019993109458262933, 'samples': 682208, 'steps': 1332, 'loss/train': 3.8122498989105225} -09/20/2021 19:06:16 - INFO - __main__ - Step 21320: {'lr': 0.00019993109458262933, 'samples': 682240, 'steps': 1332, 'loss/train': 3.6234805583953857} -09/20/2021 19:06:17 - INFO - __main__ - Step 21321: {'lr': 0.00019993109458262933, 'samples': 682272, 'steps': 1332, 'loss/train': 3.3753719329833984} -09/20/2021 19:06:18 - INFO - __main__ - Step 21322: {'lr': 0.00019993109458262933, 'samples': 682304, 'steps': 1332, 'loss/train': 3.5734775066375732} -09/20/2021 19:06:18 - INFO - __main__ - Step 21323: {'lr': 0.00019993109458262933, 'samples': 682336, 'steps': 1332, 'loss/train': 3.34596586227417} -09/20/2021 19:06:19 - INFO - __main__ - Step 21324: {'lr': 0.00019993109458262933, 'samples': 682368, 'steps': 1332, 'loss/train': 3.7202296257019043} -09/20/2021 19:06:20 - INFO - __main__ - Step 21325: {'lr': 0.00019993109458262933, 'samples': 682400, 'steps': 1332, 'loss/train': 3.240471601486206} -09/20/2021 19:06:21 - INFO - __main__ - Step 21326: {'lr': 0.00019993109458262933, 'samples': 682432, 'steps': 1332, 'loss/train': 4.959635257720947} -09/20/2021 19:06:21 - INFO - __main__ - Step 21327: {'lr': 0.00019993109458262933, 'samples': 682464, 'steps': 1332, 'loss/train': 3.7966105937957764} -09/20/2021 19:06:22 - INFO - __main__ - Step 21328: {'lr': 0.00019993109458262933, 'samples': 682496, 'steps': 1332, 'loss/train': 3.7894890308380127} -09/20/2021 19:06:23 - INFO - __main__ - Step 21329: {'lr': 0.00019993085761814113, 'samples': 682528, 'steps': 1333, 'loss/train': 3.3380322456359863} -09/20/2021 19:06:24 - INFO - __main__ - Step 21330: {'lr': 0.00019993085761814113, 'samples': 682560, 'steps': 1333, 'loss/train': 3.132721185684204} -09/20/2021 19:06:26 - INFO - __main__ - Step 21331: {'lr': 0.00019993085761814113, 'samples': 682592, 'steps': 1333, 'loss/train': 4.161285877227783} -09/20/2021 19:06:26 - INFO - __main__ - Step 21332: {'lr': 0.00019993085761814113, 'samples': 682624, 'steps': 1333, 'loss/train': 2.505113124847412} -09/20/2021 19:06:27 - INFO - __main__ - Step 21333: {'lr': 0.00019993085761814113, 'samples': 682656, 'steps': 1333, 'loss/train': 2.967355728149414} -09/20/2021 19:06:28 - INFO - __main__ - Step 21334: {'lr': 0.00019993085761814113, 'samples': 682688, 'steps': 1333, 'loss/train': 3.1027402877807617} -09/20/2021 19:06:29 - INFO - __main__ - Step 21335: {'lr': 0.00019993085761814113, 'samples': 682720, 'steps': 1333, 'loss/train': 4.673326015472412} -09/20/2021 19:06:29 - INFO - __main__ - Step 21336: {'lr': 0.00019993085761814113, 'samples': 682752, 'steps': 1333, 'loss/train': 4.137633323669434} -09/20/2021 19:06:30 - INFO - __main__ - Step 21337: {'lr': 0.00019993085761814113, 'samples': 682784, 'steps': 1333, 'loss/train': 4.40457820892334} -09/20/2021 19:06:31 - INFO - __main__ - Step 21338: {'lr': 0.00019993085761814113, 'samples': 682816, 'steps': 1333, 'loss/train': 2.9026527404785156} -09/20/2021 19:06:32 - INFO - __main__ - Step 21339: {'lr': 0.00019993085761814113, 'samples': 682848, 'steps': 1333, 'loss/train': 4.22728967666626} -09/20/2021 19:06:32 - INFO - __main__ - Step 21340: {'lr': 0.00019993085761814113, 'samples': 682880, 'steps': 1333, 'loss/train': 1.92073392868042} -09/20/2021 19:06:33 - INFO - __main__ - Step 21341: {'lr': 0.00019993085761814113, 'samples': 682912, 'steps': 1333, 'loss/train': 1.885572910308838} -09/20/2021 19:06:34 - INFO - __main__ - Step 21342: {'lr': 0.00019993085761814113, 'samples': 682944, 'steps': 1333, 'loss/train': 2.064936637878418} -09/20/2021 19:06:35 - INFO - __main__ - Step 21343: {'lr': 0.00019993085761814113, 'samples': 682976, 'steps': 1333, 'loss/train': 2.020968198776245} -09/20/2021 19:06:35 - INFO - __main__ - Step 21344: {'lr': 0.00019993085761814113, 'samples': 683008, 'steps': 1333, 'loss/train': 2.223224639892578} -09/20/2021 19:06:36 - INFO - __main__ - Step 21345: {'lr': 0.0001999306202470346, 'samples': 683040, 'steps': 1334, 'loss/train': 1.711509108543396} -09/20/2021 19:06:37 - INFO - __main__ - Step 21346: {'lr': 0.0001999306202470346, 'samples': 683072, 'steps': 1334, 'loss/train': 1.9898061752319336} -09/20/2021 19:06:38 - INFO - __main__ - Step 21347: {'lr': 0.0001999306202470346, 'samples': 683104, 'steps': 1334, 'loss/train': 2.0986061096191406} -09/20/2021 19:06:39 - INFO - __main__ - Step 21348: {'lr': 0.0001999306202470346, 'samples': 683136, 'steps': 1334, 'loss/train': 2.6182076930999756} -09/20/2021 19:06:39 - INFO - __main__ - Step 21349: {'lr': 0.0001999306202470346, 'samples': 683168, 'steps': 1334, 'loss/train': 2.854741334915161} -09/20/2021 19:06:40 - INFO - __main__ - Step 21350: {'lr': 0.0001999306202470346, 'samples': 683200, 'steps': 1334, 'loss/train': 2.960071325302124} -09/20/2021 19:06:41 - INFO - __main__ - Step 21351: {'lr': 0.0001999306202470346, 'samples': 683232, 'steps': 1334, 'loss/train': 1.9688276052474976} -09/20/2021 19:06:42 - INFO - __main__ - Step 21352: {'lr': 0.0001999306202470346, 'samples': 683264, 'steps': 1334, 'loss/train': 0.5808749794960022} -09/20/2021 19:06:42 - INFO - __main__ - Step 21353: {'lr': 0.0001999306202470346, 'samples': 683296, 'steps': 1334, 'loss/train': 0.5305401086807251} -09/20/2021 19:06:43 - INFO - __main__ - Step 21354: {'lr': 0.0001999306202470346, 'samples': 683328, 'steps': 1334, 'loss/train': 1.239524006843567} -09/20/2021 19:06:44 - INFO - __main__ - Step 21355: {'lr': 0.0001999306202470346, 'samples': 683360, 'steps': 1334, 'loss/train': 3.0646631717681885} -09/20/2021 19:06:45 - INFO - __main__ - Step 21356: {'lr': 0.0001999306202470346, 'samples': 683392, 'steps': 1334, 'loss/train': 2.879620313644409} -09/20/2021 19:06:45 - INFO - __main__ - Step 21357: {'lr': 0.0001999306202470346, 'samples': 683424, 'steps': 1334, 'loss/train': 3.635985851287842} -09/20/2021 19:06:46 - INFO - __main__ - Step 21358: {'lr': 0.0001999306202470346, 'samples': 683456, 'steps': 1334, 'loss/train': 3.1381146907806396} -09/20/2021 19:06:47 - INFO - __main__ - Step 21359: {'lr': 0.0001999306202470346, 'samples': 683488, 'steps': 1334, 'loss/train': 3.4629626274108887} -09/20/2021 19:06:48 - INFO - __main__ - Step 21360: {'lr': 0.0001999306202470346, 'samples': 683520, 'steps': 1334, 'loss/train': 3.8500607013702393} -09/20/2021 19:06:49 - INFO - __main__ - Step 21361: {'lr': 0.00019993038246931085, 'samples': 683552, 'steps': 1335, 'loss/train': 3.3273813724517822} -09/20/2021 19:06:49 - INFO - __main__ - Step 21362: {'lr': 0.00019993038246931085, 'samples': 683584, 'steps': 1335, 'loss/train': 4.45551061630249} -09/20/2021 19:06:50 - INFO - __main__ - Step 21363: {'lr': 0.00019993038246931085, 'samples': 683616, 'steps': 1335, 'loss/train': 3.705195665359497} -09/20/2021 19:06:51 - INFO - __main__ - Step 21364: {'lr': 0.00019993038246931085, 'samples': 683648, 'steps': 1335, 'loss/train': 3.429267406463623} -09/20/2021 19:06:52 - INFO - __main__ - Step 21365: {'lr': 0.00019993038246931085, 'samples': 683680, 'steps': 1335, 'loss/train': 3.0491344928741455} -09/20/2021 19:06:52 - INFO - __main__ - Step 21366: {'lr': 0.00019993038246931085, 'samples': 683712, 'steps': 1335, 'loss/train': 3.050398826599121} -09/20/2021 19:06:54 - INFO - __main__ - Step 21367: {'lr': 0.00019993038246931085, 'samples': 683744, 'steps': 1335, 'loss/train': 2.7519683837890625} -09/20/2021 19:06:54 - INFO - __main__ - Step 21368: {'lr': 0.00019993038246931085, 'samples': 683776, 'steps': 1335, 'loss/train': 3.3505072593688965} -09/20/2021 19:06:55 - INFO - __main__ - Step 21369: {'lr': 0.00019993038246931085, 'samples': 683808, 'steps': 1335, 'loss/train': 3.2600691318511963} -09/20/2021 19:06:56 - INFO - __main__ - Step 21370: {'lr': 0.00019993038246931085, 'samples': 683840, 'steps': 1335, 'loss/train': 4.2560248374938965} -09/20/2021 19:06:57 - INFO - __main__ - Step 21371: {'lr': 0.00019993038246931085, 'samples': 683872, 'steps': 1335, 'loss/train': 3.240260124206543} -09/20/2021 19:06:57 - INFO - __main__ - Step 21372: {'lr': 0.00019993038246931085, 'samples': 683904, 'steps': 1335, 'loss/train': 2.8502132892608643} -09/20/2021 19:06:58 - INFO - __main__ - Step 21373: {'lr': 0.00019993038246931085, 'samples': 683936, 'steps': 1335, 'loss/train': 2.6064021587371826} -09/20/2021 19:06:59 - INFO - __main__ - Step 21374: {'lr': 0.00019993038246931085, 'samples': 683968, 'steps': 1335, 'loss/train': 4.117733001708984} -09/20/2021 19:07:00 - INFO - __main__ - Step 21375: {'lr': 0.00019993038246931085, 'samples': 684000, 'steps': 1335, 'loss/train': 3.2845797538757324} -09/20/2021 19:07:00 - INFO - __main__ - Step 21376: {'lr': 0.00019993038246931085, 'samples': 684032, 'steps': 1335, 'loss/train': 3.521243095397949} -09/20/2021 19:07:01 - INFO - __main__ - Step 21377: {'lr': 0.0001999301442849707, 'samples': 684064, 'steps': 1336, 'loss/train': 3.2554540634155273} -09/20/2021 19:07:02 - INFO - __main__ - Step 21378: {'lr': 0.0001999301442849707, 'samples': 684096, 'steps': 1336, 'loss/train': 3.2175400257110596} -09/20/2021 19:07:03 - INFO - __main__ - Step 21379: {'lr': 0.0001999301442849707, 'samples': 684128, 'steps': 1336, 'loss/train': 2.338823080062866} -09/20/2021 19:07:03 - INFO - __main__ - Step 21380: {'lr': 0.0001999301442849707, 'samples': 684160, 'steps': 1336, 'loss/train': 3.056755542755127} -09/20/2021 19:07:04 - INFO - __main__ - Step 21381: {'lr': 0.0001999301442849707, 'samples': 684192, 'steps': 1336, 'loss/train': 4.818580627441406} -09/20/2021 19:07:05 - INFO - __main__ - Step 21382: {'lr': 0.0001999301442849707, 'samples': 684224, 'steps': 1336, 'loss/train': 4.893104553222656} -09/20/2021 19:07:06 - INFO - __main__ - Step 21383: {'lr': 0.0001999301442849707, 'samples': 684256, 'steps': 1336, 'loss/train': 3.3822555541992188} -09/20/2021 19:07:06 - INFO - __main__ - Step 21384: {'lr': 0.0001999301442849707, 'samples': 684288, 'steps': 1336, 'loss/train': 3.5518345832824707} -09/20/2021 19:07:07 - INFO - __main__ - Step 21385: {'lr': 0.0001999301442849707, 'samples': 684320, 'steps': 1336, 'loss/train': 2.8136966228485107} -09/20/2021 19:07:08 - INFO - __main__ - Step 21386: {'lr': 0.0001999301442849707, 'samples': 684352, 'steps': 1336, 'loss/train': 3.146695137023926} -09/20/2021 19:07:09 - INFO - __main__ - Step 21387: {'lr': 0.0001999301442849707, 'samples': 684384, 'steps': 1336, 'loss/train': 4.261394023895264} -09/20/2021 19:07:09 - INFO - __main__ - Step 21388: {'lr': 0.0001999301442849707, 'samples': 684416, 'steps': 1336, 'loss/train': 3.1315765380859375} -09/20/2021 19:07:10 - INFO - __main__ - Step 21389: {'lr': 0.0001999301442849707, 'samples': 684448, 'steps': 1336, 'loss/train': 2.737112045288086} -09/20/2021 19:07:11 - INFO - __main__ - Step 21390: {'lr': 0.0001999301442849707, 'samples': 684480, 'steps': 1336, 'loss/train': 2.890336036682129} -09/20/2021 19:07:12 - INFO - __main__ - Step 21391: {'lr': 0.0001999301442849707, 'samples': 684512, 'steps': 1336, 'loss/train': 2.781629800796509} -09/20/2021 19:07:12 - INFO - __main__ - Step 21392: {'lr': 0.0001999301442849707, 'samples': 684544, 'steps': 1336, 'loss/train': 3.585033893585205} -09/20/2021 19:07:13 - INFO - __main__ - Step 21393: {'lr': 0.0001999299056940152, 'samples': 684576, 'steps': 1337, 'loss/train': 2.722241163253784} -09/20/2021 19:07:14 - INFO - __main__ - Step 21394: {'lr': 0.0001999299056940152, 'samples': 684608, 'steps': 1337, 'loss/train': 3.2114341259002686} -09/20/2021 19:07:15 - INFO - __main__ - Step 21395: {'lr': 0.0001999299056940152, 'samples': 684640, 'steps': 1337, 'loss/train': 3.340968608856201} -09/20/2021 19:07:16 - INFO - __main__ - Step 21396: {'lr': 0.0001999299056940152, 'samples': 684672, 'steps': 1337, 'loss/train': 3.7975709438323975} -09/20/2021 19:07:16 - INFO - __main__ - Step 21397: {'lr': 0.0001999299056940152, 'samples': 684704, 'steps': 1337, 'loss/train': 3.760877847671509} -09/20/2021 19:07:17 - INFO - __main__ - Step 21398: {'lr': 0.0001999299056940152, 'samples': 684736, 'steps': 1337, 'loss/train': 3.4806125164031982} -09/20/2021 19:07:18 - INFO - __main__ - Step 21399: {'lr': 0.0001999299056940152, 'samples': 684768, 'steps': 1337, 'loss/train': 4.5855512619018555} -09/20/2021 19:07:19 - INFO - __main__ - Step 21400: {'lr': 0.0001999299056940152, 'samples': 684800, 'steps': 1337, 'loss/train': 2.5200419425964355} -09/20/2021 19:07:20 - INFO - __main__ - Step 21401: {'lr': 0.0001999299056940152, 'samples': 684832, 'steps': 1337, 'loss/train': 3.3620541095733643} -09/20/2021 19:07:21 - INFO - __main__ - Step 21402: {'lr': 0.0001999299056940152, 'samples': 684864, 'steps': 1337, 'loss/train': 2.334798812866211} -09/20/2021 19:07:21 - INFO - __main__ - Step 21403: {'lr': 0.0001999299056940152, 'samples': 684896, 'steps': 1337, 'loss/train': 3.8978569507598877} -09/20/2021 19:07:22 - INFO - __main__ - Step 21404: {'lr': 0.0001999299056940152, 'samples': 684928, 'steps': 1337, 'loss/train': 3.7677180767059326} -09/20/2021 19:07:23 - INFO - __main__ - Step 21405: {'lr': 0.0001999299056940152, 'samples': 684960, 'steps': 1337, 'loss/train': 3.2982633113861084} -09/20/2021 19:07:24 - INFO - __main__ - Step 21406: {'lr': 0.0001999299056940152, 'samples': 684992, 'steps': 1337, 'loss/train': 5.5030059814453125} -09/20/2021 19:07:24 - INFO - __main__ - Step 21407: {'lr': 0.0001999299056940152, 'samples': 685024, 'steps': 1337, 'loss/train': 3.907823085784912} -09/20/2021 19:07:25 - INFO - __main__ - Step 21408: {'lr': 0.0001999299056940152, 'samples': 685056, 'steps': 1337, 'loss/train': 3.0538642406463623} -09/20/2021 19:07:26 - INFO - __main__ - Step 21409: {'lr': 0.0001999296666964453, 'samples': 685088, 'steps': 1338, 'loss/train': 4.363847732543945} -09/20/2021 19:07:27 - INFO - __main__ - Step 21410: {'lr': 0.0001999296666964453, 'samples': 685120, 'steps': 1338, 'loss/train': 3.0808305740356445} -09/20/2021 19:07:27 - INFO - __main__ - Step 21411: {'lr': 0.0001999296666964453, 'samples': 685152, 'steps': 1338, 'loss/train': 4.029137134552002} -09/20/2021 19:07:28 - INFO - __main__ - Step 21412: {'lr': 0.0001999296666964453, 'samples': 685184, 'steps': 1338, 'loss/train': 3.9621543884277344} -09/20/2021 19:07:29 - INFO - __main__ - Step 21413: {'lr': 0.0001999296666964453, 'samples': 685216, 'steps': 1338, 'loss/train': 3.2679672241210938} -09/20/2021 19:07:30 - INFO - __main__ - Step 21414: {'lr': 0.0001999296666964453, 'samples': 685248, 'steps': 1338, 'loss/train': 3.8087174892425537} -09/20/2021 19:07:30 - INFO - __main__ - Step 21415: {'lr': 0.0001999296666964453, 'samples': 685280, 'steps': 1338, 'loss/train': 1.0641746520996094} -09/20/2021 19:07:31 - INFO - __main__ - Step 21416: {'lr': 0.0001999296666964453, 'samples': 685312, 'steps': 1338, 'loss/train': 2.2033276557922363} -09/20/2021 19:07:32 - INFO - __main__ - Step 21417: {'lr': 0.0001999296666964453, 'samples': 685344, 'steps': 1338, 'loss/train': 2.7079989910125732} -09/20/2021 19:07:33 - INFO - __main__ - Step 21418: {'lr': 0.0001999296666964453, 'samples': 685376, 'steps': 1338, 'loss/train': 3.0361409187316895} -09/20/2021 19:07:33 - INFO - __main__ - Step 21419: {'lr': 0.0001999296666964453, 'samples': 685408, 'steps': 1338, 'loss/train': 3.132190227508545} -09/20/2021 19:07:34 - INFO - __main__ - Step 21420: {'lr': 0.0001999296666964453, 'samples': 685440, 'steps': 1338, 'loss/train': 4.071926593780518} -09/20/2021 19:07:35 - INFO - __main__ - Step 21421: {'lr': 0.0001999296666964453, 'samples': 685472, 'steps': 1338, 'loss/train': 3.2071924209594727} -09/20/2021 19:07:36 - INFO - __main__ - Step 21422: {'lr': 0.0001999296666964453, 'samples': 685504, 'steps': 1338, 'loss/train': 3.631669521331787} -09/20/2021 19:07:36 - INFO - __main__ - Step 21423: {'lr': 0.0001999296666964453, 'samples': 685536, 'steps': 1338, 'loss/train': 3.8089241981506348} -09/20/2021 19:07:37 - INFO - __main__ - Step 21424: {'lr': 0.0001999296666964453, 'samples': 685568, 'steps': 1338, 'loss/train': 2.880645275115967} -09/20/2021 19:07:38 - INFO - __main__ - Step 21425: {'lr': 0.00019992942729226196, 'samples': 685600, 'steps': 1339, 'loss/train': 3.0801539421081543} -09/20/2021 19:07:39 - INFO - __main__ - Step 21426: {'lr': 0.00019992942729226196, 'samples': 685632, 'steps': 1339, 'loss/train': 3.5577070713043213} -09/20/2021 19:07:40 - INFO - __main__ - Step 21427: {'lr': 0.00019992942729226196, 'samples': 685664, 'steps': 1339, 'loss/train': 0.8863733410835266} -09/20/2021 19:07:40 - INFO - __main__ - Step 21428: {'lr': 0.00019992942729226196, 'samples': 685696, 'steps': 1339, 'loss/train': 3.5292980670928955} -09/20/2021 19:07:42 - INFO - __main__ - Step 21429: {'lr': 0.00019992942729226196, 'samples': 685728, 'steps': 1339, 'loss/train': 2.9011874198913574} -09/20/2021 19:07:42 - INFO - __main__ - Step 21430: {'lr': 0.00019992942729226196, 'samples': 685760, 'steps': 1339, 'loss/train': 2.4751906394958496} -09/20/2021 19:07:43 - INFO - __main__ - Step 21431: {'lr': 0.00019992942729226196, 'samples': 685792, 'steps': 1339, 'loss/train': 3.7272727489471436} -09/20/2021 19:07:44 - INFO - __main__ - Step 21432: {'lr': 0.00019992942729226196, 'samples': 685824, 'steps': 1339, 'loss/train': 3.337181568145752} -09/20/2021 19:07:45 - INFO - __main__ - Step 21433: {'lr': 0.00019992942729226196, 'samples': 685856, 'steps': 1339, 'loss/train': 2.7252275943756104} -09/20/2021 19:07:45 - INFO - __main__ - Step 21434: {'lr': 0.00019992942729226196, 'samples': 685888, 'steps': 1339, 'loss/train': 3.2386112213134766} -09/20/2021 19:07:46 - INFO - __main__ - Step 21435: {'lr': 0.00019992942729226196, 'samples': 685920, 'steps': 1339, 'loss/train': 2.288407325744629} -09/20/2021 19:07:47 - INFO - __main__ - Step 21436: {'lr': 0.00019992942729226196, 'samples': 685952, 'steps': 1339, 'loss/train': 3.181704044342041} -09/20/2021 19:07:48 - INFO - __main__ - Step 21437: {'lr': 0.00019992942729226196, 'samples': 685984, 'steps': 1339, 'loss/train': 2.590592861175537} -09/20/2021 19:07:48 - INFO - __main__ - Step 21438: {'lr': 0.00019992942729226196, 'samples': 686016, 'steps': 1339, 'loss/train': 1.6075483560562134} -09/20/2021 19:07:49 - INFO - __main__ - Step 21439: {'lr': 0.00019992942729226196, 'samples': 686048, 'steps': 1339, 'loss/train': 3.6171138286590576} -09/20/2021 19:07:50 - INFO - __main__ - Step 21440: {'lr': 0.00019992942729226196, 'samples': 686080, 'steps': 1339, 'loss/train': 2.907888412475586} -09/20/2021 19:07:51 - INFO - __main__ - Step 21441: {'lr': 0.00019992918748146617, 'samples': 686112, 'steps': 1340, 'loss/train': 2.6597797870635986} -09/20/2021 19:07:52 - INFO - __main__ - Step 21442: {'lr': 0.00019992918748146617, 'samples': 686144, 'steps': 1340, 'loss/train': 2.6277904510498047} -09/20/2021 19:07:52 - INFO - __main__ - Step 21443: {'lr': 0.00019992918748146617, 'samples': 686176, 'steps': 1340, 'loss/train': 2.9035940170288086} -09/20/2021 19:07:53 - INFO - __main__ - Step 21444: {'lr': 0.00019992918748146617, 'samples': 686208, 'steps': 1340, 'loss/train': 3.4158122539520264} -09/20/2021 19:07:54 - INFO - __main__ - Step 21445: {'lr': 0.00019992918748146617, 'samples': 686240, 'steps': 1340, 'loss/train': 2.35017728805542} -09/20/2021 19:07:55 - INFO - __main__ - Step 21446: {'lr': 0.00019992918748146617, 'samples': 686272, 'steps': 1340, 'loss/train': 2.5720157623291016} -09/20/2021 19:07:55 - INFO - __main__ - Step 21447: {'lr': 0.00019992918748146617, 'samples': 686304, 'steps': 1340, 'loss/train': 2.579817056655884} -09/20/2021 19:07:56 - INFO - __main__ - Step 21448: {'lr': 0.00019992918748146617, 'samples': 686336, 'steps': 1340, 'loss/train': 3.2167210578918457} -09/20/2021 19:07:57 - INFO - __main__ - Step 21449: {'lr': 0.00019992918748146617, 'samples': 686368, 'steps': 1340, 'loss/train': 3.49249267578125} -09/20/2021 19:07:58 - INFO - __main__ - Step 21450: {'lr': 0.00019992918748146617, 'samples': 686400, 'steps': 1340, 'loss/train': 3.517771005630493} -09/20/2021 19:07:58 - INFO - __main__ - Step 21451: {'lr': 0.00019992918748146617, 'samples': 686432, 'steps': 1340, 'loss/train': 0.7920821905136108} -09/20/2021 19:07:59 - INFO - __main__ - Step 21452: {'lr': 0.00019992918748146617, 'samples': 686464, 'steps': 1340, 'loss/train': 2.920924663543701} -09/20/2021 19:08:00 - INFO - __main__ - Step 21453: {'lr': 0.00019992918748146617, 'samples': 686496, 'steps': 1340, 'loss/train': 2.7202396392822266} -09/20/2021 19:08:01 - INFO - __main__ - Step 21454: {'lr': 0.00019992918748146617, 'samples': 686528, 'steps': 1340, 'loss/train': 4.631652355194092} -09/20/2021 19:08:01 - INFO - __main__ - Step 21455: {'lr': 0.00019992918748146617, 'samples': 686560, 'steps': 1340, 'loss/train': 3.089402198791504} -09/20/2021 19:08:02 - INFO - __main__ - Step 21456: {'lr': 0.00019992918748146617, 'samples': 686592, 'steps': 1340, 'loss/train': 3.520089864730835} -09/20/2021 19:08:03 - INFO - __main__ - Step 21457: {'lr': 0.00019992894726405893, 'samples': 686624, 'steps': 1341, 'loss/train': 4.004059314727783} -09/20/2021 19:08:04 - INFO - __main__ - Step 21458: {'lr': 0.00019992894726405893, 'samples': 686656, 'steps': 1341, 'loss/train': 3.629202127456665} -09/20/2021 19:08:04 - INFO - __main__ - Step 21459: {'lr': 0.00019992894726405893, 'samples': 686688, 'steps': 1341, 'loss/train': 3.505368709564209} -09/20/2021 19:08:06 - INFO - __main__ - Step 21460: {'lr': 0.00019992894726405893, 'samples': 686720, 'steps': 1341, 'loss/train': 3.242910623550415} -09/20/2021 19:08:06 - INFO - __main__ - Step 21461: {'lr': 0.00019992894726405893, 'samples': 686752, 'steps': 1341, 'loss/train': 2.9933183193206787} -09/20/2021 19:08:07 - INFO - __main__ - Step 21462: {'lr': 0.00019992894726405893, 'samples': 686784, 'steps': 1341, 'loss/train': 3.3912596702575684} -09/20/2021 19:08:08 - INFO - __main__ - Step 21463: {'lr': 0.00019992894726405893, 'samples': 686816, 'steps': 1341, 'loss/train': 1.4944077730178833} -09/20/2021 19:08:09 - INFO - __main__ - Step 21464: {'lr': 0.00019992894726405893, 'samples': 686848, 'steps': 1341, 'loss/train': 3.685537099838257} -09/20/2021 19:08:09 - INFO - __main__ - Step 21465: {'lr': 0.00019992894726405893, 'samples': 686880, 'steps': 1341, 'loss/train': 3.3722116947174072} -09/20/2021 19:08:10 - INFO - __main__ - Step 21466: {'lr': 0.00019992894726405893, 'samples': 686912, 'steps': 1341, 'loss/train': 4.247533798217773} -09/20/2021 19:08:11 - INFO - __main__ - Step 21467: {'lr': 0.00019992894726405893, 'samples': 686944, 'steps': 1341, 'loss/train': 3.0841057300567627} -09/20/2021 19:08:12 - INFO - __main__ - Step 21468: {'lr': 0.00019992894726405893, 'samples': 686976, 'steps': 1341, 'loss/train': 3.252521276473999} -09/20/2021 19:08:12 - INFO - __main__ - Step 21469: {'lr': 0.00019992894726405893, 'samples': 687008, 'steps': 1341, 'loss/train': 2.6034963130950928} -09/20/2021 19:08:13 - INFO - __main__ - Step 21470: {'lr': 0.00019992894726405893, 'samples': 687040, 'steps': 1341, 'loss/train': 2.7153661251068115} -09/20/2021 19:08:14 - INFO - __main__ - Step 21471: {'lr': 0.00019992894726405893, 'samples': 687072, 'steps': 1341, 'loss/train': 3.3394973278045654} -09/20/2021 19:08:15 - INFO - __main__ - Step 21472: {'lr': 0.00019992894726405893, 'samples': 687104, 'steps': 1341, 'loss/train': 3.810521364212036} -09/20/2021 19:08:16 - INFO - __main__ - Step 21473: {'lr': 0.00019992870664004117, 'samples': 687136, 'steps': 1342, 'loss/train': 2.0937812328338623} -09/20/2021 19:08:16 - INFO - __main__ - Step 21474: {'lr': 0.00019992870664004117, 'samples': 687168, 'steps': 1342, 'loss/train': 4.034658908843994} -09/20/2021 19:08:17 - INFO - __main__ - Step 21475: {'lr': 0.00019992870664004117, 'samples': 687200, 'steps': 1342, 'loss/train': 4.0320143699646} -09/20/2021 19:08:18 - INFO - __main__ - Step 21476: {'lr': 0.00019992870664004117, 'samples': 687232, 'steps': 1342, 'loss/train': 3.4996531009674072} -09/20/2021 19:08:19 - INFO - __main__ - Step 21477: {'lr': 0.00019992870664004117, 'samples': 687264, 'steps': 1342, 'loss/train': 3.3093254566192627} -09/20/2021 19:08:19 - INFO - __main__ - Step 21478: {'lr': 0.00019992870664004117, 'samples': 687296, 'steps': 1342, 'loss/train': 2.2267048358917236} -09/20/2021 19:08:20 - INFO - __main__ - Step 21479: {'lr': 0.00019992870664004117, 'samples': 687328, 'steps': 1342, 'loss/train': 0.36877718567848206} -09/20/2021 19:08:21 - INFO - __main__ - Step 21480: {'lr': 0.00019992870664004117, 'samples': 687360, 'steps': 1342, 'loss/train': 2.4884612560272217} -09/20/2021 19:08:22 - INFO - __main__ - Step 21481: {'lr': 0.00019992870664004117, 'samples': 687392, 'steps': 1342, 'loss/train': 3.3193628787994385} -09/20/2021 19:08:22 - INFO - __main__ - Step 21482: {'lr': 0.00019992870664004117, 'samples': 687424, 'steps': 1342, 'loss/train': 2.870732307434082} -09/20/2021 19:08:23 - INFO - __main__ - Step 21483: {'lr': 0.00019992870664004117, 'samples': 687456, 'steps': 1342, 'loss/train': 4.1195173263549805} -09/20/2021 19:08:24 - INFO - __main__ - Step 21484: {'lr': 0.00019992870664004117, 'samples': 687488, 'steps': 1342, 'loss/train': 3.1207962036132812} -09/20/2021 19:08:25 - INFO - __main__ - Step 21485: {'lr': 0.00019992870664004117, 'samples': 687520, 'steps': 1342, 'loss/train': 3.511612892150879} -09/20/2021 19:08:25 - INFO - __main__ - Step 21486: {'lr': 0.00019992870664004117, 'samples': 687552, 'steps': 1342, 'loss/train': 3.6081700325012207} -09/20/2021 19:08:26 - INFO - __main__ - Step 21487: {'lr': 0.00019992870664004117, 'samples': 687584, 'steps': 1342, 'loss/train': 4.033386707305908} -09/20/2021 19:08:27 - INFO - __main__ - Step 21488: {'lr': 0.00019992870664004117, 'samples': 687616, 'steps': 1342, 'loss/train': 3.2768290042877197} -09/20/2021 19:08:28 - INFO - __main__ - Step 21489: {'lr': 0.00019992846560941389, 'samples': 687648, 'steps': 1343, 'loss/train': 3.71401047706604} -09/20/2021 19:08:28 - INFO - __main__ - Step 21490: {'lr': 0.00019992846560941389, 'samples': 687680, 'steps': 1343, 'loss/train': 3.0000598430633545} -09/20/2021 19:08:30 - INFO - __main__ - Step 21491: {'lr': 0.00019992846560941389, 'samples': 687712, 'steps': 1343, 'loss/train': 3.3723230361938477} -09/20/2021 19:08:31 - INFO - __main__ - Step 21492: {'lr': 0.00019992846560941389, 'samples': 687744, 'steps': 1343, 'loss/train': 2.7147443294525146} -09/20/2021 19:08:31 - INFO - __main__ - Step 21493: {'lr': 0.00019992846560941389, 'samples': 687776, 'steps': 1343, 'loss/train': 3.1676371097564697} -09/20/2021 19:08:32 - INFO - __main__ - Step 21494: {'lr': 0.00019992846560941389, 'samples': 687808, 'steps': 1343, 'loss/train': 3.3768463134765625} -09/20/2021 19:08:33 - INFO - __main__ - Step 21495: {'lr': 0.00019992846560941389, 'samples': 687840, 'steps': 1343, 'loss/train': 0.577596127986908} -09/20/2021 19:08:34 - INFO - __main__ - Step 21496: {'lr': 0.00019992846560941389, 'samples': 687872, 'steps': 1343, 'loss/train': 2.9107954502105713} -09/20/2021 19:08:34 - INFO - __main__ - Step 21497: {'lr': 0.00019992846560941389, 'samples': 687904, 'steps': 1343, 'loss/train': 3.136070728302002} -09/20/2021 19:08:35 - INFO - __main__ - Step 21498: {'lr': 0.00019992846560941389, 'samples': 687936, 'steps': 1343, 'loss/train': 3.2817134857177734} -09/20/2021 19:08:36 - INFO - __main__ - Step 21499: {'lr': 0.00019992846560941389, 'samples': 687968, 'steps': 1343, 'loss/train': 2.370856523513794} -09/20/2021 19:08:37 - INFO - __main__ - Step 21500: {'lr': 0.00019992846560941389, 'samples': 688000, 'steps': 1343, 'loss/train': 3.3197970390319824} -09/20/2021 19:08:37 - INFO - __main__ - Step 21501: {'lr': 0.00019992846560941389, 'samples': 688032, 'steps': 1343, 'loss/train': 2.6635406017303467} -09/20/2021 19:08:38 - INFO - __main__ - Step 21502: {'lr': 0.00019992846560941389, 'samples': 688064, 'steps': 1343, 'loss/train': 3.5840134620666504} -09/20/2021 19:08:39 - INFO - __main__ - Step 21503: {'lr': 0.00019992846560941389, 'samples': 688096, 'steps': 1343, 'loss/train': 3.000671625137329} -09/20/2021 19:08:40 - INFO - __main__ - Step 21504: {'lr': 0.00019992846560941389, 'samples': 688128, 'steps': 1343, 'loss/train': 1.9843027591705322} -09/20/2021 19:08:40 - INFO - __main__ - Step 21505: {'lr': 0.0001999282241721781, 'samples': 688160, 'steps': 1344, 'loss/train': 3.757408857345581} -09/20/2021 19:08:41 - INFO - __main__ - Step 21506: {'lr': 0.0001999282241721781, 'samples': 688192, 'steps': 1344, 'loss/train': 4.024185657501221} -09/20/2021 19:08:42 - INFO - __main__ - Step 21507: {'lr': 0.0001999282241721781, 'samples': 688224, 'steps': 1344, 'loss/train': 2.8651583194732666} -09/20/2021 19:08:43 - INFO - __main__ - Step 21508: {'lr': 0.0001999282241721781, 'samples': 688256, 'steps': 1344, 'loss/train': 3.0320444107055664} -09/20/2021 19:08:43 - INFO - __main__ - Step 21509: {'lr': 0.0001999282241721781, 'samples': 688288, 'steps': 1344, 'loss/train': 0.8580935597419739} -09/20/2021 19:08:44 - INFO - __main__ - Step 21510: {'lr': 0.0001999282241721781, 'samples': 688320, 'steps': 1344, 'loss/train': 2.8278162479400635} -09/20/2021 19:08:45 - INFO - __main__ - Step 21511: {'lr': 0.0001999282241721781, 'samples': 688352, 'steps': 1344, 'loss/train': 3.64522123336792} -09/20/2021 19:08:46 - INFO - __main__ - Step 21512: {'lr': 0.0001999282241721781, 'samples': 688384, 'steps': 1344, 'loss/train': 0.5840440988540649} -09/20/2021 19:08:46 - INFO - __main__ - Step 21513: {'lr': 0.0001999282241721781, 'samples': 688416, 'steps': 1344, 'loss/train': 2.6684701442718506} -09/20/2021 19:08:47 - INFO - __main__ - Step 21514: {'lr': 0.0001999282241721781, 'samples': 688448, 'steps': 1344, 'loss/train': 3.388284206390381} -09/20/2021 19:08:48 - INFO - __main__ - Step 21515: {'lr': 0.0001999282241721781, 'samples': 688480, 'steps': 1344, 'loss/train': 3.7552056312561035} -09/20/2021 19:08:49 - INFO - __main__ - Step 21516: {'lr': 0.0001999282241721781, 'samples': 688512, 'steps': 1344, 'loss/train': 4.306443214416504} -09/20/2021 19:08:49 - INFO - __main__ - Step 21517: {'lr': 0.0001999282241721781, 'samples': 688544, 'steps': 1344, 'loss/train': 3.7135870456695557} -09/20/2021 19:08:50 - INFO - __main__ - Step 21518: {'lr': 0.0001999282241721781, 'samples': 688576, 'steps': 1344, 'loss/train': 2.8188509941101074} -09/20/2021 19:08:51 - INFO - __main__ - Step 21519: {'lr': 0.0001999282241721781, 'samples': 688608, 'steps': 1344, 'loss/train': 3.179885149002075} -09/20/2021 19:08:52 - INFO - __main__ - Step 21520: {'lr': 0.0001999282241721781, 'samples': 688640, 'steps': 1344, 'loss/train': 3.9375288486480713} -09/20/2021 19:08:53 - INFO - __main__ - Step 21521: {'lr': 0.00019992798232833475, 'samples': 688672, 'steps': 1345, 'loss/train': 1.8215194940567017} -09/20/2021 19:08:53 - INFO - __main__ - Step 21522: {'lr': 0.00019992798232833475, 'samples': 688704, 'steps': 1345, 'loss/train': 3.3222362995147705} -09/20/2021 19:08:55 - INFO - __main__ - Step 21523: {'lr': 0.00019992798232833475, 'samples': 688736, 'steps': 1345, 'loss/train': 3.471428394317627} -09/20/2021 19:08:55 - INFO - __main__ - Step 21524: {'lr': 0.00019992798232833475, 'samples': 688768, 'steps': 1345, 'loss/train': 3.130000352859497} -09/20/2021 19:08:56 - INFO - __main__ - Step 21525: {'lr': 0.00019992798232833475, 'samples': 688800, 'steps': 1345, 'loss/train': 3.2214810848236084} -09/20/2021 19:08:57 - INFO - __main__ - Step 21526: {'lr': 0.00019992798232833475, 'samples': 688832, 'steps': 1345, 'loss/train': 4.906548023223877} -09/20/2021 19:08:58 - INFO - __main__ - Step 21527: {'lr': 0.00019992798232833475, 'samples': 688864, 'steps': 1345, 'loss/train': 2.942669153213501} -09/20/2021 19:08:58 - INFO - __main__ - Step 21528: {'lr': 0.00019992798232833475, 'samples': 688896, 'steps': 1345, 'loss/train': 2.951673746109009} -09/20/2021 19:08:59 - INFO - __main__ - Step 21529: {'lr': 0.00019992798232833475, 'samples': 688928, 'steps': 1345, 'loss/train': 3.9128119945526123} -09/20/2021 19:09:00 - INFO - __main__ - Step 21530: {'lr': 0.00019992798232833475, 'samples': 688960, 'steps': 1345, 'loss/train': 4.03902006149292} -09/20/2021 19:09:01 - INFO - __main__ - Step 21531: {'lr': 0.00019992798232833475, 'samples': 688992, 'steps': 1345, 'loss/train': 3.0471742153167725} -09/20/2021 19:09:01 - INFO - __main__ - Step 21532: {'lr': 0.00019992798232833475, 'samples': 689024, 'steps': 1345, 'loss/train': 2.3645553588867188} -09/20/2021 19:09:02 - INFO - __main__ - Step 21533: {'lr': 0.00019992798232833475, 'samples': 689056, 'steps': 1345, 'loss/train': 3.6873421669006348} -09/20/2021 19:09:03 - INFO - __main__ - Step 21534: {'lr': 0.00019992798232833475, 'samples': 689088, 'steps': 1345, 'loss/train': 2.9664337635040283} -09/20/2021 19:09:04 - INFO - __main__ - Step 21535: {'lr': 0.00019992798232833475, 'samples': 689120, 'steps': 1345, 'loss/train': 3.2700865268707275} -09/20/2021 19:09:04 - INFO - __main__ - Step 21536: {'lr': 0.00019992798232833475, 'samples': 689152, 'steps': 1345, 'loss/train': 3.0889360904693604} -09/20/2021 19:09:05 - INFO - __main__ - Step 21537: {'lr': 0.0001999277400778848, 'samples': 689184, 'steps': 1346, 'loss/train': 4.2609686851501465} -09/20/2021 19:09:06 - INFO - __main__ - Step 21538: {'lr': 0.0001999277400778848, 'samples': 689216, 'steps': 1346, 'loss/train': 3.4762446880340576} -09/20/2021 19:09:07 - INFO - __main__ - Step 21539: {'lr': 0.0001999277400778848, 'samples': 689248, 'steps': 1346, 'loss/train': 3.7704339027404785} -09/20/2021 19:09:07 - INFO - __main__ - Step 21540: {'lr': 0.0001999277400778848, 'samples': 689280, 'steps': 1346, 'loss/train': 3.70678448677063} -09/20/2021 19:09:08 - INFO - __main__ - Step 21541: {'lr': 0.0001999277400778848, 'samples': 689312, 'steps': 1346, 'loss/train': 4.065203666687012} -09/20/2021 19:09:09 - INFO - __main__ - Step 21542: {'lr': 0.0001999277400778848, 'samples': 689344, 'steps': 1346, 'loss/train': 4.951183795928955} -09/20/2021 19:09:10 - INFO - __main__ - Step 21543: {'lr': 0.0001999277400778848, 'samples': 689376, 'steps': 1346, 'loss/train': 2.667375326156616} -09/20/2021 19:09:10 - INFO - __main__ - Step 21544: {'lr': 0.0001999277400778848, 'samples': 689408, 'steps': 1346, 'loss/train': 3.8669955730438232} -09/20/2021 19:09:11 - INFO - __main__ - Step 21545: {'lr': 0.0001999277400778848, 'samples': 689440, 'steps': 1346, 'loss/train': 3.101168394088745} -09/20/2021 19:09:12 - INFO - __main__ - Step 21546: {'lr': 0.0001999277400778848, 'samples': 689472, 'steps': 1346, 'loss/train': 2.5965728759765625} -09/20/2021 19:09:13 - INFO - __main__ - Step 21547: {'lr': 0.0001999277400778848, 'samples': 689504, 'steps': 1346, 'loss/train': 3.413753032684326} -09/20/2021 19:09:13 - INFO - __main__ - Step 21548: {'lr': 0.0001999277400778848, 'samples': 689536, 'steps': 1346, 'loss/train': 4.116356372833252} -09/20/2021 19:09:14 - INFO - __main__ - Step 21549: {'lr': 0.0001999277400778848, 'samples': 689568, 'steps': 1346, 'loss/train': 2.9125142097473145} -09/20/2021 19:09:15 - INFO - __main__ - Step 21550: {'lr': 0.0001999277400778848, 'samples': 689600, 'steps': 1346, 'loss/train': 4.47401762008667} -09/20/2021 19:09:16 - INFO - __main__ - Step 21551: {'lr': 0.0001999277400778848, 'samples': 689632, 'steps': 1346, 'loss/train': 2.0970497131347656} -09/20/2021 19:09:16 - INFO - __main__ - Step 21552: {'lr': 0.0001999277400778848, 'samples': 689664, 'steps': 1346, 'loss/train': 3.203842878341675} -09/20/2021 19:09:18 - INFO - __main__ - Step 21553: {'lr': 0.00019992749742082927, 'samples': 689696, 'steps': 1347, 'loss/train': 1.1041537523269653} -09/20/2021 19:09:19 - INFO - __main__ - Step 21554: {'lr': 0.00019992749742082927, 'samples': 689728, 'steps': 1347, 'loss/train': 3.3512966632843018} -09/20/2021 19:09:19 - INFO - __main__ - Step 21555: {'lr': 0.00019992749742082927, 'samples': 689760, 'steps': 1347, 'loss/train': 2.6690642833709717} -09/20/2021 19:09:20 - INFO - __main__ - Step 21556: {'lr': 0.00019992749742082927, 'samples': 689792, 'steps': 1347, 'loss/train': 1.0627021789550781} -09/20/2021 19:09:21 - INFO - __main__ - Step 21557: {'lr': 0.00019992749742082927, 'samples': 689824, 'steps': 1347, 'loss/train': 3.210503101348877} -09/20/2021 19:09:22 - INFO - __main__ - Step 21558: {'lr': 0.00019992749742082927, 'samples': 689856, 'steps': 1347, 'loss/train': 3.4170210361480713} -09/20/2021 19:09:22 - INFO - __main__ - Step 21559: {'lr': 0.00019992749742082927, 'samples': 689888, 'steps': 1347, 'loss/train': 3.0104057788848877} -09/20/2021 19:09:23 - INFO - __main__ - Step 21560: {'lr': 0.00019992749742082927, 'samples': 689920, 'steps': 1347, 'loss/train': 3.8837051391601562} -09/20/2021 19:09:24 - INFO - __main__ - Step 21561: {'lr': 0.00019992749742082927, 'samples': 689952, 'steps': 1347, 'loss/train': 3.1196277141571045} -09/20/2021 19:09:25 - INFO - __main__ - Step 21562: {'lr': 0.00019992749742082927, 'samples': 689984, 'steps': 1347, 'loss/train': 3.1768600940704346} -09/20/2021 19:09:25 - INFO - __main__ - Step 21563: {'lr': 0.00019992749742082927, 'samples': 690016, 'steps': 1347, 'loss/train': 3.5964465141296387} -09/20/2021 19:09:26 - INFO - __main__ - Step 21564: {'lr': 0.00019992749742082927, 'samples': 690048, 'steps': 1347, 'loss/train': 3.5804457664489746} -09/20/2021 19:09:27 - INFO - __main__ - Step 21565: {'lr': 0.00019992749742082927, 'samples': 690080, 'steps': 1347, 'loss/train': 2.9924139976501465} -09/20/2021 19:09:28 - INFO - __main__ - Step 21566: {'lr': 0.00019992749742082927, 'samples': 690112, 'steps': 1347, 'loss/train': 3.3418948650360107} -09/20/2021 19:09:28 - INFO - __main__ - Step 21567: {'lr': 0.00019992749742082927, 'samples': 690144, 'steps': 1347, 'loss/train': 3.513892650604248} -09/20/2021 19:09:29 - INFO - __main__ - Step 21568: {'lr': 0.00019992749742082927, 'samples': 690176, 'steps': 1347, 'loss/train': 4.284224510192871} -09/20/2021 19:09:30 - INFO - __main__ - Step 21569: {'lr': 0.00019992725435716911, 'samples': 690208, 'steps': 1348, 'loss/train': 3.056683301925659} -09/20/2021 19:09:31 - INFO - __main__ - Step 21570: {'lr': 0.00019992725435716911, 'samples': 690240, 'steps': 1348, 'loss/train': 3.3440375328063965} -09/20/2021 19:09:31 - INFO - __main__ - Step 21571: {'lr': 0.00019992725435716911, 'samples': 690272, 'steps': 1348, 'loss/train': 2.909615993499756} -09/20/2021 19:09:32 - INFO - __main__ - Step 21572: {'lr': 0.00019992725435716911, 'samples': 690304, 'steps': 1348, 'loss/train': 3.6044576168060303} -09/20/2021 19:09:33 - INFO - __main__ - Step 21573: {'lr': 0.00019992725435716911, 'samples': 690336, 'steps': 1348, 'loss/train': 4.0166215896606445} -09/20/2021 19:09:34 - INFO - __main__ - Step 21574: {'lr': 0.00019992725435716911, 'samples': 690368, 'steps': 1348, 'loss/train': 3.13337779045105} -09/20/2021 19:09:34 - INFO - __main__ - Step 21575: {'lr': 0.00019992725435716911, 'samples': 690400, 'steps': 1348, 'loss/train': 0.6739680171012878} -09/20/2021 19:09:35 - INFO - __main__ - Step 21576: {'lr': 0.00019992725435716911, 'samples': 690432, 'steps': 1348, 'loss/train': 3.3675873279571533} -09/20/2021 19:09:36 - INFO - __main__ - Step 21577: {'lr': 0.00019992725435716911, 'samples': 690464, 'steps': 1348, 'loss/train': 4.434252738952637} -09/20/2021 19:09:37 - INFO - __main__ - Step 21578: {'lr': 0.00019992725435716911, 'samples': 690496, 'steps': 1348, 'loss/train': 3.416914224624634} -09/20/2021 19:09:37 - INFO - __main__ - Step 21579: {'lr': 0.00019992725435716911, 'samples': 690528, 'steps': 1348, 'loss/train': 3.506537914276123} -09/20/2021 19:09:38 - INFO - __main__ - Step 21580: {'lr': 0.00019992725435716911, 'samples': 690560, 'steps': 1348, 'loss/train': 3.1302847862243652} -09/20/2021 19:09:39 - INFO - __main__ - Step 21581: {'lr': 0.00019992725435716911, 'samples': 690592, 'steps': 1348, 'loss/train': 2.612304210662842} -09/20/2021 19:09:40 - INFO - __main__ - Step 21582: {'lr': 0.00019992725435716911, 'samples': 690624, 'steps': 1348, 'loss/train': 3.3698368072509766} -09/20/2021 19:09:41 - INFO - __main__ - Step 21583: {'lr': 0.00019992725435716911, 'samples': 690656, 'steps': 1348, 'loss/train': 3.913656234741211} -09/20/2021 19:09:42 - INFO - __main__ - Step 21584: {'lr': 0.00019992725435716911, 'samples': 690688, 'steps': 1348, 'loss/train': 2.5243031978607178} -09/20/2021 19:09:43 - INFO - __main__ - Step 21585: {'lr': 0.0001999270108869054, 'samples': 690720, 'steps': 1349, 'loss/train': 3.6982548236846924} -09/20/2021 19:09:43 - INFO - __main__ - Step 21586: {'lr': 0.0001999270108869054, 'samples': 690752, 'steps': 1349, 'loss/train': 0.4763047695159912} -09/20/2021 19:09:44 - INFO - __main__ - Step 21587: {'lr': 0.0001999270108869054, 'samples': 690784, 'steps': 1349, 'loss/train': 0.49115946888923645} -09/20/2021 19:09:45 - INFO - __main__ - Step 21588: {'lr': 0.0001999270108869054, 'samples': 690816, 'steps': 1349, 'loss/train': 0.5059199929237366} -09/20/2021 19:09:46 - INFO - __main__ - Step 21589: {'lr': 0.0001999270108869054, 'samples': 690848, 'steps': 1349, 'loss/train': 0.6874698996543884} -09/20/2021 19:09:46 - INFO - __main__ - Step 21590: {'lr': 0.0001999270108869054, 'samples': 690880, 'steps': 1349, 'loss/train': 2.4880475997924805} -09/20/2021 19:09:47 - INFO - __main__ - Step 21591: {'lr': 0.0001999270108869054, 'samples': 690912, 'steps': 1349, 'loss/train': 3.839057445526123} -09/20/2021 19:09:48 - INFO - __main__ - Step 21592: {'lr': 0.0001999270108869054, 'samples': 690944, 'steps': 1349, 'loss/train': 3.9802181720733643} -09/20/2021 19:09:49 - INFO - __main__ - Step 21593: {'lr': 0.0001999270108869054, 'samples': 690976, 'steps': 1349, 'loss/train': 2.9845988750457764} -09/20/2021 19:09:49 - INFO - __main__ - Step 21594: {'lr': 0.0001999270108869054, 'samples': 691008, 'steps': 1349, 'loss/train': 2.69355845451355} -09/20/2021 19:09:50 - INFO - __main__ - Step 21595: {'lr': 0.0001999270108869054, 'samples': 691040, 'steps': 1349, 'loss/train': 2.7956740856170654} -09/20/2021 19:09:51 - INFO - __main__ - Step 21596: {'lr': 0.0001999270108869054, 'samples': 691072, 'steps': 1349, 'loss/train': 2.7745578289031982} -09/20/2021 19:09:52 - INFO - __main__ - Step 21597: {'lr': 0.0001999270108869054, 'samples': 691104, 'steps': 1349, 'loss/train': 3.3256850242614746} -09/20/2021 19:09:52 - INFO - __main__ - Step 21598: {'lr': 0.0001999270108869054, 'samples': 691136, 'steps': 1349, 'loss/train': 2.628605604171753} -09/20/2021 19:09:53 - INFO - __main__ - Step 21599: {'lr': 0.0001999270108869054, 'samples': 691168, 'steps': 1349, 'loss/train': 3.8816030025482178} -09/20/2021 19:09:54 - INFO - __main__ - Step 21600: {'lr': 0.0001999270108869054, 'samples': 691200, 'steps': 1349, 'loss/train': 2.420121431350708} -09/20/2021 19:09:55 - INFO - __main__ - Step 21601: {'lr': 0.00019992676701003904, 'samples': 691232, 'steps': 1350, 'loss/train': 3.1404900550842285} -09/20/2021 19:09:56 - INFO - __main__ - Step 21602: {'lr': 0.00019992676701003904, 'samples': 691264, 'steps': 1350, 'loss/train': 4.069520950317383} -09/20/2021 19:09:56 - INFO - __main__ - Step 21603: {'lr': 0.00019992676701003904, 'samples': 691296, 'steps': 1350, 'loss/train': 3.711989164352417} -09/20/2021 19:09:57 - INFO - __main__ - Step 21604: {'lr': 0.00019992676701003904, 'samples': 691328, 'steps': 1350, 'loss/train': 5.915635585784912} -09/20/2021 19:09:58 - INFO - __main__ - Step 21605: {'lr': 0.00019992676701003904, 'samples': 691360, 'steps': 1350, 'loss/train': 3.429429054260254} -09/20/2021 19:09:59 - INFO - __main__ - Step 21606: {'lr': 0.00019992676701003904, 'samples': 691392, 'steps': 1350, 'loss/train': 3.8202242851257324} -09/20/2021 19:09:59 - INFO - __main__ - Step 21607: {'lr': 0.00019992676701003904, 'samples': 691424, 'steps': 1350, 'loss/train': 4.172403335571289} -09/20/2021 19:10:00 - INFO - __main__ - Step 21608: {'lr': 0.00019992676701003904, 'samples': 691456, 'steps': 1350, 'loss/train': 3.125247001647949} -09/20/2021 19:10:01 - INFO - __main__ - Step 21609: {'lr': 0.00019992676701003904, 'samples': 691488, 'steps': 1350, 'loss/train': 3.475886821746826} -09/20/2021 19:10:02 - INFO - __main__ - Step 21610: {'lr': 0.00019992676701003904, 'samples': 691520, 'steps': 1350, 'loss/train': 3.747852325439453} -09/20/2021 19:10:02 - INFO - __main__ - Step 21611: {'lr': 0.00019992676701003904, 'samples': 691552, 'steps': 1350, 'loss/train': 2.2722861766815186} -09/20/2021 19:10:03 - INFO - __main__ - Step 21612: {'lr': 0.00019992676701003904, 'samples': 691584, 'steps': 1350, 'loss/train': 3.0029938220977783} -09/20/2021 19:10:04 - INFO - __main__ - Step 21613: {'lr': 0.00019992676701003904, 'samples': 691616, 'steps': 1350, 'loss/train': 3.596252918243408} -09/20/2021 19:10:05 - INFO - __main__ - Step 21614: {'lr': 0.00019992676701003904, 'samples': 691648, 'steps': 1350, 'loss/train': 0.8081164360046387} -09/20/2021 19:10:06 - INFO - __main__ - Step 21615: {'lr': 0.00019992676701003904, 'samples': 691680, 'steps': 1350, 'loss/train': 0.6629483103752136} -09/20/2021 19:10:07 - INFO - __main__ - Step 21616: {'lr': 0.00019992676701003904, 'samples': 691712, 'steps': 1350, 'loss/train': 3.3199570178985596} -09/20/2021 19:10:08 - INFO - __main__ - Step 21617: {'lr': 0.00019992652272657108, 'samples': 691744, 'steps': 1351, 'loss/train': 3.1095833778381348} -09/20/2021 19:10:08 - INFO - __main__ - Step 21618: {'lr': 0.00019992652272657108, 'samples': 691776, 'steps': 1351, 'loss/train': 3.611881732940674} -09/20/2021 19:10:09 - INFO - __main__ - Step 21619: {'lr': 0.00019992652272657108, 'samples': 691808, 'steps': 1351, 'loss/train': 2.619687080383301} -09/20/2021 19:10:10 - INFO - __main__ - Step 21620: {'lr': 0.00019992652272657108, 'samples': 691840, 'steps': 1351, 'loss/train': 3.5316691398620605} -09/20/2021 19:10:11 - INFO - __main__ - Step 21621: {'lr': 0.00019992652272657108, 'samples': 691872, 'steps': 1351, 'loss/train': 2.3839457035064697} -09/20/2021 19:10:11 - INFO - __main__ - Step 21622: {'lr': 0.00019992652272657108, 'samples': 691904, 'steps': 1351, 'loss/train': 1.9468352794647217} -09/20/2021 19:10:12 - INFO - __main__ - Step 21623: {'lr': 0.00019992652272657108, 'samples': 691936, 'steps': 1351, 'loss/train': 2.836963176727295} -09/20/2021 19:10:13 - INFO - __main__ - Step 21624: {'lr': 0.00019992652272657108, 'samples': 691968, 'steps': 1351, 'loss/train': 3.227137804031372} -09/20/2021 19:10:14 - INFO - __main__ - Step 21625: {'lr': 0.00019992652272657108, 'samples': 692000, 'steps': 1351, 'loss/train': 2.867051839828491} -09/20/2021 19:10:14 - INFO - __main__ - Step 21626: {'lr': 0.00019992652272657108, 'samples': 692032, 'steps': 1351, 'loss/train': 3.8136157989501953} -09/20/2021 19:10:15 - INFO - __main__ - Step 21627: {'lr': 0.00019992652272657108, 'samples': 692064, 'steps': 1351, 'loss/train': 3.8840959072113037} -09/20/2021 19:10:16 - INFO - __main__ - Step 21628: {'lr': 0.00019992652272657108, 'samples': 692096, 'steps': 1351, 'loss/train': 2.8809468746185303} -09/20/2021 19:10:17 - INFO - __main__ - Step 21629: {'lr': 0.00019992652272657108, 'samples': 692128, 'steps': 1351, 'loss/train': 3.9192562103271484} -09/20/2021 19:10:17 - INFO - __main__ - Step 21630: {'lr': 0.00019992652272657108, 'samples': 692160, 'steps': 1351, 'loss/train': 3.0014913082122803} -09/20/2021 19:10:18 - INFO - __main__ - Step 21631: {'lr': 0.00019992652272657108, 'samples': 692192, 'steps': 1351, 'loss/train': 3.3571813106536865} -09/20/2021 19:10:19 - INFO - __main__ - Step 21632: {'lr': 0.00019992652272657108, 'samples': 692224, 'steps': 1351, 'loss/train': 4.536388397216797} -09/20/2021 19:10:20 - INFO - __main__ - Step 21633: {'lr': 0.00019992627803650247, 'samples': 692256, 'steps': 1352, 'loss/train': 2.608067512512207} -09/20/2021 19:10:20 - INFO - __main__ - Step 21634: {'lr': 0.00019992627803650247, 'samples': 692288, 'steps': 1352, 'loss/train': 3.6711833477020264} -09/20/2021 19:10:21 - INFO - __main__ - Step 21635: {'lr': 0.00019992627803650247, 'samples': 692320, 'steps': 1352, 'loss/train': 4.735069751739502} -09/20/2021 19:10:22 - INFO - __main__ - Step 21636: {'lr': 0.00019992627803650247, 'samples': 692352, 'steps': 1352, 'loss/train': 2.409529447555542} -09/20/2021 19:10:23 - INFO - __main__ - Step 21637: {'lr': 0.00019992627803650247, 'samples': 692384, 'steps': 1352, 'loss/train': 3.9658737182617188} -09/20/2021 19:10:23 - INFO - __main__ - Step 21638: {'lr': 0.00019992627803650247, 'samples': 692416, 'steps': 1352, 'loss/train': 3.8819453716278076} -09/20/2021 19:10:24 - INFO - __main__ - Step 21639: {'lr': 0.00019992627803650247, 'samples': 692448, 'steps': 1352, 'loss/train': 2.6871540546417236} -09/20/2021 19:10:25 - INFO - __main__ - Step 21640: {'lr': 0.00019992627803650247, 'samples': 692480, 'steps': 1352, 'loss/train': 1.5886867046356201} -09/20/2021 19:10:26 - INFO - __main__ - Step 21641: {'lr': 0.00019992627803650247, 'samples': 692512, 'steps': 1352, 'loss/train': 2.6687660217285156} -09/20/2021 19:10:26 - INFO - __main__ - Step 21642: {'lr': 0.00019992627803650247, 'samples': 692544, 'steps': 1352, 'loss/train': 2.8466873168945312} -09/20/2021 19:10:27 - INFO - __main__ - Step 21643: {'lr': 0.00019992627803650247, 'samples': 692576, 'steps': 1352, 'loss/train': 2.8758864402770996} -09/20/2021 19:10:28 - INFO - __main__ - Step 21644: {'lr': 0.00019992627803650247, 'samples': 692608, 'steps': 1352, 'loss/train': 2.5578596591949463} -09/20/2021 19:10:29 - INFO - __main__ - Step 21645: {'lr': 0.00019992627803650247, 'samples': 692640, 'steps': 1352, 'loss/train': 2.7771952152252197} -09/20/2021 19:10:29 - INFO - __main__ - Step 21646: {'lr': 0.00019992627803650247, 'samples': 692672, 'steps': 1352, 'loss/train': 3.102884292602539} -09/20/2021 19:10:31 - INFO - __main__ - Step 21647: {'lr': 0.00019992627803650247, 'samples': 692704, 'steps': 1352, 'loss/train': 3.06304669380188} -09/20/2021 19:10:31 - INFO - __main__ - Step 21648: {'lr': 0.00019992627803650247, 'samples': 692736, 'steps': 1352, 'loss/train': 3.4348056316375732} -09/20/2021 19:10:32 - INFO - __main__ - Step 21649: {'lr': 0.00019992603293983422, 'samples': 692768, 'steps': 1353, 'loss/train': 3.3234026432037354} -09/20/2021 19:10:33 - INFO - __main__ - Step 21650: {'lr': 0.00019992603293983422, 'samples': 692800, 'steps': 1353, 'loss/train': 2.9393391609191895} -09/20/2021 19:10:34 - INFO - __main__ - Step 21651: {'lr': 0.00019992603293983422, 'samples': 692832, 'steps': 1353, 'loss/train': 3.9328038692474365} -09/20/2021 19:10:35 - INFO - __main__ - Step 21652: {'lr': 0.00019992603293983422, 'samples': 692864, 'steps': 1353, 'loss/train': 2.9610683917999268} -09/20/2021 19:10:35 - INFO - __main__ - Step 21653: {'lr': 0.00019992603293983422, 'samples': 692896, 'steps': 1353, 'loss/train': 2.9375882148742676} -09/20/2021 19:10:36 - INFO - __main__ - Step 21654: {'lr': 0.00019992603293983422, 'samples': 692928, 'steps': 1353, 'loss/train': 3.7097270488739014} -09/20/2021 19:10:37 - INFO - __main__ - Step 21655: {'lr': 0.00019992603293983422, 'samples': 692960, 'steps': 1353, 'loss/train': 3.7285072803497314} -09/20/2021 19:10:38 - INFO - __main__ - Step 21656: {'lr': 0.00019992603293983422, 'samples': 692992, 'steps': 1353, 'loss/train': 2.6592156887054443} -09/20/2021 19:10:38 - INFO - __main__ - Step 21657: {'lr': 0.00019992603293983422, 'samples': 693024, 'steps': 1353, 'loss/train': 3.5725669860839844} -09/20/2021 19:10:39 - INFO - __main__ - Step 21658: {'lr': 0.00019992603293983422, 'samples': 693056, 'steps': 1353, 'loss/train': 3.1010184288024902} -09/20/2021 19:10:40 - INFO - __main__ - Step 21659: {'lr': 0.00019992603293983422, 'samples': 693088, 'steps': 1353, 'loss/train': 3.0581586360931396} -09/20/2021 19:10:41 - INFO - __main__ - Step 21660: {'lr': 0.00019992603293983422, 'samples': 693120, 'steps': 1353, 'loss/train': 2.4748003482818604} -09/20/2021 19:10:41 - INFO - __main__ - Step 21661: {'lr': 0.00019992603293983422, 'samples': 693152, 'steps': 1353, 'loss/train': 2.520080089569092} -09/20/2021 19:10:42 - INFO - __main__ - Step 21662: {'lr': 0.00019992603293983422, 'samples': 693184, 'steps': 1353, 'loss/train': 3.4769985675811768} -09/20/2021 19:10:43 - INFO - __main__ - Step 21663: {'lr': 0.00019992603293983422, 'samples': 693216, 'steps': 1353, 'loss/train': 3.093132257461548} -09/20/2021 19:10:44 - INFO - __main__ - Step 21664: {'lr': 0.00019992603293983422, 'samples': 693248, 'steps': 1353, 'loss/train': 3.353118896484375} -09/20/2021 19:10:45 - INFO - __main__ - Step 21665: {'lr': 0.0001999257874365673, 'samples': 693280, 'steps': 1354, 'loss/train': 3.5258541107177734} -09/20/2021 19:10:45 - INFO - __main__ - Step 21666: {'lr': 0.0001999257874365673, 'samples': 693312, 'steps': 1354, 'loss/train': 2.9824562072753906} -09/20/2021 19:10:46 - INFO - __main__ - Step 21667: {'lr': 0.0001999257874365673, 'samples': 693344, 'steps': 1354, 'loss/train': 4.206782341003418} -09/20/2021 19:10:47 - INFO - __main__ - Step 21668: {'lr': 0.0001999257874365673, 'samples': 693376, 'steps': 1354, 'loss/train': 3.106032133102417} -09/20/2021 19:10:48 - INFO - __main__ - Step 21669: {'lr': 0.0001999257874365673, 'samples': 693408, 'steps': 1354, 'loss/train': 3.4022440910339355} -09/20/2021 19:10:48 - INFO - __main__ - Step 21670: {'lr': 0.0001999257874365673, 'samples': 693440, 'steps': 1354, 'loss/train': 3.0169005393981934} -09/20/2021 19:10:49 - INFO - __main__ - Step 21671: {'lr': 0.0001999257874365673, 'samples': 693472, 'steps': 1354, 'loss/train': 3.2389514446258545} -09/20/2021 19:10:50 - INFO - __main__ - Step 21672: {'lr': 0.0001999257874365673, 'samples': 693504, 'steps': 1354, 'loss/train': 3.274803400039673} -09/20/2021 19:10:51 - INFO - __main__ - Step 21673: {'lr': 0.0001999257874365673, 'samples': 693536, 'steps': 1354, 'loss/train': 2.5759503841400146} -09/20/2021 19:10:51 - INFO - __main__ - Step 21674: {'lr': 0.0001999257874365673, 'samples': 693568, 'steps': 1354, 'loss/train': 2.8089606761932373} -09/20/2021 19:10:52 - INFO - __main__ - Step 21675: {'lr': 0.0001999257874365673, 'samples': 693600, 'steps': 1354, 'loss/train': 3.610501289367676} -09/20/2021 19:10:53 - INFO - __main__ - Step 21676: {'lr': 0.0001999257874365673, 'samples': 693632, 'steps': 1354, 'loss/train': 2.9737167358398438} -09/20/2021 19:10:54 - INFO - __main__ - Step 21677: {'lr': 0.0001999257874365673, 'samples': 693664, 'steps': 1354, 'loss/train': 3.148313283920288} -09/20/2021 19:10:55 - INFO - __main__ - Step 21678: {'lr': 0.0001999257874365673, 'samples': 693696, 'steps': 1354, 'loss/train': 3.0321805477142334} -09/20/2021 19:10:56 - INFO - __main__ - Step 21679: {'lr': 0.0001999257874365673, 'samples': 693728, 'steps': 1354, 'loss/train': 2.7424662113189697} -09/20/2021 19:10:57 - INFO - __main__ - Step 21680: {'lr': 0.0001999257874365673, 'samples': 693760, 'steps': 1354, 'loss/train': 3.7074992656707764} -09/20/2021 19:10:58 - INFO - __main__ - Step 21681: {'lr': 0.0001999255415267028, 'samples': 693792, 'steps': 1355, 'loss/train': 3.7352867126464844} -09/20/2021 19:10:58 - INFO - __main__ - Step 21682: {'lr': 0.0001999255415267028, 'samples': 693824, 'steps': 1355, 'loss/train': 3.43642520904541} -09/20/2021 19:10:59 - INFO - __main__ - Step 21683: {'lr': 0.0001999255415267028, 'samples': 693856, 'steps': 1355, 'loss/train': 2.898122549057007} -09/20/2021 19:11:00 - INFO - __main__ - Step 21684: {'lr': 0.0001999255415267028, 'samples': 693888, 'steps': 1355, 'loss/train': 5.461280822753906} -09/20/2021 19:11:01 - INFO - __main__ - Step 21685: {'lr': 0.0001999255415267028, 'samples': 693920, 'steps': 1355, 'loss/train': 5.774898052215576} -09/20/2021 19:11:01 - INFO - __main__ - Step 21686: {'lr': 0.0001999255415267028, 'samples': 693952, 'steps': 1355, 'loss/train': 2.7254624366760254} -09/20/2021 19:11:02 - INFO - __main__ - Step 21687: {'lr': 0.0001999255415267028, 'samples': 693984, 'steps': 1355, 'loss/train': 2.7361769676208496} -09/20/2021 19:11:03 - INFO - __main__ - Step 21688: {'lr': 0.0001999255415267028, 'samples': 694016, 'steps': 1355, 'loss/train': 4.066436290740967} -09/20/2021 19:11:04 - INFO - __main__ - Step 21689: {'lr': 0.0001999255415267028, 'samples': 694048, 'steps': 1355, 'loss/train': 3.113635540008545} -09/20/2021 19:11:04 - INFO - __main__ - Step 21690: {'lr': 0.0001999255415267028, 'samples': 694080, 'steps': 1355, 'loss/train': 3.4988362789154053} -09/20/2021 19:11:05 - INFO - __main__ - Step 21691: {'lr': 0.0001999255415267028, 'samples': 694112, 'steps': 1355, 'loss/train': 3.133730888366699} -09/20/2021 19:11:06 - INFO - __main__ - Step 21692: {'lr': 0.0001999255415267028, 'samples': 694144, 'steps': 1355, 'loss/train': 3.342137336730957} -09/20/2021 19:11:07 - INFO - __main__ - Step 21693: {'lr': 0.0001999255415267028, 'samples': 694176, 'steps': 1355, 'loss/train': 3.533823251724243} -09/20/2021 19:11:07 - INFO - __main__ - Step 21694: {'lr': 0.0001999255415267028, 'samples': 694208, 'steps': 1355, 'loss/train': 3.1307077407836914} -09/20/2021 19:11:08 - INFO - __main__ - Step 21695: {'lr': 0.0001999255415267028, 'samples': 694240, 'steps': 1355, 'loss/train': 3.3316457271575928} -09/20/2021 19:11:09 - INFO - __main__ - Step 21696: {'lr': 0.0001999255415267028, 'samples': 694272, 'steps': 1355, 'loss/train': 3.271920680999756} -09/20/2021 19:11:10 - INFO - __main__ - Step 21697: {'lr': 0.00019992529521024158, 'samples': 694304, 'steps': 1356, 'loss/train': 4.02909517288208} -09/20/2021 19:11:11 - INFO - __main__ - Step 21698: {'lr': 0.00019992529521024158, 'samples': 694336, 'steps': 1356, 'loss/train': 2.715240716934204} -09/20/2021 19:11:11 - INFO - __main__ - Step 21699: {'lr': 0.00019992529521024158, 'samples': 694368, 'steps': 1356, 'loss/train': 2.482367515563965} -09/20/2021 19:11:12 - INFO - __main__ - Step 21700: {'lr': 0.00019992529521024158, 'samples': 694400, 'steps': 1356, 'loss/train': 2.551631212234497} -09/20/2021 19:11:13 - INFO - __main__ - Step 21701: {'lr': 0.00019992529521024158, 'samples': 694432, 'steps': 1356, 'loss/train': 3.78029727935791} -09/20/2021 19:11:14 - INFO - __main__ - Step 21702: {'lr': 0.00019992529521024158, 'samples': 694464, 'steps': 1356, 'loss/train': 3.4926939010620117} -09/20/2021 19:11:14 - INFO - __main__ - Step 21703: {'lr': 0.00019992529521024158, 'samples': 694496, 'steps': 1356, 'loss/train': 3.4121854305267334} -09/20/2021 19:11:15 - INFO - __main__ - Step 21704: {'lr': 0.00019992529521024158, 'samples': 694528, 'steps': 1356, 'loss/train': 2.8486053943634033} -09/20/2021 19:11:16 - INFO - __main__ - Step 21705: {'lr': 0.00019992529521024158, 'samples': 694560, 'steps': 1356, 'loss/train': 3.7934725284576416} -09/20/2021 19:11:17 - INFO - __main__ - Step 21706: {'lr': 0.00019992529521024158, 'samples': 694592, 'steps': 1356, 'loss/train': 2.778348445892334} -09/20/2021 19:11:17 - INFO - __main__ - Step 21707: {'lr': 0.00019992529521024158, 'samples': 694624, 'steps': 1356, 'loss/train': 3.813103199005127} -09/20/2021 19:11:18 - INFO - __main__ - Step 21708: {'lr': 0.00019992529521024158, 'samples': 694656, 'steps': 1356, 'loss/train': 3.4350051879882812} -09/20/2021 19:11:20 - INFO - __main__ - Step 21709: {'lr': 0.00019992529521024158, 'samples': 694688, 'steps': 1356, 'loss/train': 3.5675032138824463} -09/20/2021 19:11:20 - INFO - __main__ - Step 21710: {'lr': 0.00019992529521024158, 'samples': 694720, 'steps': 1356, 'loss/train': 1.8840467929840088} -09/20/2021 19:11:21 - INFO - __main__ - Step 21711: {'lr': 0.00019992529521024158, 'samples': 694752, 'steps': 1356, 'loss/train': 2.7347006797790527} -09/20/2021 19:11:22 - INFO - __main__ - Step 21712: {'lr': 0.00019992529521024158, 'samples': 694784, 'steps': 1356, 'loss/train': 3.3643362522125244} -09/20/2021 19:11:23 - INFO - __main__ - Step 21713: {'lr': 0.00019992504848718477, 'samples': 694816, 'steps': 1357, 'loss/train': 3.618596315383911} -09/20/2021 19:11:23 - INFO - __main__ - Step 21714: {'lr': 0.00019992504848718477, 'samples': 694848, 'steps': 1357, 'loss/train': 3.021641254425049} -09/20/2021 19:11:24 - INFO - __main__ - Step 21715: {'lr': 0.00019992504848718477, 'samples': 694880, 'steps': 1357, 'loss/train': 2.2520625591278076} -09/20/2021 19:11:25 - INFO - __main__ - Step 21716: {'lr': 0.00019992504848718477, 'samples': 694912, 'steps': 1357, 'loss/train': 3.6665995121002197} -09/20/2021 19:11:26 - INFO - __main__ - Step 21717: {'lr': 0.00019992504848718477, 'samples': 694944, 'steps': 1357, 'loss/train': 3.312251091003418} -09/20/2021 19:11:26 - INFO - __main__ - Step 21718: {'lr': 0.00019992504848718477, 'samples': 694976, 'steps': 1357, 'loss/train': 3.2110836505889893} -09/20/2021 19:11:27 - INFO - __main__ - Step 21719: {'lr': 0.00019992504848718477, 'samples': 695008, 'steps': 1357, 'loss/train': 2.722769021987915} -09/20/2021 19:11:28 - INFO - __main__ - Step 21720: {'lr': 0.00019992504848718477, 'samples': 695040, 'steps': 1357, 'loss/train': 4.33501672744751} -09/20/2021 19:11:29 - INFO - __main__ - Step 21721: {'lr': 0.00019992504848718477, 'samples': 695072, 'steps': 1357, 'loss/train': 3.287019729614258} -09/20/2021 19:11:29 - INFO - __main__ - Step 21722: {'lr': 0.00019992504848718477, 'samples': 695104, 'steps': 1357, 'loss/train': 3.4767420291900635} -09/20/2021 19:11:30 - INFO - __main__ - Step 21723: {'lr': 0.00019992504848718477, 'samples': 695136, 'steps': 1357, 'loss/train': 3.3348562717437744} -09/20/2021 19:11:31 - INFO - __main__ - Step 21724: {'lr': 0.00019992504848718477, 'samples': 695168, 'steps': 1357, 'loss/train': 3.523353099822998} -09/20/2021 19:11:32 - INFO - __main__ - Step 21725: {'lr': 0.00019992504848718477, 'samples': 695200, 'steps': 1357, 'loss/train': 3.8759357929229736} -09/20/2021 19:11:32 - INFO - __main__ - Step 21726: {'lr': 0.00019992504848718477, 'samples': 695232, 'steps': 1357, 'loss/train': 3.012411594390869} -09/20/2021 19:11:33 - INFO - __main__ - Step 21727: {'lr': 0.00019992504848718477, 'samples': 695264, 'steps': 1357, 'loss/train': 0.5453623533248901} -09/20/2021 19:11:34 - INFO - __main__ - Step 21728: {'lr': 0.00019992504848718477, 'samples': 695296, 'steps': 1357, 'loss/train': 0.41363027691841125} -09/20/2021 19:11:35 - INFO - __main__ - Step 21729: {'lr': 0.00019992480135753334, 'samples': 695328, 'steps': 1358, 'loss/train': 0.2931286096572876} -09/20/2021 19:11:36 - INFO - __main__ - Step 21730: {'lr': 0.00019992480135753334, 'samples': 695360, 'steps': 1358, 'loss/train': 3.0150883197784424} -09/20/2021 19:11:36 - INFO - __main__ - Step 21731: {'lr': 0.00019992480135753334, 'samples': 695392, 'steps': 1358, 'loss/train': 3.415249824523926} -09/20/2021 19:11:37 - INFO - __main__ - Step 21732: {'lr': 0.00019992480135753334, 'samples': 695424, 'steps': 1358, 'loss/train': 4.567485332489014} -09/20/2021 19:11:38 - INFO - __main__ - Step 21733: {'lr': 0.00019992480135753334, 'samples': 695456, 'steps': 1358, 'loss/train': 2.544950008392334} -09/20/2021 19:11:39 - INFO - __main__ - Step 21734: {'lr': 0.00019992480135753334, 'samples': 695488, 'steps': 1358, 'loss/train': 4.292733669281006} -09/20/2021 19:11:39 - INFO - __main__ - Step 21735: {'lr': 0.00019992480135753334, 'samples': 695520, 'steps': 1358, 'loss/train': 3.793997049331665} -09/20/2021 19:11:40 - INFO - __main__ - Step 21736: {'lr': 0.00019992480135753334, 'samples': 695552, 'steps': 1358, 'loss/train': 2.940199375152588} -09/20/2021 19:11:41 - INFO - __main__ - Step 21737: {'lr': 0.00019992480135753334, 'samples': 695584, 'steps': 1358, 'loss/train': 2.7729716300964355} -09/20/2021 19:11:42 - INFO - __main__ - Step 21738: {'lr': 0.00019992480135753334, 'samples': 695616, 'steps': 1358, 'loss/train': 2.9716289043426514} -09/20/2021 19:11:42 - INFO - __main__ - Step 21739: {'lr': 0.00019992480135753334, 'samples': 695648, 'steps': 1358, 'loss/train': 2.885596990585327} -09/20/2021 19:11:44 - INFO - __main__ - Step 21740: {'lr': 0.00019992480135753334, 'samples': 695680, 'steps': 1358, 'loss/train': 2.855877161026001} -09/20/2021 19:11:44 - INFO - __main__ - Step 21741: {'lr': 0.00019992480135753334, 'samples': 695712, 'steps': 1358, 'loss/train': 3.038320779800415} -09/20/2021 19:11:45 - INFO - __main__ - Step 21742: {'lr': 0.00019992480135753334, 'samples': 695744, 'steps': 1358, 'loss/train': 2.70359206199646} -09/20/2021 19:11:46 - INFO - __main__ - Step 21743: {'lr': 0.00019992480135753334, 'samples': 695776, 'steps': 1358, 'loss/train': 3.4077019691467285} -09/20/2021 19:11:47 - INFO - __main__ - Step 21744: {'lr': 0.00019992480135753334, 'samples': 695808, 'steps': 1358, 'loss/train': 3.566713809967041} -09/20/2021 19:11:47 - INFO - __main__ - Step 21745: {'lr': 0.00019992455382128826, 'samples': 695840, 'steps': 1359, 'loss/train': 1.641644835472107} -09/20/2021 19:11:48 - INFO - __main__ - Step 21746: {'lr': 0.00019992455382128826, 'samples': 695872, 'steps': 1359, 'loss/train': 2.6715810298919678} -09/20/2021 19:11:49 - INFO - __main__ - Step 21747: {'lr': 0.00019992455382128826, 'samples': 695904, 'steps': 1359, 'loss/train': 2.786909818649292} -09/20/2021 19:11:50 - INFO - __main__ - Step 21748: {'lr': 0.00019992455382128826, 'samples': 695936, 'steps': 1359, 'loss/train': 2.8975296020507812} -09/20/2021 19:11:50 - INFO - __main__ - Step 21749: {'lr': 0.00019992455382128826, 'samples': 695968, 'steps': 1359, 'loss/train': 4.133480072021484} -09/20/2021 19:11:51 - INFO - __main__ - Step 21750: {'lr': 0.00019992455382128826, 'samples': 696000, 'steps': 1359, 'loss/train': 1.3338799476623535} -09/20/2021 19:11:52 - INFO - __main__ - Step 21751: {'lr': 0.00019992455382128826, 'samples': 696032, 'steps': 1359, 'loss/train': 3.4017481803894043} -09/20/2021 19:11:53 - INFO - __main__ - Step 21752: {'lr': 0.00019992455382128826, 'samples': 696064, 'steps': 1359, 'loss/train': 2.2888925075531006} -09/20/2021 19:11:53 - INFO - __main__ - Step 21753: {'lr': 0.00019992455382128826, 'samples': 696096, 'steps': 1359, 'loss/train': 3.2447755336761475} -09/20/2021 19:11:54 - INFO - __main__ - Step 21754: {'lr': 0.00019992455382128826, 'samples': 696128, 'steps': 1359, 'loss/train': 4.051359176635742} -09/20/2021 19:11:55 - INFO - __main__ - Step 21755: {'lr': 0.00019992455382128826, 'samples': 696160, 'steps': 1359, 'loss/train': 2.9603068828582764} -09/20/2021 19:11:56 - INFO - __main__ - Step 21756: {'lr': 0.00019992455382128826, 'samples': 696192, 'steps': 1359, 'loss/train': 2.0285160541534424} -09/20/2021 19:11:56 - INFO - __main__ - Step 21757: {'lr': 0.00019992455382128826, 'samples': 696224, 'steps': 1359, 'loss/train': 2.5718722343444824} -09/20/2021 19:11:57 - INFO - __main__ - Step 21758: {'lr': 0.00019992455382128826, 'samples': 696256, 'steps': 1359, 'loss/train': 2.1980199813842773} -09/20/2021 19:11:58 - INFO - __main__ - Step 21759: {'lr': 0.00019992455382128826, 'samples': 696288, 'steps': 1359, 'loss/train': 2.9464008808135986} -09/20/2021 19:11:59 - INFO - __main__ - Step 21760: {'lr': 0.00019992455382128826, 'samples': 696320, 'steps': 1359, 'loss/train': 3.1553828716278076} -09/20/2021 19:12:00 - INFO - __main__ - Step 21761: {'lr': 0.00019992430587845056, 'samples': 696352, 'steps': 1360, 'loss/train': 3.518281936645508} -09/20/2021 19:12:00 - INFO - __main__ - Step 21762: {'lr': 0.00019992430587845056, 'samples': 696384, 'steps': 1360, 'loss/train': 2.6586191654205322} -09/20/2021 19:12:01 - INFO - __main__ - Step 21763: {'lr': 0.00019992430587845056, 'samples': 696416, 'steps': 1360, 'loss/train': 3.1317005157470703} -09/20/2021 19:12:02 - INFO - __main__ - Step 21764: {'lr': 0.00019992430587845056, 'samples': 696448, 'steps': 1360, 'loss/train': 4.032617568969727} -09/20/2021 19:12:03 - INFO - __main__ - Step 21765: {'lr': 0.00019992430587845056, 'samples': 696480, 'steps': 1360, 'loss/train': 2.7551980018615723} -09/20/2021 19:12:03 - INFO - __main__ - Step 21766: {'lr': 0.00019992430587845056, 'samples': 696512, 'steps': 1360, 'loss/train': 3.9383676052093506} -09/20/2021 19:12:04 - INFO - __main__ - Step 21767: {'lr': 0.00019992430587845056, 'samples': 696544, 'steps': 1360, 'loss/train': 3.827786684036255} -09/20/2021 19:12:05 - INFO - __main__ - Step 21768: {'lr': 0.00019992430587845056, 'samples': 696576, 'steps': 1360, 'loss/train': 3.4024477005004883} -09/20/2021 19:12:06 - INFO - __main__ - Step 21769: {'lr': 0.00019992430587845056, 'samples': 696608, 'steps': 1360, 'loss/train': 2.190791130065918} -09/20/2021 19:12:06 - INFO - __main__ - Step 21770: {'lr': 0.00019992430587845056, 'samples': 696640, 'steps': 1360, 'loss/train': 2.3852880001068115} -09/20/2021 19:12:07 - INFO - __main__ - Step 21771: {'lr': 0.00019992430587845056, 'samples': 696672, 'steps': 1360, 'loss/train': 2.2291109561920166} -09/20/2021 19:12:08 - INFO - __main__ - Step 21772: {'lr': 0.00019992430587845056, 'samples': 696704, 'steps': 1360, 'loss/train': 3.1665756702423096} -09/20/2021 19:12:09 - INFO - __main__ - Step 21773: {'lr': 0.00019992430587845056, 'samples': 696736, 'steps': 1360, 'loss/train': 4.078650951385498} -09/20/2021 19:12:10 - INFO - __main__ - Step 21774: {'lr': 0.00019992430587845056, 'samples': 696768, 'steps': 1360, 'loss/train': 3.1355738639831543} -09/20/2021 19:12:11 - INFO - __main__ - Step 21775: {'lr': 0.00019992430587845056, 'samples': 696800, 'steps': 1360, 'loss/train': 3.5532917976379395} -09/20/2021 19:12:11 - INFO - __main__ - Step 21776: {'lr': 0.00019992430587845056, 'samples': 696832, 'steps': 1360, 'loss/train': 3.2312066555023193} -09/20/2021 19:12:12 - INFO - __main__ - Step 21777: {'lr': 0.00019992405752902127, 'samples': 696864, 'steps': 1361, 'loss/train': 3.3410532474517822} -09/20/2021 19:12:13 - INFO - __main__ - Step 21778: {'lr': 0.00019992405752902127, 'samples': 696896, 'steps': 1361, 'loss/train': 4.024118900299072} -09/20/2021 19:12:14 - INFO - __main__ - Step 21779: {'lr': 0.00019992405752902127, 'samples': 696928, 'steps': 1361, 'loss/train': 2.959038496017456} -09/20/2021 19:12:15 - INFO - __main__ - Step 21780: {'lr': 0.00019992405752902127, 'samples': 696960, 'steps': 1361, 'loss/train': 3.8022878170013428} -09/20/2021 19:12:15 - INFO - __main__ - Step 21781: {'lr': 0.00019992405752902127, 'samples': 696992, 'steps': 1361, 'loss/train': 2.978365898132324} -09/20/2021 19:12:16 - INFO - __main__ - Step 21782: {'lr': 0.00019992405752902127, 'samples': 697024, 'steps': 1361, 'loss/train': 2.5992512702941895} -09/20/2021 19:12:17 - INFO - __main__ - Step 21783: {'lr': 0.00019992405752902127, 'samples': 697056, 'steps': 1361, 'loss/train': 3.753099203109741} -09/20/2021 19:12:18 - INFO - __main__ - Step 21784: {'lr': 0.00019992405752902127, 'samples': 697088, 'steps': 1361, 'loss/train': 2.180950164794922} -09/20/2021 19:12:18 - INFO - __main__ - Step 21785: {'lr': 0.00019992405752902127, 'samples': 697120, 'steps': 1361, 'loss/train': 2.273862361907959} -09/20/2021 19:12:19 - INFO - __main__ - Step 21786: {'lr': 0.00019992405752902127, 'samples': 697152, 'steps': 1361, 'loss/train': 3.18603253364563} -09/20/2021 19:12:20 - INFO - __main__ - Step 21787: {'lr': 0.00019992405752902127, 'samples': 697184, 'steps': 1361, 'loss/train': 5.655533790588379} -09/20/2021 19:12:21 - INFO - __main__ - Step 21788: {'lr': 0.00019992405752902127, 'samples': 697216, 'steps': 1361, 'loss/train': 3.313060760498047} -09/20/2021 19:12:21 - INFO - __main__ - Step 21789: {'lr': 0.00019992405752902127, 'samples': 697248, 'steps': 1361, 'loss/train': 2.9398186206817627} -09/20/2021 19:12:22 - INFO - __main__ - Step 21790: {'lr': 0.00019992405752902127, 'samples': 697280, 'steps': 1361, 'loss/train': 3.6330759525299072} -09/20/2021 19:12:23 - INFO - __main__ - Step 21791: {'lr': 0.00019992405752902127, 'samples': 697312, 'steps': 1361, 'loss/train': 2.299896478652954} -09/20/2021 19:12:24 - INFO - __main__ - Step 21792: {'lr': 0.00019992405752902127, 'samples': 697344, 'steps': 1361, 'loss/train': 6.299976348876953} -09/20/2021 19:12:24 - INFO - __main__ - Step 21793: {'lr': 0.00019992380877300133, 'samples': 697376, 'steps': 1362, 'loss/train': 2.6370909214019775} -09/20/2021 19:12:25 - INFO - __main__ - Step 21794: {'lr': 0.00019992380877300133, 'samples': 697408, 'steps': 1362, 'loss/train': 3.1919078826904297} -09/20/2021 19:12:26 - INFO - __main__ - Step 21795: {'lr': 0.00019992380877300133, 'samples': 697440, 'steps': 1362, 'loss/train': 3.3661794662475586} -09/20/2021 19:12:27 - INFO - __main__ - Step 21796: {'lr': 0.00019992380877300133, 'samples': 697472, 'steps': 1362, 'loss/train': 2.7249929904937744} -09/20/2021 19:12:27 - INFO - __main__ - Step 21797: {'lr': 0.00019992380877300133, 'samples': 697504, 'steps': 1362, 'loss/train': 2.9127542972564697} -09/20/2021 19:12:28 - INFO - __main__ - Step 21798: {'lr': 0.00019992380877300133, 'samples': 697536, 'steps': 1362, 'loss/train': 3.1129112243652344} -09/20/2021 19:12:29 - INFO - __main__ - Step 21799: {'lr': 0.00019992380877300133, 'samples': 697568, 'steps': 1362, 'loss/train': 4.341268062591553} -09/20/2021 19:12:30 - INFO - __main__ - Step 21800: {'lr': 0.00019992380877300133, 'samples': 697600, 'steps': 1362, 'loss/train': 3.583465099334717} -09/20/2021 19:12:30 - INFO - __main__ - Step 21801: {'lr': 0.00019992380877300133, 'samples': 697632, 'steps': 1362, 'loss/train': 3.4481828212738037} -09/20/2021 19:12:31 - INFO - __main__ - Step 21802: {'lr': 0.00019992380877300133, 'samples': 697664, 'steps': 1362, 'loss/train': 3.0529427528381348} -09/20/2021 19:12:32 - INFO - __main__ - Step 21803: {'lr': 0.00019992380877300133, 'samples': 697696, 'steps': 1362, 'loss/train': 2.6086156368255615} -09/20/2021 19:12:33 - INFO - __main__ - Step 21804: {'lr': 0.00019992380877300133, 'samples': 697728, 'steps': 1362, 'loss/train': 3.195117235183716} -09/20/2021 19:12:34 - INFO - __main__ - Step 21805: {'lr': 0.00019992380877300133, 'samples': 697760, 'steps': 1362, 'loss/train': 4.271962642669678} -09/20/2021 19:12:35 - INFO - __main__ - Step 21806: {'lr': 0.00019992380877300133, 'samples': 697792, 'steps': 1362, 'loss/train': 3.1614677906036377} -09/20/2021 19:12:35 - INFO - __main__ - Step 21807: {'lr': 0.00019992380877300133, 'samples': 697824, 'steps': 1362, 'loss/train': 0.7703566551208496} -09/20/2021 19:12:36 - INFO - __main__ - Step 21808: {'lr': 0.00019992380877300133, 'samples': 697856, 'steps': 1362, 'loss/train': 2.7064781188964844} -09/20/2021 19:12:37 - INFO - __main__ - Step 21809: {'lr': 0.00019992355961039184, 'samples': 697888, 'steps': 1363, 'loss/train': 2.797699451446533} -09/20/2021 19:12:38 - INFO - __main__ - Step 21810: {'lr': 0.00019992355961039184, 'samples': 697920, 'steps': 1363, 'loss/train': 2.766413927078247} -09/20/2021 19:12:39 - INFO - __main__ - Step 21811: {'lr': 0.00019992355961039184, 'samples': 697952, 'steps': 1363, 'loss/train': 3.8054847717285156} -09/20/2021 19:12:39 - INFO - __main__ - Step 21812: {'lr': 0.00019992355961039184, 'samples': 697984, 'steps': 1363, 'loss/train': 3.634227991104126} -09/20/2021 19:12:40 - INFO - __main__ - Step 21813: {'lr': 0.00019992355961039184, 'samples': 698016, 'steps': 1363, 'loss/train': 3.2345480918884277} -09/20/2021 19:12:41 - INFO - __main__ - Step 21814: {'lr': 0.00019992355961039184, 'samples': 698048, 'steps': 1363, 'loss/train': 3.3739571571350098} -09/20/2021 19:12:42 - INFO - __main__ - Step 21815: {'lr': 0.00019992355961039184, 'samples': 698080, 'steps': 1363, 'loss/train': 3.584040403366089} -09/20/2021 19:12:42 - INFO - __main__ - Step 21816: {'lr': 0.00019992355961039184, 'samples': 698112, 'steps': 1363, 'loss/train': 3.0191702842712402} -09/20/2021 19:12:43 - INFO - __main__ - Step 21817: {'lr': 0.00019992355961039184, 'samples': 698144, 'steps': 1363, 'loss/train': 3.3594257831573486} -09/20/2021 19:12:44 - INFO - __main__ - Step 21818: {'lr': 0.00019992355961039184, 'samples': 698176, 'steps': 1363, 'loss/train': 3.2219390869140625} -09/20/2021 19:12:45 - INFO - __main__ - Step 21819: {'lr': 0.00019992355961039184, 'samples': 698208, 'steps': 1363, 'loss/train': 2.570349931716919} -09/20/2021 19:12:45 - INFO - __main__ - Step 21820: {'lr': 0.00019992355961039184, 'samples': 698240, 'steps': 1363, 'loss/train': 2.493842363357544} -09/20/2021 19:12:46 - INFO - __main__ - Step 21821: {'lr': 0.00019992355961039184, 'samples': 698272, 'steps': 1363, 'loss/train': 2.6553099155426025} -09/20/2021 19:12:47 - INFO - __main__ - Step 21822: {'lr': 0.00019992355961039184, 'samples': 698304, 'steps': 1363, 'loss/train': 2.60392427444458} -09/20/2021 19:12:48 - INFO - __main__ - Step 21823: {'lr': 0.00019992355961039184, 'samples': 698336, 'steps': 1363, 'loss/train': 3.8559277057647705} -09/20/2021 19:12:48 - INFO - __main__ - Step 21824: {'lr': 0.00019992355961039184, 'samples': 698368, 'steps': 1363, 'loss/train': 2.7331793308258057} -09/20/2021 19:12:49 - INFO - __main__ - Step 21825: {'lr': 0.00019992331004119374, 'samples': 698400, 'steps': 1364, 'loss/train': 3.1352157592773438} -09/20/2021 19:12:50 - INFO - __main__ - Step 21826: {'lr': 0.00019992331004119374, 'samples': 698432, 'steps': 1364, 'loss/train': 2.630869150161743} -09/20/2021 19:12:51 - INFO - __main__ - Step 21827: {'lr': 0.00019992331004119374, 'samples': 698464, 'steps': 1364, 'loss/train': 2.625864267349243} -09/20/2021 19:12:51 - INFO - __main__ - Step 21828: {'lr': 0.00019992331004119374, 'samples': 698496, 'steps': 1364, 'loss/train': 3.6228983402252197} -09/20/2021 19:12:52 - INFO - __main__ - Step 21829: {'lr': 0.00019992331004119374, 'samples': 698528, 'steps': 1364, 'loss/train': 3.4786036014556885} -09/20/2021 19:12:53 - INFO - __main__ - Step 21830: {'lr': 0.00019992331004119374, 'samples': 698560, 'steps': 1364, 'loss/train': 3.3923285007476807} -09/20/2021 19:12:54 - INFO - __main__ - Step 21831: {'lr': 0.00019992331004119374, 'samples': 698592, 'steps': 1364, 'loss/train': 1.1959209442138672} -09/20/2021 19:12:54 - INFO - __main__ - Step 21832: {'lr': 0.00019992331004119374, 'samples': 698624, 'steps': 1364, 'loss/train': 1.6310585737228394} -09/20/2021 19:12:55 - INFO - __main__ - Step 21833: {'lr': 0.00019992331004119374, 'samples': 698656, 'steps': 1364, 'loss/train': 4.111669540405273} -09/20/2021 19:12:56 - INFO - __main__ - Step 21834: {'lr': 0.00019992331004119374, 'samples': 698688, 'steps': 1364, 'loss/train': 2.861539602279663} -09/20/2021 19:12:57 - INFO - __main__ - Step 21835: {'lr': 0.00019992331004119374, 'samples': 698720, 'steps': 1364, 'loss/train': 2.9832637310028076} -09/20/2021 19:12:58 - INFO - __main__ - Step 21836: {'lr': 0.00019992331004119374, 'samples': 698752, 'steps': 1364, 'loss/train': 2.4717888832092285} -09/20/2021 19:12:59 - INFO - __main__ - Step 21837: {'lr': 0.00019992331004119374, 'samples': 698784, 'steps': 1364, 'loss/train': 3.686889171600342} -09/20/2021 19:12:59 - INFO - __main__ - Step 21838: {'lr': 0.00019992331004119374, 'samples': 698816, 'steps': 1364, 'loss/train': 3.3611011505126953} -09/20/2021 19:13:00 - INFO - __main__ - Step 21839: {'lr': 0.00019992331004119374, 'samples': 698848, 'steps': 1364, 'loss/train': 3.778017282485962} -09/20/2021 19:13:01 - INFO - __main__ - Step 21840: {'lr': 0.00019992331004119374, 'samples': 698880, 'steps': 1364, 'loss/train': 3.102604627609253} -09/20/2021 19:13:02 - INFO - __main__ - Step 21841: {'lr': 0.0001999230600654081, 'samples': 698912, 'steps': 1365, 'loss/train': 3.155785083770752} -09/20/2021 19:13:03 - INFO - __main__ - Step 21842: {'lr': 0.0001999230600654081, 'samples': 698944, 'steps': 1365, 'loss/train': 3.0255374908447266} -09/20/2021 19:13:03 - INFO - __main__ - Step 21843: {'lr': 0.0001999230600654081, 'samples': 698976, 'steps': 1365, 'loss/train': 3.811263084411621} -09/20/2021 19:13:04 - INFO - __main__ - Step 21844: {'lr': 0.0001999230600654081, 'samples': 699008, 'steps': 1365, 'loss/train': 3.6628923416137695} -09/20/2021 19:13:05 - INFO - __main__ - Step 21845: {'lr': 0.0001999230600654081, 'samples': 699040, 'steps': 1365, 'loss/train': 3.2382113933563232} -09/20/2021 19:13:06 - INFO - __main__ - Step 21846: {'lr': 0.0001999230600654081, 'samples': 699072, 'steps': 1365, 'loss/train': 3.343700885772705} -09/20/2021 19:13:06 - INFO - __main__ - Step 21847: {'lr': 0.0001999230600654081, 'samples': 699104, 'steps': 1365, 'loss/train': 3.130267381668091} -09/20/2021 19:13:07 - INFO - __main__ - Step 21848: {'lr': 0.0001999230600654081, 'samples': 699136, 'steps': 1365, 'loss/train': 3.446211814880371} -09/20/2021 19:13:08 - INFO - __main__ - Step 21849: {'lr': 0.0001999230600654081, 'samples': 699168, 'steps': 1365, 'loss/train': 3.5066134929656982} -09/20/2021 19:13:09 - INFO - __main__ - Step 21850: {'lr': 0.0001999230600654081, 'samples': 699200, 'steps': 1365, 'loss/train': 3.3161823749542236} -09/20/2021 19:13:09 - INFO - __main__ - Step 21851: {'lr': 0.0001999230600654081, 'samples': 699232, 'steps': 1365, 'loss/train': 2.9217913150787354} -09/20/2021 19:13:10 - INFO - __main__ - Step 21852: {'lr': 0.0001999230600654081, 'samples': 699264, 'steps': 1365, 'loss/train': 3.0536420345306396} -09/20/2021 19:13:11 - INFO - __main__ - Step 21853: {'lr': 0.0001999230600654081, 'samples': 699296, 'steps': 1365, 'loss/train': 2.6656923294067383} -09/20/2021 19:13:12 - INFO - __main__ - Step 21854: {'lr': 0.0001999230600654081, 'samples': 699328, 'steps': 1365, 'loss/train': 2.6759657859802246} -09/20/2021 19:13:12 - INFO - __main__ - Step 21855: {'lr': 0.0001999230600654081, 'samples': 699360, 'steps': 1365, 'loss/train': 3.790144681930542} -09/20/2021 19:13:13 - INFO - __main__ - Step 21856: {'lr': 0.0001999230600654081, 'samples': 699392, 'steps': 1365, 'loss/train': 2.2670040130615234} -09/20/2021 19:13:14 - INFO - __main__ - Step 21857: {'lr': 0.00019992280968303595, 'samples': 699424, 'steps': 1366, 'loss/train': 3.7778401374816895} -09/20/2021 19:13:15 - INFO - __main__ - Step 21858: {'lr': 0.00019992280968303595, 'samples': 699456, 'steps': 1366, 'loss/train': 3.0562546253204346} -09/20/2021 19:13:15 - INFO - __main__ - Step 21859: {'lr': 0.00019992280968303595, 'samples': 699488, 'steps': 1366, 'loss/train': 2.6935062408447266} -09/20/2021 19:13:16 - INFO - __main__ - Step 21860: {'lr': 0.00019992280968303595, 'samples': 699520, 'steps': 1366, 'loss/train': 3.255934715270996} -09/20/2021 19:13:17 - INFO - __main__ - Step 21861: {'lr': 0.00019992280968303595, 'samples': 699552, 'steps': 1366, 'loss/train': 3.816521167755127} -09/20/2021 19:13:18 - INFO - __main__ - Step 21862: {'lr': 0.00019992280968303595, 'samples': 699584, 'steps': 1366, 'loss/train': 3.3200337886810303} -09/20/2021 19:13:18 - INFO - __main__ - Step 21863: {'lr': 0.00019992280968303595, 'samples': 699616, 'steps': 1366, 'loss/train': 2.745046615600586} -09/20/2021 19:13:19 - INFO - __main__ - Step 21864: {'lr': 0.00019992280968303595, 'samples': 699648, 'steps': 1366, 'loss/train': 2.076458215713501} -09/20/2021 19:13:21 - INFO - __main__ - Step 21865: {'lr': 0.00019992280968303595, 'samples': 699680, 'steps': 1366, 'loss/train': 3.425058126449585} -09/20/2021 19:13:21 - INFO - __main__ - Step 21866: {'lr': 0.00019992280968303595, 'samples': 699712, 'steps': 1366, 'loss/train': 1.1707292795181274} -09/20/2021 19:13:22 - INFO - __main__ - Step 21867: {'lr': 0.00019992280968303595, 'samples': 699744, 'steps': 1366, 'loss/train': 1.1960312128067017} -09/20/2021 19:13:23 - INFO - __main__ - Step 21868: {'lr': 0.00019992280968303595, 'samples': 699776, 'steps': 1366, 'loss/train': 0.46995681524276733} -09/20/2021 19:13:24 - INFO - __main__ - Step 21869: {'lr': 0.00019992280968303595, 'samples': 699808, 'steps': 1366, 'loss/train': 0.6240479350090027} -09/20/2021 19:13:24 - INFO - __main__ - Step 21870: {'lr': 0.00019992280968303595, 'samples': 699840, 'steps': 1366, 'loss/train': 2.879789352416992} -09/20/2021 19:13:25 - INFO - __main__ - Step 21871: {'lr': 0.00019992280968303595, 'samples': 699872, 'steps': 1366, 'loss/train': 2.847036361694336} -09/20/2021 19:13:26 - INFO - __main__ - Step 21872: {'lr': 0.00019992280968303595, 'samples': 699904, 'steps': 1366, 'loss/train': 4.662391662597656} -09/20/2021 19:13:27 - INFO - __main__ - Step 21873: {'lr': 0.00019992255889407824, 'samples': 699936, 'steps': 1367, 'loss/train': 3.164299488067627} -09/20/2021 19:13:27 - INFO - __main__ - Step 21874: {'lr': 0.00019992255889407824, 'samples': 699968, 'steps': 1367, 'loss/train': 2.7373573780059814} -09/20/2021 19:13:28 - INFO - __main__ - Step 21875: {'lr': 0.00019992255889407824, 'samples': 700000, 'steps': 1367, 'loss/train': 5.988408088684082} -09/20/2021 19:13:29 - INFO - __main__ - Step 21876: {'lr': 0.00019992255889407824, 'samples': 700032, 'steps': 1367, 'loss/train': 3.265963077545166} -09/20/2021 19:13:30 - INFO - __main__ - Step 21877: {'lr': 0.00019992255889407824, 'samples': 700064, 'steps': 1367, 'loss/train': 3.0996530055999756} -09/20/2021 19:13:30 - INFO - __main__ - Step 21878: {'lr': 0.00019992255889407824, 'samples': 700096, 'steps': 1367, 'loss/train': 3.0594868659973145} -09/20/2021 19:13:31 - INFO - __main__ - Step 21879: {'lr': 0.00019992255889407824, 'samples': 700128, 'steps': 1367, 'loss/train': 3.03471040725708} -09/20/2021 19:13:32 - INFO - __main__ - Step 21880: {'lr': 0.00019992255889407824, 'samples': 700160, 'steps': 1367, 'loss/train': 2.299407482147217} -09/20/2021 19:13:33 - INFO - __main__ - Step 21881: {'lr': 0.00019992255889407824, 'samples': 700192, 'steps': 1367, 'loss/train': 3.086641788482666} -09/20/2021 19:13:33 - INFO - __main__ - Step 21882: {'lr': 0.00019992255889407824, 'samples': 700224, 'steps': 1367, 'loss/train': 3.1839513778686523} -09/20/2021 19:13:34 - INFO - __main__ - Step 21883: {'lr': 0.00019992255889407824, 'samples': 700256, 'steps': 1367, 'loss/train': 3.3801138401031494} -09/20/2021 19:13:35 - INFO - __main__ - Step 21884: {'lr': 0.00019992255889407824, 'samples': 700288, 'steps': 1367, 'loss/train': 3.430109977722168} -09/20/2021 19:13:36 - INFO - __main__ - Step 21885: {'lr': 0.00019992255889407824, 'samples': 700320, 'steps': 1367, 'loss/train': 3.152050256729126} -09/20/2021 19:13:36 - INFO - __main__ - Step 21886: {'lr': 0.00019992255889407824, 'samples': 700352, 'steps': 1367, 'loss/train': 2.9046945571899414} -09/20/2021 19:13:37 - INFO - __main__ - Step 21887: {'lr': 0.00019992255889407824, 'samples': 700384, 'steps': 1367, 'loss/train': 2.4231300354003906} -09/20/2021 19:13:38 - INFO - __main__ - Step 21888: {'lr': 0.00019992255889407824, 'samples': 700416, 'steps': 1367, 'loss/train': 2.9990170001983643} -09/20/2021 19:13:39 - INFO - __main__ - Step 21889: {'lr': 0.000199922307698536, 'samples': 700448, 'steps': 1368, 'loss/train': 3.8617146015167236} -09/20/2021 19:13:40 - INFO - __main__ - Step 21890: {'lr': 0.000199922307698536, 'samples': 700480, 'steps': 1368, 'loss/train': 2.3695788383483887} -09/20/2021 19:13:40 - INFO - __main__ - Step 21891: {'lr': 0.000199922307698536, 'samples': 700512, 'steps': 1368, 'loss/train': 1.220442533493042} -09/20/2021 19:13:41 - INFO - __main__ - Step 21892: {'lr': 0.000199922307698536, 'samples': 700544, 'steps': 1368, 'loss/train': 3.1342661380767822} -09/20/2021 19:13:42 - INFO - __main__ - Step 21893: {'lr': 0.000199922307698536, 'samples': 700576, 'steps': 1368, 'loss/train': 2.1104116439819336} -09/20/2021 19:13:43 - INFO - __main__ - Step 21894: {'lr': 0.000199922307698536, 'samples': 700608, 'steps': 1368, 'loss/train': 2.247535467147827} -09/20/2021 19:13:43 - INFO - __main__ - Step 21895: {'lr': 0.000199922307698536, 'samples': 700640, 'steps': 1368, 'loss/train': 5.253411769866943} -09/20/2021 19:13:44 - INFO - __main__ - Step 21896: {'lr': 0.000199922307698536, 'samples': 700672, 'steps': 1368, 'loss/train': 5.339803695678711} -09/20/2021 19:13:45 - INFO - __main__ - Step 21897: {'lr': 0.000199922307698536, 'samples': 700704, 'steps': 1368, 'loss/train': 5.440622806549072} -09/20/2021 19:13:46 - INFO - __main__ - Step 21898: {'lr': 0.000199922307698536, 'samples': 700736, 'steps': 1368, 'loss/train': 5.363778591156006} -09/20/2021 19:13:46 - INFO - __main__ - Step 21899: {'lr': 0.000199922307698536, 'samples': 700768, 'steps': 1368, 'loss/train': 5.32027006149292} -09/20/2021 19:13:48 - INFO - __main__ - Step 21900: {'lr': 0.000199922307698536, 'samples': 700800, 'steps': 1368, 'loss/train': 5.332651615142822} -09/20/2021 19:13:49 - INFO - __main__ - Step 21901: {'lr': 0.000199922307698536, 'samples': 700832, 'steps': 1368, 'loss/train': 2.7767505645751953} -09/20/2021 19:13:49 - INFO - __main__ - Step 21902: {'lr': 0.000199922307698536, 'samples': 700864, 'steps': 1368, 'loss/train': 3.165036916732788} -09/20/2021 19:13:50 - INFO - __main__ - Step 21903: {'lr': 0.000199922307698536, 'samples': 700896, 'steps': 1368, 'loss/train': 3.2528393268585205} -09/20/2021 19:13:51 - INFO - __main__ - Step 21904: {'lr': 0.000199922307698536, 'samples': 700928, 'steps': 1368, 'loss/train': 3.4946577548980713} -09/20/2021 19:13:52 - INFO - __main__ - Step 21905: {'lr': 0.00019992205609641031, 'samples': 700960, 'steps': 1369, 'loss/train': 3.4419844150543213} -09/20/2021 19:13:52 - INFO - __main__ - Step 21906: {'lr': 0.00019992205609641031, 'samples': 700992, 'steps': 1369, 'loss/train': 2.577709436416626} -09/20/2021 19:13:53 - INFO - __main__ - Step 21907: {'lr': 0.00019992205609641031, 'samples': 701024, 'steps': 1369, 'loss/train': 2.6621901988983154} -09/20/2021 19:13:54 - INFO - __main__ - Step 21908: {'lr': 0.00019992205609641031, 'samples': 701056, 'steps': 1369, 'loss/train': 3.1819746494293213} -09/20/2021 19:13:55 - INFO - __main__ - Step 21909: {'lr': 0.00019992205609641031, 'samples': 701088, 'steps': 1369, 'loss/train': 3.5964267253875732} -09/20/2021 19:13:55 - INFO - __main__ - Step 21910: {'lr': 0.00019992205609641031, 'samples': 701120, 'steps': 1369, 'loss/train': 3.7199838161468506} -09/20/2021 19:13:56 - INFO - __main__ - Step 21911: {'lr': 0.00019992205609641031, 'samples': 701152, 'steps': 1369, 'loss/train': 2.381027936935425} -09/20/2021 19:13:57 - INFO - __main__ - Step 21912: {'lr': 0.00019992205609641031, 'samples': 701184, 'steps': 1369, 'loss/train': 0.8012592196464539} -09/20/2021 19:13:58 - INFO - __main__ - Step 21913: {'lr': 0.00019992205609641031, 'samples': 701216, 'steps': 1369, 'loss/train': 2.9346060752868652} -09/20/2021 19:13:58 - INFO - __main__ - Step 21914: {'lr': 0.00019992205609641031, 'samples': 701248, 'steps': 1369, 'loss/train': 0.9698953628540039} -09/20/2021 19:13:59 - INFO - __main__ - Step 21915: {'lr': 0.00019992205609641031, 'samples': 701280, 'steps': 1369, 'loss/train': 2.198122024536133} -09/20/2021 19:14:00 - INFO - __main__ - Step 21916: {'lr': 0.00019992205609641031, 'samples': 701312, 'steps': 1369, 'loss/train': 2.1184725761413574} -09/20/2021 19:14:01 - INFO - __main__ - Step 21917: {'lr': 0.00019992205609641031, 'samples': 701344, 'steps': 1369, 'loss/train': 1.9658691883087158} -09/20/2021 19:14:01 - INFO - __main__ - Step 21918: {'lr': 0.00019992205609641031, 'samples': 701376, 'steps': 1369, 'loss/train': 2.2562191486358643} -09/20/2021 19:14:02 - INFO - __main__ - Step 21919: {'lr': 0.00019992205609641031, 'samples': 701408, 'steps': 1369, 'loss/train': 3.4915246963500977} -09/20/2021 19:14:03 - INFO - __main__ - Step 21920: {'lr': 0.00019992205609641031, 'samples': 701440, 'steps': 1369, 'loss/train': 2.606741428375244} -09/20/2021 19:14:04 - INFO - __main__ - Step 21921: {'lr': 0.00019992180408770217, 'samples': 701472, 'steps': 1370, 'loss/train': 3.2322545051574707} -09/20/2021 19:14:05 - INFO - __main__ - Step 21922: {'lr': 0.00019992180408770217, 'samples': 701504, 'steps': 1370, 'loss/train': 2.7902095317840576} -09/20/2021 19:14:05 - INFO - __main__ - Step 21923: {'lr': 0.00019992180408770217, 'samples': 701536, 'steps': 1370, 'loss/train': 3.930755376815796} -09/20/2021 19:14:06 - INFO - __main__ - Step 21924: {'lr': 0.00019992180408770217, 'samples': 701568, 'steps': 1370, 'loss/train': 3.3314552307128906} -09/20/2021 19:14:07 - INFO - __main__ - Step 21925: {'lr': 0.00019992180408770217, 'samples': 701600, 'steps': 1370, 'loss/train': 2.784949541091919} -09/20/2021 19:14:08 - INFO - __main__ - Step 21926: {'lr': 0.00019992180408770217, 'samples': 701632, 'steps': 1370, 'loss/train': 4.001908779144287} -09/20/2021 19:14:08 - INFO - __main__ - Step 21927: {'lr': 0.00019992180408770217, 'samples': 701664, 'steps': 1370, 'loss/train': 3.9523279666900635} -09/20/2021 19:14:09 - INFO - __main__ - Step 21928: {'lr': 0.00019992180408770217, 'samples': 701696, 'steps': 1370, 'loss/train': 3.2428805828094482} -09/20/2021 19:14:10 - INFO - __main__ - Step 21929: {'lr': 0.00019992180408770217, 'samples': 701728, 'steps': 1370, 'loss/train': 4.292374134063721} -09/20/2021 19:14:11 - INFO - __main__ - Step 21930: {'lr': 0.00019992180408770217, 'samples': 701760, 'steps': 1370, 'loss/train': 2.854858636856079} -09/20/2021 19:14:11 - INFO - __main__ - Step 21931: {'lr': 0.00019992180408770217, 'samples': 701792, 'steps': 1370, 'loss/train': 3.796156167984009} -09/20/2021 19:14:12 - INFO - __main__ - Step 21932: {'lr': 0.00019992180408770217, 'samples': 701824, 'steps': 1370, 'loss/train': 3.511641263961792} -09/20/2021 19:14:13 - INFO - __main__ - Step 21933: {'lr': 0.00019992180408770217, 'samples': 701856, 'steps': 1370, 'loss/train': 3.1721644401550293} -09/20/2021 19:14:14 - INFO - __main__ - Step 21934: {'lr': 0.00019992180408770217, 'samples': 701888, 'steps': 1370, 'loss/train': 2.7832744121551514} -09/20/2021 19:14:15 - INFO - __main__ - Step 21935: {'lr': 0.00019992180408770217, 'samples': 701920, 'steps': 1370, 'loss/train': 1.9066110849380493} -09/20/2021 19:14:16 - INFO - __main__ - Step 21936: {'lr': 0.00019992180408770217, 'samples': 701952, 'steps': 1370, 'loss/train': 3.719684600830078} -09/20/2021 19:14:17 - INFO - __main__ - Step 21937: {'lr': 0.00019992155167241257, 'samples': 701984, 'steps': 1371, 'loss/train': 2.8220059871673584} -09/20/2021 19:14:17 - INFO - __main__ - Step 21938: {'lr': 0.00019992155167241257, 'samples': 702016, 'steps': 1371, 'loss/train': 2.9864532947540283} -09/20/2021 19:14:18 - INFO - __main__ - Step 21939: {'lr': 0.00019992155167241257, 'samples': 702048, 'steps': 1371, 'loss/train': 3.2084763050079346} -09/20/2021 19:14:19 - INFO - __main__ - Step 21940: {'lr': 0.00019992155167241257, 'samples': 702080, 'steps': 1371, 'loss/train': 2.2751119136810303} -09/20/2021 19:14:20 - INFO - __main__ - Step 21941: {'lr': 0.00019992155167241257, 'samples': 702112, 'steps': 1371, 'loss/train': 3.15964412689209} -09/20/2021 19:14:20 - INFO - __main__ - Step 21942: {'lr': 0.00019992155167241257, 'samples': 702144, 'steps': 1371, 'loss/train': 2.231527805328369} -09/20/2021 19:14:21 - INFO - __main__ - Step 21943: {'lr': 0.00019992155167241257, 'samples': 702176, 'steps': 1371, 'loss/train': 3.182727575302124} -09/20/2021 19:14:22 - INFO - __main__ - Step 21944: {'lr': 0.00019992155167241257, 'samples': 702208, 'steps': 1371, 'loss/train': 1.37450110912323} -09/20/2021 19:14:23 - INFO - __main__ - Step 21945: {'lr': 0.00019992155167241257, 'samples': 702240, 'steps': 1371, 'loss/train': 2.6045291423797607} -09/20/2021 19:14:23 - INFO - __main__ - Step 21946: {'lr': 0.00019992155167241257, 'samples': 702272, 'steps': 1371, 'loss/train': 6.304121494293213} -09/20/2021 19:14:24 - INFO - __main__ - Step 21947: {'lr': 0.00019992155167241257, 'samples': 702304, 'steps': 1371, 'loss/train': 3.246906042098999} -09/20/2021 19:14:25 - INFO - __main__ - Step 21948: {'lr': 0.00019992155167241257, 'samples': 702336, 'steps': 1371, 'loss/train': 3.0314252376556396} -09/20/2021 19:14:26 - INFO - __main__ - Step 21949: {'lr': 0.00019992155167241257, 'samples': 702368, 'steps': 1371, 'loss/train': 1.373473048210144} -09/20/2021 19:14:26 - INFO - __main__ - Step 21950: {'lr': 0.00019992155167241257, 'samples': 702400, 'steps': 1371, 'loss/train': 0.7758122086524963} -09/20/2021 19:14:27 - INFO - __main__ - Step 21951: {'lr': 0.00019992155167241257, 'samples': 702432, 'steps': 1371, 'loss/train': 2.986685037612915} -09/20/2021 19:14:28 - INFO - __main__ - Step 21952: {'lr': 0.00019992155167241257, 'samples': 702464, 'steps': 1371, 'loss/train': 3.226942777633667} -09/20/2021 19:14:29 - INFO - __main__ - Step 21953: {'lr': 0.0001999212988505426, 'samples': 702496, 'steps': 1372, 'loss/train': 2.88950514793396} -09/20/2021 19:14:30 - INFO - __main__ - Step 21954: {'lr': 0.0001999212988505426, 'samples': 702528, 'steps': 1372, 'loss/train': 2.8975558280944824} -09/20/2021 19:14:30 - INFO - __main__ - Step 21955: {'lr': 0.0001999212988505426, 'samples': 702560, 'steps': 1372, 'loss/train': 4.7133684158325195} -09/20/2021 19:14:31 - INFO - __main__ - Step 21956: {'lr': 0.0001999212988505426, 'samples': 702592, 'steps': 1372, 'loss/train': 3.9742348194122314} -09/20/2021 19:14:32 - INFO - __main__ - Step 21957: {'lr': 0.0001999212988505426, 'samples': 702624, 'steps': 1372, 'loss/train': 3.955390691757202} -09/20/2021 19:14:33 - INFO - __main__ - Step 21958: {'lr': 0.0001999212988505426, 'samples': 702656, 'steps': 1372, 'loss/train': 1.5367047786712646} -09/20/2021 19:14:33 - INFO - __main__ - Step 21959: {'lr': 0.0001999212988505426, 'samples': 702688, 'steps': 1372, 'loss/train': 2.3792927265167236} -09/20/2021 19:14:34 - INFO - __main__ - Step 21960: {'lr': 0.0001999212988505426, 'samples': 702720, 'steps': 1372, 'loss/train': 4.346665859222412} -09/20/2021 19:14:35 - INFO - __main__ - Step 21961: {'lr': 0.0001999212988505426, 'samples': 702752, 'steps': 1372, 'loss/train': 3.2531239986419678} -09/20/2021 19:14:36 - INFO - __main__ - Step 21962: {'lr': 0.0001999212988505426, 'samples': 702784, 'steps': 1372, 'loss/train': 3.662403106689453} -09/20/2021 19:14:36 - INFO - __main__ - Step 21963: {'lr': 0.0001999212988505426, 'samples': 702816, 'steps': 1372, 'loss/train': 3.434981107711792} -09/20/2021 19:14:37 - INFO - __main__ - Step 21964: {'lr': 0.0001999212988505426, 'samples': 702848, 'steps': 1372, 'loss/train': 2.335448741912842} -09/20/2021 19:14:38 - INFO - __main__ - Step 21965: {'lr': 0.0001999212988505426, 'samples': 702880, 'steps': 1372, 'loss/train': 3.3619437217712402} -09/20/2021 19:14:39 - INFO - __main__ - Step 21966: {'lr': 0.0001999212988505426, 'samples': 702912, 'steps': 1372, 'loss/train': 2.7481541633605957} -09/20/2021 19:14:40 - INFO - __main__ - Step 21967: {'lr': 0.0001999212988505426, 'samples': 702944, 'steps': 1372, 'loss/train': 4.061728000640869} -09/20/2021 19:14:41 - INFO - __main__ - Step 21968: {'lr': 0.0001999212988505426, 'samples': 702976, 'steps': 1372, 'loss/train': 3.013082981109619} -09/20/2021 19:14:41 - INFO - __main__ - Step 21969: {'lr': 0.00019992104562209325, 'samples': 703008, 'steps': 1373, 'loss/train': 3.0313611030578613} -09/20/2021 19:14:42 - INFO - __main__ - Step 21970: {'lr': 0.00019992104562209325, 'samples': 703040, 'steps': 1373, 'loss/train': 4.101011753082275} -09/20/2021 19:14:43 - INFO - __main__ - Step 21971: {'lr': 0.00019992104562209325, 'samples': 703072, 'steps': 1373, 'loss/train': 3.0200650691986084} -09/20/2021 19:14:44 - INFO - __main__ - Step 21972: {'lr': 0.00019992104562209325, 'samples': 703104, 'steps': 1373, 'loss/train': 3.6000595092773438} -09/20/2021 19:14:44 - INFO - __main__ - Step 21973: {'lr': 0.00019992104562209325, 'samples': 703136, 'steps': 1373, 'loss/train': 3.335050344467163} -09/20/2021 19:14:45 - INFO - __main__ - Step 21974: {'lr': 0.00019992104562209325, 'samples': 703168, 'steps': 1373, 'loss/train': 2.433516025543213} -09/20/2021 19:14:46 - INFO - __main__ - Step 21975: {'lr': 0.00019992104562209325, 'samples': 703200, 'steps': 1373, 'loss/train': 3.5492992401123047} -09/20/2021 19:14:47 - INFO - __main__ - Step 21976: {'lr': 0.00019992104562209325, 'samples': 703232, 'steps': 1373, 'loss/train': 2.8342554569244385} -09/20/2021 19:14:48 - INFO - __main__ - Step 21977: {'lr': 0.00019992104562209325, 'samples': 703264, 'steps': 1373, 'loss/train': 3.5324015617370605} -09/20/2021 19:14:48 - INFO - __main__ - Step 21978: {'lr': 0.00019992104562209325, 'samples': 703296, 'steps': 1373, 'loss/train': 3.2478463649749756} -09/20/2021 19:14:49 - INFO - __main__ - Step 21979: {'lr': 0.00019992104562209325, 'samples': 703328, 'steps': 1373, 'loss/train': 3.7741668224334717} -09/20/2021 19:14:50 - INFO - __main__ - Step 21980: {'lr': 0.00019992104562209325, 'samples': 703360, 'steps': 1373, 'loss/train': 3.7227823734283447} -09/20/2021 19:14:51 - INFO - __main__ - Step 21981: {'lr': 0.00019992104562209325, 'samples': 703392, 'steps': 1373, 'loss/train': 3.183995246887207} -09/20/2021 19:14:51 - INFO - __main__ - Step 21982: {'lr': 0.00019992104562209325, 'samples': 703424, 'steps': 1373, 'loss/train': 2.858935594558716} -09/20/2021 19:14:52 - INFO - __main__ - Step 21983: {'lr': 0.00019992104562209325, 'samples': 703456, 'steps': 1373, 'loss/train': 3.045290231704712} -09/20/2021 19:14:53 - INFO - __main__ - Step 21984: {'lr': 0.00019992104562209325, 'samples': 703488, 'steps': 1373, 'loss/train': 3.740358829498291} -09/20/2021 19:14:54 - INFO - __main__ - Step 21985: {'lr': 0.0001999207919870655, 'samples': 703520, 'steps': 1374, 'loss/train': 3.6403634548187256} -09/20/2021 19:14:54 - INFO - __main__ - Step 21986: {'lr': 0.0001999207919870655, 'samples': 703552, 'steps': 1374, 'loss/train': 3.199007511138916} -09/20/2021 19:14:55 - INFO - __main__ - Step 21987: {'lr': 0.0001999207919870655, 'samples': 703584, 'steps': 1374, 'loss/train': 2.7017109394073486} -09/20/2021 19:14:56 - INFO - __main__ - Step 21988: {'lr': 0.0001999207919870655, 'samples': 703616, 'steps': 1374, 'loss/train': 2.4898600578308105} -09/20/2021 19:14:57 - INFO - __main__ - Step 21989: {'lr': 0.0001999207919870655, 'samples': 703648, 'steps': 1374, 'loss/train': 3.034588575363159} -09/20/2021 19:14:57 - INFO - __main__ - Step 21990: {'lr': 0.0001999207919870655, 'samples': 703680, 'steps': 1374, 'loss/train': 3.254315137863159} -09/20/2021 19:14:58 - INFO - __main__ - Step 21991: {'lr': 0.0001999207919870655, 'samples': 703712, 'steps': 1374, 'loss/train': 3.2431578636169434} -09/20/2021 19:14:59 - INFO - __main__ - Step 21992: {'lr': 0.0001999207919870655, 'samples': 703744, 'steps': 1374, 'loss/train': 2.3710665702819824} -09/20/2021 19:15:00 - INFO - __main__ - Step 21993: {'lr': 0.0001999207919870655, 'samples': 703776, 'steps': 1374, 'loss/train': 3.213278293609619} -09/20/2021 19:15:00 - INFO - __main__ - Step 21994: {'lr': 0.0001999207919870655, 'samples': 703808, 'steps': 1374, 'loss/train': 3.3842051029205322} -09/20/2021 19:15:01 - INFO - __main__ - Step 21995: {'lr': 0.0001999207919870655, 'samples': 703840, 'steps': 1374, 'loss/train': 2.0768439769744873} -09/20/2021 19:15:02 - INFO - __main__ - Step 21996: {'lr': 0.0001999207919870655, 'samples': 703872, 'steps': 1374, 'loss/train': 2.1112210750579834} -09/20/2021 19:15:03 - INFO - __main__ - Step 21997: {'lr': 0.0001999207919870655, 'samples': 703904, 'steps': 1374, 'loss/train': 2.0832631587982178} -09/20/2021 19:15:03 - INFO - __main__ - Step 21998: {'lr': 0.0001999207919870655, 'samples': 703936, 'steps': 1374, 'loss/train': 3.2841737270355225} -09/20/2021 19:15:05 - INFO - __main__ - Step 21999: {'lr': 0.0001999207919870655, 'samples': 703968, 'steps': 1374, 'loss/train': 3.3790030479431152} -09/20/2021 19:15:06 - INFO - __main__ - Step 22000: {'lr': 0.0001999207919870655, 'samples': 704000, 'steps': 1374, 'loss/train': 3.432180166244507} -09/20/2021 19:15:07 - INFO - __main__ - Step 22001: {'lr': 0.00019992053794546047, 'samples': 704032, 'steps': 1375, 'loss/train': 3.590749979019165} -09/20/2021 19:15:08 - INFO - __main__ - Step 22002: {'lr': 0.00019992053794546047, 'samples': 704064, 'steps': 1375, 'loss/train': 3.3550405502319336} -09/20/2021 19:15:08 - INFO - __main__ - Step 22003: {'lr': 0.00019992053794546047, 'samples': 704096, 'steps': 1375, 'loss/train': 3.6362645626068115} -09/20/2021 19:15:09 - INFO - __main__ - Step 22004: {'lr': 0.00019992053794546047, 'samples': 704128, 'steps': 1375, 'loss/train': 3.3510167598724365} -09/20/2021 19:15:10 - INFO - __main__ - Step 22005: {'lr': 0.00019992053794546047, 'samples': 704160, 'steps': 1375, 'loss/train': 3.180490016937256} -09/20/2021 19:15:11 - INFO - __main__ - Step 22006: {'lr': 0.00019992053794546047, 'samples': 704192, 'steps': 1375, 'loss/train': 2.6999387741088867} -09/20/2021 19:15:11 - INFO - __main__ - Step 22007: {'lr': 0.00019992053794546047, 'samples': 704224, 'steps': 1375, 'loss/train': 2.6432158946990967} -09/20/2021 19:15:12 - INFO - __main__ - Step 22008: {'lr': 0.00019992053794546047, 'samples': 704256, 'steps': 1375, 'loss/train': 3.3966476917266846} -09/20/2021 19:15:13 - INFO - __main__ - Step 22009: {'lr': 0.00019992053794546047, 'samples': 704288, 'steps': 1375, 'loss/train': 5.3382954597473145} -09/20/2021 19:15:14 - INFO - __main__ - Step 22010: {'lr': 0.00019992053794546047, 'samples': 704320, 'steps': 1375, 'loss/train': 3.1951425075531006} -09/20/2021 19:15:14 - INFO - __main__ - Step 22011: {'lr': 0.00019992053794546047, 'samples': 704352, 'steps': 1375, 'loss/train': 3.349517822265625} -09/20/2021 19:15:15 - INFO - __main__ - Step 22012: {'lr': 0.00019992053794546047, 'samples': 704384, 'steps': 1375, 'loss/train': 3.305248260498047} -09/20/2021 19:15:16 - INFO - __main__ - Step 22013: {'lr': 0.00019992053794546047, 'samples': 704416, 'steps': 1375, 'loss/train': 4.170388698577881} -09/20/2021 19:15:17 - INFO - __main__ - Step 22014: {'lr': 0.00019992053794546047, 'samples': 704448, 'steps': 1375, 'loss/train': 3.4842967987060547} -09/20/2021 19:15:17 - INFO - __main__ - Step 22015: {'lr': 0.00019992053794546047, 'samples': 704480, 'steps': 1375, 'loss/train': 3.749650478363037} -09/20/2021 19:15:18 - INFO - __main__ - Step 22016: {'lr': 0.00019992053794546047, 'samples': 704512, 'steps': 1375, 'loss/train': 3.7561957836151123} -09/20/2021 19:15:19 - INFO - __main__ - Step 22017: {'lr': 0.00019992028349727917, 'samples': 704544, 'steps': 1376, 'loss/train': 3.3130078315734863} -09/20/2021 19:15:20 - INFO - __main__ - Step 22018: {'lr': 0.00019992028349727917, 'samples': 704576, 'steps': 1376, 'loss/train': 2.6414923667907715} -09/20/2021 19:15:21 - INFO - __main__ - Step 22019: {'lr': 0.00019992028349727917, 'samples': 704608, 'steps': 1376, 'loss/train': 3.126527786254883} -09/20/2021 19:15:21 - INFO - __main__ - Step 22020: {'lr': 0.00019992028349727917, 'samples': 704640, 'steps': 1376, 'loss/train': 3.4978208541870117} -09/20/2021 19:15:22 - INFO - __main__ - Step 22021: {'lr': 0.00019992028349727917, 'samples': 704672, 'steps': 1376, 'loss/train': 3.0871169567108154} -09/20/2021 19:15:23 - INFO - __main__ - Step 22022: {'lr': 0.00019992028349727917, 'samples': 704704, 'steps': 1376, 'loss/train': 3.062063455581665} -09/20/2021 19:15:24 - INFO - __main__ - Step 22023: {'lr': 0.00019992028349727917, 'samples': 704736, 'steps': 1376, 'loss/train': 3.2584264278411865} -09/20/2021 19:15:24 - INFO - __main__ - Step 22024: {'lr': 0.00019992028349727917, 'samples': 704768, 'steps': 1376, 'loss/train': 2.276381254196167} -09/20/2021 19:15:25 - INFO - __main__ - Step 22025: {'lr': 0.00019992028349727917, 'samples': 704800, 'steps': 1376, 'loss/train': 0.5345269441604614} -09/20/2021 19:15:26 - INFO - __main__ - Step 22026: {'lr': 0.00019992028349727917, 'samples': 704832, 'steps': 1376, 'loss/train': 2.449687957763672} -09/20/2021 19:15:27 - INFO - __main__ - Step 22027: {'lr': 0.00019992028349727917, 'samples': 704864, 'steps': 1376, 'loss/train': 3.40934681892395} -09/20/2021 19:15:27 - INFO - __main__ - Step 22028: {'lr': 0.00019992028349727917, 'samples': 704896, 'steps': 1376, 'loss/train': 4.452536106109619} -09/20/2021 19:15:28 - INFO - __main__ - Step 22029: {'lr': 0.00019992028349727917, 'samples': 704928, 'steps': 1376, 'loss/train': 5.15168571472168} -09/20/2021 19:15:29 - INFO - __main__ - Step 22030: {'lr': 0.00019992028349727917, 'samples': 704960, 'steps': 1376, 'loss/train': 5.214425563812256} -09/20/2021 19:15:30 - INFO - __main__ - Step 22031: {'lr': 0.00019992028349727917, 'samples': 704992, 'steps': 1376, 'loss/train': 3.1353652477264404} -09/20/2021 19:15:31 - INFO - __main__ - Step 22032: {'lr': 0.00019992028349727917, 'samples': 705024, 'steps': 1376, 'loss/train': 3.6731858253479004} -09/20/2021 19:15:32 - INFO - __main__ - Step 22033: {'lr': 0.0001999200286425226, 'samples': 705056, 'steps': 1377, 'loss/train': 2.5888378620147705} -09/20/2021 19:15:32 - INFO - __main__ - Step 22034: {'lr': 0.0001999200286425226, 'samples': 705088, 'steps': 1377, 'loss/train': 2.7655694484710693} -09/20/2021 19:15:33 - INFO - __main__ - Step 22035: {'lr': 0.0001999200286425226, 'samples': 705120, 'steps': 1377, 'loss/train': 3.485093116760254} -09/20/2021 19:15:34 - INFO - __main__ - Step 22036: {'lr': 0.0001999200286425226, 'samples': 705152, 'steps': 1377, 'loss/train': 2.8363759517669678} -09/20/2021 19:15:35 - INFO - __main__ - Step 22037: {'lr': 0.0001999200286425226, 'samples': 705184, 'steps': 1377, 'loss/train': 3.142463445663452} -09/20/2021 19:15:35 - INFO - __main__ - Step 22038: {'lr': 0.0001999200286425226, 'samples': 705216, 'steps': 1377, 'loss/train': 3.5758869647979736} -09/20/2021 19:15:36 - INFO - __main__ - Step 22039: {'lr': 0.0001999200286425226, 'samples': 705248, 'steps': 1377, 'loss/train': 3.61867356300354} -09/20/2021 19:15:37 - INFO - __main__ - Step 22040: {'lr': 0.0001999200286425226, 'samples': 705280, 'steps': 1377, 'loss/train': 3.8468399047851562} -09/20/2021 19:15:38 - INFO - __main__ - Step 22041: {'lr': 0.0001999200286425226, 'samples': 705312, 'steps': 1377, 'loss/train': 3.3105380535125732} -09/20/2021 19:15:38 - INFO - __main__ - Step 22042: {'lr': 0.0001999200286425226, 'samples': 705344, 'steps': 1377, 'loss/train': 3.0174851417541504} -09/20/2021 19:15:39 - INFO - __main__ - Step 22043: {'lr': 0.0001999200286425226, 'samples': 705376, 'steps': 1377, 'loss/train': 2.8506252765655518} -09/20/2021 19:15:40 - INFO - __main__ - Step 22044: {'lr': 0.0001999200286425226, 'samples': 705408, 'steps': 1377, 'loss/train': 3.330866575241089} -09/20/2021 19:15:41 - INFO - __main__ - Step 22045: {'lr': 0.0001999200286425226, 'samples': 705440, 'steps': 1377, 'loss/train': 1.8564091920852661} -09/20/2021 19:15:41 - INFO - __main__ - Step 22046: {'lr': 0.0001999200286425226, 'samples': 705472, 'steps': 1377, 'loss/train': 3.665408134460449} -09/20/2021 19:15:42 - INFO - __main__ - Step 22047: {'lr': 0.0001999200286425226, 'samples': 705504, 'steps': 1377, 'loss/train': 2.9617342948913574} -09/20/2021 19:15:43 - INFO - __main__ - Step 22048: {'lr': 0.0001999200286425226, 'samples': 705536, 'steps': 1377, 'loss/train': 2.386808156967163} -09/20/2021 19:15:44 - INFO - __main__ - Step 22049: {'lr': 0.00019991977338119186, 'samples': 705568, 'steps': 1378, 'loss/train': 3.114414930343628} -09/20/2021 19:15:45 - INFO - __main__ - Step 22050: {'lr': 0.00019991977338119186, 'samples': 705600, 'steps': 1378, 'loss/train': 4.102816104888916} -09/20/2021 19:15:45 - INFO - __main__ - Step 22051: {'lr': 0.00019991977338119186, 'samples': 705632, 'steps': 1378, 'loss/train': 2.4319093227386475} -09/20/2021 19:15:46 - INFO - __main__ - Step 22052: {'lr': 0.00019991977338119186, 'samples': 705664, 'steps': 1378, 'loss/train': 6.167305946350098} -09/20/2021 19:15:47 - INFO - __main__ - Step 22053: {'lr': 0.00019991977338119186, 'samples': 705696, 'steps': 1378, 'loss/train': 2.758009433746338} -09/20/2021 19:15:48 - INFO - __main__ - Step 22054: {'lr': 0.00019991977338119186, 'samples': 705728, 'steps': 1378, 'loss/train': 0.7229471802711487} -09/20/2021 19:15:48 - INFO - __main__ - Step 22055: {'lr': 0.00019991977338119186, 'samples': 705760, 'steps': 1378, 'loss/train': 3.8096179962158203} -09/20/2021 19:15:49 - INFO - __main__ - Step 22056: {'lr': 0.00019991977338119186, 'samples': 705792, 'steps': 1378, 'loss/train': 3.01831316947937} -09/20/2021 19:15:50 - INFO - __main__ - Step 22057: {'lr': 0.00019991977338119186, 'samples': 705824, 'steps': 1378, 'loss/train': 2.647587776184082} -09/20/2021 19:15:51 - INFO - __main__ - Step 22058: {'lr': 0.00019991977338119186, 'samples': 705856, 'steps': 1378, 'loss/train': 3.392026424407959} -09/20/2021 19:15:51 - INFO - __main__ - Step 22059: {'lr': 0.00019991977338119186, 'samples': 705888, 'steps': 1378, 'loss/train': 2.8225009441375732} -09/20/2021 19:15:52 - INFO - __main__ - Step 22060: {'lr': 0.00019991977338119186, 'samples': 705920, 'steps': 1378, 'loss/train': 3.005448818206787} -09/20/2021 19:15:53 - INFO - __main__ - Step 22061: {'lr': 0.00019991977338119186, 'samples': 705952, 'steps': 1378, 'loss/train': 3.454315662384033} -09/20/2021 19:15:54 - INFO - __main__ - Step 22062: {'lr': 0.00019991977338119186, 'samples': 705984, 'steps': 1378, 'loss/train': 3.150388479232788} -09/20/2021 19:15:55 - INFO - __main__ - Step 22063: {'lr': 0.00019991977338119186, 'samples': 706016, 'steps': 1378, 'loss/train': 2.7307910919189453} -09/20/2021 19:15:56 - INFO - __main__ - Step 22064: {'lr': 0.00019991977338119186, 'samples': 706048, 'steps': 1378, 'loss/train': 3.6624205112457275} -09/20/2021 19:15:56 - INFO - __main__ - Step 22065: {'lr': 0.00019991951771328788, 'samples': 706080, 'steps': 1379, 'loss/train': 3.0674355030059814} -09/20/2021 19:15:57 - INFO - __main__ - Step 22066: {'lr': 0.00019991951771328788, 'samples': 706112, 'steps': 1379, 'loss/train': 3.089684247970581} -09/20/2021 19:15:58 - INFO - __main__ - Step 22067: {'lr': 0.00019991951771328788, 'samples': 706144, 'steps': 1379, 'loss/train': 3.613272190093994} -09/20/2021 19:15:59 - INFO - __main__ - Step 22068: {'lr': 0.00019991951771328788, 'samples': 706176, 'steps': 1379, 'loss/train': 2.8511576652526855} -09/20/2021 19:15:59 - INFO - __main__ - Step 22069: {'lr': 0.00019991951771328788, 'samples': 706208, 'steps': 1379, 'loss/train': 4.099977970123291} -09/20/2021 19:16:00 - INFO - __main__ - Step 22070: {'lr': 0.00019991951771328788, 'samples': 706240, 'steps': 1379, 'loss/train': 2.834925413131714} -09/20/2021 19:16:01 - INFO - __main__ - Step 22071: {'lr': 0.00019991951771328788, 'samples': 706272, 'steps': 1379, 'loss/train': 3.647559404373169} -09/20/2021 19:16:02 - INFO - __main__ - Step 22072: {'lr': 0.00019991951771328788, 'samples': 706304, 'steps': 1379, 'loss/train': 3.703681468963623} -09/20/2021 19:16:02 - INFO - __main__ - Step 22073: {'lr': 0.00019991951771328788, 'samples': 706336, 'steps': 1379, 'loss/train': 3.3786354064941406} -09/20/2021 19:16:03 - INFO - __main__ - Step 22074: {'lr': 0.00019991951771328788, 'samples': 706368, 'steps': 1379, 'loss/train': 2.576697587966919} -09/20/2021 19:16:04 - INFO - __main__ - Step 22075: {'lr': 0.00019991951771328788, 'samples': 706400, 'steps': 1379, 'loss/train': 3.2154502868652344} -09/20/2021 19:16:05 - INFO - __main__ - Step 22076: {'lr': 0.00019991951771328788, 'samples': 706432, 'steps': 1379, 'loss/train': 2.6352150440216064} -09/20/2021 19:16:05 - INFO - __main__ - Step 22077: {'lr': 0.00019991951771328788, 'samples': 706464, 'steps': 1379, 'loss/train': 6.315846920013428} -09/20/2021 19:16:06 - INFO - __main__ - Step 22078: {'lr': 0.00019991951771328788, 'samples': 706496, 'steps': 1379, 'loss/train': 2.3803789615631104} -09/20/2021 19:16:07 - INFO - __main__ - Step 22079: {'lr': 0.00019991951771328788, 'samples': 706528, 'steps': 1379, 'loss/train': 3.8636655807495117} -09/20/2021 19:16:08 - INFO - __main__ - Step 22080: {'lr': 0.00019991951771328788, 'samples': 706560, 'steps': 1379, 'loss/train': 3.9668331146240234} -09/20/2021 19:16:09 - INFO - __main__ - Step 22081: {'lr': 0.00019991926163881183, 'samples': 706592, 'steps': 1380, 'loss/train': 3.207803726196289} -09/20/2021 19:16:09 - INFO - __main__ - Step 22082: {'lr': 0.00019991926163881183, 'samples': 706624, 'steps': 1380, 'loss/train': 2.794679641723633} -09/20/2021 19:16:10 - INFO - __main__ - Step 22083: {'lr': 0.00019991926163881183, 'samples': 706656, 'steps': 1380, 'loss/train': 3.1753036975860596} -09/20/2021 19:16:11 - INFO - __main__ - Step 22084: {'lr': 0.00019991926163881183, 'samples': 706688, 'steps': 1380, 'loss/train': 2.3141303062438965} -09/20/2021 19:16:12 - INFO - __main__ - Step 22085: {'lr': 0.00019991926163881183, 'samples': 706720, 'steps': 1380, 'loss/train': 3.225532293319702} -09/20/2021 19:16:12 - INFO - __main__ - Step 22086: {'lr': 0.00019991926163881183, 'samples': 706752, 'steps': 1380, 'loss/train': 3.666510820388794} -09/20/2021 19:16:13 - INFO - __main__ - Step 22087: {'lr': 0.00019991926163881183, 'samples': 706784, 'steps': 1380, 'loss/train': 3.2701656818389893} -09/20/2021 19:16:14 - INFO - __main__ - Step 22088: {'lr': 0.00019991926163881183, 'samples': 706816, 'steps': 1380, 'loss/train': 3.4936141967773438} -09/20/2021 19:16:15 - INFO - __main__ - Step 22089: {'lr': 0.00019991926163881183, 'samples': 706848, 'steps': 1380, 'loss/train': 3.088564395904541} -09/20/2021 19:16:15 - INFO - __main__ - Step 22090: {'lr': 0.00019991926163881183, 'samples': 706880, 'steps': 1380, 'loss/train': 2.6747775077819824} -09/20/2021 19:16:16 - INFO - __main__ - Step 22091: {'lr': 0.00019991926163881183, 'samples': 706912, 'steps': 1380, 'loss/train': 1.4179670810699463} -09/20/2021 19:16:18 - INFO - __main__ - Step 22092: {'lr': 0.00019991926163881183, 'samples': 706944, 'steps': 1380, 'loss/train': 3.090893507003784} -09/20/2021 19:16:18 - INFO - __main__ - Step 22093: {'lr': 0.00019991926163881183, 'samples': 706976, 'steps': 1380, 'loss/train': 3.4339988231658936} -09/20/2021 19:16:19 - INFO - __main__ - Step 22094: {'lr': 0.00019991926163881183, 'samples': 707008, 'steps': 1380, 'loss/train': 3.92999005317688} -09/20/2021 19:16:20 - INFO - __main__ - Step 22095: {'lr': 0.00019991926163881183, 'samples': 707040, 'steps': 1380, 'loss/train': 2.7416718006134033} -09/20/2021 19:16:21 - INFO - __main__ - Step 22096: {'lr': 0.00019991926163881183, 'samples': 707072, 'steps': 1380, 'loss/train': 2.824275493621826} -09/20/2021 19:16:21 - INFO - __main__ - Step 22097: {'lr': 0.00019991900515776466, 'samples': 707104, 'steps': 1381, 'loss/train': 2.658109664916992} -09/20/2021 19:16:22 - INFO - __main__ - Step 22098: {'lr': 0.00019991900515776466, 'samples': 707136, 'steps': 1381, 'loss/train': 0.7672035098075867} -09/20/2021 19:16:23 - INFO - __main__ - Step 22099: {'lr': 0.00019991900515776466, 'samples': 707168, 'steps': 1381, 'loss/train': 2.993582010269165} -09/20/2021 19:16:24 - INFO - __main__ - Step 22100: {'lr': 0.00019991900515776466, 'samples': 707200, 'steps': 1381, 'loss/train': 3.0048940181732178} -09/20/2021 19:16:24 - INFO - __main__ - Step 22101: {'lr': 0.00019991900515776466, 'samples': 707232, 'steps': 1381, 'loss/train': 2.534557819366455} -09/20/2021 19:16:25 - INFO - __main__ - Step 22102: {'lr': 0.00019991900515776466, 'samples': 707264, 'steps': 1381, 'loss/train': 2.618039131164551} -09/20/2021 19:16:26 - INFO - __main__ - Step 22103: {'lr': 0.00019991900515776466, 'samples': 707296, 'steps': 1381, 'loss/train': 3.248328685760498} -09/20/2021 19:16:27 - INFO - __main__ - Step 22104: {'lr': 0.00019991900515776466, 'samples': 707328, 'steps': 1381, 'loss/train': 4.722838401794434} -09/20/2021 19:16:27 - INFO - __main__ - Step 22105: {'lr': 0.00019991900515776466, 'samples': 707360, 'steps': 1381, 'loss/train': 4.760433197021484} -09/20/2021 19:16:28 - INFO - __main__ - Step 22106: {'lr': 0.00019991900515776466, 'samples': 707392, 'steps': 1381, 'loss/train': 4.520867824554443} -09/20/2021 19:16:29 - INFO - __main__ - Step 22107: {'lr': 0.00019991900515776466, 'samples': 707424, 'steps': 1381, 'loss/train': 4.696938991546631} -09/20/2021 19:16:30 - INFO - __main__ - Step 22108: {'lr': 0.00019991900515776466, 'samples': 707456, 'steps': 1381, 'loss/train': 4.537664890289307} -09/20/2021 19:16:30 - INFO - __main__ - Step 22109: {'lr': 0.00019991900515776466, 'samples': 707488, 'steps': 1381, 'loss/train': 4.826689720153809} -09/20/2021 19:16:31 - INFO - __main__ - Step 22110: {'lr': 0.00019991900515776466, 'samples': 707520, 'steps': 1381, 'loss/train': 4.733426094055176} -09/20/2021 19:16:32 - INFO - __main__ - Step 22111: {'lr': 0.00019991900515776466, 'samples': 707552, 'steps': 1381, 'loss/train': 4.8116374015808105} -09/20/2021 19:16:33 - INFO - __main__ - Step 22112: {'lr': 0.00019991900515776466, 'samples': 707584, 'steps': 1381, 'loss/train': 3.184061288833618} -09/20/2021 19:16:34 - INFO - __main__ - Step 22113: {'lr': 0.0001999187482701475, 'samples': 707616, 'steps': 1382, 'loss/train': 2.8756954669952393} -09/20/2021 19:16:34 - INFO - __main__ - Step 22114: {'lr': 0.0001999187482701475, 'samples': 707648, 'steps': 1382, 'loss/train': 3.7603824138641357} -09/20/2021 19:16:35 - INFO - __main__ - Step 22115: {'lr': 0.0001999187482701475, 'samples': 707680, 'steps': 1382, 'loss/train': 2.8941144943237305} -09/20/2021 19:16:36 - INFO - __main__ - Step 22116: {'lr': 0.0001999187482701475, 'samples': 707712, 'steps': 1382, 'loss/train': 4.653942108154297} -09/20/2021 19:16:37 - INFO - __main__ - Step 22117: {'lr': 0.0001999187482701475, 'samples': 707744, 'steps': 1382, 'loss/train': 3.4641776084899902} -09/20/2021 19:16:37 - INFO - __main__ - Step 22118: {'lr': 0.0001999187482701475, 'samples': 707776, 'steps': 1382, 'loss/train': 3.6179492473602295} -09/20/2021 19:16:38 - INFO - __main__ - Step 22119: {'lr': 0.0001999187482701475, 'samples': 707808, 'steps': 1382, 'loss/train': 3.473919630050659} -09/20/2021 19:16:39 - INFO - __main__ - Step 22120: {'lr': 0.0001999187482701475, 'samples': 707840, 'steps': 1382, 'loss/train': 3.199801445007324} -09/20/2021 19:16:40 - INFO - __main__ - Step 22121: {'lr': 0.0001999187482701475, 'samples': 707872, 'steps': 1382, 'loss/train': 4.323661804199219} -09/20/2021 19:16:40 - INFO - __main__ - Step 22122: {'lr': 0.0001999187482701475, 'samples': 707904, 'steps': 1382, 'loss/train': 3.194169044494629} -09/20/2021 19:16:41 - INFO - __main__ - Step 22123: {'lr': 0.0001999187482701475, 'samples': 707936, 'steps': 1382, 'loss/train': 2.9297969341278076} -09/20/2021 19:16:42 - INFO - __main__ - Step 22124: {'lr': 0.0001999187482701475, 'samples': 707968, 'steps': 1382, 'loss/train': 3.9694905281066895} -09/20/2021 19:16:43 - INFO - __main__ - Step 22125: {'lr': 0.0001999187482701475, 'samples': 708000, 'steps': 1382, 'loss/train': 3.003035068511963} -09/20/2021 19:16:43 - INFO - __main__ - Step 22126: {'lr': 0.0001999187482701475, 'samples': 708032, 'steps': 1382, 'loss/train': 3.2719249725341797} -09/20/2021 19:16:44 - INFO - __main__ - Step 22127: {'lr': 0.0001999187482701475, 'samples': 708064, 'steps': 1382, 'loss/train': 2.8974125385284424} -09/20/2021 19:16:45 - INFO - __main__ - Step 22128: {'lr': 0.0001999187482701475, 'samples': 708096, 'steps': 1382, 'loss/train': 3.3322062492370605} -09/20/2021 19:16:46 - INFO - __main__ - Step 22129: {'lr': 0.0001999184909759613, 'samples': 708128, 'steps': 1383, 'loss/train': 3.3001303672790527} -09/20/2021 19:16:47 - INFO - __main__ - Step 22130: {'lr': 0.0001999184909759613, 'samples': 708160, 'steps': 1383, 'loss/train': 4.185988426208496} -09/20/2021 19:16:48 - INFO - __main__ - Step 22131: {'lr': 0.0001999184909759613, 'samples': 708192, 'steps': 1383, 'loss/train': 4.0455169677734375} -09/20/2021 19:16:48 - INFO - __main__ - Step 22132: {'lr': 0.0001999184909759613, 'samples': 708224, 'steps': 1383, 'loss/train': 4.253261089324951} -09/20/2021 19:16:49 - INFO - __main__ - Step 22133: {'lr': 0.0001999184909759613, 'samples': 708256, 'steps': 1383, 'loss/train': 3.5799789428710938} -09/20/2021 19:16:50 - INFO - __main__ - Step 22134: {'lr': 0.0001999184909759613, 'samples': 708288, 'steps': 1383, 'loss/train': 4.137418746948242} -09/20/2021 19:16:51 - INFO - __main__ - Step 22135: {'lr': 0.0001999184909759613, 'samples': 708320, 'steps': 1383, 'loss/train': 3.2320973873138428} -09/20/2021 19:16:51 - INFO - __main__ - Step 22136: {'lr': 0.0001999184909759613, 'samples': 708352, 'steps': 1383, 'loss/train': 2.9442648887634277} -09/20/2021 19:16:52 - INFO - __main__ - Step 22137: {'lr': 0.0001999184909759613, 'samples': 708384, 'steps': 1383, 'loss/train': 3.524972915649414} -09/20/2021 19:16:53 - INFO - __main__ - Step 22138: {'lr': 0.0001999184909759613, 'samples': 708416, 'steps': 1383, 'loss/train': 5.05739164352417} -09/20/2021 19:16:54 - INFO - __main__ - Step 22139: {'lr': 0.0001999184909759613, 'samples': 708448, 'steps': 1383, 'loss/train': 3.3782851696014404} -09/20/2021 19:16:54 - INFO - __main__ - Step 22140: {'lr': 0.0001999184909759613, 'samples': 708480, 'steps': 1383, 'loss/train': 3.380758762359619} -09/20/2021 19:16:55 - INFO - __main__ - Step 22141: {'lr': 0.0001999184909759613, 'samples': 708512, 'steps': 1383, 'loss/train': 2.835008144378662} -09/20/2021 19:16:56 - INFO - __main__ - Step 22142: {'lr': 0.0001999184909759613, 'samples': 708544, 'steps': 1383, 'loss/train': 2.3776695728302} -09/20/2021 19:16:57 - INFO - __main__ - Step 22143: {'lr': 0.0001999184909759613, 'samples': 708576, 'steps': 1383, 'loss/train': 3.3257932662963867} -09/20/2021 19:16:57 - INFO - __main__ - Step 22144: {'lr': 0.0001999184909759613, 'samples': 708608, 'steps': 1383, 'loss/train': 2.350261688232422} -09/20/2021 19:16:58 - INFO - __main__ - Step 22145: {'lr': 0.00019991823327520717, 'samples': 708640, 'steps': 1384, 'loss/train': 3.7687978744506836} -09/20/2021 19:16:59 - INFO - __main__ - Step 22146: {'lr': 0.00019991823327520717, 'samples': 708672, 'steps': 1384, 'loss/train': 2.924337148666382} -09/20/2021 19:17:00 - INFO - __main__ - Step 22147: {'lr': 0.00019991823327520717, 'samples': 708704, 'steps': 1384, 'loss/train': 2.763695001602173} -09/20/2021 19:17:01 - INFO - __main__ - Step 22148: {'lr': 0.00019991823327520717, 'samples': 708736, 'steps': 1384, 'loss/train': 4.111428737640381} -09/20/2021 19:17:01 - INFO - __main__ - Step 22149: {'lr': 0.00019991823327520717, 'samples': 708768, 'steps': 1384, 'loss/train': 3.40197491645813} -09/20/2021 19:17:02 - INFO - __main__ - Step 22150: {'lr': 0.00019991823327520717, 'samples': 708800, 'steps': 1384, 'loss/train': 2.9232800006866455} -09/20/2021 19:17:03 - INFO - __main__ - Step 22151: {'lr': 0.00019991823327520717, 'samples': 708832, 'steps': 1384, 'loss/train': 2.851095676422119} -09/20/2021 19:17:04 - INFO - __main__ - Step 22152: {'lr': 0.00019991823327520717, 'samples': 708864, 'steps': 1384, 'loss/train': 3.938373327255249} -09/20/2021 19:17:04 - INFO - __main__ - Step 22153: {'lr': 0.00019991823327520717, 'samples': 708896, 'steps': 1384, 'loss/train': 2.6971418857574463} -09/20/2021 19:17:05 - INFO - __main__ - Step 22154: {'lr': 0.00019991823327520717, 'samples': 708928, 'steps': 1384, 'loss/train': 2.9320690631866455} -09/20/2021 19:17:06 - INFO - __main__ - Step 22155: {'lr': 0.00019991823327520717, 'samples': 708960, 'steps': 1384, 'loss/train': 3.1401426792144775} -09/20/2021 19:17:07 - INFO - __main__ - Step 22156: {'lr': 0.00019991823327520717, 'samples': 708992, 'steps': 1384, 'loss/train': 2.694701910018921} -09/20/2021 19:17:07 - INFO - __main__ - Step 22157: {'lr': 0.00019991823327520717, 'samples': 709024, 'steps': 1384, 'loss/train': 2.488909959793091} -09/20/2021 19:17:09 - INFO - __main__ - Step 22158: {'lr': 0.00019991823327520717, 'samples': 709056, 'steps': 1384, 'loss/train': 3.634876012802124} -09/20/2021 19:17:09 - INFO - __main__ - Step 22159: {'lr': 0.00019991823327520717, 'samples': 709088, 'steps': 1384, 'loss/train': 2.8629560470581055} -09/20/2021 19:17:10 - INFO - __main__ - Step 22160: {'lr': 0.00019991823327520717, 'samples': 709120, 'steps': 1384, 'loss/train': 2.9554877281188965} -09/20/2021 19:17:11 - INFO - __main__ - Step 22161: {'lr': 0.0001999179751678861, 'samples': 709152, 'steps': 1385, 'loss/train': 3.4057815074920654} -09/20/2021 19:17:12 - INFO - __main__ - Step 22162: {'lr': 0.0001999179751678861, 'samples': 709184, 'steps': 1385, 'loss/train': 2.600242853164673} -09/20/2021 19:17:13 - INFO - __main__ - Step 22163: {'lr': 0.0001999179751678861, 'samples': 709216, 'steps': 1385, 'loss/train': 3.099961280822754} -09/20/2021 19:17:13 - INFO - __main__ - Step 22164: {'lr': 0.0001999179751678861, 'samples': 709248, 'steps': 1385, 'loss/train': 3.0871360301971436} -09/20/2021 19:17:14 - INFO - __main__ - Step 22165: {'lr': 0.0001999179751678861, 'samples': 709280, 'steps': 1385, 'loss/train': 3.7255849838256836} -09/20/2021 19:17:15 - INFO - __main__ - Step 22166: {'lr': 0.0001999179751678861, 'samples': 709312, 'steps': 1385, 'loss/train': 1.0546271800994873} -09/20/2021 19:17:16 - INFO - __main__ - Step 22167: {'lr': 0.0001999179751678861, 'samples': 709344, 'steps': 1385, 'loss/train': 2.2283923625946045} -09/20/2021 19:17:16 - INFO - __main__ - Step 22168: {'lr': 0.0001999179751678861, 'samples': 709376, 'steps': 1385, 'loss/train': 2.786815643310547} -09/20/2021 19:17:17 - INFO - __main__ - Step 22169: {'lr': 0.0001999179751678861, 'samples': 709408, 'steps': 1385, 'loss/train': 2.4193003177642822} -09/20/2021 19:17:18 - INFO - __main__ - Step 22170: {'lr': 0.0001999179751678861, 'samples': 709440, 'steps': 1385, 'loss/train': 2.7889859676361084} -09/20/2021 19:17:19 - INFO - __main__ - Step 22171: {'lr': 0.0001999179751678861, 'samples': 709472, 'steps': 1385, 'loss/train': 3.423487424850464} -09/20/2021 19:17:19 - INFO - __main__ - Step 22172: {'lr': 0.0001999179751678861, 'samples': 709504, 'steps': 1385, 'loss/train': 2.7991325855255127} -09/20/2021 19:17:20 - INFO - __main__ - Step 22173: {'lr': 0.0001999179751678861, 'samples': 709536, 'steps': 1385, 'loss/train': 2.8788630962371826} -09/20/2021 19:17:21 - INFO - __main__ - Step 22174: {'lr': 0.0001999179751678861, 'samples': 709568, 'steps': 1385, 'loss/train': 3.5601487159729004} -09/20/2021 19:17:22 - INFO - __main__ - Step 22175: {'lr': 0.0001999179751678861, 'samples': 709600, 'steps': 1385, 'loss/train': 3.844444513320923} -09/20/2021 19:17:22 - INFO - __main__ - Step 22176: {'lr': 0.0001999179751678861, 'samples': 709632, 'steps': 1385, 'loss/train': 4.037478923797607} -09/20/2021 19:17:23 - INFO - __main__ - Step 22177: {'lr': 0.0001999177166539992, 'samples': 709664, 'steps': 1386, 'loss/train': 2.7617666721343994} -09/20/2021 19:17:24 - INFO - __main__ - Step 22178: {'lr': 0.0001999177166539992, 'samples': 709696, 'steps': 1386, 'loss/train': 3.1079065799713135} -09/20/2021 19:17:25 - INFO - __main__ - Step 22179: {'lr': 0.0001999177166539992, 'samples': 709728, 'steps': 1386, 'loss/train': 3.619490623474121} -09/20/2021 19:17:25 - INFO - __main__ - Step 22180: {'lr': 0.0001999177166539992, 'samples': 709760, 'steps': 1386, 'loss/train': 3.2156310081481934} -09/20/2021 19:17:26 - INFO - __main__ - Step 22181: {'lr': 0.0001999177166539992, 'samples': 709792, 'steps': 1386, 'loss/train': 3.694030284881592} -09/20/2021 19:17:27 - INFO - __main__ - Step 22182: {'lr': 0.0001999177166539992, 'samples': 709824, 'steps': 1386, 'loss/train': 3.172851324081421} -09/20/2021 19:17:28 - INFO - __main__ - Step 22183: {'lr': 0.0001999177166539992, 'samples': 709856, 'steps': 1386, 'loss/train': 3.526136875152588} -09/20/2021 19:17:28 - INFO - __main__ - Step 22184: {'lr': 0.0001999177166539992, 'samples': 709888, 'steps': 1386, 'loss/train': 2.9361915588378906} -09/20/2021 19:17:29 - INFO - __main__ - Step 22185: {'lr': 0.0001999177166539992, 'samples': 709920, 'steps': 1386, 'loss/train': 3.2135732173919678} -09/20/2021 19:17:30 - INFO - __main__ - Step 22186: {'lr': 0.0001999177166539992, 'samples': 709952, 'steps': 1386, 'loss/train': 3.8070521354675293} -09/20/2021 19:17:31 - INFO - __main__ - Step 22187: {'lr': 0.0001999177166539992, 'samples': 709984, 'steps': 1386, 'loss/train': 2.422750234603882} -09/20/2021 19:17:31 - INFO - __main__ - Step 22188: {'lr': 0.0001999177166539992, 'samples': 710016, 'steps': 1386, 'loss/train': 3.02021861076355} -09/20/2021 19:17:33 - INFO - __main__ - Step 22189: {'lr': 0.0001999177166539992, 'samples': 710048, 'steps': 1386, 'loss/train': 2.5824241638183594} -09/20/2021 19:17:34 - INFO - __main__ - Step 22190: {'lr': 0.0001999177166539992, 'samples': 710080, 'steps': 1386, 'loss/train': 3.61845064163208} -09/20/2021 19:17:34 - INFO - __main__ - Step 22191: {'lr': 0.0001999177166539992, 'samples': 710112, 'steps': 1386, 'loss/train': 3.643044948577881} -09/20/2021 19:17:35 - INFO - __main__ - Step 22192: {'lr': 0.0001999177166539992, 'samples': 710144, 'steps': 1386, 'loss/train': 3.362917423248291} -09/20/2021 19:17:36 - INFO - __main__ - Step 22193: {'lr': 0.0001999174577335475, 'samples': 710176, 'steps': 1387, 'loss/train': 4.444262504577637} -09/20/2021 19:17:37 - INFO - __main__ - Step 22194: {'lr': 0.0001999174577335475, 'samples': 710208, 'steps': 1387, 'loss/train': 4.549026012420654} -09/20/2021 19:17:37 - INFO - __main__ - Step 22195: {'lr': 0.0001999174577335475, 'samples': 710240, 'steps': 1387, 'loss/train': 3.1217310428619385} -09/20/2021 19:17:38 - INFO - __main__ - Step 22196: {'lr': 0.0001999174577335475, 'samples': 710272, 'steps': 1387, 'loss/train': 3.6138455867767334} -09/20/2021 19:17:39 - INFO - __main__ - Step 22197: {'lr': 0.0001999174577335475, 'samples': 710304, 'steps': 1387, 'loss/train': 2.77067232131958} -09/20/2021 19:17:40 - INFO - __main__ - Step 22198: {'lr': 0.0001999174577335475, 'samples': 710336, 'steps': 1387, 'loss/train': 3.73907208442688} -09/20/2021 19:17:40 - INFO - __main__ - Step 22199: {'lr': 0.0001999174577335475, 'samples': 710368, 'steps': 1387, 'loss/train': 3.1881089210510254} -09/20/2021 19:17:41 - INFO - __main__ - Step 22200: {'lr': 0.0001999174577335475, 'samples': 710400, 'steps': 1387, 'loss/train': 1.2747873067855835} -09/20/2021 19:17:42 - INFO - __main__ - Step 22201: {'lr': 0.0001999174577335475, 'samples': 710432, 'steps': 1387, 'loss/train': 1.140731930732727} -09/20/2021 19:17:43 - INFO - __main__ - Step 22202: {'lr': 0.0001999174577335475, 'samples': 710464, 'steps': 1387, 'loss/train': 3.1475014686584473} -09/20/2021 19:17:43 - INFO - __main__ - Step 22203: {'lr': 0.0001999174577335475, 'samples': 710496, 'steps': 1387, 'loss/train': 1.6800705194473267} -09/20/2021 19:17:44 - INFO - __main__ - Step 22204: {'lr': 0.0001999174577335475, 'samples': 710528, 'steps': 1387, 'loss/train': 2.343473434448242} -09/20/2021 19:17:45 - INFO - __main__ - Step 22205: {'lr': 0.0001999174577335475, 'samples': 710560, 'steps': 1387, 'loss/train': 4.083131790161133} -09/20/2021 19:17:46 - INFO - __main__ - Step 22206: {'lr': 0.0001999174577335475, 'samples': 710592, 'steps': 1387, 'loss/train': 3.113126277923584} -09/20/2021 19:17:46 - INFO - __main__ - Step 22207: {'lr': 0.0001999174577335475, 'samples': 710624, 'steps': 1387, 'loss/train': 3.7488486766815186} -09/20/2021 19:17:47 - INFO - __main__ - Step 22208: {'lr': 0.0001999174577335475, 'samples': 710656, 'steps': 1387, 'loss/train': 4.521060466766357} -09/20/2021 19:17:48 - INFO - __main__ - Step 22209: {'lr': 0.000199917198406532, 'samples': 710688, 'steps': 1388, 'loss/train': 3.7016422748565674} -09/20/2021 19:17:49 - INFO - __main__ - Step 22210: {'lr': 0.000199917198406532, 'samples': 710720, 'steps': 1388, 'loss/train': 2.951040029525757} -09/20/2021 19:17:50 - INFO - __main__ - Step 22211: {'lr': 0.000199917198406532, 'samples': 710752, 'steps': 1388, 'loss/train': 3.3109734058380127} -09/20/2021 19:17:50 - INFO - __main__ - Step 22212: {'lr': 0.000199917198406532, 'samples': 710784, 'steps': 1388, 'loss/train': 2.502037763595581} -09/20/2021 19:17:51 - INFO - __main__ - Step 22213: {'lr': 0.000199917198406532, 'samples': 710816, 'steps': 1388, 'loss/train': 1.8130382299423218} -09/20/2021 19:17:52 - INFO - __main__ - Step 22214: {'lr': 0.000199917198406532, 'samples': 710848, 'steps': 1388, 'loss/train': 4.223461151123047} -09/20/2021 19:17:53 - INFO - __main__ - Step 22215: {'lr': 0.000199917198406532, 'samples': 710880, 'steps': 1388, 'loss/train': 3.4095306396484375} -09/20/2021 19:17:53 - INFO - __main__ - Step 22216: {'lr': 0.000199917198406532, 'samples': 710912, 'steps': 1388, 'loss/train': 1.6904220581054688} -09/20/2021 19:17:54 - INFO - __main__ - Step 22217: {'lr': 0.000199917198406532, 'samples': 710944, 'steps': 1388, 'loss/train': 3.2729737758636475} -09/20/2021 19:17:55 - INFO - __main__ - Step 22218: {'lr': 0.000199917198406532, 'samples': 710976, 'steps': 1388, 'loss/train': 3.6909847259521484} -09/20/2021 19:17:56 - INFO - __main__ - Step 22219: {'lr': 0.000199917198406532, 'samples': 711008, 'steps': 1388, 'loss/train': 3.1467745304107666} -09/20/2021 19:17:56 - INFO - __main__ - Step 22220: {'lr': 0.000199917198406532, 'samples': 711040, 'steps': 1388, 'loss/train': 3.0989115238189697} -09/20/2021 19:17:57 - INFO - __main__ - Step 22221: {'lr': 0.000199917198406532, 'samples': 711072, 'steps': 1388, 'loss/train': 3.0236377716064453} -09/20/2021 19:17:58 - INFO - __main__ - Step 22222: {'lr': 0.000199917198406532, 'samples': 711104, 'steps': 1388, 'loss/train': 3.519836187362671} -09/20/2021 19:17:59 - INFO - __main__ - Step 22223: {'lr': 0.000199917198406532, 'samples': 711136, 'steps': 1388, 'loss/train': 3.6426339149475098} -09/20/2021 19:18:00 - INFO - __main__ - Step 22224: {'lr': 0.000199917198406532, 'samples': 711168, 'steps': 1388, 'loss/train': 3.611135959625244} -09/20/2021 19:18:01 - INFO - __main__ - Step 22225: {'lr': 0.0001999169386729539, 'samples': 711200, 'steps': 1389, 'loss/train': 3.6787655353546143} -09/20/2021 19:18:01 - INFO - __main__ - Step 22226: {'lr': 0.0001999169386729539, 'samples': 711232, 'steps': 1389, 'loss/train': 3.435659170150757} -09/20/2021 19:18:02 - INFO - __main__ - Step 22227: {'lr': 0.0001999169386729539, 'samples': 711264, 'steps': 1389, 'loss/train': 3.4965908527374268} -09/20/2021 19:18:03 - INFO - __main__ - Step 22228: {'lr': 0.0001999169386729539, 'samples': 711296, 'steps': 1389, 'loss/train': 2.3755202293395996} -09/20/2021 19:18:04 - INFO - __main__ - Step 22229: {'lr': 0.0001999169386729539, 'samples': 711328, 'steps': 1389, 'loss/train': 1.2077717781066895} -09/20/2021 19:18:04 - INFO - __main__ - Step 22230: {'lr': 0.0001999169386729539, 'samples': 711360, 'steps': 1389, 'loss/train': 5.246467113494873} -09/20/2021 19:18:05 - INFO - __main__ - Step 22231: {'lr': 0.0001999169386729539, 'samples': 711392, 'steps': 1389, 'loss/train': 3.7660319805145264} -09/20/2021 19:18:06 - INFO - __main__ - Step 22232: {'lr': 0.0001999169386729539, 'samples': 711424, 'steps': 1389, 'loss/train': 2.831082582473755} -09/20/2021 19:18:07 - INFO - __main__ - Step 22233: {'lr': 0.0001999169386729539, 'samples': 711456, 'steps': 1389, 'loss/train': 2.86721134185791} -09/20/2021 19:18:07 - INFO - __main__ - Step 22234: {'lr': 0.0001999169386729539, 'samples': 711488, 'steps': 1389, 'loss/train': 3.4620208740234375} -09/20/2021 19:18:08 - INFO - __main__ - Step 22235: {'lr': 0.0001999169386729539, 'samples': 711520, 'steps': 1389, 'loss/train': 2.670703887939453} -09/20/2021 19:18:09 - INFO - __main__ - Step 22236: {'lr': 0.0001999169386729539, 'samples': 711552, 'steps': 1389, 'loss/train': 2.8439877033233643} -09/20/2021 19:18:10 - INFO - __main__ - Step 22237: {'lr': 0.0001999169386729539, 'samples': 711584, 'steps': 1389, 'loss/train': 2.9683024883270264} -09/20/2021 19:18:10 - INFO - __main__ - Step 22238: {'lr': 0.0001999169386729539, 'samples': 711616, 'steps': 1389, 'loss/train': 4.27583122253418} -09/20/2021 19:18:11 - INFO - __main__ - Step 22239: {'lr': 0.0001999169386729539, 'samples': 711648, 'steps': 1389, 'loss/train': 3.7219555377960205} -09/20/2021 19:18:12 - INFO - __main__ - Step 22240: {'lr': 0.0001999169386729539, 'samples': 711680, 'steps': 1389, 'loss/train': 3.1294524669647217} -09/20/2021 19:18:13 - INFO - __main__ - Step 22241: {'lr': 0.0001999166785328141, 'samples': 711712, 'steps': 1390, 'loss/train': 2.806833267211914} -09/20/2021 19:18:14 - INFO - __main__ - Step 22242: {'lr': 0.0001999166785328141, 'samples': 711744, 'steps': 1390, 'loss/train': 3.2334630489349365} -09/20/2021 19:18:14 - INFO - __main__ - Step 22243: {'lr': 0.0001999166785328141, 'samples': 711776, 'steps': 1390, 'loss/train': 3.2133734226226807} -09/20/2021 19:18:15 - INFO - __main__ - Step 22244: {'lr': 0.0001999166785328141, 'samples': 711808, 'steps': 1390, 'loss/train': 3.0011913776397705} -09/20/2021 19:18:16 - INFO - __main__ - Step 22245: {'lr': 0.0001999166785328141, 'samples': 711840, 'steps': 1390, 'loss/train': 2.9425528049468994} -09/20/2021 19:18:17 - INFO - __main__ - Step 22246: {'lr': 0.0001999166785328141, 'samples': 711872, 'steps': 1390, 'loss/train': 3.424123525619507} -09/20/2021 19:18:17 - INFO - __main__ - Step 22247: {'lr': 0.0001999166785328141, 'samples': 711904, 'steps': 1390, 'loss/train': 3.6777536869049072} -09/20/2021 19:18:18 - INFO - __main__ - Step 22248: {'lr': 0.0001999166785328141, 'samples': 711936, 'steps': 1390, 'loss/train': 2.72257399559021} -09/20/2021 19:18:19 - INFO - __main__ - Step 22249: {'lr': 0.0001999166785328141, 'samples': 711968, 'steps': 1390, 'loss/train': 3.2923338413238525} -09/20/2021 19:18:20 - INFO - __main__ - Step 22250: {'lr': 0.0001999166785328141, 'samples': 712000, 'steps': 1390, 'loss/train': 2.055422782897949} -09/20/2021 19:18:20 - INFO - __main__ - Step 22251: {'lr': 0.0001999166785328141, 'samples': 712032, 'steps': 1390, 'loss/train': 2.5503101348876953} -09/20/2021 19:18:21 - INFO - __main__ - Step 22252: {'lr': 0.0001999166785328141, 'samples': 712064, 'steps': 1390, 'loss/train': 4.121345520019531} -09/20/2021 19:18:22 - INFO - __main__ - Step 22253: {'lr': 0.0001999166785328141, 'samples': 712096, 'steps': 1390, 'loss/train': 2.0995562076568604} -09/20/2021 19:18:23 - INFO - __main__ - Step 22254: {'lr': 0.0001999166785328141, 'samples': 712128, 'steps': 1390, 'loss/train': 2.6076464653015137} -09/20/2021 19:18:24 - INFO - __main__ - Step 22255: {'lr': 0.0001999166785328141, 'samples': 712160, 'steps': 1390, 'loss/train': 2.7244362831115723} -09/20/2021 19:18:25 - INFO - __main__ - Step 22256: {'lr': 0.0001999166785328141, 'samples': 712192, 'steps': 1390, 'loss/train': 3.2393746376037598} -09/20/2021 19:18:26 - INFO - __main__ - Step 22257: {'lr': 0.00019991641798611373, 'samples': 712224, 'steps': 1391, 'loss/train': 2.9437484741210938} -09/20/2021 19:18:26 - INFO - __main__ - Step 22258: {'lr': 0.00019991641798611373, 'samples': 712256, 'steps': 1391, 'loss/train': 4.091488361358643} -09/20/2021 19:18:27 - INFO - __main__ - Step 22259: {'lr': 0.00019991641798611373, 'samples': 712288, 'steps': 1391, 'loss/train': 2.914970874786377} -09/20/2021 19:18:28 - INFO - __main__ - Step 22260: {'lr': 0.00019991641798611373, 'samples': 712320, 'steps': 1391, 'loss/train': 5.589171409606934} -09/20/2021 19:18:29 - INFO - __main__ - Step 22261: {'lr': 0.00019991641798611373, 'samples': 712352, 'steps': 1391, 'loss/train': 3.459167957305908} -09/20/2021 19:18:29 - INFO - __main__ - Step 22262: {'lr': 0.00019991641798611373, 'samples': 712384, 'steps': 1391, 'loss/train': 1.5151467323303223} -09/20/2021 19:18:30 - INFO - __main__ - Step 22263: {'lr': 0.00019991641798611373, 'samples': 712416, 'steps': 1391, 'loss/train': 3.3389604091644287} -09/20/2021 19:18:31 - INFO - __main__ - Step 22264: {'lr': 0.00019991641798611373, 'samples': 712448, 'steps': 1391, 'loss/train': 3.1733157634735107} -09/20/2021 19:18:32 - INFO - __main__ - Step 22265: {'lr': 0.00019991641798611373, 'samples': 712480, 'steps': 1391, 'loss/train': 3.9769554138183594} -09/20/2021 19:18:32 - INFO - __main__ - Step 22266: {'lr': 0.00019991641798611373, 'samples': 712512, 'steps': 1391, 'loss/train': 3.8438258171081543} -09/20/2021 19:18:33 - INFO - __main__ - Step 22267: {'lr': 0.00019991641798611373, 'samples': 712544, 'steps': 1391, 'loss/train': 3.0412721633911133} -09/20/2021 19:18:34 - INFO - __main__ - Step 22268: {'lr': 0.00019991641798611373, 'samples': 712576, 'steps': 1391, 'loss/train': 5.175124168395996} -09/20/2021 19:18:35 - INFO - __main__ - Step 22269: {'lr': 0.00019991641798611373, 'samples': 712608, 'steps': 1391, 'loss/train': 3.1706371307373047} -09/20/2021 19:18:35 - INFO - __main__ - Step 22270: {'lr': 0.00019991641798611373, 'samples': 712640, 'steps': 1391, 'loss/train': 2.6514241695404053} -09/20/2021 19:18:36 - INFO - __main__ - Step 22271: {'lr': 0.00019991641798611373, 'samples': 712672, 'steps': 1391, 'loss/train': 2.619180679321289} -09/20/2021 19:18:37 - INFO - __main__ - Step 22272: {'lr': 0.00019991641798611373, 'samples': 712704, 'steps': 1391, 'loss/train': 3.567497968673706} -09/20/2021 19:18:38 - INFO - __main__ - Step 22273: {'lr': 0.00019991615703285386, 'samples': 712736, 'steps': 1392, 'loss/train': 3.6337239742279053} -09/20/2021 19:18:38 - INFO - __main__ - Step 22274: {'lr': 0.00019991615703285386, 'samples': 712768, 'steps': 1392, 'loss/train': 3.2403366565704346} -09/20/2021 19:18:39 - INFO - __main__ - Step 22275: {'lr': 0.00019991615703285386, 'samples': 712800, 'steps': 1392, 'loss/train': 2.4865424633026123} -09/20/2021 19:18:40 - INFO - __main__ - Step 22276: {'lr': 0.00019991615703285386, 'samples': 712832, 'steps': 1392, 'loss/train': 2.8909075260162354} -09/20/2021 19:18:41 - INFO - __main__ - Step 22277: {'lr': 0.00019991615703285386, 'samples': 712864, 'steps': 1392, 'loss/train': 3.6366147994995117} -09/20/2021 19:18:41 - INFO - __main__ - Step 22278: {'lr': 0.00019991615703285386, 'samples': 712896, 'steps': 1392, 'loss/train': 3.5381505489349365} -09/20/2021 19:18:42 - INFO - __main__ - Step 22279: {'lr': 0.00019991615703285386, 'samples': 712928, 'steps': 1392, 'loss/train': 3.606069564819336} -09/20/2021 19:18:43 - INFO - __main__ - Step 22280: {'lr': 0.00019991615703285386, 'samples': 712960, 'steps': 1392, 'loss/train': 3.39060115814209} -09/20/2021 19:18:44 - INFO - __main__ - Step 22281: {'lr': 0.00019991615703285386, 'samples': 712992, 'steps': 1392, 'loss/train': 2.7273316383361816} -09/20/2021 19:18:44 - INFO - __main__ - Step 22282: {'lr': 0.00019991615703285386, 'samples': 713024, 'steps': 1392, 'loss/train': 3.3454477787017822} -09/20/2021 19:18:45 - INFO - __main__ - Step 22283: {'lr': 0.00019991615703285386, 'samples': 713056, 'steps': 1392, 'loss/train': 3.177379846572876} -09/20/2021 19:18:46 - INFO - __main__ - Step 22284: {'lr': 0.00019991615703285386, 'samples': 713088, 'steps': 1392, 'loss/train': 1.1973967552185059} -09/20/2021 19:18:47 - INFO - __main__ - Step 22285: {'lr': 0.00019991615703285386, 'samples': 713120, 'steps': 1392, 'loss/train': 3.1332743167877197} -09/20/2021 19:18:48 - INFO - __main__ - Step 22286: {'lr': 0.00019991615703285386, 'samples': 713152, 'steps': 1392, 'loss/train': 3.319084405899048} -09/20/2021 19:18:49 - INFO - __main__ - Step 22287: {'lr': 0.00019991615703285386, 'samples': 713184, 'steps': 1392, 'loss/train': 3.165616512298584} -09/20/2021 19:18:49 - INFO - __main__ - Step 22288: {'lr': 0.00019991615703285386, 'samples': 713216, 'steps': 1392, 'loss/train': 3.1904163360595703} -09/20/2021 19:18:50 - INFO - __main__ - Step 22289: {'lr': 0.00019991589567303555, 'samples': 713248, 'steps': 1393, 'loss/train': 1.0419210195541382} -09/20/2021 19:18:51 - INFO - __main__ - Step 22290: {'lr': 0.00019991589567303555, 'samples': 713280, 'steps': 1393, 'loss/train': 3.2417542934417725} -09/20/2021 19:18:52 - INFO - __main__ - Step 22291: {'lr': 0.00019991589567303555, 'samples': 713312, 'steps': 1393, 'loss/train': 2.4450883865356445} -09/20/2021 19:18:53 - INFO - __main__ - Step 22292: {'lr': 0.00019991589567303555, 'samples': 713344, 'steps': 1393, 'loss/train': 2.3592770099639893} -09/20/2021 19:18:53 - INFO - __main__ - Step 22293: {'lr': 0.00019991589567303555, 'samples': 713376, 'steps': 1393, 'loss/train': 3.3234245777130127} -09/20/2021 19:18:54 - INFO - __main__ - Step 22294: {'lr': 0.00019991589567303555, 'samples': 713408, 'steps': 1393, 'loss/train': 3.0007588863372803} -09/20/2021 19:18:55 - INFO - __main__ - Step 22295: {'lr': 0.00019991589567303555, 'samples': 713440, 'steps': 1393, 'loss/train': 4.415491104125977} -09/20/2021 19:18:56 - INFO - __main__ - Step 22296: {'lr': 0.00019991589567303555, 'samples': 713472, 'steps': 1393, 'loss/train': 3.4259939193725586} -09/20/2021 19:18:56 - INFO - __main__ - Step 22297: {'lr': 0.00019991589567303555, 'samples': 713504, 'steps': 1393, 'loss/train': 3.023211717605591} -09/20/2021 19:18:57 - INFO - __main__ - Step 22298: {'lr': 0.00019991589567303555, 'samples': 713536, 'steps': 1393, 'loss/train': 2.8387458324432373} -09/20/2021 19:18:58 - INFO - __main__ - Step 22299: {'lr': 0.00019991589567303555, 'samples': 713568, 'steps': 1393, 'loss/train': 3.139200448989868} -09/20/2021 19:18:59 - INFO - __main__ - Step 22300: {'lr': 0.00019991589567303555, 'samples': 713600, 'steps': 1393, 'loss/train': 3.3357632160186768} -09/20/2021 19:18:59 - INFO - __main__ - Step 22301: {'lr': 0.00019991589567303555, 'samples': 713632, 'steps': 1393, 'loss/train': 2.7221388816833496} -09/20/2021 19:19:00 - INFO - __main__ - Step 22302: {'lr': 0.00019991589567303555, 'samples': 713664, 'steps': 1393, 'loss/train': 2.4927892684936523} -09/20/2021 19:19:01 - INFO - __main__ - Step 22303: {'lr': 0.00019991589567303555, 'samples': 713696, 'steps': 1393, 'loss/train': 3.8641066551208496} -09/20/2021 19:19:02 - INFO - __main__ - Step 22304: {'lr': 0.00019991589567303555, 'samples': 713728, 'steps': 1393, 'loss/train': 1.2707229852676392} -09/20/2021 19:19:02 - INFO - __main__ - Step 22305: {'lr': 0.00019991563390665983, 'samples': 713760, 'steps': 1394, 'loss/train': 2.7770168781280518} -09/20/2021 19:19:03 - INFO - __main__ - Step 22306: {'lr': 0.00019991563390665983, 'samples': 713792, 'steps': 1394, 'loss/train': 3.489874839782715} -09/20/2021 19:19:04 - INFO - __main__ - Step 22307: {'lr': 0.00019991563390665983, 'samples': 713824, 'steps': 1394, 'loss/train': 2.6805057525634766} -09/20/2021 19:19:05 - INFO - __main__ - Step 22308: {'lr': 0.00019991563390665983, 'samples': 713856, 'steps': 1394, 'loss/train': 2.993298053741455} -09/20/2021 19:19:05 - INFO - __main__ - Step 22309: {'lr': 0.00019991563390665983, 'samples': 713888, 'steps': 1394, 'loss/train': 2.6671836376190186} -09/20/2021 19:19:06 - INFO - __main__ - Step 22310: {'lr': 0.00019991563390665983, 'samples': 713920, 'steps': 1394, 'loss/train': 3.343735456466675} -09/20/2021 19:19:07 - INFO - __main__ - Step 22311: {'lr': 0.00019991563390665983, 'samples': 713952, 'steps': 1394, 'loss/train': 4.203754901885986} -09/20/2021 19:19:08 - INFO - __main__ - Step 22312: {'lr': 0.00019991563390665983, 'samples': 713984, 'steps': 1394, 'loss/train': 2.8923988342285156} -09/20/2021 19:19:08 - INFO - __main__ - Step 22313: {'lr': 0.00019991563390665983, 'samples': 714016, 'steps': 1394, 'loss/train': 3.156949996948242} -09/20/2021 19:19:09 - INFO - __main__ - Step 22314: {'lr': 0.00019991563390665983, 'samples': 714048, 'steps': 1394, 'loss/train': 3.1708223819732666} -09/20/2021 19:19:10 - INFO - __main__ - Step 22315: {'lr': 0.00019991563390665983, 'samples': 714080, 'steps': 1394, 'loss/train': 4.138490200042725} -09/20/2021 19:19:12 - INFO - __main__ - Step 22316: {'lr': 0.00019991563390665983, 'samples': 714112, 'steps': 1394, 'loss/train': 4.0336127281188965} -09/20/2021 19:19:13 - INFO - __main__ - Step 22317: {'lr': 0.00019991563390665983, 'samples': 714144, 'steps': 1394, 'loss/train': 3.281529426574707} -09/20/2021 19:19:13 - INFO - __main__ - Step 22318: {'lr': 0.00019991563390665983, 'samples': 714176, 'steps': 1394, 'loss/train': 2.6822125911712646} -09/20/2021 19:19:14 - INFO - __main__ - Step 22319: {'lr': 0.00019991563390665983, 'samples': 714208, 'steps': 1394, 'loss/train': 3.866788387298584} -09/20/2021 19:19:15 - INFO - __main__ - Step 22320: {'lr': 0.00019991563390665983, 'samples': 714240, 'steps': 1394, 'loss/train': 3.2696778774261475} -09/20/2021 19:19:16 - INFO - __main__ - Step 22321: {'lr': 0.00019991537173372776, 'samples': 714272, 'steps': 1395, 'loss/train': 4.112732887268066} -09/20/2021 19:19:17 - INFO - __main__ - Step 22322: {'lr': 0.00019991537173372776, 'samples': 714304, 'steps': 1395, 'loss/train': 2.673447370529175} -09/20/2021 19:19:17 - INFO - __main__ - Step 22323: {'lr': 0.00019991537173372776, 'samples': 714336, 'steps': 1395, 'loss/train': 3.1195926666259766} -09/20/2021 19:19:18 - INFO - __main__ - Step 22324: {'lr': 0.00019991537173372776, 'samples': 714368, 'steps': 1395, 'loss/train': 3.6022305488586426} -09/20/2021 19:19:19 - INFO - __main__ - Step 22325: {'lr': 0.00019991537173372776, 'samples': 714400, 'steps': 1395, 'loss/train': 2.3176770210266113} -09/20/2021 19:19:20 - INFO - __main__ - Step 22326: {'lr': 0.00019991537173372776, 'samples': 714432, 'steps': 1395, 'loss/train': 2.5139319896698} -09/20/2021 19:19:20 - INFO - __main__ - Step 22327: {'lr': 0.00019991537173372776, 'samples': 714464, 'steps': 1395, 'loss/train': 3.096151828765869} -09/20/2021 19:19:21 - INFO - __main__ - Step 22328: {'lr': 0.00019991537173372776, 'samples': 714496, 'steps': 1395, 'loss/train': 3.0862512588500977} -09/20/2021 19:19:22 - INFO - __main__ - Step 22329: {'lr': 0.00019991537173372776, 'samples': 714528, 'steps': 1395, 'loss/train': 2.4397754669189453} -09/20/2021 19:19:23 - INFO - __main__ - Step 22330: {'lr': 0.00019991537173372776, 'samples': 714560, 'steps': 1395, 'loss/train': 3.5061986446380615} -09/20/2021 19:19:23 - INFO - __main__ - Step 22331: {'lr': 0.00019991537173372776, 'samples': 714592, 'steps': 1395, 'loss/train': 2.384075880050659} -09/20/2021 19:19:24 - INFO - __main__ - Step 22332: {'lr': 0.00019991537173372776, 'samples': 714624, 'steps': 1395, 'loss/train': 3.4660632610321045} -09/20/2021 19:19:25 - INFO - __main__ - Step 22333: {'lr': 0.00019991537173372776, 'samples': 714656, 'steps': 1395, 'loss/train': 3.4223668575286865} -09/20/2021 19:19:26 - INFO - __main__ - Step 22334: {'lr': 0.00019991537173372776, 'samples': 714688, 'steps': 1395, 'loss/train': 3.1869215965270996} -09/20/2021 19:19:26 - INFO - __main__ - Step 22335: {'lr': 0.00019991537173372776, 'samples': 714720, 'steps': 1395, 'loss/train': 2.410905122756958} -09/20/2021 19:19:27 - INFO - __main__ - Step 22336: {'lr': 0.00019991537173372776, 'samples': 714752, 'steps': 1395, 'loss/train': 2.7406318187713623} -09/20/2021 19:19:28 - INFO - __main__ - Step 22337: {'lr': 0.00019991510915424044, 'samples': 714784, 'steps': 1396, 'loss/train': 3.0742688179016113} -09/20/2021 19:19:29 - INFO - __main__ - Step 22338: {'lr': 0.00019991510915424044, 'samples': 714816, 'steps': 1396, 'loss/train': 0.889491856098175} -09/20/2021 19:19:29 - INFO - __main__ - Step 22339: {'lr': 0.00019991510915424044, 'samples': 714848, 'steps': 1396, 'loss/train': 0.6480442881584167} -09/20/2021 19:19:30 - INFO - __main__ - Step 22340: {'lr': 0.00019991510915424044, 'samples': 714880, 'steps': 1396, 'loss/train': 1.12053382396698} -09/20/2021 19:19:31 - INFO - __main__ - Step 22341: {'lr': 0.00019991510915424044, 'samples': 714912, 'steps': 1396, 'loss/train': 0.6815580129623413} -09/20/2021 19:19:32 - INFO - __main__ - Step 22342: {'lr': 0.00019991510915424044, 'samples': 714944, 'steps': 1396, 'loss/train': 2.910446882247925} -09/20/2021 19:19:32 - INFO - __main__ - Step 22343: {'lr': 0.00019991510915424044, 'samples': 714976, 'steps': 1396, 'loss/train': 1.6902803182601929} -09/20/2021 19:19:33 - INFO - __main__ - Step 22344: {'lr': 0.00019991510915424044, 'samples': 715008, 'steps': 1396, 'loss/train': 4.1966400146484375} -09/20/2021 19:19:34 - INFO - __main__ - Step 22345: {'lr': 0.00019991510915424044, 'samples': 715040, 'steps': 1396, 'loss/train': 3.2375810146331787} -09/20/2021 19:19:35 - INFO - __main__ - Step 22346: {'lr': 0.00019991510915424044, 'samples': 715072, 'steps': 1396, 'loss/train': 2.9098973274230957} -09/20/2021 19:19:35 - INFO - __main__ - Step 22347: {'lr': 0.00019991510915424044, 'samples': 715104, 'steps': 1396, 'loss/train': 3.1064796447753906} -09/20/2021 19:19:37 - INFO - __main__ - Step 22348: {'lr': 0.00019991510915424044, 'samples': 715136, 'steps': 1396, 'loss/train': 2.681448459625244} -09/20/2021 19:19:37 - INFO - __main__ - Step 22349: {'lr': 0.00019991510915424044, 'samples': 715168, 'steps': 1396, 'loss/train': 3.086486577987671} -09/20/2021 19:19:38 - INFO - __main__ - Step 22350: {'lr': 0.00019991510915424044, 'samples': 715200, 'steps': 1396, 'loss/train': 0.5864717364311218} -09/20/2021 19:19:39 - INFO - __main__ - Step 22351: {'lr': 0.00019991510915424044, 'samples': 715232, 'steps': 1396, 'loss/train': 4.070915222167969} -09/20/2021 19:19:40 - INFO - __main__ - Step 22352: {'lr': 0.00019991510915424044, 'samples': 715264, 'steps': 1396, 'loss/train': 2.9726853370666504} -09/20/2021 19:19:41 - INFO - __main__ - Step 22353: {'lr': 0.00019991484616819894, 'samples': 715296, 'steps': 1397, 'loss/train': 2.9825215339660645} -09/20/2021 19:19:41 - INFO - __main__ - Step 22354: {'lr': 0.00019991484616819894, 'samples': 715328, 'steps': 1397, 'loss/train': 2.8562283515930176} -09/20/2021 19:19:42 - INFO - __main__ - Step 22355: {'lr': 0.00019991484616819894, 'samples': 715360, 'steps': 1397, 'loss/train': 5.125676155090332} -09/20/2021 19:19:43 - INFO - __main__ - Step 22356: {'lr': 0.00019991484616819894, 'samples': 715392, 'steps': 1397, 'loss/train': 3.1955418586730957} -09/20/2021 19:19:44 - INFO - __main__ - Step 22357: {'lr': 0.00019991484616819894, 'samples': 715424, 'steps': 1397, 'loss/train': 2.850623369216919} -09/20/2021 19:19:44 - INFO - __main__ - Step 22358: {'lr': 0.00019991484616819894, 'samples': 715456, 'steps': 1397, 'loss/train': 3.1187057495117188} -09/20/2021 19:19:45 - INFO - __main__ - Step 22359: {'lr': 0.00019991484616819894, 'samples': 715488, 'steps': 1397, 'loss/train': 5.055492401123047} -09/20/2021 19:19:46 - INFO - __main__ - Step 22360: {'lr': 0.00019991484616819894, 'samples': 715520, 'steps': 1397, 'loss/train': 2.6038403511047363} -09/20/2021 19:19:47 - INFO - __main__ - Step 22361: {'lr': 0.00019991484616819894, 'samples': 715552, 'steps': 1397, 'loss/train': 2.755829334259033} -09/20/2021 19:19:47 - INFO - __main__ - Step 22362: {'lr': 0.00019991484616819894, 'samples': 715584, 'steps': 1397, 'loss/train': 2.9745490550994873} -09/20/2021 19:19:48 - INFO - __main__ - Step 22363: {'lr': 0.00019991484616819894, 'samples': 715616, 'steps': 1397, 'loss/train': 2.6712758541107178} -09/20/2021 19:19:49 - INFO - __main__ - Step 22364: {'lr': 0.00019991484616819894, 'samples': 715648, 'steps': 1397, 'loss/train': 1.539914608001709} -09/20/2021 19:19:50 - INFO - __main__ - Step 22365: {'lr': 0.00019991484616819894, 'samples': 715680, 'steps': 1397, 'loss/train': 2.5256567001342773} -09/20/2021 19:19:50 - INFO - __main__ - Step 22366: {'lr': 0.00019991484616819894, 'samples': 715712, 'steps': 1397, 'loss/train': 0.7405441403388977} -09/20/2021 19:19:51 - INFO - __main__ - Step 22367: {'lr': 0.00019991484616819894, 'samples': 715744, 'steps': 1397, 'loss/train': 2.5878026485443115} -09/20/2021 19:19:52 - INFO - __main__ - Step 22368: {'lr': 0.00019991484616819894, 'samples': 715776, 'steps': 1397, 'loss/train': 3.5353221893310547} -09/20/2021 19:19:53 - INFO - __main__ - Step 22369: {'lr': 0.00019991458277560434, 'samples': 715808, 'steps': 1398, 'loss/train': 2.351755380630493} -09/20/2021 19:19:53 - INFO - __main__ - Step 22370: {'lr': 0.00019991458277560434, 'samples': 715840, 'steps': 1398, 'loss/train': 3.1809628009796143} -09/20/2021 19:19:54 - INFO - __main__ - Step 22371: {'lr': 0.00019991458277560434, 'samples': 715872, 'steps': 1398, 'loss/train': 3.7096285820007324} -09/20/2021 19:19:55 - INFO - __main__ - Step 22372: {'lr': 0.00019991458277560434, 'samples': 715904, 'steps': 1398, 'loss/train': 3.3893585205078125} -09/20/2021 19:19:56 - INFO - __main__ - Step 22373: {'lr': 0.00019991458277560434, 'samples': 715936, 'steps': 1398, 'loss/train': 2.5997960567474365} -09/20/2021 19:19:56 - INFO - __main__ - Step 22374: {'lr': 0.00019991458277560434, 'samples': 715968, 'steps': 1398, 'loss/train': 3.1941909790039062} -09/20/2021 19:19:57 - INFO - __main__ - Step 22375: {'lr': 0.00019991458277560434, 'samples': 716000, 'steps': 1398, 'loss/train': 2.532015800476074} -09/20/2021 19:19:58 - INFO - __main__ - Step 22376: {'lr': 0.00019991458277560434, 'samples': 716032, 'steps': 1398, 'loss/train': 2.394099712371826} -09/20/2021 19:19:59 - INFO - __main__ - Step 22377: {'lr': 0.00019991458277560434, 'samples': 716064, 'steps': 1398, 'loss/train': 3.610675811767578} -09/20/2021 19:19:59 - INFO - __main__ - Step 22378: {'lr': 0.00019991458277560434, 'samples': 716096, 'steps': 1398, 'loss/train': 3.288376569747925} -09/20/2021 19:20:00 - INFO - __main__ - Step 22379: {'lr': 0.00019991458277560434, 'samples': 716128, 'steps': 1398, 'loss/train': 3.9889111518859863} -09/20/2021 19:20:02 - INFO - __main__ - Step 22380: {'lr': 0.00019991458277560434, 'samples': 716160, 'steps': 1398, 'loss/train': 3.0799264907836914} -09/20/2021 19:20:03 - INFO - __main__ - Step 22381: {'lr': 0.00019991458277560434, 'samples': 716192, 'steps': 1398, 'loss/train': 2.523085832595825} -09/20/2021 19:20:03 - INFO - __main__ - Step 22382: {'lr': 0.00019991458277560434, 'samples': 716224, 'steps': 1398, 'loss/train': 2.750109910964966} -09/20/2021 19:20:04 - INFO - __main__ - Step 22383: {'lr': 0.00019991458277560434, 'samples': 716256, 'steps': 1398, 'loss/train': 3.232635259628296} -09/20/2021 19:20:05 - INFO - __main__ - Step 22384: {'lr': 0.00019991458277560434, 'samples': 716288, 'steps': 1398, 'loss/train': 3.264378309249878} -09/20/2021 19:20:06 - INFO - __main__ - Step 22385: {'lr': 0.00019991431897645767, 'samples': 716320, 'steps': 1399, 'loss/train': 1.1953717470169067} -09/20/2021 19:20:06 - INFO - __main__ - Step 22386: {'lr': 0.00019991431897645767, 'samples': 716352, 'steps': 1399, 'loss/train': 2.268622875213623} -09/20/2021 19:20:07 - INFO - __main__ - Step 22387: {'lr': 0.00019991431897645767, 'samples': 716384, 'steps': 1399, 'loss/train': 2.73734712600708} -09/20/2021 19:20:08 - INFO - __main__ - Step 22388: {'lr': 0.00019991431897645767, 'samples': 716416, 'steps': 1399, 'loss/train': 3.5286037921905518} -09/20/2021 19:20:09 - INFO - __main__ - Step 22389: {'lr': 0.00019991431897645767, 'samples': 716448, 'steps': 1399, 'loss/train': 1.8690861463546753} -09/20/2021 19:20:09 - INFO - __main__ - Step 22390: {'lr': 0.00019991431897645767, 'samples': 716480, 'steps': 1399, 'loss/train': 2.207210063934326} -09/20/2021 19:20:10 - INFO - __main__ - Step 22391: {'lr': 0.00019991431897645767, 'samples': 716512, 'steps': 1399, 'loss/train': 3.7766900062561035} -09/20/2021 19:20:11 - INFO - __main__ - Step 22392: {'lr': 0.00019991431897645767, 'samples': 716544, 'steps': 1399, 'loss/train': 2.639613389968872} -09/20/2021 19:20:12 - INFO - __main__ - Step 22393: {'lr': 0.00019991431897645767, 'samples': 716576, 'steps': 1399, 'loss/train': 2.422244071960449} -09/20/2021 19:20:12 - INFO - __main__ - Step 22394: {'lr': 0.00019991431897645767, 'samples': 716608, 'steps': 1399, 'loss/train': 3.1266512870788574} -09/20/2021 19:20:13 - INFO - __main__ - Step 22395: {'lr': 0.00019991431897645767, 'samples': 716640, 'steps': 1399, 'loss/train': 2.6112139225006104} -09/20/2021 19:20:14 - INFO - __main__ - Step 22396: {'lr': 0.00019991431897645767, 'samples': 716672, 'steps': 1399, 'loss/train': 3.3850772380828857} -09/20/2021 19:20:15 - INFO - __main__ - Step 22397: {'lr': 0.00019991431897645767, 'samples': 716704, 'steps': 1399, 'loss/train': 3.6385209560394287} -09/20/2021 19:20:15 - INFO - __main__ - Step 22398: {'lr': 0.00019991431897645767, 'samples': 716736, 'steps': 1399, 'loss/train': 1.7603442668914795} -09/20/2021 19:20:16 - INFO - __main__ - Step 22399: {'lr': 0.00019991431897645767, 'samples': 716768, 'steps': 1399, 'loss/train': 2.133226156234741} -09/20/2021 19:20:17 - INFO - __main__ - Step 22400: {'lr': 0.00019991431897645767, 'samples': 716800, 'steps': 1399, 'loss/train': 2.6713972091674805} -09/20/2021 19:20:18 - INFO - __main__ - Step 22401: {'lr': 0.00019991405477076, 'samples': 716832, 'steps': 1400, 'loss/train': 2.7167983055114746} -09/20/2021 19:20:19 - INFO - __main__ - Step 22402: {'lr': 0.00019991405477076, 'samples': 716864, 'steps': 1400, 'loss/train': 3.332742214202881} -09/20/2021 19:20:19 - INFO - __main__ - Step 22403: {'lr': 0.00019991405477076, 'samples': 716896, 'steps': 1400, 'loss/train': 3.2298648357391357} -09/20/2021 19:20:20 - INFO - __main__ - Step 22404: {'lr': 0.00019991405477076, 'samples': 716928, 'steps': 1400, 'loss/train': 3.0926971435546875} -09/20/2021 19:20:21 - INFO - __main__ - Step 22405: {'lr': 0.00019991405477076, 'samples': 716960, 'steps': 1400, 'loss/train': 2.7407164573669434} -09/20/2021 19:20:22 - INFO - __main__ - Step 22406: {'lr': 0.00019991405477076, 'samples': 716992, 'steps': 1400, 'loss/train': 3.084418296813965} -09/20/2021 19:20:22 - INFO - __main__ - Step 22407: {'lr': 0.00019991405477076, 'samples': 717024, 'steps': 1400, 'loss/train': 3.9399218559265137} -09/20/2021 19:20:23 - INFO - __main__ - Step 22408: {'lr': 0.00019991405477076, 'samples': 717056, 'steps': 1400, 'loss/train': 2.88753342628479} -09/20/2021 19:20:24 - INFO - __main__ - Step 22409: {'lr': 0.00019991405477076, 'samples': 717088, 'steps': 1400, 'loss/train': 3.709028482437134} -09/20/2021 19:20:25 - INFO - __main__ - Step 22410: {'lr': 0.00019991405477076, 'samples': 717120, 'steps': 1400, 'loss/train': 0.6107503771781921} -09/20/2021 19:20:25 - INFO - __main__ - Step 22411: {'lr': 0.00019991405477076, 'samples': 717152, 'steps': 1400, 'loss/train': 0.7420799136161804} -09/20/2021 19:20:26 - INFO - __main__ - Step 22412: {'lr': 0.00019991405477076, 'samples': 717184, 'steps': 1400, 'loss/train': 0.4666751027107239} -09/20/2021 19:20:27 - INFO - __main__ - Step 22413: {'lr': 0.00019991405477076, 'samples': 717216, 'steps': 1400, 'loss/train': 0.48192670941352844} -09/20/2021 19:20:28 - INFO - __main__ - Step 22414: {'lr': 0.00019991405477076, 'samples': 717248, 'steps': 1400, 'loss/train': 0.7105345129966736} -09/20/2021 19:20:29 - INFO - __main__ - Step 22415: {'lr': 0.00019991405477076, 'samples': 717280, 'steps': 1400, 'loss/train': 1.735026478767395} -09/20/2021 19:20:30 - INFO - __main__ - Step 22416: {'lr': 0.00019991405477076, 'samples': 717312, 'steps': 1400, 'loss/train': 3.15081787109375} -09/20/2021 19:20:31 - INFO - __main__ - Step 22417: {'lr': 0.00019991379015851245, 'samples': 717344, 'steps': 1401, 'loss/train': 3.5703439712524414} -09/20/2021 19:20:32 - INFO - __main__ - Step 22418: {'lr': 0.00019991379015851245, 'samples': 717376, 'steps': 1401, 'loss/train': 4.062155246734619} -09/20/2021 19:20:32 - INFO - __main__ - Step 22419: {'lr': 0.00019991379015851245, 'samples': 717408, 'steps': 1401, 'loss/train': 5.025026321411133} -09/20/2021 19:20:33 - INFO - __main__ - Step 22420: {'lr': 0.00019991379015851245, 'samples': 717440, 'steps': 1401, 'loss/train': 2.6414084434509277} -09/20/2021 19:20:34 - INFO - __main__ - Step 22421: {'lr': 0.00019991379015851245, 'samples': 717472, 'steps': 1401, 'loss/train': 3.466386556625366} -09/20/2021 19:20:35 - INFO - __main__ - Step 22422: {'lr': 0.00019991379015851245, 'samples': 717504, 'steps': 1401, 'loss/train': 1.8832921981811523} -09/20/2021 19:20:35 - INFO - __main__ - Step 22423: {'lr': 0.00019991379015851245, 'samples': 717536, 'steps': 1401, 'loss/train': 2.748448371887207} -09/20/2021 19:20:36 - INFO - __main__ - Step 22424: {'lr': 0.00019991379015851245, 'samples': 717568, 'steps': 1401, 'loss/train': 2.837526321411133} -09/20/2021 19:20:37 - INFO - __main__ - Step 22425: {'lr': 0.00019991379015851245, 'samples': 717600, 'steps': 1401, 'loss/train': 3.737445592880249} -09/20/2021 19:20:38 - INFO - __main__ - Step 22426: {'lr': 0.00019991379015851245, 'samples': 717632, 'steps': 1401, 'loss/train': 3.3219282627105713} -09/20/2021 19:20:38 - INFO - __main__ - Step 22427: {'lr': 0.00019991379015851245, 'samples': 717664, 'steps': 1401, 'loss/train': 3.395235538482666} -09/20/2021 19:20:39 - INFO - __main__ - Step 22428: {'lr': 0.00019991379015851245, 'samples': 717696, 'steps': 1401, 'loss/train': 3.91365122795105} -09/20/2021 19:20:40 - INFO - __main__ - Step 22429: {'lr': 0.00019991379015851245, 'samples': 717728, 'steps': 1401, 'loss/train': 2.595958709716797} -09/20/2021 19:20:41 - INFO - __main__ - Step 22430: {'lr': 0.00019991379015851245, 'samples': 717760, 'steps': 1401, 'loss/train': 3.6444249153137207} -09/20/2021 19:20:41 - INFO - __main__ - Step 22431: {'lr': 0.00019991379015851245, 'samples': 717792, 'steps': 1401, 'loss/train': 3.265760898590088} -09/20/2021 19:20:42 - INFO - __main__ - Step 22432: {'lr': 0.00019991379015851245, 'samples': 717824, 'steps': 1401, 'loss/train': 2.8453550338745117} -09/20/2021 19:20:43 - INFO - __main__ - Step 22433: {'lr': 0.00019991352513971608, 'samples': 717856, 'steps': 1402, 'loss/train': 1.9823092222213745} -09/20/2021 19:20:44 - INFO - __main__ - Step 22434: {'lr': 0.00019991352513971608, 'samples': 717888, 'steps': 1402, 'loss/train': 2.9361720085144043} -09/20/2021 19:20:44 - INFO - __main__ - Step 22435: {'lr': 0.00019991352513971608, 'samples': 717920, 'steps': 1402, 'loss/train': 3.591648578643799} -09/20/2021 19:20:45 - INFO - __main__ - Step 22436: {'lr': 0.00019991352513971608, 'samples': 717952, 'steps': 1402, 'loss/train': 3.3569414615631104} -09/20/2021 19:20:46 - INFO - __main__ - Step 22437: {'lr': 0.00019991352513971608, 'samples': 717984, 'steps': 1402, 'loss/train': 1.6810144186019897} -09/20/2021 19:20:47 - INFO - __main__ - Step 22438: {'lr': 0.00019991352513971608, 'samples': 718016, 'steps': 1402, 'loss/train': 1.6823782920837402} -09/20/2021 19:20:47 - INFO - __main__ - Step 22439: {'lr': 0.00019991352513971608, 'samples': 718048, 'steps': 1402, 'loss/train': 1.653786540031433} -09/20/2021 19:20:48 - INFO - __main__ - Step 22440: {'lr': 0.00019991352513971608, 'samples': 718080, 'steps': 1402, 'loss/train': 1.5474553108215332} -09/20/2021 19:20:49 - INFO - __main__ - Step 22441: {'lr': 0.00019991352513971608, 'samples': 718112, 'steps': 1402, 'loss/train': 1.7570909261703491} -09/20/2021 19:20:50 - INFO - __main__ - Step 22442: {'lr': 0.00019991352513971608, 'samples': 718144, 'steps': 1402, 'loss/train': 1.9978059530258179} -09/20/2021 19:20:50 - INFO - __main__ - Step 22443: {'lr': 0.00019991352513971608, 'samples': 718176, 'steps': 1402, 'loss/train': 1.783894419670105} -09/20/2021 19:20:51 - INFO - __main__ - Step 22444: {'lr': 0.00019991352513971608, 'samples': 718208, 'steps': 1402, 'loss/train': 1.842037320137024} -09/20/2021 19:20:52 - INFO - __main__ - Step 22445: {'lr': 0.00019991352513971608, 'samples': 718240, 'steps': 1402, 'loss/train': 1.7609225511550903} -09/20/2021 19:20:53 - INFO - __main__ - Step 22446: {'lr': 0.00019991352513971608, 'samples': 718272, 'steps': 1402, 'loss/train': 2.9640913009643555} -09/20/2021 19:20:53 - INFO - __main__ - Step 22447: {'lr': 0.00019991352513971608, 'samples': 718304, 'steps': 1402, 'loss/train': 2.6324925422668457} -09/20/2021 19:20:54 - INFO - __main__ - Step 22448: {'lr': 0.00019991352513971608, 'samples': 718336, 'steps': 1402, 'loss/train': 3.0569286346435547} -09/20/2021 19:20:55 - INFO - __main__ - Step 22449: {'lr': 0.000199913259714372, 'samples': 718368, 'steps': 1403, 'loss/train': 2.766812801361084} -09/20/2021 19:20:56 - INFO - __main__ - Step 22450: {'lr': 0.000199913259714372, 'samples': 718400, 'steps': 1403, 'loss/train': 2.9438698291778564} -09/20/2021 19:20:57 - INFO - __main__ - Step 22451: {'lr': 0.000199913259714372, 'samples': 718432, 'steps': 1403, 'loss/train': 2.4117019176483154} -09/20/2021 19:20:58 - INFO - __main__ - Step 22452: {'lr': 0.000199913259714372, 'samples': 718464, 'steps': 1403, 'loss/train': 4.263749599456787} -09/20/2021 19:20:59 - INFO - __main__ - Step 22453: {'lr': 0.000199913259714372, 'samples': 718496, 'steps': 1403, 'loss/train': 3.317889451980591} -09/20/2021 19:20:59 - INFO - __main__ - Step 22454: {'lr': 0.000199913259714372, 'samples': 718528, 'steps': 1403, 'loss/train': 3.754920244216919} -09/20/2021 19:21:00 - INFO - __main__ - Step 22455: {'lr': 0.000199913259714372, 'samples': 718560, 'steps': 1403, 'loss/train': 3.359164237976074} -09/20/2021 19:21:01 - INFO - __main__ - Step 22456: {'lr': 0.000199913259714372, 'samples': 718592, 'steps': 1403, 'loss/train': 3.221967935562134} -09/20/2021 19:21:02 - INFO - __main__ - Step 22457: {'lr': 0.000199913259714372, 'samples': 718624, 'steps': 1403, 'loss/train': 3.2371082305908203} -09/20/2021 19:21:02 - INFO - __main__ - Step 22458: {'lr': 0.000199913259714372, 'samples': 718656, 'steps': 1403, 'loss/train': 3.6188764572143555} -09/20/2021 19:21:03 - INFO - __main__ - Step 22459: {'lr': 0.000199913259714372, 'samples': 718688, 'steps': 1403, 'loss/train': 3.4177753925323486} -09/20/2021 19:21:04 - INFO - __main__ - Step 22460: {'lr': 0.000199913259714372, 'samples': 718720, 'steps': 1403, 'loss/train': 2.8614420890808105} -09/20/2021 19:21:05 - INFO - __main__ - Step 22461: {'lr': 0.000199913259714372, 'samples': 718752, 'steps': 1403, 'loss/train': 2.9710171222686768} -09/20/2021 19:21:05 - INFO - __main__ - Step 22462: {'lr': 0.000199913259714372, 'samples': 718784, 'steps': 1403, 'loss/train': 3.229917287826538} -09/20/2021 19:21:06 - INFO - __main__ - Step 22463: {'lr': 0.000199913259714372, 'samples': 718816, 'steps': 1403, 'loss/train': 2.585052013397217} -09/20/2021 19:21:07 - INFO - __main__ - Step 22464: {'lr': 0.000199913259714372, 'samples': 718848, 'steps': 1403, 'loss/train': 2.952134370803833} -09/20/2021 19:21:08 - INFO - __main__ - Step 22465: {'lr': 0.00019991299388248118, 'samples': 718880, 'steps': 1404, 'loss/train': 3.541548252105713} -09/20/2021 19:21:09 - INFO - __main__ - Step 22466: {'lr': 0.00019991299388248118, 'samples': 718912, 'steps': 1404, 'loss/train': 2.6827504634857178} -09/20/2021 19:21:09 - INFO - __main__ - Step 22467: {'lr': 0.00019991299388248118, 'samples': 718944, 'steps': 1404, 'loss/train': 4.107794761657715} -09/20/2021 19:21:10 - INFO - __main__ - Step 22468: {'lr': 0.00019991299388248118, 'samples': 718976, 'steps': 1404, 'loss/train': 2.910874366760254} -09/20/2021 19:21:11 - INFO - __main__ - Step 22469: {'lr': 0.00019991299388248118, 'samples': 719008, 'steps': 1404, 'loss/train': 3.381626605987549} -09/20/2021 19:21:12 - INFO - __main__ - Step 22470: {'lr': 0.00019991299388248118, 'samples': 719040, 'steps': 1404, 'loss/train': 3.217034339904785} -09/20/2021 19:21:12 - INFO - __main__ - Step 22471: {'lr': 0.00019991299388248118, 'samples': 719072, 'steps': 1404, 'loss/train': 2.840517282485962} -09/20/2021 19:21:13 - INFO - __main__ - Step 22472: {'lr': 0.00019991299388248118, 'samples': 719104, 'steps': 1404, 'loss/train': 0.7608882188796997} -09/20/2021 19:21:14 - INFO - __main__ - Step 22473: {'lr': 0.00019991299388248118, 'samples': 719136, 'steps': 1404, 'loss/train': 0.5675144195556641} -09/20/2021 19:21:15 - INFO - __main__ - Step 22474: {'lr': 0.00019991299388248118, 'samples': 719168, 'steps': 1404, 'loss/train': 0.9263640642166138} -09/20/2021 19:21:15 - INFO - __main__ - Step 22475: {'lr': 0.00019991299388248118, 'samples': 719200, 'steps': 1404, 'loss/train': 0.43255510926246643} -09/20/2021 19:21:16 - INFO - __main__ - Step 22476: {'lr': 0.00019991299388248118, 'samples': 719232, 'steps': 1404, 'loss/train': 0.47972947359085083} -09/20/2021 19:21:17 - INFO - __main__ - Step 22477: {'lr': 0.00019991299388248118, 'samples': 719264, 'steps': 1404, 'loss/train': 3.7931063175201416} -09/20/2021 19:21:18 - INFO - __main__ - Step 22478: {'lr': 0.00019991299388248118, 'samples': 719296, 'steps': 1404, 'loss/train': 2.43269681930542} -09/20/2021 19:21:18 - INFO - __main__ - Step 22479: {'lr': 0.00019991299388248118, 'samples': 719328, 'steps': 1404, 'loss/train': 3.58026385307312} -09/20/2021 19:21:19 - INFO - __main__ - Step 22480: {'lr': 0.00019991299388248118, 'samples': 719360, 'steps': 1404, 'loss/train': 3.906003713607788} -09/20/2021 19:21:20 - INFO - __main__ - Step 22481: {'lr': 0.0001999127276440448, 'samples': 719392, 'steps': 1405, 'loss/train': 4.173460006713867} -09/20/2021 19:21:21 - INFO - __main__ - Step 22482: {'lr': 0.0001999127276440448, 'samples': 719424, 'steps': 1405, 'loss/train': 3.205540180206299} -09/20/2021 19:21:22 - INFO - __main__ - Step 22483: {'lr': 0.0001999127276440448, 'samples': 719456, 'steps': 1405, 'loss/train': 2.997901201248169} -09/20/2021 19:21:23 - INFO - __main__ - Step 22484: {'lr': 0.0001999127276440448, 'samples': 719488, 'steps': 1405, 'loss/train': 2.7958667278289795} -09/20/2021 19:21:23 - INFO - __main__ - Step 22485: {'lr': 0.0001999127276440448, 'samples': 719520, 'steps': 1405, 'loss/train': 2.6899890899658203} -09/20/2021 19:21:24 - INFO - __main__ - Step 22486: {'lr': 0.0001999127276440448, 'samples': 719552, 'steps': 1405, 'loss/train': 2.469433546066284} -09/20/2021 19:21:25 - INFO - __main__ - Step 22487: {'lr': 0.0001999127276440448, 'samples': 719584, 'steps': 1405, 'loss/train': 1.1444140672683716} -09/20/2021 19:21:26 - INFO - __main__ - Step 22488: {'lr': 0.0001999127276440448, 'samples': 719616, 'steps': 1405, 'loss/train': 2.8867766857147217} -09/20/2021 19:21:26 - INFO - __main__ - Step 22489: {'lr': 0.0001999127276440448, 'samples': 719648, 'steps': 1405, 'loss/train': 3.128859281539917} -09/20/2021 19:21:27 - INFO - __main__ - Step 22490: {'lr': 0.0001999127276440448, 'samples': 719680, 'steps': 1405, 'loss/train': 4.568650722503662} -09/20/2021 19:21:28 - INFO - __main__ - Step 22491: {'lr': 0.0001999127276440448, 'samples': 719712, 'steps': 1405, 'loss/train': 3.206878423690796} -09/20/2021 19:21:29 - INFO - __main__ - Step 22492: {'lr': 0.0001999127276440448, 'samples': 719744, 'steps': 1405, 'loss/train': 3.4671618938446045} -09/20/2021 19:21:30 - INFO - __main__ - Step 22493: {'lr': 0.0001999127276440448, 'samples': 719776, 'steps': 1405, 'loss/train': 3.7221388816833496} -09/20/2021 19:21:30 - INFO - __main__ - Step 22494: {'lr': 0.0001999127276440448, 'samples': 719808, 'steps': 1405, 'loss/train': 2.097979784011841} -09/20/2021 19:21:31 - INFO - __main__ - Step 22495: {'lr': 0.0001999127276440448, 'samples': 719840, 'steps': 1405, 'loss/train': 2.267528772354126} -09/20/2021 19:21:32 - INFO - __main__ - Step 22496: {'lr': 0.0001999127276440448, 'samples': 719872, 'steps': 1405, 'loss/train': 2.8042211532592773} -09/20/2021 19:21:33 - INFO - __main__ - Step 22497: {'lr': 0.00019991246099906396, 'samples': 719904, 'steps': 1406, 'loss/train': 3.7500159740448} -09/20/2021 19:21:33 - INFO - __main__ - Step 22498: {'lr': 0.00019991246099906396, 'samples': 719936, 'steps': 1406, 'loss/train': 3.323296070098877} -09/20/2021 19:21:34 - INFO - __main__ - Step 22499: {'lr': 0.00019991246099906396, 'samples': 719968, 'steps': 1406, 'loss/train': 2.9030966758728027} -09/20/2021 19:21:35 - INFO - __main__ - Step 22500: {'lr': 0.00019991246099906396, 'samples': 720000, 'steps': 1406, 'loss/train': 2.7387428283691406} -09/20/2021 19:21:36 - INFO - __main__ - Step 22501: {'lr': 0.00019991246099906396, 'samples': 720032, 'steps': 1406, 'loss/train': 2.57391619682312} -09/20/2021 19:21:36 - INFO - __main__ - Step 22502: {'lr': 0.00019991246099906396, 'samples': 720064, 'steps': 1406, 'loss/train': 3.280245542526245} -09/20/2021 19:21:37 - INFO - __main__ - Step 22503: {'lr': 0.00019991246099906396, 'samples': 720096, 'steps': 1406, 'loss/train': 3.510564088821411} -09/20/2021 19:21:38 - INFO - __main__ - Step 22504: {'lr': 0.00019991246099906396, 'samples': 720128, 'steps': 1406, 'loss/train': 2.4239065647125244} -09/20/2021 19:21:39 - INFO - __main__ - Step 22505: {'lr': 0.00019991246099906396, 'samples': 720160, 'steps': 1406, 'loss/train': 2.142624855041504} -09/20/2021 19:21:39 - INFO - __main__ - Step 22506: {'lr': 0.00019991246099906396, 'samples': 720192, 'steps': 1406, 'loss/train': 2.945509910583496} -09/20/2021 19:21:40 - INFO - __main__ - Step 22507: {'lr': 0.00019991246099906396, 'samples': 720224, 'steps': 1406, 'loss/train': 3.692286729812622} -09/20/2021 19:21:41 - INFO - __main__ - Step 22508: {'lr': 0.00019991246099906396, 'samples': 720256, 'steps': 1406, 'loss/train': 5.084542274475098} -09/20/2021 19:21:42 - INFO - __main__ - Step 22509: {'lr': 0.00019991246099906396, 'samples': 720288, 'steps': 1406, 'loss/train': 3.2267208099365234} -09/20/2021 19:21:42 - INFO - __main__ - Step 22510: {'lr': 0.00019991246099906396, 'samples': 720320, 'steps': 1406, 'loss/train': 2.66015625} -09/20/2021 19:21:44 - INFO - __main__ - Step 22511: {'lr': 0.00019991246099906396, 'samples': 720352, 'steps': 1406, 'loss/train': 2.967414379119873} -09/20/2021 19:21:44 - INFO - __main__ - Step 22512: {'lr': 0.00019991246099906396, 'samples': 720384, 'steps': 1406, 'loss/train': 3.478778600692749} -09/20/2021 19:21:45 - INFO - __main__ - Step 22513: {'lr': 0.00019991219394753965, 'samples': 720416, 'steps': 1407, 'loss/train': 2.494277238845825} -09/20/2021 19:21:46 - INFO - __main__ - Step 22514: {'lr': 0.00019991219394753965, 'samples': 720448, 'steps': 1407, 'loss/train': 2.932210683822632} -09/20/2021 19:21:47 - INFO - __main__ - Step 22515: {'lr': 0.00019991219394753965, 'samples': 720480, 'steps': 1407, 'loss/train': 3.3150715827941895} -09/20/2021 19:21:48 - INFO - __main__ - Step 22516: {'lr': 0.00019991219394753965, 'samples': 720512, 'steps': 1407, 'loss/train': 3.2125091552734375} -09/20/2021 19:21:48 - INFO - __main__ - Step 22517: {'lr': 0.00019991219394753965, 'samples': 720544, 'steps': 1407, 'loss/train': 3.7426271438598633} -09/20/2021 19:21:49 - INFO - __main__ - Step 22518: {'lr': 0.00019991219394753965, 'samples': 720576, 'steps': 1407, 'loss/train': 3.3035056591033936} -09/20/2021 19:21:50 - INFO - __main__ - Step 22519: {'lr': 0.00019991219394753965, 'samples': 720608, 'steps': 1407, 'loss/train': 2.8218207359313965} -09/20/2021 19:21:51 - INFO - __main__ - Step 22520: {'lr': 0.00019991219394753965, 'samples': 720640, 'steps': 1407, 'loss/train': 3.869767665863037} -09/20/2021 19:21:51 - INFO - __main__ - Step 22521: {'lr': 0.00019991219394753965, 'samples': 720672, 'steps': 1407, 'loss/train': 3.4266579151153564} -09/20/2021 19:21:52 - INFO - __main__ - Step 22522: {'lr': 0.00019991219394753965, 'samples': 720704, 'steps': 1407, 'loss/train': 2.4654324054718018} -09/20/2021 19:21:53 - INFO - __main__ - Step 22523: {'lr': 0.00019991219394753965, 'samples': 720736, 'steps': 1407, 'loss/train': 3.0747313499450684} -09/20/2021 19:21:54 - INFO - __main__ - Step 22524: {'lr': 0.00019991219394753965, 'samples': 720768, 'steps': 1407, 'loss/train': 2.855018138885498} -09/20/2021 19:21:54 - INFO - __main__ - Step 22525: {'lr': 0.00019991219394753965, 'samples': 720800, 'steps': 1407, 'loss/train': 2.9083411693573} -09/20/2021 19:21:55 - INFO - __main__ - Step 22526: {'lr': 0.00019991219394753965, 'samples': 720832, 'steps': 1407, 'loss/train': 3.945490837097168} -09/20/2021 19:21:56 - INFO - __main__ - Step 22527: {'lr': 0.00019991219394753965, 'samples': 720864, 'steps': 1407, 'loss/train': 2.3122925758361816} -09/20/2021 19:21:57 - INFO - __main__ - Step 22528: {'lr': 0.00019991219394753965, 'samples': 720896, 'steps': 1407, 'loss/train': 3.209526777267456} -09/20/2021 19:21:57 - INFO - __main__ - Step 22529: {'lr': 0.00019991192648947305, 'samples': 720928, 'steps': 1408, 'loss/train': 3.7290711402893066} -09/20/2021 19:21:58 - INFO - __main__ - Step 22530: {'lr': 0.00019991192648947305, 'samples': 720960, 'steps': 1408, 'loss/train': 4.157434463500977} -09/20/2021 19:21:59 - INFO - __main__ - Step 22531: {'lr': 0.00019991192648947305, 'samples': 720992, 'steps': 1408, 'loss/train': 3.0078539848327637} -09/20/2021 19:22:00 - INFO - __main__ - Step 22532: {'lr': 0.00019991192648947305, 'samples': 721024, 'steps': 1408, 'loss/train': 3.492844581604004} -09/20/2021 19:22:00 - INFO - __main__ - Step 22533: {'lr': 0.00019991192648947305, 'samples': 721056, 'steps': 1408, 'loss/train': 3.35255765914917} -09/20/2021 19:22:01 - INFO - __main__ - Step 22534: {'lr': 0.00019991192648947305, 'samples': 721088, 'steps': 1408, 'loss/train': 2.6356141567230225} -09/20/2021 19:22:02 - INFO - __main__ - Step 22535: {'lr': 0.00019991192648947305, 'samples': 721120, 'steps': 1408, 'loss/train': 2.8945045471191406} -09/20/2021 19:22:03 - INFO - __main__ - Step 22536: {'lr': 0.00019991192648947305, 'samples': 721152, 'steps': 1408, 'loss/train': 3.012545108795166} -09/20/2021 19:22:03 - INFO - __main__ - Step 22537: {'lr': 0.00019991192648947305, 'samples': 721184, 'steps': 1408, 'loss/train': 3.083545684814453} -09/20/2021 19:22:04 - INFO - __main__ - Step 22538: {'lr': 0.00019991192648947305, 'samples': 721216, 'steps': 1408, 'loss/train': 3.813467264175415} -09/20/2021 19:22:05 - INFO - __main__ - Step 22539: {'lr': 0.00019991192648947305, 'samples': 721248, 'steps': 1408, 'loss/train': 2.843980550765991} -09/20/2021 19:22:06 - INFO - __main__ - Step 22540: {'lr': 0.00019991192648947305, 'samples': 721280, 'steps': 1408, 'loss/train': 3.3125112056732178} -09/20/2021 19:22:06 - INFO - __main__ - Step 22541: {'lr': 0.00019991192648947305, 'samples': 721312, 'steps': 1408, 'loss/train': 3.285346031188965} -09/20/2021 19:22:08 - INFO - __main__ - Step 22542: {'lr': 0.00019991192648947305, 'samples': 721344, 'steps': 1408, 'loss/train': 1.416029930114746} -09/20/2021 19:22:09 - INFO - __main__ - Step 22543: {'lr': 0.00019991192648947305, 'samples': 721376, 'steps': 1408, 'loss/train': 3.2496964931488037} -09/20/2021 19:22:09 - INFO - __main__ - Step 22544: {'lr': 0.00019991192648947305, 'samples': 721408, 'steps': 1408, 'loss/train': 0.6149399876594543} -09/20/2021 19:22:10 - INFO - __main__ - Step 22545: {'lr': 0.0001999116586248652, 'samples': 721440, 'steps': 1409, 'loss/train': 3.540264129638672} -09/20/2021 19:22:11 - INFO - __main__ - Step 22546: {'lr': 0.0001999116586248652, 'samples': 721472, 'steps': 1409, 'loss/train': 3.317911386489868} -09/20/2021 19:22:12 - INFO - __main__ - Step 22547: {'lr': 0.0001999116586248652, 'samples': 721504, 'steps': 1409, 'loss/train': 3.1728925704956055} -09/20/2021 19:22:12 - INFO - __main__ - Step 22548: {'lr': 0.0001999116586248652, 'samples': 721536, 'steps': 1409, 'loss/train': 2.796454429626465} -09/20/2021 19:22:13 - INFO - __main__ - Step 22549: {'lr': 0.0001999116586248652, 'samples': 721568, 'steps': 1409, 'loss/train': 2.527249813079834} -09/20/2021 19:22:14 - INFO - __main__ - Step 22550: {'lr': 0.0001999116586248652, 'samples': 721600, 'steps': 1409, 'loss/train': 3.4485790729522705} -09/20/2021 19:22:15 - INFO - __main__ - Step 22551: {'lr': 0.0001999116586248652, 'samples': 721632, 'steps': 1409, 'loss/train': 3.5078794956207275} -09/20/2021 19:22:15 - INFO - __main__ - Step 22552: {'lr': 0.0001999116586248652, 'samples': 721664, 'steps': 1409, 'loss/train': 3.0494794845581055} -09/20/2021 19:22:16 - INFO - __main__ - Step 22553: {'lr': 0.0001999116586248652, 'samples': 721696, 'steps': 1409, 'loss/train': 2.169459819793701} -09/20/2021 19:22:17 - INFO - __main__ - Step 22554: {'lr': 0.0001999116586248652, 'samples': 721728, 'steps': 1409, 'loss/train': 3.13627552986145} -09/20/2021 19:22:18 - INFO - __main__ - Step 22555: {'lr': 0.0001999116586248652, 'samples': 721760, 'steps': 1409, 'loss/train': 3.4219119548797607} -09/20/2021 19:22:18 - INFO - __main__ - Step 22556: {'lr': 0.0001999116586248652, 'samples': 721792, 'steps': 1409, 'loss/train': 3.6492035388946533} -09/20/2021 19:22:19 - INFO - __main__ - Step 22557: {'lr': 0.0001999116586248652, 'samples': 721824, 'steps': 1409, 'loss/train': 3.049710273742676} -09/20/2021 19:22:20 - INFO - __main__ - Step 22558: {'lr': 0.0001999116586248652, 'samples': 721856, 'steps': 1409, 'loss/train': 3.172700881958008} -09/20/2021 19:22:21 - INFO - __main__ - Step 22559: {'lr': 0.0001999116586248652, 'samples': 721888, 'steps': 1409, 'loss/train': 2.5946428775787354} -09/20/2021 19:22:21 - INFO - __main__ - Step 22560: {'lr': 0.0001999116586248652, 'samples': 721920, 'steps': 1409, 'loss/train': 4.077792644500732} -09/20/2021 19:22:22 - INFO - __main__ - Step 22561: {'lr': 0.00019991139035371717, 'samples': 721952, 'steps': 1410, 'loss/train': 3.9469282627105713} -09/20/2021 19:22:23 - INFO - __main__ - Step 22562: {'lr': 0.00019991139035371717, 'samples': 721984, 'steps': 1410, 'loss/train': 3.323887825012207} -09/20/2021 19:22:24 - INFO - __main__ - Step 22563: {'lr': 0.00019991139035371717, 'samples': 722016, 'steps': 1410, 'loss/train': 3.4141900539398193} -09/20/2021 19:22:25 - INFO - __main__ - Step 22564: {'lr': 0.00019991139035371717, 'samples': 722048, 'steps': 1410, 'loss/train': 3.0908172130584717} -09/20/2021 19:22:25 - INFO - __main__ - Step 22565: {'lr': 0.00019991139035371717, 'samples': 722080, 'steps': 1410, 'loss/train': 3.208425998687744} -09/20/2021 19:22:26 - INFO - __main__ - Step 22566: {'lr': 0.00019991139035371717, 'samples': 722112, 'steps': 1410, 'loss/train': 2.9350810050964355} -09/20/2021 19:22:27 - INFO - __main__ - Step 22567: {'lr': 0.00019991139035371717, 'samples': 722144, 'steps': 1410, 'loss/train': 3.365391731262207} -09/20/2021 19:22:28 - INFO - __main__ - Step 22568: {'lr': 0.00019991139035371717, 'samples': 722176, 'steps': 1410, 'loss/train': 3.8000855445861816} -09/20/2021 19:22:28 - INFO - __main__ - Step 22569: {'lr': 0.00019991139035371717, 'samples': 722208, 'steps': 1410, 'loss/train': 3.2566773891448975} -09/20/2021 19:22:29 - INFO - __main__ - Step 22570: {'lr': 0.00019991139035371717, 'samples': 722240, 'steps': 1410, 'loss/train': 3.4995508193969727} -09/20/2021 19:22:30 - INFO - __main__ - Step 22571: {'lr': 0.00019991139035371717, 'samples': 722272, 'steps': 1410, 'loss/train': 2.7239322662353516} -09/20/2021 19:22:31 - INFO - __main__ - Step 22572: {'lr': 0.00019991139035371717, 'samples': 722304, 'steps': 1410, 'loss/train': 3.2961854934692383} -09/20/2021 19:22:32 - INFO - __main__ - Step 22573: {'lr': 0.00019991139035371717, 'samples': 722336, 'steps': 1410, 'loss/train': 3.8690402507781982} -09/20/2021 19:22:33 - INFO - __main__ - Step 22574: {'lr': 0.00019991139035371717, 'samples': 722368, 'steps': 1410, 'loss/train': 2.4820077419281006} -09/20/2021 19:22:33 - INFO - __main__ - Step 22575: {'lr': 0.00019991139035371717, 'samples': 722400, 'steps': 1410, 'loss/train': 4.2521257400512695} -09/20/2021 19:22:34 - INFO - __main__ - Step 22576: {'lr': 0.00019991139035371717, 'samples': 722432, 'steps': 1410, 'loss/train': 2.3093926906585693} -09/20/2021 19:22:35 - INFO - __main__ - Step 22577: {'lr': 0.0001999111216760301, 'samples': 722464, 'steps': 1411, 'loss/train': 3.662715196609497} -09/20/2021 19:22:36 - INFO - __main__ - Step 22578: {'lr': 0.0001999111216760301, 'samples': 722496, 'steps': 1411, 'loss/train': 1.7225069999694824} -09/20/2021 19:22:36 - INFO - __main__ - Step 22579: {'lr': 0.0001999111216760301, 'samples': 722528, 'steps': 1411, 'loss/train': 3.359335422515869} -09/20/2021 19:22:37 - INFO - __main__ - Step 22580: {'lr': 0.0001999111216760301, 'samples': 722560, 'steps': 1411, 'loss/train': 3.1656289100646973} -09/20/2021 19:22:38 - INFO - __main__ - Step 22581: {'lr': 0.0001999111216760301, 'samples': 722592, 'steps': 1411, 'loss/train': 3.8354218006134033} -09/20/2021 19:22:39 - INFO - __main__ - Step 22582: {'lr': 0.0001999111216760301, 'samples': 722624, 'steps': 1411, 'loss/train': 1.7405753135681152} -09/20/2021 19:22:39 - INFO - __main__ - Step 22583: {'lr': 0.0001999111216760301, 'samples': 722656, 'steps': 1411, 'loss/train': 2.886902332305908} -09/20/2021 19:22:40 - INFO - __main__ - Step 22584: {'lr': 0.0001999111216760301, 'samples': 722688, 'steps': 1411, 'loss/train': 3.1697750091552734} -09/20/2021 19:22:41 - INFO - __main__ - Step 22585: {'lr': 0.0001999111216760301, 'samples': 722720, 'steps': 1411, 'loss/train': 0.7658512592315674} -09/20/2021 19:22:42 - INFO - __main__ - Step 22586: {'lr': 0.0001999111216760301, 'samples': 722752, 'steps': 1411, 'loss/train': 1.730344533920288} -09/20/2021 19:22:42 - INFO - __main__ - Step 22587: {'lr': 0.0001999111216760301, 'samples': 722784, 'steps': 1411, 'loss/train': 3.6043272018432617} -09/20/2021 19:22:43 - INFO - __main__ - Step 22588: {'lr': 0.0001999111216760301, 'samples': 722816, 'steps': 1411, 'loss/train': 2.6145546436309814} -09/20/2021 19:22:44 - INFO - __main__ - Step 22589: {'lr': 0.0001999111216760301, 'samples': 722848, 'steps': 1411, 'loss/train': 3.054504632949829} -09/20/2021 19:22:45 - INFO - __main__ - Step 22590: {'lr': 0.0001999111216760301, 'samples': 722880, 'steps': 1411, 'loss/train': 2.535461187362671} -09/20/2021 19:22:45 - INFO - __main__ - Step 22591: {'lr': 0.0001999111216760301, 'samples': 722912, 'steps': 1411, 'loss/train': 3.295219898223877} -09/20/2021 19:22:46 - INFO - __main__ - Step 22592: {'lr': 0.0001999111216760301, 'samples': 722944, 'steps': 1411, 'loss/train': 3.2146425247192383} -09/20/2021 19:22:47 - INFO - __main__ - Step 22593: {'lr': 0.00019991085259180507, 'samples': 722976, 'steps': 1412, 'loss/train': 2.5938897132873535} -09/20/2021 19:22:48 - INFO - __main__ - Step 22594: {'lr': 0.00019991085259180507, 'samples': 723008, 'steps': 1412, 'loss/train': 1.7473922967910767} -09/20/2021 19:22:49 - INFO - __main__ - Step 22595: {'lr': 0.00019991085259180507, 'samples': 723040, 'steps': 1412, 'loss/train': 2.4688494205474854} -09/20/2021 19:22:49 - INFO - __main__ - Step 22596: {'lr': 0.00019991085259180507, 'samples': 723072, 'steps': 1412, 'loss/train': 3.1480791568756104} -09/20/2021 19:22:50 - INFO - __main__ - Step 22597: {'lr': 0.00019991085259180507, 'samples': 723104, 'steps': 1412, 'loss/train': 3.2184250354766846} -09/20/2021 19:22:51 - INFO - __main__ - Step 22598: {'lr': 0.00019991085259180507, 'samples': 723136, 'steps': 1412, 'loss/train': 3.2386980056762695} -09/20/2021 19:22:52 - INFO - __main__ - Step 22599: {'lr': 0.00019991085259180507, 'samples': 723168, 'steps': 1412, 'loss/train': 3.474663496017456} -09/20/2021 19:22:52 - INFO - __main__ - Step 22600: {'lr': 0.00019991085259180507, 'samples': 723200, 'steps': 1412, 'loss/train': 3.5768415927886963} -09/20/2021 19:22:53 - INFO - __main__ - Step 22601: {'lr': 0.00019991085259180507, 'samples': 723232, 'steps': 1412, 'loss/train': 2.881230592727661} -09/20/2021 19:22:54 - INFO - __main__ - Step 22602: {'lr': 0.00019991085259180507, 'samples': 723264, 'steps': 1412, 'loss/train': 3.8449008464813232} -09/20/2021 19:22:55 - INFO - __main__ - Step 22603: {'lr': 0.00019991085259180507, 'samples': 723296, 'steps': 1412, 'loss/train': 2.877931833267212} -09/20/2021 19:22:56 - INFO - __main__ - Step 22604: {'lr': 0.00019991085259180507, 'samples': 723328, 'steps': 1412, 'loss/train': 2.7024824619293213} -09/20/2021 19:22:57 - INFO - __main__ - Step 22605: {'lr': 0.00019991085259180507, 'samples': 723360, 'steps': 1412, 'loss/train': 3.326364040374756} -09/20/2021 19:22:58 - INFO - __main__ - Step 22606: {'lr': 0.00019991085259180507, 'samples': 723392, 'steps': 1412, 'loss/train': 3.6179213523864746} -09/20/2021 19:22:59 - INFO - __main__ - Step 22607: {'lr': 0.00019991085259180507, 'samples': 723424, 'steps': 1412, 'loss/train': 3.1466269493103027} -09/20/2021 19:22:59 - INFO - __main__ - Step 22608: {'lr': 0.00019991085259180507, 'samples': 723456, 'steps': 1412, 'loss/train': 2.8902060985565186} -09/20/2021 19:23:00 - INFO - __main__ - Step 22609: {'lr': 0.00019991058310104317, 'samples': 723488, 'steps': 1413, 'loss/train': 3.3855884075164795} -09/20/2021 19:23:01 - INFO - __main__ - Step 22610: {'lr': 0.00019991058310104317, 'samples': 723520, 'steps': 1413, 'loss/train': 3.2201433181762695} -09/20/2021 19:23:02 - INFO - __main__ - Step 22611: {'lr': 0.00019991058310104317, 'samples': 723552, 'steps': 1413, 'loss/train': 3.9557816982269287} -09/20/2021 19:23:02 - INFO - __main__ - Step 22612: {'lr': 0.00019991058310104317, 'samples': 723584, 'steps': 1413, 'loss/train': 3.385396718978882} -09/20/2021 19:23:03 - INFO - __main__ - Step 22613: {'lr': 0.00019991058310104317, 'samples': 723616, 'steps': 1413, 'loss/train': 3.900390148162842} -09/20/2021 19:23:04 - INFO - __main__ - Step 22614: {'lr': 0.00019991058310104317, 'samples': 723648, 'steps': 1413, 'loss/train': 2.3270552158355713} -09/20/2021 19:23:05 - INFO - __main__ - Step 22615: {'lr': 0.00019991058310104317, 'samples': 723680, 'steps': 1413, 'loss/train': 2.155442237854004} -09/20/2021 19:23:05 - INFO - __main__ - Step 22616: {'lr': 0.00019991058310104317, 'samples': 723712, 'steps': 1413, 'loss/train': 1.9730076789855957} -09/20/2021 19:23:06 - INFO - __main__ - Step 22617: {'lr': 0.00019991058310104317, 'samples': 723744, 'steps': 1413, 'loss/train': 2.999185085296631} -09/20/2021 19:23:07 - INFO - __main__ - Step 22618: {'lr': 0.00019991058310104317, 'samples': 723776, 'steps': 1413, 'loss/train': 2.38277006149292} -09/20/2021 19:23:08 - INFO - __main__ - Step 22619: {'lr': 0.00019991058310104317, 'samples': 723808, 'steps': 1413, 'loss/train': 2.8666062355041504} -09/20/2021 19:23:08 - INFO - __main__ - Step 22620: {'lr': 0.00019991058310104317, 'samples': 723840, 'steps': 1413, 'loss/train': 3.270596981048584} -09/20/2021 19:23:09 - INFO - __main__ - Step 22621: {'lr': 0.00019991058310104317, 'samples': 723872, 'steps': 1413, 'loss/train': 2.908104181289673} -09/20/2021 19:23:10 - INFO - __main__ - Step 22622: {'lr': 0.00019991058310104317, 'samples': 723904, 'steps': 1413, 'loss/train': 2.7580697536468506} -09/20/2021 19:23:11 - INFO - __main__ - Step 22623: {'lr': 0.00019991058310104317, 'samples': 723936, 'steps': 1413, 'loss/train': 2.975858211517334} -09/20/2021 19:23:11 - INFO - __main__ - Step 22624: {'lr': 0.00019991058310104317, 'samples': 723968, 'steps': 1413, 'loss/train': 2.7859151363372803} -09/20/2021 19:23:12 - INFO - __main__ - Step 22625: {'lr': 0.0001999103132037455, 'samples': 724000, 'steps': 1414, 'loss/train': 2.298819065093994} -09/20/2021 19:23:13 - INFO - __main__ - Step 22626: {'lr': 0.0001999103132037455, 'samples': 724032, 'steps': 1414, 'loss/train': 3.123823881149292} -09/20/2021 19:23:14 - INFO - __main__ - Step 22627: {'lr': 0.0001999103132037455, 'samples': 724064, 'steps': 1414, 'loss/train': 3.4771881103515625} -09/20/2021 19:23:15 - INFO - __main__ - Step 22628: {'lr': 0.0001999103132037455, 'samples': 724096, 'steps': 1414, 'loss/train': 2.104020357131958} -09/20/2021 19:23:15 - INFO - __main__ - Step 22629: {'lr': 0.0001999103132037455, 'samples': 724128, 'steps': 1414, 'loss/train': 2.6442923545837402} -09/20/2021 19:23:16 - INFO - __main__ - Step 22630: {'lr': 0.0001999103132037455, 'samples': 724160, 'steps': 1414, 'loss/train': 3.6205883026123047} -09/20/2021 19:23:17 - INFO - __main__ - Step 22631: {'lr': 0.0001999103132037455, 'samples': 724192, 'steps': 1414, 'loss/train': 2.473237991333008} -09/20/2021 19:23:18 - INFO - __main__ - Step 22632: {'lr': 0.0001999103132037455, 'samples': 724224, 'steps': 1414, 'loss/train': 2.2382652759552} -09/20/2021 19:23:18 - INFO - __main__ - Step 22633: {'lr': 0.0001999103132037455, 'samples': 724256, 'steps': 1414, 'loss/train': 2.37800669670105} -09/20/2021 19:23:19 - INFO - __main__ - Step 22634: {'lr': 0.0001999103132037455, 'samples': 724288, 'steps': 1414, 'loss/train': 2.369189500808716} -09/20/2021 19:23:20 - INFO - __main__ - Step 22635: {'lr': 0.0001999103132037455, 'samples': 724320, 'steps': 1414, 'loss/train': 2.4266161918640137} -09/20/2021 19:23:21 - INFO - __main__ - Step 22636: {'lr': 0.0001999103132037455, 'samples': 724352, 'steps': 1414, 'loss/train': 2.0370826721191406} -09/20/2021 19:23:21 - INFO - __main__ - Step 22637: {'lr': 0.0001999103132037455, 'samples': 724384, 'steps': 1414, 'loss/train': 2.199500322341919} -09/20/2021 19:23:22 - INFO - __main__ - Step 22638: {'lr': 0.0001999103132037455, 'samples': 724416, 'steps': 1414, 'loss/train': 2.3060221672058105} -09/20/2021 19:23:23 - INFO - __main__ - Step 22639: {'lr': 0.0001999103132037455, 'samples': 724448, 'steps': 1414, 'loss/train': 1.9660985469818115} -09/20/2021 19:23:24 - INFO - __main__ - Step 22640: {'lr': 0.0001999103132037455, 'samples': 724480, 'steps': 1414, 'loss/train': 2.9947245121002197} -09/20/2021 19:23:25 - INFO - __main__ - Step 22641: {'lr': 0.00019991004289991314, 'samples': 724512, 'steps': 1415, 'loss/train': 3.1152167320251465} -09/20/2021 19:23:26 - INFO - __main__ - Step 22642: {'lr': 0.00019991004289991314, 'samples': 724544, 'steps': 1415, 'loss/train': 3.1583938598632812} -09/20/2021 19:23:27 - INFO - __main__ - Step 22643: {'lr': 0.00019991004289991314, 'samples': 724576, 'steps': 1415, 'loss/train': 2.506735324859619} -09/20/2021 19:23:27 - INFO - __main__ - Step 22644: {'lr': 0.00019991004289991314, 'samples': 724608, 'steps': 1415, 'loss/train': 3.8188860416412354} -09/20/2021 19:23:28 - INFO - __main__ - Step 22645: {'lr': 0.00019991004289991314, 'samples': 724640, 'steps': 1415, 'loss/train': 3.3632893562316895} -09/20/2021 19:23:29 - INFO - __main__ - Step 22646: {'lr': 0.00019991004289991314, 'samples': 724672, 'steps': 1415, 'loss/train': 2.991293430328369} -09/20/2021 19:23:30 - INFO - __main__ - Step 22647: {'lr': 0.00019991004289991314, 'samples': 724704, 'steps': 1415, 'loss/train': 1.056067705154419} -09/20/2021 19:23:30 - INFO - __main__ - Step 22648: {'lr': 0.00019991004289991314, 'samples': 724736, 'steps': 1415, 'loss/train': 3.5857417583465576} -09/20/2021 19:23:31 - INFO - __main__ - Step 22649: {'lr': 0.00019991004289991314, 'samples': 724768, 'steps': 1415, 'loss/train': 3.418391227722168} -09/20/2021 19:23:32 - INFO - __main__ - Step 22650: {'lr': 0.00019991004289991314, 'samples': 724800, 'steps': 1415, 'loss/train': 1.155182123184204} -09/20/2021 19:23:33 - INFO - __main__ - Step 22651: {'lr': 0.00019991004289991314, 'samples': 724832, 'steps': 1415, 'loss/train': 4.083247184753418} -09/20/2021 19:23:33 - INFO - __main__ - Step 22652: {'lr': 0.00019991004289991314, 'samples': 724864, 'steps': 1415, 'loss/train': 1.8560806512832642} -09/20/2021 19:23:34 - INFO - __main__ - Step 22653: {'lr': 0.00019991004289991314, 'samples': 724896, 'steps': 1415, 'loss/train': 3.659240484237671} -09/20/2021 19:23:35 - INFO - __main__ - Step 22654: {'lr': 0.00019991004289991314, 'samples': 724928, 'steps': 1415, 'loss/train': 3.588131904602051} -09/20/2021 19:23:36 - INFO - __main__ - Step 22655: {'lr': 0.00019991004289991314, 'samples': 724960, 'steps': 1415, 'loss/train': 2.1572821140289307} -09/20/2021 19:23:36 - INFO - __main__ - Step 22656: {'lr': 0.00019991004289991314, 'samples': 724992, 'steps': 1415, 'loss/train': 3.77634596824646} -09/20/2021 19:23:37 - INFO - __main__ - Step 22657: {'lr': 0.0001999097721895472, 'samples': 725024, 'steps': 1416, 'loss/train': 1.322374939918518} -09/20/2021 19:23:38 - INFO - __main__ - Step 22658: {'lr': 0.0001999097721895472, 'samples': 725056, 'steps': 1416, 'loss/train': 3.8214190006256104} -09/20/2021 19:23:39 - INFO - __main__ - Step 22659: {'lr': 0.0001999097721895472, 'samples': 725088, 'steps': 1416, 'loss/train': 3.3402650356292725} -09/20/2021 19:23:39 - INFO - __main__ - Step 22660: {'lr': 0.0001999097721895472, 'samples': 725120, 'steps': 1416, 'loss/train': 0.5103558897972107} -09/20/2021 19:23:40 - INFO - __main__ - Step 22661: {'lr': 0.0001999097721895472, 'samples': 725152, 'steps': 1416, 'loss/train': 0.6723296642303467} -09/20/2021 19:23:41 - INFO - __main__ - Step 22662: {'lr': 0.0001999097721895472, 'samples': 725184, 'steps': 1416, 'loss/train': 3.1922011375427246} -09/20/2021 19:23:42 - INFO - __main__ - Step 22663: {'lr': 0.0001999097721895472, 'samples': 725216, 'steps': 1416, 'loss/train': 2.3589026927948} -09/20/2021 19:23:42 - INFO - __main__ - Step 22664: {'lr': 0.0001999097721895472, 'samples': 725248, 'steps': 1416, 'loss/train': 1.5080270767211914} -09/20/2021 19:23:43 - INFO - __main__ - Step 22665: {'lr': 0.0001999097721895472, 'samples': 725280, 'steps': 1416, 'loss/train': 3.967676877975464} -09/20/2021 19:23:44 - INFO - __main__ - Step 22666: {'lr': 0.0001999097721895472, 'samples': 725312, 'steps': 1416, 'loss/train': 2.8949713706970215} -09/20/2021 19:23:45 - INFO - __main__ - Step 22667: {'lr': 0.0001999097721895472, 'samples': 725344, 'steps': 1416, 'loss/train': 2.335942268371582} -09/20/2021 19:23:45 - INFO - __main__ - Step 22668: {'lr': 0.0001999097721895472, 'samples': 725376, 'steps': 1416, 'loss/train': 3.7819783687591553} -09/20/2021 19:23:46 - INFO - __main__ - Step 22669: {'lr': 0.0001999097721895472, 'samples': 725408, 'steps': 1416, 'loss/train': 3.119845151901245} -09/20/2021 19:23:48 - INFO - __main__ - Step 22670: {'lr': 0.0001999097721895472, 'samples': 725440, 'steps': 1416, 'loss/train': 3.425569534301758} -09/20/2021 19:23:49 - INFO - __main__ - Step 22671: {'lr': 0.0001999097721895472, 'samples': 725472, 'steps': 1416, 'loss/train': 2.9086639881134033} -09/20/2021 19:23:50 - INFO - __main__ - Step 22672: {'lr': 0.0001999097721895472, 'samples': 725504, 'steps': 1416, 'loss/train': 2.75874662399292} -09/20/2021 19:23:51 - INFO - __main__ - Step 22673: {'lr': 0.00019990950107264877, 'samples': 725536, 'steps': 1417, 'loss/train': 3.26900315284729} -09/20/2021 19:23:51 - INFO - __main__ - Step 22674: {'lr': 0.00019990950107264877, 'samples': 725568, 'steps': 1417, 'loss/train': 3.434147834777832} -09/20/2021 19:23:52 - INFO - __main__ - Step 22675: {'lr': 0.00019990950107264877, 'samples': 725600, 'steps': 1417, 'loss/train': 2.5249648094177246} -09/20/2021 19:23:53 - INFO - __main__ - Step 22676: {'lr': 0.00019990950107264877, 'samples': 725632, 'steps': 1417, 'loss/train': 2.312748908996582} -09/20/2021 19:23:54 - INFO - __main__ - Step 22677: {'lr': 0.00019990950107264877, 'samples': 725664, 'steps': 1417, 'loss/train': 3.527202606201172} -09/20/2021 19:23:54 - INFO - __main__ - Step 22678: {'lr': 0.00019990950107264877, 'samples': 725696, 'steps': 1417, 'loss/train': 2.6590991020202637} -09/20/2021 19:23:55 - INFO - __main__ - Step 22679: {'lr': 0.00019990950107264877, 'samples': 725728, 'steps': 1417, 'loss/train': 3.8556675910949707} -09/20/2021 19:23:56 - INFO - __main__ - Step 22680: {'lr': 0.00019990950107264877, 'samples': 725760, 'steps': 1417, 'loss/train': 2.5549986362457275} -09/20/2021 19:23:57 - INFO - __main__ - Step 22681: {'lr': 0.00019990950107264877, 'samples': 725792, 'steps': 1417, 'loss/train': 3.4714174270629883} -09/20/2021 19:23:57 - INFO - __main__ - Step 22682: {'lr': 0.00019990950107264877, 'samples': 725824, 'steps': 1417, 'loss/train': 3.4472243785858154} -09/20/2021 19:23:58 - INFO - __main__ - Step 22683: {'lr': 0.00019990950107264877, 'samples': 725856, 'steps': 1417, 'loss/train': 2.413132429122925} -09/20/2021 19:23:59 - INFO - __main__ - Step 22684: {'lr': 0.00019990950107264877, 'samples': 725888, 'steps': 1417, 'loss/train': 4.323746204376221} -09/20/2021 19:24:00 - INFO - __main__ - Step 22685: {'lr': 0.00019990950107264877, 'samples': 725920, 'steps': 1417, 'loss/train': 4.307604789733887} -09/20/2021 19:24:00 - INFO - __main__ - Step 22686: {'lr': 0.00019990950107264877, 'samples': 725952, 'steps': 1417, 'loss/train': 4.21397590637207} -09/20/2021 19:24:01 - INFO - __main__ - Step 22687: {'lr': 0.00019990950107264877, 'samples': 725984, 'steps': 1417, 'loss/train': 4.232447624206543} -09/20/2021 19:24:02 - INFO - __main__ - Step 22688: {'lr': 0.00019990950107264877, 'samples': 726016, 'steps': 1417, 'loss/train': 4.371649742126465} -09/20/2021 19:24:03 - INFO - __main__ - Step 22689: {'lr': 0.000199909229549219, 'samples': 726048, 'steps': 1418, 'loss/train': 4.008472919464111} -09/20/2021 19:24:03 - INFO - __main__ - Step 22690: {'lr': 0.000199909229549219, 'samples': 726080, 'steps': 1418, 'loss/train': 3.761671781539917} -09/20/2021 19:24:04 - INFO - __main__ - Step 22691: {'lr': 0.000199909229549219, 'samples': 726112, 'steps': 1418, 'loss/train': 4.050673007965088} -09/20/2021 19:24:05 - INFO - __main__ - Step 22692: {'lr': 0.000199909229549219, 'samples': 726144, 'steps': 1418, 'loss/train': 3.917475461959839} -09/20/2021 19:24:06 - INFO - __main__ - Step 22693: {'lr': 0.000199909229549219, 'samples': 726176, 'steps': 1418, 'loss/train': 3.3365297317504883} -09/20/2021 19:24:06 - INFO - __main__ - Step 22694: {'lr': 0.000199909229549219, 'samples': 726208, 'steps': 1418, 'loss/train': 2.707909107208252} -09/20/2021 19:24:07 - INFO - __main__ - Step 22695: {'lr': 0.000199909229549219, 'samples': 726240, 'steps': 1418, 'loss/train': 2.989553928375244} -09/20/2021 19:24:08 - INFO - __main__ - Step 22696: {'lr': 0.000199909229549219, 'samples': 726272, 'steps': 1418, 'loss/train': 3.2006592750549316} -09/20/2021 19:24:09 - INFO - __main__ - Step 22697: {'lr': 0.000199909229549219, 'samples': 726304, 'steps': 1418, 'loss/train': 1.3508820533752441} -09/20/2021 19:24:09 - INFO - __main__ - Step 22698: {'lr': 0.000199909229549219, 'samples': 726336, 'steps': 1418, 'loss/train': 4.224271297454834} -09/20/2021 19:24:10 - INFO - __main__ - Step 22699: {'lr': 0.000199909229549219, 'samples': 726368, 'steps': 1418, 'loss/train': 3.052556037902832} -09/20/2021 19:24:11 - INFO - __main__ - Step 22700: {'lr': 0.000199909229549219, 'samples': 726400, 'steps': 1418, 'loss/train': 3.7158336639404297} -09/20/2021 19:24:12 - INFO - __main__ - Step 22701: {'lr': 0.000199909229549219, 'samples': 726432, 'steps': 1418, 'loss/train': 2.9562673568725586} -09/20/2021 19:24:12 - INFO - __main__ - Step 22702: {'lr': 0.000199909229549219, 'samples': 726464, 'steps': 1418, 'loss/train': 4.076417922973633} -09/20/2021 19:24:13 - INFO - __main__ - Step 22703: {'lr': 0.000199909229549219, 'samples': 726496, 'steps': 1418, 'loss/train': 3.6921660900115967} -09/20/2021 19:24:14 - INFO - __main__ - Step 22704: {'lr': 0.000199909229549219, 'samples': 726528, 'steps': 1418, 'loss/train': 1.1442108154296875} -09/20/2021 19:24:15 - INFO - __main__ - Step 22705: {'lr': 0.00019990895761925895, 'samples': 726560, 'steps': 1419, 'loss/train': 3.6977622509002686} -09/20/2021 19:24:16 - INFO - __main__ - Step 22706: {'lr': 0.00019990895761925895, 'samples': 726592, 'steps': 1419, 'loss/train': 2.714298725128174} -09/20/2021 19:24:16 - INFO - __main__ - Step 22707: {'lr': 0.00019990895761925895, 'samples': 726624, 'steps': 1419, 'loss/train': 2.103123426437378} -09/20/2021 19:24:17 - INFO - __main__ - Step 22708: {'lr': 0.00019990895761925895, 'samples': 726656, 'steps': 1419, 'loss/train': 2.501776695251465} -09/20/2021 19:24:19 - INFO - __main__ - Step 22709: {'lr': 0.00019990895761925895, 'samples': 726688, 'steps': 1419, 'loss/train': 3.5178427696228027} -09/20/2021 19:24:19 - INFO - __main__ - Step 22710: {'lr': 0.00019990895761925895, 'samples': 726720, 'steps': 1419, 'loss/train': 3.936079263687134} -09/20/2021 19:24:20 - INFO - __main__ - Step 22711: {'lr': 0.00019990895761925895, 'samples': 726752, 'steps': 1419, 'loss/train': 3.3983349800109863} -09/20/2021 19:24:21 - INFO - __main__ - Step 22712: {'lr': 0.00019990895761925895, 'samples': 726784, 'steps': 1419, 'loss/train': 3.2576828002929688} -09/20/2021 19:24:22 - INFO - __main__ - Step 22713: {'lr': 0.00019990895761925895, 'samples': 726816, 'steps': 1419, 'loss/train': 2.5015125274658203} -09/20/2021 19:24:22 - INFO - __main__ - Step 22714: {'lr': 0.00019990895761925895, 'samples': 726848, 'steps': 1419, 'loss/train': 3.964223861694336} -09/20/2021 19:24:23 - INFO - __main__ - Step 22715: {'lr': 0.00019990895761925895, 'samples': 726880, 'steps': 1419, 'loss/train': 3.792328119277954} -09/20/2021 19:24:24 - INFO - __main__ - Step 22716: {'lr': 0.00019990895761925895, 'samples': 726912, 'steps': 1419, 'loss/train': 3.169839859008789} -09/20/2021 19:24:25 - INFO - __main__ - Step 22717: {'lr': 0.00019990895761925895, 'samples': 726944, 'steps': 1419, 'loss/train': 1.923454761505127} -09/20/2021 19:24:25 - INFO - __main__ - Step 22718: {'lr': 0.00019990895761925895, 'samples': 726976, 'steps': 1419, 'loss/train': 3.923232316970825} -09/20/2021 19:24:26 - INFO - __main__ - Step 22719: {'lr': 0.00019990895761925895, 'samples': 727008, 'steps': 1419, 'loss/train': 3.0033915042877197} -09/20/2021 19:24:27 - INFO - __main__ - Step 22720: {'lr': 0.00019990895761925895, 'samples': 727040, 'steps': 1419, 'loss/train': 3.052887439727783} -09/20/2021 19:24:28 - INFO - __main__ - Step 22721: {'lr': 0.00019990868528276976, 'samples': 727072, 'steps': 1420, 'loss/train': 3.1777117252349854} -09/20/2021 19:24:29 - INFO - __main__ - Step 22722: {'lr': 0.00019990868528276976, 'samples': 727104, 'steps': 1420, 'loss/train': 3.4120869636535645} -09/20/2021 19:24:29 - INFO - __main__ - Step 22723: {'lr': 0.00019990868528276976, 'samples': 727136, 'steps': 1420, 'loss/train': 2.5050055980682373} -09/20/2021 19:24:30 - INFO - __main__ - Step 22724: {'lr': 0.00019990868528276976, 'samples': 727168, 'steps': 1420, 'loss/train': 4.133420944213867} -09/20/2021 19:24:31 - INFO - __main__ - Step 22725: {'lr': 0.00019990868528276976, 'samples': 727200, 'steps': 1420, 'loss/train': 2.9155492782592773} -09/20/2021 19:24:32 - INFO - __main__ - Step 22726: {'lr': 0.00019990868528276976, 'samples': 727232, 'steps': 1420, 'loss/train': 3.3883790969848633} -09/20/2021 19:24:32 - INFO - __main__ - Step 22727: {'lr': 0.00019990868528276976, 'samples': 727264, 'steps': 1420, 'loss/train': 2.4677634239196777} -09/20/2021 19:24:33 - INFO - __main__ - Step 22728: {'lr': 0.00019990868528276976, 'samples': 727296, 'steps': 1420, 'loss/train': 2.964913845062256} -09/20/2021 19:24:34 - INFO - __main__ - Step 22729: {'lr': 0.00019990868528276976, 'samples': 727328, 'steps': 1420, 'loss/train': 2.3679006099700928} -09/20/2021 19:24:35 - INFO - __main__ - Step 22730: {'lr': 0.00019990868528276976, 'samples': 727360, 'steps': 1420, 'loss/train': 0.598712146282196} -09/20/2021 19:24:35 - INFO - __main__ - Step 22731: {'lr': 0.00019990868528276976, 'samples': 727392, 'steps': 1420, 'loss/train': 0.46647563576698303} -09/20/2021 19:24:36 - INFO - __main__ - Step 22732: {'lr': 0.00019990868528276976, 'samples': 727424, 'steps': 1420, 'loss/train': 0.6509757041931152} -09/20/2021 19:24:37 - INFO - __main__ - Step 22733: {'lr': 0.00019990868528276976, 'samples': 727456, 'steps': 1420, 'loss/train': 2.2380001544952393} -09/20/2021 19:24:38 - INFO - __main__ - Step 22734: {'lr': 0.00019990868528276976, 'samples': 727488, 'steps': 1420, 'loss/train': 2.479313611984253} -09/20/2021 19:24:38 - INFO - __main__ - Step 22735: {'lr': 0.00019990868528276976, 'samples': 727520, 'steps': 1420, 'loss/train': 2.732654333114624} -09/20/2021 19:24:39 - INFO - __main__ - Step 22736: {'lr': 0.00019990868528276976, 'samples': 727552, 'steps': 1420, 'loss/train': 3.083181381225586} -09/20/2021 19:24:40 - INFO - __main__ - Step 22737: {'lr': 0.0001999084125397525, 'samples': 727584, 'steps': 1421, 'loss/train': 2.873774528503418} -09/20/2021 19:24:41 - INFO - __main__ - Step 22738: {'lr': 0.0001999084125397525, 'samples': 727616, 'steps': 1421, 'loss/train': 2.9773685932159424} -09/20/2021 19:24:41 - INFO - __main__ - Step 22739: {'lr': 0.0001999084125397525, 'samples': 727648, 'steps': 1421, 'loss/train': 1.8004333972930908} -09/20/2021 19:24:42 - INFO - __main__ - Step 22740: {'lr': 0.0001999084125397525, 'samples': 727680, 'steps': 1421, 'loss/train': 2.226778507232666} -09/20/2021 19:24:43 - INFO - __main__ - Step 22741: {'lr': 0.0001999084125397525, 'samples': 727712, 'steps': 1421, 'loss/train': 2.11639142036438} -09/20/2021 19:24:44 - INFO - __main__ - Step 22742: {'lr': 0.0001999084125397525, 'samples': 727744, 'steps': 1421, 'loss/train': 2.2809784412384033} -09/20/2021 19:24:45 - INFO - __main__ - Step 22743: {'lr': 0.0001999084125397525, 'samples': 727776, 'steps': 1421, 'loss/train': 1.9330703020095825} -09/20/2021 19:24:46 - INFO - __main__ - Step 22744: {'lr': 0.0001999084125397525, 'samples': 727808, 'steps': 1421, 'loss/train': 2.811645269393921} -09/20/2021 19:24:46 - INFO - __main__ - Step 22745: {'lr': 0.0001999084125397525, 'samples': 727840, 'steps': 1421, 'loss/train': 3.264679431915283} -09/20/2021 19:24:47 - INFO - __main__ - Step 22746: {'lr': 0.0001999084125397525, 'samples': 727872, 'steps': 1421, 'loss/train': 3.331845760345459} -09/20/2021 19:24:48 - INFO - __main__ - Step 22747: {'lr': 0.0001999084125397525, 'samples': 727904, 'steps': 1421, 'loss/train': 1.5384771823883057} -09/20/2021 19:24:49 - INFO - __main__ - Step 22748: {'lr': 0.0001999084125397525, 'samples': 727936, 'steps': 1421, 'loss/train': 3.2198004722595215} -09/20/2021 19:24:49 - INFO - __main__ - Step 22749: {'lr': 0.0001999084125397525, 'samples': 727968, 'steps': 1421, 'loss/train': 0.8631383776664734} -09/20/2021 19:24:50 - INFO - __main__ - Step 22750: {'lr': 0.0001999084125397525, 'samples': 728000, 'steps': 1421, 'loss/train': 3.084310531616211} -09/20/2021 19:24:51 - INFO - __main__ - Step 22751: {'lr': 0.0001999084125397525, 'samples': 728032, 'steps': 1421, 'loss/train': 2.332120895385742} -09/20/2021 19:24:52 - INFO - __main__ - Step 22752: {'lr': 0.0001999084125397525, 'samples': 728064, 'steps': 1421, 'loss/train': 3.318918466567993} -09/20/2021 19:24:53 - INFO - __main__ - Step 22753: {'lr': 0.0001999081393902083, 'samples': 728096, 'steps': 1422, 'loss/train': 2.59275484085083} -09/20/2021 19:24:53 - INFO - __main__ - Step 22754: {'lr': 0.0001999081393902083, 'samples': 728128, 'steps': 1422, 'loss/train': 3.5610744953155518} -09/20/2021 19:24:54 - INFO - __main__ - Step 22755: {'lr': 0.0001999081393902083, 'samples': 728160, 'steps': 1422, 'loss/train': 3.818338632583618} -09/20/2021 19:24:55 - INFO - __main__ - Step 22756: {'lr': 0.0001999081393902083, 'samples': 728192, 'steps': 1422, 'loss/train': 3.5913987159729004} -09/20/2021 19:24:56 - INFO - __main__ - Step 22757: {'lr': 0.0001999081393902083, 'samples': 728224, 'steps': 1422, 'loss/train': 3.541344404220581} -09/20/2021 19:24:56 - INFO - __main__ - Step 22758: {'lr': 0.0001999081393902083, 'samples': 728256, 'steps': 1422, 'loss/train': 1.026831030845642} -09/20/2021 19:24:57 - INFO - __main__ - Step 22759: {'lr': 0.0001999081393902083, 'samples': 728288, 'steps': 1422, 'loss/train': 2.424572229385376} -09/20/2021 19:24:58 - INFO - __main__ - Step 22760: {'lr': 0.0001999081393902083, 'samples': 728320, 'steps': 1422, 'loss/train': 0.37962567806243896} -09/20/2021 19:24:59 - INFO - __main__ - Step 22761: {'lr': 0.0001999081393902083, 'samples': 728352, 'steps': 1422, 'loss/train': 2.981395721435547} -09/20/2021 19:24:59 - INFO - __main__ - Step 22762: {'lr': 0.0001999081393902083, 'samples': 728384, 'steps': 1422, 'loss/train': 3.180026054382324} -09/20/2021 19:25:00 - INFO - __main__ - Step 22763: {'lr': 0.0001999081393902083, 'samples': 728416, 'steps': 1422, 'loss/train': 2.268673896789551} -09/20/2021 19:25:01 - INFO - __main__ - Step 22764: {'lr': 0.0001999081393902083, 'samples': 728448, 'steps': 1422, 'loss/train': 2.870027780532837} -09/20/2021 19:25:02 - INFO - __main__ - Step 22765: {'lr': 0.0001999081393902083, 'samples': 728480, 'steps': 1422, 'loss/train': 7.943624019622803} -09/20/2021 19:25:02 - INFO - __main__ - Step 22766: {'lr': 0.0001999081393902083, 'samples': 728512, 'steps': 1422, 'loss/train': 6.416791915893555} -09/20/2021 19:25:03 - INFO - __main__ - Step 22767: {'lr': 0.0001999081393902083, 'samples': 728544, 'steps': 1422, 'loss/train': 3.637925148010254} -09/20/2021 19:25:04 - INFO - __main__ - Step 22768: {'lr': 0.0001999081393902083, 'samples': 728576, 'steps': 1422, 'loss/train': 3.0575053691864014} -09/20/2021 19:25:05 - INFO - __main__ - Step 22769: {'lr': 0.00019990786583413828, 'samples': 728608, 'steps': 1423, 'loss/train': 2.57673716545105} -09/20/2021 19:25:05 - INFO - __main__ - Step 22770: {'lr': 0.00019990786583413828, 'samples': 728640, 'steps': 1423, 'loss/train': 3.1783204078674316} -09/20/2021 19:25:06 - INFO - __main__ - Step 22771: {'lr': 0.00019990786583413828, 'samples': 728672, 'steps': 1423, 'loss/train': 3.0134217739105225} -09/20/2021 19:25:07 - INFO - __main__ - Step 22772: {'lr': 0.00019990786583413828, 'samples': 728704, 'steps': 1423, 'loss/train': 3.2127766609191895} -09/20/2021 19:25:08 - INFO - __main__ - Step 22773: {'lr': 0.00019990786583413828, 'samples': 728736, 'steps': 1423, 'loss/train': 2.018064260482788} -09/20/2021 19:25:08 - INFO - __main__ - Step 22774: {'lr': 0.00019990786583413828, 'samples': 728768, 'steps': 1423, 'loss/train': 3.1244568824768066} -09/20/2021 19:25:10 - INFO - __main__ - Step 22775: {'lr': 0.00019990786583413828, 'samples': 728800, 'steps': 1423, 'loss/train': 3.506722927093506} -09/20/2021 19:25:11 - INFO - __main__ - Step 22776: {'lr': 0.00019990786583413828, 'samples': 728832, 'steps': 1423, 'loss/train': 3.588710069656372} -09/20/2021 19:25:11 - INFO - __main__ - Step 22777: {'lr': 0.00019990786583413828, 'samples': 728864, 'steps': 1423, 'loss/train': 2.6445231437683105} -09/20/2021 19:25:12 - INFO - __main__ - Step 22778: {'lr': 0.00019990786583413828, 'samples': 728896, 'steps': 1423, 'loss/train': 3.6278138160705566} -09/20/2021 19:25:13 - INFO - __main__ - Step 22779: {'lr': 0.00019990786583413828, 'samples': 728928, 'steps': 1423, 'loss/train': 3.6130499839782715} -09/20/2021 19:25:14 - INFO - __main__ - Step 22780: {'lr': 0.00019990786583413828, 'samples': 728960, 'steps': 1423, 'loss/train': 2.9311962127685547} -09/20/2021 19:25:14 - INFO - __main__ - Step 22781: {'lr': 0.00019990786583413828, 'samples': 728992, 'steps': 1423, 'loss/train': 2.843334674835205} -09/20/2021 19:25:15 - INFO - __main__ - Step 22782: {'lr': 0.00019990786583413828, 'samples': 729024, 'steps': 1423, 'loss/train': 3.339916229248047} -09/20/2021 19:25:16 - INFO - __main__ - Step 22783: {'lr': 0.00019990786583413828, 'samples': 729056, 'steps': 1423, 'loss/train': 4.115602493286133} -09/20/2021 19:25:17 - INFO - __main__ - Step 22784: {'lr': 0.00019990786583413828, 'samples': 729088, 'steps': 1423, 'loss/train': 3.398280143737793} -09/20/2021 19:25:17 - INFO - __main__ - Step 22785: {'lr': 0.0001999075918715435, 'samples': 729120, 'steps': 1424, 'loss/train': 3.2649362087249756} -09/20/2021 19:25:18 - INFO - __main__ - Step 22786: {'lr': 0.0001999075918715435, 'samples': 729152, 'steps': 1424, 'loss/train': 2.4460690021514893} -09/20/2021 19:25:19 - INFO - __main__ - Step 22787: {'lr': 0.0001999075918715435, 'samples': 729184, 'steps': 1424, 'loss/train': 3.777916431427002} -09/20/2021 19:25:20 - INFO - __main__ - Step 22788: {'lr': 0.0001999075918715435, 'samples': 729216, 'steps': 1424, 'loss/train': 2.2381131649017334} -09/20/2021 19:25:20 - INFO - __main__ - Step 22789: {'lr': 0.0001999075918715435, 'samples': 729248, 'steps': 1424, 'loss/train': 3.1944708824157715} -09/20/2021 19:25:21 - INFO - __main__ - Step 22790: {'lr': 0.0001999075918715435, 'samples': 729280, 'steps': 1424, 'loss/train': 3.4826626777648926} -09/20/2021 19:25:22 - INFO - __main__ - Step 22791: {'lr': 0.0001999075918715435, 'samples': 729312, 'steps': 1424, 'loss/train': 2.6647839546203613} -09/20/2021 19:25:23 - INFO - __main__ - Step 22792: {'lr': 0.0001999075918715435, 'samples': 729344, 'steps': 1424, 'loss/train': 3.033972978591919} -09/20/2021 19:25:23 - INFO - __main__ - Step 22793: {'lr': 0.0001999075918715435, 'samples': 729376, 'steps': 1424, 'loss/train': 4.0841064453125} -09/20/2021 19:25:24 - INFO - __main__ - Step 22794: {'lr': 0.0001999075918715435, 'samples': 729408, 'steps': 1424, 'loss/train': 3.5469143390655518} -09/20/2021 19:25:25 - INFO - __main__ - Step 22795: {'lr': 0.0001999075918715435, 'samples': 729440, 'steps': 1424, 'loss/train': 3.3407089710235596} -09/20/2021 19:25:26 - INFO - __main__ - Step 22796: {'lr': 0.0001999075918715435, 'samples': 729472, 'steps': 1424, 'loss/train': 2.7338531017303467} -09/20/2021 19:25:26 - INFO - __main__ - Step 22797: {'lr': 0.0001999075918715435, 'samples': 729504, 'steps': 1424, 'loss/train': 5.134641647338867} -09/20/2021 19:25:27 - INFO - __main__ - Step 22798: {'lr': 0.0001999075918715435, 'samples': 729536, 'steps': 1424, 'loss/train': 0.4764484167098999} -09/20/2021 19:25:28 - INFO - __main__ - Step 22799: {'lr': 0.0001999075918715435, 'samples': 729568, 'steps': 1424, 'loss/train': 0.689857006072998} -09/20/2021 19:25:29 - INFO - __main__ - Step 22800: {'lr': 0.0001999075918715435, 'samples': 729600, 'steps': 1424, 'loss/train': 1.5283852815628052} -09/20/2021 19:25:30 - INFO - __main__ - Step 22801: {'lr': 0.00019990731750242516, 'samples': 729632, 'steps': 1425, 'loss/train': 2.7531349658966064} -09/20/2021 19:25:30 - INFO - __main__ - Step 22802: {'lr': 0.00019990731750242516, 'samples': 729664, 'steps': 1425, 'loss/train': 3.7535817623138428} -09/20/2021 19:25:31 - INFO - __main__ - Step 22803: {'lr': 0.00019990731750242516, 'samples': 729696, 'steps': 1425, 'loss/train': 4.495723247528076} -09/20/2021 19:25:32 - INFO - __main__ - Step 22804: {'lr': 0.00019990731750242516, 'samples': 729728, 'steps': 1425, 'loss/train': 4.086474895477295} -09/20/2021 19:25:34 - INFO - __main__ - Step 22805: {'lr': 0.00019990731750242516, 'samples': 729760, 'steps': 1425, 'loss/train': 3.4738059043884277} -09/20/2021 19:25:34 - INFO - __main__ - Step 22806: {'lr': 0.00019990731750242516, 'samples': 729792, 'steps': 1425, 'loss/train': 2.2093420028686523} -09/20/2021 19:25:35 - INFO - __main__ - Step 22807: {'lr': 0.00019990731750242516, 'samples': 729824, 'steps': 1425, 'loss/train': 3.50700044631958} -09/20/2021 19:25:36 - INFO - __main__ - Step 22808: {'lr': 0.00019990731750242516, 'samples': 729856, 'steps': 1425, 'loss/train': 3.864879608154297} -09/20/2021 19:25:37 - INFO - __main__ - Step 22809: {'lr': 0.00019990731750242516, 'samples': 729888, 'steps': 1425, 'loss/train': 2.6201953887939453} -09/20/2021 19:25:37 - INFO - __main__ - Step 22810: {'lr': 0.00019990731750242516, 'samples': 729920, 'steps': 1425, 'loss/train': 3.008115768432617} -09/20/2021 19:25:38 - INFO - __main__ - Step 22811: {'lr': 0.00019990731750242516, 'samples': 729952, 'steps': 1425, 'loss/train': 2.5622217655181885} -09/20/2021 19:25:39 - INFO - __main__ - Step 22812: {'lr': 0.00019990731750242516, 'samples': 729984, 'steps': 1425, 'loss/train': 2.8679141998291016} -09/20/2021 19:25:40 - INFO - __main__ - Step 22813: {'lr': 0.00019990731750242516, 'samples': 730016, 'steps': 1425, 'loss/train': 2.6001980304718018} -09/20/2021 19:25:40 - INFO - __main__ - Step 22814: {'lr': 0.00019990731750242516, 'samples': 730048, 'steps': 1425, 'loss/train': 3.3267972469329834} -09/20/2021 19:25:41 - INFO - __main__ - Step 22815: {'lr': 0.00019990731750242516, 'samples': 730080, 'steps': 1425, 'loss/train': 3.231520175933838} -09/20/2021 19:25:42 - INFO - __main__ - Step 22816: {'lr': 0.00019990731750242516, 'samples': 730112, 'steps': 1425, 'loss/train': 3.5453147888183594} -09/20/2021 19:25:43 - INFO - __main__ - Step 22817: {'lr': 0.0001999070427267843, 'samples': 730144, 'steps': 1426, 'loss/train': 1.8341940641403198} -09/20/2021 19:25:44 - INFO - __main__ - Step 22818: {'lr': 0.0001999070427267843, 'samples': 730176, 'steps': 1426, 'loss/train': 3.340596914291382} -09/20/2021 19:25:44 - INFO - __main__ - Step 22819: {'lr': 0.0001999070427267843, 'samples': 730208, 'steps': 1426, 'loss/train': 3.01017427444458} -09/20/2021 19:25:45 - INFO - __main__ - Step 22820: {'lr': 0.0001999070427267843, 'samples': 730240, 'steps': 1426, 'loss/train': 3.3160386085510254} -09/20/2021 19:25:46 - INFO - __main__ - Step 22821: {'lr': 0.0001999070427267843, 'samples': 730272, 'steps': 1426, 'loss/train': 2.8036930561065674} -09/20/2021 19:25:47 - INFO - __main__ - Step 22822: {'lr': 0.0001999070427267843, 'samples': 730304, 'steps': 1426, 'loss/train': 0.49478235840797424} -09/20/2021 19:25:47 - INFO - __main__ - Step 22823: {'lr': 0.0001999070427267843, 'samples': 730336, 'steps': 1426, 'loss/train': 0.7395066022872925} -09/20/2021 19:25:48 - INFO - __main__ - Step 22824: {'lr': 0.0001999070427267843, 'samples': 730368, 'steps': 1426, 'loss/train': 0.732288122177124} -09/20/2021 19:25:49 - INFO - __main__ - Step 22825: {'lr': 0.0001999070427267843, 'samples': 730400, 'steps': 1426, 'loss/train': 3.6300716400146484} -09/20/2021 19:25:50 - INFO - __main__ - Step 22826: {'lr': 0.0001999070427267843, 'samples': 730432, 'steps': 1426, 'loss/train': 2.817610740661621} -09/20/2021 19:25:50 - INFO - __main__ - Step 22827: {'lr': 0.0001999070427267843, 'samples': 730464, 'steps': 1426, 'loss/train': 4.0602898597717285} -09/20/2021 19:25:51 - INFO - __main__ - Step 22828: {'lr': 0.0001999070427267843, 'samples': 730496, 'steps': 1426, 'loss/train': 3.888535499572754} -09/20/2021 19:25:52 - INFO - __main__ - Step 22829: {'lr': 0.0001999070427267843, 'samples': 730528, 'steps': 1426, 'loss/train': 2.9611997604370117} -09/20/2021 19:25:53 - INFO - __main__ - Step 22830: {'lr': 0.0001999070427267843, 'samples': 730560, 'steps': 1426, 'loss/train': 3.0163822174072266} -09/20/2021 19:25:53 - INFO - __main__ - Step 22831: {'lr': 0.0001999070427267843, 'samples': 730592, 'steps': 1426, 'loss/train': 2.6640262603759766} -09/20/2021 19:25:54 - INFO - __main__ - Step 22832: {'lr': 0.0001999070427267843, 'samples': 730624, 'steps': 1426, 'loss/train': 2.5689175128936768} -09/20/2021 19:25:55 - INFO - __main__ - Step 22833: {'lr': 0.0001999067675446221, 'samples': 730656, 'steps': 1427, 'loss/train': 3.086214542388916} -09/20/2021 19:25:56 - INFO - __main__ - Step 22834: {'lr': 0.0001999067675446221, 'samples': 730688, 'steps': 1427, 'loss/train': 2.929093599319458} -09/20/2021 19:25:56 - INFO - __main__ - Step 22835: {'lr': 0.0001999067675446221, 'samples': 730720, 'steps': 1427, 'loss/train': 3.2263922691345215} -09/20/2021 19:25:57 - INFO - __main__ - Step 22836: {'lr': 0.0001999067675446221, 'samples': 730752, 'steps': 1427, 'loss/train': 0.5175871253013611} -09/20/2021 19:25:58 - INFO - __main__ - Step 22837: {'lr': 0.0001999067675446221, 'samples': 730784, 'steps': 1427, 'loss/train': 0.4960515797138214} -09/20/2021 19:25:59 - INFO - __main__ - Step 22838: {'lr': 0.0001999067675446221, 'samples': 730816, 'steps': 1427, 'loss/train': 0.927929162979126} -09/20/2021 19:25:59 - INFO - __main__ - Step 22839: {'lr': 0.0001999067675446221, 'samples': 730848, 'steps': 1427, 'loss/train': 0.41925013065338135} -09/20/2021 19:26:00 - INFO - __main__ - Step 22840: {'lr': 0.0001999067675446221, 'samples': 730880, 'steps': 1427, 'loss/train': 0.7568055391311646} -09/20/2021 19:26:01 - INFO - __main__ - Step 22841: {'lr': 0.0001999067675446221, 'samples': 730912, 'steps': 1427, 'loss/train': 1.8443882465362549} -09/20/2021 19:26:02 - INFO - __main__ - Step 22842: {'lr': 0.0001999067675446221, 'samples': 730944, 'steps': 1427, 'loss/train': 1.710557460784912} -09/20/2021 19:26:03 - INFO - __main__ - Step 22843: {'lr': 0.0001999067675446221, 'samples': 730976, 'steps': 1427, 'loss/train': 3.691995143890381} -09/20/2021 19:26:04 - INFO - __main__ - Step 22844: {'lr': 0.0001999067675446221, 'samples': 731008, 'steps': 1427, 'loss/train': 3.1483616828918457} -09/20/2021 19:26:05 - INFO - __main__ - Step 22845: {'lr': 0.0001999067675446221, 'samples': 731040, 'steps': 1427, 'loss/train': 3.223358631134033} -09/20/2021 19:26:05 - INFO - __main__ - Step 22846: {'lr': 0.0001999067675446221, 'samples': 731072, 'steps': 1427, 'loss/train': 1.7428406476974487} -09/20/2021 19:26:06 - INFO - __main__ - Step 22847: {'lr': 0.0001999067675446221, 'samples': 731104, 'steps': 1427, 'loss/train': 2.6377832889556885} -09/20/2021 19:26:07 - INFO - __main__ - Step 22848: {'lr': 0.0001999067675446221, 'samples': 731136, 'steps': 1427, 'loss/train': 3.0375783443450928} -09/20/2021 19:26:08 - INFO - __main__ - Step 22849: {'lr': 0.00019990649195593963, 'samples': 731168, 'steps': 1428, 'loss/train': 3.844393491744995} -09/20/2021 19:26:08 - INFO - __main__ - Step 22850: {'lr': 0.00019990649195593963, 'samples': 731200, 'steps': 1428, 'loss/train': 3.317448377609253} -09/20/2021 19:26:09 - INFO - __main__ - Step 22851: {'lr': 0.00019990649195593963, 'samples': 731232, 'steps': 1428, 'loss/train': 2.7049062252044678} -09/20/2021 19:26:10 - INFO - __main__ - Step 22852: {'lr': 0.00019990649195593963, 'samples': 731264, 'steps': 1428, 'loss/train': 2.9678139686584473} -09/20/2021 19:26:11 - INFO - __main__ - Step 22853: {'lr': 0.00019990649195593963, 'samples': 731296, 'steps': 1428, 'loss/train': 4.7176361083984375} -09/20/2021 19:26:11 - INFO - __main__ - Step 22854: {'lr': 0.00019990649195593963, 'samples': 731328, 'steps': 1428, 'loss/train': 3.379399061203003} -09/20/2021 19:26:12 - INFO - __main__ - Step 22855: {'lr': 0.00019990649195593963, 'samples': 731360, 'steps': 1428, 'loss/train': 4.638082027435303} -09/20/2021 19:26:13 - INFO - __main__ - Step 22856: {'lr': 0.00019990649195593963, 'samples': 731392, 'steps': 1428, 'loss/train': 3.2030060291290283} -09/20/2021 19:26:14 - INFO - __main__ - Step 22857: {'lr': 0.00019990649195593963, 'samples': 731424, 'steps': 1428, 'loss/train': 2.9744205474853516} -09/20/2021 19:26:14 - INFO - __main__ - Step 22858: {'lr': 0.00019990649195593963, 'samples': 731456, 'steps': 1428, 'loss/train': 3.276611566543579} -09/20/2021 19:26:15 - INFO - __main__ - Step 22859: {'lr': 0.00019990649195593963, 'samples': 731488, 'steps': 1428, 'loss/train': 3.6173746585845947} -09/20/2021 19:26:16 - INFO - __main__ - Step 22860: {'lr': 0.00019990649195593963, 'samples': 731520, 'steps': 1428, 'loss/train': 3.522120237350464} -09/20/2021 19:26:17 - INFO - __main__ - Step 22861: {'lr': 0.00019990649195593963, 'samples': 731552, 'steps': 1428, 'loss/train': 3.2603437900543213} -09/20/2021 19:26:17 - INFO - __main__ - Step 22862: {'lr': 0.00019990649195593963, 'samples': 731584, 'steps': 1428, 'loss/train': 3.9021413326263428} -09/20/2021 19:26:18 - INFO - __main__ - Step 22863: {'lr': 0.00019990649195593963, 'samples': 731616, 'steps': 1428, 'loss/train': 3.231909990310669} -09/20/2021 19:26:19 - INFO - __main__ - Step 22864: {'lr': 0.00019990649195593963, 'samples': 731648, 'steps': 1428, 'loss/train': 2.866874933242798} -09/20/2021 19:26:20 - INFO - __main__ - Step 22865: {'lr': 0.00019990621596073803, 'samples': 731680, 'steps': 1429, 'loss/train': 0.9003180861473083} -09/20/2021 19:26:21 - INFO - __main__ - Step 22866: {'lr': 0.00019990621596073803, 'samples': 731712, 'steps': 1429, 'loss/train': 3.5715677738189697} -09/20/2021 19:26:21 - INFO - __main__ - Step 22867: {'lr': 0.00019990621596073803, 'samples': 731744, 'steps': 1429, 'loss/train': 2.7629735469818115} -09/20/2021 19:26:22 - INFO - __main__ - Step 22868: {'lr': 0.00019990621596073803, 'samples': 731776, 'steps': 1429, 'loss/train': 2.606642723083496} -09/20/2021 19:26:23 - INFO - __main__ - Step 22869: {'lr': 0.00019990621596073803, 'samples': 731808, 'steps': 1429, 'loss/train': 2.7795450687408447} -09/20/2021 19:26:24 - INFO - __main__ - Step 22870: {'lr': 0.00019990621596073803, 'samples': 731840, 'steps': 1429, 'loss/train': 3.3636367321014404} -09/20/2021 19:26:24 - INFO - __main__ - Step 22871: {'lr': 0.00019990621596073803, 'samples': 731872, 'steps': 1429, 'loss/train': 3.7396352291107178} -09/20/2021 19:26:26 - INFO - __main__ - Step 22872: {'lr': 0.00019990621596073803, 'samples': 731904, 'steps': 1429, 'loss/train': 2.964501142501831} -09/20/2021 19:26:26 - INFO - __main__ - Step 22873: {'lr': 0.00019990621596073803, 'samples': 731936, 'steps': 1429, 'loss/train': 2.5958664417266846} -09/20/2021 19:26:27 - INFO - __main__ - Step 22874: {'lr': 0.00019990621596073803, 'samples': 731968, 'steps': 1429, 'loss/train': 3.283557176589966} -09/20/2021 19:26:28 - INFO - __main__ - Step 22875: {'lr': 0.00019990621596073803, 'samples': 732000, 'steps': 1429, 'loss/train': 2.6211345195770264} -09/20/2021 19:26:29 - INFO - __main__ - Step 22876: {'lr': 0.00019990621596073803, 'samples': 732032, 'steps': 1429, 'loss/train': 1.251619815826416} -09/20/2021 19:26:29 - INFO - __main__ - Step 22877: {'lr': 0.00019990621596073803, 'samples': 732064, 'steps': 1429, 'loss/train': 2.811288595199585} -09/20/2021 19:26:30 - INFO - __main__ - Step 22878: {'lr': 0.00019990621596073803, 'samples': 732096, 'steps': 1429, 'loss/train': 3.296037197113037} -09/20/2021 19:26:31 - INFO - __main__ - Step 22879: {'lr': 0.00019990621596073803, 'samples': 732128, 'steps': 1429, 'loss/train': 1.3800146579742432} -09/20/2021 19:26:32 - INFO - __main__ - Step 22880: {'lr': 0.00019990621596073803, 'samples': 732160, 'steps': 1429, 'loss/train': 3.2520909309387207} -09/20/2021 19:26:32 - INFO - __main__ - Step 22881: {'lr': 0.00019990593955901843, 'samples': 732192, 'steps': 1430, 'loss/train': 3.461794137954712} -09/20/2021 19:26:33 - INFO - __main__ - Step 22882: {'lr': 0.00019990593955901843, 'samples': 732224, 'steps': 1430, 'loss/train': 3.5187482833862305} -09/20/2021 19:26:34 - INFO - __main__ - Step 22883: {'lr': 0.00019990593955901843, 'samples': 732256, 'steps': 1430, 'loss/train': 2.619647741317749} -09/20/2021 19:26:35 - INFO - __main__ - Step 22884: {'lr': 0.00019990593955901843, 'samples': 732288, 'steps': 1430, 'loss/train': 3.7870986461639404} -09/20/2021 19:26:35 - INFO - __main__ - Step 22885: {'lr': 0.00019990593955901843, 'samples': 732320, 'steps': 1430, 'loss/train': 3.061624765396118} -09/20/2021 19:26:36 - INFO - __main__ - Step 22886: {'lr': 0.00019990593955901843, 'samples': 732352, 'steps': 1430, 'loss/train': 3.227224826812744} -09/20/2021 19:26:37 - INFO - __main__ - Step 22887: {'lr': 0.00019990593955901843, 'samples': 732384, 'steps': 1430, 'loss/train': 3.7877016067504883} -09/20/2021 19:26:38 - INFO - __main__ - Step 22888: {'lr': 0.00019990593955901843, 'samples': 732416, 'steps': 1430, 'loss/train': 3.8646342754364014} -09/20/2021 19:26:38 - INFO - __main__ - Step 22889: {'lr': 0.00019990593955901843, 'samples': 732448, 'steps': 1430, 'loss/train': 2.9137868881225586} -09/20/2021 19:26:39 - INFO - __main__ - Step 22890: {'lr': 0.00019990593955901843, 'samples': 732480, 'steps': 1430, 'loss/train': 3.0231215953826904} -09/20/2021 19:26:40 - INFO - __main__ - Step 22891: {'lr': 0.00019990593955901843, 'samples': 732512, 'steps': 1430, 'loss/train': 3.7197277545928955} -09/20/2021 19:26:41 - INFO - __main__ - Step 22892: {'lr': 0.00019990593955901843, 'samples': 732544, 'steps': 1430, 'loss/train': 2.448556900024414} -09/20/2021 19:26:41 - INFO - __main__ - Step 22893: {'lr': 0.00019990593955901843, 'samples': 732576, 'steps': 1430, 'loss/train': 2.965066432952881} -09/20/2021 19:26:42 - INFO - __main__ - Step 22894: {'lr': 0.00019990593955901843, 'samples': 732608, 'steps': 1430, 'loss/train': 3.8001291751861572} -09/20/2021 19:26:43 - INFO - __main__ - Step 22895: {'lr': 0.00019990593955901843, 'samples': 732640, 'steps': 1430, 'loss/train': 3.1731250286102295} -09/20/2021 19:26:44 - INFO - __main__ - Step 22896: {'lr': 0.00019990593955901843, 'samples': 732672, 'steps': 1430, 'loss/train': 3.2815089225769043} -09/20/2021 19:26:45 - INFO - __main__ - Step 22897: {'lr': 0.00019990566275078194, 'samples': 732704, 'steps': 1431, 'loss/train': 3.8304195404052734} -09/20/2021 19:26:45 - INFO - __main__ - Step 22898: {'lr': 0.00019990566275078194, 'samples': 732736, 'steps': 1431, 'loss/train': 3.885429620742798} -09/20/2021 19:26:46 - INFO - __main__ - Step 22899: {'lr': 0.00019990566275078194, 'samples': 732768, 'steps': 1431, 'loss/train': 2.6833336353302} -09/20/2021 19:26:47 - INFO - __main__ - Step 22900: {'lr': 0.00019990566275078194, 'samples': 732800, 'steps': 1431, 'loss/train': 3.2836155891418457} -09/20/2021 19:26:48 - INFO - __main__ - Step 22901: {'lr': 0.00019990566275078194, 'samples': 732832, 'steps': 1431, 'loss/train': 3.638032913208008} -09/20/2021 19:26:48 - INFO - __main__ - Step 22902: {'lr': 0.00019990566275078194, 'samples': 732864, 'steps': 1431, 'loss/train': 3.0517678260803223} -09/20/2021 19:26:50 - INFO - __main__ - Step 22903: {'lr': 0.00019990566275078194, 'samples': 732896, 'steps': 1431, 'loss/train': 2.5818731784820557} -09/20/2021 19:26:50 - INFO - __main__ - Step 22904: {'lr': 0.00019990566275078194, 'samples': 732928, 'steps': 1431, 'loss/train': 2.638385534286499} -09/20/2021 19:26:51 - INFO - __main__ - Step 22905: {'lr': 0.00019990566275078194, 'samples': 732960, 'steps': 1431, 'loss/train': 3.6547019481658936} -09/20/2021 19:26:52 - INFO - __main__ - Step 22906: {'lr': 0.00019990566275078194, 'samples': 732992, 'steps': 1431, 'loss/train': 3.0806496143341064} -09/20/2021 19:26:53 - INFO - __main__ - Step 22907: {'lr': 0.00019990566275078194, 'samples': 733024, 'steps': 1431, 'loss/train': 3.902505874633789} -09/20/2021 19:26:53 - INFO - __main__ - Step 22908: {'lr': 0.00019990566275078194, 'samples': 733056, 'steps': 1431, 'loss/train': 3.0769388675689697} -09/20/2021 19:26:54 - INFO - __main__ - Step 22909: {'lr': 0.00019990566275078194, 'samples': 733088, 'steps': 1431, 'loss/train': 2.554027557373047} -09/20/2021 19:26:55 - INFO - __main__ - Step 22910: {'lr': 0.00019990566275078194, 'samples': 733120, 'steps': 1431, 'loss/train': 3.665426254272461} -09/20/2021 19:26:56 - INFO - __main__ - Step 22911: {'lr': 0.00019990566275078194, 'samples': 733152, 'steps': 1431, 'loss/train': 2.8884384632110596} -09/20/2021 19:26:56 - INFO - __main__ - Step 22912: {'lr': 0.00019990566275078194, 'samples': 733184, 'steps': 1431, 'loss/train': 3.762587547302246} -09/20/2021 19:26:57 - INFO - __main__ - Step 22913: {'lr': 0.00019990538553602973, 'samples': 733216, 'steps': 1432, 'loss/train': 3.283328056335449} -09/20/2021 19:26:58 - INFO - __main__ - Step 22914: {'lr': 0.00019990538553602973, 'samples': 733248, 'steps': 1432, 'loss/train': 2.7227914333343506} -09/20/2021 19:26:59 - INFO - __main__ - Step 22915: {'lr': 0.00019990538553602973, 'samples': 733280, 'steps': 1432, 'loss/train': 3.4523611068725586} -09/20/2021 19:26:59 - INFO - __main__ - Step 22916: {'lr': 0.00019990538553602973, 'samples': 733312, 'steps': 1432, 'loss/train': 3.484604835510254} -09/20/2021 19:27:00 - INFO - __main__ - Step 22917: {'lr': 0.00019990538553602973, 'samples': 733344, 'steps': 1432, 'loss/train': 3.525056838989258} -09/20/2021 19:27:01 - INFO - __main__ - Step 22918: {'lr': 0.00019990538553602973, 'samples': 733376, 'steps': 1432, 'loss/train': 2.8009777069091797} -09/20/2021 19:27:02 - INFO - __main__ - Step 22919: {'lr': 0.00019990538553602973, 'samples': 733408, 'steps': 1432, 'loss/train': 0.44307470321655273} -09/20/2021 19:27:02 - INFO - __main__ - Step 22920: {'lr': 0.00019990538553602973, 'samples': 733440, 'steps': 1432, 'loss/train': 3.163628101348877} -09/20/2021 19:27:03 - INFO - __main__ - Step 22921: {'lr': 0.00019990538553602973, 'samples': 733472, 'steps': 1432, 'loss/train': 0.6892921328544617} -09/20/2021 19:27:04 - INFO - __main__ - Step 22922: {'lr': 0.00019990538553602973, 'samples': 733504, 'steps': 1432, 'loss/train': 4.609671115875244} -09/20/2021 19:27:05 - INFO - __main__ - Step 22923: {'lr': 0.00019990538553602973, 'samples': 733536, 'steps': 1432, 'loss/train': 2.765500068664551} -09/20/2021 19:27:05 - INFO - __main__ - Step 22924: {'lr': 0.00019990538553602973, 'samples': 733568, 'steps': 1432, 'loss/train': 3.9180545806884766} -09/20/2021 19:27:06 - INFO - __main__ - Step 22925: {'lr': 0.00019990538553602973, 'samples': 733600, 'steps': 1432, 'loss/train': 2.8932085037231445} -09/20/2021 19:27:07 - INFO - __main__ - Step 22926: {'lr': 0.00019990538553602973, 'samples': 733632, 'steps': 1432, 'loss/train': 3.124568462371826} -09/20/2021 19:27:08 - INFO - __main__ - Step 22927: {'lr': 0.00019990538553602973, 'samples': 733664, 'steps': 1432, 'loss/train': 2.9129133224487305} -09/20/2021 19:27:08 - INFO - __main__ - Step 22928: {'lr': 0.00019990538553602973, 'samples': 733696, 'steps': 1432, 'loss/train': 3.1140947341918945} -09/20/2021 19:27:09 - INFO - __main__ - Step 22929: {'lr': 0.00019990510791476288, 'samples': 733728, 'steps': 1433, 'loss/train': 3.0255990028381348} -09/20/2021 19:27:10 - INFO - __main__ - Step 22930: {'lr': 0.00019990510791476288, 'samples': 733760, 'steps': 1433, 'loss/train': 3.598005771636963} -09/20/2021 19:27:11 - INFO - __main__ - Step 22931: {'lr': 0.00019990510791476288, 'samples': 733792, 'steps': 1433, 'loss/train': 2.9782605171203613} -09/20/2021 19:27:12 - INFO - __main__ - Step 22932: {'lr': 0.00019990510791476288, 'samples': 733824, 'steps': 1433, 'loss/train': 1.0403021574020386} -09/20/2021 19:27:12 - INFO - __main__ - Step 22933: {'lr': 0.00019990510791476288, 'samples': 733856, 'steps': 1433, 'loss/train': 3.583514451980591} -09/20/2021 19:27:14 - INFO - __main__ - Step 22934: {'lr': 0.00019990510791476288, 'samples': 733888, 'steps': 1433, 'loss/train': 2.6475095748901367} -09/20/2021 19:27:14 - INFO - __main__ - Step 22935: {'lr': 0.00019990510791476288, 'samples': 733920, 'steps': 1433, 'loss/train': 3.3190114498138428} -09/20/2021 19:27:15 - INFO - __main__ - Step 22936: {'lr': 0.00019990510791476288, 'samples': 733952, 'steps': 1433, 'loss/train': 0.9095749855041504} -09/20/2021 19:27:16 - INFO - __main__ - Step 22937: {'lr': 0.00019990510791476288, 'samples': 733984, 'steps': 1433, 'loss/train': 3.301929473876953} -09/20/2021 19:27:17 - INFO - __main__ - Step 22938: {'lr': 0.00019990510791476288, 'samples': 734016, 'steps': 1433, 'loss/train': 2.772864580154419} -09/20/2021 19:27:17 - INFO - __main__ - Step 22939: {'lr': 0.00019990510791476288, 'samples': 734048, 'steps': 1433, 'loss/train': 2.3725719451904297} -09/20/2021 19:27:18 - INFO - __main__ - Step 22940: {'lr': 0.00019990510791476288, 'samples': 734080, 'steps': 1433, 'loss/train': 0.8303013443946838} -09/20/2021 19:27:19 - INFO - __main__ - Step 22941: {'lr': 0.00019990510791476288, 'samples': 734112, 'steps': 1433, 'loss/train': 3.2323806285858154} -09/20/2021 19:27:20 - INFO - __main__ - Step 22942: {'lr': 0.00019990510791476288, 'samples': 734144, 'steps': 1433, 'loss/train': 3.0631911754608154} -09/20/2021 19:27:20 - INFO - __main__ - Step 22943: {'lr': 0.00019990510791476288, 'samples': 734176, 'steps': 1433, 'loss/train': 3.3426101207733154} -09/20/2021 19:27:21 - INFO - __main__ - Step 22944: {'lr': 0.00019990510791476288, 'samples': 734208, 'steps': 1433, 'loss/train': 3.093317747116089} -09/20/2021 19:27:22 - INFO - __main__ - Step 22945: {'lr': 0.0001999048298869825, 'samples': 734240, 'steps': 1434, 'loss/train': 2.4453530311584473} -09/20/2021 19:27:23 - INFO - __main__ - Step 22946: {'lr': 0.0001999048298869825, 'samples': 734272, 'steps': 1434, 'loss/train': 3.1690990924835205} -09/20/2021 19:27:24 - INFO - __main__ - Step 22947: {'lr': 0.0001999048298869825, 'samples': 734304, 'steps': 1434, 'loss/train': 2.6232736110687256} -09/20/2021 19:27:24 - INFO - __main__ - Step 22948: {'lr': 0.0001999048298869825, 'samples': 734336, 'steps': 1434, 'loss/train': 4.392711639404297} -09/20/2021 19:27:25 - INFO - __main__ - Step 22949: {'lr': 0.0001999048298869825, 'samples': 734368, 'steps': 1434, 'loss/train': 3.1006898880004883} -09/20/2021 19:27:26 - INFO - __main__ - Step 22950: {'lr': 0.0001999048298869825, 'samples': 734400, 'steps': 1434, 'loss/train': 3.4636833667755127} -09/20/2021 19:27:27 - INFO - __main__ - Step 22951: {'lr': 0.0001999048298869825, 'samples': 734432, 'steps': 1434, 'loss/train': 4.677304744720459} -09/20/2021 19:27:27 - INFO - __main__ - Step 22952: {'lr': 0.0001999048298869825, 'samples': 734464, 'steps': 1434, 'loss/train': 3.449871063232422} -09/20/2021 19:27:28 - INFO - __main__ - Step 22953: {'lr': 0.0001999048298869825, 'samples': 734496, 'steps': 1434, 'loss/train': 3.134584903717041} -09/20/2021 19:27:29 - INFO - __main__ - Step 22954: {'lr': 0.0001999048298869825, 'samples': 734528, 'steps': 1434, 'loss/train': 3.152001142501831} -09/20/2021 19:27:30 - INFO - __main__ - Step 22955: {'lr': 0.0001999048298869825, 'samples': 734560, 'steps': 1434, 'loss/train': 3.0763797760009766} -09/20/2021 19:27:30 - INFO - __main__ - Step 22956: {'lr': 0.0001999048298869825, 'samples': 734592, 'steps': 1434, 'loss/train': 0.7982379198074341} -09/20/2021 19:27:31 - INFO - __main__ - Step 22957: {'lr': 0.0001999048298869825, 'samples': 734624, 'steps': 1434, 'loss/train': 2.543933153152466} -09/20/2021 19:27:32 - INFO - __main__ - Step 22958: {'lr': 0.0001999048298869825, 'samples': 734656, 'steps': 1434, 'loss/train': 2.535654306411743} -09/20/2021 19:27:33 - INFO - __main__ - Step 22959: {'lr': 0.0001999048298869825, 'samples': 734688, 'steps': 1434, 'loss/train': 0.48310738801956177} -09/20/2021 19:27:33 - INFO - __main__ - Step 22960: {'lr': 0.0001999048298869825, 'samples': 734720, 'steps': 1434, 'loss/train': 1.0798876285552979} -09/20/2021 19:27:34 - INFO - __main__ - Step 22961: {'lr': 0.00019990455145268982, 'samples': 734752, 'steps': 1435, 'loss/train': 0.37224143743515015} -09/20/2021 19:27:35 - INFO - __main__ - Step 22962: {'lr': 0.00019990455145268982, 'samples': 734784, 'steps': 1435, 'loss/train': 3.6456620693206787} -09/20/2021 19:27:36 - INFO - __main__ - Step 22963: {'lr': 0.00019990455145268982, 'samples': 734816, 'steps': 1435, 'loss/train': 4.531297206878662} -09/20/2021 19:27:36 - INFO - __main__ - Step 22964: {'lr': 0.00019990455145268982, 'samples': 734848, 'steps': 1435, 'loss/train': 3.237861156463623} -09/20/2021 19:27:38 - INFO - __main__ - Step 22965: {'lr': 0.00019990455145268982, 'samples': 734880, 'steps': 1435, 'loss/train': 3.1356990337371826} -09/20/2021 19:27:39 - INFO - __main__ - Step 22966: {'lr': 0.00019990455145268982, 'samples': 734912, 'steps': 1435, 'loss/train': 2.2803170680999756} -09/20/2021 19:27:39 - INFO - __main__ - Step 22967: {'lr': 0.00019990455145268982, 'samples': 734944, 'steps': 1435, 'loss/train': 3.674240827560425} -09/20/2021 19:27:40 - INFO - __main__ - Step 22968: {'lr': 0.00019990455145268982, 'samples': 734976, 'steps': 1435, 'loss/train': 3.195374011993408} -09/20/2021 19:27:41 - INFO - __main__ - Step 22969: {'lr': 0.00019990455145268982, 'samples': 735008, 'steps': 1435, 'loss/train': 3.4012222290039062} -09/20/2021 19:27:42 - INFO - __main__ - Step 22970: {'lr': 0.00019990455145268982, 'samples': 735040, 'steps': 1435, 'loss/train': 3.072129726409912} -09/20/2021 19:27:42 - INFO - __main__ - Step 22971: {'lr': 0.00019990455145268982, 'samples': 735072, 'steps': 1435, 'loss/train': 3.1256303787231445} -09/20/2021 19:27:43 - INFO - __main__ - Step 22972: {'lr': 0.00019990455145268982, 'samples': 735104, 'steps': 1435, 'loss/train': 3.276812791824341} -09/20/2021 19:27:44 - INFO - __main__ - Step 22973: {'lr': 0.00019990455145268982, 'samples': 735136, 'steps': 1435, 'loss/train': 3.0453407764434814} -09/20/2021 19:27:45 - INFO - __main__ - Step 22974: {'lr': 0.00019990455145268982, 'samples': 735168, 'steps': 1435, 'loss/train': 3.382560968399048} -09/20/2021 19:27:45 - INFO - __main__ - Step 22975: {'lr': 0.00019990455145268982, 'samples': 735200, 'steps': 1435, 'loss/train': 1.9717111587524414} -09/20/2021 19:27:46 - INFO - __main__ - Step 22976: {'lr': 0.00019990455145268982, 'samples': 735232, 'steps': 1435, 'loss/train': 3.3932063579559326} -09/20/2021 19:27:47 - INFO - __main__ - Step 22977: {'lr': 0.00019990427261188588, 'samples': 735264, 'steps': 1436, 'loss/train': 2.832350969314575} -09/20/2021 19:27:48 - INFO - __main__ - Step 22978: {'lr': 0.00019990427261188588, 'samples': 735296, 'steps': 1436, 'loss/train': 4.013672828674316} -09/20/2021 19:27:48 - INFO - __main__ - Step 22979: {'lr': 0.00019990427261188588, 'samples': 735328, 'steps': 1436, 'loss/train': 2.9795711040496826} -09/20/2021 19:27:49 - INFO - __main__ - Step 22980: {'lr': 0.00019990427261188588, 'samples': 735360, 'steps': 1436, 'loss/train': 2.664748430252075} -09/20/2021 19:27:50 - INFO - __main__ - Step 22981: {'lr': 0.00019990427261188588, 'samples': 735392, 'steps': 1436, 'loss/train': 4.581803321838379} -09/20/2021 19:27:51 - INFO - __main__ - Step 22982: {'lr': 0.00019990427261188588, 'samples': 735424, 'steps': 1436, 'loss/train': 2.7785115242004395} -09/20/2021 19:27:51 - INFO - __main__ - Step 22983: {'lr': 0.00019990427261188588, 'samples': 735456, 'steps': 1436, 'loss/train': 2.7773587703704834} -09/20/2021 19:27:52 - INFO - __main__ - Step 22984: {'lr': 0.00019990427261188588, 'samples': 735488, 'steps': 1436, 'loss/train': 3.9390177726745605} -09/20/2021 19:27:53 - INFO - __main__ - Step 22985: {'lr': 0.00019990427261188588, 'samples': 735520, 'steps': 1436, 'loss/train': 2.440559148788452} -09/20/2021 19:27:54 - INFO - __main__ - Step 22986: {'lr': 0.00019990427261188588, 'samples': 735552, 'steps': 1436, 'loss/train': 1.8584765195846558} -09/20/2021 19:27:54 - INFO - __main__ - Step 22987: {'lr': 0.00019990427261188588, 'samples': 735584, 'steps': 1436, 'loss/train': 2.041005849838257} -09/20/2021 19:27:55 - INFO - __main__ - Step 22988: {'lr': 0.00019990427261188588, 'samples': 735616, 'steps': 1436, 'loss/train': 3.3295319080352783} -09/20/2021 19:27:56 - INFO - __main__ - Step 22989: {'lr': 0.00019990427261188588, 'samples': 735648, 'steps': 1436, 'loss/train': 2.2540204524993896} -09/20/2021 19:27:57 - INFO - __main__ - Step 22990: {'lr': 0.00019990427261188588, 'samples': 735680, 'steps': 1436, 'loss/train': 3.7394797801971436} -09/20/2021 19:27:57 - INFO - __main__ - Step 22991: {'lr': 0.00019990427261188588, 'samples': 735712, 'steps': 1436, 'loss/train': 3.644150495529175} -09/20/2021 19:27:58 - INFO - __main__ - Step 22992: {'lr': 0.00019990427261188588, 'samples': 735744, 'steps': 1436, 'loss/train': 2.8048224449157715} -09/20/2021 19:27:59 - INFO - __main__ - Step 22993: {'lr': 0.0001999039933645718, 'samples': 735776, 'steps': 1437, 'loss/train': 2.6713507175445557} -09/20/2021 19:28:00 - INFO - __main__ - Step 22994: {'lr': 0.0001999039933645718, 'samples': 735808, 'steps': 1437, 'loss/train': 3.135265350341797} -09/20/2021 19:28:01 - INFO - __main__ - Step 22995: {'lr': 0.0001999039933645718, 'samples': 735840, 'steps': 1437, 'loss/train': 3.1165778636932373} -09/20/2021 19:28:02 - INFO - __main__ - Step 22996: {'lr': 0.0001999039933645718, 'samples': 735872, 'steps': 1437, 'loss/train': 3.5197360515594482} -09/20/2021 19:28:03 - INFO - __main__ - Step 22997: {'lr': 0.0001999039933645718, 'samples': 735904, 'steps': 1437, 'loss/train': 3.325077772140503} -09/20/2021 19:28:04 - INFO - __main__ - Step 22998: {'lr': 0.0001999039933645718, 'samples': 735936, 'steps': 1437, 'loss/train': 3.324580192565918} -09/20/2021 19:28:05 - INFO - __main__ - Step 22999: {'lr': 0.0001999039933645718, 'samples': 735968, 'steps': 1437, 'loss/train': 3.341111898422241} -09/20/2021 19:28:05 - INFO - __main__ - Step 23000: {'lr': 0.0001999039933645718, 'samples': 736000, 'steps': 1437, 'loss/train': 3.0733189582824707} -09/20/2021 19:28:06 - INFO - __main__ - Step 23001: {'lr': 0.0001999039933645718, 'samples': 736032, 'steps': 1437, 'loss/train': 3.050118923187256} -09/20/2021 19:28:07 - INFO - __main__ - Step 23002: {'lr': 0.0001999039933645718, 'samples': 736064, 'steps': 1437, 'loss/train': 2.565028429031372} -09/20/2021 19:28:08 - INFO - __main__ - Step 23003: {'lr': 0.0001999039933645718, 'samples': 736096, 'steps': 1437, 'loss/train': 2.9591763019561768} -09/20/2021 19:28:08 - INFO - __main__ - Step 23004: {'lr': 0.0001999039933645718, 'samples': 736128, 'steps': 1437, 'loss/train': 3.387352705001831} -09/20/2021 19:28:09 - INFO - __main__ - Step 23005: {'lr': 0.0001999039933645718, 'samples': 736160, 'steps': 1437, 'loss/train': 3.285022497177124} -09/20/2021 19:28:10 - INFO - __main__ - Step 23006: {'lr': 0.0001999039933645718, 'samples': 736192, 'steps': 1437, 'loss/train': 3.040148973464966} -09/20/2021 19:28:11 - INFO - __main__ - Step 23007: {'lr': 0.0001999039933645718, 'samples': 736224, 'steps': 1437, 'loss/train': 3.4743545055389404} -09/20/2021 19:28:11 - INFO - __main__ - Step 23008: {'lr': 0.0001999039933645718, 'samples': 736256, 'steps': 1437, 'loss/train': 3.00956654548645} -09/20/2021 19:28:12 - INFO - __main__ - Step 23009: {'lr': 0.0001999037137107488, 'samples': 736288, 'steps': 1438, 'loss/train': 4.45135498046875} -09/20/2021 19:28:13 - INFO - __main__ - Step 23010: {'lr': 0.0001999037137107488, 'samples': 736320, 'steps': 1438, 'loss/train': 2.3411428928375244} -09/20/2021 19:28:14 - INFO - __main__ - Step 23011: {'lr': 0.0001999037137107488, 'samples': 736352, 'steps': 1438, 'loss/train': 0.8110063672065735} -09/20/2021 19:28:14 - INFO - __main__ - Step 23012: {'lr': 0.0001999037137107488, 'samples': 736384, 'steps': 1438, 'loss/train': 3.213935136795044} -09/20/2021 19:28:15 - INFO - __main__ - Step 23013: {'lr': 0.0001999037137107488, 'samples': 736416, 'steps': 1438, 'loss/train': 3.3254220485687256} -09/20/2021 19:28:16 - INFO - __main__ - Step 23014: {'lr': 0.0001999037137107488, 'samples': 736448, 'steps': 1438, 'loss/train': 2.4716997146606445} -09/20/2021 19:28:17 - INFO - __main__ - Step 23015: {'lr': 0.0001999037137107488, 'samples': 736480, 'steps': 1438, 'loss/train': 3.7283577919006348} -09/20/2021 19:28:17 - INFO - __main__ - Step 23016: {'lr': 0.0001999037137107488, 'samples': 736512, 'steps': 1438, 'loss/train': 3.3907828330993652} -09/20/2021 19:28:18 - INFO - __main__ - Step 23017: {'lr': 0.0001999037137107488, 'samples': 736544, 'steps': 1438, 'loss/train': 2.6553409099578857} -09/20/2021 19:28:19 - INFO - __main__ - Step 23018: {'lr': 0.0001999037137107488, 'samples': 736576, 'steps': 1438, 'loss/train': 1.8900270462036133} -09/20/2021 19:28:20 - INFO - __main__ - Step 23019: {'lr': 0.0001999037137107488, 'samples': 736608, 'steps': 1438, 'loss/train': 2.679798126220703} -09/20/2021 19:28:20 - INFO - __main__ - Step 23020: {'lr': 0.0001999037137107488, 'samples': 736640, 'steps': 1438, 'loss/train': 3.083902359008789} -09/20/2021 19:28:21 - INFO - __main__ - Step 23021: {'lr': 0.0001999037137107488, 'samples': 736672, 'steps': 1438, 'loss/train': 2.3116471767425537} -09/20/2021 19:28:22 - INFO - __main__ - Step 23022: {'lr': 0.0001999037137107488, 'samples': 736704, 'steps': 1438, 'loss/train': 3.395320415496826} -09/20/2021 19:28:23 - INFO - __main__ - Step 23023: {'lr': 0.0001999037137107488, 'samples': 736736, 'steps': 1438, 'loss/train': 2.4194250106811523} -09/20/2021 19:28:23 - INFO - __main__ - Step 23024: {'lr': 0.0001999037137107488, 'samples': 736768, 'steps': 1438, 'loss/train': 3.2547545433044434} -09/20/2021 19:28:24 - INFO - __main__ - Step 23025: {'lr': 0.00019990343365041798, 'samples': 736800, 'steps': 1439, 'loss/train': 2.4310073852539062} -09/20/2021 19:28:25 - INFO - __main__ - Step 23026: {'lr': 0.00019990343365041798, 'samples': 736832, 'steps': 1439, 'loss/train': 3.1911890506744385} -09/20/2021 19:28:26 - INFO - __main__ - Step 23027: {'lr': 0.00019990343365041798, 'samples': 736864, 'steps': 1439, 'loss/train': 3.5709941387176514} -09/20/2021 19:28:27 - INFO - __main__ - Step 23028: {'lr': 0.00019990343365041798, 'samples': 736896, 'steps': 1439, 'loss/train': 2.6452136039733887} -09/20/2021 19:28:28 - INFO - __main__ - Step 23029: {'lr': 0.00019990343365041798, 'samples': 736928, 'steps': 1439, 'loss/train': 3.256789207458496} -09/20/2021 19:28:29 - INFO - __main__ - Step 23030: {'lr': 0.00019990343365041798, 'samples': 736960, 'steps': 1439, 'loss/train': 3.1297316551208496} -09/20/2021 19:28:29 - INFO - __main__ - Step 23031: {'lr': 0.00019990343365041798, 'samples': 736992, 'steps': 1439, 'loss/train': 3.0157723426818848} -09/20/2021 19:28:30 - INFO - __main__ - Step 23032: {'lr': 0.00019990343365041798, 'samples': 737024, 'steps': 1439, 'loss/train': 3.111607789993286} -09/20/2021 19:28:31 - INFO - __main__ - Step 23033: {'lr': 0.00019990343365041798, 'samples': 737056, 'steps': 1439, 'loss/train': 3.354804039001465} -09/20/2021 19:28:32 - INFO - __main__ - Step 23034: {'lr': 0.00019990343365041798, 'samples': 737088, 'steps': 1439, 'loss/train': 3.0940709114074707} -09/20/2021 19:28:32 - INFO - __main__ - Step 23035: {'lr': 0.00019990343365041798, 'samples': 737120, 'steps': 1439, 'loss/train': 3.562061071395874} -09/20/2021 19:28:33 - INFO - __main__ - Step 23036: {'lr': 0.00019990343365041798, 'samples': 737152, 'steps': 1439, 'loss/train': 3.2798240184783936} -09/20/2021 19:28:34 - INFO - __main__ - Step 23037: {'lr': 0.00019990343365041798, 'samples': 737184, 'steps': 1439, 'loss/train': 3.075355052947998} -09/20/2021 19:28:35 - INFO - __main__ - Step 23038: {'lr': 0.00019990343365041798, 'samples': 737216, 'steps': 1439, 'loss/train': 3.681919574737549} -09/20/2021 19:28:35 - INFO - __main__ - Step 23039: {'lr': 0.00019990343365041798, 'samples': 737248, 'steps': 1439, 'loss/train': 2.8428916931152344} -09/20/2021 19:28:36 - INFO - __main__ - Step 23040: {'lr': 0.00019990343365041798, 'samples': 737280, 'steps': 1439, 'loss/train': 3.5536248683929443} -09/20/2021 19:28:37 - INFO - __main__ - Step 23041: {'lr': 0.00019990315318358046, 'samples': 737312, 'steps': 1440, 'loss/train': 3.1076784133911133} -09/20/2021 19:28:38 - INFO - __main__ - Step 23042: {'lr': 0.00019990315318358046, 'samples': 737344, 'steps': 1440, 'loss/train': 2.828984498977661} -09/20/2021 19:28:38 - INFO - __main__ - Step 23043: {'lr': 0.00019990315318358046, 'samples': 737376, 'steps': 1440, 'loss/train': 3.7367775440216064} -09/20/2021 19:28:39 - INFO - __main__ - Step 23044: {'lr': 0.00019990315318358046, 'samples': 737408, 'steps': 1440, 'loss/train': 3.00614857673645} -09/20/2021 19:28:40 - INFO - __main__ - Step 23045: {'lr': 0.00019990315318358046, 'samples': 737440, 'steps': 1440, 'loss/train': 2.7516157627105713} -09/20/2021 19:28:41 - INFO - __main__ - Step 23046: {'lr': 0.00019990315318358046, 'samples': 737472, 'steps': 1440, 'loss/train': 3.1338589191436768} -09/20/2021 19:28:41 - INFO - __main__ - Step 23047: {'lr': 0.00019990315318358046, 'samples': 737504, 'steps': 1440, 'loss/train': 2.637824535369873} -09/20/2021 19:28:42 - INFO - __main__ - Step 23048: {'lr': 0.00019990315318358046, 'samples': 737536, 'steps': 1440, 'loss/train': 3.452303409576416} -09/20/2021 19:28:43 - INFO - __main__ - Step 23049: {'lr': 0.00019990315318358046, 'samples': 737568, 'steps': 1440, 'loss/train': 3.118628978729248} -09/20/2021 19:28:44 - INFO - __main__ - Step 23050: {'lr': 0.00019990315318358046, 'samples': 737600, 'steps': 1440, 'loss/train': 2.2899460792541504} -09/20/2021 19:28:44 - INFO - __main__ - Step 23051: {'lr': 0.00019990315318358046, 'samples': 737632, 'steps': 1440, 'loss/train': 3.2042088508605957} -09/20/2021 19:28:45 - INFO - __main__ - Step 23052: {'lr': 0.00019990315318358046, 'samples': 737664, 'steps': 1440, 'loss/train': 2.494529962539673} -09/20/2021 19:28:46 - INFO - __main__ - Step 23053: {'lr': 0.00019990315318358046, 'samples': 737696, 'steps': 1440, 'loss/train': 2.6050922870635986} -09/20/2021 19:28:47 - INFO - __main__ - Step 23054: {'lr': 0.00019990315318358046, 'samples': 737728, 'steps': 1440, 'loss/train': 2.86905574798584} -09/20/2021 19:28:47 - INFO - __main__ - Step 23055: {'lr': 0.00019990315318358046, 'samples': 737760, 'steps': 1440, 'loss/train': 4.009888172149658} -09/20/2021 19:28:48 - INFO - __main__ - Step 23056: {'lr': 0.00019990315318358046, 'samples': 737792, 'steps': 1440, 'loss/train': 3.035595178604126} -09/20/2021 19:28:50 - INFO - __main__ - Step 23057: {'lr': 0.0001999028723102374, 'samples': 737824, 'steps': 1441, 'loss/train': 3.173060655593872} -09/20/2021 19:28:50 - INFO - __main__ - Step 23058: {'lr': 0.0001999028723102374, 'samples': 737856, 'steps': 1441, 'loss/train': 2.9572253227233887} -09/20/2021 19:28:51 - INFO - __main__ - Step 23059: {'lr': 0.0001999028723102374, 'samples': 737888, 'steps': 1441, 'loss/train': 2.8493478298187256} -09/20/2021 19:28:52 - INFO - __main__ - Step 23060: {'lr': 0.0001999028723102374, 'samples': 737920, 'steps': 1441, 'loss/train': 3.355005979537964} -09/20/2021 19:28:53 - INFO - __main__ - Step 23061: {'lr': 0.0001999028723102374, 'samples': 737952, 'steps': 1441, 'loss/train': 3.7255961894989014} -09/20/2021 19:28:53 - INFO - __main__ - Step 23062: {'lr': 0.0001999028723102374, 'samples': 737984, 'steps': 1441, 'loss/train': 2.982586622238159} -09/20/2021 19:28:54 - INFO - __main__ - Step 23063: {'lr': 0.0001999028723102374, 'samples': 738016, 'steps': 1441, 'loss/train': 3.1803107261657715} -09/20/2021 19:28:55 - INFO - __main__ - Step 23064: {'lr': 0.0001999028723102374, 'samples': 738048, 'steps': 1441, 'loss/train': 2.8149189949035645} -09/20/2021 19:28:56 - INFO - __main__ - Step 23065: {'lr': 0.0001999028723102374, 'samples': 738080, 'steps': 1441, 'loss/train': 3.560056686401367} -09/20/2021 19:28:56 - INFO - __main__ - Step 23066: {'lr': 0.0001999028723102374, 'samples': 738112, 'steps': 1441, 'loss/train': 3.3446567058563232} -09/20/2021 19:28:57 - INFO - __main__ - Step 23067: {'lr': 0.0001999028723102374, 'samples': 738144, 'steps': 1441, 'loss/train': 3.1515555381774902} -09/20/2021 19:28:58 - INFO - __main__ - Step 23068: {'lr': 0.0001999028723102374, 'samples': 738176, 'steps': 1441, 'loss/train': 3.6730072498321533} -09/20/2021 19:28:59 - INFO - __main__ - Step 23069: {'lr': 0.0001999028723102374, 'samples': 738208, 'steps': 1441, 'loss/train': 2.961395263671875} -09/20/2021 19:28:59 - INFO - __main__ - Step 23070: {'lr': 0.0001999028723102374, 'samples': 738240, 'steps': 1441, 'loss/train': 3.306981086730957} -09/20/2021 19:29:00 - INFO - __main__ - Step 23071: {'lr': 0.0001999028723102374, 'samples': 738272, 'steps': 1441, 'loss/train': 2.4255266189575195} -09/20/2021 19:29:01 - INFO - __main__ - Step 23072: {'lr': 0.0001999028723102374, 'samples': 738304, 'steps': 1441, 'loss/train': 2.61906361579895} -09/20/2021 19:29:02 - INFO - __main__ - Step 23073: {'lr': 0.00019990259103038995, 'samples': 738336, 'steps': 1442, 'loss/train': 2.5417981147766113} -09/20/2021 19:29:03 - INFO - __main__ - Step 23074: {'lr': 0.00019990259103038995, 'samples': 738368, 'steps': 1442, 'loss/train': 2.3087568283081055} -09/20/2021 19:29:03 - INFO - __main__ - Step 23075: {'lr': 0.00019990259103038995, 'samples': 738400, 'steps': 1442, 'loss/train': 2.9585323333740234} -09/20/2021 19:29:04 - INFO - __main__ - Step 23076: {'lr': 0.00019990259103038995, 'samples': 738432, 'steps': 1442, 'loss/train': 3.6762070655822754} -09/20/2021 19:29:05 - INFO - __main__ - Step 23077: {'lr': 0.00019990259103038995, 'samples': 738464, 'steps': 1442, 'loss/train': 2.7970283031463623} -09/20/2021 19:29:06 - INFO - __main__ - Step 23078: {'lr': 0.00019990259103038995, 'samples': 738496, 'steps': 1442, 'loss/train': 3.2535579204559326} -09/20/2021 19:29:06 - INFO - __main__ - Step 23079: {'lr': 0.00019990259103038995, 'samples': 738528, 'steps': 1442, 'loss/train': 3.3354718685150146} -09/20/2021 19:29:07 - INFO - __main__ - Step 23080: {'lr': 0.00019990259103038995, 'samples': 738560, 'steps': 1442, 'loss/train': 2.9504032135009766} -09/20/2021 19:29:08 - INFO - __main__ - Step 23081: {'lr': 0.00019990259103038995, 'samples': 738592, 'steps': 1442, 'loss/train': 0.47248613834381104} -09/20/2021 19:29:09 - INFO - __main__ - Step 23082: {'lr': 0.00019990259103038995, 'samples': 738624, 'steps': 1442, 'loss/train': 3.138564348220825} -09/20/2021 19:29:09 - INFO - __main__ - Step 23083: {'lr': 0.00019990259103038995, 'samples': 738656, 'steps': 1442, 'loss/train': 3.863887310028076} -09/20/2021 19:29:10 - INFO - __main__ - Step 23084: {'lr': 0.00019990259103038995, 'samples': 738688, 'steps': 1442, 'loss/train': 0.9328632950782776} -09/20/2021 19:29:11 - INFO - __main__ - Step 23085: {'lr': 0.00019990259103038995, 'samples': 738720, 'steps': 1442, 'loss/train': 4.448206901550293} -09/20/2021 19:29:12 - INFO - __main__ - Step 23086: {'lr': 0.00019990259103038995, 'samples': 738752, 'steps': 1442, 'loss/train': 3.288050413131714} -09/20/2021 19:29:13 - INFO - __main__ - Step 23087: {'lr': 0.00019990259103038995, 'samples': 738784, 'steps': 1442, 'loss/train': 3.008209228515625} -09/20/2021 19:29:14 - INFO - __main__ - Step 23088: {'lr': 0.00019990259103038995, 'samples': 738816, 'steps': 1442, 'loss/train': 2.415557384490967} -09/20/2021 19:29:15 - INFO - __main__ - Step 23089: {'lr': 0.00019990230934403922, 'samples': 738848, 'steps': 1443, 'loss/train': 2.4854846000671387} -09/20/2021 19:29:16 - INFO - __main__ - Step 23090: {'lr': 0.00019990230934403922, 'samples': 738880, 'steps': 1443, 'loss/train': 3.3385348320007324} -09/20/2021 19:29:16 - INFO - __main__ - Step 23091: {'lr': 0.00019990230934403922, 'samples': 738912, 'steps': 1443, 'loss/train': 3.1007449626922607} -09/20/2021 19:29:17 - INFO - __main__ - Step 23092: {'lr': 0.00019990230934403922, 'samples': 738944, 'steps': 1443, 'loss/train': 3.1475582122802734} -09/20/2021 19:29:18 - INFO - __main__ - Step 23093: {'lr': 0.00019990230934403922, 'samples': 738976, 'steps': 1443, 'loss/train': 2.829899549484253} -09/20/2021 19:29:19 - INFO - __main__ - Step 23094: {'lr': 0.00019990230934403922, 'samples': 739008, 'steps': 1443, 'loss/train': 2.7210423946380615} -09/20/2021 19:29:19 - INFO - __main__ - Step 23095: {'lr': 0.00019990230934403922, 'samples': 739040, 'steps': 1443, 'loss/train': 0.6987234354019165} -09/20/2021 19:29:20 - INFO - __main__ - Step 23096: {'lr': 0.00019990230934403922, 'samples': 739072, 'steps': 1443, 'loss/train': 0.7980306148529053} -09/20/2021 19:29:21 - INFO - __main__ - Step 23097: {'lr': 0.00019990230934403922, 'samples': 739104, 'steps': 1443, 'loss/train': 0.6395014524459839} -09/20/2021 19:29:22 - INFO - __main__ - Step 23098: {'lr': 0.00019990230934403922, 'samples': 739136, 'steps': 1443, 'loss/train': 2.8651630878448486} -09/20/2021 19:29:22 - INFO - __main__ - Step 23099: {'lr': 0.00019990230934403922, 'samples': 739168, 'steps': 1443, 'loss/train': 2.168120861053467} -09/20/2021 19:29:23 - INFO - __main__ - Step 23100: {'lr': 0.00019990230934403922, 'samples': 739200, 'steps': 1443, 'loss/train': 2.207510471343994} -09/20/2021 19:29:24 - INFO - __main__ - Step 23101: {'lr': 0.00019990230934403922, 'samples': 739232, 'steps': 1443, 'loss/train': 2.4224164485931396} -09/20/2021 19:29:25 - INFO - __main__ - Step 23102: {'lr': 0.00019990230934403922, 'samples': 739264, 'steps': 1443, 'loss/train': 2.1719532012939453} -09/20/2021 19:29:25 - INFO - __main__ - Step 23103: {'lr': 0.00019990230934403922, 'samples': 739296, 'steps': 1443, 'loss/train': 2.236753225326538} -09/20/2021 19:29:26 - INFO - __main__ - Step 23104: {'lr': 0.00019990230934403922, 'samples': 739328, 'steps': 1443, 'loss/train': 2.2604339122772217} -09/20/2021 19:29:27 - INFO - __main__ - Step 23105: {'lr': 0.0001999020272511864, 'samples': 739360, 'steps': 1444, 'loss/train': 1.7719041109085083} -09/20/2021 19:29:28 - INFO - __main__ - Step 23106: {'lr': 0.0001999020272511864, 'samples': 739392, 'steps': 1444, 'loss/train': 2.0069546699523926} -09/20/2021 19:29:28 - INFO - __main__ - Step 23107: {'lr': 0.0001999020272511864, 'samples': 739424, 'steps': 1444, 'loss/train': 2.7698423862457275} -09/20/2021 19:29:29 - INFO - __main__ - Step 23108: {'lr': 0.0001999020272511864, 'samples': 739456, 'steps': 1444, 'loss/train': 3.146300792694092} -09/20/2021 19:29:30 - INFO - __main__ - Step 23109: {'lr': 0.0001999020272511864, 'samples': 739488, 'steps': 1444, 'loss/train': 3.4960756301879883} -09/20/2021 19:29:31 - INFO - __main__ - Step 23110: {'lr': 0.0001999020272511864, 'samples': 739520, 'steps': 1444, 'loss/train': 2.822049379348755} -09/20/2021 19:29:31 - INFO - __main__ - Step 23111: {'lr': 0.0001999020272511864, 'samples': 739552, 'steps': 1444, 'loss/train': 2.8516252040863037} -09/20/2021 19:29:32 - INFO - __main__ - Step 23112: {'lr': 0.0001999020272511864, 'samples': 739584, 'steps': 1444, 'loss/train': 2.969104290008545} -09/20/2021 19:29:33 - INFO - __main__ - Step 23113: {'lr': 0.0001999020272511864, 'samples': 739616, 'steps': 1444, 'loss/train': 0.8818982839584351} -09/20/2021 19:29:34 - INFO - __main__ - Step 23114: {'lr': 0.0001999020272511864, 'samples': 739648, 'steps': 1444, 'loss/train': 3.973031520843506} -09/20/2021 19:29:34 - INFO - __main__ - Step 23115: {'lr': 0.0001999020272511864, 'samples': 739680, 'steps': 1444, 'loss/train': 4.934118270874023} -09/20/2021 19:29:35 - INFO - __main__ - Step 23116: {'lr': 0.0001999020272511864, 'samples': 739712, 'steps': 1444, 'loss/train': 2.841167449951172} -09/20/2021 19:29:36 - INFO - __main__ - Step 23117: {'lr': 0.0001999020272511864, 'samples': 739744, 'steps': 1444, 'loss/train': 3.6490015983581543} -09/20/2021 19:29:37 - INFO - __main__ - Step 23118: {'lr': 0.0001999020272511864, 'samples': 739776, 'steps': 1444, 'loss/train': 2.947774887084961} -09/20/2021 19:29:37 - INFO - __main__ - Step 23119: {'lr': 0.0001999020272511864, 'samples': 739808, 'steps': 1444, 'loss/train': 1.8950051069259644} -09/20/2021 19:29:38 - INFO - __main__ - Step 23120: {'lr': 0.0001999020272511864, 'samples': 739840, 'steps': 1444, 'loss/train': 2.5240516662597656} -09/20/2021 19:29:39 - INFO - __main__ - Step 23121: {'lr': 0.00019990174475183263, 'samples': 739872, 'steps': 1445, 'loss/train': 1.9299554824829102} -09/20/2021 19:29:40 - INFO - __main__ - Step 23122: {'lr': 0.00019990174475183263, 'samples': 739904, 'steps': 1445, 'loss/train': 2.030548334121704} -09/20/2021 19:29:41 - INFO - __main__ - Step 23123: {'lr': 0.00019990174475183263, 'samples': 739936, 'steps': 1445, 'loss/train': 3.183995246887207} -09/20/2021 19:29:42 - INFO - __main__ - Step 23124: {'lr': 0.00019990174475183263, 'samples': 739968, 'steps': 1445, 'loss/train': 2.6951780319213867} -09/20/2021 19:29:43 - INFO - __main__ - Step 23125: {'lr': 0.00019990174475183263, 'samples': 740000, 'steps': 1445, 'loss/train': 2.2899703979492188} -09/20/2021 19:29:43 - INFO - __main__ - Step 23126: {'lr': 0.00019990174475183263, 'samples': 740032, 'steps': 1445, 'loss/train': 3.5992271900177} -09/20/2021 19:29:44 - INFO - __main__ - Step 23127: {'lr': 0.00019990174475183263, 'samples': 740064, 'steps': 1445, 'loss/train': 3.946337938308716} -09/20/2021 19:29:45 - INFO - __main__ - Step 23128: {'lr': 0.00019990174475183263, 'samples': 740096, 'steps': 1445, 'loss/train': 3.2174417972564697} -09/20/2021 19:29:46 - INFO - __main__ - Step 23129: {'lr': 0.00019990174475183263, 'samples': 740128, 'steps': 1445, 'loss/train': 2.9047937393188477} -09/20/2021 19:29:46 - INFO - __main__ - Step 23130: {'lr': 0.00019990174475183263, 'samples': 740160, 'steps': 1445, 'loss/train': 3.378425359725952} -09/20/2021 19:29:47 - INFO - __main__ - Step 23131: {'lr': 0.00019990174475183263, 'samples': 740192, 'steps': 1445, 'loss/train': 3.087475538253784} -09/20/2021 19:29:48 - INFO - __main__ - Step 23132: {'lr': 0.00019990174475183263, 'samples': 740224, 'steps': 1445, 'loss/train': 3.68935227394104} -09/20/2021 19:29:49 - INFO - __main__ - Step 23133: {'lr': 0.00019990174475183263, 'samples': 740256, 'steps': 1445, 'loss/train': 4.838827610015869} -09/20/2021 19:29:49 - INFO - __main__ - Step 23134: {'lr': 0.00019990174475183263, 'samples': 740288, 'steps': 1445, 'loss/train': 2.739732503890991} -09/20/2021 19:29:50 - INFO - __main__ - Step 23135: {'lr': 0.00019990174475183263, 'samples': 740320, 'steps': 1445, 'loss/train': 3.115638256072998} -09/20/2021 19:29:51 - INFO - __main__ - Step 23136: {'lr': 0.00019990174475183263, 'samples': 740352, 'steps': 1445, 'loss/train': 3.2500462532043457} -09/20/2021 19:29:52 - INFO - __main__ - Step 23137: {'lr': 0.00019990146184597905, 'samples': 740384, 'steps': 1446, 'loss/train': 1.1182165145874023} -09/20/2021 19:29:53 - INFO - __main__ - Step 23138: {'lr': 0.00019990146184597905, 'samples': 740416, 'steps': 1446, 'loss/train': 2.512634515762329} -09/20/2021 19:29:53 - INFO - __main__ - Step 23139: {'lr': 0.00019990146184597905, 'samples': 740448, 'steps': 1446, 'loss/train': 2.519636392593384} -09/20/2021 19:29:54 - INFO - __main__ - Step 23140: {'lr': 0.00019990146184597905, 'samples': 740480, 'steps': 1446, 'loss/train': 0.7378455400466919} -09/20/2021 19:29:55 - INFO - __main__ - Step 23141: {'lr': 0.00019990146184597905, 'samples': 740512, 'steps': 1446, 'loss/train': 0.7234638333320618} -09/20/2021 19:29:56 - INFO - __main__ - Step 23142: {'lr': 0.00019990146184597905, 'samples': 740544, 'steps': 1446, 'loss/train': 3.190685987472534} -09/20/2021 19:29:56 - INFO - __main__ - Step 23143: {'lr': 0.00019990146184597905, 'samples': 740576, 'steps': 1446, 'loss/train': 3.385770797729492} -09/20/2021 19:29:57 - INFO - __main__ - Step 23144: {'lr': 0.00019990146184597905, 'samples': 740608, 'steps': 1446, 'loss/train': 2.4103915691375732} -09/20/2021 19:29:58 - INFO - __main__ - Step 23145: {'lr': 0.00019990146184597905, 'samples': 740640, 'steps': 1446, 'loss/train': 3.661395311355591} -09/20/2021 19:29:59 - INFO - __main__ - Step 23146: {'lr': 0.00019990146184597905, 'samples': 740672, 'steps': 1446, 'loss/train': 1.0809317827224731} -09/20/2021 19:29:59 - INFO - __main__ - Step 23147: {'lr': 0.00019990146184597905, 'samples': 740704, 'steps': 1446, 'loss/train': 2.9389336109161377} -09/20/2021 19:30:00 - INFO - __main__ - Step 23148: {'lr': 0.00019990146184597905, 'samples': 740736, 'steps': 1446, 'loss/train': 2.6323914527893066} -09/20/2021 19:30:01 - INFO - __main__ - Step 23149: {'lr': 0.00019990146184597905, 'samples': 740768, 'steps': 1446, 'loss/train': 4.39642858505249} -09/20/2021 19:30:02 - INFO - __main__ - Step 23150: {'lr': 0.00019990146184597905, 'samples': 740800, 'steps': 1446, 'loss/train': 2.6901025772094727} -09/20/2021 19:30:02 - INFO - __main__ - Step 23151: {'lr': 0.00019990146184597905, 'samples': 740832, 'steps': 1446, 'loss/train': 2.781731367111206} -09/20/2021 19:30:03 - INFO - __main__ - Step 23152: {'lr': 0.00019990146184597905, 'samples': 740864, 'steps': 1446, 'loss/train': 2.6554925441741943} -09/20/2021 19:30:04 - INFO - __main__ - Step 23153: {'lr': 0.0001999011785336268, 'samples': 740896, 'steps': 1447, 'loss/train': 2.8258919715881348} -09/20/2021 19:30:05 - INFO - __main__ - Step 23154: {'lr': 0.0001999011785336268, 'samples': 740928, 'steps': 1447, 'loss/train': 1.7972031831741333} -09/20/2021 19:30:06 - INFO - __main__ - Step 23155: {'lr': 0.0001999011785336268, 'samples': 740960, 'steps': 1447, 'loss/train': 3.048144817352295} -09/20/2021 19:30:07 - INFO - __main__ - Step 23156: {'lr': 0.0001999011785336268, 'samples': 740992, 'steps': 1447, 'loss/train': 2.9389684200286865} -09/20/2021 19:30:08 - INFO - __main__ - Step 23157: {'lr': 0.0001999011785336268, 'samples': 741024, 'steps': 1447, 'loss/train': 2.947554588317871} -09/20/2021 19:30:08 - INFO - __main__ - Step 23158: {'lr': 0.0001999011785336268, 'samples': 741056, 'steps': 1447, 'loss/train': 2.8366808891296387} -09/20/2021 19:30:09 - INFO - __main__ - Step 23159: {'lr': 0.0001999011785336268, 'samples': 741088, 'steps': 1447, 'loss/train': 3.5795657634735107} -09/20/2021 19:30:10 - INFO - __main__ - Step 23160: {'lr': 0.0001999011785336268, 'samples': 741120, 'steps': 1447, 'loss/train': 3.369276762008667} -09/20/2021 19:30:11 - INFO - __main__ - Step 23161: {'lr': 0.0001999011785336268, 'samples': 741152, 'steps': 1447, 'loss/train': 2.464099884033203} -09/20/2021 19:30:11 - INFO - __main__ - Step 23162: {'lr': 0.0001999011785336268, 'samples': 741184, 'steps': 1447, 'loss/train': 2.7751543521881104} -09/20/2021 19:30:12 - INFO - __main__ - Step 23163: {'lr': 0.0001999011785336268, 'samples': 741216, 'steps': 1447, 'loss/train': 3.2010207176208496} -09/20/2021 19:30:13 - INFO - __main__ - Step 23164: {'lr': 0.0001999011785336268, 'samples': 741248, 'steps': 1447, 'loss/train': 4.221067428588867} -09/20/2021 19:30:13 - INFO - __main__ - Step 23165: {'lr': 0.0001999011785336268, 'samples': 741280, 'steps': 1447, 'loss/train': 3.4507620334625244} -09/20/2021 19:30:14 - INFO - __main__ - Step 23166: {'lr': 0.0001999011785336268, 'samples': 741312, 'steps': 1447, 'loss/train': 2.752199411392212} -09/20/2021 19:30:15 - INFO - __main__ - Step 23167: {'lr': 0.0001999011785336268, 'samples': 741344, 'steps': 1447, 'loss/train': 2.575547456741333} -09/20/2021 19:30:16 - INFO - __main__ - Step 23168: {'lr': 0.0001999011785336268, 'samples': 741376, 'steps': 1447, 'loss/train': 2.5400235652923584} -09/20/2021 19:30:17 - INFO - __main__ - Step 23169: {'lr': 0.000199900894814777, 'samples': 741408, 'steps': 1448, 'loss/train': 3.7393128871917725} -09/20/2021 19:30:17 - INFO - __main__ - Step 23170: {'lr': 0.000199900894814777, 'samples': 741440, 'steps': 1448, 'loss/train': 2.905937671661377} -09/20/2021 19:30:18 - INFO - __main__ - Step 23171: {'lr': 0.000199900894814777, 'samples': 741472, 'steps': 1448, 'loss/train': 2.958503007888794} -09/20/2021 19:30:19 - INFO - __main__ - Step 23172: {'lr': 0.000199900894814777, 'samples': 741504, 'steps': 1448, 'loss/train': 2.9897775650024414} -09/20/2021 19:30:20 - INFO - __main__ - Step 23173: {'lr': 0.000199900894814777, 'samples': 741536, 'steps': 1448, 'loss/train': 2.955249547958374} -09/20/2021 19:30:20 - INFO - __main__ - Step 23174: {'lr': 0.000199900894814777, 'samples': 741568, 'steps': 1448, 'loss/train': 3.3824453353881836} -09/20/2021 19:30:21 - INFO - __main__ - Step 23175: {'lr': 0.000199900894814777, 'samples': 741600, 'steps': 1448, 'loss/train': 2.8602192401885986} -09/20/2021 19:30:22 - INFO - __main__ - Step 23176: {'lr': 0.000199900894814777, 'samples': 741632, 'steps': 1448, 'loss/train': 2.936530351638794} -09/20/2021 19:30:23 - INFO - __main__ - Step 23177: {'lr': 0.000199900894814777, 'samples': 741664, 'steps': 1448, 'loss/train': 2.7984182834625244} -09/20/2021 19:30:23 - INFO - __main__ - Step 23178: {'lr': 0.000199900894814777, 'samples': 741696, 'steps': 1448, 'loss/train': 3.6185760498046875} -09/20/2021 19:30:24 - INFO - __main__ - Step 23179: {'lr': 0.000199900894814777, 'samples': 741728, 'steps': 1448, 'loss/train': 0.5541381239891052} -09/20/2021 19:30:25 - INFO - __main__ - Step 23180: {'lr': 0.000199900894814777, 'samples': 741760, 'steps': 1448, 'loss/train': 0.5049427151679993} -09/20/2021 19:30:26 - INFO - __main__ - Step 23181: {'lr': 0.000199900894814777, 'samples': 741792, 'steps': 1448, 'loss/train': 0.6566279530525208} -09/20/2021 19:30:26 - INFO - __main__ - Step 23182: {'lr': 0.000199900894814777, 'samples': 741824, 'steps': 1448, 'loss/train': 3.9154539108276367} -09/20/2021 19:30:27 - INFO - __main__ - Step 23183: {'lr': 0.000199900894814777, 'samples': 741856, 'steps': 1448, 'loss/train': 2.8683085441589355} -09/20/2021 19:30:28 - INFO - __main__ - Step 23184: {'lr': 0.000199900894814777, 'samples': 741888, 'steps': 1448, 'loss/train': 3.407294511795044} -09/20/2021 19:30:30 - INFO - __main__ - Step 23185: {'lr': 0.00019990061068943092, 'samples': 741920, 'steps': 1449, 'loss/train': 2.943401575088501} -09/20/2021 19:30:30 - INFO - __main__ - Step 23186: {'lr': 0.00019990061068943092, 'samples': 741952, 'steps': 1449, 'loss/train': 3.078476905822754} -09/20/2021 19:30:31 - INFO - __main__ - Step 23187: {'lr': 0.00019990061068943092, 'samples': 741984, 'steps': 1449, 'loss/train': 4.182049751281738} -09/20/2021 19:30:32 - INFO - __main__ - Step 23188: {'lr': 0.00019990061068943092, 'samples': 742016, 'steps': 1449, 'loss/train': 3.538175344467163} -09/20/2021 19:30:33 - INFO - __main__ - Step 23189: {'lr': 0.00019990061068943092, 'samples': 742048, 'steps': 1449, 'loss/train': 2.9048049449920654} -09/20/2021 19:30:33 - INFO - __main__ - Step 23190: {'lr': 0.00019990061068943092, 'samples': 742080, 'steps': 1449, 'loss/train': 3.490741491317749} -09/20/2021 19:30:34 - INFO - __main__ - Step 23191: {'lr': 0.00019990061068943092, 'samples': 742112, 'steps': 1449, 'loss/train': 2.014963150024414} -09/20/2021 19:30:35 - INFO - __main__ - Step 23192: {'lr': 0.00019990061068943092, 'samples': 742144, 'steps': 1449, 'loss/train': 2.397005796432495} -09/20/2021 19:30:36 - INFO - __main__ - Step 23193: {'lr': 0.00019990061068943092, 'samples': 742176, 'steps': 1449, 'loss/train': 3.2254068851470947} -09/20/2021 19:30:36 - INFO - __main__ - Step 23194: {'lr': 0.00019990061068943092, 'samples': 742208, 'steps': 1449, 'loss/train': 2.873927354812622} -09/20/2021 19:30:37 - INFO - __main__ - Step 23195: {'lr': 0.00019990061068943092, 'samples': 742240, 'steps': 1449, 'loss/train': 2.796757459640503} -09/20/2021 19:30:38 - INFO - __main__ - Step 23196: {'lr': 0.00019990061068943092, 'samples': 742272, 'steps': 1449, 'loss/train': 3.4227311611175537} -09/20/2021 19:30:39 - INFO - __main__ - Step 23197: {'lr': 0.00019990061068943092, 'samples': 742304, 'steps': 1449, 'loss/train': 2.89906644821167} -09/20/2021 19:30:39 - INFO - __main__ - Step 23198: {'lr': 0.00019990061068943092, 'samples': 742336, 'steps': 1449, 'loss/train': 2.8842039108276367} -09/20/2021 19:30:40 - INFO - __main__ - Step 23199: {'lr': 0.00019990061068943092, 'samples': 742368, 'steps': 1449, 'loss/train': 3.144955635070801} -09/20/2021 19:30:41 - INFO - __main__ - Step 23200: {'lr': 0.00019990061068943092, 'samples': 742400, 'steps': 1449, 'loss/train': 2.912790298461914} -09/20/2021 19:30:42 - INFO - __main__ - Step 23201: {'lr': 0.00019990032615758958, 'samples': 742432, 'steps': 1450, 'loss/train': 2.446385622024536} -09/20/2021 19:30:42 - INFO - __main__ - Step 23202: {'lr': 0.00019990032615758958, 'samples': 742464, 'steps': 1450, 'loss/train': 1.4812653064727783} -09/20/2021 19:30:43 - INFO - __main__ - Step 23203: {'lr': 0.00019990032615758958, 'samples': 742496, 'steps': 1450, 'loss/train': 2.224231719970703} -09/20/2021 19:30:44 - INFO - __main__ - Step 23204: {'lr': 0.00019990032615758958, 'samples': 742528, 'steps': 1450, 'loss/train': 2.7743892669677734} -09/20/2021 19:30:45 - INFO - __main__ - Step 23205: {'lr': 0.00019990032615758958, 'samples': 742560, 'steps': 1450, 'loss/train': 1.9337536096572876} -09/20/2021 19:30:45 - INFO - __main__ - Step 23206: {'lr': 0.00019990032615758958, 'samples': 742592, 'steps': 1450, 'loss/train': 2.4841246604919434} -09/20/2021 19:30:46 - INFO - __main__ - Step 23207: {'lr': 0.00019990032615758958, 'samples': 742624, 'steps': 1450, 'loss/train': 2.120570182800293} -09/20/2021 19:30:47 - INFO - __main__ - Step 23208: {'lr': 0.00019990032615758958, 'samples': 742656, 'steps': 1450, 'loss/train': 1.983971118927002} -09/20/2021 19:30:48 - INFO - __main__ - Step 23209: {'lr': 0.00019990032615758958, 'samples': 742688, 'steps': 1450, 'loss/train': 2.815572500228882} -09/20/2021 19:30:48 - INFO - __main__ - Step 23210: {'lr': 0.00019990032615758958, 'samples': 742720, 'steps': 1450, 'loss/train': 3.4092185497283936} -09/20/2021 19:30:49 - INFO - __main__ - Step 23211: {'lr': 0.00019990032615758958, 'samples': 742752, 'steps': 1450, 'loss/train': 2.9950709342956543} -09/20/2021 19:30:50 - INFO - __main__ - Step 23212: {'lr': 0.00019990032615758958, 'samples': 742784, 'steps': 1450, 'loss/train': 1.2808492183685303} -09/20/2021 19:30:51 - INFO - __main__ - Step 23213: {'lr': 0.00019990032615758958, 'samples': 742816, 'steps': 1450, 'loss/train': 2.9261438846588135} -09/20/2021 19:30:51 - INFO - __main__ - Step 23214: {'lr': 0.00019990032615758958, 'samples': 742848, 'steps': 1450, 'loss/train': 1.3010090589523315} -09/20/2021 19:30:52 - INFO - __main__ - Step 23215: {'lr': 0.00019990032615758958, 'samples': 742880, 'steps': 1450, 'loss/train': 2.613548755645752} -09/20/2021 19:30:53 - INFO - __main__ - Step 23216: {'lr': 0.00019990032615758958, 'samples': 742912, 'steps': 1450, 'loss/train': 2.8639674186706543} -09/20/2021 19:30:54 - INFO - __main__ - Step 23217: {'lr': 0.00019990004121925425, 'samples': 742944, 'steps': 1451, 'loss/train': 1.0070608854293823} -09/20/2021 19:30:55 - INFO - __main__ - Step 23218: {'lr': 0.00019990004121925425, 'samples': 742976, 'steps': 1451, 'loss/train': 3.2097344398498535} -09/20/2021 19:30:56 - INFO - __main__ - Step 23219: {'lr': 0.00019990004121925425, 'samples': 743008, 'steps': 1451, 'loss/train': 2.971623182296753} -09/20/2021 19:30:57 - INFO - __main__ - Step 23220: {'lr': 0.00019990004121925425, 'samples': 743040, 'steps': 1451, 'loss/train': 4.041598320007324} -09/20/2021 19:30:57 - INFO - __main__ - Step 23221: {'lr': 0.00019990004121925425, 'samples': 743072, 'steps': 1451, 'loss/train': 3.0655746459960938} -09/20/2021 19:30:58 - INFO - __main__ - Step 23222: {'lr': 0.00019990004121925425, 'samples': 743104, 'steps': 1451, 'loss/train': 3.4306817054748535} -09/20/2021 19:30:59 - INFO - __main__ - Step 23223: {'lr': 0.00019990004121925425, 'samples': 743136, 'steps': 1451, 'loss/train': 3.0401062965393066} -09/20/2021 19:31:00 - INFO - __main__ - Step 23224: {'lr': 0.00019990004121925425, 'samples': 743168, 'steps': 1451, 'loss/train': 1.7747180461883545} -09/20/2021 19:31:00 - INFO - __main__ - Step 23225: {'lr': 0.00019990004121925425, 'samples': 743200, 'steps': 1451, 'loss/train': 3.554091691970825} -09/20/2021 19:31:01 - INFO - __main__ - Step 23226: {'lr': 0.00019990004121925425, 'samples': 743232, 'steps': 1451, 'loss/train': 2.4254038333892822} -09/20/2021 19:31:02 - INFO - __main__ - Step 23227: {'lr': 0.00019990004121925425, 'samples': 743264, 'steps': 1451, 'loss/train': 3.3105955123901367} -09/20/2021 19:31:03 - INFO - __main__ - Step 23228: {'lr': 0.00019990004121925425, 'samples': 743296, 'steps': 1451, 'loss/train': 2.302450656890869} -09/20/2021 19:31:03 - INFO - __main__ - Step 23229: {'lr': 0.00019990004121925425, 'samples': 743328, 'steps': 1451, 'loss/train': 3.7626824378967285} -09/20/2021 19:31:04 - INFO - __main__ - Step 23230: {'lr': 0.00019990004121925425, 'samples': 743360, 'steps': 1451, 'loss/train': 3.8808467388153076} -09/20/2021 19:31:05 - INFO - __main__ - Step 23231: {'lr': 0.00019990004121925425, 'samples': 743392, 'steps': 1451, 'loss/train': 2.692089080810547} -09/20/2021 19:31:06 - INFO - __main__ - Step 23232: {'lr': 0.00019990004121925425, 'samples': 743424, 'steps': 1451, 'loss/train': 4.034153938293457} -09/20/2021 19:31:07 - INFO - __main__ - Step 23233: {'lr': 0.000199899755874426, 'samples': 743456, 'steps': 1452, 'loss/train': 3.209397792816162} -09/20/2021 19:31:07 - INFO - __main__ - Step 23234: {'lr': 0.000199899755874426, 'samples': 743488, 'steps': 1452, 'loss/train': 3.3308138847351074} -09/20/2021 19:31:08 - INFO - __main__ - Step 23235: {'lr': 0.000199899755874426, 'samples': 743520, 'steps': 1452, 'loss/train': 2.871039628982544} -09/20/2021 19:31:09 - INFO - __main__ - Step 23236: {'lr': 0.000199899755874426, 'samples': 743552, 'steps': 1452, 'loss/train': 2.2940824031829834} -09/20/2021 19:31:10 - INFO - __main__ - Step 23237: {'lr': 0.000199899755874426, 'samples': 743584, 'steps': 1452, 'loss/train': 2.7489330768585205} -09/20/2021 19:31:10 - INFO - __main__ - Step 23238: {'lr': 0.000199899755874426, 'samples': 743616, 'steps': 1452, 'loss/train': 3.3303110599517822} -09/20/2021 19:31:11 - INFO - __main__ - Step 23239: {'lr': 0.000199899755874426, 'samples': 743648, 'steps': 1452, 'loss/train': 4.046963691711426} -09/20/2021 19:31:12 - INFO - __main__ - Step 23240: {'lr': 0.000199899755874426, 'samples': 743680, 'steps': 1452, 'loss/train': 2.759213447570801} -09/20/2021 19:31:13 - INFO - __main__ - Step 23241: {'lr': 0.000199899755874426, 'samples': 743712, 'steps': 1452, 'loss/train': 4.459073543548584} -09/20/2021 19:31:13 - INFO - __main__ - Step 23242: {'lr': 0.000199899755874426, 'samples': 743744, 'steps': 1452, 'loss/train': 2.2715001106262207} -09/20/2021 19:31:14 - INFO - __main__ - Step 23243: {'lr': 0.000199899755874426, 'samples': 743776, 'steps': 1452, 'loss/train': 4.032297611236572} -09/20/2021 19:31:15 - INFO - __main__ - Step 23244: {'lr': 0.000199899755874426, 'samples': 743808, 'steps': 1452, 'loss/train': 3.428955316543579} -09/20/2021 19:31:16 - INFO - __main__ - Step 23245: {'lr': 0.000199899755874426, 'samples': 743840, 'steps': 1452, 'loss/train': 2.410829782485962} -09/20/2021 19:31:16 - INFO - __main__ - Step 23246: {'lr': 0.000199899755874426, 'samples': 743872, 'steps': 1452, 'loss/train': 2.8788084983825684} -09/20/2021 19:31:17 - INFO - __main__ - Step 23247: {'lr': 0.000199899755874426, 'samples': 743904, 'steps': 1452, 'loss/train': 3.513315200805664} -09/20/2021 19:31:18 - INFO - __main__ - Step 23248: {'lr': 0.000199899755874426, 'samples': 743936, 'steps': 1452, 'loss/train': 2.644437074661255} -09/20/2021 19:31:19 - INFO - __main__ - Step 23249: {'lr': 0.00019989947012310607, 'samples': 743968, 'steps': 1453, 'loss/train': 4.252246856689453} -09/20/2021 19:31:20 - INFO - __main__ - Step 23250: {'lr': 0.00019989947012310607, 'samples': 744000, 'steps': 1453, 'loss/train': 3.3013827800750732} -09/20/2021 19:31:21 - INFO - __main__ - Step 23251: {'lr': 0.00019989947012310607, 'samples': 744032, 'steps': 1453, 'loss/train': 3.513434648513794} -09/20/2021 19:31:21 - INFO - __main__ - Step 23252: {'lr': 0.00019989947012310607, 'samples': 744064, 'steps': 1453, 'loss/train': 3.095150947570801} -09/20/2021 19:31:22 - INFO - __main__ - Step 23253: {'lr': 0.00019989947012310607, 'samples': 744096, 'steps': 1453, 'loss/train': 3.9690139293670654} -09/20/2021 19:31:23 - INFO - __main__ - Step 23254: {'lr': 0.00019989947012310607, 'samples': 744128, 'steps': 1453, 'loss/train': 3.4037885665893555} -09/20/2021 19:31:24 - INFO - __main__ - Step 23255: {'lr': 0.00019989947012310607, 'samples': 744160, 'steps': 1453, 'loss/train': 2.5106446743011475} -09/20/2021 19:31:24 - INFO - __main__ - Step 23256: {'lr': 0.00019989947012310607, 'samples': 744192, 'steps': 1453, 'loss/train': 2.4337825775146484} -09/20/2021 19:31:25 - INFO - __main__ - Step 23257: {'lr': 0.00019989947012310607, 'samples': 744224, 'steps': 1453, 'loss/train': 3.414647102355957} -09/20/2021 19:31:26 - INFO - __main__ - Step 23258: {'lr': 0.00019989947012310607, 'samples': 744256, 'steps': 1453, 'loss/train': 3.134803056716919} -09/20/2021 19:31:27 - INFO - __main__ - Step 23259: {'lr': 0.00019989947012310607, 'samples': 744288, 'steps': 1453, 'loss/train': 3.1056721210479736} -09/20/2021 19:31:27 - INFO - __main__ - Step 23260: {'lr': 0.00019989947012310607, 'samples': 744320, 'steps': 1453, 'loss/train': 3.0103025436401367} -09/20/2021 19:31:28 - INFO - __main__ - Step 23261: {'lr': 0.00019989947012310607, 'samples': 744352, 'steps': 1453, 'loss/train': 2.670966863632202} -09/20/2021 19:31:29 - INFO - __main__ - Step 23262: {'lr': 0.00019989947012310607, 'samples': 744384, 'steps': 1453, 'loss/train': 2.5144360065460205} -09/20/2021 19:31:30 - INFO - __main__ - Step 23263: {'lr': 0.00019989947012310607, 'samples': 744416, 'steps': 1453, 'loss/train': 3.383819580078125} -09/20/2021 19:31:30 - INFO - __main__ - Step 23264: {'lr': 0.00019989947012310607, 'samples': 744448, 'steps': 1453, 'loss/train': 2.8873209953308105} -09/20/2021 19:31:31 - INFO - __main__ - Step 23265: {'lr': 0.00019989918396529554, 'samples': 744480, 'steps': 1454, 'loss/train': 3.57475209236145} -09/20/2021 19:31:32 - INFO - __main__ - Step 23266: {'lr': 0.00019989918396529554, 'samples': 744512, 'steps': 1454, 'loss/train': 2.212167739868164} -09/20/2021 19:31:33 - INFO - __main__ - Step 23267: {'lr': 0.00019989918396529554, 'samples': 744544, 'steps': 1454, 'loss/train': 3.0823678970336914} -09/20/2021 19:31:34 - INFO - __main__ - Step 23268: {'lr': 0.00019989918396529554, 'samples': 744576, 'steps': 1454, 'loss/train': 2.427225351333618} -09/20/2021 19:31:34 - INFO - __main__ - Step 23269: {'lr': 0.00019989918396529554, 'samples': 744608, 'steps': 1454, 'loss/train': 0.9535689949989319} -09/20/2021 19:31:35 - INFO - __main__ - Step 23270: {'lr': 0.00019989918396529554, 'samples': 744640, 'steps': 1454, 'loss/train': 2.877133369445801} -09/20/2021 19:31:36 - INFO - __main__ - Step 23271: {'lr': 0.00019989918396529554, 'samples': 744672, 'steps': 1454, 'loss/train': 3.6693825721740723} -09/20/2021 19:31:37 - INFO - __main__ - Step 23272: {'lr': 0.00019989918396529554, 'samples': 744704, 'steps': 1454, 'loss/train': 3.661372423171997} -09/20/2021 19:31:37 - INFO - __main__ - Step 23273: {'lr': 0.00019989918396529554, 'samples': 744736, 'steps': 1454, 'loss/train': 2.9355359077453613} -09/20/2021 19:31:38 - INFO - __main__ - Step 23274: {'lr': 0.00019989918396529554, 'samples': 744768, 'steps': 1454, 'loss/train': 3.3565139770507812} -09/20/2021 19:31:39 - INFO - __main__ - Step 23275: {'lr': 0.00019989918396529554, 'samples': 744800, 'steps': 1454, 'loss/train': 3.583503484725952} -09/20/2021 19:31:40 - INFO - __main__ - Step 23276: {'lr': 0.00019989918396529554, 'samples': 744832, 'steps': 1454, 'loss/train': 3.460310697555542} -09/20/2021 19:31:40 - INFO - __main__ - Step 23277: {'lr': 0.00019989918396529554, 'samples': 744864, 'steps': 1454, 'loss/train': 3.194216728210449} -09/20/2021 19:31:41 - INFO - __main__ - Step 23278: {'lr': 0.00019989918396529554, 'samples': 744896, 'steps': 1454, 'loss/train': 2.700927972793579} -09/20/2021 19:31:42 - INFO - __main__ - Step 23279: {'lr': 0.00019989918396529554, 'samples': 744928, 'steps': 1454, 'loss/train': 3.022294759750366} -09/20/2021 19:31:43 - INFO - __main__ - Step 23280: {'lr': 0.00019989918396529554, 'samples': 744960, 'steps': 1454, 'loss/train': 3.105560779571533} -09/20/2021 19:31:44 - INFO - __main__ - Step 23281: {'lr': 0.00019989889740099567, 'samples': 744992, 'steps': 1455, 'loss/train': 1.1589019298553467} -09/20/2021 19:31:45 - INFO - __main__ - Step 23282: {'lr': 0.00019989889740099567, 'samples': 745024, 'steps': 1455, 'loss/train': 2.3474130630493164} -09/20/2021 19:31:46 - INFO - __main__ - Step 23283: {'lr': 0.00019989889740099567, 'samples': 745056, 'steps': 1455, 'loss/train': 3.258859634399414} -09/20/2021 19:31:46 - INFO - __main__ - Step 23284: {'lr': 0.00019989889740099567, 'samples': 745088, 'steps': 1455, 'loss/train': 2.746797561645508} -09/20/2021 19:31:47 - INFO - __main__ - Step 23285: {'lr': 0.00019989889740099567, 'samples': 745120, 'steps': 1455, 'loss/train': 2.4801368713378906} -09/20/2021 19:31:48 - INFO - __main__ - Step 23286: {'lr': 0.00019989889740099567, 'samples': 745152, 'steps': 1455, 'loss/train': 3.4872214794158936} -09/20/2021 19:31:49 - INFO - __main__ - Step 23287: {'lr': 0.00019989889740099567, 'samples': 745184, 'steps': 1455, 'loss/train': 3.0579352378845215} -09/20/2021 19:31:49 - INFO - __main__ - Step 23288: {'lr': 0.00019989889740099567, 'samples': 745216, 'steps': 1455, 'loss/train': 2.731520652770996} -09/20/2021 19:31:50 - INFO - __main__ - Step 23289: {'lr': 0.00019989889740099567, 'samples': 745248, 'steps': 1455, 'loss/train': 3.8526899814605713} -09/20/2021 19:31:51 - INFO - __main__ - Step 23290: {'lr': 0.00019989889740099567, 'samples': 745280, 'steps': 1455, 'loss/train': 1.7952325344085693} -09/20/2021 19:31:52 - INFO - __main__ - Step 23291: {'lr': 0.00019989889740099567, 'samples': 745312, 'steps': 1455, 'loss/train': 2.8824586868286133} -09/20/2021 19:31:52 - INFO - __main__ - Step 23292: {'lr': 0.00019989889740099567, 'samples': 745344, 'steps': 1455, 'loss/train': 3.7149691581726074} -09/20/2021 19:31:53 - INFO - __main__ - Step 23293: {'lr': 0.00019989889740099567, 'samples': 745376, 'steps': 1455, 'loss/train': 3.3064939975738525} -09/20/2021 19:31:54 - INFO - __main__ - Step 23294: {'lr': 0.00019989889740099567, 'samples': 745408, 'steps': 1455, 'loss/train': 3.3421876430511475} -09/20/2021 19:31:55 - INFO - __main__ - Step 23295: {'lr': 0.00019989889740099567, 'samples': 745440, 'steps': 1455, 'loss/train': 3.6445391178131104} -09/20/2021 19:31:55 - INFO - __main__ - Step 23296: {'lr': 0.00019989889740099567, 'samples': 745472, 'steps': 1455, 'loss/train': 2.001143455505371} -09/20/2021 19:31:56 - INFO - __main__ - Step 23297: {'lr': 0.00019989861043020752, 'samples': 745504, 'steps': 1456, 'loss/train': 1.8906623125076294} -09/20/2021 19:31:57 - INFO - __main__ - Step 23298: {'lr': 0.00019989861043020752, 'samples': 745536, 'steps': 1456, 'loss/train': 2.5314831733703613} -09/20/2021 19:31:58 - INFO - __main__ - Step 23299: {'lr': 0.00019989861043020752, 'samples': 745568, 'steps': 1456, 'loss/train': 2.8830275535583496} -09/20/2021 19:31:58 - INFO - __main__ - Step 23300: {'lr': 0.00019989861043020752, 'samples': 745600, 'steps': 1456, 'loss/train': 4.023322105407715} -09/20/2021 19:31:59 - INFO - __main__ - Step 23301: {'lr': 0.00019989861043020752, 'samples': 745632, 'steps': 1456, 'loss/train': 2.8038933277130127} -09/20/2021 19:32:00 - INFO - __main__ - Step 23302: {'lr': 0.00019989861043020752, 'samples': 745664, 'steps': 1456, 'loss/train': 2.8027329444885254} -09/20/2021 19:32:01 - INFO - __main__ - Step 23303: {'lr': 0.00019989861043020752, 'samples': 745696, 'steps': 1456, 'loss/train': 3.193660259246826} -09/20/2021 19:32:01 - INFO - __main__ - Step 23304: {'lr': 0.00019989861043020752, 'samples': 745728, 'steps': 1456, 'loss/train': 2.5711092948913574} -09/20/2021 19:32:02 - INFO - __main__ - Step 23305: {'lr': 0.00019989861043020752, 'samples': 745760, 'steps': 1456, 'loss/train': 2.78718638420105} -09/20/2021 19:32:03 - INFO - __main__ - Step 23306: {'lr': 0.00019989861043020752, 'samples': 745792, 'steps': 1456, 'loss/train': 3.403688669204712} -09/20/2021 19:32:04 - INFO - __main__ - Step 23307: {'lr': 0.00019989861043020752, 'samples': 745824, 'steps': 1456, 'loss/train': 2.336919069290161} -09/20/2021 19:32:04 - INFO - __main__ - Step 23308: {'lr': 0.00019989861043020752, 'samples': 745856, 'steps': 1456, 'loss/train': 2.5873615741729736} -09/20/2021 19:32:05 - INFO - __main__ - Step 23309: {'lr': 0.00019989861043020752, 'samples': 745888, 'steps': 1456, 'loss/train': 0.9502819776535034} -09/20/2021 19:32:06 - INFO - __main__ - Step 23310: {'lr': 0.00019989861043020752, 'samples': 745920, 'steps': 1456, 'loss/train': 3.6341934204101562} -09/20/2021 19:32:08 - INFO - __main__ - Step 23311: {'lr': 0.00019989861043020752, 'samples': 745952, 'steps': 1456, 'loss/train': 3.317528247833252} -09/20/2021 19:32:08 - INFO - __main__ - Step 23312: {'lr': 0.00019989861043020752, 'samples': 745984, 'steps': 1456, 'loss/train': 2.279033899307251} -09/20/2021 19:32:09 - INFO - __main__ - Step 23313: {'lr': 0.00019989832305293234, 'samples': 746016, 'steps': 1457, 'loss/train': 2.682840585708618} -09/20/2021 19:32:10 - INFO - __main__ - Step 23314: {'lr': 0.00019989832305293234, 'samples': 746048, 'steps': 1457, 'loss/train': 3.7714006900787354} -09/20/2021 19:32:11 - INFO - __main__ - Step 23315: {'lr': 0.00019989832305293234, 'samples': 746080, 'steps': 1457, 'loss/train': 3.8799490928649902} -09/20/2021 19:32:12 - INFO - __main__ - Step 23316: {'lr': 0.00019989832305293234, 'samples': 746112, 'steps': 1457, 'loss/train': 3.6220924854278564} -09/20/2021 19:32:12 - INFO - __main__ - Step 23317: {'lr': 0.00019989832305293234, 'samples': 746144, 'steps': 1457, 'loss/train': 2.609819173812866} -09/20/2021 19:32:13 - INFO - __main__ - Step 23318: {'lr': 0.00019989832305293234, 'samples': 746176, 'steps': 1457, 'loss/train': 3.2042386531829834} -09/20/2021 19:32:14 - INFO - __main__ - Step 23319: {'lr': 0.00019989832305293234, 'samples': 746208, 'steps': 1457, 'loss/train': 3.8062424659729004} -09/20/2021 19:32:15 - INFO - __main__ - Step 23320: {'lr': 0.00019989832305293234, 'samples': 746240, 'steps': 1457, 'loss/train': 3.1521430015563965} -09/20/2021 19:32:15 - INFO - __main__ - Step 23321: {'lr': 0.00019989832305293234, 'samples': 746272, 'steps': 1457, 'loss/train': 2.805535078048706} -09/20/2021 19:32:16 - INFO - __main__ - Step 23322: {'lr': 0.00019989832305293234, 'samples': 746304, 'steps': 1457, 'loss/train': 3.1958441734313965} -09/20/2021 19:32:17 - INFO - __main__ - Step 23323: {'lr': 0.00019989832305293234, 'samples': 746336, 'steps': 1457, 'loss/train': 3.5534284114837646} -09/20/2021 19:32:18 - INFO - __main__ - Step 23324: {'lr': 0.00019989832305293234, 'samples': 746368, 'steps': 1457, 'loss/train': 3.557873010635376} -09/20/2021 19:32:18 - INFO - __main__ - Step 23325: {'lr': 0.00019989832305293234, 'samples': 746400, 'steps': 1457, 'loss/train': 2.534092664718628} -09/20/2021 19:32:19 - INFO - __main__ - Step 23326: {'lr': 0.00019989832305293234, 'samples': 746432, 'steps': 1457, 'loss/train': 2.7540528774261475} -09/20/2021 19:32:20 - INFO - __main__ - Step 23327: {'lr': 0.00019989832305293234, 'samples': 746464, 'steps': 1457, 'loss/train': 2.9780173301696777} -09/20/2021 19:32:21 - INFO - __main__ - Step 23328: {'lr': 0.00019989832305293234, 'samples': 746496, 'steps': 1457, 'loss/train': 2.8938140869140625} -09/20/2021 19:32:21 - INFO - __main__ - Step 23329: {'lr': 0.00019989803526917127, 'samples': 746528, 'steps': 1458, 'loss/train': 4.0270514488220215} -09/20/2021 19:32:22 - INFO - __main__ - Step 23330: {'lr': 0.00019989803526917127, 'samples': 746560, 'steps': 1458, 'loss/train': 3.6055479049682617} -09/20/2021 19:32:23 - INFO - __main__ - Step 23331: {'lr': 0.00019989803526917127, 'samples': 746592, 'steps': 1458, 'loss/train': 3.963144540786743} -09/20/2021 19:32:24 - INFO - __main__ - Step 23332: {'lr': 0.00019989803526917127, 'samples': 746624, 'steps': 1458, 'loss/train': 2.986470937728882} -09/20/2021 19:32:24 - INFO - __main__ - Step 23333: {'lr': 0.00019989803526917127, 'samples': 746656, 'steps': 1458, 'loss/train': 3.807863712310791} -09/20/2021 19:32:25 - INFO - __main__ - Step 23334: {'lr': 0.00019989803526917127, 'samples': 746688, 'steps': 1458, 'loss/train': 3.2833635807037354} -09/20/2021 19:32:26 - INFO - __main__ - Step 23335: {'lr': 0.00019989803526917127, 'samples': 746720, 'steps': 1458, 'loss/train': 3.4602558612823486} -09/20/2021 19:32:27 - INFO - __main__ - Step 23336: {'lr': 0.00019989803526917127, 'samples': 746752, 'steps': 1458, 'loss/train': 3.5969507694244385} -09/20/2021 19:32:27 - INFO - __main__ - Step 23337: {'lr': 0.00019989803526917127, 'samples': 746784, 'steps': 1458, 'loss/train': 3.0024304389953613} -09/20/2021 19:32:28 - INFO - __main__ - Step 23338: {'lr': 0.00019989803526917127, 'samples': 746816, 'steps': 1458, 'loss/train': 3.236968517303467} -09/20/2021 19:32:29 - INFO - __main__ - Step 23339: {'lr': 0.00019989803526917127, 'samples': 746848, 'steps': 1458, 'loss/train': 1.9969438314437866} -09/20/2021 19:32:30 - INFO - __main__ - Step 23340: {'lr': 0.00019989803526917127, 'samples': 746880, 'steps': 1458, 'loss/train': 3.475278854370117} -09/20/2021 19:32:30 - INFO - __main__ - Step 23341: {'lr': 0.00019989803526917127, 'samples': 746912, 'steps': 1458, 'loss/train': 3.0053298473358154} -09/20/2021 19:32:32 - INFO - __main__ - Step 23342: {'lr': 0.00019989803526917127, 'samples': 746944, 'steps': 1458, 'loss/train': 3.3719537258148193} -09/20/2021 19:32:32 - INFO - __main__ - Step 23343: {'lr': 0.00019989803526917127, 'samples': 746976, 'steps': 1458, 'loss/train': 2.9265904426574707} -09/20/2021 19:32:33 - INFO - __main__ - Step 23344: {'lr': 0.00019989803526917127, 'samples': 747008, 'steps': 1458, 'loss/train': 2.3656342029571533} -09/20/2021 19:32:34 - INFO - __main__ - Step 23345: {'lr': 0.00019989774707892548, 'samples': 747040, 'steps': 1459, 'loss/train': 3.183706283569336} -09/20/2021 19:32:35 - INFO - __main__ - Step 23346: {'lr': 0.00019989774707892548, 'samples': 747072, 'steps': 1459, 'loss/train': 3.5283727645874023} -09/20/2021 19:32:36 - INFO - __main__ - Step 23347: {'lr': 0.00019989774707892548, 'samples': 747104, 'steps': 1459, 'loss/train': 2.7911646366119385} -09/20/2021 19:32:36 - INFO - __main__ - Step 23348: {'lr': 0.00019989774707892548, 'samples': 747136, 'steps': 1459, 'loss/train': 2.722273826599121} -09/20/2021 19:32:37 - INFO - __main__ - Step 23349: {'lr': 0.00019989774707892548, 'samples': 747168, 'steps': 1459, 'loss/train': 2.9130635261535645} -09/20/2021 19:32:38 - INFO - __main__ - Step 23350: {'lr': 0.00019989774707892548, 'samples': 747200, 'steps': 1459, 'loss/train': 2.002856969833374} -09/20/2021 19:32:39 - INFO - __main__ - Step 23351: {'lr': 0.00019989774707892548, 'samples': 747232, 'steps': 1459, 'loss/train': 3.0358335971832275} -09/20/2021 19:32:39 - INFO - __main__ - Step 23352: {'lr': 0.00019989774707892548, 'samples': 747264, 'steps': 1459, 'loss/train': 3.343398094177246} -09/20/2021 19:32:40 - INFO - __main__ - Step 23353: {'lr': 0.00019989774707892548, 'samples': 747296, 'steps': 1459, 'loss/train': 3.4782791137695312} -09/20/2021 19:32:41 - INFO - __main__ - Step 23354: {'lr': 0.00019989774707892548, 'samples': 747328, 'steps': 1459, 'loss/train': 4.1121673583984375} -09/20/2021 19:32:42 - INFO - __main__ - Step 23355: {'lr': 0.00019989774707892548, 'samples': 747360, 'steps': 1459, 'loss/train': 3.0957696437835693} -09/20/2021 19:32:42 - INFO - __main__ - Step 23356: {'lr': 0.00019989774707892548, 'samples': 747392, 'steps': 1459, 'loss/train': 2.329000473022461} -09/20/2021 19:32:43 - INFO - __main__ - Step 23357: {'lr': 0.00019989774707892548, 'samples': 747424, 'steps': 1459, 'loss/train': 3.007551431655884} -09/20/2021 19:32:44 - INFO - __main__ - Step 23358: {'lr': 0.00019989774707892548, 'samples': 747456, 'steps': 1459, 'loss/train': 2.398023843765259} -09/20/2021 19:32:45 - INFO - __main__ - Step 23359: {'lr': 0.00019989774707892548, 'samples': 747488, 'steps': 1459, 'loss/train': 2.9921231269836426} -09/20/2021 19:32:45 - INFO - __main__ - Step 23360: {'lr': 0.00019989774707892548, 'samples': 747520, 'steps': 1459, 'loss/train': 3.6353771686553955} -09/20/2021 19:32:46 - INFO - __main__ - Step 23361: {'lr': 0.00019989745848219615, 'samples': 747552, 'steps': 1460, 'loss/train': 2.253345012664795} -09/20/2021 19:32:47 - INFO - __main__ - Step 23362: {'lr': 0.00019989745848219615, 'samples': 747584, 'steps': 1460, 'loss/train': 2.3091611862182617} -09/20/2021 19:32:48 - INFO - __main__ - Step 23363: {'lr': 0.00019989745848219615, 'samples': 747616, 'steps': 1460, 'loss/train': 3.6922833919525146} -09/20/2021 19:32:49 - INFO - __main__ - Step 23364: {'lr': 0.00019989745848219615, 'samples': 747648, 'steps': 1460, 'loss/train': 2.079418897628784} -09/20/2021 19:32:49 - INFO - __main__ - Step 23365: {'lr': 0.00019989745848219615, 'samples': 747680, 'steps': 1460, 'loss/train': 5.568918228149414} -09/20/2021 19:32:50 - INFO - __main__ - Step 23366: {'lr': 0.00019989745848219615, 'samples': 747712, 'steps': 1460, 'loss/train': 3.6379895210266113} -09/20/2021 19:32:51 - INFO - __main__ - Step 23367: {'lr': 0.00019989745848219615, 'samples': 747744, 'steps': 1460, 'loss/train': 3.437079906463623} -09/20/2021 19:32:52 - INFO - __main__ - Step 23368: {'lr': 0.00019989745848219615, 'samples': 747776, 'steps': 1460, 'loss/train': 3.4485671520233154} -09/20/2021 19:32:52 - INFO - __main__ - Step 23369: {'lr': 0.00019989745848219615, 'samples': 747808, 'steps': 1460, 'loss/train': 3.5582823753356934} -09/20/2021 19:32:53 - INFO - __main__ - Step 23370: {'lr': 0.00019989745848219615, 'samples': 747840, 'steps': 1460, 'loss/train': 1.861120581626892} -09/20/2021 19:32:54 - INFO - __main__ - Step 23371: {'lr': 0.00019989745848219615, 'samples': 747872, 'steps': 1460, 'loss/train': 3.5918784141540527} -09/20/2021 19:32:55 - INFO - __main__ - Step 23372: {'lr': 0.00019989745848219615, 'samples': 747904, 'steps': 1460, 'loss/train': 2.803647041320801} -09/20/2021 19:32:56 - INFO - __main__ - Step 23373: {'lr': 0.00019989745848219615, 'samples': 747936, 'steps': 1460, 'loss/train': 3.082669734954834} -09/20/2021 19:32:57 - INFO - __main__ - Step 23374: {'lr': 0.00019989745848219615, 'samples': 747968, 'steps': 1460, 'loss/train': 2.8995566368103027} -09/20/2021 19:32:57 - INFO - __main__ - Step 23375: {'lr': 0.00019989745848219615, 'samples': 748000, 'steps': 1460, 'loss/train': 3.6352896690368652} -09/20/2021 19:32:58 - INFO - __main__ - Step 23376: {'lr': 0.00019989745848219615, 'samples': 748032, 'steps': 1460, 'loss/train': 2.5156357288360596} -09/20/2021 19:32:59 - INFO - __main__ - Step 23377: {'lr': 0.00019989716947898444, 'samples': 748064, 'steps': 1461, 'loss/train': 2.284162998199463} -09/20/2021 19:33:00 - INFO - __main__ - Step 23378: {'lr': 0.00019989716947898444, 'samples': 748096, 'steps': 1461, 'loss/train': 2.639056921005249} -09/20/2021 19:33:01 - INFO - __main__ - Step 23379: {'lr': 0.00019989716947898444, 'samples': 748128, 'steps': 1461, 'loss/train': 4.534629821777344} -09/20/2021 19:33:01 - INFO - __main__ - Step 23380: {'lr': 0.00019989716947898444, 'samples': 748160, 'steps': 1461, 'loss/train': 2.9566149711608887} -09/20/2021 19:33:02 - INFO - __main__ - Step 23381: {'lr': 0.00019989716947898444, 'samples': 748192, 'steps': 1461, 'loss/train': 3.470625877380371} -09/20/2021 19:33:03 - INFO - __main__ - Step 23382: {'lr': 0.00019989716947898444, 'samples': 748224, 'steps': 1461, 'loss/train': 2.7497103214263916} -09/20/2021 19:33:04 - INFO - __main__ - Step 23383: {'lr': 0.00019989716947898444, 'samples': 748256, 'steps': 1461, 'loss/train': 3.6950325965881348} -09/20/2021 19:33:04 - INFO - __main__ - Step 23384: {'lr': 0.00019989716947898444, 'samples': 748288, 'steps': 1461, 'loss/train': 3.5912468433380127} -09/20/2021 19:33:05 - INFO - __main__ - Step 23385: {'lr': 0.00019989716947898444, 'samples': 748320, 'steps': 1461, 'loss/train': 2.81785249710083} -09/20/2021 19:33:06 - INFO - __main__ - Step 23386: {'lr': 0.00019989716947898444, 'samples': 748352, 'steps': 1461, 'loss/train': 2.8446764945983887} -09/20/2021 19:33:07 - INFO - __main__ - Step 23387: {'lr': 0.00019989716947898444, 'samples': 748384, 'steps': 1461, 'loss/train': 3.4071497917175293} -09/20/2021 19:33:07 - INFO - __main__ - Step 23388: {'lr': 0.00019989716947898444, 'samples': 748416, 'steps': 1461, 'loss/train': 3.8542985916137695} -09/20/2021 19:33:08 - INFO - __main__ - Step 23389: {'lr': 0.00019989716947898444, 'samples': 748448, 'steps': 1461, 'loss/train': 4.508871555328369} -09/20/2021 19:33:09 - INFO - __main__ - Step 23390: {'lr': 0.00019989716947898444, 'samples': 748480, 'steps': 1461, 'loss/train': 2.4680466651916504} -09/20/2021 19:33:10 - INFO - __main__ - Step 23391: {'lr': 0.00019989716947898444, 'samples': 748512, 'steps': 1461, 'loss/train': 2.5327768325805664} -09/20/2021 19:33:10 - INFO - __main__ - Step 23392: {'lr': 0.00019989716947898444, 'samples': 748544, 'steps': 1461, 'loss/train': 4.852382659912109} -09/20/2021 19:33:11 - INFO - __main__ - Step 23393: {'lr': 0.00019989688006929156, 'samples': 748576, 'steps': 1462, 'loss/train': 5.273799896240234} -09/20/2021 19:33:12 - INFO - __main__ - Step 23394: {'lr': 0.00019989688006929156, 'samples': 748608, 'steps': 1462, 'loss/train': 5.248232364654541} -09/20/2021 19:33:13 - INFO - __main__ - Step 23395: {'lr': 0.00019989688006929156, 'samples': 748640, 'steps': 1462, 'loss/train': 5.669435977935791} -09/20/2021 19:33:13 - INFO - __main__ - Step 23396: {'lr': 0.00019989688006929156, 'samples': 748672, 'steps': 1462, 'loss/train': 4.5693464279174805} -09/20/2021 19:33:14 - INFO - __main__ - Step 23397: {'lr': 0.00019989688006929156, 'samples': 748704, 'steps': 1462, 'loss/train': 4.033482074737549} -09/20/2021 19:33:15 - INFO - __main__ - Step 23398: {'lr': 0.00019989688006929156, 'samples': 748736, 'steps': 1462, 'loss/train': 2.0416598320007324} -09/20/2021 19:33:16 - INFO - __main__ - Step 23399: {'lr': 0.00019989688006929156, 'samples': 748768, 'steps': 1462, 'loss/train': 3.4260342121124268} -09/20/2021 19:33:16 - INFO - __main__ - Step 23400: {'lr': 0.00019989688006929156, 'samples': 748800, 'steps': 1462, 'loss/train': 2.999774217605591} -09/20/2021 19:33:17 - INFO - __main__ - Step 23401: {'lr': 0.00019989688006929156, 'samples': 748832, 'steps': 1462, 'loss/train': 2.9747064113616943} -09/20/2021 19:33:18 - INFO - __main__ - Step 23402: {'lr': 0.00019989688006929156, 'samples': 748864, 'steps': 1462, 'loss/train': 2.654301881790161} -09/20/2021 19:33:19 - INFO - __main__ - Step 23403: {'lr': 0.00019989688006929156, 'samples': 748896, 'steps': 1462, 'loss/train': 2.1782896518707275} -09/20/2021 19:33:20 - INFO - __main__ - Step 23404: {'lr': 0.00019989688006929156, 'samples': 748928, 'steps': 1462, 'loss/train': 2.6932318210601807} -09/20/2021 19:33:21 - INFO - __main__ - Step 23405: {'lr': 0.00019989688006929156, 'samples': 748960, 'steps': 1462, 'loss/train': 3.03009033203125} -09/20/2021 19:33:21 - INFO - __main__ - Step 23406: {'lr': 0.00019989688006929156, 'samples': 748992, 'steps': 1462, 'loss/train': 3.494823694229126} -09/20/2021 19:33:22 - INFO - __main__ - Step 23407: {'lr': 0.00019989688006929156, 'samples': 749024, 'steps': 1462, 'loss/train': 3.599163055419922} -09/20/2021 19:33:23 - INFO - __main__ - Step 23408: {'lr': 0.00019989688006929156, 'samples': 749056, 'steps': 1462, 'loss/train': 2.705191135406494} -09/20/2021 19:33:24 - INFO - __main__ - Step 23409: {'lr': 0.00019989659025311862, 'samples': 749088, 'steps': 1463, 'loss/train': 3.4028310775756836} -09/20/2021 19:33:25 - INFO - __main__ - Step 23410: {'lr': 0.00019989659025311862, 'samples': 749120, 'steps': 1463, 'loss/train': 2.9886322021484375} -09/20/2021 19:33:25 - INFO - __main__ - Step 23411: {'lr': 0.00019989659025311862, 'samples': 749152, 'steps': 1463, 'loss/train': 2.1905107498168945} -09/20/2021 19:33:26 - INFO - __main__ - Step 23412: {'lr': 0.00019989659025311862, 'samples': 749184, 'steps': 1463, 'loss/train': 3.0752179622650146} -09/20/2021 19:33:27 - INFO - __main__ - Step 23413: {'lr': 0.00019989659025311862, 'samples': 749216, 'steps': 1463, 'loss/train': 3.3114163875579834} -09/20/2021 19:33:28 - INFO - __main__ - Step 23414: {'lr': 0.00019989659025311862, 'samples': 749248, 'steps': 1463, 'loss/train': 3.725785970687866} -09/20/2021 19:33:28 - INFO - __main__ - Step 23415: {'lr': 0.00019989659025311862, 'samples': 749280, 'steps': 1463, 'loss/train': 2.899712562561035} -09/20/2021 19:33:29 - INFO - __main__ - Step 23416: {'lr': 0.00019989659025311862, 'samples': 749312, 'steps': 1463, 'loss/train': 2.1703972816467285} -09/20/2021 19:33:30 - INFO - __main__ - Step 23417: {'lr': 0.00019989659025311862, 'samples': 749344, 'steps': 1463, 'loss/train': 2.827047824859619} -09/20/2021 19:33:31 - INFO - __main__ - Step 23418: {'lr': 0.00019989659025311862, 'samples': 749376, 'steps': 1463, 'loss/train': 2.7328310012817383} -09/20/2021 19:33:31 - INFO - __main__ - Step 23419: {'lr': 0.00019989659025311862, 'samples': 749408, 'steps': 1463, 'loss/train': 2.733506679534912} -09/20/2021 19:33:32 - INFO - __main__ - Step 23420: {'lr': 0.00019989659025311862, 'samples': 749440, 'steps': 1463, 'loss/train': 2.9419806003570557} -09/20/2021 19:33:33 - INFO - __main__ - Step 23421: {'lr': 0.00019989659025311862, 'samples': 749472, 'steps': 1463, 'loss/train': 2.883941650390625} -09/20/2021 19:33:34 - INFO - __main__ - Step 23422: {'lr': 0.00019989659025311862, 'samples': 749504, 'steps': 1463, 'loss/train': 3.325993537902832} -09/20/2021 19:33:34 - INFO - __main__ - Step 23423: {'lr': 0.00019989659025311862, 'samples': 749536, 'steps': 1463, 'loss/train': 3.105638265609741} -09/20/2021 19:33:35 - INFO - __main__ - Step 23424: {'lr': 0.00019989659025311862, 'samples': 749568, 'steps': 1463, 'loss/train': 2.439582109451294} -09/20/2021 19:33:36 - INFO - __main__ - Step 23425: {'lr': 0.00019989630003046686, 'samples': 749600, 'steps': 1464, 'loss/train': 3.3586654663085938} -09/20/2021 19:33:37 - INFO - __main__ - Step 23426: {'lr': 0.00019989630003046686, 'samples': 749632, 'steps': 1464, 'loss/train': 3.986137628555298} -09/20/2021 19:33:38 - INFO - __main__ - Step 23427: {'lr': 0.00019989630003046686, 'samples': 749664, 'steps': 1464, 'loss/train': 3.0760385990142822} -09/20/2021 19:33:38 - INFO - __main__ - Step 23428: {'lr': 0.00019989630003046686, 'samples': 749696, 'steps': 1464, 'loss/train': 3.2233340740203857} -09/20/2021 19:33:39 - INFO - __main__ - Step 23429: {'lr': 0.00019989630003046686, 'samples': 749728, 'steps': 1464, 'loss/train': 2.3871428966522217} -09/20/2021 19:33:40 - INFO - __main__ - Step 23430: {'lr': 0.00019989630003046686, 'samples': 749760, 'steps': 1464, 'loss/train': 3.331556558609009} -09/20/2021 19:33:41 - INFO - __main__ - Step 23431: {'lr': 0.00019989630003046686, 'samples': 749792, 'steps': 1464, 'loss/train': 2.4633772373199463} -09/20/2021 19:33:41 - INFO - __main__ - Step 23432: {'lr': 0.00019989630003046686, 'samples': 749824, 'steps': 1464, 'loss/train': 2.87790584564209} -09/20/2021 19:33:42 - INFO - __main__ - Step 23433: {'lr': 0.00019989630003046686, 'samples': 749856, 'steps': 1464, 'loss/train': 3.007294178009033} -09/20/2021 19:33:43 - INFO - __main__ - Step 23434: {'lr': 0.00019989630003046686, 'samples': 749888, 'steps': 1464, 'loss/train': 2.0749638080596924} -09/20/2021 19:33:44 - INFO - __main__ - Step 23435: {'lr': 0.00019989630003046686, 'samples': 749920, 'steps': 1464, 'loss/train': 2.9631729125976562} -09/20/2021 19:33:45 - INFO - __main__ - Step 23436: {'lr': 0.00019989630003046686, 'samples': 749952, 'steps': 1464, 'loss/train': 3.2515735626220703} -09/20/2021 19:33:46 - INFO - __main__ - Step 23437: {'lr': 0.00019989630003046686, 'samples': 749984, 'steps': 1464, 'loss/train': 1.8001189231872559} -09/20/2021 19:33:46 - INFO - __main__ - Step 23438: {'lr': 0.00019989630003046686, 'samples': 750016, 'steps': 1464, 'loss/train': 2.543853759765625} -09/20/2021 19:33:47 - INFO - __main__ - Step 23439: {'lr': 0.00019989630003046686, 'samples': 750048, 'steps': 1464, 'loss/train': 2.4629249572753906} -09/20/2021 19:33:48 - INFO - __main__ - Step 23440: {'lr': 0.00019989630003046686, 'samples': 750080, 'steps': 1464, 'loss/train': 2.8451287746429443} -09/20/2021 19:33:49 - INFO - __main__ - Step 23441: {'lr': 0.00019989600940133745, 'samples': 750112, 'steps': 1465, 'loss/train': 1.6919020414352417} -09/20/2021 19:33:49 - INFO - __main__ - Step 23442: {'lr': 0.00019989600940133745, 'samples': 750144, 'steps': 1465, 'loss/train': 3.617793321609497} -09/20/2021 19:33:50 - INFO - __main__ - Step 23443: {'lr': 0.00019989600940133745, 'samples': 750176, 'steps': 1465, 'loss/train': 3.0928826332092285} -09/20/2021 19:33:51 - INFO - __main__ - Step 23444: {'lr': 0.00019989600940133745, 'samples': 750208, 'steps': 1465, 'loss/train': 2.855642080307007} -09/20/2021 19:33:52 - INFO - __main__ - Step 23445: {'lr': 0.00019989600940133745, 'samples': 750240, 'steps': 1465, 'loss/train': 3.3225831985473633} -09/20/2021 19:33:52 - INFO - __main__ - Step 23446: {'lr': 0.00019989600940133745, 'samples': 750272, 'steps': 1465, 'loss/train': 0.46614256501197815} -09/20/2021 19:33:53 - INFO - __main__ - Step 23447: {'lr': 0.00019989600940133745, 'samples': 750304, 'steps': 1465, 'loss/train': 0.4551665186882019} -09/20/2021 19:33:54 - INFO - __main__ - Step 23448: {'lr': 0.00019989600940133745, 'samples': 750336, 'steps': 1465, 'loss/train': 2.3790347576141357} -09/20/2021 19:33:55 - INFO - __main__ - Step 23449: {'lr': 0.00019989600940133745, 'samples': 750368, 'steps': 1465, 'loss/train': 3.42403244972229} -09/20/2021 19:33:55 - INFO - __main__ - Step 23450: {'lr': 0.00019989600940133745, 'samples': 750400, 'steps': 1465, 'loss/train': 2.3919448852539062} -09/20/2021 19:33:56 - INFO - __main__ - Step 23451: {'lr': 0.00019989600940133745, 'samples': 750432, 'steps': 1465, 'loss/train': 3.2336575984954834} -09/20/2021 19:33:57 - INFO - __main__ - Step 23452: {'lr': 0.00019989600940133745, 'samples': 750464, 'steps': 1465, 'loss/train': 2.9038939476013184} -09/20/2021 19:33:58 - INFO - __main__ - Step 23453: {'lr': 0.00019989600940133745, 'samples': 750496, 'steps': 1465, 'loss/train': 2.9187052249908447} -09/20/2021 19:33:58 - INFO - __main__ - Step 23454: {'lr': 0.00019989600940133745, 'samples': 750528, 'steps': 1465, 'loss/train': 2.725431442260742} -09/20/2021 19:33:59 - INFO - __main__ - Step 23455: {'lr': 0.00019989600940133745, 'samples': 750560, 'steps': 1465, 'loss/train': 2.866129159927368} -09/20/2021 19:34:00 - INFO - __main__ - Step 23456: {'lr': 0.00019989600940133745, 'samples': 750592, 'steps': 1465, 'loss/train': 1.8807916641235352} -09/20/2021 19:34:01 - INFO - __main__ - Step 23457: {'lr': 0.00019989571836573157, 'samples': 750624, 'steps': 1466, 'loss/train': 2.7786383628845215} -09/20/2021 19:34:02 - INFO - __main__ - Step 23458: {'lr': 0.00019989571836573157, 'samples': 750656, 'steps': 1466, 'loss/train': 2.8613929748535156} -09/20/2021 19:34:02 - INFO - __main__ - Step 23459: {'lr': 0.00019989571836573157, 'samples': 750688, 'steps': 1466, 'loss/train': 2.7300097942352295} -09/20/2021 19:34:03 - INFO - __main__ - Step 23460: {'lr': 0.00019989571836573157, 'samples': 750720, 'steps': 1466, 'loss/train': 2.0429835319519043} -09/20/2021 19:34:04 - INFO - __main__ - Step 23461: {'lr': 0.00019989571836573157, 'samples': 750752, 'steps': 1466, 'loss/train': 2.8458173274993896} -09/20/2021 19:34:05 - INFO - __main__ - Step 23462: {'lr': 0.00019989571836573157, 'samples': 750784, 'steps': 1466, 'loss/train': 2.8644168376922607} -09/20/2021 19:34:05 - INFO - __main__ - Step 23463: {'lr': 0.00019989571836573157, 'samples': 750816, 'steps': 1466, 'loss/train': 4.62785005569458} -09/20/2021 19:34:07 - INFO - __main__ - Step 23464: {'lr': 0.00019989571836573157, 'samples': 750848, 'steps': 1466, 'loss/train': 2.2933173179626465} -09/20/2021 19:34:08 - INFO - __main__ - Step 23465: {'lr': 0.00019989571836573157, 'samples': 750880, 'steps': 1466, 'loss/train': 2.6297051906585693} -09/20/2021 19:34:08 - INFO - __main__ - Step 23466: {'lr': 0.00019989571836573157, 'samples': 750912, 'steps': 1466, 'loss/train': 2.6121575832366943} -09/20/2021 19:34:09 - INFO - __main__ - Step 23467: {'lr': 0.00019989571836573157, 'samples': 750944, 'steps': 1466, 'loss/train': 2.6091761589050293} -09/20/2021 19:34:10 - INFO - __main__ - Step 23468: {'lr': 0.00019989571836573157, 'samples': 750976, 'steps': 1466, 'loss/train': 2.4279568195343018} -09/20/2021 19:34:11 - INFO - __main__ - Step 23469: {'lr': 0.00019989571836573157, 'samples': 751008, 'steps': 1466, 'loss/train': 2.824847936630249} -09/20/2021 19:34:11 - INFO - __main__ - Step 23470: {'lr': 0.00019989571836573157, 'samples': 751040, 'steps': 1466, 'loss/train': 2.7871782779693604} -09/20/2021 19:34:12 - INFO - __main__ - Step 23471: {'lr': 0.00019989571836573157, 'samples': 751072, 'steps': 1466, 'loss/train': 2.318593740463257} -09/20/2021 19:34:13 - INFO - __main__ - Step 23472: {'lr': 0.00019989571836573157, 'samples': 751104, 'steps': 1466, 'loss/train': 4.1982269287109375} -09/20/2021 19:34:14 - INFO - __main__ - Step 23473: {'lr': 0.00019989542692365039, 'samples': 751136, 'steps': 1467, 'loss/train': 2.83444881439209} -09/20/2021 19:34:15 - INFO - __main__ - Step 23474: {'lr': 0.00019989542692365039, 'samples': 751168, 'steps': 1467, 'loss/train': 3.417297124862671} -09/20/2021 19:34:15 - INFO - __main__ - Step 23475: {'lr': 0.00019989542692365039, 'samples': 751200, 'steps': 1467, 'loss/train': 1.7094374895095825} -09/20/2021 19:34:16 - INFO - __main__ - Step 23476: {'lr': 0.00019989542692365039, 'samples': 751232, 'steps': 1467, 'loss/train': 1.5023845434188843} -09/20/2021 19:34:17 - INFO - __main__ - Step 23477: {'lr': 0.00019989542692365039, 'samples': 751264, 'steps': 1467, 'loss/train': 1.8388636112213135} -09/20/2021 19:34:18 - INFO - __main__ - Step 23478: {'lr': 0.00019989542692365039, 'samples': 751296, 'steps': 1467, 'loss/train': 1.7181717157363892} -09/20/2021 19:34:18 - INFO - __main__ - Step 23479: {'lr': 0.00019989542692365039, 'samples': 751328, 'steps': 1467, 'loss/train': 1.7363629341125488} -09/20/2021 19:34:19 - INFO - __main__ - Step 23480: {'lr': 0.00019989542692365039, 'samples': 751360, 'steps': 1467, 'loss/train': 1.5641013383865356} -09/20/2021 19:34:20 - INFO - __main__ - Step 23481: {'lr': 0.00019989542692365039, 'samples': 751392, 'steps': 1467, 'loss/train': 1.3246982097625732} -09/20/2021 19:34:21 - INFO - __main__ - Step 23482: {'lr': 0.00019989542692365039, 'samples': 751424, 'steps': 1467, 'loss/train': 1.5031111240386963} -09/20/2021 19:34:21 - INFO - __main__ - Step 23483: {'lr': 0.00019989542692365039, 'samples': 751456, 'steps': 1467, 'loss/train': 1.7512445449829102} -09/20/2021 19:34:22 - INFO - __main__ - Step 23484: {'lr': 0.00019989542692365039, 'samples': 751488, 'steps': 1467, 'loss/train': 3.384626626968384} -09/20/2021 19:34:23 - INFO - __main__ - Step 23485: {'lr': 0.00019989542692365039, 'samples': 751520, 'steps': 1467, 'loss/train': 3.00459361076355} -09/20/2021 19:34:24 - INFO - __main__ - Step 23486: {'lr': 0.00019989542692365039, 'samples': 751552, 'steps': 1467, 'loss/train': 3.046977996826172} -09/20/2021 19:34:24 - INFO - __main__ - Step 23487: {'lr': 0.00019989542692365039, 'samples': 751584, 'steps': 1467, 'loss/train': 2.6240501403808594} -09/20/2021 19:34:25 - INFO - __main__ - Step 23488: {'lr': 0.00019989542692365039, 'samples': 751616, 'steps': 1467, 'loss/train': 2.4266276359558105} -09/20/2021 19:34:26 - INFO - __main__ - Step 23489: {'lr': 0.0001998951350750951, 'samples': 751648, 'steps': 1468, 'loss/train': 2.636528968811035} -09/20/2021 19:34:27 - INFO - __main__ - Step 23490: {'lr': 0.0001998951350750951, 'samples': 751680, 'steps': 1468, 'loss/train': 3.478588581085205} -09/20/2021 19:34:27 - INFO - __main__ - Step 23491: {'lr': 0.0001998951350750951, 'samples': 751712, 'steps': 1468, 'loss/train': 0.7747811079025269} -09/20/2021 19:34:28 - INFO - __main__ - Step 23492: {'lr': 0.0001998951350750951, 'samples': 751744, 'steps': 1468, 'loss/train': 3.178696870803833} -09/20/2021 19:34:29 - INFO - __main__ - Step 23493: {'lr': 0.0001998951350750951, 'samples': 751776, 'steps': 1468, 'loss/train': 2.1159069538116455} -09/20/2021 19:34:30 - INFO - __main__ - Step 23494: {'lr': 0.0001998951350750951, 'samples': 751808, 'steps': 1468, 'loss/train': 2.69503116607666} -09/20/2021 19:34:30 - INFO - __main__ - Step 23495: {'lr': 0.0001998951350750951, 'samples': 751840, 'steps': 1468, 'loss/train': 1.6491525173187256} -09/20/2021 19:34:31 - INFO - __main__ - Step 23496: {'lr': 0.0001998951350750951, 'samples': 751872, 'steps': 1468, 'loss/train': 2.4167733192443848} -09/20/2021 19:34:32 - INFO - __main__ - Step 23497: {'lr': 0.0001998951350750951, 'samples': 751904, 'steps': 1468, 'loss/train': 2.443422317504883} -09/20/2021 19:34:33 - INFO - __main__ - Step 23498: {'lr': 0.0001998951350750951, 'samples': 751936, 'steps': 1468, 'loss/train': 2.973020076751709} -09/20/2021 19:34:33 - INFO - __main__ - Step 23499: {'lr': 0.0001998951350750951, 'samples': 751968, 'steps': 1468, 'loss/train': 2.9292893409729004} -09/20/2021 19:34:34 - INFO - __main__ - Step 23500: {'lr': 0.0001998951350750951, 'samples': 752000, 'steps': 1468, 'loss/train': 2.9460954666137695} -09/20/2021 19:34:36 - INFO - __main__ - Step 23501: {'lr': 0.0001998951350750951, 'samples': 752032, 'steps': 1468, 'loss/train': 1.1572778224945068} -09/20/2021 19:34:36 - INFO - __main__ - Step 23502: {'lr': 0.0001998951350750951, 'samples': 752064, 'steps': 1468, 'loss/train': 3.399484872817993} -09/20/2021 19:34:37 - INFO - __main__ - Step 23503: {'lr': 0.0001998951350750951, 'samples': 752096, 'steps': 1468, 'loss/train': 2.4319279193878174} -09/20/2021 19:34:38 - INFO - __main__ - Step 23504: {'lr': 0.0001998951350750951, 'samples': 752128, 'steps': 1468, 'loss/train': 2.070929527282715} -09/20/2021 19:34:39 - INFO - __main__ - Step 23505: {'lr': 0.0001998948428200669, 'samples': 752160, 'steps': 1469, 'loss/train': 3.3426127433776855} -09/20/2021 19:34:39 - INFO - __main__ - Step 23506: {'lr': 0.0001998948428200669, 'samples': 752192, 'steps': 1469, 'loss/train': 2.9674935340881348} -09/20/2021 19:34:40 - INFO - __main__ - Step 23507: {'lr': 0.0001998948428200669, 'samples': 752224, 'steps': 1469, 'loss/train': 2.235565662384033} -09/20/2021 19:34:41 - INFO - __main__ - Step 23508: {'lr': 0.0001998948428200669, 'samples': 752256, 'steps': 1469, 'loss/train': 2.772045850753784} -09/20/2021 19:34:42 - INFO - __main__ - Step 23509: {'lr': 0.0001998948428200669, 'samples': 752288, 'steps': 1469, 'loss/train': 2.2608840465545654} -09/20/2021 19:34:42 - INFO - __main__ - Step 23510: {'lr': 0.0001998948428200669, 'samples': 752320, 'steps': 1469, 'loss/train': 3.499950647354126} -09/20/2021 19:34:43 - INFO - __main__ - Step 23511: {'lr': 0.0001998948428200669, 'samples': 752352, 'steps': 1469, 'loss/train': 2.6190524101257324} -09/20/2021 19:34:44 - INFO - __main__ - Step 23512: {'lr': 0.0001998948428200669, 'samples': 752384, 'steps': 1469, 'loss/train': 2.789196729660034} -09/20/2021 19:34:45 - INFO - __main__ - Step 23513: {'lr': 0.0001998948428200669, 'samples': 752416, 'steps': 1469, 'loss/train': 2.237107753753662} -09/20/2021 19:34:45 - INFO - __main__ - Step 23514: {'lr': 0.0001998948428200669, 'samples': 752448, 'steps': 1469, 'loss/train': 2.6500961780548096} -09/20/2021 19:34:46 - INFO - __main__ - Step 23515: {'lr': 0.0001998948428200669, 'samples': 752480, 'steps': 1469, 'loss/train': 3.2902376651763916} -09/20/2021 19:34:47 - INFO - __main__ - Step 23516: {'lr': 0.0001998948428200669, 'samples': 752512, 'steps': 1469, 'loss/train': 2.868635892868042} -09/20/2021 19:34:48 - INFO - __main__ - Step 23517: {'lr': 0.0001998948428200669, 'samples': 752544, 'steps': 1469, 'loss/train': 3.2883708477020264} -09/20/2021 19:34:48 - INFO - __main__ - Step 23518: {'lr': 0.0001998948428200669, 'samples': 752576, 'steps': 1469, 'loss/train': 3.0058398246765137} -09/20/2021 19:34:49 - INFO - __main__ - Step 23519: {'lr': 0.0001998948428200669, 'samples': 752608, 'steps': 1469, 'loss/train': 2.6622114181518555} -09/20/2021 19:34:50 - INFO - __main__ - Step 23520: {'lr': 0.0001998948428200669, 'samples': 752640, 'steps': 1469, 'loss/train': 2.8170623779296875} -09/20/2021 19:34:51 - INFO - __main__ - Step 23521: {'lr': 0.000199894550158567, 'samples': 752672, 'steps': 1470, 'loss/train': 3.18384051322937} -09/20/2021 19:34:52 - INFO - __main__ - Step 23522: {'lr': 0.000199894550158567, 'samples': 752704, 'steps': 1470, 'loss/train': 3.3150172233581543} -09/20/2021 19:34:52 - INFO - __main__ - Step 23523: {'lr': 0.000199894550158567, 'samples': 752736, 'steps': 1470, 'loss/train': 3.879302978515625} -09/20/2021 19:34:53 - INFO - __main__ - Step 23524: {'lr': 0.000199894550158567, 'samples': 752768, 'steps': 1470, 'loss/train': 2.608506917953491} -09/20/2021 19:34:54 - INFO - __main__ - Step 23525: {'lr': 0.000199894550158567, 'samples': 752800, 'steps': 1470, 'loss/train': 3.129467248916626} -09/20/2021 19:34:55 - INFO - __main__ - Step 23526: {'lr': 0.000199894550158567, 'samples': 752832, 'steps': 1470, 'loss/train': 3.981557607650757} -09/20/2021 19:34:55 - INFO - __main__ - Step 23527: {'lr': 0.000199894550158567, 'samples': 752864, 'steps': 1470, 'loss/train': 1.306494951248169} -09/20/2021 19:34:56 - INFO - __main__ - Step 23528: {'lr': 0.000199894550158567, 'samples': 752896, 'steps': 1470, 'loss/train': 2.919909954071045} -09/20/2021 19:34:57 - INFO - __main__ - Step 23529: {'lr': 0.000199894550158567, 'samples': 752928, 'steps': 1470, 'loss/train': 1.3547544479370117} -09/20/2021 19:34:58 - INFO - __main__ - Step 23530: {'lr': 0.000199894550158567, 'samples': 752960, 'steps': 1470, 'loss/train': 4.894534111022949} -09/20/2021 19:34:59 - INFO - __main__ - Step 23531: {'lr': 0.000199894550158567, 'samples': 752992, 'steps': 1470, 'loss/train': 3.493103265762329} -09/20/2021 19:35:00 - INFO - __main__ - Step 23532: {'lr': 0.000199894550158567, 'samples': 753024, 'steps': 1470, 'loss/train': 3.1327123641967773} -09/20/2021 19:35:00 - INFO - __main__ - Step 23533: {'lr': 0.000199894550158567, 'samples': 753056, 'steps': 1470, 'loss/train': 2.7112913131713867} -09/20/2021 19:35:01 - INFO - __main__ - Step 23534: {'lr': 0.000199894550158567, 'samples': 753088, 'steps': 1470, 'loss/train': 3.8843441009521484} -09/20/2021 19:35:02 - INFO - __main__ - Step 23535: {'lr': 0.000199894550158567, 'samples': 753120, 'steps': 1470, 'loss/train': 3.5498552322387695} -09/20/2021 19:35:03 - INFO - __main__ - Step 23536: {'lr': 0.000199894550158567, 'samples': 753152, 'steps': 1470, 'loss/train': 3.0888514518737793} -09/20/2021 19:35:03 - INFO - __main__ - Step 23537: {'lr': 0.00019989425709059653, 'samples': 753184, 'steps': 1471, 'loss/train': 3.059229612350464} -09/20/2021 19:35:04 - INFO - __main__ - Step 23538: {'lr': 0.00019989425709059653, 'samples': 753216, 'steps': 1471, 'loss/train': 3.71848201751709} -09/20/2021 19:35:05 - INFO - __main__ - Step 23539: {'lr': 0.00019989425709059653, 'samples': 753248, 'steps': 1471, 'loss/train': 3.229541301727295} -09/20/2021 19:35:06 - INFO - __main__ - Step 23540: {'lr': 0.00019989425709059653, 'samples': 753280, 'steps': 1471, 'loss/train': 4.278003215789795} -09/20/2021 19:35:06 - INFO - __main__ - Step 23541: {'lr': 0.00019989425709059653, 'samples': 753312, 'steps': 1471, 'loss/train': 2.9255568981170654} -09/20/2021 19:35:07 - INFO - __main__ - Step 23542: {'lr': 0.00019989425709059653, 'samples': 753344, 'steps': 1471, 'loss/train': 2.67478084564209} -09/20/2021 19:35:08 - INFO - __main__ - Step 23543: {'lr': 0.00019989425709059653, 'samples': 753376, 'steps': 1471, 'loss/train': 4.726502418518066} -09/20/2021 19:35:09 - INFO - __main__ - Step 23544: {'lr': 0.00019989425709059653, 'samples': 753408, 'steps': 1471, 'loss/train': 2.887211799621582} -09/20/2021 19:35:09 - INFO - __main__ - Step 23545: {'lr': 0.00019989425709059653, 'samples': 753440, 'steps': 1471, 'loss/train': 2.6939876079559326} -09/20/2021 19:35:10 - INFO - __main__ - Step 23546: {'lr': 0.00019989425709059653, 'samples': 753472, 'steps': 1471, 'loss/train': 3.437774658203125} -09/20/2021 19:35:11 - INFO - __main__ - Step 23547: {'lr': 0.00019989425709059653, 'samples': 753504, 'steps': 1471, 'loss/train': 2.3760595321655273} -09/20/2021 19:35:12 - INFO - __main__ - Step 23548: {'lr': 0.00019989425709059653, 'samples': 753536, 'steps': 1471, 'loss/train': 2.787419557571411} -09/20/2021 19:35:12 - INFO - __main__ - Step 23549: {'lr': 0.00019989425709059653, 'samples': 753568, 'steps': 1471, 'loss/train': 2.3191945552825928} -09/20/2021 19:35:13 - INFO - __main__ - Step 23550: {'lr': 0.00019989425709059653, 'samples': 753600, 'steps': 1471, 'loss/train': 2.510981798171997} -09/20/2021 19:35:14 - INFO - __main__ - Step 23551: {'lr': 0.00019989425709059653, 'samples': 753632, 'steps': 1471, 'loss/train': 3.117727756500244} -09/20/2021 19:35:15 - INFO - __main__ - Step 23552: {'lr': 0.00019989425709059653, 'samples': 753664, 'steps': 1471, 'loss/train': 3.3878307342529297} -09/20/2021 19:35:16 - INFO - __main__ - Step 23553: {'lr': 0.0001998939636161567, 'samples': 753696, 'steps': 1472, 'loss/train': 3.1389083862304688} -09/20/2021 19:35:16 - INFO - __main__ - Step 23554: {'lr': 0.0001998939636161567, 'samples': 753728, 'steps': 1472, 'loss/train': 2.928907632827759} -09/20/2021 19:35:17 - INFO - __main__ - Step 23555: {'lr': 0.0001998939636161567, 'samples': 753760, 'steps': 1472, 'loss/train': 3.126086711883545} -09/20/2021 19:35:18 - INFO - __main__ - Step 23556: {'lr': 0.0001998939636161567, 'samples': 753792, 'steps': 1472, 'loss/train': 2.7814207077026367} -09/20/2021 19:35:19 - INFO - __main__ - Step 23557: {'lr': 0.0001998939636161567, 'samples': 753824, 'steps': 1472, 'loss/train': 4.638119220733643} -09/20/2021 19:35:19 - INFO - __main__ - Step 23558: {'lr': 0.0001998939636161567, 'samples': 753856, 'steps': 1472, 'loss/train': 2.950923204421997} -09/20/2021 19:35:20 - INFO - __main__ - Step 23559: {'lr': 0.0001998939636161567, 'samples': 753888, 'steps': 1472, 'loss/train': 3.3337326049804688} -09/20/2021 19:35:21 - INFO - __main__ - Step 23560: {'lr': 0.0001998939636161567, 'samples': 753920, 'steps': 1472, 'loss/train': 2.2282588481903076} -09/20/2021 19:35:22 - INFO - __main__ - Step 23561: {'lr': 0.0001998939636161567, 'samples': 753952, 'steps': 1472, 'loss/train': 2.284334421157837} -09/20/2021 19:35:23 - INFO - __main__ - Step 23562: {'lr': 0.0001998939636161567, 'samples': 753984, 'steps': 1472, 'loss/train': 3.7193117141723633} -09/20/2021 19:35:24 - INFO - __main__ - Step 23563: {'lr': 0.0001998939636161567, 'samples': 754016, 'steps': 1472, 'loss/train': 2.6676836013793945} -09/20/2021 19:35:24 - INFO - __main__ - Step 23564: {'lr': 0.0001998939636161567, 'samples': 754048, 'steps': 1472, 'loss/train': 3.208244562149048} -09/20/2021 19:35:25 - INFO - __main__ - Step 23565: {'lr': 0.0001998939636161567, 'samples': 754080, 'steps': 1472, 'loss/train': 2.7157676219940186} -09/20/2021 19:35:26 - INFO - __main__ - Step 23566: {'lr': 0.0001998939636161567, 'samples': 754112, 'steps': 1472, 'loss/train': 2.2630765438079834} -09/20/2021 19:35:27 - INFO - __main__ - Step 23567: {'lr': 0.0001998939636161567, 'samples': 754144, 'steps': 1472, 'loss/train': 3.231309652328491} -09/20/2021 19:35:27 - INFO - __main__ - Step 23568: {'lr': 0.0001998939636161567, 'samples': 754176, 'steps': 1472, 'loss/train': 3.2928237915039062} -09/20/2021 19:35:28 - INFO - __main__ - Step 23569: {'lr': 0.00019989366973524874, 'samples': 754208, 'steps': 1473, 'loss/train': 4.546334743499756} -09/20/2021 19:35:29 - INFO - __main__ - Step 23570: {'lr': 0.00019989366973524874, 'samples': 754240, 'steps': 1473, 'loss/train': 2.772108316421509} -09/20/2021 19:35:30 - INFO - __main__ - Step 23571: {'lr': 0.00019989366973524874, 'samples': 754272, 'steps': 1473, 'loss/train': 2.904902696609497} -09/20/2021 19:35:30 - INFO - __main__ - Step 23572: {'lr': 0.00019989366973524874, 'samples': 754304, 'steps': 1473, 'loss/train': 2.2557592391967773} -09/20/2021 19:35:31 - INFO - __main__ - Step 23573: {'lr': 0.00019989366973524874, 'samples': 754336, 'steps': 1473, 'loss/train': 3.383824348449707} -09/20/2021 19:35:32 - INFO - __main__ - Step 23574: {'lr': 0.00019989366973524874, 'samples': 754368, 'steps': 1473, 'loss/train': 3.072598457336426} -09/20/2021 19:35:33 - INFO - __main__ - Step 23575: {'lr': 0.00019989366973524874, 'samples': 754400, 'steps': 1473, 'loss/train': 3.0120465755462646} -09/20/2021 19:35:33 - INFO - __main__ - Step 23576: {'lr': 0.00019989366973524874, 'samples': 754432, 'steps': 1473, 'loss/train': 2.154331684112549} -09/20/2021 19:35:34 - INFO - __main__ - Step 23577: {'lr': 0.00019989366973524874, 'samples': 754464, 'steps': 1473, 'loss/train': 2.984833002090454} -09/20/2021 19:35:35 - INFO - __main__ - Step 23578: {'lr': 0.00019989366973524874, 'samples': 754496, 'steps': 1473, 'loss/train': 1.9586181640625} -09/20/2021 19:35:36 - INFO - __main__ - Step 23579: {'lr': 0.00019989366973524874, 'samples': 754528, 'steps': 1473, 'loss/train': 2.903553009033203} -09/20/2021 19:35:36 - INFO - __main__ - Step 23580: {'lr': 0.00019989366973524874, 'samples': 754560, 'steps': 1473, 'loss/train': 2.067409038543701} -09/20/2021 19:35:37 - INFO - __main__ - Step 23581: {'lr': 0.00019989366973524874, 'samples': 754592, 'steps': 1473, 'loss/train': 3.6993279457092285} -09/20/2021 19:35:38 - INFO - __main__ - Step 23582: {'lr': 0.00019989366973524874, 'samples': 754624, 'steps': 1473, 'loss/train': 3.4539108276367188} -09/20/2021 19:35:39 - INFO - __main__ - Step 23583: {'lr': 0.00019989366973524874, 'samples': 754656, 'steps': 1473, 'loss/train': 3.274895429611206} -09/20/2021 19:35:39 - INFO - __main__ - Step 23584: {'lr': 0.00019989366973524874, 'samples': 754688, 'steps': 1473, 'loss/train': 2.765996217727661} -09/20/2021 19:35:40 - INFO - __main__ - Step 23585: {'lr': 0.00019989337544787386, 'samples': 754720, 'steps': 1474, 'loss/train': 2.5869600772857666} -09/20/2021 19:35:41 - INFO - __main__ - Step 23586: {'lr': 0.00019989337544787386, 'samples': 754752, 'steps': 1474, 'loss/train': 3.1090824604034424} -09/20/2021 19:35:42 - INFO - __main__ - Step 23587: {'lr': 0.00019989337544787386, 'samples': 754784, 'steps': 1474, 'loss/train': 3.453080654144287} -09/20/2021 19:35:43 - INFO - __main__ - Step 23588: {'lr': 0.00019989337544787386, 'samples': 754816, 'steps': 1474, 'loss/train': 3.2254133224487305} -09/20/2021 19:35:43 - INFO - __main__ - Step 23589: {'lr': 0.00019989337544787386, 'samples': 754848, 'steps': 1474, 'loss/train': 2.764490842819214} -09/20/2021 19:35:44 - INFO - __main__ - Step 23590: {'lr': 0.00019989337544787386, 'samples': 754880, 'steps': 1474, 'loss/train': 2.7893993854522705} -09/20/2021 19:35:45 - INFO - __main__ - Step 23591: {'lr': 0.00019989337544787386, 'samples': 754912, 'steps': 1474, 'loss/train': 2.295395851135254} -09/20/2021 19:35:46 - INFO - __main__ - Step 23592: {'lr': 0.00019989337544787386, 'samples': 754944, 'steps': 1474, 'loss/train': 2.4083638191223145} -09/20/2021 19:35:47 - INFO - __main__ - Step 23593: {'lr': 0.00019989337544787386, 'samples': 754976, 'steps': 1474, 'loss/train': 3.147324800491333} -09/20/2021 19:35:48 - INFO - __main__ - Step 23594: {'lr': 0.00019989337544787386, 'samples': 755008, 'steps': 1474, 'loss/train': 1.4198044538497925} -09/20/2021 19:35:48 - INFO - __main__ - Step 23595: {'lr': 0.00019989337544787386, 'samples': 755040, 'steps': 1474, 'loss/train': 3.4773917198181152} -09/20/2021 19:35:49 - INFO - __main__ - Step 23596: {'lr': 0.00019989337544787386, 'samples': 755072, 'steps': 1474, 'loss/train': 2.494122266769409} -09/20/2021 19:35:50 - INFO - __main__ - Step 23597: {'lr': 0.00019989337544787386, 'samples': 755104, 'steps': 1474, 'loss/train': 3.131767988204956} -09/20/2021 19:35:51 - INFO - __main__ - Step 23598: {'lr': 0.00019989337544787386, 'samples': 755136, 'steps': 1474, 'loss/train': 2.511774778366089} -09/20/2021 19:35:51 - INFO - __main__ - Step 23599: {'lr': 0.00019989337544787386, 'samples': 755168, 'steps': 1474, 'loss/train': 2.8449268341064453} -09/20/2021 19:35:52 - INFO - __main__ - Step 23600: {'lr': 0.00019989337544787386, 'samples': 755200, 'steps': 1474, 'loss/train': 2.503676652908325} -09/20/2021 19:35:53 - INFO - __main__ - Step 23601: {'lr': 0.00019989308075403316, 'samples': 755232, 'steps': 1475, 'loss/train': 2.8656809329986572} -09/20/2021 19:35:54 - INFO - __main__ - Step 23602: {'lr': 0.00019989308075403316, 'samples': 755264, 'steps': 1475, 'loss/train': 2.7858545780181885} -09/20/2021 19:35:55 - INFO - __main__ - Step 23603: {'lr': 0.00019989308075403316, 'samples': 755296, 'steps': 1475, 'loss/train': 3.0656492710113525} -09/20/2021 19:35:55 - INFO - __main__ - Step 23604: {'lr': 0.00019989308075403316, 'samples': 755328, 'steps': 1475, 'loss/train': 2.4307548999786377} -09/20/2021 19:35:56 - INFO - __main__ - Step 23605: {'lr': 0.00019989308075403316, 'samples': 755360, 'steps': 1475, 'loss/train': 2.9423019886016846} -09/20/2021 19:35:57 - INFO - __main__ - Step 23606: {'lr': 0.00019989308075403316, 'samples': 755392, 'steps': 1475, 'loss/train': 2.847470760345459} -09/20/2021 19:35:58 - INFO - __main__ - Step 23607: {'lr': 0.00019989308075403316, 'samples': 755424, 'steps': 1475, 'loss/train': 2.7053616046905518} -09/20/2021 19:35:58 - INFO - __main__ - Step 23608: {'lr': 0.00019989308075403316, 'samples': 755456, 'steps': 1475, 'loss/train': 2.9035897254943848} -09/20/2021 19:35:59 - INFO - __main__ - Step 23609: {'lr': 0.00019989308075403316, 'samples': 755488, 'steps': 1475, 'loss/train': 3.0998995304107666} -09/20/2021 19:36:00 - INFO - __main__ - Step 23610: {'lr': 0.00019989308075403316, 'samples': 755520, 'steps': 1475, 'loss/train': 3.0365614891052246} -09/20/2021 19:36:01 - INFO - __main__ - Step 23611: {'lr': 0.00019989308075403316, 'samples': 755552, 'steps': 1475, 'loss/train': 2.515159845352173} -09/20/2021 19:36:01 - INFO - __main__ - Step 23612: {'lr': 0.00019989308075403316, 'samples': 755584, 'steps': 1475, 'loss/train': 2.183058023452759} -09/20/2021 19:36:02 - INFO - __main__ - Step 23613: {'lr': 0.00019989308075403316, 'samples': 755616, 'steps': 1475, 'loss/train': 3.1998367309570312} -09/20/2021 19:36:03 - INFO - __main__ - Step 23614: {'lr': 0.00019989308075403316, 'samples': 755648, 'steps': 1475, 'loss/train': 3.0832359790802} -09/20/2021 19:36:04 - INFO - __main__ - Step 23615: {'lr': 0.00019989308075403316, 'samples': 755680, 'steps': 1475, 'loss/train': 2.0916833877563477} -09/20/2021 19:36:04 - INFO - __main__ - Step 23616: {'lr': 0.00019989308075403316, 'samples': 755712, 'steps': 1475, 'loss/train': 4.160648345947266} -09/20/2021 19:36:05 - INFO - __main__ - Step 23617: {'lr': 0.00019989278565372796, 'samples': 755744, 'steps': 1476, 'loss/train': 2.980696201324463} -09/20/2021 19:36:06 - INFO - __main__ - Step 23618: {'lr': 0.00019989278565372796, 'samples': 755776, 'steps': 1476, 'loss/train': 2.395352840423584} -09/20/2021 19:36:07 - INFO - __main__ - Step 23619: {'lr': 0.00019989278565372796, 'samples': 755808, 'steps': 1476, 'loss/train': 2.5663082599639893} -09/20/2021 19:36:08 - INFO - __main__ - Step 23620: {'lr': 0.00019989278565372796, 'samples': 755840, 'steps': 1476, 'loss/train': 2.778240203857422} -09/20/2021 19:36:08 - INFO - __main__ - Step 23621: {'lr': 0.00019989278565372796, 'samples': 755872, 'steps': 1476, 'loss/train': 3.3960537910461426} -09/20/2021 19:36:09 - INFO - __main__ - Step 23622: {'lr': 0.00019989278565372796, 'samples': 755904, 'steps': 1476, 'loss/train': 3.8515524864196777} -09/20/2021 19:36:10 - INFO - __main__ - Step 23623: {'lr': 0.00019989278565372796, 'samples': 755936, 'steps': 1476, 'loss/train': 3.020397663116455} -09/20/2021 19:36:11 - INFO - __main__ - Step 23624: {'lr': 0.00019989278565372796, 'samples': 755968, 'steps': 1476, 'loss/train': 2.7728965282440186} -09/20/2021 19:36:11 - INFO - __main__ - Step 23625: {'lr': 0.00019989278565372796, 'samples': 756000, 'steps': 1476, 'loss/train': 3.6952643394470215} -09/20/2021 19:36:13 - INFO - __main__ - Step 23626: {'lr': 0.00019989278565372796, 'samples': 756032, 'steps': 1476, 'loss/train': 2.5149288177490234} -09/20/2021 19:36:13 - INFO - __main__ - Step 23627: {'lr': 0.00019989278565372796, 'samples': 756064, 'steps': 1476, 'loss/train': 2.3742024898529053} -09/20/2021 19:36:14 - INFO - __main__ - Step 23628: {'lr': 0.00019989278565372796, 'samples': 756096, 'steps': 1476, 'loss/train': 3.505903959274292} -09/20/2021 19:36:15 - INFO - __main__ - Step 23629: {'lr': 0.00019989278565372796, 'samples': 756128, 'steps': 1476, 'loss/train': 2.2404441833496094} -09/20/2021 19:36:16 - INFO - __main__ - Step 23630: {'lr': 0.00019989278565372796, 'samples': 756160, 'steps': 1476, 'loss/train': 2.934324264526367} -09/20/2021 19:36:16 - INFO - __main__ - Step 23631: {'lr': 0.00019989278565372796, 'samples': 756192, 'steps': 1476, 'loss/train': 3.2131471633911133} -09/20/2021 19:36:17 - INFO - __main__ - Step 23632: {'lr': 0.00019989278565372796, 'samples': 756224, 'steps': 1476, 'loss/train': 0.9044367074966431} -09/20/2021 19:36:18 - INFO - __main__ - Step 23633: {'lr': 0.00019989249014695936, 'samples': 756256, 'steps': 1477, 'loss/train': 1.9670466184616089} -09/20/2021 19:36:19 - INFO - __main__ - Step 23634: {'lr': 0.00019989249014695936, 'samples': 756288, 'steps': 1477, 'loss/train': 2.1789634227752686} -09/20/2021 19:36:19 - INFO - __main__ - Step 23635: {'lr': 0.00019989249014695936, 'samples': 756320, 'steps': 1477, 'loss/train': 3.1381325721740723} -09/20/2021 19:36:20 - INFO - __main__ - Step 23636: {'lr': 0.00019989249014695936, 'samples': 756352, 'steps': 1477, 'loss/train': 2.586683511734009} -09/20/2021 19:36:21 - INFO - __main__ - Step 23637: {'lr': 0.00019989249014695936, 'samples': 756384, 'steps': 1477, 'loss/train': 3.226496458053589} -09/20/2021 19:36:22 - INFO - __main__ - Step 23638: {'lr': 0.00019989249014695936, 'samples': 756416, 'steps': 1477, 'loss/train': 2.9840006828308105} -09/20/2021 19:36:22 - INFO - __main__ - Step 23639: {'lr': 0.00019989249014695936, 'samples': 756448, 'steps': 1477, 'loss/train': 2.572486400604248} -09/20/2021 19:36:23 - INFO - __main__ - Step 23640: {'lr': 0.00019989249014695936, 'samples': 756480, 'steps': 1477, 'loss/train': 3.033822536468506} -09/20/2021 19:36:24 - INFO - __main__ - Step 23641: {'lr': 0.00019989249014695936, 'samples': 756512, 'steps': 1477, 'loss/train': 3.003382682800293} -09/20/2021 19:36:25 - INFO - __main__ - Step 23642: {'lr': 0.00019989249014695936, 'samples': 756544, 'steps': 1477, 'loss/train': 2.886120080947876} -09/20/2021 19:36:25 - INFO - __main__ - Step 23643: {'lr': 0.00019989249014695936, 'samples': 756576, 'steps': 1477, 'loss/train': 2.491758108139038} -09/20/2021 19:36:26 - INFO - __main__ - Step 23644: {'lr': 0.00019989249014695936, 'samples': 756608, 'steps': 1477, 'loss/train': 0.4722598195075989} -09/20/2021 19:36:27 - INFO - __main__ - Step 23645: {'lr': 0.00019989249014695936, 'samples': 756640, 'steps': 1477, 'loss/train': 3.820239782333374} -09/20/2021 19:36:28 - INFO - __main__ - Step 23646: {'lr': 0.00019989249014695936, 'samples': 756672, 'steps': 1477, 'loss/train': 2.266617774963379} -09/20/2021 19:36:28 - INFO - __main__ - Step 23647: {'lr': 0.00019989249014695936, 'samples': 756704, 'steps': 1477, 'loss/train': 3.41396427154541} -09/20/2021 19:36:29 - INFO - __main__ - Step 23648: {'lr': 0.00019989249014695936, 'samples': 756736, 'steps': 1477, 'loss/train': 2.068007707595825} -09/20/2021 19:36:30 - INFO - __main__ - Step 23649: {'lr': 0.00019989219423372862, 'samples': 756768, 'steps': 1478, 'loss/train': 3.32490873336792} -09/20/2021 19:36:31 - INFO - __main__ - Step 23650: {'lr': 0.00019989219423372862, 'samples': 756800, 'steps': 1478, 'loss/train': 3.1389474868774414} -09/20/2021 19:36:32 - INFO - __main__ - Step 23651: {'lr': 0.00019989219423372862, 'samples': 756832, 'steps': 1478, 'loss/train': 3.795210361480713} -09/20/2021 19:36:32 - INFO - __main__ - Step 23652: {'lr': 0.00019989219423372862, 'samples': 756864, 'steps': 1478, 'loss/train': 3.031497001647949} -09/20/2021 19:36:33 - INFO - __main__ - Step 23653: {'lr': 0.00019989219423372862, 'samples': 756896, 'steps': 1478, 'loss/train': 2.7678310871124268} -09/20/2021 19:36:34 - INFO - __main__ - Step 23654: {'lr': 0.00019989219423372862, 'samples': 756928, 'steps': 1478, 'loss/train': 3.4043288230895996} -09/20/2021 19:36:35 - INFO - __main__ - Step 23655: {'lr': 0.00019989219423372862, 'samples': 756960, 'steps': 1478, 'loss/train': 2.6952624320983887} -09/20/2021 19:36:36 - INFO - __main__ - Step 23656: {'lr': 0.00019989219423372862, 'samples': 756992, 'steps': 1478, 'loss/train': 2.177408218383789} -09/20/2021 19:36:37 - INFO - __main__ - Step 23657: {'lr': 0.00019989219423372862, 'samples': 757024, 'steps': 1478, 'loss/train': 2.5110723972320557} -09/20/2021 19:36:38 - INFO - __main__ - Step 23658: {'lr': 0.00019989219423372862, 'samples': 757056, 'steps': 1478, 'loss/train': 3.435486316680908} -09/20/2021 19:36:39 - INFO - __main__ - Step 23659: {'lr': 0.00019989219423372862, 'samples': 757088, 'steps': 1478, 'loss/train': 3.2786524295806885} -09/20/2021 19:36:39 - INFO - __main__ - Step 23660: {'lr': 0.00019989219423372862, 'samples': 757120, 'steps': 1478, 'loss/train': 3.032999038696289} -09/20/2021 19:36:40 - INFO - __main__ - Step 23661: {'lr': 0.00019989219423372862, 'samples': 757152, 'steps': 1478, 'loss/train': 2.863701343536377} -09/20/2021 19:36:41 - INFO - __main__ - Step 23662: {'lr': 0.00019989219423372862, 'samples': 757184, 'steps': 1478, 'loss/train': 3.146721363067627} -09/20/2021 19:36:42 - INFO - __main__ - Step 23663: {'lr': 0.00019989219423372862, 'samples': 757216, 'steps': 1478, 'loss/train': 3.607806921005249} -09/20/2021 19:36:42 - INFO - __main__ - Step 23664: {'lr': 0.00019989219423372862, 'samples': 757248, 'steps': 1478, 'loss/train': 4.363256454467773} -09/20/2021 19:36:43 - INFO - __main__ - Step 23665: {'lr': 0.00019989189791403696, 'samples': 757280, 'steps': 1479, 'loss/train': 0.7279709577560425} -09/20/2021 19:36:44 - INFO - __main__ - Step 23666: {'lr': 0.00019989189791403696, 'samples': 757312, 'steps': 1479, 'loss/train': 0.43510812520980835} -09/20/2021 19:36:45 - INFO - __main__ - Step 23667: {'lr': 0.00019989189791403696, 'samples': 757344, 'steps': 1479, 'loss/train': 2.8527204990386963} -09/20/2021 19:36:46 - INFO - __main__ - Step 23668: {'lr': 0.00019989189791403696, 'samples': 757376, 'steps': 1479, 'loss/train': 2.4724814891815186} -09/20/2021 19:36:46 - INFO - __main__ - Step 23669: {'lr': 0.00019989189791403696, 'samples': 757408, 'steps': 1479, 'loss/train': 2.846456289291382} -09/20/2021 19:36:47 - INFO - __main__ - Step 23670: {'lr': 0.00019989189791403696, 'samples': 757440, 'steps': 1479, 'loss/train': 2.337475061416626} -09/20/2021 19:36:48 - INFO - __main__ - Step 23671: {'lr': 0.00019989189791403696, 'samples': 757472, 'steps': 1479, 'loss/train': 2.566636323928833} -09/20/2021 19:36:49 - INFO - __main__ - Step 23672: {'lr': 0.00019989189791403696, 'samples': 757504, 'steps': 1479, 'loss/train': 3.67889404296875} -09/20/2021 19:36:49 - INFO - __main__ - Step 23673: {'lr': 0.00019989189791403696, 'samples': 757536, 'steps': 1479, 'loss/train': 3.3155345916748047} -09/20/2021 19:36:50 - INFO - __main__ - Step 23674: {'lr': 0.00019989189791403696, 'samples': 757568, 'steps': 1479, 'loss/train': 3.4066884517669678} -09/20/2021 19:36:51 - INFO - __main__ - Step 23675: {'lr': 0.00019989189791403696, 'samples': 757600, 'steps': 1479, 'loss/train': 3.1951582431793213} -09/20/2021 19:36:52 - INFO - __main__ - Step 23676: {'lr': 0.00019989189791403696, 'samples': 757632, 'steps': 1479, 'loss/train': 2.612720489501953} -09/20/2021 19:36:52 - INFO - __main__ - Step 23677: {'lr': 0.00019989189791403696, 'samples': 757664, 'steps': 1479, 'loss/train': 3.4181716442108154} -09/20/2021 19:36:53 - INFO - __main__ - Step 23678: {'lr': 0.00019989189791403696, 'samples': 757696, 'steps': 1479, 'loss/train': 0.5544484853744507} -09/20/2021 19:36:54 - INFO - __main__ - Step 23679: {'lr': 0.00019989189791403696, 'samples': 757728, 'steps': 1479, 'loss/train': 2.6678762435913086} -09/20/2021 19:36:55 - INFO - __main__ - Step 23680: {'lr': 0.00019989189791403696, 'samples': 757760, 'steps': 1479, 'loss/train': 3.368972063064575} -09/20/2021 19:36:55 - INFO - __main__ - Step 23681: {'lr': 0.00019989160118788553, 'samples': 757792, 'steps': 1480, 'loss/train': 3.9845571517944336} -09/20/2021 19:36:56 - INFO - __main__ - Step 23682: {'lr': 0.00019989160118788553, 'samples': 757824, 'steps': 1480, 'loss/train': 3.5929782390594482} -09/20/2021 19:36:57 - INFO - __main__ - Step 23683: {'lr': 0.00019989160118788553, 'samples': 757856, 'steps': 1480, 'loss/train': 1.9337252378463745} -09/20/2021 19:36:58 - INFO - __main__ - Step 23684: {'lr': 0.00019989160118788553, 'samples': 757888, 'steps': 1480, 'loss/train': 2.9959590435028076} -09/20/2021 19:36:58 - INFO - __main__ - Step 23685: {'lr': 0.00019989160118788553, 'samples': 757920, 'steps': 1480, 'loss/train': 2.1644814014434814} -09/20/2021 19:36:59 - INFO - __main__ - Step 23686: {'lr': 0.00019989160118788553, 'samples': 757952, 'steps': 1480, 'loss/train': 2.4009299278259277} -09/20/2021 19:37:00 - INFO - __main__ - Step 23687: {'lr': 0.00019989160118788553, 'samples': 757984, 'steps': 1480, 'loss/train': 3.1374454498291016} -09/20/2021 19:37:01 - INFO - __main__ - Step 23688: {'lr': 0.00019989160118788553, 'samples': 758016, 'steps': 1480, 'loss/train': 2.7569124698638916} -09/20/2021 19:37:02 - INFO - __main__ - Step 23689: {'lr': 0.00019989160118788553, 'samples': 758048, 'steps': 1480, 'loss/train': 3.9829022884368896} -09/20/2021 19:37:03 - INFO - __main__ - Step 23690: {'lr': 0.00019989160118788553, 'samples': 758080, 'steps': 1480, 'loss/train': 1.0975935459136963} -09/20/2021 19:37:03 - INFO - __main__ - Step 23691: {'lr': 0.00019989160118788553, 'samples': 758112, 'steps': 1480, 'loss/train': 2.750230550765991} -09/20/2021 19:37:04 - INFO - __main__ - Step 23692: {'lr': 0.00019989160118788553, 'samples': 758144, 'steps': 1480, 'loss/train': 2.638986587524414} -09/20/2021 19:37:05 - INFO - __main__ - Step 23693: {'lr': 0.00019989160118788553, 'samples': 758176, 'steps': 1480, 'loss/train': 2.292117118835449} -09/20/2021 19:37:06 - INFO - __main__ - Step 23694: {'lr': 0.00019989160118788553, 'samples': 758208, 'steps': 1480, 'loss/train': 3.51066255569458} -09/20/2021 19:37:06 - INFO - __main__ - Step 23695: {'lr': 0.00019989160118788553, 'samples': 758240, 'steps': 1480, 'loss/train': 3.8438379764556885} -09/20/2021 19:37:07 - INFO - __main__ - Step 23696: {'lr': 0.00019989160118788553, 'samples': 758272, 'steps': 1480, 'loss/train': 1.0013240575790405} -09/20/2021 19:37:08 - INFO - __main__ - Step 23697: {'lr': 0.00019989130405527553, 'samples': 758304, 'steps': 1481, 'loss/train': 2.793752908706665} -09/20/2021 19:37:09 - INFO - __main__ - Step 23698: {'lr': 0.00019989130405527553, 'samples': 758336, 'steps': 1481, 'loss/train': 2.9552876949310303} -09/20/2021 19:37:10 - INFO - __main__ - Step 23699: {'lr': 0.00019989130405527553, 'samples': 758368, 'steps': 1481, 'loss/train': 3.32063364982605} -09/20/2021 19:37:10 - INFO - __main__ - Step 23700: {'lr': 0.00019989130405527553, 'samples': 758400, 'steps': 1481, 'loss/train': 1.9677015542984009} -09/20/2021 19:37:11 - INFO - __main__ - Step 23701: {'lr': 0.00019989130405527553, 'samples': 758432, 'steps': 1481, 'loss/train': 2.697056293487549} -09/20/2021 19:37:12 - INFO - __main__ - Step 23702: {'lr': 0.00019989130405527553, 'samples': 758464, 'steps': 1481, 'loss/train': 3.3671159744262695} -09/20/2021 19:37:13 - INFO - __main__ - Step 23703: {'lr': 0.00019989130405527553, 'samples': 758496, 'steps': 1481, 'loss/train': 3.3419411182403564} -09/20/2021 19:37:13 - INFO - __main__ - Step 23704: {'lr': 0.00019989130405527553, 'samples': 758528, 'steps': 1481, 'loss/train': 1.6359162330627441} -09/20/2021 19:37:14 - INFO - __main__ - Step 23705: {'lr': 0.00019989130405527553, 'samples': 758560, 'steps': 1481, 'loss/train': 2.644646644592285} -09/20/2021 19:37:15 - INFO - __main__ - Step 23706: {'lr': 0.00019989130405527553, 'samples': 758592, 'steps': 1481, 'loss/train': 3.310368299484253} -09/20/2021 19:37:16 - INFO - __main__ - Step 23707: {'lr': 0.00019989130405527553, 'samples': 758624, 'steps': 1481, 'loss/train': 2.7657413482666016} -09/20/2021 19:37:16 - INFO - __main__ - Step 23708: {'lr': 0.00019989130405527553, 'samples': 758656, 'steps': 1481, 'loss/train': 3.2203893661499023} -09/20/2021 19:37:17 - INFO - __main__ - Step 23709: {'lr': 0.00019989130405527553, 'samples': 758688, 'steps': 1481, 'loss/train': 4.065510272979736} -09/20/2021 19:37:18 - INFO - __main__ - Step 23710: {'lr': 0.00019989130405527553, 'samples': 758720, 'steps': 1481, 'loss/train': 3.1753509044647217} -09/20/2021 19:37:19 - INFO - __main__ - Step 23711: {'lr': 0.00019989130405527553, 'samples': 758752, 'steps': 1481, 'loss/train': 2.976036548614502} -09/20/2021 19:37:19 - INFO - __main__ - Step 23712: {'lr': 0.00019989130405527553, 'samples': 758784, 'steps': 1481, 'loss/train': 2.3151676654815674} -09/20/2021 19:37:20 - INFO - __main__ - Step 23713: {'lr': 0.00019989100651620826, 'samples': 758816, 'steps': 1482, 'loss/train': 2.150313377380371} -09/20/2021 19:37:21 - INFO - __main__ - Step 23714: {'lr': 0.00019989100651620826, 'samples': 758848, 'steps': 1482, 'loss/train': 3.051527976989746} -09/20/2021 19:37:22 - INFO - __main__ - Step 23715: {'lr': 0.00019989100651620826, 'samples': 758880, 'steps': 1482, 'loss/train': 2.1621782779693604} -09/20/2021 19:37:23 - INFO - __main__ - Step 23716: {'lr': 0.00019989100651620826, 'samples': 758912, 'steps': 1482, 'loss/train': 2.5330402851104736} -09/20/2021 19:37:23 - INFO - __main__ - Step 23717: {'lr': 0.00019989100651620826, 'samples': 758944, 'steps': 1482, 'loss/train': 3.472288131713867} -09/20/2021 19:37:24 - INFO - __main__ - Step 23718: {'lr': 0.00019989100651620826, 'samples': 758976, 'steps': 1482, 'loss/train': 3.1609458923339844} -09/20/2021 19:37:25 - INFO - __main__ - Step 23719: {'lr': 0.00019989100651620826, 'samples': 759008, 'steps': 1482, 'loss/train': 3.593398332595825} -09/20/2021 19:37:26 - INFO - __main__ - Step 23720: {'lr': 0.00019989100651620826, 'samples': 759040, 'steps': 1482, 'loss/train': 3.0927417278289795} -09/20/2021 19:37:27 - INFO - __main__ - Step 23721: {'lr': 0.00019989100651620826, 'samples': 759072, 'steps': 1482, 'loss/train': 2.3483169078826904} -09/20/2021 19:37:28 - INFO - __main__ - Step 23722: {'lr': 0.00019989100651620826, 'samples': 759104, 'steps': 1482, 'loss/train': 3.0034172534942627} -09/20/2021 19:37:29 - INFO - __main__ - Step 23723: {'lr': 0.00019989100651620826, 'samples': 759136, 'steps': 1482, 'loss/train': 2.565875768661499} -09/20/2021 19:37:29 - INFO - __main__ - Step 23724: {'lr': 0.00019989100651620826, 'samples': 759168, 'steps': 1482, 'loss/train': 3.0319387912750244} -09/20/2021 19:37:30 - INFO - __main__ - Step 23725: {'lr': 0.00019989100651620826, 'samples': 759200, 'steps': 1482, 'loss/train': 2.5935213565826416} -09/20/2021 19:37:31 - INFO - __main__ - Step 23726: {'lr': 0.00019989100651620826, 'samples': 759232, 'steps': 1482, 'loss/train': 3.423301935195923} -09/20/2021 19:37:32 - INFO - __main__ - Step 23727: {'lr': 0.00019989100651620826, 'samples': 759264, 'steps': 1482, 'loss/train': 3.186594247817993} -09/20/2021 19:37:32 - INFO - __main__ - Step 23728: {'lr': 0.00019989100651620826, 'samples': 759296, 'steps': 1482, 'loss/train': 1.8891743421554565} -09/20/2021 19:37:33 - INFO - __main__ - Step 23729: {'lr': 0.0001998907085706848, 'samples': 759328, 'steps': 1483, 'loss/train': 3.22098970413208} -09/20/2021 19:37:34 - INFO - __main__ - Step 23730: {'lr': 0.0001998907085706848, 'samples': 759360, 'steps': 1483, 'loss/train': 3.4881742000579834} -09/20/2021 19:37:35 - INFO - __main__ - Step 23731: {'lr': 0.0001998907085706848, 'samples': 759392, 'steps': 1483, 'loss/train': 2.7681896686553955} -09/20/2021 19:37:35 - INFO - __main__ - Step 23732: {'lr': 0.0001998907085706848, 'samples': 759424, 'steps': 1483, 'loss/train': 3.132002830505371} -09/20/2021 19:37:36 - INFO - __main__ - Step 23733: {'lr': 0.0001998907085706848, 'samples': 759456, 'steps': 1483, 'loss/train': 3.5997092723846436} -09/20/2021 19:37:37 - INFO - __main__ - Step 23734: {'lr': 0.0001998907085706848, 'samples': 759488, 'steps': 1483, 'loss/train': 3.1344165802001953} -09/20/2021 19:37:38 - INFO - __main__ - Step 23735: {'lr': 0.0001998907085706848, 'samples': 759520, 'steps': 1483, 'loss/train': 3.3232786655426025} -09/20/2021 19:37:38 - INFO - __main__ - Step 23736: {'lr': 0.0001998907085706848, 'samples': 759552, 'steps': 1483, 'loss/train': 0.6978061199188232} -09/20/2021 19:37:39 - INFO - __main__ - Step 23737: {'lr': 0.0001998907085706848, 'samples': 759584, 'steps': 1483, 'loss/train': 0.5624536275863647} -09/20/2021 19:37:40 - INFO - __main__ - Step 23738: {'lr': 0.0001998907085706848, 'samples': 759616, 'steps': 1483, 'loss/train': 0.5278297066688538} -09/20/2021 19:37:41 - INFO - __main__ - Step 23739: {'lr': 0.0001998907085706848, 'samples': 759648, 'steps': 1483, 'loss/train': 0.3447439670562744} -09/20/2021 19:37:41 - INFO - __main__ - Step 23740: {'lr': 0.0001998907085706848, 'samples': 759680, 'steps': 1483, 'loss/train': 0.5458623170852661} -09/20/2021 19:37:42 - INFO - __main__ - Step 23741: {'lr': 0.0001998907085706848, 'samples': 759712, 'steps': 1483, 'loss/train': 3.2723565101623535} -09/20/2021 19:37:43 - INFO - __main__ - Step 23742: {'lr': 0.0001998907085706848, 'samples': 759744, 'steps': 1483, 'loss/train': 2.722500801086426} -09/20/2021 19:37:44 - INFO - __main__ - Step 23743: {'lr': 0.0001998907085706848, 'samples': 759776, 'steps': 1483, 'loss/train': 2.773071765899658} -09/20/2021 19:37:44 - INFO - __main__ - Step 23744: {'lr': 0.0001998907085706848, 'samples': 759808, 'steps': 1483, 'loss/train': 3.1735312938690186} -09/20/2021 19:37:45 - INFO - __main__ - Step 23745: {'lr': 0.00019989041021870648, 'samples': 759840, 'steps': 1484, 'loss/train': 2.661381959915161} -09/20/2021 19:37:46 - INFO - __main__ - Step 23746: {'lr': 0.00019989041021870648, 'samples': 759872, 'steps': 1484, 'loss/train': 3.160283088684082} -09/20/2021 19:37:47 - INFO - __main__ - Step 23747: {'lr': 0.00019989041021870648, 'samples': 759904, 'steps': 1484, 'loss/train': 3.5936646461486816} -09/20/2021 19:37:48 - INFO - __main__ - Step 23748: {'lr': 0.00019989041021870648, 'samples': 759936, 'steps': 1484, 'loss/train': 2.3387234210968018} -09/20/2021 19:37:48 - INFO - __main__ - Step 23749: {'lr': 0.00019989041021870648, 'samples': 759968, 'steps': 1484, 'loss/train': 3.315303325653076} -09/20/2021 19:37:50 - INFO - __main__ - Step 23750: {'lr': 0.00019989041021870648, 'samples': 760000, 'steps': 1484, 'loss/train': 3.1677868366241455} -09/20/2021 19:37:50 - INFO - __main__ - Step 23751: {'lr': 0.00019989041021870648, 'samples': 760032, 'steps': 1484, 'loss/train': 2.9966843128204346} -09/20/2021 19:37:51 - INFO - __main__ - Step 23752: {'lr': 0.00019989041021870648, 'samples': 760064, 'steps': 1484, 'loss/train': 2.7907967567443848} -09/20/2021 19:37:52 - INFO - __main__ - Step 23753: {'lr': 0.00019989041021870648, 'samples': 760096, 'steps': 1484, 'loss/train': 2.8315274715423584} -09/20/2021 19:37:53 - INFO - __main__ - Step 23754: {'lr': 0.00019989041021870648, 'samples': 760128, 'steps': 1484, 'loss/train': 3.0456652641296387} -09/20/2021 19:37:53 - INFO - __main__ - Step 23755: {'lr': 0.00019989041021870648, 'samples': 760160, 'steps': 1484, 'loss/train': 3.6329245567321777} -09/20/2021 19:37:54 - INFO - __main__ - Step 23756: {'lr': 0.00019989041021870648, 'samples': 760192, 'steps': 1484, 'loss/train': 3.7841620445251465} -09/20/2021 19:37:55 - INFO - __main__ - Step 23757: {'lr': 0.00019989041021870648, 'samples': 760224, 'steps': 1484, 'loss/train': 3.2257003784179688} -09/20/2021 19:37:56 - INFO - __main__ - Step 23758: {'lr': 0.00019989041021870648, 'samples': 760256, 'steps': 1484, 'loss/train': 2.714254856109619} -09/20/2021 19:37:56 - INFO - __main__ - Step 23759: {'lr': 0.00019989041021870648, 'samples': 760288, 'steps': 1484, 'loss/train': 3.186593532562256} -09/20/2021 19:37:57 - INFO - __main__ - Step 23760: {'lr': 0.00019989041021870648, 'samples': 760320, 'steps': 1484, 'loss/train': 4.351768493652344} -09/20/2021 19:37:58 - INFO - __main__ - Step 23761: {'lr': 0.00019989011146027448, 'samples': 760352, 'steps': 1485, 'loss/train': 2.1930766105651855} -09/20/2021 19:37:59 - INFO - __main__ - Step 23762: {'lr': 0.00019989011146027448, 'samples': 760384, 'steps': 1485, 'loss/train': 2.764662742614746} -09/20/2021 19:38:00 - INFO - __main__ - Step 23763: {'lr': 0.00019989011146027448, 'samples': 760416, 'steps': 1485, 'loss/train': 3.3409788608551025} -09/20/2021 19:38:00 - INFO - __main__ - Step 23764: {'lr': 0.00019989011146027448, 'samples': 760448, 'steps': 1485, 'loss/train': 3.499457836151123} -09/20/2021 19:38:01 - INFO - __main__ - Step 23765: {'lr': 0.00019989011146027448, 'samples': 760480, 'steps': 1485, 'loss/train': 4.29744291305542} -09/20/2021 19:38:02 - INFO - __main__ - Step 23766: {'lr': 0.00019989011146027448, 'samples': 760512, 'steps': 1485, 'loss/train': 3.9445269107818604} -09/20/2021 19:38:03 - INFO - __main__ - Step 23767: {'lr': 0.00019989011146027448, 'samples': 760544, 'steps': 1485, 'loss/train': 2.86155104637146} -09/20/2021 19:38:03 - INFO - __main__ - Step 23768: {'lr': 0.00019989011146027448, 'samples': 760576, 'steps': 1485, 'loss/train': 2.133946418762207} -09/20/2021 19:38:04 - INFO - __main__ - Step 23769: {'lr': 0.00019989011146027448, 'samples': 760608, 'steps': 1485, 'loss/train': 2.3874144554138184} -09/20/2021 19:38:05 - INFO - __main__ - Step 23770: {'lr': 0.00019989011146027448, 'samples': 760640, 'steps': 1485, 'loss/train': 3.4717440605163574} -09/20/2021 19:38:06 - INFO - __main__ - Step 23771: {'lr': 0.00019989011146027448, 'samples': 760672, 'steps': 1485, 'loss/train': 3.8520495891571045} -09/20/2021 19:38:06 - INFO - __main__ - Step 23772: {'lr': 0.00019989011146027448, 'samples': 760704, 'steps': 1485, 'loss/train': 4.049893856048584} -09/20/2021 19:38:07 - INFO - __main__ - Step 23773: {'lr': 0.00019989011146027448, 'samples': 760736, 'steps': 1485, 'loss/train': 4.154550075531006} -09/20/2021 19:38:08 - INFO - __main__ - Step 23774: {'lr': 0.00019989011146027448, 'samples': 760768, 'steps': 1485, 'loss/train': 2.5341732501983643} -09/20/2021 19:38:09 - INFO - __main__ - Step 23775: {'lr': 0.00019989011146027448, 'samples': 760800, 'steps': 1485, 'loss/train': 3.4345672130584717} -09/20/2021 19:38:09 - INFO - __main__ - Step 23776: {'lr': 0.00019989011146027448, 'samples': 760832, 'steps': 1485, 'loss/train': 3.0108227729797363} -09/20/2021 19:38:10 - INFO - __main__ - Step 23777: {'lr': 0.00019988981229539, 'samples': 760864, 'steps': 1486, 'loss/train': 2.7816476821899414} -09/20/2021 19:38:11 - INFO - __main__ - Step 23778: {'lr': 0.00019988981229539, 'samples': 760896, 'steps': 1486, 'loss/train': 3.1446075439453125} -09/20/2021 19:38:12 - INFO - __main__ - Step 23779: {'lr': 0.00019988981229539, 'samples': 760928, 'steps': 1486, 'loss/train': 3.5837414264678955} -09/20/2021 19:38:13 - INFO - __main__ - Step 23780: {'lr': 0.00019988981229539, 'samples': 760960, 'steps': 1486, 'loss/train': 3.397672653198242} -09/20/2021 19:38:14 - INFO - __main__ - Step 23781: {'lr': 0.00019988981229539, 'samples': 760992, 'steps': 1486, 'loss/train': 3.723555564880371} -09/20/2021 19:38:15 - INFO - __main__ - Step 23782: {'lr': 0.00019988981229539, 'samples': 761024, 'steps': 1486, 'loss/train': 2.491434097290039} -09/20/2021 19:38:15 - INFO - __main__ - Step 23783: {'lr': 0.00019988981229539, 'samples': 761056, 'steps': 1486, 'loss/train': 3.8334999084472656} -09/20/2021 19:38:16 - INFO - __main__ - Step 23784: {'lr': 0.00019988981229539, 'samples': 761088, 'steps': 1486, 'loss/train': 2.8077170848846436} -09/20/2021 19:38:17 - INFO - __main__ - Step 23785: {'lr': 0.00019988981229539, 'samples': 761120, 'steps': 1486, 'loss/train': 2.942563056945801} -09/20/2021 19:38:18 - INFO - __main__ - Step 23786: {'lr': 0.00019988981229539, 'samples': 761152, 'steps': 1486, 'loss/train': 2.34993577003479} -09/20/2021 19:38:18 - INFO - __main__ - Step 23787: {'lr': 0.00019988981229539, 'samples': 761184, 'steps': 1486, 'loss/train': 2.1923158168792725} -09/20/2021 19:38:19 - INFO - __main__ - Step 23788: {'lr': 0.00019988981229539, 'samples': 761216, 'steps': 1486, 'loss/train': 2.2224133014678955} -09/20/2021 19:38:20 - INFO - __main__ - Step 23789: {'lr': 0.00019988981229539, 'samples': 761248, 'steps': 1486, 'loss/train': 4.4220404624938965} -09/20/2021 19:38:21 - INFO - __main__ - Step 23790: {'lr': 0.00019988981229539, 'samples': 761280, 'steps': 1486, 'loss/train': 3.2660255432128906} -09/20/2021 19:38:21 - INFO - __main__ - Step 23791: {'lr': 0.00019988981229539, 'samples': 761312, 'steps': 1486, 'loss/train': 3.141146183013916} -09/20/2021 19:38:22 - INFO - __main__ - Step 23792: {'lr': 0.00019988981229539, 'samples': 761344, 'steps': 1486, 'loss/train': 3.3352739810943604} -09/20/2021 19:38:23 - INFO - __main__ - Step 23793: {'lr': 0.00019988951272405424, 'samples': 761376, 'steps': 1487, 'loss/train': 2.8376433849334717} -09/20/2021 19:38:24 - INFO - __main__ - Step 23794: {'lr': 0.00019988951272405424, 'samples': 761408, 'steps': 1487, 'loss/train': 2.1053121089935303} -09/20/2021 19:38:24 - INFO - __main__ - Step 23795: {'lr': 0.00019988951272405424, 'samples': 761440, 'steps': 1487, 'loss/train': 2.132317543029785} -09/20/2021 19:38:25 - INFO - __main__ - Step 23796: {'lr': 0.00019988951272405424, 'samples': 761472, 'steps': 1487, 'loss/train': 2.1096503734588623} -09/20/2021 19:38:26 - INFO - __main__ - Step 23797: {'lr': 0.00019988951272405424, 'samples': 761504, 'steps': 1487, 'loss/train': 2.12451434135437} -09/20/2021 19:38:27 - INFO - __main__ - Step 23798: {'lr': 0.00019988951272405424, 'samples': 761536, 'steps': 1487, 'loss/train': 2.132204294204712} -09/20/2021 19:38:27 - INFO - __main__ - Step 23799: {'lr': 0.00019988951272405424, 'samples': 761568, 'steps': 1487, 'loss/train': 2.132439374923706} -09/20/2021 19:38:28 - INFO - __main__ - Step 23800: {'lr': 0.00019988951272405424, 'samples': 761600, 'steps': 1487, 'loss/train': 4.093075752258301} -09/20/2021 19:38:29 - INFO - __main__ - Step 23801: {'lr': 0.00019988951272405424, 'samples': 761632, 'steps': 1487, 'loss/train': 3.268045425415039} -09/20/2021 19:38:30 - INFO - __main__ - Step 23802: {'lr': 0.00019988951272405424, 'samples': 761664, 'steps': 1487, 'loss/train': 1.6985834836959839} -09/20/2021 19:38:30 - INFO - __main__ - Step 23803: {'lr': 0.00019988951272405424, 'samples': 761696, 'steps': 1487, 'loss/train': 4.115926742553711} -09/20/2021 19:38:31 - INFO - __main__ - Step 23804: {'lr': 0.00019988951272405424, 'samples': 761728, 'steps': 1487, 'loss/train': 0.9044796824455261} -09/20/2021 19:38:32 - INFO - __main__ - Step 23805: {'lr': 0.00019988951272405424, 'samples': 761760, 'steps': 1487, 'loss/train': 3.4496967792510986} -09/20/2021 19:38:33 - INFO - __main__ - Step 23806: {'lr': 0.00019988951272405424, 'samples': 761792, 'steps': 1487, 'loss/train': 2.842519998550415} -09/20/2021 19:38:33 - INFO - __main__ - Step 23807: {'lr': 0.00019988951272405424, 'samples': 761824, 'steps': 1487, 'loss/train': 2.861563205718994} -09/20/2021 19:38:34 - INFO - __main__ - Step 23808: {'lr': 0.00019988951272405424, 'samples': 761856, 'steps': 1487, 'loss/train': 2.957097291946411} -09/20/2021 19:38:35 - INFO - __main__ - Step 23809: {'lr': 0.00019988921274626846, 'samples': 761888, 'steps': 1488, 'loss/train': 2.6867520809173584} -09/20/2021 19:38:36 - INFO - __main__ - Step 23810: {'lr': 0.00019988921274626846, 'samples': 761920, 'steps': 1488, 'loss/train': 3.291165351867676} -09/20/2021 19:38:37 - INFO - __main__ - Step 23811: {'lr': 0.00019988921274626846, 'samples': 761952, 'steps': 1488, 'loss/train': 3.390653610229492} -09/20/2021 19:38:37 - INFO - __main__ - Step 23812: {'lr': 0.00019988921274626846, 'samples': 761984, 'steps': 1488, 'loss/train': 3.3623061180114746} -09/20/2021 19:38:38 - INFO - __main__ - Step 23813: {'lr': 0.00019988921274626846, 'samples': 762016, 'steps': 1488, 'loss/train': 3.783703565597534} -09/20/2021 19:38:40 - INFO - __main__ - Step 23814: {'lr': 0.00019988921274626846, 'samples': 762048, 'steps': 1488, 'loss/train': 3.1494667530059814} -09/20/2021 19:38:40 - INFO - __main__ - Step 23815: {'lr': 0.00019988921274626846, 'samples': 762080, 'steps': 1488, 'loss/train': 3.7545061111450195} -09/20/2021 19:38:41 - INFO - __main__ - Step 23816: {'lr': 0.00019988921274626846, 'samples': 762112, 'steps': 1488, 'loss/train': 3.3909900188446045} -09/20/2021 19:38:42 - INFO - __main__ - Step 23817: {'lr': 0.00019988921274626846, 'samples': 762144, 'steps': 1488, 'loss/train': 3.2408220767974854} -09/20/2021 19:38:43 - INFO - __main__ - Step 23818: {'lr': 0.00019988921274626846, 'samples': 762176, 'steps': 1488, 'loss/train': 1.820619821548462} -09/20/2021 19:38:43 - INFO - __main__ - Step 23819: {'lr': 0.00019988921274626846, 'samples': 762208, 'steps': 1488, 'loss/train': 1.182361125946045} -09/20/2021 19:38:44 - INFO - __main__ - Step 23820: {'lr': 0.00019988921274626846, 'samples': 762240, 'steps': 1488, 'loss/train': 1.5612343549728394} -09/20/2021 19:38:45 - INFO - __main__ - Step 23821: {'lr': 0.00019988921274626846, 'samples': 762272, 'steps': 1488, 'loss/train': 1.182080864906311} -09/20/2021 19:38:46 - INFO - __main__ - Step 23822: {'lr': 0.00019988921274626846, 'samples': 762304, 'steps': 1488, 'loss/train': 1.636425256729126} -09/20/2021 19:38:46 - INFO - __main__ - Step 23823: {'lr': 0.00019988921274626846, 'samples': 762336, 'steps': 1488, 'loss/train': 0.18963222205638885} -09/20/2021 19:38:47 - INFO - __main__ - Step 23824: {'lr': 0.00019988921274626846, 'samples': 762368, 'steps': 1488, 'loss/train': 1.6277724504470825} -09/20/2021 19:38:48 - INFO - __main__ - Step 23825: {'lr': 0.00019988891236203383, 'samples': 762400, 'steps': 1489, 'loss/train': 3.509082078933716} -09/20/2021 19:38:49 - INFO - __main__ - Step 23826: {'lr': 0.00019988891236203383, 'samples': 762432, 'steps': 1489, 'loss/train': 2.7919304370880127} -09/20/2021 19:38:50 - INFO - __main__ - Step 23827: {'lr': 0.00019988891236203383, 'samples': 762464, 'steps': 1489, 'loss/train': 2.8337130546569824} -09/20/2021 19:38:50 - INFO - __main__ - Step 23828: {'lr': 0.00019988891236203383, 'samples': 762496, 'steps': 1489, 'loss/train': 2.7495381832122803} -09/20/2021 19:38:51 - INFO - __main__ - Step 23829: {'lr': 0.00019988891236203383, 'samples': 762528, 'steps': 1489, 'loss/train': 4.308847904205322} -09/20/2021 19:38:52 - INFO - __main__ - Step 23830: {'lr': 0.00019988891236203383, 'samples': 762560, 'steps': 1489, 'loss/train': 3.926379442214966} -09/20/2021 19:38:53 - INFO - __main__ - Step 23831: {'lr': 0.00019988891236203383, 'samples': 762592, 'steps': 1489, 'loss/train': 2.2395670413970947} -09/20/2021 19:38:53 - INFO - __main__ - Step 23832: {'lr': 0.00019988891236203383, 'samples': 762624, 'steps': 1489, 'loss/train': 2.948897361755371} -09/20/2021 19:38:54 - INFO - __main__ - Step 23833: {'lr': 0.00019988891236203383, 'samples': 762656, 'steps': 1489, 'loss/train': 2.9513213634490967} -09/20/2021 19:38:55 - INFO - __main__ - Step 23834: {'lr': 0.00019988891236203383, 'samples': 762688, 'steps': 1489, 'loss/train': 2.6904423236846924} -09/20/2021 19:38:56 - INFO - __main__ - Step 23835: {'lr': 0.00019988891236203383, 'samples': 762720, 'steps': 1489, 'loss/train': 2.9493274688720703} -09/20/2021 19:38:56 - INFO - __main__ - Step 23836: {'lr': 0.00019988891236203383, 'samples': 762752, 'steps': 1489, 'loss/train': 3.0190882682800293} -09/20/2021 19:38:57 - INFO - __main__ - Step 23837: {'lr': 0.00019988891236203383, 'samples': 762784, 'steps': 1489, 'loss/train': 3.6397950649261475} -09/20/2021 19:38:58 - INFO - __main__ - Step 23838: {'lr': 0.00019988891236203383, 'samples': 762816, 'steps': 1489, 'loss/train': 2.614004373550415} -09/20/2021 19:38:59 - INFO - __main__ - Step 23839: {'lr': 0.00019988891236203383, 'samples': 762848, 'steps': 1489, 'loss/train': 3.0525712966918945} -09/20/2021 19:38:59 - INFO - __main__ - Step 23840: {'lr': 0.00019988891236203383, 'samples': 762880, 'steps': 1489, 'loss/train': 2.8020179271698} -09/20/2021 19:39:00 - INFO - __main__ - Step 23841: {'lr': 0.00019988861157135165, 'samples': 762912, 'steps': 1490, 'loss/train': 3.3476414680480957} -09/20/2021 19:39:01 - INFO - __main__ - Step 23842: {'lr': 0.00019988861157135165, 'samples': 762944, 'steps': 1490, 'loss/train': 3.088963747024536} -09/20/2021 19:39:02 - INFO - __main__ - Step 23843: {'lr': 0.00019988861157135165, 'samples': 762976, 'steps': 1490, 'loss/train': 2.939316987991333} -09/20/2021 19:39:03 - INFO - __main__ - Step 23844: {'lr': 0.00019988861157135165, 'samples': 763008, 'steps': 1490, 'loss/train': 2.6753547191619873} -09/20/2021 19:39:04 - INFO - __main__ - Step 23845: {'lr': 0.00019988861157135165, 'samples': 763040, 'steps': 1490, 'loss/train': 2.4144535064697266} -09/20/2021 19:39:05 - INFO - __main__ - Step 23846: {'lr': 0.00019988861157135165, 'samples': 763072, 'steps': 1490, 'loss/train': 2.9502694606781006} -09/20/2021 19:39:05 - INFO - __main__ - Step 23847: {'lr': 0.00019988861157135165, 'samples': 763104, 'steps': 1490, 'loss/train': 3.2106616497039795} -09/20/2021 19:39:06 - INFO - __main__ - Step 23848: {'lr': 0.00019988861157135165, 'samples': 763136, 'steps': 1490, 'loss/train': 3.207045555114746} -09/20/2021 19:39:07 - INFO - __main__ - Step 23849: {'lr': 0.00019988861157135165, 'samples': 763168, 'steps': 1490, 'loss/train': 4.186084747314453} -09/20/2021 19:39:08 - INFO - __main__ - Step 23850: {'lr': 0.00019988861157135165, 'samples': 763200, 'steps': 1490, 'loss/train': 4.978566646575928} -09/20/2021 19:39:08 - INFO - __main__ - Step 23851: {'lr': 0.00019988861157135165, 'samples': 763232, 'steps': 1490, 'loss/train': 4.635743141174316} -09/20/2021 19:39:09 - INFO - __main__ - Step 23852: {'lr': 0.00019988861157135165, 'samples': 763264, 'steps': 1490, 'loss/train': 2.4336037635803223} -09/20/2021 19:39:10 - INFO - __main__ - Step 23853: {'lr': 0.00019988861157135165, 'samples': 763296, 'steps': 1490, 'loss/train': 3.197004556655884} -09/20/2021 19:39:11 - INFO - __main__ - Step 23854: {'lr': 0.00019988861157135165, 'samples': 763328, 'steps': 1490, 'loss/train': 3.2768630981445312} -09/20/2021 19:39:11 - INFO - __main__ - Step 23855: {'lr': 0.00019988861157135165, 'samples': 763360, 'steps': 1490, 'loss/train': 2.930431365966797} -09/20/2021 19:39:12 - INFO - __main__ - Step 23856: {'lr': 0.00019988861157135165, 'samples': 763392, 'steps': 1490, 'loss/train': 2.484147310256958} -09/20/2021 19:39:13 - INFO - __main__ - Step 23857: {'lr': 0.00019988831037422308, 'samples': 763424, 'steps': 1491, 'loss/train': 2.560028076171875} -09/20/2021 19:39:14 - INFO - __main__ - Step 23858: {'lr': 0.00019988831037422308, 'samples': 763456, 'steps': 1491, 'loss/train': 3.187736988067627} -09/20/2021 19:39:14 - INFO - __main__ - Step 23859: {'lr': 0.00019988831037422308, 'samples': 763488, 'steps': 1491, 'loss/train': 2.4477572441101074} -09/20/2021 19:39:15 - INFO - __main__ - Step 23860: {'lr': 0.00019988831037422308, 'samples': 763520, 'steps': 1491, 'loss/train': 2.565215587615967} -09/20/2021 19:39:16 - INFO - __main__ - Step 23861: {'lr': 0.00019988831037422308, 'samples': 763552, 'steps': 1491, 'loss/train': 2.6650965213775635} -09/20/2021 19:39:17 - INFO - __main__ - Step 23862: {'lr': 0.00019988831037422308, 'samples': 763584, 'steps': 1491, 'loss/train': 3.9096806049346924} -09/20/2021 19:39:17 - INFO - __main__ - Step 23863: {'lr': 0.00019988831037422308, 'samples': 763616, 'steps': 1491, 'loss/train': 2.993387460708618} -09/20/2021 19:39:18 - INFO - __main__ - Step 23864: {'lr': 0.00019988831037422308, 'samples': 763648, 'steps': 1491, 'loss/train': 2.6368916034698486} -09/20/2021 19:39:19 - INFO - __main__ - Step 23865: {'lr': 0.00019988831037422308, 'samples': 763680, 'steps': 1491, 'loss/train': 1.2747324705123901} -09/20/2021 19:39:20 - INFO - __main__ - Step 23866: {'lr': 0.00019988831037422308, 'samples': 763712, 'steps': 1491, 'loss/train': 4.334031581878662} -09/20/2021 19:39:20 - INFO - __main__ - Step 23867: {'lr': 0.00019988831037422308, 'samples': 763744, 'steps': 1491, 'loss/train': 2.4844985008239746} -09/20/2021 19:39:21 - INFO - __main__ - Step 23868: {'lr': 0.00019988831037422308, 'samples': 763776, 'steps': 1491, 'loss/train': 2.5802695751190186} -09/20/2021 19:39:22 - INFO - __main__ - Step 23869: {'lr': 0.00019988831037422308, 'samples': 763808, 'steps': 1491, 'loss/train': 2.90700101852417} -09/20/2021 19:39:23 - INFO - __main__ - Step 23870: {'lr': 0.00019988831037422308, 'samples': 763840, 'steps': 1491, 'loss/train': 2.7344861030578613} -09/20/2021 19:39:23 - INFO - __main__ - Step 23871: {'lr': 0.00019988831037422308, 'samples': 763872, 'steps': 1491, 'loss/train': 2.463510513305664} -09/20/2021 19:39:24 - INFO - __main__ - Step 23872: {'lr': 0.00019988831037422308, 'samples': 763904, 'steps': 1491, 'loss/train': 3.1552436351776123} -09/20/2021 19:39:25 - INFO - __main__ - Step 23873: {'lr': 0.00019988800877064934, 'samples': 763936, 'steps': 1492, 'loss/train': 3.452040433883667} -09/20/2021 19:39:26 - INFO - __main__ - Step 23874: {'lr': 0.00019988800877064934, 'samples': 763968, 'steps': 1492, 'loss/train': 3.2911620140075684} -09/20/2021 19:39:27 - INFO - __main__ - Step 23875: {'lr': 0.00019988800877064934, 'samples': 764000, 'steps': 1492, 'loss/train': 2.5434703826904297} -09/20/2021 19:39:28 - INFO - __main__ - Step 23876: {'lr': 0.00019988800877064934, 'samples': 764032, 'steps': 1492, 'loss/train': 2.8392302989959717} -09/20/2021 19:39:29 - INFO - __main__ - Step 23877: {'lr': 0.00019988800877064934, 'samples': 764064, 'steps': 1492, 'loss/train': 2.778108835220337} -09/20/2021 19:39:29 - INFO - __main__ - Step 23878: {'lr': 0.00019988800877064934, 'samples': 764096, 'steps': 1492, 'loss/train': 2.6968274116516113} -09/20/2021 19:39:30 - INFO - __main__ - Step 23879: {'lr': 0.00019988800877064934, 'samples': 764128, 'steps': 1492, 'loss/train': 1.2564191818237305} -09/20/2021 19:39:31 - INFO - __main__ - Step 23880: {'lr': 0.00019988800877064934, 'samples': 764160, 'steps': 1492, 'loss/train': 3.198439359664917} -09/20/2021 19:39:32 - INFO - __main__ - Step 23881: {'lr': 0.00019988800877064934, 'samples': 764192, 'steps': 1492, 'loss/train': 2.2939929962158203} -09/20/2021 19:39:32 - INFO - __main__ - Step 23882: {'lr': 0.00019988800877064934, 'samples': 764224, 'steps': 1492, 'loss/train': 3.153024435043335} -09/20/2021 19:39:33 - INFO - __main__ - Step 23883: {'lr': 0.00019988800877064934, 'samples': 764256, 'steps': 1492, 'loss/train': 3.0686750411987305} -09/20/2021 19:39:34 - INFO - __main__ - Step 23884: {'lr': 0.00019988800877064934, 'samples': 764288, 'steps': 1492, 'loss/train': 2.3785412311553955} -09/20/2021 19:39:35 - INFO - __main__ - Step 23885: {'lr': 0.00019988800877064934, 'samples': 764320, 'steps': 1492, 'loss/train': 2.9390604496002197} -09/20/2021 19:39:35 - INFO - __main__ - Step 23886: {'lr': 0.00019988800877064934, 'samples': 764352, 'steps': 1492, 'loss/train': 1.3110804557800293} -09/20/2021 19:39:36 - INFO - __main__ - Step 23887: {'lr': 0.00019988800877064934, 'samples': 764384, 'steps': 1492, 'loss/train': 1.514540195465088} -09/20/2021 19:39:37 - INFO - __main__ - Step 23888: {'lr': 0.00019988800877064934, 'samples': 764416, 'steps': 1492, 'loss/train': 4.876082897186279} -09/20/2021 19:39:38 - INFO - __main__ - Step 23889: {'lr': 0.0001998877067606317, 'samples': 764448, 'steps': 1493, 'loss/train': 4.0420823097229} -09/20/2021 19:39:39 - INFO - __main__ - Step 23890: {'lr': 0.0001998877067606317, 'samples': 764480, 'steps': 1493, 'loss/train': 0.7671093940734863} -09/20/2021 19:39:39 - INFO - __main__ - Step 23891: {'lr': 0.0001998877067606317, 'samples': 764512, 'steps': 1493, 'loss/train': 2.366961717605591} -09/20/2021 19:39:40 - INFO - __main__ - Step 23892: {'lr': 0.0001998877067606317, 'samples': 764544, 'steps': 1493, 'loss/train': 2.860722541809082} -09/20/2021 19:39:41 - INFO - __main__ - Step 23893: {'lr': 0.0001998877067606317, 'samples': 764576, 'steps': 1493, 'loss/train': 3.3117332458496094} -09/20/2021 19:39:42 - INFO - __main__ - Step 23894: {'lr': 0.0001998877067606317, 'samples': 764608, 'steps': 1493, 'loss/train': 3.358536958694458} -09/20/2021 19:39:42 - INFO - __main__ - Step 23895: {'lr': 0.0001998877067606317, 'samples': 764640, 'steps': 1493, 'loss/train': 0.9471352100372314} -09/20/2021 19:39:43 - INFO - __main__ - Step 23896: {'lr': 0.0001998877067606317, 'samples': 764672, 'steps': 1493, 'loss/train': 2.921013355255127} -09/20/2021 19:39:44 - INFO - __main__ - Step 23897: {'lr': 0.0001998877067606317, 'samples': 764704, 'steps': 1493, 'loss/train': 3.3748228549957275} -09/20/2021 19:39:45 - INFO - __main__ - Step 23898: {'lr': 0.0001998877067606317, 'samples': 764736, 'steps': 1493, 'loss/train': 2.322577714920044} -09/20/2021 19:39:45 - INFO - __main__ - Step 23899: {'lr': 0.0001998877067606317, 'samples': 764768, 'steps': 1493, 'loss/train': 2.8708016872406006} -09/20/2021 19:39:46 - INFO - __main__ - Step 23900: {'lr': 0.0001998877067606317, 'samples': 764800, 'steps': 1493, 'loss/train': 3.3275041580200195} -09/20/2021 19:39:47 - INFO - __main__ - Step 23901: {'lr': 0.0001998877067606317, 'samples': 764832, 'steps': 1493, 'loss/train': 2.526413679122925} -09/20/2021 19:39:48 - INFO - __main__ - Step 23902: {'lr': 0.0001998877067606317, 'samples': 764864, 'steps': 1493, 'loss/train': 3.4502532482147217} -09/20/2021 19:39:48 - INFO - __main__ - Step 23903: {'lr': 0.0001998877067606317, 'samples': 764896, 'steps': 1493, 'loss/train': 3.323315382003784} -09/20/2021 19:39:49 - INFO - __main__ - Step 23904: {'lr': 0.0001998877067606317, 'samples': 764928, 'steps': 1493, 'loss/train': 2.514273166656494} -09/20/2021 19:39:50 - INFO - __main__ - Step 23905: {'lr': 0.00019988740434417136, 'samples': 764960, 'steps': 1494, 'loss/train': 2.2013912200927734} -09/20/2021 19:39:51 - INFO - __main__ - Step 23906: {'lr': 0.00019988740434417136, 'samples': 764992, 'steps': 1494, 'loss/train': 2.811828136444092} -09/20/2021 19:39:51 - INFO - __main__ - Step 23907: {'lr': 0.00019988740434417136, 'samples': 765024, 'steps': 1494, 'loss/train': 3.4290950298309326} -09/20/2021 19:39:53 - INFO - __main__ - Step 23908: {'lr': 0.00019988740434417136, 'samples': 765056, 'steps': 1494, 'loss/train': 3.0338709354400635} -09/20/2021 19:39:53 - INFO - __main__ - Step 23909: {'lr': 0.00019988740434417136, 'samples': 765088, 'steps': 1494, 'loss/train': 3.943359613418579} -09/20/2021 19:39:54 - INFO - __main__ - Step 23910: {'lr': 0.00019988740434417136, 'samples': 765120, 'steps': 1494, 'loss/train': 1.9677841663360596} -09/20/2021 19:39:55 - INFO - __main__ - Step 23911: {'lr': 0.00019988740434417136, 'samples': 765152, 'steps': 1494, 'loss/train': 2.889524221420288} -09/20/2021 19:39:56 - INFO - __main__ - Step 23912: {'lr': 0.00019988740434417136, 'samples': 765184, 'steps': 1494, 'loss/train': 2.3087332248687744} -09/20/2021 19:39:56 - INFO - __main__ - Step 23913: {'lr': 0.00019988740434417136, 'samples': 765216, 'steps': 1494, 'loss/train': 2.000221014022827} -09/20/2021 19:39:57 - INFO - __main__ - Step 23914: {'lr': 0.00019988740434417136, 'samples': 765248, 'steps': 1494, 'loss/train': 3.054905891418457} -09/20/2021 19:39:58 - INFO - __main__ - Step 23915: {'lr': 0.00019988740434417136, 'samples': 765280, 'steps': 1494, 'loss/train': 2.7467565536499023} -09/20/2021 19:39:59 - INFO - __main__ - Step 23916: {'lr': 0.00019988740434417136, 'samples': 765312, 'steps': 1494, 'loss/train': 2.9906439781188965} -09/20/2021 19:39:59 - INFO - __main__ - Step 23917: {'lr': 0.00019988740434417136, 'samples': 765344, 'steps': 1494, 'loss/train': 3.502234935760498} -09/20/2021 19:40:00 - INFO - __main__ - Step 23918: {'lr': 0.00019988740434417136, 'samples': 765376, 'steps': 1494, 'loss/train': 2.900764226913452} -09/20/2021 19:40:01 - INFO - __main__ - Step 23919: {'lr': 0.00019988740434417136, 'samples': 765408, 'steps': 1494, 'loss/train': 2.1901135444641113} -09/20/2021 19:40:02 - INFO - __main__ - Step 23920: {'lr': 0.00019988740434417136, 'samples': 765440, 'steps': 1494, 'loss/train': 2.9222097396850586} -09/20/2021 19:40:03 - INFO - __main__ - Step 23921: {'lr': 0.00019988710152126955, 'samples': 765472, 'steps': 1495, 'loss/train': 3.0049514770507812} -09/20/2021 19:40:03 - INFO - __main__ - Step 23922: {'lr': 0.00019988710152126955, 'samples': 765504, 'steps': 1495, 'loss/train': 2.6035776138305664} -09/20/2021 19:40:04 - INFO - __main__ - Step 23923: {'lr': 0.00019988710152126955, 'samples': 765536, 'steps': 1495, 'loss/train': 3.07409930229187} -09/20/2021 19:40:05 - INFO - __main__ - Step 23924: {'lr': 0.00019988710152126955, 'samples': 765568, 'steps': 1495, 'loss/train': 2.1103835105895996} -09/20/2021 19:40:06 - INFO - __main__ - Step 23925: {'lr': 0.00019988710152126955, 'samples': 765600, 'steps': 1495, 'loss/train': 3.149024486541748} -09/20/2021 19:40:06 - INFO - __main__ - Step 23926: {'lr': 0.00019988710152126955, 'samples': 765632, 'steps': 1495, 'loss/train': 2.4492454528808594} -09/20/2021 19:40:07 - INFO - __main__ - Step 23927: {'lr': 0.00019988710152126955, 'samples': 765664, 'steps': 1495, 'loss/train': 3.5572590827941895} -09/20/2021 19:40:08 - INFO - __main__ - Step 23928: {'lr': 0.00019988710152126955, 'samples': 765696, 'steps': 1495, 'loss/train': 1.487596035003662} -09/20/2021 19:40:09 - INFO - __main__ - Step 23929: {'lr': 0.00019988710152126955, 'samples': 765728, 'steps': 1495, 'loss/train': 3.0720608234405518} -09/20/2021 19:40:09 - INFO - __main__ - Step 23930: {'lr': 0.00019988710152126955, 'samples': 765760, 'steps': 1495, 'loss/train': 2.8391871452331543} -09/20/2021 19:40:10 - INFO - __main__ - Step 23931: {'lr': 0.00019988710152126955, 'samples': 765792, 'steps': 1495, 'loss/train': 2.070051431655884} -09/20/2021 19:40:11 - INFO - __main__ - Step 23932: {'lr': 0.00019988710152126955, 'samples': 765824, 'steps': 1495, 'loss/train': 2.583791494369507} -09/20/2021 19:40:12 - INFO - __main__ - Step 23933: {'lr': 0.00019988710152126955, 'samples': 765856, 'steps': 1495, 'loss/train': 2.9237253665924072} -09/20/2021 19:40:12 - INFO - __main__ - Step 23934: {'lr': 0.00019988710152126955, 'samples': 765888, 'steps': 1495, 'loss/train': 2.3331429958343506} -09/20/2021 19:40:13 - INFO - __main__ - Step 23935: {'lr': 0.00019988710152126955, 'samples': 765920, 'steps': 1495, 'loss/train': 0.8499552607536316} -09/20/2021 19:40:14 - INFO - __main__ - Step 23936: {'lr': 0.00019988710152126955, 'samples': 765952, 'steps': 1495, 'loss/train': 2.8379414081573486} -09/20/2021 19:40:15 - INFO - __main__ - Step 23937: {'lr': 0.00019988679829192755, 'samples': 765984, 'steps': 1496, 'loss/train': 2.688667058944702} -09/20/2021 19:40:16 - INFO - __main__ - Step 23938: {'lr': 0.00019988679829192755, 'samples': 766016, 'steps': 1496, 'loss/train': 2.5348565578460693} -09/20/2021 19:40:17 - INFO - __main__ - Step 23939: {'lr': 0.00019988679829192755, 'samples': 766048, 'steps': 1496, 'loss/train': 3.5709526538848877} -09/20/2021 19:40:18 - INFO - __main__ - Step 23940: {'lr': 0.00019988679829192755, 'samples': 766080, 'steps': 1496, 'loss/train': 3.145765542984009} -09/20/2021 19:40:19 - INFO - __main__ - Step 23941: {'lr': 0.00019988679829192755, 'samples': 766112, 'steps': 1496, 'loss/train': 2.3751535415649414} -09/20/2021 19:40:19 - INFO - __main__ - Step 23942: {'lr': 0.00019988679829192755, 'samples': 766144, 'steps': 1496, 'loss/train': 2.5344362258911133} -09/20/2021 19:40:20 - INFO - __main__ - Step 23943: {'lr': 0.00019988679829192755, 'samples': 766176, 'steps': 1496, 'loss/train': 3.0199923515319824} -09/20/2021 19:40:21 - INFO - __main__ - Step 23944: {'lr': 0.00019988679829192755, 'samples': 766208, 'steps': 1496, 'loss/train': 3.027304172515869} -09/20/2021 19:40:22 - INFO - __main__ - Step 23945: {'lr': 0.00019988679829192755, 'samples': 766240, 'steps': 1496, 'loss/train': 2.956254482269287} -09/20/2021 19:40:22 - INFO - __main__ - Step 23946: {'lr': 0.00019988679829192755, 'samples': 766272, 'steps': 1496, 'loss/train': 3.018590211868286} -09/20/2021 19:40:23 - INFO - __main__ - Step 23947: {'lr': 0.00019988679829192755, 'samples': 766304, 'steps': 1496, 'loss/train': 2.851071357727051} -09/20/2021 19:40:24 - INFO - __main__ - Step 23948: {'lr': 0.00019988679829192755, 'samples': 766336, 'steps': 1496, 'loss/train': 3.2006349563598633} -09/20/2021 19:40:25 - INFO - __main__ - Step 23949: {'lr': 0.00019988679829192755, 'samples': 766368, 'steps': 1496, 'loss/train': 2.89707612991333} -09/20/2021 19:40:25 - INFO - __main__ - Step 23950: {'lr': 0.00019988679829192755, 'samples': 766400, 'steps': 1496, 'loss/train': 3.2535932064056396} -09/20/2021 19:40:26 - INFO - __main__ - Step 23951: {'lr': 0.00019988679829192755, 'samples': 766432, 'steps': 1496, 'loss/train': 3.3170652389526367} -09/20/2021 19:40:27 - INFO - __main__ - Step 23952: {'lr': 0.00019988679829192755, 'samples': 766464, 'steps': 1496, 'loss/train': 2.6526401042938232} -09/20/2021 19:40:28 - INFO - __main__ - Step 23953: {'lr': 0.0001998864946561465, 'samples': 766496, 'steps': 1497, 'loss/train': 3.880727529525757} -09/20/2021 19:40:29 - INFO - __main__ - Step 23954: {'lr': 0.0001998864946561465, 'samples': 766528, 'steps': 1497, 'loss/train': 2.8747572898864746} -09/20/2021 19:40:29 - INFO - __main__ - Step 23955: {'lr': 0.0001998864946561465, 'samples': 766560, 'steps': 1497, 'loss/train': 3.323953628540039} -09/20/2021 19:40:30 - INFO - __main__ - Step 23956: {'lr': 0.0001998864946561465, 'samples': 766592, 'steps': 1497, 'loss/train': 2.9025793075561523} -09/20/2021 19:40:31 - INFO - __main__ - Step 23957: {'lr': 0.0001998864946561465, 'samples': 766624, 'steps': 1497, 'loss/train': 3.3265140056610107} -09/20/2021 19:40:32 - INFO - __main__ - Step 23958: {'lr': 0.0001998864946561465, 'samples': 766656, 'steps': 1497, 'loss/train': 1.170691967010498} -09/20/2021 19:40:32 - INFO - __main__ - Step 23959: {'lr': 0.0001998864946561465, 'samples': 766688, 'steps': 1497, 'loss/train': 3.414311647415161} -09/20/2021 19:40:33 - INFO - __main__ - Step 23960: {'lr': 0.0001998864946561465, 'samples': 766720, 'steps': 1497, 'loss/train': 2.127831220626831} -09/20/2021 19:40:34 - INFO - __main__ - Step 23961: {'lr': 0.0001998864946561465, 'samples': 766752, 'steps': 1497, 'loss/train': 3.586575508117676} -09/20/2021 19:40:35 - INFO - __main__ - Step 23962: {'lr': 0.0001998864946561465, 'samples': 766784, 'steps': 1497, 'loss/train': 2.982299327850342} -09/20/2021 19:40:35 - INFO - __main__ - Step 23963: {'lr': 0.0001998864946561465, 'samples': 766816, 'steps': 1497, 'loss/train': 2.8950393199920654} -09/20/2021 19:40:36 - INFO - __main__ - Step 23964: {'lr': 0.0001998864946561465, 'samples': 766848, 'steps': 1497, 'loss/train': 2.957991600036621} -09/20/2021 19:40:37 - INFO - __main__ - Step 23965: {'lr': 0.0001998864946561465, 'samples': 766880, 'steps': 1497, 'loss/train': 3.0221469402313232} -09/20/2021 19:40:38 - INFO - __main__ - Step 23966: {'lr': 0.0001998864946561465, 'samples': 766912, 'steps': 1497, 'loss/train': 3.3647494316101074} -09/20/2021 19:40:38 - INFO - __main__ - Step 23967: {'lr': 0.0001998864946561465, 'samples': 766944, 'steps': 1497, 'loss/train': 3.045231342315674} -09/20/2021 19:40:39 - INFO - __main__ - Step 23968: {'lr': 0.0001998864946561465, 'samples': 766976, 'steps': 1497, 'loss/train': 3.4019384384155273} -09/20/2021 19:40:40 - INFO - __main__ - Step 23969: {'lr': 0.00019988619061392775, 'samples': 767008, 'steps': 1498, 'loss/train': 2.3838508129119873} -09/20/2021 19:40:41 - INFO - __main__ - Step 23970: {'lr': 0.00019988619061392775, 'samples': 767040, 'steps': 1498, 'loss/train': 3.218726396560669} -09/20/2021 19:40:42 - INFO - __main__ - Step 23971: {'lr': 0.00019988619061392775, 'samples': 767072, 'steps': 1498, 'loss/train': 2.508636713027954} -09/20/2021 19:40:43 - INFO - __main__ - Step 23972: {'lr': 0.00019988619061392775, 'samples': 767104, 'steps': 1498, 'loss/train': 3.5811073780059814} -09/20/2021 19:40:44 - INFO - __main__ - Step 23973: {'lr': 0.00019988619061392775, 'samples': 767136, 'steps': 1498, 'loss/train': 4.02132511138916} -09/20/2021 19:40:45 - INFO - __main__ - Step 23974: {'lr': 0.00019988619061392775, 'samples': 767168, 'steps': 1498, 'loss/train': 2.938415288925171} -09/20/2021 19:40:45 - INFO - __main__ - Step 23975: {'lr': 0.00019988619061392775, 'samples': 767200, 'steps': 1498, 'loss/train': 2.773813009262085} -09/20/2021 19:40:46 - INFO - __main__ - Step 23976: {'lr': 0.00019988619061392775, 'samples': 767232, 'steps': 1498, 'loss/train': 4.124123573303223} -09/20/2021 19:40:47 - INFO - __main__ - Step 23977: {'lr': 0.00019988619061392775, 'samples': 767264, 'steps': 1498, 'loss/train': 2.7392709255218506} -09/20/2021 19:40:48 - INFO - __main__ - Step 23978: {'lr': 0.00019988619061392775, 'samples': 767296, 'steps': 1498, 'loss/train': 3.6542625427246094} -09/20/2021 19:40:48 - INFO - __main__ - Step 23979: {'lr': 0.00019988619061392775, 'samples': 767328, 'steps': 1498, 'loss/train': 2.7727010250091553} -09/20/2021 19:40:49 - INFO - __main__ - Step 23980: {'lr': 0.00019988619061392775, 'samples': 767360, 'steps': 1498, 'loss/train': 3.352618455886841} -09/20/2021 19:40:50 - INFO - __main__ - Step 23981: {'lr': 0.00019988619061392775, 'samples': 767392, 'steps': 1498, 'loss/train': 3.3600802421569824} -09/20/2021 19:40:51 - INFO - __main__ - Step 23982: {'lr': 0.00019988619061392775, 'samples': 767424, 'steps': 1498, 'loss/train': 3.042384147644043} -09/20/2021 19:40:51 - INFO - __main__ - Step 23983: {'lr': 0.00019988619061392775, 'samples': 767456, 'steps': 1498, 'loss/train': 3.0985724925994873} -09/20/2021 19:40:52 - INFO - __main__ - Step 23984: {'lr': 0.00019988619061392775, 'samples': 767488, 'steps': 1498, 'loss/train': 2.9528372287750244} -09/20/2021 19:40:53 - INFO - __main__ - Step 23985: {'lr': 0.00019988588616527244, 'samples': 767520, 'steps': 1499, 'loss/train': 3.608891487121582} -09/20/2021 19:40:54 - INFO - __main__ - Step 23986: {'lr': 0.00019988588616527244, 'samples': 767552, 'steps': 1499, 'loss/train': 2.328745126724243} -09/20/2021 19:40:55 - INFO - __main__ - Step 23987: {'lr': 0.00019988588616527244, 'samples': 767584, 'steps': 1499, 'loss/train': 2.315208673477173} -09/20/2021 19:40:55 - INFO - __main__ - Step 23988: {'lr': 0.00019988588616527244, 'samples': 767616, 'steps': 1499, 'loss/train': 2.5703988075256348} -09/20/2021 19:40:56 - INFO - __main__ - Step 23989: {'lr': 0.00019988588616527244, 'samples': 767648, 'steps': 1499, 'loss/train': 4.114778995513916} -09/20/2021 19:40:57 - INFO - __main__ - Step 23990: {'lr': 0.00019988588616527244, 'samples': 767680, 'steps': 1499, 'loss/train': 3.231403112411499} -09/20/2021 19:40:58 - INFO - __main__ - Step 23991: {'lr': 0.00019988588616527244, 'samples': 767712, 'steps': 1499, 'loss/train': 4.820252418518066} -09/20/2021 19:40:58 - INFO - __main__ - Step 23992: {'lr': 0.00019988588616527244, 'samples': 767744, 'steps': 1499, 'loss/train': 2.3717386722564697} -09/20/2021 19:40:59 - INFO - __main__ - Step 23993: {'lr': 0.00019988588616527244, 'samples': 767776, 'steps': 1499, 'loss/train': 3.1393277645111084} -09/20/2021 19:41:00 - INFO - __main__ - Step 23994: {'lr': 0.00019988588616527244, 'samples': 767808, 'steps': 1499, 'loss/train': 3.1898319721221924} -09/20/2021 19:41:01 - INFO - __main__ - Step 23995: {'lr': 0.00019988588616527244, 'samples': 767840, 'steps': 1499, 'loss/train': 1.92160165309906} -09/20/2021 19:41:01 - INFO - __main__ - Step 23996: {'lr': 0.00019988588616527244, 'samples': 767872, 'steps': 1499, 'loss/train': 2.887289524078369} -09/20/2021 19:41:02 - INFO - __main__ - Step 23997: {'lr': 0.00019988588616527244, 'samples': 767904, 'steps': 1499, 'loss/train': 3.105558395385742} -09/20/2021 19:41:03 - INFO - __main__ - Step 23998: {'lr': 0.00019988588616527244, 'samples': 767936, 'steps': 1499, 'loss/train': 2.4829976558685303} -09/20/2021 19:41:04 - INFO - __main__ - Step 23999: {'lr': 0.00019988588616527244, 'samples': 767968, 'steps': 1499, 'loss/train': 2.6339380741119385} -09/20/2021 19:41:04 - INFO - __main__ - Step 24000: {'lr': 0.00019988588616527244, 'samples': 768000, 'steps': 1499, 'loss/train': 3.1081364154815674} -09/20/2021 19:41:05 - INFO - __main__ - Step 24001: {'lr': 0.00019988558131018186, 'samples': 768032, 'steps': 1500, 'loss/train': 3.5233452320098877} -09/20/2021 19:41:07 - INFO - __main__ - Step 24002: {'lr': 0.00019988558131018186, 'samples': 768064, 'steps': 1500, 'loss/train': 2.324453830718994} -09/20/2021 19:41:07 - INFO - __main__ - Step 24003: {'lr': 0.00019988558131018186, 'samples': 768096, 'steps': 1500, 'loss/train': 2.6982526779174805} -09/20/2021 19:41:08 - INFO - __main__ - Step 24004: {'lr': 0.00019988558131018186, 'samples': 768128, 'steps': 1500, 'loss/train': 2.9669227600097656} -09/20/2021 19:41:09 - INFO - __main__ - Step 24005: {'lr': 0.00019988558131018186, 'samples': 768160, 'steps': 1500, 'loss/train': 2.8798751831054688} -09/20/2021 19:41:10 - INFO - __main__ - Step 24006: {'lr': 0.00019988558131018186, 'samples': 768192, 'steps': 1500, 'loss/train': 2.9396398067474365} -09/20/2021 19:41:10 - INFO - __main__ - Step 24007: {'lr': 0.00019988558131018186, 'samples': 768224, 'steps': 1500, 'loss/train': 3.0661678314208984} -09/20/2021 19:41:11 - INFO - __main__ - Step 24008: {'lr': 0.00019988558131018186, 'samples': 768256, 'steps': 1500, 'loss/train': 2.038759469985962} -09/20/2021 19:41:12 - INFO - __main__ - Step 24009: {'lr': 0.00019988558131018186, 'samples': 768288, 'steps': 1500, 'loss/train': 3.008472204208374} -09/20/2021 19:41:13 - INFO - __main__ - Step 24010: {'lr': 0.00019988558131018186, 'samples': 768320, 'steps': 1500, 'loss/train': 2.7863340377807617} -09/20/2021 19:41:13 - INFO - __main__ - Step 24011: {'lr': 0.00019988558131018186, 'samples': 768352, 'steps': 1500, 'loss/train': 3.3089046478271484} -09/20/2021 19:41:14 - INFO - __main__ - Step 24012: {'lr': 0.00019988558131018186, 'samples': 768384, 'steps': 1500, 'loss/train': 2.8015682697296143} -09/20/2021 19:41:15 - INFO - __main__ - Step 24013: {'lr': 0.00019988558131018186, 'samples': 768416, 'steps': 1500, 'loss/train': 2.437026023864746} -09/20/2021 19:41:16 - INFO - __main__ - Step 24014: {'lr': 0.00019988558131018186, 'samples': 768448, 'steps': 1500, 'loss/train': 4.475440979003906} -09/20/2021 19:41:16 - INFO - __main__ - Step 24015: {'lr': 0.00019988558131018186, 'samples': 768480, 'steps': 1500, 'loss/train': 0.7228338718414307} -09/20/2021 19:41:17 - INFO - __main__ - Step 24016: {'lr': 0.00019988558131018186, 'samples': 768512, 'steps': 1500, 'loss/train': 2.97762393951416} -09/20/2021 19:41:18 - INFO - __main__ - Step 24017: {'lr': 0.00019988527604865723, 'samples': 768544, 'steps': 1501, 'loss/train': 3.474684715270996} -09/20/2021 19:41:19 - INFO - __main__ - Step 24018: {'lr': 0.00019988527604865723, 'samples': 768576, 'steps': 1501, 'loss/train': 2.2970893383026123} -09/20/2021 19:41:20 - INFO - __main__ - Step 24019: {'lr': 0.00019988527604865723, 'samples': 768608, 'steps': 1501, 'loss/train': 3.309142589569092} -09/20/2021 19:41:20 - INFO - __main__ - Step 24020: {'lr': 0.00019988527604865723, 'samples': 768640, 'steps': 1501, 'loss/train': 2.132091760635376} -09/20/2021 19:41:21 - INFO - __main__ - Step 24021: {'lr': 0.00019988527604865723, 'samples': 768672, 'steps': 1501, 'loss/train': 3.1776795387268066} -09/20/2021 19:41:22 - INFO - __main__ - Step 24022: {'lr': 0.00019988527604865723, 'samples': 768704, 'steps': 1501, 'loss/train': 2.831866979598999} -09/20/2021 19:41:23 - INFO - __main__ - Step 24023: {'lr': 0.00019988527604865723, 'samples': 768736, 'steps': 1501, 'loss/train': 3.735553741455078} -09/20/2021 19:41:23 - INFO - __main__ - Step 24024: {'lr': 0.00019988527604865723, 'samples': 768768, 'steps': 1501, 'loss/train': 2.8227076530456543} -09/20/2021 19:41:24 - INFO - __main__ - Step 24025: {'lr': 0.00019988527604865723, 'samples': 768800, 'steps': 1501, 'loss/train': 3.882685422897339} -09/20/2021 19:41:25 - INFO - __main__ - Step 24026: {'lr': 0.00019988527604865723, 'samples': 768832, 'steps': 1501, 'loss/train': 2.220327854156494} -09/20/2021 19:41:26 - INFO - __main__ - Step 24027: {'lr': 0.00019988527604865723, 'samples': 768864, 'steps': 1501, 'loss/train': 3.5024685859680176} -09/20/2021 19:41:26 - INFO - __main__ - Step 24028: {'lr': 0.00019988527604865723, 'samples': 768896, 'steps': 1501, 'loss/train': 2.2381486892700195} -09/20/2021 19:41:27 - INFO - __main__ - Step 24029: {'lr': 0.00019988527604865723, 'samples': 768928, 'steps': 1501, 'loss/train': 3.829284429550171} -09/20/2021 19:41:28 - INFO - __main__ - Step 24030: {'lr': 0.00019988527604865723, 'samples': 768960, 'steps': 1501, 'loss/train': 3.5603854656219482} -09/20/2021 19:41:29 - INFO - __main__ - Step 24031: {'lr': 0.00019988527604865723, 'samples': 768992, 'steps': 1501, 'loss/train': 3.237516164779663} -09/20/2021 19:41:30 - INFO - __main__ - Step 24032: {'lr': 0.00019988527604865723, 'samples': 769024, 'steps': 1501, 'loss/train': 3.137941837310791} -09/20/2021 19:41:31 - INFO - __main__ - Step 24033: {'lr': 0.0001998849703806998, 'samples': 769056, 'steps': 1502, 'loss/train': 1.9593629837036133} -09/20/2021 19:41:31 - INFO - __main__ - Step 24034: {'lr': 0.0001998849703806998, 'samples': 769088, 'steps': 1502, 'loss/train': 3.023543357849121} -09/20/2021 19:41:32 - INFO - __main__ - Step 24035: {'lr': 0.0001998849703806998, 'samples': 769120, 'steps': 1502, 'loss/train': 2.7226383686065674} -09/20/2021 19:41:33 - INFO - __main__ - Step 24036: {'lr': 0.0001998849703806998, 'samples': 769152, 'steps': 1502, 'loss/train': 2.4437766075134277} -09/20/2021 19:41:34 - INFO - __main__ - Step 24037: {'lr': 0.0001998849703806998, 'samples': 769184, 'steps': 1502, 'loss/train': 3.3010313510894775} -09/20/2021 19:41:34 - INFO - __main__ - Step 24038: {'lr': 0.0001998849703806998, 'samples': 769216, 'steps': 1502, 'loss/train': 2.5992822647094727} -09/20/2021 19:41:35 - INFO - __main__ - Step 24039: {'lr': 0.0001998849703806998, 'samples': 769248, 'steps': 1502, 'loss/train': 2.835766553878784} -09/20/2021 19:41:36 - INFO - __main__ - Step 24040: {'lr': 0.0001998849703806998, 'samples': 769280, 'steps': 1502, 'loss/train': 3.202043056488037} -09/20/2021 19:41:37 - INFO - __main__ - Step 24041: {'lr': 0.0001998849703806998, 'samples': 769312, 'steps': 1502, 'loss/train': 1.9399350881576538} -09/20/2021 19:41:37 - INFO - __main__ - Step 24042: {'lr': 0.0001998849703806998, 'samples': 769344, 'steps': 1502, 'loss/train': 3.208979606628418} -09/20/2021 19:41:38 - INFO - __main__ - Step 24043: {'lr': 0.0001998849703806998, 'samples': 769376, 'steps': 1502, 'loss/train': 3.2106876373291016} -09/20/2021 19:41:39 - INFO - __main__ - Step 24044: {'lr': 0.0001998849703806998, 'samples': 769408, 'steps': 1502, 'loss/train': 3.614475727081299} -09/20/2021 19:41:40 - INFO - __main__ - Step 24045: {'lr': 0.0001998849703806998, 'samples': 769440, 'steps': 1502, 'loss/train': 2.6428425312042236} -09/20/2021 19:41:40 - INFO - __main__ - Step 24046: {'lr': 0.0001998849703806998, 'samples': 769472, 'steps': 1502, 'loss/train': 3.265857458114624} -09/20/2021 19:41:41 - INFO - __main__ - Step 24047: {'lr': 0.0001998849703806998, 'samples': 769504, 'steps': 1502, 'loss/train': 3.3644938468933105} -09/20/2021 19:41:42 - INFO - __main__ - Step 24048: {'lr': 0.0001998849703806998, 'samples': 769536, 'steps': 1502, 'loss/train': 2.9268622398376465} -09/20/2021 19:41:43 - INFO - __main__ - Step 24049: {'lr': 0.00019988466430631083, 'samples': 769568, 'steps': 1503, 'loss/train': 4.199034214019775} -09/20/2021 19:41:44 - INFO - __main__ - Step 24050: {'lr': 0.00019988466430631083, 'samples': 769600, 'steps': 1503, 'loss/train': 3.784637689590454} -09/20/2021 19:41:44 - INFO - __main__ - Step 24051: {'lr': 0.00019988466430631083, 'samples': 769632, 'steps': 1503, 'loss/train': 2.1978487968444824} -09/20/2021 19:41:45 - INFO - __main__ - Step 24052: {'lr': 0.00019988466430631083, 'samples': 769664, 'steps': 1503, 'loss/train': 2.9207680225372314} -09/20/2021 19:41:46 - INFO - __main__ - Step 24053: {'lr': 0.00019988466430631083, 'samples': 769696, 'steps': 1503, 'loss/train': 3.3612728118896484} -09/20/2021 19:41:47 - INFO - __main__ - Step 24054: {'lr': 0.00019988466430631083, 'samples': 769728, 'steps': 1503, 'loss/train': 2.880032539367676} -09/20/2021 19:41:47 - INFO - __main__ - Step 24055: {'lr': 0.00019988466430631083, 'samples': 769760, 'steps': 1503, 'loss/train': 3.3807990550994873} -09/20/2021 19:41:48 - INFO - __main__ - Step 24056: {'lr': 0.00019988466430631083, 'samples': 769792, 'steps': 1503, 'loss/train': 3.328087329864502} -09/20/2021 19:41:49 - INFO - __main__ - Step 24057: {'lr': 0.00019988466430631083, 'samples': 769824, 'steps': 1503, 'loss/train': 1.687588095664978} -09/20/2021 19:41:50 - INFO - __main__ - Step 24058: {'lr': 0.00019988466430631083, 'samples': 769856, 'steps': 1503, 'loss/train': 2.4924817085266113} -09/20/2021 19:41:50 - INFO - __main__ - Step 24059: {'lr': 0.00019988466430631083, 'samples': 769888, 'steps': 1503, 'loss/train': 2.5640759468078613} -09/20/2021 19:41:51 - INFO - __main__ - Step 24060: {'lr': 0.00019988466430631083, 'samples': 769920, 'steps': 1503, 'loss/train': 3.337162494659424} -09/20/2021 19:41:52 - INFO - __main__ - Step 24061: {'lr': 0.00019988466430631083, 'samples': 769952, 'steps': 1503, 'loss/train': 1.939471960067749} -09/20/2021 19:41:53 - INFO - __main__ - Step 24062: {'lr': 0.00019988466430631083, 'samples': 769984, 'steps': 1503, 'loss/train': 2.9239203929901123} -09/20/2021 19:41:54 - INFO - __main__ - Step 24063: {'lr': 0.00019988466430631083, 'samples': 770016, 'steps': 1503, 'loss/train': 3.2995662689208984} -09/20/2021 19:41:55 - INFO - __main__ - Step 24064: {'lr': 0.00019988466430631083, 'samples': 770048, 'steps': 1503, 'loss/train': 3.2490222454071045} -09/20/2021 19:41:56 - INFO - __main__ - Step 24065: {'lr': 0.00019988435782549154, 'samples': 770080, 'steps': 1504, 'loss/train': 3.517608642578125} -09/20/2021 19:41:56 - INFO - __main__ - Step 24066: {'lr': 0.00019988435782549154, 'samples': 770112, 'steps': 1504, 'loss/train': 3.005110502243042} -09/20/2021 19:41:57 - INFO - __main__ - Step 24067: {'lr': 0.00019988435782549154, 'samples': 770144, 'steps': 1504, 'loss/train': 3.5760250091552734} -09/20/2021 19:41:58 - INFO - __main__ - Step 24068: {'lr': 0.00019988435782549154, 'samples': 770176, 'steps': 1504, 'loss/train': 3.891033411026001} -09/20/2021 19:41:59 - INFO - __main__ - Step 24069: {'lr': 0.00019988435782549154, 'samples': 770208, 'steps': 1504, 'loss/train': 3.4599623680114746} -09/20/2021 19:41:59 - INFO - __main__ - Step 24070: {'lr': 0.00019988435782549154, 'samples': 770240, 'steps': 1504, 'loss/train': 2.9316632747650146} -09/20/2021 19:42:00 - INFO - __main__ - Step 24071: {'lr': 0.00019988435782549154, 'samples': 770272, 'steps': 1504, 'loss/train': 2.021476984024048} -09/20/2021 19:42:01 - INFO - __main__ - Step 24072: {'lr': 0.00019988435782549154, 'samples': 770304, 'steps': 1504, 'loss/train': 3.093207836151123} -09/20/2021 19:42:02 - INFO - __main__ - Step 24073: {'lr': 0.00019988435782549154, 'samples': 770336, 'steps': 1504, 'loss/train': 0.985384464263916} -09/20/2021 19:42:02 - INFO - __main__ - Step 24074: {'lr': 0.00019988435782549154, 'samples': 770368, 'steps': 1504, 'loss/train': 1.2015384435653687} -09/20/2021 19:42:03 - INFO - __main__ - Step 24075: {'lr': 0.00019988435782549154, 'samples': 770400, 'steps': 1504, 'loss/train': 1.1482105255126953} -09/20/2021 19:42:04 - INFO - __main__ - Step 24076: {'lr': 0.00019988435782549154, 'samples': 770432, 'steps': 1504, 'loss/train': 4.136005878448486} -09/20/2021 19:42:05 - INFO - __main__ - Step 24077: {'lr': 0.00019988435782549154, 'samples': 770464, 'steps': 1504, 'loss/train': 2.4873085021972656} -09/20/2021 19:42:05 - INFO - __main__ - Step 24078: {'lr': 0.00019988435782549154, 'samples': 770496, 'steps': 1504, 'loss/train': 3.507960319519043} -09/20/2021 19:42:06 - INFO - __main__ - Step 24079: {'lr': 0.00019988435782549154, 'samples': 770528, 'steps': 1504, 'loss/train': 3.405855894088745} -09/20/2021 19:42:07 - INFO - __main__ - Step 24080: {'lr': 0.00019988435782549154, 'samples': 770560, 'steps': 1504, 'loss/train': 2.0847833156585693} -09/20/2021 19:42:08 - INFO - __main__ - Step 24081: {'lr': 0.00019988405093824318, 'samples': 770592, 'steps': 1505, 'loss/train': 2.5981011390686035} -09/20/2021 19:42:08 - INFO - __main__ - Step 24082: {'lr': 0.00019988405093824318, 'samples': 770624, 'steps': 1505, 'loss/train': 3.2042949199676514} -09/20/2021 19:42:09 - INFO - __main__ - Step 24083: {'lr': 0.00019988405093824318, 'samples': 770656, 'steps': 1505, 'loss/train': 0.7960239052772522} -09/20/2021 19:42:10 - INFO - __main__ - Step 24084: {'lr': 0.00019988405093824318, 'samples': 770688, 'steps': 1505, 'loss/train': 2.951319694519043} -09/20/2021 19:42:11 - INFO - __main__ - Step 24085: {'lr': 0.00019988405093824318, 'samples': 770720, 'steps': 1505, 'loss/train': 3.53159236907959} -09/20/2021 19:42:11 - INFO - __main__ - Step 24086: {'lr': 0.00019988405093824318, 'samples': 770752, 'steps': 1505, 'loss/train': 2.5617294311523438} -09/20/2021 19:42:12 - INFO - __main__ - Step 24087: {'lr': 0.00019988405093824318, 'samples': 770784, 'steps': 1505, 'loss/train': 3.045258045196533} -09/20/2021 19:42:13 - INFO - __main__ - Step 24088: {'lr': 0.00019988405093824318, 'samples': 770816, 'steps': 1505, 'loss/train': 3.335503578186035} -09/20/2021 19:42:14 - INFO - __main__ - Step 24089: {'lr': 0.00019988405093824318, 'samples': 770848, 'steps': 1505, 'loss/train': 3.067121744155884} -09/20/2021 19:42:14 - INFO - __main__ - Step 24090: {'lr': 0.00019988405093824318, 'samples': 770880, 'steps': 1505, 'loss/train': 2.9534785747528076} -09/20/2021 19:42:15 - INFO - __main__ - Step 24091: {'lr': 0.00019988405093824318, 'samples': 770912, 'steps': 1505, 'loss/train': 2.8957107067108154} -09/20/2021 19:42:16 - INFO - __main__ - Step 24092: {'lr': 0.00019988405093824318, 'samples': 770944, 'steps': 1505, 'loss/train': 2.1964147090911865} -09/20/2021 19:42:17 - INFO - __main__ - Step 24093: {'lr': 0.00019988405093824318, 'samples': 770976, 'steps': 1505, 'loss/train': 3.6248762607574463} -09/20/2021 19:42:18 - INFO - __main__ - Step 24094: {'lr': 0.00019988405093824318, 'samples': 771008, 'steps': 1505, 'loss/train': 2.742713451385498} -09/20/2021 19:42:19 - INFO - __main__ - Step 24095: {'lr': 0.00019988405093824318, 'samples': 771040, 'steps': 1505, 'loss/train': 3.446298360824585} -09/20/2021 19:42:20 - INFO - __main__ - Step 24096: {'lr': 0.00019988405093824318, 'samples': 771072, 'steps': 1505, 'loss/train': 3.4342880249023438} -09/20/2021 19:42:20 - INFO - __main__ - Step 24097: {'lr': 0.000199883743644567, 'samples': 771104, 'steps': 1506, 'loss/train': 2.4445884227752686} -09/20/2021 19:42:21 - INFO - __main__ - Step 24098: {'lr': 0.000199883743644567, 'samples': 771136, 'steps': 1506, 'loss/train': 3.027282476425171} -09/20/2021 19:42:22 - INFO - __main__ - Step 24099: {'lr': 0.000199883743644567, 'samples': 771168, 'steps': 1506, 'loss/train': 3.5596141815185547} -09/20/2021 19:42:23 - INFO - __main__ - Step 24100: {'lr': 0.000199883743644567, 'samples': 771200, 'steps': 1506, 'loss/train': 3.0855655670166016} -09/20/2021 19:42:23 - INFO - __main__ - Step 24101: {'lr': 0.000199883743644567, 'samples': 771232, 'steps': 1506, 'loss/train': 2.730647325515747} -09/20/2021 19:42:24 - INFO - __main__ - Step 24102: {'lr': 0.000199883743644567, 'samples': 771264, 'steps': 1506, 'loss/train': 2.460782527923584} -09/20/2021 19:42:25 - INFO - __main__ - Step 24103: {'lr': 0.000199883743644567, 'samples': 771296, 'steps': 1506, 'loss/train': 1.8931207656860352} -09/20/2021 19:42:26 - INFO - __main__ - Step 24104: {'lr': 0.000199883743644567, 'samples': 771328, 'steps': 1506, 'loss/train': 2.8764829635620117} -09/20/2021 19:42:26 - INFO - __main__ - Step 24105: {'lr': 0.000199883743644567, 'samples': 771360, 'steps': 1506, 'loss/train': 3.308878183364868} -09/20/2021 19:42:27 - INFO - __main__ - Step 24106: {'lr': 0.000199883743644567, 'samples': 771392, 'steps': 1506, 'loss/train': 3.101921796798706} -09/20/2021 19:42:28 - INFO - __main__ - Step 24107: {'lr': 0.000199883743644567, 'samples': 771424, 'steps': 1506, 'loss/train': 3.0184497833251953} -09/20/2021 19:42:29 - INFO - __main__ - Step 24108: {'lr': 0.000199883743644567, 'samples': 771456, 'steps': 1506, 'loss/train': 1.5026695728302002} -09/20/2021 19:42:29 - INFO - __main__ - Step 24109: {'lr': 0.000199883743644567, 'samples': 771488, 'steps': 1506, 'loss/train': 3.048103094100952} -09/20/2021 19:42:30 - INFO - __main__ - Step 24110: {'lr': 0.000199883743644567, 'samples': 771520, 'steps': 1506, 'loss/train': 3.220736026763916} -09/20/2021 19:42:31 - INFO - __main__ - Step 24111: {'lr': 0.000199883743644567, 'samples': 771552, 'steps': 1506, 'loss/train': 1.2472317218780518} -09/20/2021 19:42:32 - INFO - __main__ - Step 24112: {'lr': 0.000199883743644567, 'samples': 771584, 'steps': 1506, 'loss/train': 4.012999057769775} -09/20/2021 19:42:33 - INFO - __main__ - Step 24113: {'lr': 0.00019988343594446427, 'samples': 771616, 'steps': 1507, 'loss/train': 0.619470477104187} -09/20/2021 19:42:33 - INFO - __main__ - Step 24114: {'lr': 0.00019988343594446427, 'samples': 771648, 'steps': 1507, 'loss/train': 2.6897501945495605} -09/20/2021 19:42:34 - INFO - __main__ - Step 24115: {'lr': 0.00019988343594446427, 'samples': 771680, 'steps': 1507, 'loss/train': 3.139024019241333} -09/20/2021 19:42:35 - INFO - __main__ - Step 24116: {'lr': 0.00019988343594446427, 'samples': 771712, 'steps': 1507, 'loss/train': 3.4507737159729004} -09/20/2021 19:42:36 - INFO - __main__ - Step 24117: {'lr': 0.00019988343594446427, 'samples': 771744, 'steps': 1507, 'loss/train': 2.3388020992279053} -09/20/2021 19:42:36 - INFO - __main__ - Step 24118: {'lr': 0.00019988343594446427, 'samples': 771776, 'steps': 1507, 'loss/train': 2.4523262977600098} -09/20/2021 19:42:37 - INFO - __main__ - Step 24119: {'lr': 0.00019988343594446427, 'samples': 771808, 'steps': 1507, 'loss/train': 2.513622283935547} -09/20/2021 19:42:38 - INFO - __main__ - Step 24120: {'lr': 0.00019988343594446427, 'samples': 771840, 'steps': 1507, 'loss/train': 3.6820788383483887} -09/20/2021 19:42:39 - INFO - __main__ - Step 24121: {'lr': 0.00019988343594446427, 'samples': 771872, 'steps': 1507, 'loss/train': 2.057802677154541} -09/20/2021 19:42:39 - INFO - __main__ - Step 24122: {'lr': 0.00019988343594446427, 'samples': 771904, 'steps': 1507, 'loss/train': 2.8574798107147217} -09/20/2021 19:42:41 - INFO - __main__ - Step 24123: {'lr': 0.00019988343594446427, 'samples': 771936, 'steps': 1507, 'loss/train': 3.2897658348083496} -09/20/2021 19:42:42 - INFO - __main__ - Step 24124: {'lr': 0.00019988343594446427, 'samples': 771968, 'steps': 1507, 'loss/train': 3.202598810195923} -09/20/2021 19:42:42 - INFO - __main__ - Step 24125: {'lr': 0.00019988343594446427, 'samples': 772000, 'steps': 1507, 'loss/train': 3.492483615875244} -09/20/2021 19:42:43 - INFO - __main__ - Step 24126: {'lr': 0.00019988343594446427, 'samples': 772032, 'steps': 1507, 'loss/train': 3.3000311851501465} -09/20/2021 19:42:44 - INFO - __main__ - Step 24127: {'lr': 0.00019988343594446427, 'samples': 772064, 'steps': 1507, 'loss/train': 2.865373373031616} -09/20/2021 19:42:45 - INFO - __main__ - Step 24128: {'lr': 0.00019988343594446427, 'samples': 772096, 'steps': 1507, 'loss/train': 2.787947416305542} -09/20/2021 19:42:46 - INFO - __main__ - Step 24129: {'lr': 0.0001998831278379362, 'samples': 772128, 'steps': 1508, 'loss/train': 1.4592604637145996} -09/20/2021 19:42:46 - INFO - __main__ - Step 24130: {'lr': 0.0001998831278379362, 'samples': 772160, 'steps': 1508, 'loss/train': 3.0020315647125244} -09/20/2021 19:42:47 - INFO - __main__ - Step 24131: {'lr': 0.0001998831278379362, 'samples': 772192, 'steps': 1508, 'loss/train': 3.420647382736206} -09/20/2021 19:42:48 - INFO - __main__ - Step 24132: {'lr': 0.0001998831278379362, 'samples': 772224, 'steps': 1508, 'loss/train': 3.4817588329315186} -09/20/2021 19:42:49 - INFO - __main__ - Step 24133: {'lr': 0.0001998831278379362, 'samples': 772256, 'steps': 1508, 'loss/train': 3.95259165763855} -09/20/2021 19:42:49 - INFO - __main__ - Step 24134: {'lr': 0.0001998831278379362, 'samples': 772288, 'steps': 1508, 'loss/train': 3.3489086627960205} -09/20/2021 19:42:50 - INFO - __main__ - Step 24135: {'lr': 0.0001998831278379362, 'samples': 772320, 'steps': 1508, 'loss/train': 2.7420737743377686} -09/20/2021 19:42:51 - INFO - __main__ - Step 24136: {'lr': 0.0001998831278379362, 'samples': 772352, 'steps': 1508, 'loss/train': 2.0954861640930176} -09/20/2021 19:42:52 - INFO - __main__ - Step 24137: {'lr': 0.0001998831278379362, 'samples': 772384, 'steps': 1508, 'loss/train': 2.558448314666748} -09/20/2021 19:42:52 - INFO - __main__ - Step 24138: {'lr': 0.0001998831278379362, 'samples': 772416, 'steps': 1508, 'loss/train': 2.819199800491333} -09/20/2021 19:42:53 - INFO - __main__ - Step 24139: {'lr': 0.0001998831278379362, 'samples': 772448, 'steps': 1508, 'loss/train': 2.8753435611724854} -09/20/2021 19:42:54 - INFO - __main__ - Step 24140: {'lr': 0.0001998831278379362, 'samples': 772480, 'steps': 1508, 'loss/train': 3.168560266494751} -09/20/2021 19:42:55 - INFO - __main__ - Step 24141: {'lr': 0.0001998831278379362, 'samples': 772512, 'steps': 1508, 'loss/train': 2.4197821617126465} -09/20/2021 19:42:55 - INFO - __main__ - Step 24142: {'lr': 0.0001998831278379362, 'samples': 772544, 'steps': 1508, 'loss/train': 1.8741079568862915} -09/20/2021 19:42:56 - INFO - __main__ - Step 24143: {'lr': 0.0001998831278379362, 'samples': 772576, 'steps': 1508, 'loss/train': 2.833385944366455} -09/20/2021 19:42:57 - INFO - __main__ - Step 24144: {'lr': 0.0001998831278379362, 'samples': 772608, 'steps': 1508, 'loss/train': 2.3108608722686768} -09/20/2021 19:42:58 - INFO - __main__ - Step 24145: {'lr': 0.0001998828193249841, 'samples': 772640, 'steps': 1509, 'loss/train': 2.5308947563171387} -09/20/2021 19:42:58 - INFO - __main__ - Step 24146: {'lr': 0.0001998828193249841, 'samples': 772672, 'steps': 1509, 'loss/train': 3.0196993350982666} -09/20/2021 19:42:59 - INFO - __main__ - Step 24147: {'lr': 0.0001998828193249841, 'samples': 772704, 'steps': 1509, 'loss/train': 2.187917947769165} -09/20/2021 19:43:00 - INFO - __main__ - Step 24148: {'lr': 0.0001998828193249841, 'samples': 772736, 'steps': 1509, 'loss/train': 2.4463841915130615} -09/20/2021 19:43:01 - INFO - __main__ - Step 24149: {'lr': 0.0001998828193249841, 'samples': 772768, 'steps': 1509, 'loss/train': 2.327585458755493} -09/20/2021 19:43:01 - INFO - __main__ - Step 24150: {'lr': 0.0001998828193249841, 'samples': 772800, 'steps': 1509, 'loss/train': 2.482410430908203} -09/20/2021 19:43:02 - INFO - __main__ - Step 24151: {'lr': 0.0001998828193249841, 'samples': 772832, 'steps': 1509, 'loss/train': 2.258010149002075} -09/20/2021 19:43:03 - INFO - __main__ - Step 24152: {'lr': 0.0001998828193249841, 'samples': 772864, 'steps': 1509, 'loss/train': 2.0184624195098877} -09/20/2021 19:43:04 - INFO - __main__ - Step 24153: {'lr': 0.0001998828193249841, 'samples': 772896, 'steps': 1509, 'loss/train': 2.6085267066955566} -09/20/2021 19:43:04 - INFO - __main__ - Step 24154: {'lr': 0.0001998828193249841, 'samples': 772928, 'steps': 1509, 'loss/train': 2.130554676055908} -09/20/2021 19:43:05 - INFO - __main__ - Step 24155: {'lr': 0.0001998828193249841, 'samples': 772960, 'steps': 1509, 'loss/train': 2.1195292472839355} -09/20/2021 19:43:06 - INFO - __main__ - Step 24156: {'lr': 0.0001998828193249841, 'samples': 772992, 'steps': 1509, 'loss/train': 3.9413602352142334} -09/20/2021 19:43:07 - INFO - __main__ - Step 24157: {'lr': 0.0001998828193249841, 'samples': 773024, 'steps': 1509, 'loss/train': 2.462397336959839} -09/20/2021 19:43:07 - INFO - __main__ - Step 24158: {'lr': 0.0001998828193249841, 'samples': 773056, 'steps': 1509, 'loss/train': 2.209695816040039} -09/20/2021 19:43:09 - INFO - __main__ - Step 24159: {'lr': 0.0001998828193249841, 'samples': 773088, 'steps': 1509, 'loss/train': 3.3284878730773926} -09/20/2021 19:43:09 - INFO - __main__ - Step 24160: {'lr': 0.0001998828193249841, 'samples': 773120, 'steps': 1509, 'loss/train': 2.696044921875} -09/20/2021 19:43:10 - INFO - __main__ - Step 24161: {'lr': 0.00019988251040560918, 'samples': 773152, 'steps': 1510, 'loss/train': 3.935542583465576} -09/20/2021 19:43:11 - INFO - __main__ - Step 24162: {'lr': 0.00019988251040560918, 'samples': 773184, 'steps': 1510, 'loss/train': 3.3915750980377197} -09/20/2021 19:43:12 - INFO - __main__ - Step 24163: {'lr': 0.00019988251040560918, 'samples': 773216, 'steps': 1510, 'loss/train': 2.786863327026367} -09/20/2021 19:43:13 - INFO - __main__ - Step 24164: {'lr': 0.00019988251040560918, 'samples': 773248, 'steps': 1510, 'loss/train': 2.2657723426818848} -09/20/2021 19:43:13 - INFO - __main__ - Step 24165: {'lr': 0.00019988251040560918, 'samples': 773280, 'steps': 1510, 'loss/train': 2.113863945007324} -09/20/2021 19:43:14 - INFO - __main__ - Step 24166: {'lr': 0.00019988251040560918, 'samples': 773312, 'steps': 1510, 'loss/train': 3.593916893005371} -09/20/2021 19:43:15 - INFO - __main__ - Step 24167: {'lr': 0.00019988251040560918, 'samples': 773344, 'steps': 1510, 'loss/train': 1.4557228088378906} -09/20/2021 19:43:16 - INFO - __main__ - Step 24168: {'lr': 0.00019988251040560918, 'samples': 773376, 'steps': 1510, 'loss/train': 3.9071969985961914} -09/20/2021 19:43:16 - INFO - __main__ - Step 24169: {'lr': 0.00019988251040560918, 'samples': 773408, 'steps': 1510, 'loss/train': 2.8653740882873535} -09/20/2021 19:43:17 - INFO - __main__ - Step 24170: {'lr': 0.00019988251040560918, 'samples': 773440, 'steps': 1510, 'loss/train': 2.4023358821868896} -09/20/2021 19:43:18 - INFO - __main__ - Step 24171: {'lr': 0.00019988251040560918, 'samples': 773472, 'steps': 1510, 'loss/train': 2.3479933738708496} -09/20/2021 19:43:19 - INFO - __main__ - Step 24172: {'lr': 0.00019988251040560918, 'samples': 773504, 'steps': 1510, 'loss/train': 3.5821406841278076} -09/20/2021 19:43:19 - INFO - __main__ - Step 24173: {'lr': 0.00019988251040560918, 'samples': 773536, 'steps': 1510, 'loss/train': 2.227849245071411} -09/20/2021 19:43:20 - INFO - __main__ - Step 24174: {'lr': 0.00019988251040560918, 'samples': 773568, 'steps': 1510, 'loss/train': 1.9723026752471924} -09/20/2021 19:43:21 - INFO - __main__ - Step 24175: {'lr': 0.00019988251040560918, 'samples': 773600, 'steps': 1510, 'loss/train': 3.255378007888794} -09/20/2021 19:43:22 - INFO - __main__ - Step 24176: {'lr': 0.00019988251040560918, 'samples': 773632, 'steps': 1510, 'loss/train': 3.0707921981811523} -09/20/2021 19:43:22 - INFO - __main__ - Step 24177: {'lr': 0.0001998822010798127, 'samples': 773664, 'steps': 1511, 'loss/train': 3.2816407680511475} -09/20/2021 19:43:23 - INFO - __main__ - Step 24178: {'lr': 0.0001998822010798127, 'samples': 773696, 'steps': 1511, 'loss/train': 3.1878480911254883} -09/20/2021 19:43:24 - INFO - __main__ - Step 24179: {'lr': 0.0001998822010798127, 'samples': 773728, 'steps': 1511, 'loss/train': 3.1337783336639404} -09/20/2021 19:43:25 - INFO - __main__ - Step 24180: {'lr': 0.0001998822010798127, 'samples': 773760, 'steps': 1511, 'loss/train': 4.490928649902344} -09/20/2021 19:43:25 - INFO - __main__ - Step 24181: {'lr': 0.0001998822010798127, 'samples': 773792, 'steps': 1511, 'loss/train': 3.0567727088928223} -09/20/2021 19:43:26 - INFO - __main__ - Step 24182: {'lr': 0.0001998822010798127, 'samples': 773824, 'steps': 1511, 'loss/train': 2.6377711296081543} -09/20/2021 19:43:27 - INFO - __main__ - Step 24183: {'lr': 0.0001998822010798127, 'samples': 773856, 'steps': 1511, 'loss/train': 3.090022325515747} -09/20/2021 19:43:28 - INFO - __main__ - Step 24184: {'lr': 0.0001998822010798127, 'samples': 773888, 'steps': 1511, 'loss/train': 3.1833462715148926} -09/20/2021 19:43:28 - INFO - __main__ - Step 24185: {'lr': 0.0001998822010798127, 'samples': 773920, 'steps': 1511, 'loss/train': 2.4220402240753174} -09/20/2021 19:43:29 - INFO - __main__ - Step 24186: {'lr': 0.0001998822010798127, 'samples': 773952, 'steps': 1511, 'loss/train': 2.206310987472534} -09/20/2021 19:43:30 - INFO - __main__ - Step 24187: {'lr': 0.0001998822010798127, 'samples': 773984, 'steps': 1511, 'loss/train': 2.8013808727264404} -09/20/2021 19:43:31 - INFO - __main__ - Step 24188: {'lr': 0.0001998822010798127, 'samples': 774016, 'steps': 1511, 'loss/train': 2.693804979324341} -09/20/2021 19:43:32 - INFO - __main__ - Step 24189: {'lr': 0.0001998822010798127, 'samples': 774048, 'steps': 1511, 'loss/train': 3.8404650688171387} -09/20/2021 19:43:33 - INFO - __main__ - Step 24190: {'lr': 0.0001998822010798127, 'samples': 774080, 'steps': 1511, 'loss/train': 2.6374645233154297} -09/20/2021 19:43:34 - INFO - __main__ - Step 24191: {'lr': 0.0001998822010798127, 'samples': 774112, 'steps': 1511, 'loss/train': 2.7322616577148438} -09/20/2021 19:43:34 - INFO - __main__ - Step 24192: {'lr': 0.0001998822010798127, 'samples': 774144, 'steps': 1511, 'loss/train': 2.692657232284546} -09/20/2021 19:43:35 - INFO - __main__ - Step 24193: {'lr': 0.00019988189134759597, 'samples': 774176, 'steps': 1512, 'loss/train': 2.007335901260376} -09/20/2021 19:43:36 - INFO - __main__ - Step 24194: {'lr': 0.00019988189134759597, 'samples': 774208, 'steps': 1512, 'loss/train': 2.7315144538879395} -09/20/2021 19:43:37 - INFO - __main__ - Step 24195: {'lr': 0.00019988189134759597, 'samples': 774240, 'steps': 1512, 'loss/train': 2.792813539505005} -09/20/2021 19:43:37 - INFO - __main__ - Step 24196: {'lr': 0.00019988189134759597, 'samples': 774272, 'steps': 1512, 'loss/train': 2.255553960800171} -09/20/2021 19:43:38 - INFO - __main__ - Step 24197: {'lr': 0.00019988189134759597, 'samples': 774304, 'steps': 1512, 'loss/train': 2.8165605068206787} -09/20/2021 19:43:39 - INFO - __main__ - Step 24198: {'lr': 0.00019988189134759597, 'samples': 774336, 'steps': 1512, 'loss/train': 3.4870662689208984} -09/20/2021 19:43:40 - INFO - __main__ - Step 24199: {'lr': 0.00019988189134759597, 'samples': 774368, 'steps': 1512, 'loss/train': 2.235443353652954} -09/20/2021 19:43:40 - INFO - __main__ - Step 24200: {'lr': 0.00019988189134759597, 'samples': 774400, 'steps': 1512, 'loss/train': 2.6714975833892822} -09/20/2021 19:43:41 - INFO - __main__ - Step 24201: {'lr': 0.00019988189134759597, 'samples': 774432, 'steps': 1512, 'loss/train': 2.441251039505005} -09/20/2021 19:43:42 - INFO - __main__ - Step 24202: {'lr': 0.00019988189134759597, 'samples': 774464, 'steps': 1512, 'loss/train': 0.8553557991981506} -09/20/2021 19:43:43 - INFO - __main__ - Step 24203: {'lr': 0.00019988189134759597, 'samples': 774496, 'steps': 1512, 'loss/train': 3.1270554065704346} -09/20/2021 19:43:43 - INFO - __main__ - Step 24204: {'lr': 0.00019988189134759597, 'samples': 774528, 'steps': 1512, 'loss/train': 3.542120933532715} -09/20/2021 19:43:44 - INFO - __main__ - Step 24205: {'lr': 0.00019988189134759597, 'samples': 774560, 'steps': 1512, 'loss/train': 2.2215778827667236} -09/20/2021 19:43:45 - INFO - __main__ - Step 24206: {'lr': 0.00019988189134759597, 'samples': 774592, 'steps': 1512, 'loss/train': 2.1893820762634277} -09/20/2021 19:43:46 - INFO - __main__ - Step 24207: {'lr': 0.00019988189134759597, 'samples': 774624, 'steps': 1512, 'loss/train': 3.4552371501922607} -09/20/2021 19:43:46 - INFO - __main__ - Step 24208: {'lr': 0.00019988189134759597, 'samples': 774656, 'steps': 1512, 'loss/train': 3.0177981853485107} -09/20/2021 19:43:47 - INFO - __main__ - Step 24209: {'lr': 0.0001998815812089602, 'samples': 774688, 'steps': 1513, 'loss/train': 3.496948480606079} -09/20/2021 19:43:48 - INFO - __main__ - Step 24210: {'lr': 0.0001998815812089602, 'samples': 774720, 'steps': 1513, 'loss/train': 2.9707114696502686} -09/20/2021 19:43:49 - INFO - __main__ - Step 24211: {'lr': 0.0001998815812089602, 'samples': 774752, 'steps': 1513, 'loss/train': 0.9183434844017029} -09/20/2021 19:43:50 - INFO - __main__ - Step 24212: {'lr': 0.0001998815812089602, 'samples': 774784, 'steps': 1513, 'loss/train': 3.6493358612060547} -09/20/2021 19:43:50 - INFO - __main__ - Step 24213: {'lr': 0.0001998815812089602, 'samples': 774816, 'steps': 1513, 'loss/train': 3.5228116512298584} -09/20/2021 19:43:51 - INFO - __main__ - Step 24214: {'lr': 0.0001998815812089602, 'samples': 774848, 'steps': 1513, 'loss/train': 2.2479372024536133} -09/20/2021 19:43:52 - INFO - __main__ - Step 24215: {'lr': 0.0001998815812089602, 'samples': 774880, 'steps': 1513, 'loss/train': 3.045872688293457} -09/20/2021 19:43:53 - INFO - __main__ - Step 24216: {'lr': 0.0001998815812089602, 'samples': 774912, 'steps': 1513, 'loss/train': 2.3595378398895264} -09/20/2021 19:43:53 - INFO - __main__ - Step 24217: {'lr': 0.0001998815812089602, 'samples': 774944, 'steps': 1513, 'loss/train': 2.649229049682617} -09/20/2021 19:43:54 - INFO - __main__ - Step 24218: {'lr': 0.0001998815812089602, 'samples': 774976, 'steps': 1513, 'loss/train': 3.1421144008636475} -09/20/2021 19:43:55 - INFO - __main__ - Step 24219: {'lr': 0.0001998815812089602, 'samples': 775008, 'steps': 1513, 'loss/train': 3.066981315612793} -09/20/2021 19:43:56 - INFO - __main__ - Step 24220: {'lr': 0.0001998815812089602, 'samples': 775040, 'steps': 1513, 'loss/train': 4.185519695281982} -09/20/2021 19:43:57 - INFO - __main__ - Step 24221: {'lr': 0.0001998815812089602, 'samples': 775072, 'steps': 1513, 'loss/train': 3.122910737991333} -09/20/2021 19:43:58 - INFO - __main__ - Step 24222: {'lr': 0.0001998815812089602, 'samples': 775104, 'steps': 1513, 'loss/train': 2.08609938621521} -09/20/2021 19:43:58 - INFO - __main__ - Step 24223: {'lr': 0.0001998815812089602, 'samples': 775136, 'steps': 1513, 'loss/train': 3.1291682720184326} -09/20/2021 19:43:59 - INFO - __main__ - Step 24224: {'lr': 0.0001998815812089602, 'samples': 775168, 'steps': 1513, 'loss/train': 2.2778966426849365} -09/20/2021 19:44:00 - INFO - __main__ - Step 24225: {'lr': 0.00019988127066390666, 'samples': 775200, 'steps': 1514, 'loss/train': 2.8314828872680664} -09/20/2021 19:44:01 - INFO - __main__ - Step 24226: {'lr': 0.00019988127066390666, 'samples': 775232, 'steps': 1514, 'loss/train': 3.423799991607666} -09/20/2021 19:44:02 - INFO - __main__ - Step 24227: {'lr': 0.00019988127066390666, 'samples': 775264, 'steps': 1514, 'loss/train': 1.4738878011703491} -09/20/2021 19:44:02 - INFO - __main__ - Step 24228: {'lr': 0.00019988127066390666, 'samples': 775296, 'steps': 1514, 'loss/train': 2.293747901916504} -09/20/2021 19:44:03 - INFO - __main__ - Step 24229: {'lr': 0.00019988127066390666, 'samples': 775328, 'steps': 1514, 'loss/train': 4.609396457672119} -09/20/2021 19:44:04 - INFO - __main__ - Step 24230: {'lr': 0.00019988127066390666, 'samples': 775360, 'steps': 1514, 'loss/train': 2.0724849700927734} -09/20/2021 19:44:05 - INFO - __main__ - Step 24231: {'lr': 0.00019988127066390666, 'samples': 775392, 'steps': 1514, 'loss/train': 3.5578699111938477} -09/20/2021 19:44:05 - INFO - __main__ - Step 24232: {'lr': 0.00019988127066390666, 'samples': 775424, 'steps': 1514, 'loss/train': 3.5266900062561035} -09/20/2021 19:44:06 - INFO - __main__ - Step 24233: {'lr': 0.00019988127066390666, 'samples': 775456, 'steps': 1514, 'loss/train': 2.7978875637054443} -09/20/2021 19:44:07 - INFO - __main__ - Step 24234: {'lr': 0.00019988127066390666, 'samples': 775488, 'steps': 1514, 'loss/train': 3.147634506225586} -09/20/2021 19:44:08 - INFO - __main__ - Step 24235: {'lr': 0.00019988127066390666, 'samples': 775520, 'steps': 1514, 'loss/train': 3.2447116374969482} -09/20/2021 19:44:08 - INFO - __main__ - Step 24236: {'lr': 0.00019988127066390666, 'samples': 775552, 'steps': 1514, 'loss/train': 3.0562806129455566} -09/20/2021 19:44:09 - INFO - __main__ - Step 24237: {'lr': 0.00019988127066390666, 'samples': 775584, 'steps': 1514, 'loss/train': 4.370233535766602} -09/20/2021 19:44:10 - INFO - __main__ - Step 24238: {'lr': 0.00019988127066390666, 'samples': 775616, 'steps': 1514, 'loss/train': 3.7155425548553467} -09/20/2021 19:44:11 - INFO - __main__ - Step 24239: {'lr': 0.00019988127066390666, 'samples': 775648, 'steps': 1514, 'loss/train': 1.8153657913208008} -09/20/2021 19:44:11 - INFO - __main__ - Step 24240: {'lr': 0.00019988127066390666, 'samples': 775680, 'steps': 1514, 'loss/train': 2.36651611328125} -09/20/2021 19:44:12 - INFO - __main__ - Step 24241: {'lr': 0.0001998809597124366, 'samples': 775712, 'steps': 1515, 'loss/train': 2.925158977508545} -09/20/2021 19:44:13 - INFO - __main__ - Step 24242: {'lr': 0.0001998809597124366, 'samples': 775744, 'steps': 1515, 'loss/train': 3.4332497119903564} -09/20/2021 19:44:14 - INFO - __main__ - Step 24243: {'lr': 0.0001998809597124366, 'samples': 775776, 'steps': 1515, 'loss/train': 3.781552791595459} -09/20/2021 19:44:14 - INFO - __main__ - Step 24244: {'lr': 0.0001998809597124366, 'samples': 775808, 'steps': 1515, 'loss/train': 3.319524049758911} -09/20/2021 19:44:15 - INFO - __main__ - Step 24245: {'lr': 0.0001998809597124366, 'samples': 775840, 'steps': 1515, 'loss/train': 3.0048251152038574} -09/20/2021 19:44:16 - INFO - __main__ - Step 24246: {'lr': 0.0001998809597124366, 'samples': 775872, 'steps': 1515, 'loss/train': 2.5112321376800537} -09/20/2021 19:44:17 - INFO - __main__ - Step 24247: {'lr': 0.0001998809597124366, 'samples': 775904, 'steps': 1515, 'loss/train': 2.3429787158966064} -09/20/2021 19:44:17 - INFO - __main__ - Step 24248: {'lr': 0.0001998809597124366, 'samples': 775936, 'steps': 1515, 'loss/train': 2.6469080448150635} -09/20/2021 19:44:18 - INFO - __main__ - Step 24249: {'lr': 0.0001998809597124366, 'samples': 775968, 'steps': 1515, 'loss/train': 2.929213762283325} -09/20/2021 19:44:19 - INFO - __main__ - Step 24250: {'lr': 0.0001998809597124366, 'samples': 776000, 'steps': 1515, 'loss/train': 2.5740935802459717} -09/20/2021 19:44:20 - INFO - __main__ - Step 24251: {'lr': 0.0001998809597124366, 'samples': 776032, 'steps': 1515, 'loss/train': 0.6195080876350403} -09/20/2021 19:44:20 - INFO - __main__ - Step 24252: {'lr': 0.0001998809597124366, 'samples': 776064, 'steps': 1515, 'loss/train': 0.31196627020835876} -09/20/2021 19:44:22 - INFO - __main__ - Step 24253: {'lr': 0.0001998809597124366, 'samples': 776096, 'steps': 1515, 'loss/train': 0.4408513307571411} -09/20/2021 19:44:23 - INFO - __main__ - Step 24254: {'lr': 0.0001998809597124366, 'samples': 776128, 'steps': 1515, 'loss/train': 3.9279909133911133} -09/20/2021 19:44:23 - INFO - __main__ - Step 24255: {'lr': 0.0001998809597124366, 'samples': 776160, 'steps': 1515, 'loss/train': 2.543948173522949} -09/20/2021 19:44:24 - INFO - __main__ - Step 24256: {'lr': 0.0001998809597124366, 'samples': 776192, 'steps': 1515, 'loss/train': 2.652066230773926} -09/20/2021 19:44:25 - INFO - __main__ - Step 24257: {'lr': 0.00019988064835455133, 'samples': 776224, 'steps': 1516, 'loss/train': 2.87845778465271} -09/20/2021 19:44:26 - INFO - __main__ - Step 24258: {'lr': 0.00019988064835455133, 'samples': 776256, 'steps': 1516, 'loss/train': 2.4982094764709473} -09/20/2021 19:44:26 - INFO - __main__ - Step 24259: {'lr': 0.00019988064835455133, 'samples': 776288, 'steps': 1516, 'loss/train': 3.101961851119995} -09/20/2021 19:44:27 - INFO - __main__ - Step 24260: {'lr': 0.00019988064835455133, 'samples': 776320, 'steps': 1516, 'loss/train': 2.1094887256622314} -09/20/2021 19:44:28 - INFO - __main__ - Step 24261: {'lr': 0.00019988064835455133, 'samples': 776352, 'steps': 1516, 'loss/train': 3.5362348556518555} -09/20/2021 19:44:29 - INFO - __main__ - Step 24262: {'lr': 0.00019988064835455133, 'samples': 776384, 'steps': 1516, 'loss/train': 3.4707562923431396} -09/20/2021 19:44:29 - INFO - __main__ - Step 24263: {'lr': 0.00019988064835455133, 'samples': 776416, 'steps': 1516, 'loss/train': 3.307252883911133} -09/20/2021 19:44:30 - INFO - __main__ - Step 24264: {'lr': 0.00019988064835455133, 'samples': 776448, 'steps': 1516, 'loss/train': 3.2169909477233887} -09/20/2021 19:44:31 - INFO - __main__ - Step 24265: {'lr': 0.00019988064835455133, 'samples': 776480, 'steps': 1516, 'loss/train': 3.103971481323242} -09/20/2021 19:44:32 - INFO - __main__ - Step 24266: {'lr': 0.00019988064835455133, 'samples': 776512, 'steps': 1516, 'loss/train': 1.8010395765304565} -09/20/2021 19:44:32 - INFO - __main__ - Step 24267: {'lr': 0.00019988064835455133, 'samples': 776544, 'steps': 1516, 'loss/train': 2.848214626312256} -09/20/2021 19:44:33 - INFO - __main__ - Step 24268: {'lr': 0.00019988064835455133, 'samples': 776576, 'steps': 1516, 'loss/train': 2.4657037258148193} -09/20/2021 19:44:34 - INFO - __main__ - Step 24269: {'lr': 0.00019988064835455133, 'samples': 776608, 'steps': 1516, 'loss/train': 2.548330307006836} -09/20/2021 19:44:35 - INFO - __main__ - Step 24270: {'lr': 0.00019988064835455133, 'samples': 776640, 'steps': 1516, 'loss/train': 2.601419687271118} -09/20/2021 19:44:35 - INFO - __main__ - Step 24271: {'lr': 0.00019988064835455133, 'samples': 776672, 'steps': 1516, 'loss/train': 2.9041025638580322} -09/20/2021 19:44:36 - INFO - __main__ - Step 24272: {'lr': 0.00019988064835455133, 'samples': 776704, 'steps': 1516, 'loss/train': 3.028780221939087} -09/20/2021 19:44:37 - INFO - __main__ - Step 24273: {'lr': 0.00019988033659025205, 'samples': 776736, 'steps': 1517, 'loss/train': 3.0708510875701904} -09/20/2021 19:44:38 - INFO - __main__ - Step 24274: {'lr': 0.00019988033659025205, 'samples': 776768, 'steps': 1517, 'loss/train': 3.0264809131622314} -09/20/2021 19:44:39 - INFO - __main__ - Step 24275: {'lr': 0.00019988033659025205, 'samples': 776800, 'steps': 1517, 'loss/train': 2.4667434692382812} -09/20/2021 19:44:39 - INFO - __main__ - Step 24276: {'lr': 0.00019988033659025205, 'samples': 776832, 'steps': 1517, 'loss/train': 3.9041764736175537} -09/20/2021 19:44:40 - INFO - __main__ - Step 24277: {'lr': 0.00019988033659025205, 'samples': 776864, 'steps': 1517, 'loss/train': 2.763336181640625} -09/20/2021 19:44:41 - INFO - __main__ - Step 24278: {'lr': 0.00019988033659025205, 'samples': 776896, 'steps': 1517, 'loss/train': 2.5736894607543945} -09/20/2021 19:44:42 - INFO - __main__ - Step 24279: {'lr': 0.00019988033659025205, 'samples': 776928, 'steps': 1517, 'loss/train': 2.762864351272583} -09/20/2021 19:44:42 - INFO - __main__ - Step 24280: {'lr': 0.00019988033659025205, 'samples': 776960, 'steps': 1517, 'loss/train': 3.181884527206421} -09/20/2021 19:44:43 - INFO - __main__ - Step 24281: {'lr': 0.00019988033659025205, 'samples': 776992, 'steps': 1517, 'loss/train': 2.4676177501678467} -09/20/2021 19:44:44 - INFO - __main__ - Step 24282: {'lr': 0.00019988033659025205, 'samples': 777024, 'steps': 1517, 'loss/train': 4.175317287445068} -09/20/2021 19:44:45 - INFO - __main__ - Step 24283: {'lr': 0.00019988033659025205, 'samples': 777056, 'steps': 1517, 'loss/train': 3.407045364379883} -09/20/2021 19:44:46 - INFO - __main__ - Step 24284: {'lr': 0.00019988033659025205, 'samples': 777088, 'steps': 1517, 'loss/train': 2.670944929122925} -09/20/2021 19:44:47 - INFO - __main__ - Step 24285: {'lr': 0.00019988033659025205, 'samples': 777120, 'steps': 1517, 'loss/train': 3.1615490913391113} -09/20/2021 19:44:47 - INFO - __main__ - Step 24286: {'lr': 0.00019988033659025205, 'samples': 777152, 'steps': 1517, 'loss/train': 2.4712882041931152} -09/20/2021 19:44:48 - INFO - __main__ - Step 24287: {'lr': 0.00019988033659025205, 'samples': 777184, 'steps': 1517, 'loss/train': 3.426359176635742} -09/20/2021 19:44:49 - INFO - __main__ - Step 24288: {'lr': 0.00019988033659025205, 'samples': 777216, 'steps': 1517, 'loss/train': 3.9581785202026367} -09/20/2021 19:44:50 - INFO - __main__ - Step 24289: {'lr': 0.0001998800244195401, 'samples': 777248, 'steps': 1518, 'loss/train': 2.866448402404785} -09/20/2021 19:44:50 - INFO - __main__ - Step 24290: {'lr': 0.0001998800244195401, 'samples': 777280, 'steps': 1518, 'loss/train': 2.8584420680999756} -09/20/2021 19:44:51 - INFO - __main__ - Step 24291: {'lr': 0.0001998800244195401, 'samples': 777312, 'steps': 1518, 'loss/train': 3.295029640197754} -09/20/2021 19:44:52 - INFO - __main__ - Step 24292: {'lr': 0.0001998800244195401, 'samples': 777344, 'steps': 1518, 'loss/train': 4.32847261428833} -09/20/2021 19:44:53 - INFO - __main__ - Step 24293: {'lr': 0.0001998800244195401, 'samples': 777376, 'steps': 1518, 'loss/train': 2.7604968547821045} -09/20/2021 19:44:53 - INFO - __main__ - Step 24294: {'lr': 0.0001998800244195401, 'samples': 777408, 'steps': 1518, 'loss/train': 2.5792033672332764} -09/20/2021 19:44:54 - INFO - __main__ - Step 24295: {'lr': 0.0001998800244195401, 'samples': 777440, 'steps': 1518, 'loss/train': 3.4687678813934326} -09/20/2021 19:44:55 - INFO - __main__ - Step 24296: {'lr': 0.0001998800244195401, 'samples': 777472, 'steps': 1518, 'loss/train': 2.2945377826690674} -09/20/2021 19:44:56 - INFO - __main__ - Step 24297: {'lr': 0.0001998800244195401, 'samples': 777504, 'steps': 1518, 'loss/train': 2.967259168624878} -09/20/2021 19:44:56 - INFO - __main__ - Step 24298: {'lr': 0.0001998800244195401, 'samples': 777536, 'steps': 1518, 'loss/train': 2.225522994995117} -09/20/2021 19:44:57 - INFO - __main__ - Step 24299: {'lr': 0.0001998800244195401, 'samples': 777568, 'steps': 1518, 'loss/train': 2.8635616302490234} -09/20/2021 19:44:58 - INFO - __main__ - Step 24300: {'lr': 0.0001998800244195401, 'samples': 777600, 'steps': 1518, 'loss/train': 0.49273693561553955} -09/20/2021 19:44:59 - INFO - __main__ - Step 24301: {'lr': 0.0001998800244195401, 'samples': 777632, 'steps': 1518, 'loss/train': 3.7844221591949463} -09/20/2021 19:44:59 - INFO - __main__ - Step 24302: {'lr': 0.0001998800244195401, 'samples': 777664, 'steps': 1518, 'loss/train': 3.0855789184570312} -09/20/2021 19:45:00 - INFO - __main__ - Step 24303: {'lr': 0.0001998800244195401, 'samples': 777696, 'steps': 1518, 'loss/train': 3.215668201446533} -09/20/2021 19:45:01 - INFO - __main__ - Step 24304: {'lr': 0.0001998800244195401, 'samples': 777728, 'steps': 1518, 'loss/train': 2.197734832763672} -09/20/2021 19:45:02 - INFO - __main__ - Step 24305: {'lr': 0.00019987971184241672, 'samples': 777760, 'steps': 1519, 'loss/train': 3.1282243728637695} -09/20/2021 19:45:03 - INFO - __main__ - Step 24306: {'lr': 0.00019987971184241672, 'samples': 777792, 'steps': 1519, 'loss/train': 1.7177679538726807} -09/20/2021 19:45:03 - INFO - __main__ - Step 24307: {'lr': 0.00019987971184241672, 'samples': 777824, 'steps': 1519, 'loss/train': 2.0228428840637207} -09/20/2021 19:45:04 - INFO - __main__ - Step 24308: {'lr': 0.00019987971184241672, 'samples': 777856, 'steps': 1519, 'loss/train': 2.8140902519226074} -09/20/2021 19:45:05 - INFO - __main__ - Step 24309: {'lr': 0.00019987971184241672, 'samples': 777888, 'steps': 1519, 'loss/train': 3.133920669555664} -09/20/2021 19:45:06 - INFO - __main__ - Step 24310: {'lr': 0.00019987971184241672, 'samples': 777920, 'steps': 1519, 'loss/train': 2.773888111114502} -09/20/2021 19:45:06 - INFO - __main__ - Step 24311: {'lr': 0.00019987971184241672, 'samples': 777952, 'steps': 1519, 'loss/train': 1.9308329820632935} -09/20/2021 19:45:07 - INFO - __main__ - Step 24312: {'lr': 0.00019987971184241672, 'samples': 777984, 'steps': 1519, 'loss/train': 2.6616647243499756} -09/20/2021 19:45:08 - INFO - __main__ - Step 24313: {'lr': 0.00019987971184241672, 'samples': 778016, 'steps': 1519, 'loss/train': 2.7964634895324707} -09/20/2021 19:45:10 - INFO - __main__ - Step 24314: {'lr': 0.00019987971184241672, 'samples': 778048, 'steps': 1519, 'loss/train': 3.0659141540527344} -09/20/2021 19:45:10 - INFO - __main__ - Step 24315: {'lr': 0.00019987971184241672, 'samples': 778080, 'steps': 1519, 'loss/train': 3.229353189468384} -09/20/2021 19:45:11 - INFO - __main__ - Step 24316: {'lr': 0.00019987971184241672, 'samples': 778112, 'steps': 1519, 'loss/train': 2.9058382511138916} -09/20/2021 19:45:12 - INFO - __main__ - Step 24317: {'lr': 0.00019987971184241672, 'samples': 778144, 'steps': 1519, 'loss/train': 3.0355398654937744} -09/20/2021 19:45:13 - INFO - __main__ - Step 24318: {'lr': 0.00019987971184241672, 'samples': 778176, 'steps': 1519, 'loss/train': 3.2246222496032715} -09/20/2021 19:45:13 - INFO - __main__ - Step 24319: {'lr': 0.00019987971184241672, 'samples': 778208, 'steps': 1519, 'loss/train': 3.785020112991333} -09/20/2021 19:45:14 - INFO - __main__ - Step 24320: {'lr': 0.00019987971184241672, 'samples': 778240, 'steps': 1519, 'loss/train': 3.3620989322662354} -09/20/2021 19:45:15 - INFO - __main__ - Step 24321: {'lr': 0.00019987939885888313, 'samples': 778272, 'steps': 1520, 'loss/train': 3.2163889408111572} -09/20/2021 19:45:16 - INFO - __main__ - Step 24322: {'lr': 0.00019987939885888313, 'samples': 778304, 'steps': 1520, 'loss/train': 3.466630697250366} -09/20/2021 19:45:16 - INFO - __main__ - Step 24323: {'lr': 0.00019987939885888313, 'samples': 778336, 'steps': 1520, 'loss/train': 2.7065224647521973} -09/20/2021 19:45:17 - INFO - __main__ - Step 24324: {'lr': 0.00019987939885888313, 'samples': 778368, 'steps': 1520, 'loss/train': 2.6554806232452393} -09/20/2021 19:45:18 - INFO - __main__ - Step 24325: {'lr': 0.00019987939885888313, 'samples': 778400, 'steps': 1520, 'loss/train': 2.504889488220215} -09/20/2021 19:45:19 - INFO - __main__ - Step 24326: {'lr': 0.00019987939885888313, 'samples': 778432, 'steps': 1520, 'loss/train': 1.8965063095092773} -09/20/2021 19:45:19 - INFO - __main__ - Step 24327: {'lr': 0.00019987939885888313, 'samples': 778464, 'steps': 1520, 'loss/train': 1.9713082313537598} -09/20/2021 19:45:20 - INFO - __main__ - Step 24328: {'lr': 0.00019987939885888313, 'samples': 778496, 'steps': 1520, 'loss/train': 2.504706621170044} -09/20/2021 19:45:21 - INFO - __main__ - Step 24329: {'lr': 0.00019987939885888313, 'samples': 778528, 'steps': 1520, 'loss/train': 3.557269811630249} -09/20/2021 19:45:22 - INFO - __main__ - Step 24330: {'lr': 0.00019987939885888313, 'samples': 778560, 'steps': 1520, 'loss/train': 3.7548556327819824} -09/20/2021 19:45:22 - INFO - __main__ - Step 24331: {'lr': 0.00019987939885888313, 'samples': 778592, 'steps': 1520, 'loss/train': 2.8420376777648926} -09/20/2021 19:45:23 - INFO - __main__ - Step 24332: {'lr': 0.00019987939885888313, 'samples': 778624, 'steps': 1520, 'loss/train': 3.161677360534668} -09/20/2021 19:45:24 - INFO - __main__ - Step 24333: {'lr': 0.00019987939885888313, 'samples': 778656, 'steps': 1520, 'loss/train': 2.450589418411255} -09/20/2021 19:45:25 - INFO - __main__ - Step 24334: {'lr': 0.00019987939885888313, 'samples': 778688, 'steps': 1520, 'loss/train': 1.9450454711914062} -09/20/2021 19:45:25 - INFO - __main__ - Step 24335: {'lr': 0.00019987939885888313, 'samples': 778720, 'steps': 1520, 'loss/train': 3.8661038875579834} -09/20/2021 19:45:26 - INFO - __main__ - Step 24336: {'lr': 0.00019987939885888313, 'samples': 778752, 'steps': 1520, 'loss/train': 3.25593638420105} -09/20/2021 19:45:27 - INFO - __main__ - Step 24337: {'lr': 0.0001998790854689407, 'samples': 778784, 'steps': 1521, 'loss/train': 3.2792935371398926} -09/20/2021 19:45:28 - INFO - __main__ - Step 24338: {'lr': 0.0001998790854689407, 'samples': 778816, 'steps': 1521, 'loss/train': 2.687713384628296} -09/20/2021 19:45:29 - INFO - __main__ - Step 24339: {'lr': 0.0001998790854689407, 'samples': 778848, 'steps': 1521, 'loss/train': 2.5344414710998535} -09/20/2021 19:45:29 - INFO - __main__ - Step 24340: {'lr': 0.0001998790854689407, 'samples': 778880, 'steps': 1521, 'loss/train': 2.4958393573760986} -09/20/2021 19:45:30 - INFO - __main__ - Step 24341: {'lr': 0.0001998790854689407, 'samples': 778912, 'steps': 1521, 'loss/train': 2.6406819820404053} -09/20/2021 19:45:31 - INFO - __main__ - Step 24342: {'lr': 0.0001998790854689407, 'samples': 778944, 'steps': 1521, 'loss/train': 2.366978168487549} -09/20/2021 19:45:32 - INFO - __main__ - Step 24343: {'lr': 0.0001998790854689407, 'samples': 778976, 'steps': 1521, 'loss/train': 2.3317742347717285} -09/20/2021 19:45:33 - INFO - __main__ - Step 24344: {'lr': 0.0001998790854689407, 'samples': 779008, 'steps': 1521, 'loss/train': 2.9953818321228027} -09/20/2021 19:45:34 - INFO - __main__ - Step 24345: {'lr': 0.0001998790854689407, 'samples': 779040, 'steps': 1521, 'loss/train': 2.829002857208252} -09/20/2021 19:45:35 - INFO - __main__ - Step 24346: {'lr': 0.0001998790854689407, 'samples': 779072, 'steps': 1521, 'loss/train': 3.3223085403442383} -09/20/2021 19:45:35 - INFO - __main__ - Step 24347: {'lr': 0.0001998790854689407, 'samples': 779104, 'steps': 1521, 'loss/train': 2.7608752250671387} -09/20/2021 19:45:36 - INFO - __main__ - Step 24348: {'lr': 0.0001998790854689407, 'samples': 779136, 'steps': 1521, 'loss/train': 4.247581481933594} -09/20/2021 19:45:37 - INFO - __main__ - Step 24349: {'lr': 0.0001998790854689407, 'samples': 779168, 'steps': 1521, 'loss/train': 2.907683849334717} -09/20/2021 19:45:38 - INFO - __main__ - Step 24350: {'lr': 0.0001998790854689407, 'samples': 779200, 'steps': 1521, 'loss/train': 2.17248797416687} -09/20/2021 19:45:38 - INFO - __main__ - Step 24351: {'lr': 0.0001998790854689407, 'samples': 779232, 'steps': 1521, 'loss/train': 3.237778663635254} -09/20/2021 19:45:39 - INFO - __main__ - Step 24352: {'lr': 0.0001998790854689407, 'samples': 779264, 'steps': 1521, 'loss/train': 3.0598337650299072} -09/20/2021 19:45:40 - INFO - __main__ - Step 24353: {'lr': 0.00019987877167259067, 'samples': 779296, 'steps': 1522, 'loss/train': 2.9575188159942627} -09/20/2021 19:45:41 - INFO - __main__ - Step 24354: {'lr': 0.00019987877167259067, 'samples': 779328, 'steps': 1522, 'loss/train': 1.8936823606491089} -09/20/2021 19:45:41 - INFO - __main__ - Step 24355: {'lr': 0.00019987877167259067, 'samples': 779360, 'steps': 1522, 'loss/train': 1.9894440174102783} -09/20/2021 19:45:42 - INFO - __main__ - Step 24356: {'lr': 0.00019987877167259067, 'samples': 779392, 'steps': 1522, 'loss/train': 1.8904402256011963} -09/20/2021 19:45:43 - INFO - __main__ - Step 24357: {'lr': 0.00019987877167259067, 'samples': 779424, 'steps': 1522, 'loss/train': 2.2499725818634033} -09/20/2021 19:45:44 - INFO - __main__ - Step 24358: {'lr': 0.00019987877167259067, 'samples': 779456, 'steps': 1522, 'loss/train': 3.2697410583496094} -09/20/2021 19:45:44 - INFO - __main__ - Step 24359: {'lr': 0.00019987877167259067, 'samples': 779488, 'steps': 1522, 'loss/train': 2.6126697063446045} -09/20/2021 19:45:45 - INFO - __main__ - Step 24360: {'lr': 0.00019987877167259067, 'samples': 779520, 'steps': 1522, 'loss/train': 2.7524313926696777} -09/20/2021 19:45:46 - INFO - __main__ - Step 24361: {'lr': 0.00019987877167259067, 'samples': 779552, 'steps': 1522, 'loss/train': 0.8464513421058655} -09/20/2021 19:45:47 - INFO - __main__ - Step 24362: {'lr': 0.00019987877167259067, 'samples': 779584, 'steps': 1522, 'loss/train': 2.625225305557251} -09/20/2021 19:45:47 - INFO - __main__ - Step 24363: {'lr': 0.00019987877167259067, 'samples': 779616, 'steps': 1522, 'loss/train': 2.5018515586853027} -09/20/2021 19:45:48 - INFO - __main__ - Step 24364: {'lr': 0.00019987877167259067, 'samples': 779648, 'steps': 1522, 'loss/train': 2.6643354892730713} -09/20/2021 19:45:49 - INFO - __main__ - Step 24365: {'lr': 0.00019987877167259067, 'samples': 779680, 'steps': 1522, 'loss/train': 3.0476491451263428} -09/20/2021 19:45:50 - INFO - __main__ - Step 24366: {'lr': 0.00019987877167259067, 'samples': 779712, 'steps': 1522, 'loss/train': 2.7523930072784424} -09/20/2021 19:45:50 - INFO - __main__ - Step 24367: {'lr': 0.00019987877167259067, 'samples': 779744, 'steps': 1522, 'loss/train': 2.7527880668640137} -09/20/2021 19:45:51 - INFO - __main__ - Step 24368: {'lr': 0.00019987877167259067, 'samples': 779776, 'steps': 1522, 'loss/train': 2.3806447982788086} -09/20/2021 19:45:52 - INFO - __main__ - Step 24369: {'lr': 0.0001998784574698343, 'samples': 779808, 'steps': 1523, 'loss/train': 2.9953935146331787} -09/20/2021 19:45:53 - INFO - __main__ - Step 24370: {'lr': 0.0001998784574698343, 'samples': 779840, 'steps': 1523, 'loss/train': 2.6569297313690186} -09/20/2021 19:45:54 - INFO - __main__ - Step 24371: {'lr': 0.0001998784574698343, 'samples': 779872, 'steps': 1523, 'loss/train': 1.724941372871399} -09/20/2021 19:45:54 - INFO - __main__ - Step 24372: {'lr': 0.0001998784574698343, 'samples': 779904, 'steps': 1523, 'loss/train': 1.402208924293518} -09/20/2021 19:45:55 - INFO - __main__ - Step 24373: {'lr': 0.0001998784574698343, 'samples': 779936, 'steps': 1523, 'loss/train': 3.14312481880188} -09/20/2021 19:45:56 - INFO - __main__ - Step 24374: {'lr': 0.0001998784574698343, 'samples': 779968, 'steps': 1523, 'loss/train': 2.7455811500549316} -09/20/2021 19:45:57 - INFO - __main__ - Step 24375: {'lr': 0.0001998784574698343, 'samples': 780000, 'steps': 1523, 'loss/train': 2.8815062046051025} -09/20/2021 19:45:57 - INFO - __main__ - Step 24376: {'lr': 0.0001998784574698343, 'samples': 780032, 'steps': 1523, 'loss/train': 1.5593602657318115} -09/20/2021 19:45:59 - INFO - __main__ - Step 24377: {'lr': 0.0001998784574698343, 'samples': 780064, 'steps': 1523, 'loss/train': 1.4367806911468506} -09/20/2021 19:45:59 - INFO - __main__ - Step 24378: {'lr': 0.0001998784574698343, 'samples': 780096, 'steps': 1523, 'loss/train': 3.2681546211242676} -09/20/2021 19:46:00 - INFO - __main__ - Step 24379: {'lr': 0.0001998784574698343, 'samples': 780128, 'steps': 1523, 'loss/train': 3.4726641178131104} -09/20/2021 19:46:01 - INFO - __main__ - Step 24380: {'lr': 0.0001998784574698343, 'samples': 780160, 'steps': 1523, 'loss/train': 2.4101927280426025} -09/20/2021 19:46:02 - INFO - __main__ - Step 24381: {'lr': 0.0001998784574698343, 'samples': 780192, 'steps': 1523, 'loss/train': 2.758505344390869} -09/20/2021 19:46:02 - INFO - __main__ - Step 24382: {'lr': 0.0001998784574698343, 'samples': 780224, 'steps': 1523, 'loss/train': 2.998551845550537} -09/20/2021 19:46:03 - INFO - __main__ - Step 24383: {'lr': 0.0001998784574698343, 'samples': 780256, 'steps': 1523, 'loss/train': 3.0415611267089844} -09/20/2021 19:46:04 - INFO - __main__ - Step 24384: {'lr': 0.0001998784574698343, 'samples': 780288, 'steps': 1523, 'loss/train': 3.478262186050415} -09/20/2021 19:46:05 - INFO - __main__ - Step 24385: {'lr': 0.00019987814286067285, 'samples': 780320, 'steps': 1524, 'loss/train': 3.0520553588867188} -09/20/2021 19:46:06 - INFO - __main__ - Step 24386: {'lr': 0.00019987814286067285, 'samples': 780352, 'steps': 1524, 'loss/train': 2.148801326751709} -09/20/2021 19:46:06 - INFO - __main__ - Step 24387: {'lr': 0.00019987814286067285, 'samples': 780384, 'steps': 1524, 'loss/train': 2.7248852252960205} -09/20/2021 19:46:07 - INFO - __main__ - Step 24388: {'lr': 0.00019987814286067285, 'samples': 780416, 'steps': 1524, 'loss/train': 2.6307106018066406} -09/20/2021 19:46:08 - INFO - __main__ - Step 24389: {'lr': 0.00019987814286067285, 'samples': 780448, 'steps': 1524, 'loss/train': 3.2527947425842285} -09/20/2021 19:46:09 - INFO - __main__ - Step 24390: {'lr': 0.00019987814286067285, 'samples': 780480, 'steps': 1524, 'loss/train': 2.217172861099243} -09/20/2021 19:46:09 - INFO - __main__ - Step 24391: {'lr': 0.00019987814286067285, 'samples': 780512, 'steps': 1524, 'loss/train': 3.022345542907715} -09/20/2021 19:46:10 - INFO - __main__ - Step 24392: {'lr': 0.00019987814286067285, 'samples': 780544, 'steps': 1524, 'loss/train': 3.276127338409424} -09/20/2021 19:46:11 - INFO - __main__ - Step 24393: {'lr': 0.00019987814286067285, 'samples': 780576, 'steps': 1524, 'loss/train': 3.1443512439727783} -09/20/2021 19:46:12 - INFO - __main__ - Step 24394: {'lr': 0.00019987814286067285, 'samples': 780608, 'steps': 1524, 'loss/train': 6.261258602142334} -09/20/2021 19:46:12 - INFO - __main__ - Step 24395: {'lr': 0.00019987814286067285, 'samples': 780640, 'steps': 1524, 'loss/train': 3.2311127185821533} -09/20/2021 19:46:13 - INFO - __main__ - Step 24396: {'lr': 0.00019987814286067285, 'samples': 780672, 'steps': 1524, 'loss/train': 0.7633740901947021} -09/20/2021 19:46:14 - INFO - __main__ - Step 24397: {'lr': 0.00019987814286067285, 'samples': 780704, 'steps': 1524, 'loss/train': 2.891516923904419} -09/20/2021 19:46:15 - INFO - __main__ - Step 24398: {'lr': 0.00019987814286067285, 'samples': 780736, 'steps': 1524, 'loss/train': 2.3638947010040283} -09/20/2021 19:46:15 - INFO - __main__ - Step 24399: {'lr': 0.00019987814286067285, 'samples': 780768, 'steps': 1524, 'loss/train': 2.6992900371551514} -09/20/2021 19:46:16 - INFO - __main__ - Step 24400: {'lr': 0.00019987814286067285, 'samples': 780800, 'steps': 1524, 'loss/train': 2.812026023864746} -09/20/2021 19:46:17 - INFO - __main__ - Step 24401: {'lr': 0.00019987782784510762, 'samples': 780832, 'steps': 1525, 'loss/train': 3.4665346145629883} -09/20/2021 19:46:18 - INFO - __main__ - Step 24402: {'lr': 0.00019987782784510762, 'samples': 780864, 'steps': 1525, 'loss/train': 3.141505718231201} -09/20/2021 19:46:18 - INFO - __main__ - Step 24403: {'lr': 0.00019987782784510762, 'samples': 780896, 'steps': 1525, 'loss/train': 3.0281388759613037} -09/20/2021 19:46:19 - INFO - __main__ - Step 24404: {'lr': 0.00019987782784510762, 'samples': 780928, 'steps': 1525, 'loss/train': 2.9050605297088623} -09/20/2021 19:46:20 - INFO - __main__ - Step 24405: {'lr': 0.00019987782784510762, 'samples': 780960, 'steps': 1525, 'loss/train': 2.8250906467437744} -09/20/2021 19:46:21 - INFO - __main__ - Step 24406: {'lr': 0.00019987782784510762, 'samples': 780992, 'steps': 1525, 'loss/train': 1.7768707275390625} -09/20/2021 19:46:21 - INFO - __main__ - Step 24407: {'lr': 0.00019987782784510762, 'samples': 781024, 'steps': 1525, 'loss/train': 2.4143426418304443} -09/20/2021 19:46:23 - INFO - __main__ - Step 24408: {'lr': 0.00019987782784510762, 'samples': 781056, 'steps': 1525, 'loss/train': 2.4453320503234863} -09/20/2021 19:46:24 - INFO - __main__ - Step 24409: {'lr': 0.00019987782784510762, 'samples': 781088, 'steps': 1525, 'loss/train': 3.834111213684082} -09/20/2021 19:46:24 - INFO - __main__ - Step 24410: {'lr': 0.00019987782784510762, 'samples': 781120, 'steps': 1525, 'loss/train': 1.7497950792312622} -09/20/2021 19:46:25 - INFO - __main__ - Step 24411: {'lr': 0.00019987782784510762, 'samples': 781152, 'steps': 1525, 'loss/train': 2.2992560863494873} -09/20/2021 19:46:26 - INFO - __main__ - Step 24412: {'lr': 0.00019987782784510762, 'samples': 781184, 'steps': 1525, 'loss/train': 3.014234781265259} -09/20/2021 19:46:27 - INFO - __main__ - Step 24413: {'lr': 0.00019987782784510762, 'samples': 781216, 'steps': 1525, 'loss/train': 2.9986510276794434} -09/20/2021 19:46:27 - INFO - __main__ - Step 24414: {'lr': 0.00019987782784510762, 'samples': 781248, 'steps': 1525, 'loss/train': 3.6120445728302} -09/20/2021 19:46:28 - INFO - __main__ - Step 24415: {'lr': 0.00019987782784510762, 'samples': 781280, 'steps': 1525, 'loss/train': 1.7573213577270508} -09/20/2021 19:46:29 - INFO - __main__ - Step 24416: {'lr': 0.00019987782784510762, 'samples': 781312, 'steps': 1525, 'loss/train': 2.844780445098877} -09/20/2021 19:46:30 - INFO - __main__ - Step 24417: {'lr': 0.00019987751242313991, 'samples': 781344, 'steps': 1526, 'loss/train': 0.8330644965171814} -09/20/2021 19:46:31 - INFO - __main__ - Step 24418: {'lr': 0.00019987751242313991, 'samples': 781376, 'steps': 1526, 'loss/train': 2.677046060562134} -09/20/2021 19:46:31 - INFO - __main__ - Step 24419: {'lr': 0.00019987751242313991, 'samples': 781408, 'steps': 1526, 'loss/train': 2.7467195987701416} -09/20/2021 19:46:32 - INFO - __main__ - Step 24420: {'lr': 0.00019987751242313991, 'samples': 781440, 'steps': 1526, 'loss/train': 3.0071773529052734} -09/20/2021 19:46:33 - INFO - __main__ - Step 24421: {'lr': 0.00019987751242313991, 'samples': 781472, 'steps': 1526, 'loss/train': 4.504948616027832} -09/20/2021 19:46:34 - INFO - __main__ - Step 24422: {'lr': 0.00019987751242313991, 'samples': 781504, 'steps': 1526, 'loss/train': 0.6920358538627625} -09/20/2021 19:46:34 - INFO - __main__ - Step 24423: {'lr': 0.00019987751242313991, 'samples': 781536, 'steps': 1526, 'loss/train': 2.5312576293945312} -09/20/2021 19:46:35 - INFO - __main__ - Step 24424: {'lr': 0.00019987751242313991, 'samples': 781568, 'steps': 1526, 'loss/train': 2.2669014930725098} -09/20/2021 19:46:36 - INFO - __main__ - Step 24425: {'lr': 0.00019987751242313991, 'samples': 781600, 'steps': 1526, 'loss/train': 3.5183956623077393} -09/20/2021 19:46:37 - INFO - __main__ - Step 24426: {'lr': 0.00019987751242313991, 'samples': 781632, 'steps': 1526, 'loss/train': 2.7936997413635254} -09/20/2021 19:46:37 - INFO - __main__ - Step 24427: {'lr': 0.00019987751242313991, 'samples': 781664, 'steps': 1526, 'loss/train': 4.0543131828308105} -09/20/2021 19:46:38 - INFO - __main__ - Step 24428: {'lr': 0.00019987751242313991, 'samples': 781696, 'steps': 1526, 'loss/train': 3.6473138332366943} -09/20/2021 19:46:39 - INFO - __main__ - Step 24429: {'lr': 0.00019987751242313991, 'samples': 781728, 'steps': 1526, 'loss/train': 3.4737558364868164} -09/20/2021 19:46:40 - INFO - __main__ - Step 24430: {'lr': 0.00019987751242313991, 'samples': 781760, 'steps': 1526, 'loss/train': 3.4275081157684326} -09/20/2021 19:46:40 - INFO - __main__ - Step 24431: {'lr': 0.00019987751242313991, 'samples': 781792, 'steps': 1526, 'loss/train': 3.0090205669403076} -09/20/2021 19:46:41 - INFO - __main__ - Step 24432: {'lr': 0.00019987751242313991, 'samples': 781824, 'steps': 1526, 'loss/train': 2.765993118286133} -09/20/2021 19:46:42 - INFO - __main__ - Step 24433: {'lr': 0.000199877196594771, 'samples': 781856, 'steps': 1527, 'loss/train': 2.3897485733032227} -09/20/2021 19:46:43 - INFO - __main__ - Step 24434: {'lr': 0.000199877196594771, 'samples': 781888, 'steps': 1527, 'loss/train': 2.9046506881713867} -09/20/2021 19:46:43 - INFO - __main__ - Step 24435: {'lr': 0.000199877196594771, 'samples': 781920, 'steps': 1527, 'loss/train': 2.66080904006958} -09/20/2021 19:46:44 - INFO - __main__ - Step 24436: {'lr': 0.000199877196594771, 'samples': 781952, 'steps': 1527, 'loss/train': 2.4722039699554443} -09/20/2021 19:46:45 - INFO - __main__ - Step 24437: {'lr': 0.000199877196594771, 'samples': 781984, 'steps': 1527, 'loss/train': 2.0676839351654053} -09/20/2021 19:46:46 - INFO - __main__ - Step 24438: {'lr': 0.000199877196594771, 'samples': 782016, 'steps': 1527, 'loss/train': 0.5529391765594482} -09/20/2021 19:46:46 - INFO - __main__ - Step 24439: {'lr': 0.000199877196594771, 'samples': 782048, 'steps': 1527, 'loss/train': 0.6992378234863281} -09/20/2021 19:46:47 - INFO - __main__ - Step 24440: {'lr': 0.000199877196594771, 'samples': 782080, 'steps': 1527, 'loss/train': 0.477755606174469} -09/20/2021 19:46:49 - INFO - __main__ - Step 24441: {'lr': 0.000199877196594771, 'samples': 782112, 'steps': 1527, 'loss/train': 0.5497768521308899} -09/20/2021 19:46:49 - INFO - __main__ - Step 24442: {'lr': 0.000199877196594771, 'samples': 782144, 'steps': 1527, 'loss/train': 2.4561607837677} -09/20/2021 19:46:50 - INFO - __main__ - Step 24443: {'lr': 0.000199877196594771, 'samples': 782176, 'steps': 1527, 'loss/train': 2.923238754272461} -09/20/2021 19:46:51 - INFO - __main__ - Step 24444: {'lr': 0.000199877196594771, 'samples': 782208, 'steps': 1527, 'loss/train': 3.1839427947998047} -09/20/2021 19:46:52 - INFO - __main__ - Step 24445: {'lr': 0.000199877196594771, 'samples': 782240, 'steps': 1527, 'loss/train': 3.4714295864105225} -09/20/2021 19:46:52 - INFO - __main__ - Step 24446: {'lr': 0.000199877196594771, 'samples': 782272, 'steps': 1527, 'loss/train': 3.0015182495117188} -09/20/2021 19:46:53 - INFO - __main__ - Step 24447: {'lr': 0.000199877196594771, 'samples': 782304, 'steps': 1527, 'loss/train': 3.0041401386260986} -09/20/2021 19:46:54 - INFO - __main__ - Step 24448: {'lr': 0.000199877196594771, 'samples': 782336, 'steps': 1527, 'loss/train': 2.5187313556671143} -09/20/2021 19:46:55 - INFO - __main__ - Step 24449: {'lr': 0.0001998768803600022, 'samples': 782368, 'steps': 1528, 'loss/train': 2.493990182876587} -09/20/2021 19:46:56 - INFO - __main__ - Step 24450: {'lr': 0.0001998768803600022, 'samples': 782400, 'steps': 1528, 'loss/train': 2.8754966259002686} -09/20/2021 19:46:56 - INFO - __main__ - Step 24451: {'lr': 0.0001998768803600022, 'samples': 782432, 'steps': 1528, 'loss/train': 2.99408221244812} -09/20/2021 19:46:57 - INFO - __main__ - Step 24452: {'lr': 0.0001998768803600022, 'samples': 782464, 'steps': 1528, 'loss/train': 3.1220545768737793} -09/20/2021 19:46:58 - INFO - __main__ - Step 24453: {'lr': 0.0001998768803600022, 'samples': 782496, 'steps': 1528, 'loss/train': 5.190174579620361} -09/20/2021 19:46:59 - INFO - __main__ - Step 24454: {'lr': 0.0001998768803600022, 'samples': 782528, 'steps': 1528, 'loss/train': 5.150502681732178} -09/20/2021 19:46:59 - INFO - __main__ - Step 24455: {'lr': 0.0001998768803600022, 'samples': 782560, 'steps': 1528, 'loss/train': 5.117748737335205} -09/20/2021 19:47:00 - INFO - __main__ - Step 24456: {'lr': 0.0001998768803600022, 'samples': 782592, 'steps': 1528, 'loss/train': 5.162067890167236} -09/20/2021 19:47:01 - INFO - __main__ - Step 24457: {'lr': 0.0001998768803600022, 'samples': 782624, 'steps': 1528, 'loss/train': 3.1166930198669434} -09/20/2021 19:47:02 - INFO - __main__ - Step 24458: {'lr': 0.0001998768803600022, 'samples': 782656, 'steps': 1528, 'loss/train': 3.158665657043457} -09/20/2021 19:47:02 - INFO - __main__ - Step 24459: {'lr': 0.0001998768803600022, 'samples': 782688, 'steps': 1528, 'loss/train': 2.406031847000122} -09/20/2021 19:47:03 - INFO - __main__ - Step 24460: {'lr': 0.0001998768803600022, 'samples': 782720, 'steps': 1528, 'loss/train': 2.3842790126800537} -09/20/2021 19:47:04 - INFO - __main__ - Step 24461: {'lr': 0.0001998768803600022, 'samples': 782752, 'steps': 1528, 'loss/train': 3.132423162460327} -09/20/2021 19:47:05 - INFO - __main__ - Step 24462: {'lr': 0.0001998768803600022, 'samples': 782784, 'steps': 1528, 'loss/train': 2.75365948677063} -09/20/2021 19:47:05 - INFO - __main__ - Step 24463: {'lr': 0.0001998768803600022, 'samples': 782816, 'steps': 1528, 'loss/train': 2.1340951919555664} -09/20/2021 19:47:06 - INFO - __main__ - Step 24464: {'lr': 0.0001998768803600022, 'samples': 782848, 'steps': 1528, 'loss/train': 3.106827735900879} -09/20/2021 19:47:07 - INFO - __main__ - Step 24465: {'lr': 0.00019987656371883467, 'samples': 782880, 'steps': 1529, 'loss/train': 2.1832921504974365} -09/20/2021 19:47:08 - INFO - __main__ - Step 24466: {'lr': 0.00019987656371883467, 'samples': 782912, 'steps': 1529, 'loss/train': 3.3587822914123535} -09/20/2021 19:47:08 - INFO - __main__ - Step 24467: {'lr': 0.00019987656371883467, 'samples': 782944, 'steps': 1529, 'loss/train': 4.013500213623047} -09/20/2021 19:47:09 - INFO - __main__ - Step 24468: {'lr': 0.00019987656371883467, 'samples': 782976, 'steps': 1529, 'loss/train': 3.0250155925750732} -09/20/2021 19:47:10 - INFO - __main__ - Step 24469: {'lr': 0.00019987656371883467, 'samples': 783008, 'steps': 1529, 'loss/train': 2.975560188293457} -09/20/2021 19:47:11 - INFO - __main__ - Step 24470: {'lr': 0.00019987656371883467, 'samples': 783040, 'steps': 1529, 'loss/train': 2.466940402984619} -09/20/2021 19:47:11 - INFO - __main__ - Step 24471: {'lr': 0.00019987656371883467, 'samples': 783072, 'steps': 1529, 'loss/train': 3.4409780502319336} -09/20/2021 19:47:12 - INFO - __main__ - Step 24472: {'lr': 0.00019987656371883467, 'samples': 783104, 'steps': 1529, 'loss/train': 3.3729777336120605} -09/20/2021 19:47:13 - INFO - __main__ - Step 24473: {'lr': 0.00019987656371883467, 'samples': 783136, 'steps': 1529, 'loss/train': 2.541663408279419} -09/20/2021 19:47:14 - INFO - __main__ - Step 24474: {'lr': 0.00019987656371883467, 'samples': 783168, 'steps': 1529, 'loss/train': 3.1656689643859863} -09/20/2021 19:47:15 - INFO - __main__ - Step 24475: {'lr': 0.00019987656371883467, 'samples': 783200, 'steps': 1529, 'loss/train': 3.0142741203308105} -09/20/2021 19:47:16 - INFO - __main__ - Step 24476: {'lr': 0.00019987656371883467, 'samples': 783232, 'steps': 1529, 'loss/train': 2.661910057067871} -09/20/2021 19:47:16 - INFO - __main__ - Step 24477: {'lr': 0.00019987656371883467, 'samples': 783264, 'steps': 1529, 'loss/train': 3.786611318588257} -09/20/2021 19:47:17 - INFO - __main__ - Step 24478: {'lr': 0.00019987656371883467, 'samples': 783296, 'steps': 1529, 'loss/train': 3.562251091003418} -09/20/2021 19:47:18 - INFO - __main__ - Step 24479: {'lr': 0.00019987656371883467, 'samples': 783328, 'steps': 1529, 'loss/train': 3.7247731685638428} -09/20/2021 19:47:19 - INFO - __main__ - Step 24480: {'lr': 0.00019987656371883467, 'samples': 783360, 'steps': 1529, 'loss/train': 2.58197283744812} -09/20/2021 19:47:20 - INFO - __main__ - Step 24481: {'lr': 0.00019987624667126984, 'samples': 783392, 'steps': 1530, 'loss/train': 2.6920504570007324} -09/20/2021 19:47:20 - INFO - __main__ - Step 24482: {'lr': 0.00019987624667126984, 'samples': 783424, 'steps': 1530, 'loss/train': 1.0240038633346558} -09/20/2021 19:47:21 - INFO - __main__ - Step 24483: {'lr': 0.00019987624667126984, 'samples': 783456, 'steps': 1530, 'loss/train': 3.3668272495269775} -09/20/2021 19:47:22 - INFO - __main__ - Step 24484: {'lr': 0.00019987624667126984, 'samples': 783488, 'steps': 1530, 'loss/train': 1.364880919456482} -09/20/2021 19:47:23 - INFO - __main__ - Step 24485: {'lr': 0.00019987624667126984, 'samples': 783520, 'steps': 1530, 'loss/train': 2.7054293155670166} -09/20/2021 19:47:23 - INFO - __main__ - Step 24486: {'lr': 0.00019987624667126984, 'samples': 783552, 'steps': 1530, 'loss/train': 3.1320278644561768} -09/20/2021 19:47:24 - INFO - __main__ - Step 24487: {'lr': 0.00019987624667126984, 'samples': 783584, 'steps': 1530, 'loss/train': 3.0474607944488525} -09/20/2021 19:47:25 - INFO - __main__ - Step 24488: {'lr': 0.00019987624667126984, 'samples': 783616, 'steps': 1530, 'loss/train': 3.390477180480957} -09/20/2021 19:47:26 - INFO - __main__ - Step 24489: {'lr': 0.00019987624667126984, 'samples': 783648, 'steps': 1530, 'loss/train': 3.030207633972168} -09/20/2021 19:47:26 - INFO - __main__ - Step 24490: {'lr': 0.00019987624667126984, 'samples': 783680, 'steps': 1530, 'loss/train': 2.351320266723633} -09/20/2021 19:47:27 - INFO - __main__ - Step 24491: {'lr': 0.00019987624667126984, 'samples': 783712, 'steps': 1530, 'loss/train': 2.283546209335327} -09/20/2021 19:47:28 - INFO - __main__ - Step 24492: {'lr': 0.00019987624667126984, 'samples': 783744, 'steps': 1530, 'loss/train': 2.3870298862457275} -09/20/2021 19:47:29 - INFO - __main__ - Step 24493: {'lr': 0.00019987624667126984, 'samples': 783776, 'steps': 1530, 'loss/train': 3.2334537506103516} -09/20/2021 19:47:29 - INFO - __main__ - Step 24494: {'lr': 0.00019987624667126984, 'samples': 783808, 'steps': 1530, 'loss/train': 2.8874216079711914} -09/20/2021 19:47:30 - INFO - __main__ - Step 24495: {'lr': 0.00019987624667126984, 'samples': 783840, 'steps': 1530, 'loss/train': 1.9940184354782104} -09/20/2021 19:47:31 - INFO - __main__ - Step 24496: {'lr': 0.00019987624667126984, 'samples': 783872, 'steps': 1530, 'loss/train': 2.542658567428589} -09/20/2021 19:47:32 - INFO - __main__ - Step 24497: {'lr': 0.00019987592921730897, 'samples': 783904, 'steps': 1531, 'loss/train': 3.5922539234161377} -09/20/2021 19:47:33 - INFO - __main__ - Step 24498: {'lr': 0.00019987592921730897, 'samples': 783936, 'steps': 1531, 'loss/train': 4.13003396987915} -09/20/2021 19:47:33 - INFO - __main__ - Step 24499: {'lr': 0.00019987592921730897, 'samples': 783968, 'steps': 1531, 'loss/train': 3.33740234375} -09/20/2021 19:47:34 - INFO - __main__ - Step 24500: {'lr': 0.00019987592921730897, 'samples': 784000, 'steps': 1531, 'loss/train': 2.9242587089538574} -09/20/2021 19:47:35 - INFO - __main__ - Step 24501: {'lr': 0.00019987592921730897, 'samples': 784032, 'steps': 1531, 'loss/train': 3.1512770652770996} -09/20/2021 19:47:36 - INFO - __main__ - Step 24502: {'lr': 0.00019987592921730897, 'samples': 784064, 'steps': 1531, 'loss/train': 2.9391467571258545} -09/20/2021 19:47:37 - INFO - __main__ - Step 24503: {'lr': 0.00019987592921730897, 'samples': 784096, 'steps': 1531, 'loss/train': 2.5612030029296875} -09/20/2021 19:47:38 - INFO - __main__ - Step 24504: {'lr': 0.00019987592921730897, 'samples': 784128, 'steps': 1531, 'loss/train': 2.052293062210083} -09/20/2021 19:47:38 - INFO - __main__ - Step 24505: {'lr': 0.00019987592921730897, 'samples': 784160, 'steps': 1531, 'loss/train': 3.4539146423339844} -09/20/2021 19:47:39 - INFO - __main__ - Step 24506: {'lr': 0.00019987592921730897, 'samples': 784192, 'steps': 1531, 'loss/train': 2.6096150875091553} -09/20/2021 19:47:40 - INFO - __main__ - Step 24507: {'lr': 0.00019987592921730897, 'samples': 784224, 'steps': 1531, 'loss/train': 3.440859079360962} -09/20/2021 19:47:41 - INFO - __main__ - Step 24508: {'lr': 0.00019987592921730897, 'samples': 784256, 'steps': 1531, 'loss/train': 2.8710947036743164} -09/20/2021 19:47:41 - INFO - __main__ - Step 24509: {'lr': 0.00019987592921730897, 'samples': 784288, 'steps': 1531, 'loss/train': 2.9643616676330566} -09/20/2021 19:47:42 - INFO - __main__ - Step 24510: {'lr': 0.00019987592921730897, 'samples': 784320, 'steps': 1531, 'loss/train': 3.4651806354522705} -09/20/2021 19:47:43 - INFO - __main__ - Step 24511: {'lr': 0.00019987592921730897, 'samples': 784352, 'steps': 1531, 'loss/train': 3.34761118888855} -09/20/2021 19:47:44 - INFO - __main__ - Step 24512: {'lr': 0.00019987592921730897, 'samples': 784384, 'steps': 1531, 'loss/train': 3.4235334396362305} -09/20/2021 19:47:44 - INFO - __main__ - Step 24513: {'lr': 0.0001998756113569533, 'samples': 784416, 'steps': 1532, 'loss/train': 6.188966274261475} -09/20/2021 19:47:45 - INFO - __main__ - Step 24514: {'lr': 0.0001998756113569533, 'samples': 784448, 'steps': 1532, 'loss/train': 2.861872673034668} -09/20/2021 19:47:46 - INFO - __main__ - Step 24515: {'lr': 0.0001998756113569533, 'samples': 784480, 'steps': 1532, 'loss/train': 2.851083993911743} -09/20/2021 19:47:47 - INFO - __main__ - Step 24516: {'lr': 0.0001998756113569533, 'samples': 784512, 'steps': 1532, 'loss/train': 3.504075050354004} -09/20/2021 19:47:47 - INFO - __main__ - Step 24517: {'lr': 0.0001998756113569533, 'samples': 784544, 'steps': 1532, 'loss/train': 2.9116415977478027} -09/20/2021 19:47:48 - INFO - __main__ - Step 24518: {'lr': 0.0001998756113569533, 'samples': 784576, 'steps': 1532, 'loss/train': 2.3294262886047363} -09/20/2021 19:47:49 - INFO - __main__ - Step 24519: {'lr': 0.0001998756113569533, 'samples': 784608, 'steps': 1532, 'loss/train': 2.2134556770324707} -09/20/2021 19:47:50 - INFO - __main__ - Step 24520: {'lr': 0.0001998756113569533, 'samples': 784640, 'steps': 1532, 'loss/train': 3.720874547958374} -09/20/2021 19:47:50 - INFO - __main__ - Step 24521: {'lr': 0.0001998756113569533, 'samples': 784672, 'steps': 1532, 'loss/train': 3.1791903972625732} -09/20/2021 19:47:51 - INFO - __main__ - Step 24522: {'lr': 0.0001998756113569533, 'samples': 784704, 'steps': 1532, 'loss/train': 3.2409274578094482} -09/20/2021 19:47:52 - INFO - __main__ - Step 24523: {'lr': 0.0001998756113569533, 'samples': 784736, 'steps': 1532, 'loss/train': 3.4137566089630127} -09/20/2021 19:47:53 - INFO - __main__ - Step 24524: {'lr': 0.0001998756113569533, 'samples': 784768, 'steps': 1532, 'loss/train': 2.6581411361694336} -09/20/2021 19:47:53 - INFO - __main__ - Step 24525: {'lr': 0.0001998756113569533, 'samples': 784800, 'steps': 1532, 'loss/train': 2.5373473167419434} -09/20/2021 19:47:54 - INFO - __main__ - Step 24526: {'lr': 0.0001998756113569533, 'samples': 784832, 'steps': 1532, 'loss/train': 2.058912515640259} -09/20/2021 19:47:55 - INFO - __main__ - Step 24527: {'lr': 0.0001998756113569533, 'samples': 784864, 'steps': 1532, 'loss/train': 2.430020332336426} -09/20/2021 19:47:56 - INFO - __main__ - Step 24528: {'lr': 0.0001998756113569533, 'samples': 784896, 'steps': 1532, 'loss/train': 2.727278470993042} -09/20/2021 19:47:57 - INFO - __main__ - Step 24529: {'lr': 0.00019987529309020417, 'samples': 784928, 'steps': 1533, 'loss/train': 3.5902271270751953} -09/20/2021 19:47:57 - INFO - __main__ - Step 24530: {'lr': 0.00019987529309020417, 'samples': 784960, 'steps': 1533, 'loss/train': 2.0694167613983154} -09/20/2021 19:47:58 - INFO - __main__ - Step 24531: {'lr': 0.00019987529309020417, 'samples': 784992, 'steps': 1533, 'loss/train': 2.23199200630188} -09/20/2021 19:47:59 - INFO - __main__ - Step 24532: {'lr': 0.00019987529309020417, 'samples': 785024, 'steps': 1533, 'loss/train': 3.8607726097106934} -09/20/2021 19:48:00 - INFO - __main__ - Step 24533: {'lr': 0.00019987529309020417, 'samples': 785056, 'steps': 1533, 'loss/train': 3.0909852981567383} -09/20/2021 19:48:01 - INFO - __main__ - Step 24534: {'lr': 0.00019987529309020417, 'samples': 785088, 'steps': 1533, 'loss/train': 3.2101330757141113} -09/20/2021 19:48:02 - INFO - __main__ - Step 24535: {'lr': 0.00019987529309020417, 'samples': 785120, 'steps': 1533, 'loss/train': 3.742497682571411} -09/20/2021 19:48:03 - INFO - __main__ - Step 24536: {'lr': 0.00019987529309020417, 'samples': 785152, 'steps': 1533, 'loss/train': 1.8720793724060059} -09/20/2021 19:48:03 - INFO - __main__ - Step 24537: {'lr': 0.00019987529309020417, 'samples': 785184, 'steps': 1533, 'loss/train': 3.7655997276306152} -09/20/2021 19:48:04 - INFO - __main__ - Step 24538: {'lr': 0.00019987529309020417, 'samples': 785216, 'steps': 1533, 'loss/train': 3.2826008796691895} -09/20/2021 19:48:05 - INFO - __main__ - Step 24539: {'lr': 0.00019987529309020417, 'samples': 785248, 'steps': 1533, 'loss/train': 2.6667702198028564} -09/20/2021 19:48:06 - INFO - __main__ - Step 24540: {'lr': 0.00019987529309020417, 'samples': 785280, 'steps': 1533, 'loss/train': 3.753486394882202} -09/20/2021 19:48:06 - INFO - __main__ - Step 24541: {'lr': 0.00019987529309020417, 'samples': 785312, 'steps': 1533, 'loss/train': 3.8514490127563477} -09/20/2021 19:48:07 - INFO - __main__ - Step 24542: {'lr': 0.00019987529309020417, 'samples': 785344, 'steps': 1533, 'loss/train': 2.3463151454925537} -09/20/2021 19:48:08 - INFO - __main__ - Step 24543: {'lr': 0.00019987529309020417, 'samples': 785376, 'steps': 1533, 'loss/train': 2.22806978225708} -09/20/2021 19:48:09 - INFO - __main__ - Step 24544: {'lr': 0.00019987529309020417, 'samples': 785408, 'steps': 1533, 'loss/train': 2.680354595184326} -09/20/2021 19:48:09 - INFO - __main__ - Step 24545: {'lr': 0.00019987497441706286, 'samples': 785440, 'steps': 1534, 'loss/train': 2.7171432971954346} -09/20/2021 19:48:10 - INFO - __main__ - Step 24546: {'lr': 0.00019987497441706286, 'samples': 785472, 'steps': 1534, 'loss/train': 2.614219903945923} -09/20/2021 19:48:11 - INFO - __main__ - Step 24547: {'lr': 0.00019987497441706286, 'samples': 785504, 'steps': 1534, 'loss/train': 3.2116940021514893} -09/20/2021 19:48:12 - INFO - __main__ - Step 24548: {'lr': 0.00019987497441706286, 'samples': 785536, 'steps': 1534, 'loss/train': 0.5848186016082764} -09/20/2021 19:48:12 - INFO - __main__ - Step 24549: {'lr': 0.00019987497441706286, 'samples': 785568, 'steps': 1534, 'loss/train': 0.4906904399394989} -09/20/2021 19:48:13 - INFO - __main__ - Step 24550: {'lr': 0.00019987497441706286, 'samples': 785600, 'steps': 1534, 'loss/train': 0.333259254693985} -09/20/2021 19:48:14 - INFO - __main__ - Step 24551: {'lr': 0.00019987497441706286, 'samples': 785632, 'steps': 1534, 'loss/train': 3.2192249298095703} -09/20/2021 19:48:15 - INFO - __main__ - Step 24552: {'lr': 0.00019987497441706286, 'samples': 785664, 'steps': 1534, 'loss/train': 2.8223671913146973} -09/20/2021 19:48:15 - INFO - __main__ - Step 24553: {'lr': 0.00019987497441706286, 'samples': 785696, 'steps': 1534, 'loss/train': 2.7980074882507324} -09/20/2021 19:48:16 - INFO - __main__ - Step 24554: {'lr': 0.00019987497441706286, 'samples': 785728, 'steps': 1534, 'loss/train': 3.4407265186309814} -09/20/2021 19:48:17 - INFO - __main__ - Step 24555: {'lr': 0.00019987497441706286, 'samples': 785760, 'steps': 1534, 'loss/train': 2.1891486644744873} -09/20/2021 19:48:18 - INFO - __main__ - Step 24556: {'lr': 0.00019987497441706286, 'samples': 785792, 'steps': 1534, 'loss/train': 3.105837106704712} -09/20/2021 19:48:18 - INFO - __main__ - Step 24557: {'lr': 0.00019987497441706286, 'samples': 785824, 'steps': 1534, 'loss/train': 2.1754724979400635} -09/20/2021 19:48:19 - INFO - __main__ - Step 24558: {'lr': 0.00019987497441706286, 'samples': 785856, 'steps': 1534, 'loss/train': 2.7219388484954834} -09/20/2021 19:48:20 - INFO - __main__ - Step 24559: {'lr': 0.00019987497441706286, 'samples': 785888, 'steps': 1534, 'loss/train': 3.425400495529175} -09/20/2021 19:48:21 - INFO - __main__ - Step 24560: {'lr': 0.00019987497441706286, 'samples': 785920, 'steps': 1534, 'loss/train': 2.8472931385040283} -09/20/2021 19:48:22 - INFO - __main__ - Step 24561: {'lr': 0.00019987465533753067, 'samples': 785952, 'steps': 1535, 'loss/train': 2.579787254333496} -09/20/2021 19:48:22 - INFO - __main__ - Step 24562: {'lr': 0.00019987465533753067, 'samples': 785984, 'steps': 1535, 'loss/train': 5.467308521270752} -09/20/2021 19:48:23 - INFO - __main__ - Step 24563: {'lr': 0.00019987465533753067, 'samples': 786016, 'steps': 1535, 'loss/train': 2.777642011642456} -09/20/2021 19:48:24 - INFO - __main__ - Step 24564: {'lr': 0.00019987465533753067, 'samples': 786048, 'steps': 1535, 'loss/train': 2.097963571548462} -09/20/2021 19:48:25 - INFO - __main__ - Step 24565: {'lr': 0.00019987465533753067, 'samples': 786080, 'steps': 1535, 'loss/train': 2.5489563941955566} -09/20/2021 19:48:26 - INFO - __main__ - Step 24566: {'lr': 0.00019987465533753067, 'samples': 786112, 'steps': 1535, 'loss/train': 2.2765538692474365} -09/20/2021 19:48:27 - INFO - __main__ - Step 24567: {'lr': 0.00019987465533753067, 'samples': 786144, 'steps': 1535, 'loss/train': 2.7454159259796143} -09/20/2021 19:48:27 - INFO - __main__ - Step 24568: {'lr': 0.00019987465533753067, 'samples': 786176, 'steps': 1535, 'loss/train': 2.5909957885742188} -09/20/2021 19:48:28 - INFO - __main__ - Step 24569: {'lr': 0.00019987465533753067, 'samples': 786208, 'steps': 1535, 'loss/train': 2.754737377166748} -09/20/2021 19:48:29 - INFO - __main__ - Step 24570: {'lr': 0.00019987465533753067, 'samples': 786240, 'steps': 1535, 'loss/train': 3.8557229042053223} -09/20/2021 19:48:30 - INFO - __main__ - Step 24571: {'lr': 0.00019987465533753067, 'samples': 786272, 'steps': 1535, 'loss/train': 3.6351513862609863} -09/20/2021 19:48:30 - INFO - __main__ - Step 24572: {'lr': 0.00019987465533753067, 'samples': 786304, 'steps': 1535, 'loss/train': 3.0837178230285645} -09/20/2021 19:48:31 - INFO - __main__ - Step 24573: {'lr': 0.00019987465533753067, 'samples': 786336, 'steps': 1535, 'loss/train': 2.787860155105591} -09/20/2021 19:48:32 - INFO - __main__ - Step 24574: {'lr': 0.00019987465533753067, 'samples': 786368, 'steps': 1535, 'loss/train': 2.7318594455718994} -09/20/2021 19:48:33 - INFO - __main__ - Step 24575: {'lr': 0.00019987465533753067, 'samples': 786400, 'steps': 1535, 'loss/train': 3.5007941722869873} -09/20/2021 19:48:33 - INFO - __main__ - Step 24576: {'lr': 0.00019987465533753067, 'samples': 786432, 'steps': 1535, 'loss/train': 2.1113781929016113} -09/20/2021 19:48:34 - INFO - __main__ - Step 24577: {'lr': 0.00019987433585160887, 'samples': 786464, 'steps': 1536, 'loss/train': 2.842329978942871} -09/20/2021 19:48:35 - INFO - __main__ - Step 24578: {'lr': 0.00019987433585160887, 'samples': 786496, 'steps': 1536, 'loss/train': 3.2259292602539062} -09/20/2021 19:48:36 - INFO - __main__ - Step 24579: {'lr': 0.00019987433585160887, 'samples': 786528, 'steps': 1536, 'loss/train': 3.249600410461426} -09/20/2021 19:48:37 - INFO - __main__ - Step 24580: {'lr': 0.00019987433585160887, 'samples': 786560, 'steps': 1536, 'loss/train': 3.8409640789031982} -09/20/2021 19:48:37 - INFO - __main__ - Step 24581: {'lr': 0.00019987433585160887, 'samples': 786592, 'steps': 1536, 'loss/train': 2.526409864425659} -09/20/2021 19:48:38 - INFO - __main__ - Step 24582: {'lr': 0.00019987433585160887, 'samples': 786624, 'steps': 1536, 'loss/train': 3.660585880279541} -09/20/2021 19:48:39 - INFO - __main__ - Step 24583: {'lr': 0.00019987433585160887, 'samples': 786656, 'steps': 1536, 'loss/train': 3.736017942428589} -09/20/2021 19:48:40 - INFO - __main__ - Step 24584: {'lr': 0.00019987433585160887, 'samples': 786688, 'steps': 1536, 'loss/train': 3.0094802379608154} -09/20/2021 19:48:40 - INFO - __main__ - Step 24585: {'lr': 0.00019987433585160887, 'samples': 786720, 'steps': 1536, 'loss/train': 2.837928056716919} -09/20/2021 19:48:41 - INFO - __main__ - Step 24586: {'lr': 0.00019987433585160887, 'samples': 786752, 'steps': 1536, 'loss/train': 2.987741470336914} -09/20/2021 19:48:42 - INFO - __main__ - Step 24587: {'lr': 0.00019987433585160887, 'samples': 786784, 'steps': 1536, 'loss/train': 0.851452112197876} -09/20/2021 19:48:43 - INFO - __main__ - Step 24588: {'lr': 0.00019987433585160887, 'samples': 786816, 'steps': 1536, 'loss/train': 3.1138527393341064} -09/20/2021 19:48:43 - INFO - __main__ - Step 24589: {'lr': 0.00019987433585160887, 'samples': 786848, 'steps': 1536, 'loss/train': 2.589925765991211} -09/20/2021 19:48:44 - INFO - __main__ - Step 24590: {'lr': 0.00019987433585160887, 'samples': 786880, 'steps': 1536, 'loss/train': 2.7853870391845703} -09/20/2021 19:48:45 - INFO - __main__ - Step 24591: {'lr': 0.00019987433585160887, 'samples': 786912, 'steps': 1536, 'loss/train': 2.209670066833496} -09/20/2021 19:48:46 - INFO - __main__ - Step 24592: {'lr': 0.00019987433585160887, 'samples': 786944, 'steps': 1536, 'loss/train': 2.872598648071289} -09/20/2021 19:48:46 - INFO - __main__ - Step 24593: {'lr': 0.0001998740159592988, 'samples': 786976, 'steps': 1537, 'loss/train': 2.2594103813171387} -09/20/2021 19:48:47 - INFO - __main__ - Step 24594: {'lr': 0.0001998740159592988, 'samples': 787008, 'steps': 1537, 'loss/train': 2.480215072631836} -09/20/2021 19:48:48 - INFO - __main__ - Step 24595: {'lr': 0.0001998740159592988, 'samples': 787040, 'steps': 1537, 'loss/train': 3.3644773960113525} -09/20/2021 19:48:49 - INFO - __main__ - Step 24596: {'lr': 0.0001998740159592988, 'samples': 787072, 'steps': 1537, 'loss/train': 1.7765281200408936} -09/20/2021 19:48:50 - INFO - __main__ - Step 24597: {'lr': 0.0001998740159592988, 'samples': 787104, 'steps': 1537, 'loss/train': 2.6896965503692627} -09/20/2021 19:48:51 - INFO - __main__ - Step 24598: {'lr': 0.0001998740159592988, 'samples': 787136, 'steps': 1537, 'loss/train': 3.4616358280181885} -09/20/2021 19:48:51 - INFO - __main__ - Step 24599: {'lr': 0.0001998740159592988, 'samples': 787168, 'steps': 1537, 'loss/train': 3.2299561500549316} -09/20/2021 19:48:52 - INFO - __main__ - Step 24600: {'lr': 0.0001998740159592988, 'samples': 787200, 'steps': 1537, 'loss/train': 2.532877206802368} -09/20/2021 19:48:53 - INFO - __main__ - Step 24601: {'lr': 0.0001998740159592988, 'samples': 787232, 'steps': 1537, 'loss/train': 3.421365261077881} -09/20/2021 19:48:54 - INFO - __main__ - Step 24602: {'lr': 0.0001998740159592988, 'samples': 787264, 'steps': 1537, 'loss/train': 2.2842984199523926} -09/20/2021 19:48:54 - INFO - __main__ - Step 24603: {'lr': 0.0001998740159592988, 'samples': 787296, 'steps': 1537, 'loss/train': 3.312828302383423} -09/20/2021 19:48:55 - INFO - __main__ - Step 24604: {'lr': 0.0001998740159592988, 'samples': 787328, 'steps': 1537, 'loss/train': 2.3745789527893066} -09/20/2021 19:48:56 - INFO - __main__ - Step 24605: {'lr': 0.0001998740159592988, 'samples': 787360, 'steps': 1537, 'loss/train': 3.109271287918091} -09/20/2021 19:48:57 - INFO - __main__ - Step 24606: {'lr': 0.0001998740159592988, 'samples': 787392, 'steps': 1537, 'loss/train': 3.2790451049804688} -09/20/2021 19:48:57 - INFO - __main__ - Step 24607: {'lr': 0.0001998740159592988, 'samples': 787424, 'steps': 1537, 'loss/train': 2.7528460025787354} -09/20/2021 19:48:58 - INFO - __main__ - Step 24608: {'lr': 0.0001998740159592988, 'samples': 787456, 'steps': 1537, 'loss/train': 2.9659359455108643} -09/20/2021 19:48:59 - INFO - __main__ - Step 24609: {'lr': 0.00019987369566060176, 'samples': 787488, 'steps': 1538, 'loss/train': 3.259620189666748} -09/20/2021 19:49:00 - INFO - __main__ - Step 24610: {'lr': 0.00019987369566060176, 'samples': 787520, 'steps': 1538, 'loss/train': 2.943317174911499} -09/20/2021 19:49:01 - INFO - __main__ - Step 24611: {'lr': 0.00019987369566060176, 'samples': 787552, 'steps': 1538, 'loss/train': 2.5413007736206055} -09/20/2021 19:49:01 - INFO - __main__ - Step 24612: {'lr': 0.00019987369566060176, 'samples': 787584, 'steps': 1538, 'loss/train': 2.9123566150665283} -09/20/2021 19:49:02 - INFO - __main__ - Step 24613: {'lr': 0.00019987369566060176, 'samples': 787616, 'steps': 1538, 'loss/train': 3.8783485889434814} -09/20/2021 19:49:03 - INFO - __main__ - Step 24614: {'lr': 0.00019987369566060176, 'samples': 787648, 'steps': 1538, 'loss/train': 2.314951181411743} -09/20/2021 19:49:04 - INFO - __main__ - Step 24615: {'lr': 0.00019987369566060176, 'samples': 787680, 'steps': 1538, 'loss/train': 2.1152796745300293} -09/20/2021 19:49:04 - INFO - __main__ - Step 24616: {'lr': 0.00019987369566060176, 'samples': 787712, 'steps': 1538, 'loss/train': 2.14705228805542} -09/20/2021 19:49:05 - INFO - __main__ - Step 24617: {'lr': 0.00019987369566060176, 'samples': 787744, 'steps': 1538, 'loss/train': 2.2409732341766357} -09/20/2021 19:49:06 - INFO - __main__ - Step 24618: {'lr': 0.00019987369566060176, 'samples': 787776, 'steps': 1538, 'loss/train': 2.5435497760772705} -09/20/2021 19:49:07 - INFO - __main__ - Step 24619: {'lr': 0.00019987369566060176, 'samples': 787808, 'steps': 1538, 'loss/train': 3.5642168521881104} -09/20/2021 19:49:07 - INFO - __main__ - Step 24620: {'lr': 0.00019987369566060176, 'samples': 787840, 'steps': 1538, 'loss/train': 3.5867762565612793} -09/20/2021 19:49:08 - INFO - __main__ - Step 24621: {'lr': 0.00019987369566060176, 'samples': 787872, 'steps': 1538, 'loss/train': 2.6891274452209473} -09/20/2021 19:49:09 - INFO - __main__ - Step 24622: {'lr': 0.00019987369566060176, 'samples': 787904, 'steps': 1538, 'loss/train': 2.569368362426758} -09/20/2021 19:49:10 - INFO - __main__ - Step 24623: {'lr': 0.00019987369566060176, 'samples': 787936, 'steps': 1538, 'loss/train': 2.921966791152954} -09/20/2021 19:49:10 - INFO - __main__ - Step 24624: {'lr': 0.00019987369566060176, 'samples': 787968, 'steps': 1538, 'loss/train': 4.6468634605407715} -09/20/2021 19:49:11 - INFO - __main__ - Step 24625: {'lr': 0.00019987337495551904, 'samples': 788000, 'steps': 1539, 'loss/train': 2.5235486030578613} -09/20/2021 19:49:13 - INFO - __main__ - Step 24626: {'lr': 0.00019987337495551904, 'samples': 788032, 'steps': 1539, 'loss/train': 2.5032639503479004} -09/20/2021 19:49:14 - INFO - __main__ - Step 24627: {'lr': 0.00019987337495551904, 'samples': 788064, 'steps': 1539, 'loss/train': 3.235156536102295} -09/20/2021 19:49:15 - INFO - __main__ - Step 24628: {'lr': 0.00019987337495551904, 'samples': 788096, 'steps': 1539, 'loss/train': 2.7291038036346436} -09/20/2021 19:49:15 - INFO - __main__ - Step 24629: {'lr': 0.00019987337495551904, 'samples': 788128, 'steps': 1539, 'loss/train': 1.7233184576034546} -09/20/2021 19:49:16 - INFO - __main__ - Step 24630: {'lr': 0.00019987337495551904, 'samples': 788160, 'steps': 1539, 'loss/train': 2.0050208568573} -09/20/2021 19:49:17 - INFO - __main__ - Step 24631: {'lr': 0.00019987337495551904, 'samples': 788192, 'steps': 1539, 'loss/train': 2.1994547843933105} -09/20/2021 19:49:18 - INFO - __main__ - Step 24632: {'lr': 0.00019987337495551904, 'samples': 788224, 'steps': 1539, 'loss/train': 2.373645067214966} -09/20/2021 19:49:18 - INFO - __main__ - Step 24633: {'lr': 0.00019987337495551904, 'samples': 788256, 'steps': 1539, 'loss/train': 2.7044615745544434} -09/20/2021 19:49:19 - INFO - __main__ - Step 24634: {'lr': 0.00019987337495551904, 'samples': 788288, 'steps': 1539, 'loss/train': 2.3609118461608887} -09/20/2021 19:49:20 - INFO - __main__ - Step 24635: {'lr': 0.00019987337495551904, 'samples': 788320, 'steps': 1539, 'loss/train': 3.004725456237793} -09/20/2021 19:49:21 - INFO - __main__ - Step 24636: {'lr': 0.00019987337495551904, 'samples': 788352, 'steps': 1539, 'loss/train': 2.7969372272491455} -09/20/2021 19:49:21 - INFO - __main__ - Step 24637: {'lr': 0.00019987337495551904, 'samples': 788384, 'steps': 1539, 'loss/train': 2.4488000869750977} -09/20/2021 19:49:22 - INFO - __main__ - Step 24638: {'lr': 0.00019987337495551904, 'samples': 788416, 'steps': 1539, 'loss/train': 2.067009210586548} -09/20/2021 19:49:23 - INFO - __main__ - Step 24639: {'lr': 0.00019987337495551904, 'samples': 788448, 'steps': 1539, 'loss/train': 2.8877527713775635} -09/20/2021 19:49:24 - INFO - __main__ - Step 24640: {'lr': 0.00019987337495551904, 'samples': 788480, 'steps': 1539, 'loss/train': 3.345898151397705} -09/20/2021 19:49:24 - INFO - __main__ - Step 24641: {'lr': 0.00019987305384405193, 'samples': 788512, 'steps': 1540, 'loss/train': 3.1921751499176025} -09/20/2021 19:49:25 - INFO - __main__ - Step 24642: {'lr': 0.00019987305384405193, 'samples': 788544, 'steps': 1540, 'loss/train': 3.1739070415496826} -09/20/2021 19:49:26 - INFO - __main__ - Step 24643: {'lr': 0.00019987305384405193, 'samples': 788576, 'steps': 1540, 'loss/train': 3.2896885871887207} -09/20/2021 19:49:27 - INFO - __main__ - Step 24644: {'lr': 0.00019987305384405193, 'samples': 788608, 'steps': 1540, 'loss/train': 3.71235728263855} -09/20/2021 19:49:27 - INFO - __main__ - Step 24645: {'lr': 0.00019987305384405193, 'samples': 788640, 'steps': 1540, 'loss/train': 3.288067579269409} -09/20/2021 19:49:28 - INFO - __main__ - Step 24646: {'lr': 0.00019987305384405193, 'samples': 788672, 'steps': 1540, 'loss/train': 3.4503982067108154} -09/20/2021 19:49:29 - INFO - __main__ - Step 24647: {'lr': 0.00019987305384405193, 'samples': 788704, 'steps': 1540, 'loss/train': 2.801997184753418} -09/20/2021 19:49:30 - INFO - __main__ - Step 24648: {'lr': 0.00019987305384405193, 'samples': 788736, 'steps': 1540, 'loss/train': 2.8211007118225098} -09/20/2021 19:49:30 - INFO - __main__ - Step 24649: {'lr': 0.00019987305384405193, 'samples': 788768, 'steps': 1540, 'loss/train': 2.6089136600494385} -09/20/2021 19:49:31 - INFO - __main__ - Step 24650: {'lr': 0.00019987305384405193, 'samples': 788800, 'steps': 1540, 'loss/train': 2.303469181060791} -09/20/2021 19:49:32 - INFO - __main__ - Step 24651: {'lr': 0.00019987305384405193, 'samples': 788832, 'steps': 1540, 'loss/train': 3.287358522415161} -09/20/2021 19:49:33 - INFO - __main__ - Step 24652: {'lr': 0.00019987305384405193, 'samples': 788864, 'steps': 1540, 'loss/train': 3.3170056343078613} -09/20/2021 19:49:33 - INFO - __main__ - Step 24653: {'lr': 0.00019987305384405193, 'samples': 788896, 'steps': 1540, 'loss/train': 4.997308731079102} -09/20/2021 19:49:34 - INFO - __main__ - Step 24654: {'lr': 0.00019987305384405193, 'samples': 788928, 'steps': 1540, 'loss/train': 3.2495760917663574} -09/20/2021 19:49:35 - INFO - __main__ - Step 24655: {'lr': 0.00019987305384405193, 'samples': 788960, 'steps': 1540, 'loss/train': 3.337941884994507} -09/20/2021 19:49:36 - INFO - __main__ - Step 24656: {'lr': 0.00019987305384405193, 'samples': 788992, 'steps': 1540, 'loss/train': 3.265399217605591} -09/20/2021 19:49:37 - INFO - __main__ - Step 24657: {'lr': 0.00019987273232620174, 'samples': 789024, 'steps': 1541, 'loss/train': 2.8398690223693848} -09/20/2021 19:49:38 - INFO - __main__ - Step 24658: {'lr': 0.00019987273232620174, 'samples': 789056, 'steps': 1541, 'loss/train': 2.0869083404541016} -09/20/2021 19:49:39 - INFO - __main__ - Step 24659: {'lr': 0.00019987273232620174, 'samples': 789088, 'steps': 1541, 'loss/train': 3.0101583003997803} -09/20/2021 19:49:39 - INFO - __main__ - Step 24660: {'lr': 0.00019987273232620174, 'samples': 789120, 'steps': 1541, 'loss/train': 3.68725323677063} -09/20/2021 19:49:40 - INFO - __main__ - Step 24661: {'lr': 0.00019987273232620174, 'samples': 789152, 'steps': 1541, 'loss/train': 3.0447304248809814} -09/20/2021 19:49:41 - INFO - __main__ - Step 24662: {'lr': 0.00019987273232620174, 'samples': 789184, 'steps': 1541, 'loss/train': 3.06535005569458} -09/20/2021 19:49:42 - INFO - __main__ - Step 24663: {'lr': 0.00019987273232620174, 'samples': 789216, 'steps': 1541, 'loss/train': 2.8280625343322754} -09/20/2021 19:49:42 - INFO - __main__ - Step 24664: {'lr': 0.00019987273232620174, 'samples': 789248, 'steps': 1541, 'loss/train': 4.021754264831543} -09/20/2021 19:49:43 - INFO - __main__ - Step 24665: {'lr': 0.00019987273232620174, 'samples': 789280, 'steps': 1541, 'loss/train': 3.378345012664795} -09/20/2021 19:49:44 - INFO - __main__ - Step 24666: {'lr': 0.00019987273232620174, 'samples': 789312, 'steps': 1541, 'loss/train': 3.011723279953003} -09/20/2021 19:49:45 - INFO - __main__ - Step 24667: {'lr': 0.00019987273232620174, 'samples': 789344, 'steps': 1541, 'loss/train': 3.5543811321258545} -09/20/2021 19:49:45 - INFO - __main__ - Step 24668: {'lr': 0.00019987273232620174, 'samples': 789376, 'steps': 1541, 'loss/train': 3.8016538619995117} -09/20/2021 19:49:46 - INFO - __main__ - Step 24669: {'lr': 0.00019987273232620174, 'samples': 789408, 'steps': 1541, 'loss/train': 3.023223638534546} -09/20/2021 19:49:47 - INFO - __main__ - Step 24670: {'lr': 0.00019987273232620174, 'samples': 789440, 'steps': 1541, 'loss/train': 2.629617691040039} -09/20/2021 19:49:48 - INFO - __main__ - Step 24671: {'lr': 0.00019987273232620174, 'samples': 789472, 'steps': 1541, 'loss/train': 2.327065944671631} -09/20/2021 19:49:48 - INFO - __main__ - Step 24672: {'lr': 0.00019987273232620174, 'samples': 789504, 'steps': 1541, 'loss/train': 3.763683795928955} -09/20/2021 19:49:49 - INFO - __main__ - Step 24673: {'lr': 0.00019987241040196981, 'samples': 789536, 'steps': 1542, 'loss/train': 3.1514079570770264} -09/20/2021 19:49:50 - INFO - __main__ - Step 24674: {'lr': 0.00019987241040196981, 'samples': 789568, 'steps': 1542, 'loss/train': 3.452549457550049} -09/20/2021 19:49:51 - INFO - __main__ - Step 24675: {'lr': 0.00019987241040196981, 'samples': 789600, 'steps': 1542, 'loss/train': 3.749913215637207} -09/20/2021 19:49:52 - INFO - __main__ - Step 24676: {'lr': 0.00019987241040196981, 'samples': 789632, 'steps': 1542, 'loss/train': 2.551368474960327} -09/20/2021 19:49:52 - INFO - __main__ - Step 24677: {'lr': 0.00019987241040196981, 'samples': 789664, 'steps': 1542, 'loss/train': 3.042663812637329} -09/20/2021 19:49:53 - INFO - __main__ - Step 24678: {'lr': 0.00019987241040196981, 'samples': 789696, 'steps': 1542, 'loss/train': 0.3170972466468811} -09/20/2021 19:49:54 - INFO - __main__ - Step 24679: {'lr': 0.00019987241040196981, 'samples': 789728, 'steps': 1542, 'loss/train': 2.422394275665283} -09/20/2021 19:49:55 - INFO - __main__ - Step 24680: {'lr': 0.00019987241040196981, 'samples': 789760, 'steps': 1542, 'loss/train': 3.0105245113372803} -09/20/2021 19:49:55 - INFO - __main__ - Step 24681: {'lr': 0.00019987241040196981, 'samples': 789792, 'steps': 1542, 'loss/train': 2.984570264816284} -09/20/2021 19:49:56 - INFO - __main__ - Step 24682: {'lr': 0.00019987241040196981, 'samples': 789824, 'steps': 1542, 'loss/train': 3.020806074142456} -09/20/2021 19:49:57 - INFO - __main__ - Step 24683: {'lr': 0.00019987241040196981, 'samples': 789856, 'steps': 1542, 'loss/train': 2.550954818725586} -09/20/2021 19:49:58 - INFO - __main__ - Step 24684: {'lr': 0.00019987241040196981, 'samples': 789888, 'steps': 1542, 'loss/train': 4.737925052642822} -09/20/2021 19:49:58 - INFO - __main__ - Step 24685: {'lr': 0.00019987241040196981, 'samples': 789920, 'steps': 1542, 'loss/train': 3.3663156032562256} -09/20/2021 19:49:59 - INFO - __main__ - Step 24686: {'lr': 0.00019987241040196981, 'samples': 789952, 'steps': 1542, 'loss/train': 2.5760927200317383} -09/20/2021 19:50:00 - INFO - __main__ - Step 24687: {'lr': 0.00019987241040196981, 'samples': 789984, 'steps': 1542, 'loss/train': 3.29763126373291} -09/20/2021 19:50:01 - INFO - __main__ - Step 24688: {'lr': 0.00019987241040196981, 'samples': 790016, 'steps': 1542, 'loss/train': 0.7690128684043884} -09/20/2021 19:50:02 - INFO - __main__ - Step 24689: {'lr': 0.00019987208807135742, 'samples': 790048, 'steps': 1543, 'loss/train': 3.055584192276001} -09/20/2021 19:50:03 - INFO - __main__ - Step 24690: {'lr': 0.00019987208807135742, 'samples': 790080, 'steps': 1543, 'loss/train': 2.572906970977783} -09/20/2021 19:50:04 - INFO - __main__ - Step 24691: {'lr': 0.00019987208807135742, 'samples': 790112, 'steps': 1543, 'loss/train': 3.3953192234039307} -09/20/2021 19:50:04 - INFO - __main__ - Step 24692: {'lr': 0.00019987208807135742, 'samples': 790144, 'steps': 1543, 'loss/train': 2.32502818107605} -09/20/2021 19:50:05 - INFO - __main__ - Step 24693: {'lr': 0.00019987208807135742, 'samples': 790176, 'steps': 1543, 'loss/train': 2.582707643508911} -09/20/2021 19:50:06 - INFO - __main__ - Step 24694: {'lr': 0.00019987208807135742, 'samples': 790208, 'steps': 1543, 'loss/train': 2.5807623863220215} -09/20/2021 19:50:07 - INFO - __main__ - Step 24695: {'lr': 0.00019987208807135742, 'samples': 790240, 'steps': 1543, 'loss/train': 2.975684642791748} -09/20/2021 19:50:07 - INFO - __main__ - Step 24696: {'lr': 0.00019987208807135742, 'samples': 790272, 'steps': 1543, 'loss/train': 3.2257189750671387} -09/20/2021 19:50:08 - INFO - __main__ - Step 24697: {'lr': 0.00019987208807135742, 'samples': 790304, 'steps': 1543, 'loss/train': 2.353743553161621} -09/20/2021 19:50:09 - INFO - __main__ - Step 24698: {'lr': 0.00019987208807135742, 'samples': 790336, 'steps': 1543, 'loss/train': 3.1647591590881348} -09/20/2021 19:50:10 - INFO - __main__ - Step 24699: {'lr': 0.00019987208807135742, 'samples': 790368, 'steps': 1543, 'loss/train': 3.5159473419189453} -09/20/2021 19:50:10 - INFO - __main__ - Step 24700: {'lr': 0.00019987208807135742, 'samples': 790400, 'steps': 1543, 'loss/train': 2.7879979610443115} -09/20/2021 19:50:11 - INFO - __main__ - Step 24701: {'lr': 0.00019987208807135742, 'samples': 790432, 'steps': 1543, 'loss/train': 2.2747652530670166} -09/20/2021 19:50:12 - INFO - __main__ - Step 24702: {'lr': 0.00019987208807135742, 'samples': 790464, 'steps': 1543, 'loss/train': 2.7164413928985596} -09/20/2021 19:50:13 - INFO - __main__ - Step 24703: {'lr': 0.00019987208807135742, 'samples': 790496, 'steps': 1543, 'loss/train': 2.343090772628784} -09/20/2021 19:50:13 - INFO - __main__ - Step 24704: {'lr': 0.00019987208807135742, 'samples': 790528, 'steps': 1543, 'loss/train': 2.5711910724639893} -09/20/2021 19:50:14 - INFO - __main__ - Step 24705: {'lr': 0.00019987176533436588, 'samples': 790560, 'steps': 1544, 'loss/train': 2.3069307804107666} -09/20/2021 19:50:15 - INFO - __main__ - Step 24706: {'lr': 0.00019987176533436588, 'samples': 790592, 'steps': 1544, 'loss/train': 3.276197910308838} -09/20/2021 19:50:16 - INFO - __main__ - Step 24707: {'lr': 0.00019987176533436588, 'samples': 790624, 'steps': 1544, 'loss/train': 2.5822701454162598} -09/20/2021 19:50:16 - INFO - __main__ - Step 24708: {'lr': 0.00019987176533436588, 'samples': 790656, 'steps': 1544, 'loss/train': 1.7874352931976318} -09/20/2021 19:50:17 - INFO - __main__ - Step 24709: {'lr': 0.00019987176533436588, 'samples': 790688, 'steps': 1544, 'loss/train': 2.589458465576172} -09/20/2021 19:50:18 - INFO - __main__ - Step 24710: {'lr': 0.00019987176533436588, 'samples': 790720, 'steps': 1544, 'loss/train': 2.348280191421509} -09/20/2021 19:50:19 - INFO - __main__ - Step 24711: {'lr': 0.00019987176533436588, 'samples': 790752, 'steps': 1544, 'loss/train': 3.42136549949646} -09/20/2021 19:50:19 - INFO - __main__ - Step 24712: {'lr': 0.00019987176533436588, 'samples': 790784, 'steps': 1544, 'loss/train': 2.476630210876465} -09/20/2021 19:50:20 - INFO - __main__ - Step 24713: {'lr': 0.00019987176533436588, 'samples': 790816, 'steps': 1544, 'loss/train': 2.6333656311035156} -09/20/2021 19:50:21 - INFO - __main__ - Step 24714: {'lr': 0.00019987176533436588, 'samples': 790848, 'steps': 1544, 'loss/train': 3.2469842433929443} -09/20/2021 19:50:22 - INFO - __main__ - Step 24715: {'lr': 0.00019987176533436588, 'samples': 790880, 'steps': 1544, 'loss/train': 1.7740486860275269} -09/20/2021 19:50:22 - INFO - __main__ - Step 24716: {'lr': 0.00019987176533436588, 'samples': 790912, 'steps': 1544, 'loss/train': 2.550797462463379} -09/20/2021 19:50:23 - INFO - __main__ - Step 24717: {'lr': 0.00019987176533436588, 'samples': 790944, 'steps': 1544, 'loss/train': 2.408965826034546} -09/20/2021 19:50:25 - INFO - __main__ - Step 24718: {'lr': 0.00019987176533436588, 'samples': 790976, 'steps': 1544, 'loss/train': 2.6568875312805176} -09/20/2021 19:50:25 - INFO - __main__ - Step 24719: {'lr': 0.00019987176533436588, 'samples': 791008, 'steps': 1544, 'loss/train': 2.570537567138672} -09/20/2021 19:50:26 - INFO - __main__ - Step 24720: {'lr': 0.00019987176533436588, 'samples': 791040, 'steps': 1544, 'loss/train': 3.159036159515381} -09/20/2021 19:50:27 - INFO - __main__ - Step 24721: {'lr': 0.00019987144219099656, 'samples': 791072, 'steps': 1545, 'loss/train': 3.5731146335601807} -09/20/2021 19:50:28 - INFO - __main__ - Step 24722: {'lr': 0.00019987144219099656, 'samples': 791104, 'steps': 1545, 'loss/train': 2.158494710922241} -09/20/2021 19:50:28 - INFO - __main__ - Step 24723: {'lr': 0.00019987144219099656, 'samples': 791136, 'steps': 1545, 'loss/train': 2.2827155590057373} -09/20/2021 19:50:29 - INFO - __main__ - Step 24724: {'lr': 0.00019987144219099656, 'samples': 791168, 'steps': 1545, 'loss/train': 2.8340163230895996} -09/20/2021 19:50:30 - INFO - __main__ - Step 24725: {'lr': 0.00019987144219099656, 'samples': 791200, 'steps': 1545, 'loss/train': 2.8378775119781494} -09/20/2021 19:50:31 - INFO - __main__ - Step 24726: {'lr': 0.00019987144219099656, 'samples': 791232, 'steps': 1545, 'loss/train': 2.757408380508423} -09/20/2021 19:50:31 - INFO - __main__ - Step 24727: {'lr': 0.00019987144219099656, 'samples': 791264, 'steps': 1545, 'loss/train': 2.7763121128082275} -09/20/2021 19:50:32 - INFO - __main__ - Step 24728: {'lr': 0.00019987144219099656, 'samples': 791296, 'steps': 1545, 'loss/train': 2.892408609390259} -09/20/2021 19:50:33 - INFO - __main__ - Step 24729: {'lr': 0.00019987144219099656, 'samples': 791328, 'steps': 1545, 'loss/train': 3.160588026046753} -09/20/2021 19:50:34 - INFO - __main__ - Step 24730: {'lr': 0.00019987144219099656, 'samples': 791360, 'steps': 1545, 'loss/train': 2.8383285999298096} -09/20/2021 19:50:34 - INFO - __main__ - Step 24731: {'lr': 0.00019987144219099656, 'samples': 791392, 'steps': 1545, 'loss/train': 2.52488374710083} -09/20/2021 19:50:35 - INFO - __main__ - Step 24732: {'lr': 0.00019987144219099656, 'samples': 791424, 'steps': 1545, 'loss/train': 2.731100082397461} -09/20/2021 19:50:36 - INFO - __main__ - Step 24733: {'lr': 0.00019987144219099656, 'samples': 791456, 'steps': 1545, 'loss/train': 0.4673670530319214} -09/20/2021 19:50:37 - INFO - __main__ - Step 24734: {'lr': 0.00019987144219099656, 'samples': 791488, 'steps': 1545, 'loss/train': 3.670072555541992} -09/20/2021 19:50:37 - INFO - __main__ - Step 24735: {'lr': 0.00019987144219099656, 'samples': 791520, 'steps': 1545, 'loss/train': 2.550572156906128} -09/20/2021 19:50:38 - INFO - __main__ - Step 24736: {'lr': 0.00019987144219099656, 'samples': 791552, 'steps': 1545, 'loss/train': 1.7481991052627563} -09/20/2021 19:50:39 - INFO - __main__ - Step 24737: {'lr': 0.0001998711186412507, 'samples': 791584, 'steps': 1546, 'loss/train': 2.8329672813415527} -09/20/2021 19:50:40 - INFO - __main__ - Step 24738: {'lr': 0.0001998711186412507, 'samples': 791616, 'steps': 1546, 'loss/train': 2.2672338485717773} -09/20/2021 19:50:41 - INFO - __main__ - Step 24739: {'lr': 0.0001998711186412507, 'samples': 791648, 'steps': 1546, 'loss/train': 0.8796278238296509} -09/20/2021 19:50:41 - INFO - __main__ - Step 24740: {'lr': 0.0001998711186412507, 'samples': 791680, 'steps': 1546, 'loss/train': 3.158966541290283} -09/20/2021 19:50:42 - INFO - __main__ - Step 24741: {'lr': 0.0001998711186412507, 'samples': 791712, 'steps': 1546, 'loss/train': 2.9911389350891113} -09/20/2021 19:50:43 - INFO - __main__ - Step 24742: {'lr': 0.0001998711186412507, 'samples': 791744, 'steps': 1546, 'loss/train': 3.0140058994293213} -09/20/2021 19:50:44 - INFO - __main__ - Step 24743: {'lr': 0.0001998711186412507, 'samples': 791776, 'steps': 1546, 'loss/train': 2.4766898155212402} -09/20/2021 19:50:44 - INFO - __main__ - Step 24744: {'lr': 0.0001998711186412507, 'samples': 791808, 'steps': 1546, 'loss/train': 3.8437135219573975} -09/20/2021 19:50:45 - INFO - __main__ - Step 24745: {'lr': 0.0001998711186412507, 'samples': 791840, 'steps': 1546, 'loss/train': 2.5792768001556396} -09/20/2021 19:50:46 - INFO - __main__ - Step 24746: {'lr': 0.0001998711186412507, 'samples': 791872, 'steps': 1546, 'loss/train': 2.7222933769226074} -09/20/2021 19:50:47 - INFO - __main__ - Step 24747: {'lr': 0.0001998711186412507, 'samples': 791904, 'steps': 1546, 'loss/train': 3.048105478286743} -09/20/2021 19:50:47 - INFO - __main__ - Step 24748: {'lr': 0.0001998711186412507, 'samples': 791936, 'steps': 1546, 'loss/train': 0.6592181921005249} -09/20/2021 19:50:48 - INFO - __main__ - Step 24749: {'lr': 0.0001998711186412507, 'samples': 791968, 'steps': 1546, 'loss/train': 0.4432224929332733} -09/20/2021 19:50:49 - INFO - __main__ - Step 24750: {'lr': 0.0001998711186412507, 'samples': 792000, 'steps': 1546, 'loss/train': 1.0910370349884033} -09/20/2021 19:50:50 - INFO - __main__ - Step 24751: {'lr': 0.0001998711186412507, 'samples': 792032, 'steps': 1546, 'loss/train': 1.6977720260620117} -09/20/2021 19:50:51 - INFO - __main__ - Step 24752: {'lr': 0.0001998711186412507, 'samples': 792064, 'steps': 1546, 'loss/train': 2.4946672916412354} -09/20/2021 19:50:52 - INFO - __main__ - Step 24753: {'lr': 0.00019987079468512965, 'samples': 792096, 'steps': 1547, 'loss/train': 2.523106575012207} -09/20/2021 19:50:52 - INFO - __main__ - Step 24754: {'lr': 0.00019987079468512965, 'samples': 792128, 'steps': 1547, 'loss/train': 2.40990948677063} -09/20/2021 19:50:53 - INFO - __main__ - Step 24755: {'lr': 0.00019987079468512965, 'samples': 792160, 'steps': 1547, 'loss/train': 2.2082645893096924} -09/20/2021 19:50:54 - INFO - __main__ - Step 24756: {'lr': 0.00019987079468512965, 'samples': 792192, 'steps': 1547, 'loss/train': 3.1573076248168945} -09/20/2021 19:50:55 - INFO - __main__ - Step 24757: {'lr': 0.00019987079468512965, 'samples': 792224, 'steps': 1547, 'loss/train': 2.268831491470337} -09/20/2021 19:50:55 - INFO - __main__ - Step 24758: {'lr': 0.00019987079468512965, 'samples': 792256, 'steps': 1547, 'loss/train': 2.2745862007141113} -09/20/2021 19:50:56 - INFO - __main__ - Step 24759: {'lr': 0.00019987079468512965, 'samples': 792288, 'steps': 1547, 'loss/train': 1.8534034490585327} -09/20/2021 19:50:57 - INFO - __main__ - Step 24760: {'lr': 0.00019987079468512965, 'samples': 792320, 'steps': 1547, 'loss/train': 3.2228903770446777} -09/20/2021 19:50:58 - INFO - __main__ - Step 24761: {'lr': 0.00019987079468512965, 'samples': 792352, 'steps': 1547, 'loss/train': 2.945071220397949} -09/20/2021 19:50:58 - INFO - __main__ - Step 24762: {'lr': 0.00019987079468512965, 'samples': 792384, 'steps': 1547, 'loss/train': 2.554708957672119} -09/20/2021 19:50:59 - INFO - __main__ - Step 24763: {'lr': 0.00019987079468512965, 'samples': 792416, 'steps': 1547, 'loss/train': 2.2563412189483643} -09/20/2021 19:51:00 - INFO - __main__ - Step 24764: {'lr': 0.00019987079468512965, 'samples': 792448, 'steps': 1547, 'loss/train': 2.512847900390625} -09/20/2021 19:51:01 - INFO - __main__ - Step 24765: {'lr': 0.00019987079468512965, 'samples': 792480, 'steps': 1547, 'loss/train': 2.780672311782837} -09/20/2021 19:51:01 - INFO - __main__ - Step 24766: {'lr': 0.00019987079468512965, 'samples': 792512, 'steps': 1547, 'loss/train': 3.663173198699951} -09/20/2021 19:51:02 - INFO - __main__ - Step 24767: {'lr': 0.00019987079468512965, 'samples': 792544, 'steps': 1547, 'loss/train': 1.5197068452835083} -09/20/2021 19:51:03 - INFO - __main__ - Step 24768: {'lr': 0.00019987079468512965, 'samples': 792576, 'steps': 1547, 'loss/train': 2.7134456634521484} -09/20/2021 19:51:04 - INFO - __main__ - Step 24769: {'lr': 0.0001998704703226347, 'samples': 792608, 'steps': 1548, 'loss/train': 2.2197225093841553} -09/20/2021 19:51:05 - INFO - __main__ - Step 24770: {'lr': 0.0001998704703226347, 'samples': 792640, 'steps': 1548, 'loss/train': 2.3100357055664062} -09/20/2021 19:51:05 - INFO - __main__ - Step 24771: {'lr': 0.0001998704703226347, 'samples': 792672, 'steps': 1548, 'loss/train': 2.004179000854492} -09/20/2021 19:51:06 - INFO - __main__ - Step 24772: {'lr': 0.0001998704703226347, 'samples': 792704, 'steps': 1548, 'loss/train': 3.3574960231781006} -09/20/2021 19:51:07 - INFO - __main__ - Step 24773: {'lr': 0.0001998704703226347, 'samples': 792736, 'steps': 1548, 'loss/train': 2.775434732437134} -09/20/2021 19:51:08 - INFO - __main__ - Step 24774: {'lr': 0.0001998704703226347, 'samples': 792768, 'steps': 1548, 'loss/train': 3.6307284832000732} -09/20/2021 19:51:08 - INFO - __main__ - Step 24775: {'lr': 0.0001998704703226347, 'samples': 792800, 'steps': 1548, 'loss/train': 2.876615524291992} -09/20/2021 19:51:09 - INFO - __main__ - Step 24776: {'lr': 0.0001998704703226347, 'samples': 792832, 'steps': 1548, 'loss/train': 2.9772145748138428} -09/20/2021 19:51:10 - INFO - __main__ - Step 24777: {'lr': 0.0001998704703226347, 'samples': 792864, 'steps': 1548, 'loss/train': 3.8218517303466797} -09/20/2021 19:51:11 - INFO - __main__ - Step 24778: {'lr': 0.0001998704703226347, 'samples': 792896, 'steps': 1548, 'loss/train': 2.7242507934570312} -09/20/2021 19:51:11 - INFO - __main__ - Step 24779: {'lr': 0.0001998704703226347, 'samples': 792928, 'steps': 1548, 'loss/train': 2.803898572921753} -09/20/2021 19:51:12 - INFO - __main__ - Step 24780: {'lr': 0.0001998704703226347, 'samples': 792960, 'steps': 1548, 'loss/train': 1.316545844078064} -09/20/2021 19:51:13 - INFO - __main__ - Step 24781: {'lr': 0.0001998704703226347, 'samples': 792992, 'steps': 1548, 'loss/train': 2.567784070968628} -09/20/2021 19:51:14 - INFO - __main__ - Step 24782: {'lr': 0.0001998704703226347, 'samples': 793024, 'steps': 1548, 'loss/train': 3.5292561054229736} -09/20/2021 19:51:15 - INFO - __main__ - Step 24783: {'lr': 0.0001998704703226347, 'samples': 793056, 'steps': 1548, 'loss/train': 3.7021875381469727} -09/20/2021 19:51:16 - INFO - __main__ - Step 24784: {'lr': 0.0001998704703226347, 'samples': 793088, 'steps': 1548, 'loss/train': 2.1102523803710938} -09/20/2021 19:51:16 - INFO - __main__ - Step 24785: {'lr': 0.00019987014555376722, 'samples': 793120, 'steps': 1549, 'loss/train': 3.3212242126464844} -09/20/2021 19:51:17 - INFO - __main__ - Step 24786: {'lr': 0.00019987014555376722, 'samples': 793152, 'steps': 1549, 'loss/train': 2.486816167831421} -09/20/2021 19:51:18 - INFO - __main__ - Step 24787: {'lr': 0.00019987014555376722, 'samples': 793184, 'steps': 1549, 'loss/train': 2.9226646423339844} -09/20/2021 19:51:19 - INFO - __main__ - Step 24788: {'lr': 0.00019987014555376722, 'samples': 793216, 'steps': 1549, 'loss/train': 2.9213547706604004} -09/20/2021 19:51:19 - INFO - __main__ - Step 24789: {'lr': 0.00019987014555376722, 'samples': 793248, 'steps': 1549, 'loss/train': 3.17159366607666} -09/20/2021 19:51:20 - INFO - __main__ - Step 24790: {'lr': 0.00019987014555376722, 'samples': 793280, 'steps': 1549, 'loss/train': 3.3189737796783447} -09/20/2021 19:51:21 - INFO - __main__ - Step 24791: {'lr': 0.00019987014555376722, 'samples': 793312, 'steps': 1549, 'loss/train': 2.4898571968078613} -09/20/2021 19:51:22 - INFO - __main__ - Step 24792: {'lr': 0.00019987014555376722, 'samples': 793344, 'steps': 1549, 'loss/train': 3.1591169834136963} -09/20/2021 19:51:22 - INFO - __main__ - Step 24793: {'lr': 0.00019987014555376722, 'samples': 793376, 'steps': 1549, 'loss/train': 2.899310827255249} -09/20/2021 19:51:23 - INFO - __main__ - Step 24794: {'lr': 0.00019987014555376722, 'samples': 793408, 'steps': 1549, 'loss/train': 2.9050192832946777} -09/20/2021 19:51:24 - INFO - __main__ - Step 24795: {'lr': 0.00019987014555376722, 'samples': 793440, 'steps': 1549, 'loss/train': 3.03010630607605} -09/20/2021 19:51:25 - INFO - __main__ - Step 24796: {'lr': 0.00019987014555376722, 'samples': 793472, 'steps': 1549, 'loss/train': 3.1619389057159424} -09/20/2021 19:51:25 - INFO - __main__ - Step 24797: {'lr': 0.00019987014555376722, 'samples': 793504, 'steps': 1549, 'loss/train': 3.8876967430114746} -09/20/2021 19:51:26 - INFO - __main__ - Step 24798: {'lr': 0.00019987014555376722, 'samples': 793536, 'steps': 1549, 'loss/train': 3.6175894737243652} -09/20/2021 19:51:27 - INFO - __main__ - Step 24799: {'lr': 0.00019987014555376722, 'samples': 793568, 'steps': 1549, 'loss/train': 3.4678475856781006} -09/20/2021 19:51:28 - INFO - __main__ - Step 24800: {'lr': 0.00019987014555376722, 'samples': 793600, 'steps': 1549, 'loss/train': 3.262575626373291} -09/20/2021 19:51:29 - INFO - __main__ - Step 24801: {'lr': 0.00019986982037852852, 'samples': 793632, 'steps': 1550, 'loss/train': 2.342803716659546} -09/20/2021 19:51:29 - INFO - __main__ - Step 24802: {'lr': 0.00019986982037852852, 'samples': 793664, 'steps': 1550, 'loss/train': 3.200880527496338} -09/20/2021 19:51:30 - INFO - __main__ - Step 24803: {'lr': 0.00019986982037852852, 'samples': 793696, 'steps': 1550, 'loss/train': 2.696502923965454} -09/20/2021 19:51:31 - INFO - __main__ - Step 24804: {'lr': 0.00019986982037852852, 'samples': 793728, 'steps': 1550, 'loss/train': 3.455888032913208} -09/20/2021 19:51:32 - INFO - __main__ - Step 24805: {'lr': 0.00019986982037852852, 'samples': 793760, 'steps': 1550, 'loss/train': 3.511014938354492} -09/20/2021 19:51:32 - INFO - __main__ - Step 24806: {'lr': 0.00019986982037852852, 'samples': 793792, 'steps': 1550, 'loss/train': 2.251105308532715} -09/20/2021 19:51:33 - INFO - __main__ - Step 24807: {'lr': 0.00019986982037852852, 'samples': 793824, 'steps': 1550, 'loss/train': 2.27901029586792} -09/20/2021 19:51:34 - INFO - __main__ - Step 24808: {'lr': 0.00019986982037852852, 'samples': 793856, 'steps': 1550, 'loss/train': 2.7700917720794678} -09/20/2021 19:51:35 - INFO - __main__ - Step 24809: {'lr': 0.00019986982037852852, 'samples': 793888, 'steps': 1550, 'loss/train': 2.165994167327881} -09/20/2021 19:51:35 - INFO - __main__ - Step 24810: {'lr': 0.00019986982037852852, 'samples': 793920, 'steps': 1550, 'loss/train': 2.3069329261779785} -09/20/2021 19:51:36 - INFO - __main__ - Step 24811: {'lr': 0.00019986982037852852, 'samples': 793952, 'steps': 1550, 'loss/train': 3.6605091094970703} -09/20/2021 19:51:37 - INFO - __main__ - Step 24812: {'lr': 0.00019986982037852852, 'samples': 793984, 'steps': 1550, 'loss/train': 2.7582387924194336} -09/20/2021 19:51:38 - INFO - __main__ - Step 24813: {'lr': 0.00019986982037852852, 'samples': 794016, 'steps': 1550, 'loss/train': 2.3960394859313965} -09/20/2021 19:51:39 - INFO - __main__ - Step 24814: {'lr': 0.00019986982037852852, 'samples': 794048, 'steps': 1550, 'loss/train': 2.9734396934509277} -09/20/2021 19:51:40 - INFO - __main__ - Step 24815: {'lr': 0.00019986982037852852, 'samples': 794080, 'steps': 1550, 'loss/train': 3.0522520542144775} -09/20/2021 19:51:40 - INFO - __main__ - Step 24816: {'lr': 0.00019986982037852852, 'samples': 794112, 'steps': 1550, 'loss/train': 2.8205325603485107} -09/20/2021 19:51:41 - INFO - __main__ - Step 24817: {'lr': 0.0001998694947969199, 'samples': 794144, 'steps': 1551, 'loss/train': 2.8901867866516113} -09/20/2021 19:51:42 - INFO - __main__ - Step 24818: {'lr': 0.0001998694947969199, 'samples': 794176, 'steps': 1551, 'loss/train': 3.7177631855010986} -09/20/2021 19:51:43 - INFO - __main__ - Step 24819: {'lr': 0.0001998694947969199, 'samples': 794208, 'steps': 1551, 'loss/train': 3.0751852989196777} -09/20/2021 19:51:44 - INFO - __main__ - Step 24820: {'lr': 0.0001998694947969199, 'samples': 794240, 'steps': 1551, 'loss/train': 2.6044704914093018} -09/20/2021 19:51:44 - INFO - __main__ - Step 24821: {'lr': 0.0001998694947969199, 'samples': 794272, 'steps': 1551, 'loss/train': 3.111891508102417} -09/20/2021 19:51:45 - INFO - __main__ - Step 24822: {'lr': 0.0001998694947969199, 'samples': 794304, 'steps': 1551, 'loss/train': 2.1158082485198975} -09/20/2021 19:51:46 - INFO - __main__ - Step 24823: {'lr': 0.0001998694947969199, 'samples': 794336, 'steps': 1551, 'loss/train': 1.9099655151367188} -09/20/2021 19:51:47 - INFO - __main__ - Step 24824: {'lr': 0.0001998694947969199, 'samples': 794368, 'steps': 1551, 'loss/train': 2.6705639362335205} -09/20/2021 19:51:47 - INFO - __main__ - Step 24825: {'lr': 0.0001998694947969199, 'samples': 794400, 'steps': 1551, 'loss/train': 2.859287738800049} -09/20/2021 19:51:48 - INFO - __main__ - Step 24826: {'lr': 0.0001998694947969199, 'samples': 794432, 'steps': 1551, 'loss/train': 2.276158332824707} -09/20/2021 19:51:49 - INFO - __main__ - Step 24827: {'lr': 0.0001998694947969199, 'samples': 794464, 'steps': 1551, 'loss/train': 3.8219308853149414} -09/20/2021 19:51:50 - INFO - __main__ - Step 24828: {'lr': 0.0001998694947969199, 'samples': 794496, 'steps': 1551, 'loss/train': 2.834106683731079} -09/20/2021 19:51:50 - INFO - __main__ - Step 24829: {'lr': 0.0001998694947969199, 'samples': 794528, 'steps': 1551, 'loss/train': 2.8975393772125244} -09/20/2021 19:51:51 - INFO - __main__ - Step 24830: {'lr': 0.0001998694947969199, 'samples': 794560, 'steps': 1551, 'loss/train': 3.2405073642730713} -09/20/2021 19:51:52 - INFO - __main__ - Step 24831: {'lr': 0.0001998694947969199, 'samples': 794592, 'steps': 1551, 'loss/train': 2.168492555618286} -09/20/2021 19:51:53 - INFO - __main__ - Step 24832: {'lr': 0.0001998694947969199, 'samples': 794624, 'steps': 1551, 'loss/train': 2.5889039039611816} -09/20/2021 19:51:53 - INFO - __main__ - Step 24833: {'lr': 0.00019986916880894266, 'samples': 794656, 'steps': 1552, 'loss/train': 2.661485195159912} -09/20/2021 19:51:54 - INFO - __main__ - Step 24834: {'lr': 0.00019986916880894266, 'samples': 794688, 'steps': 1552, 'loss/train': 2.459538221359253} -09/20/2021 19:51:55 - INFO - __main__ - Step 24835: {'lr': 0.00019986916880894266, 'samples': 794720, 'steps': 1552, 'loss/train': 2.183805227279663} -09/20/2021 19:51:56 - INFO - __main__ - Step 24836: {'lr': 0.00019986916880894266, 'samples': 794752, 'steps': 1552, 'loss/train': 2.6303930282592773} -09/20/2021 19:51:56 - INFO - __main__ - Step 24837: {'lr': 0.00019986916880894266, 'samples': 794784, 'steps': 1552, 'loss/train': 2.3659234046936035} -09/20/2021 19:51:57 - INFO - __main__ - Step 24838: {'lr': 0.00019986916880894266, 'samples': 794816, 'steps': 1552, 'loss/train': 3.1603810787200928} -09/20/2021 19:51:58 - INFO - __main__ - Step 24839: {'lr': 0.00019986916880894266, 'samples': 794848, 'steps': 1552, 'loss/train': 2.4671099185943604} -09/20/2021 19:51:59 - INFO - __main__ - Step 24840: {'lr': 0.00019986916880894266, 'samples': 794880, 'steps': 1552, 'loss/train': 2.9333202838897705} -09/20/2021 19:51:59 - INFO - __main__ - Step 24841: {'lr': 0.00019986916880894266, 'samples': 794912, 'steps': 1552, 'loss/train': 2.1246376037597656} -09/20/2021 19:52:00 - INFO - __main__ - Step 24842: {'lr': 0.00019986916880894266, 'samples': 794944, 'steps': 1552, 'loss/train': 3.111927032470703} -09/20/2021 19:52:02 - INFO - __main__ - Step 24843: {'lr': 0.00019986916880894266, 'samples': 794976, 'steps': 1552, 'loss/train': 2.006382703781128} -09/20/2021 19:52:03 - INFO - __main__ - Step 24844: {'lr': 0.00019986916880894266, 'samples': 795008, 'steps': 1552, 'loss/train': 2.4887351989746094} -09/20/2021 19:52:03 - INFO - __main__ - Step 24845: {'lr': 0.00019986916880894266, 'samples': 795040, 'steps': 1552, 'loss/train': 2.573436737060547} -09/20/2021 19:52:04 - INFO - __main__ - Step 24846: {'lr': 0.00019986916880894266, 'samples': 795072, 'steps': 1552, 'loss/train': 2.8183798789978027} -09/20/2021 19:52:05 - INFO - __main__ - Step 24847: {'lr': 0.00019986916880894266, 'samples': 795104, 'steps': 1552, 'loss/train': 2.8843724727630615} -09/20/2021 19:52:06 - INFO - __main__ - Step 24848: {'lr': 0.00019986916880894266, 'samples': 795136, 'steps': 1552, 'loss/train': 2.5676538944244385} -09/20/2021 19:52:06 - INFO - __main__ - Step 24849: {'lr': 0.00019986884241459817, 'samples': 795168, 'steps': 1553, 'loss/train': 3.103236675262451} -09/20/2021 19:52:07 - INFO - __main__ - Step 24850: {'lr': 0.00019986884241459817, 'samples': 795200, 'steps': 1553, 'loss/train': 2.8031725883483887} -09/20/2021 19:52:08 - INFO - __main__ - Step 24851: {'lr': 0.00019986884241459817, 'samples': 795232, 'steps': 1553, 'loss/train': 2.9830410480499268} -09/20/2021 19:52:09 - INFO - __main__ - Step 24852: {'lr': 0.00019986884241459817, 'samples': 795264, 'steps': 1553, 'loss/train': 2.6450324058532715} -09/20/2021 19:52:09 - INFO - __main__ - Step 24853: {'lr': 0.00019986884241459817, 'samples': 795296, 'steps': 1553, 'loss/train': 2.766998291015625} -09/20/2021 19:52:10 - INFO - __main__ - Step 24854: {'lr': 0.00019986884241459817, 'samples': 795328, 'steps': 1553, 'loss/train': 0.46979740262031555} -09/20/2021 19:52:11 - INFO - __main__ - Step 24855: {'lr': 0.00019986884241459817, 'samples': 795360, 'steps': 1553, 'loss/train': 3.191532611846924} -09/20/2021 19:52:12 - INFO - __main__ - Step 24856: {'lr': 0.00019986884241459817, 'samples': 795392, 'steps': 1553, 'loss/train': 2.5714659690856934} -09/20/2021 19:52:12 - INFO - __main__ - Step 24857: {'lr': 0.00019986884241459817, 'samples': 795424, 'steps': 1553, 'loss/train': 2.7374629974365234} -09/20/2021 19:52:13 - INFO - __main__ - Step 24858: {'lr': 0.00019986884241459817, 'samples': 795456, 'steps': 1553, 'loss/train': 3.5198814868927} -09/20/2021 19:52:14 - INFO - __main__ - Step 24859: {'lr': 0.00019986884241459817, 'samples': 795488, 'steps': 1553, 'loss/train': 3.0835843086242676} -09/20/2021 19:52:15 - INFO - __main__ - Step 24860: {'lr': 0.00019986884241459817, 'samples': 795520, 'steps': 1553, 'loss/train': 2.1855392456054688} -09/20/2021 19:52:15 - INFO - __main__ - Step 24861: {'lr': 0.00019986884241459817, 'samples': 795552, 'steps': 1553, 'loss/train': 2.4151697158813477} -09/20/2021 19:52:16 - INFO - __main__ - Step 24862: {'lr': 0.00019986884241459817, 'samples': 795584, 'steps': 1553, 'loss/train': 2.0553104877471924} -09/20/2021 19:52:17 - INFO - __main__ - Step 24863: {'lr': 0.00019986884241459817, 'samples': 795616, 'steps': 1553, 'loss/train': 2.0923261642456055} -09/20/2021 19:52:18 - INFO - __main__ - Step 24864: {'lr': 0.00019986884241459817, 'samples': 795648, 'steps': 1553, 'loss/train': 2.040832281112671} -09/20/2021 19:52:19 - INFO - __main__ - Step 24865: {'lr': 0.00019986851561388779, 'samples': 795680, 'steps': 1554, 'loss/train': 2.846498727798462} -09/20/2021 19:52:19 - INFO - __main__ - Step 24866: {'lr': 0.00019986851561388779, 'samples': 795712, 'steps': 1554, 'loss/train': 2.17531156539917} -09/20/2021 19:52:20 - INFO - __main__ - Step 24867: {'lr': 0.00019986851561388779, 'samples': 795744, 'steps': 1554, 'loss/train': 2.221378803253174} -09/20/2021 19:52:21 - INFO - __main__ - Step 24868: {'lr': 0.00019986851561388779, 'samples': 795776, 'steps': 1554, 'loss/train': 0.7158022522926331} -09/20/2021 19:52:22 - INFO - __main__ - Step 24869: {'lr': 0.00019986851561388779, 'samples': 795808, 'steps': 1554, 'loss/train': 2.8528876304626465} -09/20/2021 19:52:22 - INFO - __main__ - Step 24870: {'lr': 0.00019986851561388779, 'samples': 795840, 'steps': 1554, 'loss/train': 2.608159065246582} -09/20/2021 19:52:23 - INFO - __main__ - Step 24871: {'lr': 0.00019986851561388779, 'samples': 795872, 'steps': 1554, 'loss/train': 1.3439879417419434} -09/20/2021 19:52:24 - INFO - __main__ - Step 24872: {'lr': 0.00019986851561388779, 'samples': 795904, 'steps': 1554, 'loss/train': 1.2756919860839844} -09/20/2021 19:52:25 - INFO - __main__ - Step 24873: {'lr': 0.00019986851561388779, 'samples': 795936, 'steps': 1554, 'loss/train': 1.682685375213623} -09/20/2021 19:52:25 - INFO - __main__ - Step 24874: {'lr': 0.00019986851561388779, 'samples': 795968, 'steps': 1554, 'loss/train': 1.4298906326293945} -09/20/2021 19:52:26 - INFO - __main__ - Step 24875: {'lr': 0.00019986851561388779, 'samples': 796000, 'steps': 1554, 'loss/train': 1.3716888427734375} -09/20/2021 19:52:27 - INFO - __main__ - Step 24876: {'lr': 0.00019986851561388779, 'samples': 796032, 'steps': 1554, 'loss/train': 1.5752397775650024} -09/20/2021 19:52:28 - INFO - __main__ - Step 24877: {'lr': 0.00019986851561388779, 'samples': 796064, 'steps': 1554, 'loss/train': 1.4255083799362183} -09/20/2021 19:52:28 - INFO - __main__ - Step 24878: {'lr': 0.00019986851561388779, 'samples': 796096, 'steps': 1554, 'loss/train': 1.4744176864624023} -09/20/2021 19:52:31 - INFO - __main__ - Step 24879: {'lr': 0.00019986851561388779, 'samples': 796128, 'steps': 1554, 'loss/train': 1.6835604906082153} -09/20/2021 19:52:31 - INFO - __main__ - Step 24880: {'lr': 0.00019986851561388779, 'samples': 796160, 'steps': 1554, 'loss/train': 2.8457822799682617} -09/20/2021 19:52:32 - INFO - __main__ - Step 24881: {'lr': 0.00019986818840681277, 'samples': 796192, 'steps': 1555, 'loss/train': 2.545816421508789} -09/20/2021 19:52:33 - INFO - __main__ - Step 24882: {'lr': 0.00019986818840681277, 'samples': 796224, 'steps': 1555, 'loss/train': 2.4646811485290527} -09/20/2021 19:52:34 - INFO - __main__ - Step 24883: {'lr': 0.00019986818840681277, 'samples': 796256, 'steps': 1555, 'loss/train': 1.6064974069595337} -09/20/2021 19:52:35 - INFO - __main__ - Step 24884: {'lr': 0.00019986818840681277, 'samples': 796288, 'steps': 1555, 'loss/train': 2.5759503841400146} -09/20/2021 19:52:35 - INFO - __main__ - Step 24885: {'lr': 0.00019986818840681277, 'samples': 796320, 'steps': 1555, 'loss/train': 2.034031629562378} -09/20/2021 19:52:36 - INFO - __main__ - Step 24886: {'lr': 0.00019986818840681277, 'samples': 796352, 'steps': 1555, 'loss/train': 1.7385905981063843} -09/20/2021 19:52:37 - INFO - __main__ - Step 24887: {'lr': 0.00019986818840681277, 'samples': 796384, 'steps': 1555, 'loss/train': 1.824945092201233} -09/20/2021 19:52:38 - INFO - __main__ - Step 24888: {'lr': 0.00019986818840681277, 'samples': 796416, 'steps': 1555, 'loss/train': 1.9577248096466064} -09/20/2021 19:52:38 - INFO - __main__ - Step 24889: {'lr': 0.00019986818840681277, 'samples': 796448, 'steps': 1555, 'loss/train': 2.8754448890686035} -09/20/2021 19:52:39 - INFO - __main__ - Step 24890: {'lr': 0.00019986818840681277, 'samples': 796480, 'steps': 1555, 'loss/train': 2.1794662475585938} -09/20/2021 19:52:40 - INFO - __main__ - Step 24891: {'lr': 0.00019986818840681277, 'samples': 796512, 'steps': 1555, 'loss/train': 2.1316380500793457} -09/20/2021 19:52:41 - INFO - __main__ - Step 24892: {'lr': 0.00019986818840681277, 'samples': 796544, 'steps': 1555, 'loss/train': 2.2673416137695312} -09/20/2021 19:52:41 - INFO - __main__ - Step 24893: {'lr': 0.00019986818840681277, 'samples': 796576, 'steps': 1555, 'loss/train': 1.769824743270874} -09/20/2021 19:52:42 - INFO - __main__ - Step 24894: {'lr': 0.00019986818840681277, 'samples': 796608, 'steps': 1555, 'loss/train': 2.0735278129577637} -09/20/2021 19:52:43 - INFO - __main__ - Step 24895: {'lr': 0.00019986818840681277, 'samples': 796640, 'steps': 1555, 'loss/train': 2.7019402980804443} -09/20/2021 19:52:44 - INFO - __main__ - Step 24896: {'lr': 0.00019986818840681277, 'samples': 796672, 'steps': 1555, 'loss/train': 1.9504663944244385} -09/20/2021 19:52:44 - INFO - __main__ - Step 24897: {'lr': 0.00019986786079337446, 'samples': 796704, 'steps': 1556, 'loss/train': 3.068944215774536} -09/20/2021 19:52:45 - INFO - __main__ - Step 24898: {'lr': 0.00019986786079337446, 'samples': 796736, 'steps': 1556, 'loss/train': 2.990093469619751} -09/20/2021 19:52:46 - INFO - __main__ - Step 24899: {'lr': 0.00019986786079337446, 'samples': 796768, 'steps': 1556, 'loss/train': 3.2313218116760254} -09/20/2021 19:52:47 - INFO - __main__ - Step 24900: {'lr': 0.00019986786079337446, 'samples': 796800, 'steps': 1556, 'loss/train': 4.014441013336182} -09/20/2021 19:52:47 - INFO - __main__ - Step 24901: {'lr': 0.00019986786079337446, 'samples': 796832, 'steps': 1556, 'loss/train': 2.8830533027648926} -09/20/2021 19:52:48 - INFO - __main__ - Step 24902: {'lr': 0.00019986786079337446, 'samples': 796864, 'steps': 1556, 'loss/train': 2.7512753009796143} -09/20/2021 19:52:49 - INFO - __main__ - Step 24903: {'lr': 0.00019986786079337446, 'samples': 796896, 'steps': 1556, 'loss/train': 2.4465525150299072} -09/20/2021 19:52:50 - INFO - __main__ - Step 24904: {'lr': 0.00019986786079337446, 'samples': 796928, 'steps': 1556, 'loss/train': 3.6799795627593994} -09/20/2021 19:52:50 - INFO - __main__ - Step 24905: {'lr': 0.00019986786079337446, 'samples': 796960, 'steps': 1556, 'loss/train': 3.8377931118011475} -09/20/2021 19:52:51 - INFO - __main__ - Step 24906: {'lr': 0.00019986786079337446, 'samples': 796992, 'steps': 1556, 'loss/train': 2.3023619651794434} -09/20/2021 19:52:52 - INFO - __main__ - Step 24907: {'lr': 0.00019986786079337446, 'samples': 797024, 'steps': 1556, 'loss/train': 2.757908821105957} -09/20/2021 19:52:53 - INFO - __main__ - Step 24908: {'lr': 0.00019986786079337446, 'samples': 797056, 'steps': 1556, 'loss/train': 2.845973491668701} -09/20/2021 19:52:53 - INFO - __main__ - Step 24909: {'lr': 0.00019986786079337446, 'samples': 797088, 'steps': 1556, 'loss/train': 2.877984046936035} -09/20/2021 19:52:54 - INFO - __main__ - Step 24910: {'lr': 0.00019986786079337446, 'samples': 797120, 'steps': 1556, 'loss/train': 2.105177402496338} -09/20/2021 19:52:55 - INFO - __main__ - Step 24911: {'lr': 0.00019986786079337446, 'samples': 797152, 'steps': 1556, 'loss/train': 3.05072283744812} -09/20/2021 19:52:56 - INFO - __main__ - Step 24912: {'lr': 0.00019986786079337446, 'samples': 797184, 'steps': 1556, 'loss/train': 2.696209669113159} -09/20/2021 19:52:57 - INFO - __main__ - Step 24913: {'lr': 0.00019986753277357426, 'samples': 797216, 'steps': 1557, 'loss/train': 2.451901435852051} -09/20/2021 19:52:57 - INFO - __main__ - Step 24914: {'lr': 0.00019986753277357426, 'samples': 797248, 'steps': 1557, 'loss/train': 2.8167896270751953} -09/20/2021 19:52:58 - INFO - __main__ - Step 24915: {'lr': 0.00019986753277357426, 'samples': 797280, 'steps': 1557, 'loss/train': 2.587496280670166} -09/20/2021 19:52:59 - INFO - __main__ - Step 24916: {'lr': 0.00019986753277357426, 'samples': 797312, 'steps': 1557, 'loss/train': 3.412642002105713} -09/20/2021 19:53:00 - INFO - __main__ - Step 24917: {'lr': 0.00019986753277357426, 'samples': 797344, 'steps': 1557, 'loss/train': 2.354851245880127} -09/20/2021 19:53:01 - INFO - __main__ - Step 24918: {'lr': 0.00019986753277357426, 'samples': 797376, 'steps': 1557, 'loss/train': 3.7231855392456055} -09/20/2021 19:53:02 - INFO - __main__ - Step 24919: {'lr': 0.00019986753277357426, 'samples': 797408, 'steps': 1557, 'loss/train': 5.129631996154785} -09/20/2021 19:53:02 - INFO - __main__ - Step 24920: {'lr': 0.00019986753277357426, 'samples': 797440, 'steps': 1557, 'loss/train': 3.0481956005096436} -09/20/2021 19:53:03 - INFO - __main__ - Step 24921: {'lr': 0.00019986753277357426, 'samples': 797472, 'steps': 1557, 'loss/train': 2.762561559677124} -09/20/2021 19:53:04 - INFO - __main__ - Step 24922: {'lr': 0.00019986753277357426, 'samples': 797504, 'steps': 1557, 'loss/train': 3.6252782344818115} -09/20/2021 19:53:05 - INFO - __main__ - Step 24923: {'lr': 0.00019986753277357426, 'samples': 797536, 'steps': 1557, 'loss/train': 2.0006165504455566} -09/20/2021 19:53:05 - INFO - __main__ - Step 24924: {'lr': 0.00019986753277357426, 'samples': 797568, 'steps': 1557, 'loss/train': 3.045043706893921} -09/20/2021 19:53:06 - INFO - __main__ - Step 24925: {'lr': 0.00019986753277357426, 'samples': 797600, 'steps': 1557, 'loss/train': 2.6976547241210938} -09/20/2021 19:53:07 - INFO - __main__ - Step 24926: {'lr': 0.00019986753277357426, 'samples': 797632, 'steps': 1557, 'loss/train': 2.6069047451019287} -09/20/2021 19:53:08 - INFO - __main__ - Step 24927: {'lr': 0.00019986753277357426, 'samples': 797664, 'steps': 1557, 'loss/train': 2.816913604736328} -09/20/2021 19:53:08 - INFO - __main__ - Step 24928: {'lr': 0.00019986753277357426, 'samples': 797696, 'steps': 1557, 'loss/train': 0.8316696286201477} -09/20/2021 19:53:09 - INFO - __main__ - Step 24929: {'lr': 0.00019986720434741342, 'samples': 797728, 'steps': 1558, 'loss/train': 3.5946922302246094} -09/20/2021 19:53:10 - INFO - __main__ - Step 24930: {'lr': 0.00019986720434741342, 'samples': 797760, 'steps': 1558, 'loss/train': 3.125887632369995} -09/20/2021 19:53:11 - INFO - __main__ - Step 24931: {'lr': 0.00019986720434741342, 'samples': 797792, 'steps': 1558, 'loss/train': 2.4276273250579834} -09/20/2021 19:53:12 - INFO - __main__ - Step 24932: {'lr': 0.00019986720434741342, 'samples': 797824, 'steps': 1558, 'loss/train': 3.4832029342651367} -09/20/2021 19:53:12 - INFO - __main__ - Step 24933: {'lr': 0.00019986720434741342, 'samples': 797856, 'steps': 1558, 'loss/train': 3.0050365924835205} -09/20/2021 19:53:13 - INFO - __main__ - Step 24934: {'lr': 0.00019986720434741342, 'samples': 797888, 'steps': 1558, 'loss/train': 2.9995365142822266} -09/20/2021 19:53:14 - INFO - __main__ - Step 24935: {'lr': 0.00019986720434741342, 'samples': 797920, 'steps': 1558, 'loss/train': 2.9875423908233643} -09/20/2021 19:53:15 - INFO - __main__ - Step 24936: {'lr': 0.00019986720434741342, 'samples': 797952, 'steps': 1558, 'loss/train': 3.2197153568267822} -09/20/2021 19:53:15 - INFO - __main__ - Step 24937: {'lr': 0.00019986720434741342, 'samples': 797984, 'steps': 1558, 'loss/train': 3.209927558898926} -09/20/2021 19:53:16 - INFO - __main__ - Step 24938: {'lr': 0.00019986720434741342, 'samples': 798016, 'steps': 1558, 'loss/train': 3.1712071895599365} -09/20/2021 19:53:17 - INFO - __main__ - Step 24939: {'lr': 0.00019986720434741342, 'samples': 798048, 'steps': 1558, 'loss/train': 3.057706117630005} -09/20/2021 19:53:18 - INFO - __main__ - Step 24940: {'lr': 0.00019986720434741342, 'samples': 798080, 'steps': 1558, 'loss/train': 2.531482696533203} -09/20/2021 19:53:18 - INFO - __main__ - Step 24941: {'lr': 0.00019986720434741342, 'samples': 798112, 'steps': 1558, 'loss/train': 5.999413013458252} -09/20/2021 19:53:19 - INFO - __main__ - Step 24942: {'lr': 0.00019986720434741342, 'samples': 798144, 'steps': 1558, 'loss/train': 3.165487289428711} -09/20/2021 19:53:20 - INFO - __main__ - Step 24943: {'lr': 0.00019986720434741342, 'samples': 798176, 'steps': 1558, 'loss/train': 2.0759339332580566} -09/20/2021 19:53:21 - INFO - __main__ - Step 24944: {'lr': 0.00019986720434741342, 'samples': 798208, 'steps': 1558, 'loss/train': 3.4264276027679443} -09/20/2021 19:53:21 - INFO - __main__ - Step 24945: {'lr': 0.00019986687551489335, 'samples': 798240, 'steps': 1559, 'loss/train': 3.0765035152435303} -09/20/2021 19:53:22 - INFO - __main__ - Step 24946: {'lr': 0.00019986687551489335, 'samples': 798272, 'steps': 1559, 'loss/train': 3.0391526222229004} -09/20/2021 19:53:24 - INFO - __main__ - Step 24947: {'lr': 0.00019986687551489335, 'samples': 798304, 'steps': 1559, 'loss/train': 2.4458820819854736} -09/20/2021 19:53:25 - INFO - __main__ - Step 24948: {'lr': 0.00019986687551489335, 'samples': 798336, 'steps': 1559, 'loss/train': 2.694077730178833} -09/20/2021 19:53:25 - INFO - __main__ - Step 24949: {'lr': 0.00019986687551489335, 'samples': 798368, 'steps': 1559, 'loss/train': 3.3249142169952393} -09/20/2021 19:53:26 - INFO - __main__ - Step 24950: {'lr': 0.00019986687551489335, 'samples': 798400, 'steps': 1559, 'loss/train': 3.345869541168213} -09/20/2021 19:53:27 - INFO - __main__ - Step 24951: {'lr': 0.00019986687551489335, 'samples': 798432, 'steps': 1559, 'loss/train': 3.937549591064453} -09/20/2021 19:53:28 - INFO - __main__ - Step 24952: {'lr': 0.00019986687551489335, 'samples': 798464, 'steps': 1559, 'loss/train': 2.8816609382629395} -09/20/2021 19:53:28 - INFO - __main__ - Step 24953: {'lr': 0.00019986687551489335, 'samples': 798496, 'steps': 1559, 'loss/train': 2.6837351322174072} -09/20/2021 19:53:29 - INFO - __main__ - Step 24954: {'lr': 0.00019986687551489335, 'samples': 798528, 'steps': 1559, 'loss/train': 2.5451252460479736} -09/20/2021 19:53:30 - INFO - __main__ - Step 24955: {'lr': 0.00019986687551489335, 'samples': 798560, 'steps': 1559, 'loss/train': 3.5696704387664795} -09/20/2021 19:53:31 - INFO - __main__ - Step 24956: {'lr': 0.00019986687551489335, 'samples': 798592, 'steps': 1559, 'loss/train': 3.513519048690796} -09/20/2021 19:53:31 - INFO - __main__ - Step 24957: {'lr': 0.00019986687551489335, 'samples': 798624, 'steps': 1559, 'loss/train': 0.4701380431652069} -09/20/2021 19:53:32 - INFO - __main__ - Step 24958: {'lr': 0.00019986687551489335, 'samples': 798656, 'steps': 1559, 'loss/train': 0.3256691098213196} -09/20/2021 19:53:33 - INFO - __main__ - Step 24959: {'lr': 0.00019986687551489335, 'samples': 798688, 'steps': 1559, 'loss/train': 0.5345089435577393} -09/20/2021 19:53:34 - INFO - __main__ - Step 24960: {'lr': 0.00019986687551489335, 'samples': 798720, 'steps': 1559, 'loss/train': 2.3396689891815186} -09/20/2021 19:53:35 - INFO - __main__ - Step 24961: {'lr': 0.00019986654627601532, 'samples': 798752, 'steps': 1560, 'loss/train': 3.5884246826171875} -09/20/2021 19:53:35 - INFO - __main__ - Step 24962: {'lr': 0.00019986654627601532, 'samples': 798784, 'steps': 1560, 'loss/train': 3.14831805229187} -09/20/2021 19:53:36 - INFO - __main__ - Step 24963: {'lr': 0.00019986654627601532, 'samples': 798816, 'steps': 1560, 'loss/train': 1.8979859352111816} -09/20/2021 19:53:37 - INFO - __main__ - Step 24964: {'lr': 0.00019986654627601532, 'samples': 798848, 'steps': 1560, 'loss/train': 3.0192131996154785} -09/20/2021 19:53:38 - INFO - __main__ - Step 24965: {'lr': 0.00019986654627601532, 'samples': 798880, 'steps': 1560, 'loss/train': 2.9747684001922607} -09/20/2021 19:53:38 - INFO - __main__ - Step 24966: {'lr': 0.00019986654627601532, 'samples': 798912, 'steps': 1560, 'loss/train': 3.4515209197998047} -09/20/2021 19:53:39 - INFO - __main__ - Step 24967: {'lr': 0.00019986654627601532, 'samples': 798944, 'steps': 1560, 'loss/train': 3.292478561401367} -09/20/2021 19:53:40 - INFO - __main__ - Step 24968: {'lr': 0.00019986654627601532, 'samples': 798976, 'steps': 1560, 'loss/train': 2.433739185333252} -09/20/2021 19:53:41 - INFO - __main__ - Step 24969: {'lr': 0.00019986654627601532, 'samples': 799008, 'steps': 1560, 'loss/train': 3.3207356929779053} -09/20/2021 19:53:41 - INFO - __main__ - Step 24970: {'lr': 0.00019986654627601532, 'samples': 799040, 'steps': 1560, 'loss/train': 2.807654857635498} -09/20/2021 19:53:42 - INFO - __main__ - Step 24971: {'lr': 0.00019986654627601532, 'samples': 799072, 'steps': 1560, 'loss/train': 4.198572635650635} -09/20/2021 19:53:43 - INFO - __main__ - Step 24972: {'lr': 0.00019986654627601532, 'samples': 799104, 'steps': 1560, 'loss/train': 3.488365650177002} -09/20/2021 19:53:44 - INFO - __main__ - Step 24973: {'lr': 0.00019986654627601532, 'samples': 799136, 'steps': 1560, 'loss/train': 3.3339812755584717} -09/20/2021 19:53:44 - INFO - __main__ - Step 24974: {'lr': 0.00019986654627601532, 'samples': 799168, 'steps': 1560, 'loss/train': 2.0233988761901855} -09/20/2021 19:53:45 - INFO - __main__ - Step 24975: {'lr': 0.00019986654627601532, 'samples': 799200, 'steps': 1560, 'loss/train': 2.894523859024048} -09/20/2021 19:53:47 - INFO - __main__ - Step 24976: {'lr': 0.00019986654627601532, 'samples': 799232, 'steps': 1560, 'loss/train': 2.596085548400879} -09/20/2021 19:53:48 - INFO - __main__ - Step 24977: {'lr': 0.0001998662166307807, 'samples': 799264, 'steps': 1561, 'loss/train': 0.5402947068214417} -09/20/2021 19:53:48 - INFO - __main__ - Step 24978: {'lr': 0.0001998662166307807, 'samples': 799296, 'steps': 1561, 'loss/train': 2.3769896030426025} -09/20/2021 19:53:49 - INFO - __main__ - Step 24979: {'lr': 0.0001998662166307807, 'samples': 799328, 'steps': 1561, 'loss/train': 4.108720779418945} -09/20/2021 19:53:50 - INFO - __main__ - Step 24980: {'lr': 0.0001998662166307807, 'samples': 799360, 'steps': 1561, 'loss/train': 3.267698287963867} -09/20/2021 19:53:51 - INFO - __main__ - Step 24981: {'lr': 0.0001998662166307807, 'samples': 799392, 'steps': 1561, 'loss/train': 2.690002918243408} -09/20/2021 19:53:51 - INFO - __main__ - Step 24982: {'lr': 0.0001998662166307807, 'samples': 799424, 'steps': 1561, 'loss/train': 2.778864860534668} -09/20/2021 19:53:52 - INFO - __main__ - Step 24983: {'lr': 0.0001998662166307807, 'samples': 799456, 'steps': 1561, 'loss/train': 3.4615938663482666} -09/20/2021 19:53:53 - INFO - __main__ - Step 24984: {'lr': 0.0001998662166307807, 'samples': 799488, 'steps': 1561, 'loss/train': 2.1533846855163574} -09/20/2021 19:53:54 - INFO - __main__ - Step 24985: {'lr': 0.0001998662166307807, 'samples': 799520, 'steps': 1561, 'loss/train': 2.6400136947631836} -09/20/2021 19:53:54 - INFO - __main__ - Step 24986: {'lr': 0.0001998662166307807, 'samples': 799552, 'steps': 1561, 'loss/train': 2.519676446914673} -09/20/2021 19:53:55 - INFO - __main__ - Step 24987: {'lr': 0.0001998662166307807, 'samples': 799584, 'steps': 1561, 'loss/train': 4.104724884033203} -09/20/2021 19:53:56 - INFO - __main__ - Step 24988: {'lr': 0.0001998662166307807, 'samples': 799616, 'steps': 1561, 'loss/train': 2.653813123703003} -09/20/2021 19:53:57 - INFO - __main__ - Step 24989: {'lr': 0.0001998662166307807, 'samples': 799648, 'steps': 1561, 'loss/train': 3.2402069568634033} -09/20/2021 19:53:57 - INFO - __main__ - Step 24990: {'lr': 0.0001998662166307807, 'samples': 799680, 'steps': 1561, 'loss/train': 2.212029457092285} -09/20/2021 19:53:58 - INFO - __main__ - Step 24991: {'lr': 0.0001998662166307807, 'samples': 799712, 'steps': 1561, 'loss/train': 2.887803792953491} -09/20/2021 19:53:59 - INFO - __main__ - Step 24992: {'lr': 0.0001998662166307807, 'samples': 799744, 'steps': 1561, 'loss/train': 2.969803810119629} -09/20/2021 19:54:00 - INFO - __main__ - Step 24993: {'lr': 0.00019986588657919084, 'samples': 799776, 'steps': 1562, 'loss/train': 2.8616621494293213} -09/20/2021 19:54:00 - INFO - __main__ - Step 24994: {'lr': 0.00019986588657919084, 'samples': 799808, 'steps': 1562, 'loss/train': 3.0121829509735107} -09/20/2021 19:54:01 - INFO - __main__ - Step 24995: {'lr': 0.00019986588657919084, 'samples': 799840, 'steps': 1562, 'loss/train': 3.5356814861297607} -09/20/2021 19:54:02 - INFO - __main__ - Step 24996: {'lr': 0.00019986588657919084, 'samples': 799872, 'steps': 1562, 'loss/train': 3.7856225967407227} -09/20/2021 19:54:03 - INFO - __main__ - Step 24997: {'lr': 0.00019986588657919084, 'samples': 799904, 'steps': 1562, 'loss/train': 3.3727900981903076} -09/20/2021 19:54:03 - INFO - __main__ - Step 24998: {'lr': 0.00019986588657919084, 'samples': 799936, 'steps': 1562, 'loss/train': 2.83266282081604} -09/20/2021 19:54:04 - INFO - __main__ - Step 24999: {'lr': 0.00019986588657919084, 'samples': 799968, 'steps': 1562, 'loss/train': 3.3199641704559326} -09/20/2021 19:54:05 - INFO - __main__ - Step 25000: {'lr': 0.00019986588657919084, 'samples': 800000, 'steps': 1562, 'loss/train': 3.8518824577331543} -09/20/2021 19:54:06 - INFO - __main__ - Step 25001: {'lr': 0.00019986588657919084, 'samples': 800032, 'steps': 1562, 'loss/train': 3.5477960109710693} -09/20/2021 19:54:06 - INFO - __main__ - Step 25002: {'lr': 0.00019986588657919084, 'samples': 800064, 'steps': 1562, 'loss/train': 3.5774905681610107} -09/20/2021 19:54:07 - INFO - __main__ - Step 25003: {'lr': 0.00019986588657919084, 'samples': 800096, 'steps': 1562, 'loss/train': 2.721179485321045} -09/20/2021 19:54:08 - INFO - __main__ - Step 25004: {'lr': 0.00019986588657919084, 'samples': 800128, 'steps': 1562, 'loss/train': 2.275505542755127} -09/20/2021 19:54:09 - INFO - __main__ - Step 25005: {'lr': 0.00019986588657919084, 'samples': 800160, 'steps': 1562, 'loss/train': 2.3546366691589355} -09/20/2021 19:54:09 - INFO - __main__ - Step 25006: {'lr': 0.00019986588657919084, 'samples': 800192, 'steps': 1562, 'loss/train': 3.025062322616577} -09/20/2021 19:54:10 - INFO - __main__ - Step 25007: {'lr': 0.00019986588657919084, 'samples': 800224, 'steps': 1562, 'loss/train': 3.5628411769866943} -09/20/2021 19:54:11 - INFO - __main__ - Step 25008: {'lr': 0.00019986588657919084, 'samples': 800256, 'steps': 1562, 'loss/train': 3.9462199211120605} -09/20/2021 19:54:12 - INFO - __main__ - Step 25009: {'lr': 0.00019986555612124706, 'samples': 800288, 'steps': 1563, 'loss/train': 3.843046188354492} -09/20/2021 19:54:13 - INFO - __main__ - Step 25010: {'lr': 0.00019986555612124706, 'samples': 800320, 'steps': 1563, 'loss/train': 2.762873888015747} -09/20/2021 19:54:13 - INFO - __main__ - Step 25011: {'lr': 0.00019986555612124706, 'samples': 800352, 'steps': 1563, 'loss/train': 2.5702099800109863} -09/20/2021 19:54:14 - INFO - __main__ - Step 25012: {'lr': 0.00019986555612124706, 'samples': 800384, 'steps': 1563, 'loss/train': 3.748605251312256} -09/20/2021 19:54:15 - INFO - __main__ - Step 25013: {'lr': 0.00019986555612124706, 'samples': 800416, 'steps': 1563, 'loss/train': 2.3000648021698} -09/20/2021 19:54:16 - INFO - __main__ - Step 25014: {'lr': 0.00019986555612124706, 'samples': 800448, 'steps': 1563, 'loss/train': 2.7209739685058594} -09/20/2021 19:54:17 - INFO - __main__ - Step 25015: {'lr': 0.00019986555612124706, 'samples': 800480, 'steps': 1563, 'loss/train': 2.88932466506958} -09/20/2021 19:54:18 - INFO - __main__ - Step 25016: {'lr': 0.00019986555612124706, 'samples': 800512, 'steps': 1563, 'loss/train': 2.395230531692505} -09/20/2021 19:54:18 - INFO - __main__ - Step 25017: {'lr': 0.00019986555612124706, 'samples': 800544, 'steps': 1563, 'loss/train': 2.985807418823242} -09/20/2021 19:54:19 - INFO - __main__ - Step 25018: {'lr': 0.00019986555612124706, 'samples': 800576, 'steps': 1563, 'loss/train': 2.9115755558013916} -09/20/2021 19:54:20 - INFO - __main__ - Step 25019: {'lr': 0.00019986555612124706, 'samples': 800608, 'steps': 1563, 'loss/train': 2.355950117111206} -09/20/2021 19:54:21 - INFO - __main__ - Step 25020: {'lr': 0.00019986555612124706, 'samples': 800640, 'steps': 1563, 'loss/train': 3.0052335262298584} -09/20/2021 19:54:21 - INFO - __main__ - Step 25021: {'lr': 0.00019986555612124706, 'samples': 800672, 'steps': 1563, 'loss/train': 2.854810953140259} -09/20/2021 19:54:22 - INFO - __main__ - Step 25022: {'lr': 0.00019986555612124706, 'samples': 800704, 'steps': 1563, 'loss/train': 2.6602768898010254} -09/20/2021 19:54:23 - INFO - __main__ - Step 25023: {'lr': 0.00019986555612124706, 'samples': 800736, 'steps': 1563, 'loss/train': 4.3790693283081055} -09/20/2021 19:54:24 - INFO - __main__ - Step 25024: {'lr': 0.00019986555612124706, 'samples': 800768, 'steps': 1563, 'loss/train': 2.341735363006592} -09/20/2021 19:54:25 - INFO - __main__ - Step 25025: {'lr': 0.00019986522525695076, 'samples': 800800, 'steps': 1564, 'loss/train': 2.484128952026367} -09/20/2021 19:54:25 - INFO - __main__ - Step 25026: {'lr': 0.00019986522525695076, 'samples': 800832, 'steps': 1564, 'loss/train': 2.6026124954223633} -09/20/2021 19:54:26 - INFO - __main__ - Step 25027: {'lr': 0.00019986522525695076, 'samples': 800864, 'steps': 1564, 'loss/train': 1.839106559753418} -09/20/2021 19:54:27 - INFO - __main__ - Step 25028: {'lr': 0.00019986522525695076, 'samples': 800896, 'steps': 1564, 'loss/train': 2.4504787921905518} -09/20/2021 19:54:28 - INFO - __main__ - Step 25029: {'lr': 0.00019986522525695076, 'samples': 800928, 'steps': 1564, 'loss/train': 2.4151558876037598} -09/20/2021 19:54:28 - INFO - __main__ - Step 25030: {'lr': 0.00019986522525695076, 'samples': 800960, 'steps': 1564, 'loss/train': 2.854923725128174} -09/20/2021 19:54:29 - INFO - __main__ - Step 25031: {'lr': 0.00019986522525695076, 'samples': 800992, 'steps': 1564, 'loss/train': 3.351132869720459} -09/20/2021 19:54:30 - INFO - __main__ - Step 25032: {'lr': 0.00019986522525695076, 'samples': 801024, 'steps': 1564, 'loss/train': 3.6284737586975098} -09/20/2021 19:54:31 - INFO - __main__ - Step 25033: {'lr': 0.00019986522525695076, 'samples': 801056, 'steps': 1564, 'loss/train': 2.898538112640381} -09/20/2021 19:54:31 - INFO - __main__ - Step 25034: {'lr': 0.00019986522525695076, 'samples': 801088, 'steps': 1564, 'loss/train': 2.7415072917938232} -09/20/2021 19:54:32 - INFO - __main__ - Step 25035: {'lr': 0.00019986522525695076, 'samples': 801120, 'steps': 1564, 'loss/train': 3.976203680038452} -09/20/2021 19:54:33 - INFO - __main__ - Step 25036: {'lr': 0.00019986522525695076, 'samples': 801152, 'steps': 1564, 'loss/train': 2.997528076171875} -09/20/2021 19:54:34 - INFO - __main__ - Step 25037: {'lr': 0.00019986522525695076, 'samples': 801184, 'steps': 1564, 'loss/train': 2.5376060009002686} -09/20/2021 19:54:34 - INFO - __main__ - Step 25038: {'lr': 0.00019986522525695076, 'samples': 801216, 'steps': 1564, 'loss/train': 2.5695691108703613} -09/20/2021 19:54:35 - INFO - __main__ - Step 25039: {'lr': 0.00019986522525695076, 'samples': 801248, 'steps': 1564, 'loss/train': 2.8764748573303223} -09/20/2021 19:54:36 - INFO - __main__ - Step 25040: {'lr': 0.00019986522525695076, 'samples': 801280, 'steps': 1564, 'loss/train': 2.852085590362549} -09/20/2021 19:54:37 - INFO - __main__ - Step 25041: {'lr': 0.0001998648939863032, 'samples': 801312, 'steps': 1565, 'loss/train': 2.6694071292877197} -09/20/2021 19:54:37 - INFO - __main__ - Step 25042: {'lr': 0.0001998648939863032, 'samples': 801344, 'steps': 1565, 'loss/train': 2.7966694831848145} -09/20/2021 19:54:38 - INFO - __main__ - Step 25043: {'lr': 0.0001998648939863032, 'samples': 801376, 'steps': 1565, 'loss/train': 1.0919090509414673} -09/20/2021 19:54:39 - INFO - __main__ - Step 25044: {'lr': 0.0001998648939863032, 'samples': 801408, 'steps': 1565, 'loss/train': 3.1904404163360596} -09/20/2021 19:54:40 - INFO - __main__ - Step 25045: {'lr': 0.0001998648939863032, 'samples': 801440, 'steps': 1565, 'loss/train': 2.071500301361084} -09/20/2021 19:54:41 - INFO - __main__ - Step 25046: {'lr': 0.0001998648939863032, 'samples': 801472, 'steps': 1565, 'loss/train': 2.515218734741211} -09/20/2021 19:54:42 - INFO - __main__ - Step 25047: {'lr': 0.0001998648939863032, 'samples': 801504, 'steps': 1565, 'loss/train': 2.4861807823181152} -09/20/2021 19:54:43 - INFO - __main__ - Step 25048: {'lr': 0.0001998648939863032, 'samples': 801536, 'steps': 1565, 'loss/train': 3.2161033153533936} -09/20/2021 19:54:44 - INFO - __main__ - Step 25049: {'lr': 0.0001998648939863032, 'samples': 801568, 'steps': 1565, 'loss/train': 3.1624908447265625} -09/20/2021 19:54:44 - INFO - __main__ - Step 25050: {'lr': 0.0001998648939863032, 'samples': 801600, 'steps': 1565, 'loss/train': 2.417141914367676} -09/20/2021 19:54:45 - INFO - __main__ - Step 25051: {'lr': 0.0001998648939863032, 'samples': 801632, 'steps': 1565, 'loss/train': 2.559882164001465} -09/20/2021 19:54:46 - INFO - __main__ - Step 25052: {'lr': 0.0001998648939863032, 'samples': 801664, 'steps': 1565, 'loss/train': 3.3015005588531494} -09/20/2021 19:54:47 - INFO - __main__ - Step 25053: {'lr': 0.0001998648939863032, 'samples': 801696, 'steps': 1565, 'loss/train': 2.719386100769043} -09/20/2021 19:54:47 - INFO - __main__ - Step 25054: {'lr': 0.0001998648939863032, 'samples': 801728, 'steps': 1565, 'loss/train': 2.4463932514190674} -09/20/2021 19:54:48 - INFO - __main__ - Step 25055: {'lr': 0.0001998648939863032, 'samples': 801760, 'steps': 1565, 'loss/train': 3.1098709106445312} -09/20/2021 19:54:49 - INFO - __main__ - Step 25056: {'lr': 0.0001998648939863032, 'samples': 801792, 'steps': 1565, 'loss/train': 3.1701080799102783} -09/20/2021 19:54:50 - INFO - __main__ - Step 25057: {'lr': 0.00019986456230930582, 'samples': 801824, 'steps': 1566, 'loss/train': 2.0907981395721436} -09/20/2021 19:54:50 - INFO - __main__ - Step 25058: {'lr': 0.00019986456230930582, 'samples': 801856, 'steps': 1566, 'loss/train': 2.041606903076172} -09/20/2021 19:54:51 - INFO - __main__ - Step 25059: {'lr': 0.00019986456230930582, 'samples': 801888, 'steps': 1566, 'loss/train': 2.1220972537994385} -09/20/2021 19:54:52 - INFO - __main__ - Step 25060: {'lr': 0.00019986456230930582, 'samples': 801920, 'steps': 1566, 'loss/train': 2.1850998401641846} -09/20/2021 19:54:53 - INFO - __main__ - Step 25061: {'lr': 0.00019986456230930582, 'samples': 801952, 'steps': 1566, 'loss/train': 1.9139890670776367} -09/20/2021 19:54:53 - INFO - __main__ - Step 25062: {'lr': 0.00019986456230930582, 'samples': 801984, 'steps': 1566, 'loss/train': 3.010878324508667} -09/20/2021 19:54:54 - INFO - __main__ - Step 25063: {'lr': 0.00019986456230930582, 'samples': 802016, 'steps': 1566, 'loss/train': 3.4475960731506348} -09/20/2021 19:54:55 - INFO - __main__ - Step 25064: {'lr': 0.00019986456230930582, 'samples': 802048, 'steps': 1566, 'loss/train': 3.8131120204925537} -09/20/2021 19:54:56 - INFO - __main__ - Step 25065: {'lr': 0.00019986456230930582, 'samples': 802080, 'steps': 1566, 'loss/train': 2.5775818824768066} -09/20/2021 19:54:56 - INFO - __main__ - Step 25066: {'lr': 0.00019986456230930582, 'samples': 802112, 'steps': 1566, 'loss/train': 2.868281841278076} -09/20/2021 19:54:57 - INFO - __main__ - Step 25067: {'lr': 0.00019986456230930582, 'samples': 802144, 'steps': 1566, 'loss/train': 3.25673770904541} -09/20/2021 19:54:58 - INFO - __main__ - Step 25068: {'lr': 0.00019986456230930582, 'samples': 802176, 'steps': 1566, 'loss/train': 2.259040117263794} -09/20/2021 19:54:59 - INFO - __main__ - Step 25069: {'lr': 0.00019986456230930582, 'samples': 802208, 'steps': 1566, 'loss/train': 4.654092788696289} -09/20/2021 19:54:59 - INFO - __main__ - Step 25070: {'lr': 0.00019986456230930582, 'samples': 802240, 'steps': 1566, 'loss/train': 5.160802364349365} -09/20/2021 19:55:00 - INFO - __main__ - Step 25071: {'lr': 0.00019986456230930582, 'samples': 802272, 'steps': 1566, 'loss/train': 2.628120183944702} -09/20/2021 19:55:01 - INFO - __main__ - Step 25072: {'lr': 0.00019986456230930582, 'samples': 802304, 'steps': 1566, 'loss/train': 2.8716118335723877} -09/20/2021 19:55:02 - INFO - __main__ - Step 25073: {'lr': 0.00019986423022595991, 'samples': 802336, 'steps': 1567, 'loss/train': 1.8918495178222656} -09/20/2021 19:55:03 - INFO - __main__ - Step 25074: {'lr': 0.00019986423022595991, 'samples': 802368, 'steps': 1567, 'loss/train': 0.9927337765693665} -09/20/2021 19:55:03 - INFO - __main__ - Step 25075: {'lr': 0.00019986423022595991, 'samples': 802400, 'steps': 1567, 'loss/train': 2.2974565029144287} -09/20/2021 19:55:04 - INFO - __main__ - Step 25076: {'lr': 0.00019986423022595991, 'samples': 802432, 'steps': 1567, 'loss/train': 2.6396524906158447} -09/20/2021 19:55:05 - INFO - __main__ - Step 25077: {'lr': 0.00019986423022595991, 'samples': 802464, 'steps': 1567, 'loss/train': 3.2647652626037598} -09/20/2021 19:55:06 - INFO - __main__ - Step 25078: {'lr': 0.00019986423022595991, 'samples': 802496, 'steps': 1567, 'loss/train': 3.090564012527466} -09/20/2021 19:55:07 - INFO - __main__ - Step 25079: {'lr': 0.00019986423022595991, 'samples': 802528, 'steps': 1567, 'loss/train': 3.294250726699829} -09/20/2021 19:55:08 - INFO - __main__ - Step 25080: {'lr': 0.00019986423022595991, 'samples': 802560, 'steps': 1567, 'loss/train': 0.6963714361190796} -09/20/2021 19:55:09 - INFO - __main__ - Step 25081: {'lr': 0.00019986423022595991, 'samples': 802592, 'steps': 1567, 'loss/train': 2.642789363861084} -09/20/2021 19:55:09 - INFO - __main__ - Step 25082: {'lr': 0.00019986423022595991, 'samples': 802624, 'steps': 1567, 'loss/train': 2.4303486347198486} -09/20/2021 19:55:10 - INFO - __main__ - Step 25083: {'lr': 0.00019986423022595991, 'samples': 802656, 'steps': 1567, 'loss/train': 1.5089824199676514} -09/20/2021 19:55:11 - INFO - __main__ - Step 25084: {'lr': 0.00019986423022595991, 'samples': 802688, 'steps': 1567, 'loss/train': 2.7920968532562256} -09/20/2021 19:55:12 - INFO - __main__ - Step 25085: {'lr': 0.00019986423022595991, 'samples': 802720, 'steps': 1567, 'loss/train': 2.0084729194641113} -09/20/2021 19:55:12 - INFO - __main__ - Step 25086: {'lr': 0.00019986423022595991, 'samples': 802752, 'steps': 1567, 'loss/train': 1.9693799018859863} -09/20/2021 19:55:13 - INFO - __main__ - Step 25087: {'lr': 0.00019986423022595991, 'samples': 802784, 'steps': 1567, 'loss/train': 2.2647221088409424} -09/20/2021 19:55:14 - INFO - __main__ - Step 25088: {'lr': 0.00019986423022595991, 'samples': 802816, 'steps': 1567, 'loss/train': 3.1276071071624756} -09/20/2021 19:55:15 - INFO - __main__ - Step 25089: {'lr': 0.0001998638977362668, 'samples': 802848, 'steps': 1568, 'loss/train': 2.6097240447998047} -09/20/2021 19:55:15 - INFO - __main__ - Step 25090: {'lr': 0.0001998638977362668, 'samples': 802880, 'steps': 1568, 'loss/train': 3.075566530227661} -09/20/2021 19:55:16 - INFO - __main__ - Step 25091: {'lr': 0.0001998638977362668, 'samples': 802912, 'steps': 1568, 'loss/train': 2.941039562225342} -09/20/2021 19:55:17 - INFO - __main__ - Step 25092: {'lr': 0.0001998638977362668, 'samples': 802944, 'steps': 1568, 'loss/train': 2.582412004470825} -09/20/2021 19:55:18 - INFO - __main__ - Step 25093: {'lr': 0.0001998638977362668, 'samples': 802976, 'steps': 1568, 'loss/train': 3.425595760345459} -09/20/2021 19:55:18 - INFO - __main__ - Step 25094: {'lr': 0.0001998638977362668, 'samples': 803008, 'steps': 1568, 'loss/train': 3.5834665298461914} -09/20/2021 19:55:19 - INFO - __main__ - Step 25095: {'lr': 0.0001998638977362668, 'samples': 803040, 'steps': 1568, 'loss/train': 3.3649511337280273} -09/20/2021 19:55:20 - INFO - __main__ - Step 25096: {'lr': 0.0001998638977362668, 'samples': 803072, 'steps': 1568, 'loss/train': 0.7464865446090698} -09/20/2021 19:55:21 - INFO - __main__ - Step 25097: {'lr': 0.0001998638977362668, 'samples': 803104, 'steps': 1568, 'loss/train': 0.5391913056373596} -09/20/2021 19:55:21 - INFO - __main__ - Step 25098: {'lr': 0.0001998638977362668, 'samples': 803136, 'steps': 1568, 'loss/train': 0.9657204151153564} -09/20/2021 19:55:22 - INFO - __main__ - Step 25099: {'lr': 0.0001998638977362668, 'samples': 803168, 'steps': 1568, 'loss/train': 2.946206569671631} -09/20/2021 19:55:23 - INFO - __main__ - Step 25100: {'lr': 0.0001998638977362668, 'samples': 803200, 'steps': 1568, 'loss/train': 2.0961856842041016} -09/20/2021 19:55:24 - INFO - __main__ - Step 25101: {'lr': 0.0001998638977362668, 'samples': 803232, 'steps': 1568, 'loss/train': 2.470299243927002} -09/20/2021 19:55:24 - INFO - __main__ - Step 25102: {'lr': 0.0001998638977362668, 'samples': 803264, 'steps': 1568, 'loss/train': 3.132718324661255} -09/20/2021 19:55:25 - INFO - __main__ - Step 25103: {'lr': 0.0001998638977362668, 'samples': 803296, 'steps': 1568, 'loss/train': 2.917086124420166} -09/20/2021 19:55:26 - INFO - __main__ - Step 25104: {'lr': 0.0001998638977362668, 'samples': 803328, 'steps': 1568, 'loss/train': 1.1597706079483032} -09/20/2021 19:55:27 - INFO - __main__ - Step 25105: {'lr': 0.00019986356484022792, 'samples': 803360, 'steps': 1569, 'loss/train': 3.0886850357055664} -09/20/2021 19:55:28 - INFO - __main__ - Step 25106: {'lr': 0.00019986356484022792, 'samples': 803392, 'steps': 1569, 'loss/train': 2.6436281204223633} -09/20/2021 19:55:28 - INFO - __main__ - Step 25107: {'lr': 0.00019986356484022792, 'samples': 803424, 'steps': 1569, 'loss/train': 2.059424638748169} -09/20/2021 19:55:29 - INFO - __main__ - Step 25108: {'lr': 0.00019986356484022792, 'samples': 803456, 'steps': 1569, 'loss/train': 3.192013740539551} -09/20/2021 19:55:30 - INFO - __main__ - Step 25109: {'lr': 0.00019986356484022792, 'samples': 803488, 'steps': 1569, 'loss/train': 3.482283353805542} -09/20/2021 19:55:31 - INFO - __main__ - Step 25110: {'lr': 0.00019986356484022792, 'samples': 803520, 'steps': 1569, 'loss/train': 2.3234853744506836} -09/20/2021 19:55:32 - INFO - __main__ - Step 25111: {'lr': 0.00019986356484022792, 'samples': 803552, 'steps': 1569, 'loss/train': 2.511843204498291} -09/20/2021 19:55:33 - INFO - __main__ - Step 25112: {'lr': 0.00019986356484022792, 'samples': 803584, 'steps': 1569, 'loss/train': 3.3931496143341064} -09/20/2021 19:55:34 - INFO - __main__ - Step 25113: {'lr': 0.00019986356484022792, 'samples': 803616, 'steps': 1569, 'loss/train': 3.386218786239624} -09/20/2021 19:55:34 - INFO - __main__ - Step 25114: {'lr': 0.00019986356484022792, 'samples': 803648, 'steps': 1569, 'loss/train': 2.6110353469848633} -09/20/2021 19:55:35 - INFO - __main__ - Step 25115: {'lr': 0.00019986356484022792, 'samples': 803680, 'steps': 1569, 'loss/train': 2.3747851848602295} -09/20/2021 19:55:36 - INFO - __main__ - Step 25116: {'lr': 0.00019986356484022792, 'samples': 803712, 'steps': 1569, 'loss/train': 2.1068267822265625} -09/20/2021 19:55:37 - INFO - __main__ - Step 25117: {'lr': 0.00019986356484022792, 'samples': 803744, 'steps': 1569, 'loss/train': 2.245154857635498} -09/20/2021 19:55:37 - INFO - __main__ - Step 25118: {'lr': 0.00019986356484022792, 'samples': 803776, 'steps': 1569, 'loss/train': 2.8914687633514404} -09/20/2021 19:55:38 - INFO - __main__ - Step 25119: {'lr': 0.00019986356484022792, 'samples': 803808, 'steps': 1569, 'loss/train': 3.494062662124634} -09/20/2021 19:55:39 - INFO - __main__ - Step 25120: {'lr': 0.00019986356484022792, 'samples': 803840, 'steps': 1569, 'loss/train': 1.733221173286438} -09/20/2021 19:55:40 - INFO - __main__ - Step 25121: {'lr': 0.00019986323153784456, 'samples': 803872, 'steps': 1570, 'loss/train': 2.9817752838134766} -09/20/2021 19:55:40 - INFO - __main__ - Step 25122: {'lr': 0.00019986323153784456, 'samples': 803904, 'steps': 1570, 'loss/train': 5.396787166595459} -09/20/2021 19:55:41 - INFO - __main__ - Step 25123: {'lr': 0.00019986323153784456, 'samples': 803936, 'steps': 1570, 'loss/train': 3.504197835922241} -09/20/2021 19:55:42 - INFO - __main__ - Step 25124: {'lr': 0.00019986323153784456, 'samples': 803968, 'steps': 1570, 'loss/train': 2.440437078475952} -09/20/2021 19:55:43 - INFO - __main__ - Step 25125: {'lr': 0.00019986323153784456, 'samples': 804000, 'steps': 1570, 'loss/train': 2.9368295669555664} -09/20/2021 19:55:43 - INFO - __main__ - Step 25126: {'lr': 0.00019986323153784456, 'samples': 804032, 'steps': 1570, 'loss/train': 2.5171830654144287} -09/20/2021 19:55:44 - INFO - __main__ - Step 25127: {'lr': 0.00019986323153784456, 'samples': 804064, 'steps': 1570, 'loss/train': 2.148963212966919} -09/20/2021 19:55:45 - INFO - __main__ - Step 25128: {'lr': 0.00019986323153784456, 'samples': 804096, 'steps': 1570, 'loss/train': 3.115949869155884} -09/20/2021 19:55:46 - INFO - __main__ - Step 25129: {'lr': 0.00019986323153784456, 'samples': 804128, 'steps': 1570, 'loss/train': 1.6790188550949097} -09/20/2021 19:55:46 - INFO - __main__ - Step 25130: {'lr': 0.00019986323153784456, 'samples': 804160, 'steps': 1570, 'loss/train': 3.6322524547576904} -09/20/2021 19:55:47 - INFO - __main__ - Step 25131: {'lr': 0.00019986323153784456, 'samples': 804192, 'steps': 1570, 'loss/train': 3.4098055362701416} -09/20/2021 19:55:48 - INFO - __main__ - Step 25132: {'lr': 0.00019986323153784456, 'samples': 804224, 'steps': 1570, 'loss/train': 2.958550453186035} -09/20/2021 19:55:49 - INFO - __main__ - Step 25133: {'lr': 0.00019986323153784456, 'samples': 804256, 'steps': 1570, 'loss/train': 2.6827824115753174} -09/20/2021 19:55:49 - INFO - __main__ - Step 25134: {'lr': 0.00019986323153784456, 'samples': 804288, 'steps': 1570, 'loss/train': 1.0676127672195435} -09/20/2021 19:55:50 - INFO - __main__ - Step 25135: {'lr': 0.00019986323153784456, 'samples': 804320, 'steps': 1570, 'loss/train': 2.0612454414367676} -09/20/2021 19:55:51 - INFO - __main__ - Step 25136: {'lr': 0.00019986323153784456, 'samples': 804352, 'steps': 1570, 'loss/train': 1.719261884689331} -09/20/2021 19:55:52 - INFO - __main__ - Step 25137: {'lr': 0.0001998628978291181, 'samples': 804384, 'steps': 1571, 'loss/train': 1.928381085395813} -09/20/2021 19:55:53 - INFO - __main__ - Step 25138: {'lr': 0.0001998628978291181, 'samples': 804416, 'steps': 1571, 'loss/train': 1.7126705646514893} -09/20/2021 19:55:53 - INFO - __main__ - Step 25139: {'lr': 0.0001998628978291181, 'samples': 804448, 'steps': 1571, 'loss/train': 2.3113772869110107} -09/20/2021 19:55:54 - INFO - __main__ - Step 25140: {'lr': 0.0001998628978291181, 'samples': 804480, 'steps': 1571, 'loss/train': 3.2764692306518555} -09/20/2021 19:55:55 - INFO - __main__ - Step 25141: {'lr': 0.0001998628978291181, 'samples': 804512, 'steps': 1571, 'loss/train': 2.6729021072387695} -09/20/2021 19:55:56 - INFO - __main__ - Step 25142: {'lr': 0.0001998628978291181, 'samples': 804544, 'steps': 1571, 'loss/train': 3.05855655670166} -09/20/2021 19:55:57 - INFO - __main__ - Step 25143: {'lr': 0.0001998628978291181, 'samples': 804576, 'steps': 1571, 'loss/train': 3.7278335094451904} -09/20/2021 19:55:58 - INFO - __main__ - Step 25144: {'lr': 0.0001998628978291181, 'samples': 804608, 'steps': 1571, 'loss/train': 2.7911150455474854} -09/20/2021 19:55:58 - INFO - __main__ - Step 25145: {'lr': 0.0001998628978291181, 'samples': 804640, 'steps': 1571, 'loss/train': 3.4195942878723145} -09/20/2021 19:55:59 - INFO - __main__ - Step 25146: {'lr': 0.0001998628978291181, 'samples': 804672, 'steps': 1571, 'loss/train': 3.7344889640808105} -09/20/2021 19:56:00 - INFO - __main__ - Step 25147: {'lr': 0.0001998628978291181, 'samples': 804704, 'steps': 1571, 'loss/train': 3.200549840927124} -09/20/2021 19:56:01 - INFO - __main__ - Step 25148: {'lr': 0.0001998628978291181, 'samples': 804736, 'steps': 1571, 'loss/train': 2.1879289150238037} -09/20/2021 19:56:01 - INFO - __main__ - Step 25149: {'lr': 0.0001998628978291181, 'samples': 804768, 'steps': 1571, 'loss/train': 2.792156219482422} -09/20/2021 19:56:02 - INFO - __main__ - Step 25150: {'lr': 0.0001998628978291181, 'samples': 804800, 'steps': 1571, 'loss/train': 3.568211555480957} -09/20/2021 19:56:03 - INFO - __main__ - Step 25151: {'lr': 0.0001998628978291181, 'samples': 804832, 'steps': 1571, 'loss/train': 2.933718204498291} -09/20/2021 19:56:04 - INFO - __main__ - Step 25152: {'lr': 0.0001998628978291181, 'samples': 804864, 'steps': 1571, 'loss/train': 3.053861141204834} -09/20/2021 19:56:04 - INFO - __main__ - Step 25153: {'lr': 0.00019986256371404992, 'samples': 804896, 'steps': 1572, 'loss/train': 3.3206746578216553} -09/20/2021 19:56:05 - INFO - __main__ - Step 25154: {'lr': 0.00019986256371404992, 'samples': 804928, 'steps': 1572, 'loss/train': 3.0769453048706055} -09/20/2021 19:56:06 - INFO - __main__ - Step 25155: {'lr': 0.00019986256371404992, 'samples': 804960, 'steps': 1572, 'loss/train': 2.093019962310791} -09/20/2021 19:56:07 - INFO - __main__ - Step 25156: {'lr': 0.00019986256371404992, 'samples': 804992, 'steps': 1572, 'loss/train': 3.986065626144409} -09/20/2021 19:56:07 - INFO - __main__ - Step 25157: {'lr': 0.00019986256371404992, 'samples': 805024, 'steps': 1572, 'loss/train': 2.800607919692993} -09/20/2021 19:56:08 - INFO - __main__ - Step 25158: {'lr': 0.00019986256371404992, 'samples': 805056, 'steps': 1572, 'loss/train': 2.9941518306732178} -09/20/2021 19:56:09 - INFO - __main__ - Step 25159: {'lr': 0.00019986256371404992, 'samples': 805088, 'steps': 1572, 'loss/train': 1.0134755373001099} -09/20/2021 19:56:10 - INFO - __main__ - Step 25160: {'lr': 0.00019986256371404992, 'samples': 805120, 'steps': 1572, 'loss/train': 2.167487144470215} -09/20/2021 19:56:10 - INFO - __main__ - Step 25161: {'lr': 0.00019986256371404992, 'samples': 805152, 'steps': 1572, 'loss/train': 3.38606333732605} -09/20/2021 19:56:11 - INFO - __main__ - Step 25162: {'lr': 0.00019986256371404992, 'samples': 805184, 'steps': 1572, 'loss/train': 2.860635995864868} -09/20/2021 19:56:12 - INFO - __main__ - Step 25163: {'lr': 0.00019986256371404992, 'samples': 805216, 'steps': 1572, 'loss/train': 3.067423105239868} -09/20/2021 19:56:13 - INFO - __main__ - Step 25164: {'lr': 0.00019986256371404992, 'samples': 805248, 'steps': 1572, 'loss/train': 2.2715344429016113} -09/20/2021 19:56:13 - INFO - __main__ - Step 25165: {'lr': 0.00019986256371404992, 'samples': 805280, 'steps': 1572, 'loss/train': 3.6180973052978516} -09/20/2021 19:56:14 - INFO - __main__ - Step 25166: {'lr': 0.00019986256371404992, 'samples': 805312, 'steps': 1572, 'loss/train': 3.9251465797424316} -09/20/2021 19:56:15 - INFO - __main__ - Step 25167: {'lr': 0.00019986256371404992, 'samples': 805344, 'steps': 1572, 'loss/train': 2.8099350929260254} -09/20/2021 19:56:16 - INFO - __main__ - Step 25168: {'lr': 0.00019986256371404992, 'samples': 805376, 'steps': 1572, 'loss/train': 2.4364399909973145} -09/20/2021 19:56:17 - INFO - __main__ - Step 25169: {'lr': 0.00019986222919264132, 'samples': 805408, 'steps': 1573, 'loss/train': 2.8933072090148926} -09/20/2021 19:56:17 - INFO - __main__ - Step 25170: {'lr': 0.00019986222919264132, 'samples': 805440, 'steps': 1573, 'loss/train': 3.4060256481170654} -09/20/2021 19:56:18 - INFO - __main__ - Step 25171: {'lr': 0.00019986222919264132, 'samples': 805472, 'steps': 1573, 'loss/train': 3.079317092895508} -09/20/2021 19:56:19 - INFO - __main__ - Step 25172: {'lr': 0.00019986222919264132, 'samples': 805504, 'steps': 1573, 'loss/train': 4.126032829284668} -09/20/2021 19:56:20 - INFO - __main__ - Step 25173: {'lr': 0.00019986222919264132, 'samples': 805536, 'steps': 1573, 'loss/train': 3.0272960662841797} -09/20/2021 19:56:21 - INFO - __main__ - Step 25174: {'lr': 0.00019986222919264132, 'samples': 805568, 'steps': 1573, 'loss/train': 2.5440053939819336} -09/20/2021 19:56:22 - INFO - __main__ - Step 25175: {'lr': 0.00019986222919264132, 'samples': 805600, 'steps': 1573, 'loss/train': 3.1138336658477783} -09/20/2021 19:56:22 - INFO - __main__ - Step 25176: {'lr': 0.00019986222919264132, 'samples': 805632, 'steps': 1573, 'loss/train': 1.7309901714324951} -09/20/2021 19:56:23 - INFO - __main__ - Step 25177: {'lr': 0.00019986222919264132, 'samples': 805664, 'steps': 1573, 'loss/train': 2.987027883529663} -09/20/2021 19:56:24 - INFO - __main__ - Step 25178: {'lr': 0.00019986222919264132, 'samples': 805696, 'steps': 1573, 'loss/train': 2.7584452629089355} -09/20/2021 19:56:25 - INFO - __main__ - Step 25179: {'lr': 0.00019986222919264132, 'samples': 805728, 'steps': 1573, 'loss/train': 4.239578723907471} -09/20/2021 19:56:25 - INFO - __main__ - Step 25180: {'lr': 0.00019986222919264132, 'samples': 805760, 'steps': 1573, 'loss/train': 2.988503932952881} -09/20/2021 19:56:26 - INFO - __main__ - Step 25181: {'lr': 0.00019986222919264132, 'samples': 805792, 'steps': 1573, 'loss/train': 2.0045924186706543} -09/20/2021 19:56:27 - INFO - __main__ - Step 25182: {'lr': 0.00019986222919264132, 'samples': 805824, 'steps': 1573, 'loss/train': 2.695720672607422} -09/20/2021 19:56:28 - INFO - __main__ - Step 25183: {'lr': 0.00019986222919264132, 'samples': 805856, 'steps': 1573, 'loss/train': 2.2117292881011963} -09/20/2021 19:56:28 - INFO - __main__ - Step 25184: {'lr': 0.00019986222919264132, 'samples': 805888, 'steps': 1573, 'loss/train': 1.8610033988952637} -09/20/2021 19:56:29 - INFO - __main__ - Step 25185: {'lr': 0.00019986189426489373, 'samples': 805920, 'steps': 1574, 'loss/train': 1.7561259269714355} -09/20/2021 19:56:30 - INFO - __main__ - Step 25186: {'lr': 0.00019986189426489373, 'samples': 805952, 'steps': 1574, 'loss/train': 3.673661708831787} -09/20/2021 19:56:31 - INFO - __main__ - Step 25187: {'lr': 0.00019986189426489373, 'samples': 805984, 'steps': 1574, 'loss/train': 2.420659303665161} -09/20/2021 19:56:32 - INFO - __main__ - Step 25188: {'lr': 0.00019986189426489373, 'samples': 806016, 'steps': 1574, 'loss/train': 2.2191812992095947} -09/20/2021 19:56:32 - INFO - __main__ - Step 25189: {'lr': 0.00019986189426489373, 'samples': 806048, 'steps': 1574, 'loss/train': 2.483640193939209} -09/20/2021 19:56:33 - INFO - __main__ - Step 25190: {'lr': 0.00019986189426489373, 'samples': 806080, 'steps': 1574, 'loss/train': 3.5473854541778564} -09/20/2021 19:56:34 - INFO - __main__ - Step 25191: {'lr': 0.00019986189426489373, 'samples': 806112, 'steps': 1574, 'loss/train': 2.6742513179779053} -09/20/2021 19:56:35 - INFO - __main__ - Step 25192: {'lr': 0.00019986189426489373, 'samples': 806144, 'steps': 1574, 'loss/train': 2.7806506156921387} -09/20/2021 19:56:35 - INFO - __main__ - Step 25193: {'lr': 0.00019986189426489373, 'samples': 806176, 'steps': 1574, 'loss/train': 4.250051975250244} -09/20/2021 19:56:36 - INFO - __main__ - Step 25194: {'lr': 0.00019986189426489373, 'samples': 806208, 'steps': 1574, 'loss/train': 2.5895278453826904} -09/20/2021 19:56:37 - INFO - __main__ - Step 25195: {'lr': 0.00019986189426489373, 'samples': 806240, 'steps': 1574, 'loss/train': 3.1516242027282715} -09/20/2021 19:56:38 - INFO - __main__ - Step 25196: {'lr': 0.00019986189426489373, 'samples': 806272, 'steps': 1574, 'loss/train': 3.3165767192840576} -09/20/2021 19:56:38 - INFO - __main__ - Step 25197: {'lr': 0.00019986189426489373, 'samples': 806304, 'steps': 1574, 'loss/train': 2.9477155208587646} -09/20/2021 19:56:39 - INFO - __main__ - Step 25198: {'lr': 0.00019986189426489373, 'samples': 806336, 'steps': 1574, 'loss/train': 2.5151591300964355} -09/20/2021 19:56:40 - INFO - __main__ - Step 25199: {'lr': 0.00019986189426489373, 'samples': 806368, 'steps': 1574, 'loss/train': 3.0634925365448} -09/20/2021 19:56:41 - INFO - __main__ - Step 25200: {'lr': 0.00019986189426489373, 'samples': 806400, 'steps': 1574, 'loss/train': 3.738673448562622} -09/20/2021 19:56:41 - INFO - __main__ - Step 25201: {'lr': 0.00019986155893080845, 'samples': 806432, 'steps': 1575, 'loss/train': 3.6348750591278076} -09/20/2021 19:56:42 - INFO - __main__ - Step 25202: {'lr': 0.00019986155893080845, 'samples': 806464, 'steps': 1575, 'loss/train': 3.7137680053710938} -09/20/2021 19:56:43 - INFO - __main__ - Step 25203: {'lr': 0.00019986155893080845, 'samples': 806496, 'steps': 1575, 'loss/train': 3.1033992767333984} -09/20/2021 19:56:44 - INFO - __main__ - Step 25204: {'lr': 0.00019986155893080845, 'samples': 806528, 'steps': 1575, 'loss/train': 2.902336835861206} -09/20/2021 19:56:45 - INFO - __main__ - Step 25205: {'lr': 0.00019986155893080845, 'samples': 806560, 'steps': 1575, 'loss/train': 2.9702086448669434} -09/20/2021 19:56:46 - INFO - __main__ - Step 25206: {'lr': 0.00019986155893080845, 'samples': 806592, 'steps': 1575, 'loss/train': 2.9833285808563232} -09/20/2021 19:56:47 - INFO - __main__ - Step 25207: {'lr': 0.00019986155893080845, 'samples': 806624, 'steps': 1575, 'loss/train': 2.5981836318969727} -09/20/2021 19:56:47 - INFO - __main__ - Step 25208: {'lr': 0.00019986155893080845, 'samples': 806656, 'steps': 1575, 'loss/train': 3.1024317741394043} -09/20/2021 19:56:48 - INFO - __main__ - Step 25209: {'lr': 0.00019986155893080845, 'samples': 806688, 'steps': 1575, 'loss/train': 2.220510244369507} -09/20/2021 19:56:49 - INFO - __main__ - Step 25210: {'lr': 0.00019986155893080845, 'samples': 806720, 'steps': 1575, 'loss/train': 3.153618335723877} -09/20/2021 19:56:50 - INFO - __main__ - Step 25211: {'lr': 0.00019986155893080845, 'samples': 806752, 'steps': 1575, 'loss/train': 3.0623621940612793} -09/20/2021 19:56:50 - INFO - __main__ - Step 25212: {'lr': 0.00019986155893080845, 'samples': 806784, 'steps': 1575, 'loss/train': 3.087594985961914} -09/20/2021 19:56:51 - INFO - __main__ - Step 25213: {'lr': 0.00019986155893080845, 'samples': 806816, 'steps': 1575, 'loss/train': 2.8045947551727295} -09/20/2021 19:56:52 - INFO - __main__ - Step 25214: {'lr': 0.00019986155893080845, 'samples': 806848, 'steps': 1575, 'loss/train': 4.580746173858643} -09/20/2021 19:56:53 - INFO - __main__ - Step 25215: {'lr': 0.00019986155893080845, 'samples': 806880, 'steps': 1575, 'loss/train': 3.3535313606262207} -09/20/2021 19:56:53 - INFO - __main__ - Step 25216: {'lr': 0.00019986155893080845, 'samples': 806912, 'steps': 1575, 'loss/train': 1.8368208408355713} -09/20/2021 19:56:54 - INFO - __main__ - Step 25217: {'lr': 0.0001998612231903869, 'samples': 806944, 'steps': 1576, 'loss/train': 1.3814750909805298} -09/20/2021 19:56:55 - INFO - __main__ - Step 25218: {'lr': 0.0001998612231903869, 'samples': 806976, 'steps': 1576, 'loss/train': 1.4411424398422241} -09/20/2021 19:56:56 - INFO - __main__ - Step 25219: {'lr': 0.0001998612231903869, 'samples': 807008, 'steps': 1576, 'loss/train': 1.3426331281661987} -09/20/2021 19:56:56 - INFO - __main__ - Step 25220: {'lr': 0.0001998612231903869, 'samples': 807040, 'steps': 1576, 'loss/train': 2.6132001876831055} -09/20/2021 19:56:57 - INFO - __main__ - Step 25221: {'lr': 0.0001998612231903869, 'samples': 807072, 'steps': 1576, 'loss/train': 2.280519723892212} -09/20/2021 19:56:58 - INFO - __main__ - Step 25222: {'lr': 0.0001998612231903869, 'samples': 807104, 'steps': 1576, 'loss/train': 2.742335796356201} -09/20/2021 19:56:59 - INFO - __main__ - Step 25223: {'lr': 0.0001998612231903869, 'samples': 807136, 'steps': 1576, 'loss/train': 2.4768331050872803} -09/20/2021 19:56:59 - INFO - __main__ - Step 25224: {'lr': 0.0001998612231903869, 'samples': 807168, 'steps': 1576, 'loss/train': 0.9639564752578735} -09/20/2021 19:57:00 - INFO - __main__ - Step 25225: {'lr': 0.0001998612231903869, 'samples': 807200, 'steps': 1576, 'loss/train': 0.8498488068580627} -09/20/2021 19:57:01 - INFO - __main__ - Step 25226: {'lr': 0.0001998612231903869, 'samples': 807232, 'steps': 1576, 'loss/train': 1.2575263977050781} -09/20/2021 19:57:02 - INFO - __main__ - Step 25227: {'lr': 0.0001998612231903869, 'samples': 807264, 'steps': 1576, 'loss/train': 0.5885148048400879} -09/20/2021 19:57:02 - INFO - __main__ - Step 25228: {'lr': 0.0001998612231903869, 'samples': 807296, 'steps': 1576, 'loss/train': 2.4214773178100586} -09/20/2021 19:57:03 - INFO - __main__ - Step 25229: {'lr': 0.0001998612231903869, 'samples': 807328, 'steps': 1576, 'loss/train': 2.5749974250793457} -09/20/2021 19:57:04 - INFO - __main__ - Step 25230: {'lr': 0.0001998612231903869, 'samples': 807360, 'steps': 1576, 'loss/train': 2.9559807777404785} -09/20/2021 19:57:05 - INFO - __main__ - Step 25231: {'lr': 0.0001998612231903869, 'samples': 807392, 'steps': 1576, 'loss/train': 2.476306438446045} -09/20/2021 19:57:05 - INFO - __main__ - Step 25232: {'lr': 0.0001998612231903869, 'samples': 807424, 'steps': 1576, 'loss/train': 2.6706936359405518} -09/20/2021 19:57:06 - INFO - __main__ - Step 25233: {'lr': 0.0001998608870436304, 'samples': 807456, 'steps': 1577, 'loss/train': 2.632075548171997} -09/20/2021 19:57:07 - INFO - __main__ - Step 25234: {'lr': 0.0001998608870436304, 'samples': 807488, 'steps': 1577, 'loss/train': 2.8482820987701416} -09/20/2021 19:57:08 - INFO - __main__ - Step 25235: {'lr': 0.0001998608870436304, 'samples': 807520, 'steps': 1577, 'loss/train': 2.528877019882202} -09/20/2021 19:57:09 - INFO - __main__ - Step 25236: {'lr': 0.0001998608870436304, 'samples': 807552, 'steps': 1577, 'loss/train': 3.8106536865234375} -09/20/2021 19:57:10 - INFO - __main__ - Step 25237: {'lr': 0.0001998608870436304, 'samples': 807584, 'steps': 1577, 'loss/train': 3.7419466972351074} -09/20/2021 19:57:11 - INFO - __main__ - Step 25238: {'lr': 0.0001998608870436304, 'samples': 807616, 'steps': 1577, 'loss/train': 2.3395180702209473} -09/20/2021 19:57:12 - INFO - __main__ - Step 25239: {'lr': 0.0001998608870436304, 'samples': 807648, 'steps': 1577, 'loss/train': 2.438593626022339} -09/20/2021 19:57:12 - INFO - __main__ - Step 25240: {'lr': 0.0001998608870436304, 'samples': 807680, 'steps': 1577, 'loss/train': 3.2240962982177734} -09/20/2021 19:57:13 - INFO - __main__ - Step 25241: {'lr': 0.0001998608870436304, 'samples': 807712, 'steps': 1577, 'loss/train': 2.216487407684326} -09/20/2021 19:57:14 - INFO - __main__ - Step 25242: {'lr': 0.0001998608870436304, 'samples': 807744, 'steps': 1577, 'loss/train': 2.020376443862915} -09/20/2021 19:57:15 - INFO - __main__ - Step 25243: {'lr': 0.0001998608870436304, 'samples': 807776, 'steps': 1577, 'loss/train': 2.7834630012512207} -09/20/2021 19:57:15 - INFO - __main__ - Step 25244: {'lr': 0.0001998608870436304, 'samples': 807808, 'steps': 1577, 'loss/train': 3.000335454940796} -09/20/2021 19:57:16 - INFO - __main__ - Step 25245: {'lr': 0.0001998608870436304, 'samples': 807840, 'steps': 1577, 'loss/train': 3.4959464073181152} -09/20/2021 19:57:17 - INFO - __main__ - Step 25246: {'lr': 0.0001998608870436304, 'samples': 807872, 'steps': 1577, 'loss/train': 2.818143367767334} -09/20/2021 19:57:18 - INFO - __main__ - Step 25247: {'lr': 0.0001998608870436304, 'samples': 807904, 'steps': 1577, 'loss/train': 3.163421392440796} -09/20/2021 19:57:18 - INFO - __main__ - Step 25248: {'lr': 0.0001998608870436304, 'samples': 807936, 'steps': 1577, 'loss/train': 3.033660411834717} -09/20/2021 19:57:19 - INFO - __main__ - Step 25249: {'lr': 0.00019986055049054033, 'samples': 807968, 'steps': 1578, 'loss/train': 3.043140172958374} -09/20/2021 19:57:20 - INFO - __main__ - Step 25250: {'lr': 0.00019986055049054033, 'samples': 808000, 'steps': 1578, 'loss/train': 2.5873188972473145} -09/20/2021 19:57:21 - INFO - __main__ - Step 25251: {'lr': 0.00019986055049054033, 'samples': 808032, 'steps': 1578, 'loss/train': 2.6407546997070312} -09/20/2021 19:57:21 - INFO - __main__ - Step 25252: {'lr': 0.00019986055049054033, 'samples': 808064, 'steps': 1578, 'loss/train': 2.039707899093628} -09/20/2021 19:57:22 - INFO - __main__ - Step 25253: {'lr': 0.00019986055049054033, 'samples': 808096, 'steps': 1578, 'loss/train': 2.2538325786590576} -09/20/2021 19:57:23 - INFO - __main__ - Step 25254: {'lr': 0.00019986055049054033, 'samples': 808128, 'steps': 1578, 'loss/train': 2.010268211364746} -09/20/2021 19:57:24 - INFO - __main__ - Step 25255: {'lr': 0.00019986055049054033, 'samples': 808160, 'steps': 1578, 'loss/train': 1.674318790435791} -09/20/2021 19:57:24 - INFO - __main__ - Step 25256: {'lr': 0.00019986055049054033, 'samples': 808192, 'steps': 1578, 'loss/train': 2.6338143348693848} -09/20/2021 19:57:25 - INFO - __main__ - Step 25257: {'lr': 0.00019986055049054033, 'samples': 808224, 'steps': 1578, 'loss/train': 3.3889899253845215} -09/20/2021 19:57:26 - INFO - __main__ - Step 25258: {'lr': 0.00019986055049054033, 'samples': 808256, 'steps': 1578, 'loss/train': 3.584294080734253} -09/20/2021 19:57:27 - INFO - __main__ - Step 25259: {'lr': 0.00019986055049054033, 'samples': 808288, 'steps': 1578, 'loss/train': 3.1359193325042725} -09/20/2021 19:57:27 - INFO - __main__ - Step 25260: {'lr': 0.00019986055049054033, 'samples': 808320, 'steps': 1578, 'loss/train': 3.0387625694274902} -09/20/2021 19:57:28 - INFO - __main__ - Step 25261: {'lr': 0.00019986055049054033, 'samples': 808352, 'steps': 1578, 'loss/train': 2.1350486278533936} -09/20/2021 19:57:29 - INFO - __main__ - Step 25262: {'lr': 0.00019986055049054033, 'samples': 808384, 'steps': 1578, 'loss/train': 2.943568229675293} -09/20/2021 19:57:30 - INFO - __main__ - Step 25263: {'lr': 0.00019986055049054033, 'samples': 808416, 'steps': 1578, 'loss/train': 2.4675958156585693} -09/20/2021 19:57:30 - INFO - __main__ - Step 25264: {'lr': 0.00019986055049054033, 'samples': 808448, 'steps': 1578, 'loss/train': 2.8194077014923096} -09/20/2021 19:57:31 - INFO - __main__ - Step 25265: {'lr': 0.0001998602135311181, 'samples': 808480, 'steps': 1579, 'loss/train': 3.5470306873321533} -09/20/2021 19:57:32 - INFO - __main__ - Step 25266: {'lr': 0.0001998602135311181, 'samples': 808512, 'steps': 1579, 'loss/train': 2.7215304374694824} -09/20/2021 19:57:33 - INFO - __main__ - Step 25267: {'lr': 0.0001998602135311181, 'samples': 808544, 'steps': 1579, 'loss/train': 3.0851943492889404} -09/20/2021 19:57:34 - INFO - __main__ - Step 25268: {'lr': 0.0001998602135311181, 'samples': 808576, 'steps': 1579, 'loss/train': 2.3880412578582764} -09/20/2021 19:57:35 - INFO - __main__ - Step 25269: {'lr': 0.0001998602135311181, 'samples': 808608, 'steps': 1579, 'loss/train': 3.638550043106079} -09/20/2021 19:57:36 - INFO - __main__ - Step 25270: {'lr': 0.0001998602135311181, 'samples': 808640, 'steps': 1579, 'loss/train': 3.1445651054382324} -09/20/2021 19:57:36 - INFO - __main__ - Step 25271: {'lr': 0.0001998602135311181, 'samples': 808672, 'steps': 1579, 'loss/train': 3.305691957473755} -09/20/2021 19:57:37 - INFO - __main__ - Step 25272: {'lr': 0.0001998602135311181, 'samples': 808704, 'steps': 1579, 'loss/train': 2.7216315269470215} -09/20/2021 19:57:38 - INFO - __main__ - Step 25273: {'lr': 0.0001998602135311181, 'samples': 808736, 'steps': 1579, 'loss/train': 2.328294038772583} -09/20/2021 19:57:39 - INFO - __main__ - Step 25274: {'lr': 0.0001998602135311181, 'samples': 808768, 'steps': 1579, 'loss/train': 2.007683277130127} -09/20/2021 19:57:39 - INFO - __main__ - Step 25275: {'lr': 0.0001998602135311181, 'samples': 808800, 'steps': 1579, 'loss/train': 2.597904682159424} -09/20/2021 19:57:40 - INFO - __main__ - Step 25276: {'lr': 0.0001998602135311181, 'samples': 808832, 'steps': 1579, 'loss/train': 3.4039204120635986} -09/20/2021 19:57:41 - INFO - __main__ - Step 25277: {'lr': 0.0001998602135311181, 'samples': 808864, 'steps': 1579, 'loss/train': 1.6659939289093018} -09/20/2021 19:57:42 - INFO - __main__ - Step 25278: {'lr': 0.0001998602135311181, 'samples': 808896, 'steps': 1579, 'loss/train': 2.6220717430114746} -09/20/2021 19:57:42 - INFO - __main__ - Step 25279: {'lr': 0.0001998602135311181, 'samples': 808928, 'steps': 1579, 'loss/train': 2.779573678970337} -09/20/2021 19:57:43 - INFO - __main__ - Step 25280: {'lr': 0.0001998602135311181, 'samples': 808960, 'steps': 1579, 'loss/train': 2.759871244430542} -09/20/2021 19:57:44 - INFO - __main__ - Step 25281: {'lr': 0.00019985987616536504, 'samples': 808992, 'steps': 1580, 'loss/train': 2.2872676849365234} -09/20/2021 19:57:45 - INFO - __main__ - Step 25282: {'lr': 0.00019985987616536504, 'samples': 809024, 'steps': 1580, 'loss/train': 2.7368931770324707} -09/20/2021 19:57:46 - INFO - __main__ - Step 25283: {'lr': 0.00019985987616536504, 'samples': 809056, 'steps': 1580, 'loss/train': 3.453683376312256} -09/20/2021 19:57:46 - INFO - __main__ - Step 25284: {'lr': 0.00019985987616536504, 'samples': 809088, 'steps': 1580, 'loss/train': 3.6251585483551025} -09/20/2021 19:57:47 - INFO - __main__ - Step 25285: {'lr': 0.00019985987616536504, 'samples': 809120, 'steps': 1580, 'loss/train': 2.929633855819702} -09/20/2021 19:57:48 - INFO - __main__ - Step 25286: {'lr': 0.00019985987616536504, 'samples': 809152, 'steps': 1580, 'loss/train': 2.9572393894195557} -09/20/2021 19:57:49 - INFO - __main__ - Step 25287: {'lr': 0.00019985987616536504, 'samples': 809184, 'steps': 1580, 'loss/train': 2.890874147415161} -09/20/2021 19:57:49 - INFO - __main__ - Step 25288: {'lr': 0.00019985987616536504, 'samples': 809216, 'steps': 1580, 'loss/train': 3.0333938598632812} -09/20/2021 19:57:50 - INFO - __main__ - Step 25289: {'lr': 0.00019985987616536504, 'samples': 809248, 'steps': 1580, 'loss/train': 2.9829294681549072} -09/20/2021 19:57:51 - INFO - __main__ - Step 25290: {'lr': 0.00019985987616536504, 'samples': 809280, 'steps': 1580, 'loss/train': 2.901460886001587} -09/20/2021 19:57:52 - INFO - __main__ - Step 25291: {'lr': 0.00019985987616536504, 'samples': 809312, 'steps': 1580, 'loss/train': 2.5790793895721436} -09/20/2021 19:57:52 - INFO - __main__ - Step 25292: {'lr': 0.00019985987616536504, 'samples': 809344, 'steps': 1580, 'loss/train': 2.8094992637634277} -09/20/2021 19:57:53 - INFO - __main__ - Step 25293: {'lr': 0.00019985987616536504, 'samples': 809376, 'steps': 1580, 'loss/train': 3.777038812637329} -09/20/2021 19:57:54 - INFO - __main__ - Step 25294: {'lr': 0.00019985987616536504, 'samples': 809408, 'steps': 1580, 'loss/train': 4.143582344055176} -09/20/2021 19:57:55 - INFO - __main__ - Step 25295: {'lr': 0.00019985987616536504, 'samples': 809440, 'steps': 1580, 'loss/train': 1.9979281425476074} -09/20/2021 19:57:55 - INFO - __main__ - Step 25296: {'lr': 0.00019985987616536504, 'samples': 809472, 'steps': 1580, 'loss/train': 2.5774953365325928} -09/20/2021 19:57:56 - INFO - __main__ - Step 25297: {'lr': 0.0001998595383932825, 'samples': 809504, 'steps': 1581, 'loss/train': 2.406043529510498} -09/20/2021 19:57:57 - INFO - __main__ - Step 25298: {'lr': 0.0001998595383932825, 'samples': 809536, 'steps': 1581, 'loss/train': 2.3540737628936768} -09/20/2021 19:57:59 - INFO - __main__ - Step 25299: {'lr': 0.0001998595383932825, 'samples': 809568, 'steps': 1581, 'loss/train': 3.446382999420166} -09/20/2021 19:58:00 - INFO - __main__ - Step 25300: {'lr': 0.0001998595383932825, 'samples': 809600, 'steps': 1581, 'loss/train': 1.6242904663085938} -09/20/2021 19:58:00 - INFO - __main__ - Step 25301: {'lr': 0.0001998595383932825, 'samples': 809632, 'steps': 1581, 'loss/train': 3.7803471088409424} -09/20/2021 19:58:01 - INFO - __main__ - Step 25302: {'lr': 0.0001998595383932825, 'samples': 809664, 'steps': 1581, 'loss/train': 3.8823208808898926} -09/20/2021 19:58:02 - INFO - __main__ - Step 25303: {'lr': 0.0001998595383932825, 'samples': 809696, 'steps': 1581, 'loss/train': 3.129934549331665} -09/20/2021 19:58:03 - INFO - __main__ - Step 25304: {'lr': 0.0001998595383932825, 'samples': 809728, 'steps': 1581, 'loss/train': 3.0079293251037598} -09/20/2021 19:58:03 - INFO - __main__ - Step 25305: {'lr': 0.0001998595383932825, 'samples': 809760, 'steps': 1581, 'loss/train': 2.73508882522583} -09/20/2021 19:58:04 - INFO - __main__ - Step 25306: {'lr': 0.0001998595383932825, 'samples': 809792, 'steps': 1581, 'loss/train': 1.5424776077270508} -09/20/2021 19:58:05 - INFO - __main__ - Step 25307: {'lr': 0.0001998595383932825, 'samples': 809824, 'steps': 1581, 'loss/train': 1.9850949048995972} -09/20/2021 19:58:06 - INFO - __main__ - Step 25308: {'lr': 0.0001998595383932825, 'samples': 809856, 'steps': 1581, 'loss/train': 0.5613889098167419} -09/20/2021 19:58:06 - INFO - __main__ - Step 25309: {'lr': 0.0001998595383932825, 'samples': 809888, 'steps': 1581, 'loss/train': 0.4878210425376892} -09/20/2021 19:58:07 - INFO - __main__ - Step 25310: {'lr': 0.0001998595383932825, 'samples': 809920, 'steps': 1581, 'loss/train': 0.7710428833961487} -09/20/2021 19:58:08 - INFO - __main__ - Step 25311: {'lr': 0.0001998595383932825, 'samples': 809952, 'steps': 1581, 'loss/train': 0.6765267848968506} -09/20/2021 19:58:09 - INFO - __main__ - Step 25312: {'lr': 0.0001998595383932825, 'samples': 809984, 'steps': 1581, 'loss/train': 0.5629892349243164} -09/20/2021 19:58:10 - INFO - __main__ - Step 25313: {'lr': 0.00019985920021487193, 'samples': 810016, 'steps': 1582, 'loss/train': 2.208979606628418} -09/20/2021 19:58:10 - INFO - __main__ - Step 25314: {'lr': 0.00019985920021487193, 'samples': 810048, 'steps': 1582, 'loss/train': 3.305600881576538} -09/20/2021 19:58:11 - INFO - __main__ - Step 25315: {'lr': 0.00019985920021487193, 'samples': 810080, 'steps': 1582, 'loss/train': 1.2290040254592896} -09/20/2021 19:58:12 - INFO - __main__ - Step 25316: {'lr': 0.00019985920021487193, 'samples': 810112, 'steps': 1582, 'loss/train': 2.3186399936676025} -09/20/2021 19:58:13 - INFO - __main__ - Step 25317: {'lr': 0.00019985920021487193, 'samples': 810144, 'steps': 1582, 'loss/train': 3.0350377559661865} -09/20/2021 19:58:13 - INFO - __main__ - Step 25318: {'lr': 0.00019985920021487193, 'samples': 810176, 'steps': 1582, 'loss/train': 1.941361665725708} -09/20/2021 19:58:14 - INFO - __main__ - Step 25319: {'lr': 0.00019985920021487193, 'samples': 810208, 'steps': 1582, 'loss/train': 3.2065913677215576} -09/20/2021 19:58:15 - INFO - __main__ - Step 25320: {'lr': 0.00019985920021487193, 'samples': 810240, 'steps': 1582, 'loss/train': 3.032092571258545} -09/20/2021 19:58:16 - INFO - __main__ - Step 25321: {'lr': 0.00019985920021487193, 'samples': 810272, 'steps': 1582, 'loss/train': 2.3881969451904297} -09/20/2021 19:58:16 - INFO - __main__ - Step 25322: {'lr': 0.00019985920021487193, 'samples': 810304, 'steps': 1582, 'loss/train': 2.306396007537842} -09/20/2021 19:58:17 - INFO - __main__ - Step 25323: {'lr': 0.00019985920021487193, 'samples': 810336, 'steps': 1582, 'loss/train': 3.387744426727295} -09/20/2021 19:58:18 - INFO - __main__ - Step 25324: {'lr': 0.00019985920021487193, 'samples': 810368, 'steps': 1582, 'loss/train': 3.128998279571533} -09/20/2021 19:58:19 - INFO - __main__ - Step 25325: {'lr': 0.00019985920021487193, 'samples': 810400, 'steps': 1582, 'loss/train': 2.6505773067474365} -09/20/2021 19:58:19 - INFO - __main__ - Step 25326: {'lr': 0.00019985920021487193, 'samples': 810432, 'steps': 1582, 'loss/train': 2.7139158248901367} -09/20/2021 19:58:20 - INFO - __main__ - Step 25327: {'lr': 0.00019985920021487193, 'samples': 810464, 'steps': 1582, 'loss/train': 3.744969129562378} -09/20/2021 19:58:21 - INFO - __main__ - Step 25328: {'lr': 0.00019985920021487193, 'samples': 810496, 'steps': 1582, 'loss/train': 2.5971364974975586} -09/20/2021 19:58:22 - INFO - __main__ - Step 25329: {'lr': 0.00019985886163013464, 'samples': 810528, 'steps': 1583, 'loss/train': 3.3500454425811768} -09/20/2021 19:58:22 - INFO - __main__ - Step 25330: {'lr': 0.00019985886163013464, 'samples': 810560, 'steps': 1583, 'loss/train': 2.785827159881592} -09/20/2021 19:58:24 - INFO - __main__ - Step 25331: {'lr': 0.00019985886163013464, 'samples': 810592, 'steps': 1583, 'loss/train': 0.6838266849517822} -09/20/2021 19:58:25 - INFO - __main__ - Step 25332: {'lr': 0.00019985886163013464, 'samples': 810624, 'steps': 1583, 'loss/train': 2.7499489784240723} -09/20/2021 19:58:26 - INFO - __main__ - Step 25333: {'lr': 0.00019985886163013464, 'samples': 810656, 'steps': 1583, 'loss/train': 2.5646989345550537} -09/20/2021 19:58:27 - INFO - __main__ - Step 25334: {'lr': 0.00019985886163013464, 'samples': 810688, 'steps': 1583, 'loss/train': 3.4345734119415283} -09/20/2021 19:58:27 - INFO - __main__ - Step 25335: {'lr': 0.00019985886163013464, 'samples': 810720, 'steps': 1583, 'loss/train': 2.50488018989563} -09/20/2021 19:58:28 - INFO - __main__ - Step 25336: {'lr': 0.00019985886163013464, 'samples': 810752, 'steps': 1583, 'loss/train': 1.855257272720337} -09/20/2021 19:58:29 - INFO - __main__ - Step 25337: {'lr': 0.00019985886163013464, 'samples': 810784, 'steps': 1583, 'loss/train': 3.210322141647339} -09/20/2021 19:58:30 - INFO - __main__ - Step 25338: {'lr': 0.00019985886163013464, 'samples': 810816, 'steps': 1583, 'loss/train': 2.53410005569458} -09/20/2021 19:58:30 - INFO - __main__ - Step 25339: {'lr': 0.00019985886163013464, 'samples': 810848, 'steps': 1583, 'loss/train': 2.9589977264404297} -09/20/2021 19:58:31 - INFO - __main__ - Step 25340: {'lr': 0.00019985886163013464, 'samples': 810880, 'steps': 1583, 'loss/train': 2.19038987159729} -09/20/2021 19:58:32 - INFO - __main__ - Step 25341: {'lr': 0.00019985886163013464, 'samples': 810912, 'steps': 1583, 'loss/train': 2.4743704795837402} -09/20/2021 19:58:33 - INFO - __main__ - Step 25342: {'lr': 0.00019985886163013464, 'samples': 810944, 'steps': 1583, 'loss/train': 0.6929826736450195} -09/20/2021 19:58:33 - INFO - __main__ - Step 25343: {'lr': 0.00019985886163013464, 'samples': 810976, 'steps': 1583, 'loss/train': 2.5281479358673096} -09/20/2021 19:58:34 - INFO - __main__ - Step 25344: {'lr': 0.00019985886163013464, 'samples': 811008, 'steps': 1583, 'loss/train': 2.917609930038452} -09/20/2021 19:58:35 - INFO - __main__ - Step 25345: {'lr': 0.00019985852263907204, 'samples': 811040, 'steps': 1584, 'loss/train': 1.7757560014724731} -09/20/2021 19:58:36 - INFO - __main__ - Step 25346: {'lr': 0.00019985852263907204, 'samples': 811072, 'steps': 1584, 'loss/train': 2.0978853702545166} -09/20/2021 19:58:36 - INFO - __main__ - Step 25347: {'lr': 0.00019985852263907204, 'samples': 811104, 'steps': 1584, 'loss/train': 4.19593620300293} -09/20/2021 19:58:37 - INFO - __main__ - Step 25348: {'lr': 0.00019985852263907204, 'samples': 811136, 'steps': 1584, 'loss/train': 4.25046968460083} -09/20/2021 19:58:38 - INFO - __main__ - Step 25349: {'lr': 0.00019985852263907204, 'samples': 811168, 'steps': 1584, 'loss/train': 4.222963333129883} -09/20/2021 19:58:39 - INFO - __main__ - Step 25350: {'lr': 0.00019985852263907204, 'samples': 811200, 'steps': 1584, 'loss/train': 4.089319229125977} -09/20/2021 19:58:39 - INFO - __main__ - Step 25351: {'lr': 0.00019985852263907204, 'samples': 811232, 'steps': 1584, 'loss/train': 4.164083480834961} -09/20/2021 19:58:40 - INFO - __main__ - Step 25352: {'lr': 0.00019985852263907204, 'samples': 811264, 'steps': 1584, 'loss/train': 4.2305521965026855} -09/20/2021 19:58:41 - INFO - __main__ - Step 25353: {'lr': 0.00019985852263907204, 'samples': 811296, 'steps': 1584, 'loss/train': 4.150024890899658} -09/20/2021 19:58:42 - INFO - __main__ - Step 25354: {'lr': 0.00019985852263907204, 'samples': 811328, 'steps': 1584, 'loss/train': 4.235428810119629} -09/20/2021 19:58:42 - INFO - __main__ - Step 25355: {'lr': 0.00019985852263907204, 'samples': 811360, 'steps': 1584, 'loss/train': 4.251521587371826} -09/20/2021 19:58:43 - INFO - __main__ - Step 25356: {'lr': 0.00019985852263907204, 'samples': 811392, 'steps': 1584, 'loss/train': 4.074374198913574} -09/20/2021 19:58:44 - INFO - __main__ - Step 25357: {'lr': 0.00019985852263907204, 'samples': 811424, 'steps': 1584, 'loss/train': 2.700467586517334} -09/20/2021 19:58:45 - INFO - __main__ - Step 25358: {'lr': 0.00019985852263907204, 'samples': 811456, 'steps': 1584, 'loss/train': 2.0043463706970215} -09/20/2021 19:58:45 - INFO - __main__ - Step 25359: {'lr': 0.00019985852263907204, 'samples': 811488, 'steps': 1584, 'loss/train': 3.0866408348083496} -09/20/2021 19:58:46 - INFO - __main__ - Step 25360: {'lr': 0.00019985852263907204, 'samples': 811520, 'steps': 1584, 'loss/train': 2.552964925765991} -09/20/2021 19:58:47 - INFO - __main__ - Step 25361: {'lr': 0.0001998581832416855, 'samples': 811552, 'steps': 1585, 'loss/train': 2.478736162185669} -09/20/2021 19:58:48 - INFO - __main__ - Step 25362: {'lr': 0.0001998581832416855, 'samples': 811584, 'steps': 1585, 'loss/train': 3.2555782794952393} -09/20/2021 19:58:49 - INFO - __main__ - Step 25363: {'lr': 0.0001998581832416855, 'samples': 811616, 'steps': 1585, 'loss/train': 2.548229455947876} -09/20/2021 19:58:49 - INFO - __main__ - Step 25364: {'lr': 0.0001998581832416855, 'samples': 811648, 'steps': 1585, 'loss/train': 3.0849616527557373} -09/20/2021 19:58:52 - INFO - __main__ - Step 25365: {'lr': 0.0001998581832416855, 'samples': 811680, 'steps': 1585, 'loss/train': 2.490682363510132} -09/20/2021 19:58:52 - INFO - __main__ - Step 25366: {'lr': 0.0001998581832416855, 'samples': 811712, 'steps': 1585, 'loss/train': 2.4917824268341064} -09/20/2021 19:58:53 - INFO - __main__ - Step 25367: {'lr': 0.0001998581832416855, 'samples': 811744, 'steps': 1585, 'loss/train': 2.685964822769165} -09/20/2021 19:58:54 - INFO - __main__ - Step 25368: {'lr': 0.0001998581832416855, 'samples': 811776, 'steps': 1585, 'loss/train': 2.7792882919311523} -09/20/2021 19:58:55 - INFO - __main__ - Step 25369: {'lr': 0.0001998581832416855, 'samples': 811808, 'steps': 1585, 'loss/train': 2.8411078453063965} -09/20/2021 19:58:55 - INFO - __main__ - Step 25370: {'lr': 0.0001998581832416855, 'samples': 811840, 'steps': 1585, 'loss/train': 2.405771255493164} -09/20/2021 19:58:56 - INFO - __main__ - Step 25371: {'lr': 0.0001998581832416855, 'samples': 811872, 'steps': 1585, 'loss/train': 2.5704870223999023} -09/20/2021 19:58:57 - INFO - __main__ - Step 25372: {'lr': 0.0001998581832416855, 'samples': 811904, 'steps': 1585, 'loss/train': 2.9885213375091553} -09/20/2021 19:58:58 - INFO - __main__ - Step 25373: {'lr': 0.0001998581832416855, 'samples': 811936, 'steps': 1585, 'loss/train': 3.3477284908294678} -09/20/2021 19:58:58 - INFO - __main__ - Step 25374: {'lr': 0.0001998581832416855, 'samples': 811968, 'steps': 1585, 'loss/train': 1.4192525148391724} -09/20/2021 19:58:59 - INFO - __main__ - Step 25375: {'lr': 0.0001998581832416855, 'samples': 812000, 'steps': 1585, 'loss/train': 2.744912624359131} -09/20/2021 19:59:00 - INFO - __main__ - Step 25376: {'lr': 0.0001998581832416855, 'samples': 812032, 'steps': 1585, 'loss/train': 2.089627981185913} -09/20/2021 19:59:01 - INFO - __main__ - Step 25377: {'lr': 0.00019985784343797634, 'samples': 812064, 'steps': 1586, 'loss/train': 2.5498745441436768} -09/20/2021 19:59:01 - INFO - __main__ - Step 25378: {'lr': 0.00019985784343797634, 'samples': 812096, 'steps': 1586, 'loss/train': 2.6082043647766113} -09/20/2021 19:59:02 - INFO - __main__ - Step 25379: {'lr': 0.00019985784343797634, 'samples': 812128, 'steps': 1586, 'loss/train': 2.968745708465576} -09/20/2021 19:59:03 - INFO - __main__ - Step 25380: {'lr': 0.00019985784343797634, 'samples': 812160, 'steps': 1586, 'loss/train': 2.085113286972046} -09/20/2021 19:59:04 - INFO - __main__ - Step 25381: {'lr': 0.00019985784343797634, 'samples': 812192, 'steps': 1586, 'loss/train': 3.4334218502044678} -09/20/2021 19:59:04 - INFO - __main__ - Step 25382: {'lr': 0.00019985784343797634, 'samples': 812224, 'steps': 1586, 'loss/train': 2.078376531600952} -09/20/2021 19:59:05 - INFO - __main__ - Step 25383: {'lr': 0.00019985784343797634, 'samples': 812256, 'steps': 1586, 'loss/train': 2.2694902420043945} -09/20/2021 19:59:06 - INFO - __main__ - Step 25384: {'lr': 0.00019985784343797634, 'samples': 812288, 'steps': 1586, 'loss/train': 1.6764944791793823} -09/20/2021 19:59:07 - INFO - __main__ - Step 25385: {'lr': 0.00019985784343797634, 'samples': 812320, 'steps': 1586, 'loss/train': 1.684393286705017} -09/20/2021 19:59:07 - INFO - __main__ - Step 25386: {'lr': 0.00019985784343797634, 'samples': 812352, 'steps': 1586, 'loss/train': 1.8555525541305542} -09/20/2021 19:59:08 - INFO - __main__ - Step 25387: {'lr': 0.00019985784343797634, 'samples': 812384, 'steps': 1586, 'loss/train': 1.9360724687576294} -09/20/2021 19:59:09 - INFO - __main__ - Step 25388: {'lr': 0.00019985784343797634, 'samples': 812416, 'steps': 1586, 'loss/train': 2.025380849838257} -09/20/2021 19:59:10 - INFO - __main__ - Step 25389: {'lr': 0.00019985784343797634, 'samples': 812448, 'steps': 1586, 'loss/train': 1.648918867111206} -09/20/2021 19:59:10 - INFO - __main__ - Step 25390: {'lr': 0.00019985784343797634, 'samples': 812480, 'steps': 1586, 'loss/train': 1.964730978012085} -09/20/2021 19:59:11 - INFO - __main__ - Step 25391: {'lr': 0.00019985784343797634, 'samples': 812512, 'steps': 1586, 'loss/train': 1.9353411197662354} -09/20/2021 19:59:12 - INFO - __main__ - Step 25392: {'lr': 0.00019985784343797634, 'samples': 812544, 'steps': 1586, 'loss/train': 2.02767014503479} -09/20/2021 19:59:13 - INFO - __main__ - Step 25393: {'lr': 0.00019985750322794608, 'samples': 812576, 'steps': 1587, 'loss/train': 2.640509843826294} -09/20/2021 19:59:14 - INFO - __main__ - Step 25394: {'lr': 0.00019985750322794608, 'samples': 812608, 'steps': 1587, 'loss/train': 2.7803280353546143} -09/20/2021 19:59:14 - INFO - __main__ - Step 25395: {'lr': 0.00019985750322794608, 'samples': 812640, 'steps': 1587, 'loss/train': 1.3266968727111816} -09/20/2021 19:59:15 - INFO - __main__ - Step 25396: {'lr': 0.00019985750322794608, 'samples': 812672, 'steps': 1587, 'loss/train': 1.5738459825515747} -09/20/2021 19:59:16 - INFO - __main__ - Step 25397: {'lr': 0.00019985750322794608, 'samples': 812704, 'steps': 1587, 'loss/train': 1.4593310356140137} -09/20/2021 19:59:17 - INFO - __main__ - Step 25398: {'lr': 0.00019985750322794608, 'samples': 812736, 'steps': 1587, 'loss/train': 1.595521092414856} -09/20/2021 19:59:17 - INFO - __main__ - Step 25399: {'lr': 0.00019985750322794608, 'samples': 812768, 'steps': 1587, 'loss/train': 2.4477298259735107} -09/20/2021 19:59:18 - INFO - __main__ - Step 25400: {'lr': 0.00019985750322794608, 'samples': 812800, 'steps': 1587, 'loss/train': 3.4104576110839844} -09/20/2021 19:59:19 - INFO - __main__ - Step 25401: {'lr': 0.00019985750322794608, 'samples': 812832, 'steps': 1587, 'loss/train': 2.7466793060302734} -09/20/2021 19:59:20 - INFO - __main__ - Step 25402: {'lr': 0.00019985750322794608, 'samples': 812864, 'steps': 1587, 'loss/train': 4.595304489135742} -09/20/2021 19:59:21 - INFO - __main__ - Step 25403: {'lr': 0.00019985750322794608, 'samples': 812896, 'steps': 1587, 'loss/train': 3.614612102508545} -09/20/2021 19:59:22 - INFO - __main__ - Step 25404: {'lr': 0.00019985750322794608, 'samples': 812928, 'steps': 1587, 'loss/train': 1.761605978012085} -09/20/2021 19:59:22 - INFO - __main__ - Step 25405: {'lr': 0.00019985750322794608, 'samples': 812960, 'steps': 1587, 'loss/train': 3.577333927154541} -09/20/2021 19:59:23 - INFO - __main__ - Step 25406: {'lr': 0.00019985750322794608, 'samples': 812992, 'steps': 1587, 'loss/train': 1.8986279964447021} -09/20/2021 19:59:24 - INFO - __main__ - Step 25407: {'lr': 0.00019985750322794608, 'samples': 813024, 'steps': 1587, 'loss/train': 2.3117101192474365} -09/20/2021 19:59:25 - INFO - __main__ - Step 25408: {'lr': 0.00019985750322794608, 'samples': 813056, 'steps': 1587, 'loss/train': 2.7740931510925293} -09/20/2021 19:59:26 - INFO - __main__ - Step 25409: {'lr': 0.000199857162611596, 'samples': 813088, 'steps': 1588, 'loss/train': 2.949603319168091} -09/20/2021 19:59:26 - INFO - __main__ - Step 25410: {'lr': 0.000199857162611596, 'samples': 813120, 'steps': 1588, 'loss/train': 3.67153000831604} -09/20/2021 19:59:27 - INFO - __main__ - Step 25411: {'lr': 0.000199857162611596, 'samples': 813152, 'steps': 1588, 'loss/train': 3.018700122833252} -09/20/2021 19:59:28 - INFO - __main__ - Step 25412: {'lr': 0.000199857162611596, 'samples': 813184, 'steps': 1588, 'loss/train': 3.4242825508117676} -09/20/2021 19:59:29 - INFO - __main__ - Step 25413: {'lr': 0.000199857162611596, 'samples': 813216, 'steps': 1588, 'loss/train': 3.1070635318756104} -09/20/2021 19:59:29 - INFO - __main__ - Step 25414: {'lr': 0.000199857162611596, 'samples': 813248, 'steps': 1588, 'loss/train': 2.9057836532592773} -09/20/2021 19:59:30 - INFO - __main__ - Step 25415: {'lr': 0.000199857162611596, 'samples': 813280, 'steps': 1588, 'loss/train': 3.207507610321045} -09/20/2021 19:59:31 - INFO - __main__ - Step 25416: {'lr': 0.000199857162611596, 'samples': 813312, 'steps': 1588, 'loss/train': 3.3619954586029053} -09/20/2021 19:59:32 - INFO - __main__ - Step 25417: {'lr': 0.000199857162611596, 'samples': 813344, 'steps': 1588, 'loss/train': 0.8770571351051331} -09/20/2021 19:59:32 - INFO - __main__ - Step 25418: {'lr': 0.000199857162611596, 'samples': 813376, 'steps': 1588, 'loss/train': 2.3605434894561768} -09/20/2021 19:59:33 - INFO - __main__ - Step 25419: {'lr': 0.000199857162611596, 'samples': 813408, 'steps': 1588, 'loss/train': 2.689836025238037} -09/20/2021 19:59:34 - INFO - __main__ - Step 25420: {'lr': 0.000199857162611596, 'samples': 813440, 'steps': 1588, 'loss/train': 3.3620717525482178} -09/20/2021 19:59:35 - INFO - __main__ - Step 25421: {'lr': 0.000199857162611596, 'samples': 813472, 'steps': 1588, 'loss/train': 3.3324778079986572} -09/20/2021 19:59:35 - INFO - __main__ - Step 25422: {'lr': 0.000199857162611596, 'samples': 813504, 'steps': 1588, 'loss/train': 2.3968453407287598} -09/20/2021 19:59:36 - INFO - __main__ - Step 25423: {'lr': 0.000199857162611596, 'samples': 813536, 'steps': 1588, 'loss/train': 3.4810845851898193} -09/20/2021 19:59:37 - INFO - __main__ - Step 25424: {'lr': 0.000199857162611596, 'samples': 813568, 'steps': 1588, 'loss/train': 3.35534405708313} -09/20/2021 19:59:38 - INFO - __main__ - Step 25425: {'lr': 0.00019985682158892753, 'samples': 813600, 'steps': 1589, 'loss/train': 3.214057445526123} -09/20/2021 19:59:38 - INFO - __main__ - Step 25426: {'lr': 0.00019985682158892753, 'samples': 813632, 'steps': 1589, 'loss/train': 2.3274006843566895} -09/20/2021 19:59:39 - INFO - __main__ - Step 25427: {'lr': 0.00019985682158892753, 'samples': 813664, 'steps': 1589, 'loss/train': 3.463310480117798} -09/20/2021 19:59:40 - INFO - __main__ - Step 25428: {'lr': 0.00019985682158892753, 'samples': 813696, 'steps': 1589, 'loss/train': 4.261758804321289} -09/20/2021 19:59:41 - INFO - __main__ - Step 25429: {'lr': 0.00019985682158892753, 'samples': 813728, 'steps': 1589, 'loss/train': 2.3444395065307617} -09/20/2021 19:59:41 - INFO - __main__ - Step 25430: {'lr': 0.00019985682158892753, 'samples': 813760, 'steps': 1589, 'loss/train': 2.8298981189727783} -09/20/2021 19:59:42 - INFO - __main__ - Step 25431: {'lr': 0.00019985682158892753, 'samples': 813792, 'steps': 1589, 'loss/train': 2.946443796157837} -09/20/2021 19:59:43 - INFO - __main__ - Step 25432: {'lr': 0.00019985682158892753, 'samples': 813824, 'steps': 1589, 'loss/train': 3.0589466094970703} -09/20/2021 19:59:44 - INFO - __main__ - Step 25433: {'lr': 0.00019985682158892753, 'samples': 813856, 'steps': 1589, 'loss/train': 0.427140474319458} -09/20/2021 19:59:45 - INFO - __main__ - Step 25434: {'lr': 0.00019985682158892753, 'samples': 813888, 'steps': 1589, 'loss/train': 0.8655059933662415} -09/20/2021 19:59:46 - INFO - __main__ - Step 25435: {'lr': 0.00019985682158892753, 'samples': 813920, 'steps': 1589, 'loss/train': 3.087273359298706} -09/20/2021 19:59:46 - INFO - __main__ - Step 25436: {'lr': 0.00019985682158892753, 'samples': 813952, 'steps': 1589, 'loss/train': 2.446803569793701} -09/20/2021 19:59:47 - INFO - __main__ - Step 25437: {'lr': 0.00019985682158892753, 'samples': 813984, 'steps': 1589, 'loss/train': 3.5020806789398193} -09/20/2021 19:59:48 - INFO - __main__ - Step 25438: {'lr': 0.00019985682158892753, 'samples': 814016, 'steps': 1589, 'loss/train': 3.0451016426086426} -09/20/2021 19:59:49 - INFO - __main__ - Step 25439: {'lr': 0.00019985682158892753, 'samples': 814048, 'steps': 1589, 'loss/train': 1.0453280210494995} -09/20/2021 19:59:49 - INFO - __main__ - Step 25440: {'lr': 0.00019985682158892753, 'samples': 814080, 'steps': 1589, 'loss/train': 2.077720880508423} -09/20/2021 19:59:50 - INFO - __main__ - Step 25441: {'lr': 0.00019985648015994202, 'samples': 814112, 'steps': 1590, 'loss/train': 2.3224143981933594} -09/20/2021 19:59:51 - INFO - __main__ - Step 25442: {'lr': 0.00019985648015994202, 'samples': 814144, 'steps': 1590, 'loss/train': 3.039478302001953} -09/20/2021 19:59:52 - INFO - __main__ - Step 25443: {'lr': 0.00019985648015994202, 'samples': 814176, 'steps': 1590, 'loss/train': 2.4471805095672607} -09/20/2021 19:59:53 - INFO - __main__ - Step 25444: {'lr': 0.00019985648015994202, 'samples': 814208, 'steps': 1590, 'loss/train': 3.2141644954681396} -09/20/2021 19:59:53 - INFO - __main__ - Step 25445: {'lr': 0.00019985648015994202, 'samples': 814240, 'steps': 1590, 'loss/train': 3.0098001956939697} -09/20/2021 19:59:54 - INFO - __main__ - Step 25446: {'lr': 0.00019985648015994202, 'samples': 814272, 'steps': 1590, 'loss/train': 3.1169300079345703} -09/20/2021 19:59:55 - INFO - __main__ - Step 25447: {'lr': 0.00019985648015994202, 'samples': 814304, 'steps': 1590, 'loss/train': 2.2142298221588135} -09/20/2021 19:59:56 - INFO - __main__ - Step 25448: {'lr': 0.00019985648015994202, 'samples': 814336, 'steps': 1590, 'loss/train': 2.7812838554382324} -09/20/2021 19:59:56 - INFO - __main__ - Step 25449: {'lr': 0.00019985648015994202, 'samples': 814368, 'steps': 1590, 'loss/train': 3.4123618602752686} -09/20/2021 19:59:57 - INFO - __main__ - Step 25450: {'lr': 0.00019985648015994202, 'samples': 814400, 'steps': 1590, 'loss/train': 3.32427716255188} -09/20/2021 19:59:58 - INFO - __main__ - Step 25451: {'lr': 0.00019985648015994202, 'samples': 814432, 'steps': 1590, 'loss/train': 2.0880541801452637} -09/20/2021 19:59:59 - INFO - __main__ - Step 25452: {'lr': 0.00019985648015994202, 'samples': 814464, 'steps': 1590, 'loss/train': 2.7881851196289062} -09/20/2021 19:59:59 - INFO - __main__ - Step 25453: {'lr': 0.00019985648015994202, 'samples': 814496, 'steps': 1590, 'loss/train': 0.657593309879303} -09/20/2021 20:00:00 - INFO - __main__ - Step 25454: {'lr': 0.00019985648015994202, 'samples': 814528, 'steps': 1590, 'loss/train': 3.1766176223754883} -09/20/2021 20:00:01 - INFO - __main__ - Step 25455: {'lr': 0.00019985648015994202, 'samples': 814560, 'steps': 1590, 'loss/train': 3.461141586303711} -09/20/2021 20:00:02 - INFO - __main__ - Step 25456: {'lr': 0.00019985648015994202, 'samples': 814592, 'steps': 1590, 'loss/train': 2.20780873298645} -09/20/2021 20:00:02 - INFO - __main__ - Step 25457: {'lr': 0.00019985613832464085, 'samples': 814624, 'steps': 1591, 'loss/train': 3.1757442951202393} -09/20/2021 20:00:03 - INFO - __main__ - Step 25458: {'lr': 0.00019985613832464085, 'samples': 814656, 'steps': 1591, 'loss/train': 2.9149892330169678} -09/20/2021 20:00:04 - INFO - __main__ - Step 25459: {'lr': 0.00019985613832464085, 'samples': 814688, 'steps': 1591, 'loss/train': 2.0267815589904785} -09/20/2021 20:00:05 - INFO - __main__ - Step 25460: {'lr': 0.00019985613832464085, 'samples': 814720, 'steps': 1591, 'loss/train': 3.063608169555664} -09/20/2021 20:00:05 - INFO - __main__ - Step 25461: {'lr': 0.00019985613832464085, 'samples': 814752, 'steps': 1591, 'loss/train': 3.421921730041504} -09/20/2021 20:00:06 - INFO - __main__ - Step 25462: {'lr': 0.00019985613832464085, 'samples': 814784, 'steps': 1591, 'loss/train': 3.231127977371216} -09/20/2021 20:00:07 - INFO - __main__ - Step 25463: {'lr': 0.00019985613832464085, 'samples': 814816, 'steps': 1591, 'loss/train': 2.423426628112793} -09/20/2021 20:00:08 - INFO - __main__ - Step 25464: {'lr': 0.00019985613832464085, 'samples': 814848, 'steps': 1591, 'loss/train': 3.1593198776245117} -09/20/2021 20:00:09 - INFO - __main__ - Step 25465: {'lr': 0.00019985613832464085, 'samples': 814880, 'steps': 1591, 'loss/train': 2.7472403049468994} -09/20/2021 20:00:10 - INFO - __main__ - Step 25466: {'lr': 0.00019985613832464085, 'samples': 814912, 'steps': 1591, 'loss/train': 1.8415409326553345} -09/20/2021 20:00:11 - INFO - __main__ - Step 25467: {'lr': 0.00019985613832464085, 'samples': 814944, 'steps': 1591, 'loss/train': 3.369762897491455} -09/20/2021 20:00:11 - INFO - __main__ - Step 25468: {'lr': 0.00019985613832464085, 'samples': 814976, 'steps': 1591, 'loss/train': 3.1264374256134033} -09/20/2021 20:00:12 - INFO - __main__ - Step 25469: {'lr': 0.00019985613832464085, 'samples': 815008, 'steps': 1591, 'loss/train': 1.7756186723709106} -09/20/2021 20:00:13 - INFO - __main__ - Step 25470: {'lr': 0.00019985613832464085, 'samples': 815040, 'steps': 1591, 'loss/train': 0.8336571455001831} -09/20/2021 20:00:14 - INFO - __main__ - Step 25471: {'lr': 0.00019985613832464085, 'samples': 815072, 'steps': 1591, 'loss/train': 2.8984415531158447} -09/20/2021 20:00:14 - INFO - __main__ - Step 25472: {'lr': 0.00019985613832464085, 'samples': 815104, 'steps': 1591, 'loss/train': 1.9211848974227905} -09/20/2021 20:00:15 - INFO - __main__ - Step 25473: {'lr': 0.00019985579608302549, 'samples': 815136, 'steps': 1592, 'loss/train': 3.4055371284484863} -09/20/2021 20:00:16 - INFO - __main__ - Step 25474: {'lr': 0.00019985579608302549, 'samples': 815168, 'steps': 1592, 'loss/train': 2.4980337619781494} -09/20/2021 20:00:17 - INFO - __main__ - Step 25475: {'lr': 0.00019985579608302549, 'samples': 815200, 'steps': 1592, 'loss/train': 2.739185333251953} -09/20/2021 20:00:18 - INFO - __main__ - Step 25476: {'lr': 0.00019985579608302549, 'samples': 815232, 'steps': 1592, 'loss/train': 2.8406286239624023} -09/20/2021 20:00:18 - INFO - __main__ - Step 25477: {'lr': 0.00019985579608302549, 'samples': 815264, 'steps': 1592, 'loss/train': 3.792654275894165} -09/20/2021 20:00:19 - INFO - __main__ - Step 25478: {'lr': 0.00019985579608302549, 'samples': 815296, 'steps': 1592, 'loss/train': 0.6653518676757812} -09/20/2021 20:00:20 - INFO - __main__ - Step 25479: {'lr': 0.00019985579608302549, 'samples': 815328, 'steps': 1592, 'loss/train': 0.4555234909057617} -09/20/2021 20:00:21 - INFO - __main__ - Step 25480: {'lr': 0.00019985579608302549, 'samples': 815360, 'steps': 1592, 'loss/train': 0.7910136580467224} -09/20/2021 20:00:21 - INFO - __main__ - Step 25481: {'lr': 0.00019985579608302549, 'samples': 815392, 'steps': 1592, 'loss/train': 0.4598802626132965} -09/20/2021 20:00:22 - INFO - __main__ - Step 25482: {'lr': 0.00019985579608302549, 'samples': 815424, 'steps': 1592, 'loss/train': 2.234982490539551} -09/20/2021 20:00:23 - INFO - __main__ - Step 25483: {'lr': 0.00019985579608302549, 'samples': 815456, 'steps': 1592, 'loss/train': 2.791616916656494} -09/20/2021 20:00:24 - INFO - __main__ - Step 25484: {'lr': 0.00019985579608302549, 'samples': 815488, 'steps': 1592, 'loss/train': 1.8881957530975342} -09/20/2021 20:00:24 - INFO - __main__ - Step 25485: {'lr': 0.00019985579608302549, 'samples': 815520, 'steps': 1592, 'loss/train': 2.5472757816314697} -09/20/2021 20:00:25 - INFO - __main__ - Step 25486: {'lr': 0.00019985579608302549, 'samples': 815552, 'steps': 1592, 'loss/train': 3.14289927482605} -09/20/2021 20:00:26 - INFO - __main__ - Step 25487: {'lr': 0.00019985579608302549, 'samples': 815584, 'steps': 1592, 'loss/train': 2.877923011779785} -09/20/2021 20:00:27 - INFO - __main__ - Step 25488: {'lr': 0.00019985579608302549, 'samples': 815616, 'steps': 1592, 'loss/train': 2.7071940898895264} -09/20/2021 20:00:27 - INFO - __main__ - Step 25489: {'lr': 0.00019985545343509728, 'samples': 815648, 'steps': 1593, 'loss/train': 2.9538989067077637} -09/20/2021 20:00:28 - INFO - __main__ - Step 25490: {'lr': 0.00019985545343509728, 'samples': 815680, 'steps': 1593, 'loss/train': 1.6370303630828857} -09/20/2021 20:00:29 - INFO - __main__ - Step 25491: {'lr': 0.00019985545343509728, 'samples': 815712, 'steps': 1593, 'loss/train': 4.146655559539795} -09/20/2021 20:00:30 - INFO - __main__ - Step 25492: {'lr': 0.00019985545343509728, 'samples': 815744, 'steps': 1593, 'loss/train': 2.335883617401123} -09/20/2021 20:00:30 - INFO - __main__ - Step 25493: {'lr': 0.00019985545343509728, 'samples': 815776, 'steps': 1593, 'loss/train': 2.4231975078582764} -09/20/2021 20:00:31 - INFO - __main__ - Step 25494: {'lr': 0.00019985545343509728, 'samples': 815808, 'steps': 1593, 'loss/train': 2.629523992538452} -09/20/2021 20:00:32 - INFO - __main__ - Step 25495: {'lr': 0.00019985545343509728, 'samples': 815840, 'steps': 1593, 'loss/train': 2.733812093734741} -09/20/2021 20:00:33 - INFO - __main__ - Step 25496: {'lr': 0.00019985545343509728, 'samples': 815872, 'steps': 1593, 'loss/train': 1.6244643926620483} -09/20/2021 20:00:33 - INFO - __main__ - Step 25497: {'lr': 0.00019985545343509728, 'samples': 815904, 'steps': 1593, 'loss/train': 3.7853586673736572} -09/20/2021 20:00:35 - INFO - __main__ - Step 25498: {'lr': 0.00019985545343509728, 'samples': 815936, 'steps': 1593, 'loss/train': 2.4166643619537354} -09/20/2021 20:00:35 - INFO - __main__ - Step 25499: {'lr': 0.00019985545343509728, 'samples': 815968, 'steps': 1593, 'loss/train': 3.577051877975464} -09/20/2021 20:00:36 - INFO - __main__ - Step 25500: {'lr': 0.00019985545343509728, 'samples': 816000, 'steps': 1593, 'loss/train': 3.3833909034729004} -09/20/2021 20:00:37 - INFO - __main__ - Step 25501: {'lr': 0.00019985545343509728, 'samples': 816032, 'steps': 1593, 'loss/train': 2.2550246715545654} -09/20/2021 20:00:38 - INFO - __main__ - Step 25502: {'lr': 0.00019985545343509728, 'samples': 816064, 'steps': 1593, 'loss/train': 2.8925676345825195} -09/20/2021 20:00:38 - INFO - __main__ - Step 25503: {'lr': 0.00019985545343509728, 'samples': 816096, 'steps': 1593, 'loss/train': 2.59993577003479} -09/20/2021 20:00:39 - INFO - __main__ - Step 25504: {'lr': 0.00019985545343509728, 'samples': 816128, 'steps': 1593, 'loss/train': 2.3737757205963135} -09/20/2021 20:00:40 - INFO - __main__ - Step 25505: {'lr': 0.00019985511038085762, 'samples': 816160, 'steps': 1594, 'loss/train': 2.964451313018799} -09/20/2021 20:00:41 - INFO - __main__ - Step 25506: {'lr': 0.00019985511038085762, 'samples': 816192, 'steps': 1594, 'loss/train': 2.874530553817749} -09/20/2021 20:00:42 - INFO - __main__ - Step 25507: {'lr': 0.00019985511038085762, 'samples': 816224, 'steps': 1594, 'loss/train': 2.720536470413208} -09/20/2021 20:00:42 - INFO - __main__ - Step 25508: {'lr': 0.00019985511038085762, 'samples': 816256, 'steps': 1594, 'loss/train': 2.0123908519744873} -09/20/2021 20:00:43 - INFO - __main__ - Step 25509: {'lr': 0.00019985511038085762, 'samples': 816288, 'steps': 1594, 'loss/train': 3.201951742172241} -09/20/2021 20:00:44 - INFO - __main__ - Step 25510: {'lr': 0.00019985511038085762, 'samples': 816320, 'steps': 1594, 'loss/train': 2.0141022205352783} -09/20/2021 20:00:45 - INFO - __main__ - Step 25511: {'lr': 0.00019985511038085762, 'samples': 816352, 'steps': 1594, 'loss/train': 3.018871545791626} -09/20/2021 20:00:45 - INFO - __main__ - Step 25512: {'lr': 0.00019985511038085762, 'samples': 816384, 'steps': 1594, 'loss/train': 2.9277420043945312} -09/20/2021 20:00:46 - INFO - __main__ - Step 25513: {'lr': 0.00019985511038085762, 'samples': 816416, 'steps': 1594, 'loss/train': 2.8741872310638428} -09/20/2021 20:00:47 - INFO - __main__ - Step 25514: {'lr': 0.00019985511038085762, 'samples': 816448, 'steps': 1594, 'loss/train': 2.4776766300201416} -09/20/2021 20:00:48 - INFO - __main__ - Step 25515: {'lr': 0.00019985511038085762, 'samples': 816480, 'steps': 1594, 'loss/train': 2.7893059253692627} -09/20/2021 20:00:48 - INFO - __main__ - Step 25516: {'lr': 0.00019985511038085762, 'samples': 816512, 'steps': 1594, 'loss/train': 3.2216684818267822} -09/20/2021 20:00:49 - INFO - __main__ - Step 25517: {'lr': 0.00019985511038085762, 'samples': 816544, 'steps': 1594, 'loss/train': 2.372049331665039} -09/20/2021 20:00:50 - INFO - __main__ - Step 25518: {'lr': 0.00019985511038085762, 'samples': 816576, 'steps': 1594, 'loss/train': 3.300377368927002} -09/20/2021 20:00:51 - INFO - __main__ - Step 25519: {'lr': 0.00019985511038085762, 'samples': 816608, 'steps': 1594, 'loss/train': 2.806358575820923} -09/20/2021 20:00:51 - INFO - __main__ - Step 25520: {'lr': 0.00019985511038085762, 'samples': 816640, 'steps': 1594, 'loss/train': 2.187222480773926} -09/20/2021 20:00:52 - INFO - __main__ - Step 25521: {'lr': 0.00019985476692030787, 'samples': 816672, 'steps': 1595, 'loss/train': 2.736079692840576} -09/20/2021 20:00:53 - INFO - __main__ - Step 25522: {'lr': 0.00019985476692030787, 'samples': 816704, 'steps': 1595, 'loss/train': 2.3320977687835693} -09/20/2021 20:00:54 - INFO - __main__ - Step 25523: {'lr': 0.00019985476692030787, 'samples': 816736, 'steps': 1595, 'loss/train': 2.8801658153533936} -09/20/2021 20:00:54 - INFO - __main__ - Step 25524: {'lr': 0.00019985476692030787, 'samples': 816768, 'steps': 1595, 'loss/train': 2.246596336364746} -09/20/2021 20:00:55 - INFO - __main__ - Step 25525: {'lr': 0.00019985476692030787, 'samples': 816800, 'steps': 1595, 'loss/train': 3.0048000812530518} -09/20/2021 20:00:56 - INFO - __main__ - Step 25526: {'lr': 0.00019985476692030787, 'samples': 816832, 'steps': 1595, 'loss/train': 3.9429802894592285} -09/20/2021 20:00:57 - INFO - __main__ - Step 25527: {'lr': 0.00019985476692030787, 'samples': 816864, 'steps': 1595, 'loss/train': 3.231384038925171} -09/20/2021 20:00:58 - INFO - __main__ - Step 25528: {'lr': 0.00019985476692030787, 'samples': 816896, 'steps': 1595, 'loss/train': 3.010622501373291} -09/20/2021 20:00:59 - INFO - __main__ - Step 25529: {'lr': 0.00019985476692030787, 'samples': 816928, 'steps': 1595, 'loss/train': 1.1252539157867432} -09/20/2021 20:00:59 - INFO - __main__ - Step 25530: {'lr': 0.00019985476692030787, 'samples': 816960, 'steps': 1595, 'loss/train': 3.2943739891052246} -09/20/2021 20:01:00 - INFO - __main__ - Step 25531: {'lr': 0.00019985476692030787, 'samples': 816992, 'steps': 1595, 'loss/train': 2.908560037612915} -09/20/2021 20:01:01 - INFO - __main__ - Step 25532: {'lr': 0.00019985476692030787, 'samples': 817024, 'steps': 1595, 'loss/train': 2.762401580810547} -09/20/2021 20:01:02 - INFO - __main__ - Step 25533: {'lr': 0.00019985476692030787, 'samples': 817056, 'steps': 1595, 'loss/train': 2.860370635986328} -09/20/2021 20:01:02 - INFO - __main__ - Step 25534: {'lr': 0.00019985476692030787, 'samples': 817088, 'steps': 1595, 'loss/train': 2.320125102996826} -09/20/2021 20:01:03 - INFO - __main__ - Step 25535: {'lr': 0.00019985476692030787, 'samples': 817120, 'steps': 1595, 'loss/train': 3.3670003414154053} -09/20/2021 20:01:04 - INFO - __main__ - Step 25536: {'lr': 0.00019985476692030787, 'samples': 817152, 'steps': 1595, 'loss/train': 3.312081813812256} -09/20/2021 20:01:05 - INFO - __main__ - Step 25537: {'lr': 0.00019985442305344946, 'samples': 817184, 'steps': 1596, 'loss/train': 1.990599274635315} -09/20/2021 20:01:06 - INFO - __main__ - Step 25538: {'lr': 0.00019985442305344946, 'samples': 817216, 'steps': 1596, 'loss/train': 2.809455394744873} -09/20/2021 20:01:06 - INFO - __main__ - Step 25539: {'lr': 0.00019985442305344946, 'samples': 817248, 'steps': 1596, 'loss/train': 1.6881552934646606} -09/20/2021 20:01:07 - INFO - __main__ - Step 25540: {'lr': 0.00019985442305344946, 'samples': 817280, 'steps': 1596, 'loss/train': 1.7695194482803345} -09/20/2021 20:01:08 - INFO - __main__ - Step 25541: {'lr': 0.00019985442305344946, 'samples': 817312, 'steps': 1596, 'loss/train': 3.291243553161621} -09/20/2021 20:01:09 - INFO - __main__ - Step 25542: {'lr': 0.00019985442305344946, 'samples': 817344, 'steps': 1596, 'loss/train': 1.9766918420791626} -09/20/2021 20:01:09 - INFO - __main__ - Step 25543: {'lr': 0.00019985442305344946, 'samples': 817376, 'steps': 1596, 'loss/train': 1.4329655170440674} -09/20/2021 20:01:10 - INFO - __main__ - Step 25544: {'lr': 0.00019985442305344946, 'samples': 817408, 'steps': 1596, 'loss/train': 0.7470241785049438} -09/20/2021 20:01:11 - INFO - __main__ - Step 25545: {'lr': 0.00019985442305344946, 'samples': 817440, 'steps': 1596, 'loss/train': 2.656830072402954} -09/20/2021 20:01:12 - INFO - __main__ - Step 25546: {'lr': 0.00019985442305344946, 'samples': 817472, 'steps': 1596, 'loss/train': 2.5269742012023926} -09/20/2021 20:01:12 - INFO - __main__ - Step 25547: {'lr': 0.00019985442305344946, 'samples': 817504, 'steps': 1596, 'loss/train': 2.7465591430664062} -09/20/2021 20:01:13 - INFO - __main__ - Step 25548: {'lr': 0.00019985442305344946, 'samples': 817536, 'steps': 1596, 'loss/train': 3.662374973297119} -09/20/2021 20:01:14 - INFO - __main__ - Step 25549: {'lr': 0.00019985442305344946, 'samples': 817568, 'steps': 1596, 'loss/train': 2.948031425476074} -09/20/2021 20:01:15 - INFO - __main__ - Step 25550: {'lr': 0.00019985442305344946, 'samples': 817600, 'steps': 1596, 'loss/train': 2.97577166557312} -09/20/2021 20:01:15 - INFO - __main__ - Step 25551: {'lr': 0.00019985442305344946, 'samples': 817632, 'steps': 1596, 'loss/train': 2.5693607330322266} -09/20/2021 20:01:16 - INFO - __main__ - Step 25552: {'lr': 0.00019985442305344946, 'samples': 817664, 'steps': 1596, 'loss/train': 4.065329074859619} -09/20/2021 20:01:17 - INFO - __main__ - Step 25553: {'lr': 0.00019985407878028382, 'samples': 817696, 'steps': 1597, 'loss/train': 2.6619858741760254} -09/20/2021 20:01:18 - INFO - __main__ - Step 25554: {'lr': 0.00019985407878028382, 'samples': 817728, 'steps': 1597, 'loss/train': 0.4311097264289856} -09/20/2021 20:01:19 - INFO - __main__ - Step 25555: {'lr': 0.00019985407878028382, 'samples': 817760, 'steps': 1597, 'loss/train': 0.8128039836883545} -09/20/2021 20:01:19 - INFO - __main__ - Step 25556: {'lr': 0.00019985407878028382, 'samples': 817792, 'steps': 1597, 'loss/train': 2.883885622024536} -09/20/2021 20:01:20 - INFO - __main__ - Step 25557: {'lr': 0.00019985407878028382, 'samples': 817824, 'steps': 1597, 'loss/train': 2.610400438308716} -09/20/2021 20:01:21 - INFO - __main__ - Step 25558: {'lr': 0.00019985407878028382, 'samples': 817856, 'steps': 1597, 'loss/train': 3.6427366733551025} -09/20/2021 20:01:22 - INFO - __main__ - Step 25559: {'lr': 0.00019985407878028382, 'samples': 817888, 'steps': 1597, 'loss/train': 4.2692952156066895} -09/20/2021 20:01:23 - INFO - __main__ - Step 25560: {'lr': 0.00019985407878028382, 'samples': 817920, 'steps': 1597, 'loss/train': 2.0178751945495605} -09/20/2021 20:01:24 - INFO - __main__ - Step 25561: {'lr': 0.00019985407878028382, 'samples': 817952, 'steps': 1597, 'loss/train': 2.7248690128326416} -09/20/2021 20:01:24 - INFO - __main__ - Step 25562: {'lr': 0.00019985407878028382, 'samples': 817984, 'steps': 1597, 'loss/train': 3.196666955947876} -09/20/2021 20:01:25 - INFO - __main__ - Step 25563: {'lr': 0.00019985407878028382, 'samples': 818016, 'steps': 1597, 'loss/train': 3.4203553199768066} -09/20/2021 20:01:26 - INFO - __main__ - Step 25564: {'lr': 0.00019985407878028382, 'samples': 818048, 'steps': 1597, 'loss/train': 2.875454902648926} -09/20/2021 20:01:27 - INFO - __main__ - Step 25565: {'lr': 0.00019985407878028382, 'samples': 818080, 'steps': 1597, 'loss/train': 1.2756810188293457} -09/20/2021 20:01:27 - INFO - __main__ - Step 25566: {'lr': 0.00019985407878028382, 'samples': 818112, 'steps': 1597, 'loss/train': 2.784248113632202} -09/20/2021 20:01:28 - INFO - __main__ - Step 25567: {'lr': 0.00019985407878028382, 'samples': 818144, 'steps': 1597, 'loss/train': 0.8755086064338684} -09/20/2021 20:01:29 - INFO - __main__ - Step 25568: {'lr': 0.00019985407878028382, 'samples': 818176, 'steps': 1597, 'loss/train': 0.4614057242870331} -09/20/2021 20:01:30 - INFO - __main__ - Step 25569: {'lr': 0.00019985373410081228, 'samples': 818208, 'steps': 1598, 'loss/train': 0.31857702136039734} -09/20/2021 20:01:31 - INFO - __main__ - Step 25570: {'lr': 0.00019985373410081228, 'samples': 818240, 'steps': 1598, 'loss/train': 0.666133463382721} -09/20/2021 20:01:31 - INFO - __main__ - Step 25571: {'lr': 0.00019985373410081228, 'samples': 818272, 'steps': 1598, 'loss/train': 2.5644447803497314} -09/20/2021 20:01:32 - INFO - __main__ - Step 25572: {'lr': 0.00019985373410081228, 'samples': 818304, 'steps': 1598, 'loss/train': 1.3516507148742676} -09/20/2021 20:01:33 - INFO - __main__ - Step 25573: {'lr': 0.00019985373410081228, 'samples': 818336, 'steps': 1598, 'loss/train': 1.6849589347839355} -09/20/2021 20:01:34 - INFO - __main__ - Step 25574: {'lr': 0.00019985373410081228, 'samples': 818368, 'steps': 1598, 'loss/train': 1.474232792854309} -09/20/2021 20:01:34 - INFO - __main__ - Step 25575: {'lr': 0.00019985373410081228, 'samples': 818400, 'steps': 1598, 'loss/train': 2.248262405395508} -09/20/2021 20:01:35 - INFO - __main__ - Step 25576: {'lr': 0.00019985373410081228, 'samples': 818432, 'steps': 1598, 'loss/train': 2.3080036640167236} -09/20/2021 20:01:36 - INFO - __main__ - Step 25577: {'lr': 0.00019985373410081228, 'samples': 818464, 'steps': 1598, 'loss/train': 2.7633516788482666} -09/20/2021 20:01:37 - INFO - __main__ - Step 25578: {'lr': 0.00019985373410081228, 'samples': 818496, 'steps': 1598, 'loss/train': 2.8564441204071045} -09/20/2021 20:01:37 - INFO - __main__ - Step 25579: {'lr': 0.00019985373410081228, 'samples': 818528, 'steps': 1598, 'loss/train': 2.615574359893799} -09/20/2021 20:01:38 - INFO - __main__ - Step 25580: {'lr': 0.00019985373410081228, 'samples': 818560, 'steps': 1598, 'loss/train': 3.366048574447632} -09/20/2021 20:01:39 - INFO - __main__ - Step 25581: {'lr': 0.00019985373410081228, 'samples': 818592, 'steps': 1598, 'loss/train': 2.711829423904419} -09/20/2021 20:01:40 - INFO - __main__ - Step 25582: {'lr': 0.00019985373410081228, 'samples': 818624, 'steps': 1598, 'loss/train': 3.639784574508667} -09/20/2021 20:01:40 - INFO - __main__ - Step 25583: {'lr': 0.00019985373410081228, 'samples': 818656, 'steps': 1598, 'loss/train': 2.7602357864379883} -09/20/2021 20:01:41 - INFO - __main__ - Step 25584: {'lr': 0.00019985373410081228, 'samples': 818688, 'steps': 1598, 'loss/train': 2.873746633529663} -09/20/2021 20:01:42 - INFO - __main__ - Step 25585: {'lr': 0.00019985338901503633, 'samples': 818720, 'steps': 1599, 'loss/train': 3.532200574874878} -09/20/2021 20:01:43 - INFO - __main__ - Step 25586: {'lr': 0.00019985338901503633, 'samples': 818752, 'steps': 1599, 'loss/train': 2.714311361312866} -09/20/2021 20:01:43 - INFO - __main__ - Step 25587: {'lr': 0.00019985338901503633, 'samples': 818784, 'steps': 1599, 'loss/train': 2.547269582748413} -09/20/2021 20:01:44 - INFO - __main__ - Step 25588: {'lr': 0.00019985338901503633, 'samples': 818816, 'steps': 1599, 'loss/train': 2.9221177101135254} -09/20/2021 20:01:45 - INFO - __main__ - Step 25589: {'lr': 0.00019985338901503633, 'samples': 818848, 'steps': 1599, 'loss/train': 2.226003408432007} -09/20/2021 20:01:46 - INFO - __main__ - Step 25590: {'lr': 0.00019985338901503633, 'samples': 818880, 'steps': 1599, 'loss/train': 3.357191324234009} -09/20/2021 20:01:46 - INFO - __main__ - Step 25591: {'lr': 0.00019985338901503633, 'samples': 818912, 'steps': 1599, 'loss/train': 3.356971263885498} -09/20/2021 20:01:48 - INFO - __main__ - Step 25592: {'lr': 0.00019985338901503633, 'samples': 818944, 'steps': 1599, 'loss/train': 3.031526803970337} -09/20/2021 20:01:49 - INFO - __main__ - Step 25593: {'lr': 0.00019985338901503633, 'samples': 818976, 'steps': 1599, 'loss/train': 2.9286930561065674} -09/20/2021 20:01:49 - INFO - __main__ - Step 25594: {'lr': 0.00019985338901503633, 'samples': 819008, 'steps': 1599, 'loss/train': 3.595580577850342} -09/20/2021 20:01:50 - INFO - __main__ - Step 25595: {'lr': 0.00019985338901503633, 'samples': 819040, 'steps': 1599, 'loss/train': 2.43182110786438} -09/20/2021 20:01:51 - INFO - __main__ - Step 25596: {'lr': 0.00019985338901503633, 'samples': 819072, 'steps': 1599, 'loss/train': 2.2064261436462402} -09/20/2021 20:01:52 - INFO - __main__ - Step 25597: {'lr': 0.00019985338901503633, 'samples': 819104, 'steps': 1599, 'loss/train': 2.5415594577789307} -09/20/2021 20:01:52 - INFO - __main__ - Step 25598: {'lr': 0.00019985338901503633, 'samples': 819136, 'steps': 1599, 'loss/train': 3.2292816638946533} -09/20/2021 20:01:53 - INFO - __main__ - Step 25599: {'lr': 0.00019985338901503633, 'samples': 819168, 'steps': 1599, 'loss/train': 2.1851742267608643} -09/20/2021 20:01:54 - INFO - __main__ - Step 25600: {'lr': 0.00019985338901503633, 'samples': 819200, 'steps': 1599, 'loss/train': 1.8088781833648682} -09/20/2021 20:01:55 - INFO - __main__ - Step 25601: {'lr': 0.00019985304352295732, 'samples': 819232, 'steps': 1600, 'loss/train': 3.0234479904174805} -09/20/2021 20:01:55 - INFO - __main__ - Step 25602: {'lr': 0.00019985304352295732, 'samples': 819264, 'steps': 1600, 'loss/train': 2.2369236946105957} -09/20/2021 20:01:56 - INFO - __main__ - Step 25603: {'lr': 0.00019985304352295732, 'samples': 819296, 'steps': 1600, 'loss/train': 0.34267401695251465} -09/20/2021 20:01:57 - INFO - __main__ - Step 25604: {'lr': 0.00019985304352295732, 'samples': 819328, 'steps': 1600, 'loss/train': 0.34328633546829224} -09/20/2021 20:01:58 - INFO - __main__ - Step 25605: {'lr': 0.00019985304352295732, 'samples': 819360, 'steps': 1600, 'loss/train': 0.8169059157371521} -09/20/2021 20:01:58 - INFO - __main__ - Step 25606: {'lr': 0.00019985304352295732, 'samples': 819392, 'steps': 1600, 'loss/train': 3.116657257080078} -09/20/2021 20:01:59 - INFO - __main__ - Step 25607: {'lr': 0.00019985304352295732, 'samples': 819424, 'steps': 1600, 'loss/train': 3.56455135345459} -09/20/2021 20:02:00 - INFO - __main__ - Step 25608: {'lr': 0.00019985304352295732, 'samples': 819456, 'steps': 1600, 'loss/train': 1.718264102935791} -09/20/2021 20:02:01 - INFO - __main__ - Step 25609: {'lr': 0.00019985304352295732, 'samples': 819488, 'steps': 1600, 'loss/train': 2.4177911281585693} -09/20/2021 20:02:01 - INFO - __main__ - Step 25610: {'lr': 0.00019985304352295732, 'samples': 819520, 'steps': 1600, 'loss/train': 2.9267048835754395} -09/20/2021 20:02:02 - INFO - __main__ - Step 25611: {'lr': 0.00019985304352295732, 'samples': 819552, 'steps': 1600, 'loss/train': 1.7961498498916626} -09/20/2021 20:02:03 - INFO - __main__ - Step 25612: {'lr': 0.00019985304352295732, 'samples': 819584, 'steps': 1600, 'loss/train': 3.821962594985962} -09/20/2021 20:02:04 - INFO - __main__ - Step 25613: {'lr': 0.00019985304352295732, 'samples': 819616, 'steps': 1600, 'loss/train': 3.515721559524536} -09/20/2021 20:02:04 - INFO - __main__ - Step 25614: {'lr': 0.00019985304352295732, 'samples': 819648, 'steps': 1600, 'loss/train': 3.1283373832702637} -09/20/2021 20:02:05 - INFO - __main__ - Step 25615: {'lr': 0.00019985304352295732, 'samples': 819680, 'steps': 1600, 'loss/train': 1.8143670558929443} -09/20/2021 20:02:06 - INFO - __main__ - Step 25616: {'lr': 0.00019985304352295732, 'samples': 819712, 'steps': 1600, 'loss/train': 3.055992603302002} -09/20/2021 20:02:07 - INFO - __main__ - Step 25617: {'lr': 0.00019985269762457666, 'samples': 819744, 'steps': 1601, 'loss/train': 2.9494946002960205} -09/20/2021 20:02:08 - INFO - __main__ - Step 25618: {'lr': 0.00019985269762457666, 'samples': 819776, 'steps': 1601, 'loss/train': 2.1678483486175537} -09/20/2021 20:02:08 - INFO - __main__ - Step 25619: {'lr': 0.00019985269762457666, 'samples': 819808, 'steps': 1601, 'loss/train': 3.2840044498443604} -09/20/2021 20:02:09 - INFO - __main__ - Step 25620: {'lr': 0.00019985269762457666, 'samples': 819840, 'steps': 1601, 'loss/train': 2.053493022918701} -09/20/2021 20:02:10 - INFO - __main__ - Step 25621: {'lr': 0.00019985269762457666, 'samples': 819872, 'steps': 1601, 'loss/train': 2.8533458709716797} -09/20/2021 20:02:11 - INFO - __main__ - Step 25622: {'lr': 0.00019985269762457666, 'samples': 819904, 'steps': 1601, 'loss/train': 2.4398012161254883} -09/20/2021 20:02:12 - INFO - __main__ - Step 25623: {'lr': 0.00019985269762457666, 'samples': 819936, 'steps': 1601, 'loss/train': 3.1432008743286133} -09/20/2021 20:02:13 - INFO - __main__ - Step 25624: {'lr': 0.00019985269762457666, 'samples': 819968, 'steps': 1601, 'loss/train': 4.2928314208984375} -09/20/2021 20:02:14 - INFO - __main__ - Step 25625: {'lr': 0.00019985269762457666, 'samples': 820000, 'steps': 1601, 'loss/train': 2.256718397140503} -09/20/2021 20:02:15 - INFO - __main__ - Step 25626: {'lr': 0.00019985269762457666, 'samples': 820032, 'steps': 1601, 'loss/train': 2.5760812759399414} -09/20/2021 20:02:15 - INFO - __main__ - Step 25627: {'lr': 0.00019985269762457666, 'samples': 820064, 'steps': 1601, 'loss/train': 2.887378692626953} -09/20/2021 20:02:16 - INFO - __main__ - Step 25628: {'lr': 0.00019985269762457666, 'samples': 820096, 'steps': 1601, 'loss/train': 3.415863513946533} -09/20/2021 20:02:17 - INFO - __main__ - Step 25629: {'lr': 0.00019985269762457666, 'samples': 820128, 'steps': 1601, 'loss/train': 2.8262298107147217} -09/20/2021 20:02:18 - INFO - __main__ - Step 25630: {'lr': 0.00019985269762457666, 'samples': 820160, 'steps': 1601, 'loss/train': 3.278768301010132} -09/20/2021 20:02:18 - INFO - __main__ - Step 25631: {'lr': 0.00019985269762457666, 'samples': 820192, 'steps': 1601, 'loss/train': 2.746591806411743} -09/20/2021 20:02:19 - INFO - __main__ - Step 25632: {'lr': 0.00019985269762457666, 'samples': 820224, 'steps': 1601, 'loss/train': 0.9786550998687744} -09/20/2021 20:02:20 - INFO - __main__ - Step 25633: {'lr': 0.00019985235131989577, 'samples': 820256, 'steps': 1602, 'loss/train': 2.6351535320281982} -09/20/2021 20:02:21 - INFO - __main__ - Step 25634: {'lr': 0.00019985235131989577, 'samples': 820288, 'steps': 1602, 'loss/train': 3.135006904602051} -09/20/2021 20:02:21 - INFO - __main__ - Step 25635: {'lr': 0.00019985235131989577, 'samples': 820320, 'steps': 1602, 'loss/train': 2.478588104248047} -09/20/2021 20:02:22 - INFO - __main__ - Step 25636: {'lr': 0.00019985235131989577, 'samples': 820352, 'steps': 1602, 'loss/train': 2.673966884613037} -09/20/2021 20:02:23 - INFO - __main__ - Step 25637: {'lr': 0.00019985235131989577, 'samples': 820384, 'steps': 1602, 'loss/train': 2.023905038833618} -09/20/2021 20:02:24 - INFO - __main__ - Step 25638: {'lr': 0.00019985235131989577, 'samples': 820416, 'steps': 1602, 'loss/train': 2.9589273929595947} -09/20/2021 20:02:24 - INFO - __main__ - Step 25639: {'lr': 0.00019985235131989577, 'samples': 820448, 'steps': 1602, 'loss/train': 2.4993433952331543} -09/20/2021 20:02:25 - INFO - __main__ - Step 25640: {'lr': 0.00019985235131989577, 'samples': 820480, 'steps': 1602, 'loss/train': 3.2020022869110107} -09/20/2021 20:02:26 - INFO - __main__ - Step 25641: {'lr': 0.00019985235131989577, 'samples': 820512, 'steps': 1602, 'loss/train': 2.7716052532196045} -09/20/2021 20:02:27 - INFO - __main__ - Step 25642: {'lr': 0.00019985235131989577, 'samples': 820544, 'steps': 1602, 'loss/train': 1.0881212949752808} -09/20/2021 20:02:27 - INFO - __main__ - Step 25643: {'lr': 0.00019985235131989577, 'samples': 820576, 'steps': 1602, 'loss/train': 3.5301103591918945} -09/20/2021 20:02:28 - INFO - __main__ - Step 25644: {'lr': 0.00019985235131989577, 'samples': 820608, 'steps': 1602, 'loss/train': 2.5672695636749268} -09/20/2021 20:02:29 - INFO - __main__ - Step 25645: {'lr': 0.00019985235131989577, 'samples': 820640, 'steps': 1602, 'loss/train': 3.442328929901123} -09/20/2021 20:02:30 - INFO - __main__ - Step 25646: {'lr': 0.00019985235131989577, 'samples': 820672, 'steps': 1602, 'loss/train': 2.2981724739074707} -09/20/2021 20:02:30 - INFO - __main__ - Step 25647: {'lr': 0.00019985235131989577, 'samples': 820704, 'steps': 1602, 'loss/train': 3.2771410942077637} -09/20/2021 20:02:31 - INFO - __main__ - Step 25648: {'lr': 0.00019985235131989577, 'samples': 820736, 'steps': 1602, 'loss/train': 3.1025280952453613} -09/20/2021 20:02:32 - INFO - __main__ - Step 25649: {'lr': 0.00019985200460891602, 'samples': 820768, 'steps': 1603, 'loss/train': 2.2082295417785645} -09/20/2021 20:02:33 - INFO - __main__ - Step 25650: {'lr': 0.00019985200460891602, 'samples': 820800, 'steps': 1603, 'loss/train': 2.72469162940979} -09/20/2021 20:02:34 - INFO - __main__ - Step 25651: {'lr': 0.00019985200460891602, 'samples': 820832, 'steps': 1603, 'loss/train': 1.8820058107376099} -09/20/2021 20:02:34 - INFO - __main__ - Step 25652: {'lr': 0.00019985200460891602, 'samples': 820864, 'steps': 1603, 'loss/train': 5.105242729187012} -09/20/2021 20:02:35 - INFO - __main__ - Step 25653: {'lr': 0.00019985200460891602, 'samples': 820896, 'steps': 1603, 'loss/train': 2.509678602218628} -09/20/2021 20:02:36 - INFO - __main__ - Step 25654: {'lr': 0.00019985200460891602, 'samples': 820928, 'steps': 1603, 'loss/train': 2.050513505935669} -09/20/2021 20:02:37 - INFO - __main__ - Step 25655: {'lr': 0.00019985200460891602, 'samples': 820960, 'steps': 1603, 'loss/train': 2.970820188522339} -09/20/2021 20:02:38 - INFO - __main__ - Step 25656: {'lr': 0.00019985200460891602, 'samples': 820992, 'steps': 1603, 'loss/train': 2.4266061782836914} -09/20/2021 20:02:39 - INFO - __main__ - Step 25657: {'lr': 0.00019985200460891602, 'samples': 821024, 'steps': 1603, 'loss/train': 1.913722276687622} -09/20/2021 20:02:39 - INFO - __main__ - Step 25658: {'lr': 0.00019985200460891602, 'samples': 821056, 'steps': 1603, 'loss/train': 1.7633049488067627} -09/20/2021 20:02:40 - INFO - __main__ - Step 25659: {'lr': 0.00019985200460891602, 'samples': 821088, 'steps': 1603, 'loss/train': 1.4666942358016968} -09/20/2021 20:02:41 - INFO - __main__ - Step 25660: {'lr': 0.00019985200460891602, 'samples': 821120, 'steps': 1603, 'loss/train': 2.9031922817230225} -09/20/2021 20:02:42 - INFO - __main__ - Step 25661: {'lr': 0.00019985200460891602, 'samples': 821152, 'steps': 1603, 'loss/train': 1.692861795425415} -09/20/2021 20:02:42 - INFO - __main__ - Step 25662: {'lr': 0.00019985200460891602, 'samples': 821184, 'steps': 1603, 'loss/train': 2.4444329738616943} -09/20/2021 20:02:43 - INFO - __main__ - Step 25663: {'lr': 0.00019985200460891602, 'samples': 821216, 'steps': 1603, 'loss/train': 2.349217176437378} -09/20/2021 20:02:44 - INFO - __main__ - Step 25664: {'lr': 0.00019985200460891602, 'samples': 821248, 'steps': 1603, 'loss/train': 3.723973512649536} -09/20/2021 20:02:45 - INFO - __main__ - Step 25665: {'lr': 0.00019985165749163887, 'samples': 821280, 'steps': 1604, 'loss/train': 2.3122568130493164} -09/20/2021 20:02:46 - INFO - __main__ - Step 25666: {'lr': 0.00019985165749163887, 'samples': 821312, 'steps': 1604, 'loss/train': 1.4740464687347412} -09/20/2021 20:02:46 - INFO - __main__ - Step 25667: {'lr': 0.00019985165749163887, 'samples': 821344, 'steps': 1604, 'loss/train': 2.53739857673645} -09/20/2021 20:02:47 - INFO - __main__ - Step 25668: {'lr': 0.00019985165749163887, 'samples': 821376, 'steps': 1604, 'loss/train': 2.6407408714294434} -09/20/2021 20:02:48 - INFO - __main__ - Step 25669: {'lr': 0.00019985165749163887, 'samples': 821408, 'steps': 1604, 'loss/train': 2.928884506225586} -09/20/2021 20:02:49 - INFO - __main__ - Step 25670: {'lr': 0.00019985165749163887, 'samples': 821440, 'steps': 1604, 'loss/train': 3.048412322998047} -09/20/2021 20:02:49 - INFO - __main__ - Step 25671: {'lr': 0.00019985165749163887, 'samples': 821472, 'steps': 1604, 'loss/train': 3.125265598297119} -09/20/2021 20:02:50 - INFO - __main__ - Step 25672: {'lr': 0.00019985165749163887, 'samples': 821504, 'steps': 1604, 'loss/train': 2.1861088275909424} -09/20/2021 20:02:51 - INFO - __main__ - Step 25673: {'lr': 0.00019985165749163887, 'samples': 821536, 'steps': 1604, 'loss/train': 2.3643126487731934} -09/20/2021 20:02:52 - INFO - __main__ - Step 25674: {'lr': 0.00019985165749163887, 'samples': 821568, 'steps': 1604, 'loss/train': 1.9847720861434937} -09/20/2021 20:02:52 - INFO - __main__ - Step 25675: {'lr': 0.00019985165749163887, 'samples': 821600, 'steps': 1604, 'loss/train': 3.288698673248291} -09/20/2021 20:02:53 - INFO - __main__ - Step 25676: {'lr': 0.00019985165749163887, 'samples': 821632, 'steps': 1604, 'loss/train': 2.539548397064209} -09/20/2021 20:02:54 - INFO - __main__ - Step 25677: {'lr': 0.00019985165749163887, 'samples': 821664, 'steps': 1604, 'loss/train': 3.1425464153289795} -09/20/2021 20:02:55 - INFO - __main__ - Step 25678: {'lr': 0.00019985165749163887, 'samples': 821696, 'steps': 1604, 'loss/train': 0.6335715651512146} -09/20/2021 20:02:55 - INFO - __main__ - Step 25679: {'lr': 0.00019985165749163887, 'samples': 821728, 'steps': 1604, 'loss/train': 3.3967041969299316} -09/20/2021 20:02:56 - INFO - __main__ - Step 25680: {'lr': 0.00019985165749163887, 'samples': 821760, 'steps': 1604, 'loss/train': 2.2954800128936768} -09/20/2021 20:02:57 - INFO - __main__ - Step 25681: {'lr': 0.00019985130996806572, 'samples': 821792, 'steps': 1605, 'loss/train': 1.9405776262283325} -09/20/2021 20:02:58 - INFO - __main__ - Step 25682: {'lr': 0.00019985130996806572, 'samples': 821824, 'steps': 1605, 'loss/train': 2.433274745941162} -09/20/2021 20:02:58 - INFO - __main__ - Step 25683: {'lr': 0.00019985130996806572, 'samples': 821856, 'steps': 1605, 'loss/train': 2.9444007873535156} -09/20/2021 20:02:59 - INFO - __main__ - Step 25684: {'lr': 0.00019985130996806572, 'samples': 821888, 'steps': 1605, 'loss/train': 2.999488115310669} -09/20/2021 20:03:00 - INFO - __main__ - Step 25685: {'lr': 0.00019985130996806572, 'samples': 821920, 'steps': 1605, 'loss/train': 2.8542368412017822} -09/20/2021 20:03:01 - INFO - __main__ - Step 25686: {'lr': 0.00019985130996806572, 'samples': 821952, 'steps': 1605, 'loss/train': 2.549412727355957} -09/20/2021 20:03:02 - INFO - __main__ - Step 25687: {'lr': 0.00019985130996806572, 'samples': 821984, 'steps': 1605, 'loss/train': 2.600332498550415} -09/20/2021 20:03:03 - INFO - __main__ - Step 25688: {'lr': 0.00019985130996806572, 'samples': 822016, 'steps': 1605, 'loss/train': 3.409827470779419} -09/20/2021 20:03:04 - INFO - __main__ - Step 25689: {'lr': 0.00019985130996806572, 'samples': 822048, 'steps': 1605, 'loss/train': 3.113117218017578} -09/20/2021 20:03:04 - INFO - __main__ - Step 25690: {'lr': 0.00019985130996806572, 'samples': 822080, 'steps': 1605, 'loss/train': 3.244532585144043} -09/20/2021 20:03:05 - INFO - __main__ - Step 25691: {'lr': 0.00019985130996806572, 'samples': 822112, 'steps': 1605, 'loss/train': 2.1022119522094727} -09/20/2021 20:03:06 - INFO - __main__ - Step 25692: {'lr': 0.00019985130996806572, 'samples': 822144, 'steps': 1605, 'loss/train': 2.616727113723755} -09/20/2021 20:03:07 - INFO - __main__ - Step 25693: {'lr': 0.00019985130996806572, 'samples': 822176, 'steps': 1605, 'loss/train': 3.012343645095825} -09/20/2021 20:03:07 - INFO - __main__ - Step 25694: {'lr': 0.00019985130996806572, 'samples': 822208, 'steps': 1605, 'loss/train': 2.6927669048309326} -09/20/2021 20:03:08 - INFO - __main__ - Step 25695: {'lr': 0.00019985130996806572, 'samples': 822240, 'steps': 1605, 'loss/train': 2.7503106594085693} -09/20/2021 20:03:09 - INFO - __main__ - Step 25696: {'lr': 0.00019985130996806572, 'samples': 822272, 'steps': 1605, 'loss/train': 2.2724568843841553} -09/20/2021 20:03:10 - INFO - __main__ - Step 25697: {'lr': 0.00019985096203819794, 'samples': 822304, 'steps': 1606, 'loss/train': 2.681698799133301} -09/20/2021 20:03:10 - INFO - __main__ - Step 25698: {'lr': 0.00019985096203819794, 'samples': 822336, 'steps': 1606, 'loss/train': 3.483981132507324} -09/20/2021 20:03:11 - INFO - __main__ - Step 25699: {'lr': 0.00019985096203819794, 'samples': 822368, 'steps': 1606, 'loss/train': 3.053128957748413} -09/20/2021 20:03:12 - INFO - __main__ - Step 25700: {'lr': 0.00019985096203819794, 'samples': 822400, 'steps': 1606, 'loss/train': 1.048660397529602} -09/20/2021 20:03:13 - INFO - __main__ - Step 25701: {'lr': 0.00019985096203819794, 'samples': 822432, 'steps': 1606, 'loss/train': 2.3959078788757324} -09/20/2021 20:03:13 - INFO - __main__ - Step 25702: {'lr': 0.00019985096203819794, 'samples': 822464, 'steps': 1606, 'loss/train': 3.078793525695801} -09/20/2021 20:03:14 - INFO - __main__ - Step 25703: {'lr': 0.00019985096203819794, 'samples': 822496, 'steps': 1606, 'loss/train': 3.015596389770508} -09/20/2021 20:03:15 - INFO - __main__ - Step 25704: {'lr': 0.00019985096203819794, 'samples': 822528, 'steps': 1606, 'loss/train': 2.415266990661621} -09/20/2021 20:03:16 - INFO - __main__ - Step 25705: {'lr': 0.00019985096203819794, 'samples': 822560, 'steps': 1606, 'loss/train': 2.9580578804016113} -09/20/2021 20:03:16 - INFO - __main__ - Step 25706: {'lr': 0.00019985096203819794, 'samples': 822592, 'steps': 1606, 'loss/train': 1.9372174739837646} -09/20/2021 20:03:17 - INFO - __main__ - Step 25707: {'lr': 0.00019985096203819794, 'samples': 822624, 'steps': 1606, 'loss/train': 3.677590847015381} -09/20/2021 20:03:18 - INFO - __main__ - Step 25708: {'lr': 0.00019985096203819794, 'samples': 822656, 'steps': 1606, 'loss/train': 3.944257974624634} -09/20/2021 20:03:19 - INFO - __main__ - Step 25709: {'lr': 0.00019985096203819794, 'samples': 822688, 'steps': 1606, 'loss/train': 2.7718427181243896} -09/20/2021 20:03:19 - INFO - __main__ - Step 25710: {'lr': 0.00019985096203819794, 'samples': 822720, 'steps': 1606, 'loss/train': 2.7063658237457275} -09/20/2021 20:03:20 - INFO - __main__ - Step 25711: {'lr': 0.00019985096203819794, 'samples': 822752, 'steps': 1606, 'loss/train': 2.9655637741088867} -09/20/2021 20:03:21 - INFO - __main__ - Step 25712: {'lr': 0.00019985096203819794, 'samples': 822784, 'steps': 1606, 'loss/train': 2.6386947631835938} -09/20/2021 20:03:22 - INFO - __main__ - Step 25713: {'lr': 0.000199850613702037, 'samples': 822816, 'steps': 1607, 'loss/train': 2.9778575897216797} -09/20/2021 20:03:23 - INFO - __main__ - Step 25714: {'lr': 0.000199850613702037, 'samples': 822848, 'steps': 1607, 'loss/train': 3.0126144886016846} -09/20/2021 20:03:23 - INFO - __main__ - Step 25715: {'lr': 0.000199850613702037, 'samples': 822880, 'steps': 1607, 'loss/train': 0.5666302442550659} -09/20/2021 20:03:24 - INFO - __main__ - Step 25716: {'lr': 0.000199850613702037, 'samples': 822912, 'steps': 1607, 'loss/train': 4.004020690917969} -09/20/2021 20:03:25 - INFO - __main__ - Step 25717: {'lr': 0.000199850613702037, 'samples': 822944, 'steps': 1607, 'loss/train': 2.4507699012756348} -09/20/2021 20:03:26 - INFO - __main__ - Step 25718: {'lr': 0.000199850613702037, 'samples': 822976, 'steps': 1607, 'loss/train': 1.9406769275665283} -09/20/2021 20:03:27 - INFO - __main__ - Step 25719: {'lr': 0.000199850613702037, 'samples': 823008, 'steps': 1607, 'loss/train': 2.348641872406006} -09/20/2021 20:03:28 - INFO - __main__ - Step 25720: {'lr': 0.000199850613702037, 'samples': 823040, 'steps': 1607, 'loss/train': 2.9099538326263428} -09/20/2021 20:03:28 - INFO - __main__ - Step 25721: {'lr': 0.000199850613702037, 'samples': 823072, 'steps': 1607, 'loss/train': 3.715663433074951} -09/20/2021 20:03:29 - INFO - __main__ - Step 25722: {'lr': 0.000199850613702037, 'samples': 823104, 'steps': 1607, 'loss/train': 3.4782626628875732} -09/20/2021 20:03:30 - INFO - __main__ - Step 25723: {'lr': 0.000199850613702037, 'samples': 823136, 'steps': 1607, 'loss/train': 2.366366147994995} -09/20/2021 20:03:31 - INFO - __main__ - Step 25724: {'lr': 0.000199850613702037, 'samples': 823168, 'steps': 1607, 'loss/train': 3.0183682441711426} -09/20/2021 20:03:31 - INFO - __main__ - Step 25725: {'lr': 0.000199850613702037, 'samples': 823200, 'steps': 1607, 'loss/train': 2.456233501434326} -09/20/2021 20:03:32 - INFO - __main__ - Step 25726: {'lr': 0.000199850613702037, 'samples': 823232, 'steps': 1607, 'loss/train': 1.9904911518096924} -09/20/2021 20:03:33 - INFO - __main__ - Step 25727: {'lr': 0.000199850613702037, 'samples': 823264, 'steps': 1607, 'loss/train': 3.284345865249634} -09/20/2021 20:03:34 - INFO - __main__ - Step 25728: {'lr': 0.000199850613702037, 'samples': 823296, 'steps': 1607, 'loss/train': 2.6084840297698975} -09/20/2021 20:03:34 - INFO - __main__ - Step 25729: {'lr': 0.00019985026495958434, 'samples': 823328, 'steps': 1608, 'loss/train': 3.3127951622009277} -09/20/2021 20:03:35 - INFO - __main__ - Step 25730: {'lr': 0.00019985026495958434, 'samples': 823360, 'steps': 1608, 'loss/train': 0.7225691676139832} -09/20/2021 20:03:36 - INFO - __main__ - Step 25731: {'lr': 0.00019985026495958434, 'samples': 823392, 'steps': 1608, 'loss/train': 2.3080244064331055} -09/20/2021 20:03:37 - INFO - __main__ - Step 25732: {'lr': 0.00019985026495958434, 'samples': 823424, 'steps': 1608, 'loss/train': 2.834052562713623} -09/20/2021 20:03:37 - INFO - __main__ - Step 25733: {'lr': 0.00019985026495958434, 'samples': 823456, 'steps': 1608, 'loss/train': 2.105428695678711} -09/20/2021 20:03:38 - INFO - __main__ - Step 25734: {'lr': 0.00019985026495958434, 'samples': 823488, 'steps': 1608, 'loss/train': 3.469827890396118} -09/20/2021 20:03:39 - INFO - __main__ - Step 25735: {'lr': 0.00019985026495958434, 'samples': 823520, 'steps': 1608, 'loss/train': 2.683530807495117} -09/20/2021 20:03:40 - INFO - __main__ - Step 25736: {'lr': 0.00019985026495958434, 'samples': 823552, 'steps': 1608, 'loss/train': 3.419238567352295} -09/20/2021 20:03:40 - INFO - __main__ - Step 25737: {'lr': 0.00019985026495958434, 'samples': 823584, 'steps': 1608, 'loss/train': 2.399106502532959} -09/20/2021 20:03:41 - INFO - __main__ - Step 25738: {'lr': 0.00019985026495958434, 'samples': 823616, 'steps': 1608, 'loss/train': 2.480851411819458} -09/20/2021 20:03:42 - INFO - __main__ - Step 25739: {'lr': 0.00019985026495958434, 'samples': 823648, 'steps': 1608, 'loss/train': 3.3726603984832764} -09/20/2021 20:03:43 - INFO - __main__ - Step 25740: {'lr': 0.00019985026495958434, 'samples': 823680, 'steps': 1608, 'loss/train': 3.1799240112304688} -09/20/2021 20:03:43 - INFO - __main__ - Step 25741: {'lr': 0.00019985026495958434, 'samples': 823712, 'steps': 1608, 'loss/train': 2.8971076011657715} -09/20/2021 20:03:44 - INFO - __main__ - Step 25742: {'lr': 0.00019985026495958434, 'samples': 823744, 'steps': 1608, 'loss/train': 2.8489320278167725} -09/20/2021 20:03:45 - INFO - __main__ - Step 25743: {'lr': 0.00019985026495958434, 'samples': 823776, 'steps': 1608, 'loss/train': 2.428375720977783} -09/20/2021 20:03:46 - INFO - __main__ - Step 25744: {'lr': 0.00019985026495958434, 'samples': 823808, 'steps': 1608, 'loss/train': 2.1296935081481934} -09/20/2021 20:03:47 - INFO - __main__ - Step 25745: {'lr': 0.0001998499158108413, 'samples': 823840, 'steps': 1609, 'loss/train': 3.1610751152038574} -09/20/2021 20:03:47 - INFO - __main__ - Step 25746: {'lr': 0.0001998499158108413, 'samples': 823872, 'steps': 1609, 'loss/train': 3.056701898574829} -09/20/2021 20:03:48 - INFO - __main__ - Step 25747: {'lr': 0.0001998499158108413, 'samples': 823904, 'steps': 1609, 'loss/train': 2.5644030570983887} -09/20/2021 20:03:49 - INFO - __main__ - Step 25748: {'lr': 0.0001998499158108413, 'samples': 823936, 'steps': 1609, 'loss/train': 1.8747646808624268} -09/20/2021 20:03:50 - INFO - __main__ - Step 25749: {'lr': 0.0001998499158108413, 'samples': 823968, 'steps': 1609, 'loss/train': 3.4866583347320557} -09/20/2021 20:03:51 - INFO - __main__ - Step 25750: {'lr': 0.0001998499158108413, 'samples': 824000, 'steps': 1609, 'loss/train': 3.235053062438965} -09/20/2021 20:03:52 - INFO - __main__ - Step 25751: {'lr': 0.0001998499158108413, 'samples': 824032, 'steps': 1609, 'loss/train': 2.2317934036254883} -09/20/2021 20:03:52 - INFO - __main__ - Step 25752: {'lr': 0.0001998499158108413, 'samples': 824064, 'steps': 1609, 'loss/train': 3.0493717193603516} -09/20/2021 20:03:53 - INFO - __main__ - Step 25753: {'lr': 0.0001998499158108413, 'samples': 824096, 'steps': 1609, 'loss/train': 1.7378857135772705} -09/20/2021 20:03:54 - INFO - __main__ - Step 25754: {'lr': 0.0001998499158108413, 'samples': 824128, 'steps': 1609, 'loss/train': 2.6575984954833984} -09/20/2021 20:03:55 - INFO - __main__ - Step 25755: {'lr': 0.0001998499158108413, 'samples': 824160, 'steps': 1609, 'loss/train': 2.7839109897613525} -09/20/2021 20:03:55 - INFO - __main__ - Step 25756: {'lr': 0.0001998499158108413, 'samples': 824192, 'steps': 1609, 'loss/train': 2.6100668907165527} -09/20/2021 20:03:56 - INFO - __main__ - Step 25757: {'lr': 0.0001998499158108413, 'samples': 824224, 'steps': 1609, 'loss/train': 3.6355955600738525} -09/20/2021 20:03:57 - INFO - __main__ - Step 25758: {'lr': 0.0001998499158108413, 'samples': 824256, 'steps': 1609, 'loss/train': 2.4902443885803223} -09/20/2021 20:03:58 - INFO - __main__ - Step 25759: {'lr': 0.0001998499158108413, 'samples': 824288, 'steps': 1609, 'loss/train': 2.405485153198242} -09/20/2021 20:03:58 - INFO - __main__ - Step 25760: {'lr': 0.0001998499158108413, 'samples': 824320, 'steps': 1609, 'loss/train': 2.0219054222106934} -09/20/2021 20:03:59 - INFO - __main__ - Step 25761: {'lr': 0.00019984956625580935, 'samples': 824352, 'steps': 1610, 'loss/train': 2.1406898498535156} -09/20/2021 20:04:00 - INFO - __main__ - Step 25762: {'lr': 0.00019984956625580935, 'samples': 824384, 'steps': 1610, 'loss/train': 2.5887739658355713} -09/20/2021 20:04:01 - INFO - __main__ - Step 25763: {'lr': 0.00019984956625580935, 'samples': 824416, 'steps': 1610, 'loss/train': 2.603858470916748} -09/20/2021 20:04:02 - INFO - __main__ - Step 25764: {'lr': 0.00019984956625580935, 'samples': 824448, 'steps': 1610, 'loss/train': 2.8661348819732666} -09/20/2021 20:04:02 - INFO - __main__ - Step 25765: {'lr': 0.00019984956625580935, 'samples': 824480, 'steps': 1610, 'loss/train': 2.6970229148864746} -09/20/2021 20:04:03 - INFO - __main__ - Step 25766: {'lr': 0.00019984956625580935, 'samples': 824512, 'steps': 1610, 'loss/train': 1.6089839935302734} -09/20/2021 20:04:04 - INFO - __main__ - Step 25767: {'lr': 0.00019984956625580935, 'samples': 824544, 'steps': 1610, 'loss/train': 3.029792547225952} -09/20/2021 20:04:05 - INFO - __main__ - Step 25768: {'lr': 0.00019984956625580935, 'samples': 824576, 'steps': 1610, 'loss/train': 2.199948310852051} -09/20/2021 20:04:05 - INFO - __main__ - Step 25769: {'lr': 0.00019984956625580935, 'samples': 824608, 'steps': 1610, 'loss/train': 2.832223892211914} -09/20/2021 20:04:06 - INFO - __main__ - Step 25770: {'lr': 0.00019984956625580935, 'samples': 824640, 'steps': 1610, 'loss/train': 2.1525754928588867} -09/20/2021 20:04:07 - INFO - __main__ - Step 25771: {'lr': 0.00019984956625580935, 'samples': 824672, 'steps': 1610, 'loss/train': 3.1214163303375244} -09/20/2021 20:04:08 - INFO - __main__ - Step 25772: {'lr': 0.00019984956625580935, 'samples': 824704, 'steps': 1610, 'loss/train': 2.6839632987976074} -09/20/2021 20:04:08 - INFO - __main__ - Step 25773: {'lr': 0.00019984956625580935, 'samples': 824736, 'steps': 1610, 'loss/train': 3.2829487323760986} -09/20/2021 20:04:09 - INFO - __main__ - Step 25774: {'lr': 0.00019984956625580935, 'samples': 824768, 'steps': 1610, 'loss/train': 2.97908878326416} -09/20/2021 20:04:10 - INFO - __main__ - Step 25775: {'lr': 0.00019984956625580935, 'samples': 824800, 'steps': 1610, 'loss/train': 3.187079429626465} -09/20/2021 20:04:11 - INFO - __main__ - Step 25776: {'lr': 0.00019984956625580935, 'samples': 824832, 'steps': 1610, 'loss/train': 3.6592555046081543} -09/20/2021 20:04:11 - INFO - __main__ - Step 25777: {'lr': 0.0001998492162944899, 'samples': 824864, 'steps': 1611, 'loss/train': 3.794966459274292} -09/20/2021 20:04:12 - INFO - __main__ - Step 25778: {'lr': 0.0001998492162944899, 'samples': 824896, 'steps': 1611, 'loss/train': 0.9048334956169128} -09/20/2021 20:04:13 - INFO - __main__ - Step 25779: {'lr': 0.0001998492162944899, 'samples': 824928, 'steps': 1611, 'loss/train': 2.6724231243133545} -09/20/2021 20:04:14 - INFO - __main__ - Step 25780: {'lr': 0.0001998492162944899, 'samples': 824960, 'steps': 1611, 'loss/train': 2.4759998321533203} -09/20/2021 20:04:15 - INFO - __main__ - Step 25781: {'lr': 0.0001998492162944899, 'samples': 824992, 'steps': 1611, 'loss/train': 2.2034127712249756} -09/20/2021 20:04:16 - INFO - __main__ - Step 25782: {'lr': 0.0001998492162944899, 'samples': 825024, 'steps': 1611, 'loss/train': 0.9672918319702148} -09/20/2021 20:04:16 - INFO - __main__ - Step 25783: {'lr': 0.0001998492162944899, 'samples': 825056, 'steps': 1611, 'loss/train': 2.9131243228912354} -09/20/2021 20:04:17 - INFO - __main__ - Step 25784: {'lr': 0.0001998492162944899, 'samples': 825088, 'steps': 1611, 'loss/train': 3.1362407207489014} -09/20/2021 20:04:18 - INFO - __main__ - Step 25785: {'lr': 0.0001998492162944899, 'samples': 825120, 'steps': 1611, 'loss/train': 3.2049968242645264} -09/20/2021 20:04:19 - INFO - __main__ - Step 25786: {'lr': 0.0001998492162944899, 'samples': 825152, 'steps': 1611, 'loss/train': 2.3708457946777344} -09/20/2021 20:04:19 - INFO - __main__ - Step 25787: {'lr': 0.0001998492162944899, 'samples': 825184, 'steps': 1611, 'loss/train': 2.2022857666015625} -09/20/2021 20:04:20 - INFO - __main__ - Step 25788: {'lr': 0.0001998492162944899, 'samples': 825216, 'steps': 1611, 'loss/train': 2.6406702995300293} -09/20/2021 20:04:21 - INFO - __main__ - Step 25789: {'lr': 0.0001998492162944899, 'samples': 825248, 'steps': 1611, 'loss/train': 3.3223586082458496} -09/20/2021 20:04:22 - INFO - __main__ - Step 25790: {'lr': 0.0001998492162944899, 'samples': 825280, 'steps': 1611, 'loss/train': 2.3350837230682373} -09/20/2021 20:04:22 - INFO - __main__ - Step 25791: {'lr': 0.0001998492162944899, 'samples': 825312, 'steps': 1611, 'loss/train': 3.360236167907715} -09/20/2021 20:04:23 - INFO - __main__ - Step 25792: {'lr': 0.0001998492162944899, 'samples': 825344, 'steps': 1611, 'loss/train': 2.7137742042541504} -09/20/2021 20:04:24 - INFO - __main__ - Step 25793: {'lr': 0.0001998488659268844, 'samples': 825376, 'steps': 1612, 'loss/train': 2.8253636360168457} -09/20/2021 20:04:25 - INFO - __main__ - Step 25794: {'lr': 0.0001998488659268844, 'samples': 825408, 'steps': 1612, 'loss/train': 2.039653778076172} -09/20/2021 20:04:26 - INFO - __main__ - Step 25795: {'lr': 0.0001998488659268844, 'samples': 825440, 'steps': 1612, 'loss/train': 1.6827619075775146} -09/20/2021 20:04:26 - INFO - __main__ - Step 25796: {'lr': 0.0001998488659268844, 'samples': 825472, 'steps': 1612, 'loss/train': 3.650674343109131} -09/20/2021 20:04:27 - INFO - __main__ - Step 25797: {'lr': 0.0001998488659268844, 'samples': 825504, 'steps': 1612, 'loss/train': 3.1891064643859863} -09/20/2021 20:04:28 - INFO - __main__ - Step 25798: {'lr': 0.0001998488659268844, 'samples': 825536, 'steps': 1612, 'loss/train': 2.9294707775115967} -09/20/2021 20:04:29 - INFO - __main__ - Step 25799: {'lr': 0.0001998488659268844, 'samples': 825568, 'steps': 1612, 'loss/train': 2.7972252368927} -09/20/2021 20:04:29 - INFO - __main__ - Step 25800: {'lr': 0.0001998488659268844, 'samples': 825600, 'steps': 1612, 'loss/train': 2.8668460845947266} -09/20/2021 20:04:30 - INFO - __main__ - Step 25801: {'lr': 0.0001998488659268844, 'samples': 825632, 'steps': 1612, 'loss/train': 2.9439172744750977} -09/20/2021 20:04:31 - INFO - __main__ - Step 25802: {'lr': 0.0001998488659268844, 'samples': 825664, 'steps': 1612, 'loss/train': 2.7157516479492188} -09/20/2021 20:04:32 - INFO - __main__ - Step 25803: {'lr': 0.0001998488659268844, 'samples': 825696, 'steps': 1612, 'loss/train': 2.6475651264190674} -09/20/2021 20:04:32 - INFO - __main__ - Step 25804: {'lr': 0.0001998488659268844, 'samples': 825728, 'steps': 1612, 'loss/train': 3.355442523956299} -09/20/2021 20:04:33 - INFO - __main__ - Step 25805: {'lr': 0.0001998488659268844, 'samples': 825760, 'steps': 1612, 'loss/train': 2.7906265258789062} -09/20/2021 20:04:34 - INFO - __main__ - Step 25806: {'lr': 0.0001998488659268844, 'samples': 825792, 'steps': 1612, 'loss/train': 2.5599162578582764} -09/20/2021 20:04:35 - INFO - __main__ - Step 25807: {'lr': 0.0001998488659268844, 'samples': 825824, 'steps': 1612, 'loss/train': 2.5577564239501953} -09/20/2021 20:04:35 - INFO - __main__ - Step 25808: {'lr': 0.0001998488659268844, 'samples': 825856, 'steps': 1612, 'loss/train': 2.6774656772613525} -09/20/2021 20:04:37 - INFO - __main__ - Step 25809: {'lr': 0.0001998485151529942, 'samples': 825888, 'steps': 1613, 'loss/train': 2.2438364028930664} -09/20/2021 20:04:38 - INFO - __main__ - Step 25810: {'lr': 0.0001998485151529942, 'samples': 825920, 'steps': 1613, 'loss/train': 2.0676658153533936} -09/20/2021 20:04:39 - INFO - __main__ - Step 25811: {'lr': 0.0001998485151529942, 'samples': 825952, 'steps': 1613, 'loss/train': 2.481510639190674} -09/20/2021 20:04:39 - INFO - __main__ - Step 25812: {'lr': 0.0001998485151529942, 'samples': 825984, 'steps': 1613, 'loss/train': 2.805321455001831} -09/20/2021 20:04:40 - INFO - __main__ - Step 25813: {'lr': 0.0001998485151529942, 'samples': 826016, 'steps': 1613, 'loss/train': 1.6366955041885376} -09/20/2021 20:04:41 - INFO - __main__ - Step 25814: {'lr': 0.0001998485151529942, 'samples': 826048, 'steps': 1613, 'loss/train': 1.525473713874817} -09/20/2021 20:04:42 - INFO - __main__ - Step 25815: {'lr': 0.0001998485151529942, 'samples': 826080, 'steps': 1613, 'loss/train': 2.7819554805755615} -09/20/2021 20:04:42 - INFO - __main__ - Step 25816: {'lr': 0.0001998485151529942, 'samples': 826112, 'steps': 1613, 'loss/train': 2.8715434074401855} -09/20/2021 20:04:43 - INFO - __main__ - Step 25817: {'lr': 0.0001998485151529942, 'samples': 826144, 'steps': 1613, 'loss/train': 3.5772969722747803} -09/20/2021 20:04:44 - INFO - __main__ - Step 25818: {'lr': 0.0001998485151529942, 'samples': 826176, 'steps': 1613, 'loss/train': 1.0719006061553955} -09/20/2021 20:04:45 - INFO - __main__ - Step 25819: {'lr': 0.0001998485151529942, 'samples': 826208, 'steps': 1613, 'loss/train': 2.4766604900360107} -09/20/2021 20:04:45 - INFO - __main__ - Step 25820: {'lr': 0.0001998485151529942, 'samples': 826240, 'steps': 1613, 'loss/train': 3.0645952224731445} -09/20/2021 20:04:46 - INFO - __main__ - Step 25821: {'lr': 0.0001998485151529942, 'samples': 826272, 'steps': 1613, 'loss/train': 2.9894845485687256} -09/20/2021 20:04:47 - INFO - __main__ - Step 25822: {'lr': 0.0001998485151529942, 'samples': 826304, 'steps': 1613, 'loss/train': 2.148033857345581} -09/20/2021 20:04:48 - INFO - __main__ - Step 25823: {'lr': 0.0001998485151529942, 'samples': 826336, 'steps': 1613, 'loss/train': 1.365532398223877} -09/20/2021 20:04:48 - INFO - __main__ - Step 25824: {'lr': 0.0001998485151529942, 'samples': 826368, 'steps': 1613, 'loss/train': 0.36470744013786316} -09/20/2021 20:04:49 - INFO - __main__ - Step 25825: {'lr': 0.0001998481639728208, 'samples': 826400, 'steps': 1614, 'loss/train': 0.8383285999298096} -09/20/2021 20:04:50 - INFO - __main__ - Step 25826: {'lr': 0.0001998481639728208, 'samples': 826432, 'steps': 1614, 'loss/train': 0.8562210202217102} -09/20/2021 20:04:51 - INFO - __main__ - Step 25827: {'lr': 0.0001998481639728208, 'samples': 826464, 'steps': 1614, 'loss/train': 0.8574148416519165} -09/20/2021 20:04:51 - INFO - __main__ - Step 25828: {'lr': 0.0001998481639728208, 'samples': 826496, 'steps': 1614, 'loss/train': 2.883594036102295} -09/20/2021 20:04:52 - INFO - __main__ - Step 25829: {'lr': 0.0001998481639728208, 'samples': 826528, 'steps': 1614, 'loss/train': 3.487006902694702} -09/20/2021 20:04:53 - INFO - __main__ - Step 25830: {'lr': 0.0001998481639728208, 'samples': 826560, 'steps': 1614, 'loss/train': 2.9111616611480713} -09/20/2021 20:04:54 - INFO - __main__ - Step 25831: {'lr': 0.0001998481639728208, 'samples': 826592, 'steps': 1614, 'loss/train': 2.228695869445801} -09/20/2021 20:04:54 - INFO - __main__ - Step 25832: {'lr': 0.0001998481639728208, 'samples': 826624, 'steps': 1614, 'loss/train': 2.523054361343384} -09/20/2021 20:04:55 - INFO - __main__ - Step 25833: {'lr': 0.0001998481639728208, 'samples': 826656, 'steps': 1614, 'loss/train': 3.052605152130127} -09/20/2021 20:04:56 - INFO - __main__ - Step 25834: {'lr': 0.0001998481639728208, 'samples': 826688, 'steps': 1614, 'loss/train': 3.4756717681884766} -09/20/2021 20:04:57 - INFO - __main__ - Step 25835: {'lr': 0.0001998481639728208, 'samples': 826720, 'steps': 1614, 'loss/train': 1.2808955907821655} -09/20/2021 20:04:57 - INFO - __main__ - Step 25836: {'lr': 0.0001998481639728208, 'samples': 826752, 'steps': 1614, 'loss/train': 2.338806390762329} -09/20/2021 20:04:58 - INFO - __main__ - Step 25837: {'lr': 0.0001998481639728208, 'samples': 826784, 'steps': 1614, 'loss/train': 2.1605396270751953} -09/20/2021 20:04:59 - INFO - __main__ - Step 25838: {'lr': 0.0001998481639728208, 'samples': 826816, 'steps': 1614, 'loss/train': 2.071993112564087} -09/20/2021 20:05:00 - INFO - __main__ - Step 25839: {'lr': 0.0001998481639728208, 'samples': 826848, 'steps': 1614, 'loss/train': 2.2006843090057373} -09/20/2021 20:05:02 - INFO - __main__ - Step 25840: {'lr': 0.0001998481639728208, 'samples': 826880, 'steps': 1614, 'loss/train': 2.957502841949463} -09/20/2021 20:05:02 - INFO - __main__ - Step 25841: {'lr': 0.00019984781238636566, 'samples': 826912, 'steps': 1615, 'loss/train': 3.0115184783935547} -09/20/2021 20:05:03 - INFO - __main__ - Step 25842: {'lr': 0.00019984781238636566, 'samples': 826944, 'steps': 1615, 'loss/train': 1.5557485818862915} -09/20/2021 20:05:04 - INFO - __main__ - Step 25843: {'lr': 0.00019984781238636566, 'samples': 826976, 'steps': 1615, 'loss/train': 2.3698642253875732} -09/20/2021 20:05:05 - INFO - __main__ - Step 25844: {'lr': 0.00019984781238636566, 'samples': 827008, 'steps': 1615, 'loss/train': 2.832146406173706} -09/20/2021 20:05:05 - INFO - __main__ - Step 25845: {'lr': 0.00019984781238636566, 'samples': 827040, 'steps': 1615, 'loss/train': 2.811998128890991} -09/20/2021 20:05:06 - INFO - __main__ - Step 25846: {'lr': 0.00019984781238636566, 'samples': 827072, 'steps': 1615, 'loss/train': 2.404306411743164} -09/20/2021 20:05:07 - INFO - __main__ - Step 25847: {'lr': 0.00019984781238636566, 'samples': 827104, 'steps': 1615, 'loss/train': 2.5475780963897705} -09/20/2021 20:05:08 - INFO - __main__ - Step 25848: {'lr': 0.00019984781238636566, 'samples': 827136, 'steps': 1615, 'loss/train': 2.62628436088562} -09/20/2021 20:05:08 - INFO - __main__ - Step 25849: {'lr': 0.00019984781238636566, 'samples': 827168, 'steps': 1615, 'loss/train': 1.11418879032135} -09/20/2021 20:05:09 - INFO - __main__ - Step 25850: {'lr': 0.00019984781238636566, 'samples': 827200, 'steps': 1615, 'loss/train': 0.9734542965888977} -09/20/2021 20:05:10 - INFO - __main__ - Step 25851: {'lr': 0.00019984781238636566, 'samples': 827232, 'steps': 1615, 'loss/train': 1.5235344171524048} -09/20/2021 20:05:11 - INFO - __main__ - Step 25852: {'lr': 0.00019984781238636566, 'samples': 827264, 'steps': 1615, 'loss/train': 0.4125968813896179} -09/20/2021 20:05:11 - INFO - __main__ - Step 25853: {'lr': 0.00019984781238636566, 'samples': 827296, 'steps': 1615, 'loss/train': 0.712130069732666} -09/20/2021 20:05:12 - INFO - __main__ - Step 25854: {'lr': 0.00019984781238636566, 'samples': 827328, 'steps': 1615, 'loss/train': 0.526822030544281} -09/20/2021 20:05:13 - INFO - __main__ - Step 25855: {'lr': 0.00019984781238636566, 'samples': 827360, 'steps': 1615, 'loss/train': 1.0844855308532715} -09/20/2021 20:05:14 - INFO - __main__ - Step 25856: {'lr': 0.00019984781238636566, 'samples': 827392, 'steps': 1615, 'loss/train': 0.3898840844631195} -09/20/2021 20:05:15 - INFO - __main__ - Step 25857: {'lr': 0.0001998474603936301, 'samples': 827424, 'steps': 1616, 'loss/train': 1.151737928390503} -09/20/2021 20:05:15 - INFO - __main__ - Step 25858: {'lr': 0.0001998474603936301, 'samples': 827456, 'steps': 1616, 'loss/train': 3.4062373638153076} -09/20/2021 20:05:16 - INFO - __main__ - Step 25859: {'lr': 0.0001998474603936301, 'samples': 827488, 'steps': 1616, 'loss/train': 2.8021552562713623} -09/20/2021 20:05:17 - INFO - __main__ - Step 25860: {'lr': 0.0001998474603936301, 'samples': 827520, 'steps': 1616, 'loss/train': 2.784681558609009} -09/20/2021 20:05:18 - INFO - __main__ - Step 25861: {'lr': 0.0001998474603936301, 'samples': 827552, 'steps': 1616, 'loss/train': 2.3528759479522705} -09/20/2021 20:05:18 - INFO - __main__ - Step 25862: {'lr': 0.0001998474603936301, 'samples': 827584, 'steps': 1616, 'loss/train': 2.3618311882019043} -09/20/2021 20:05:19 - INFO - __main__ - Step 25863: {'lr': 0.0001998474603936301, 'samples': 827616, 'steps': 1616, 'loss/train': 3.2383873462677} -09/20/2021 20:05:20 - INFO - __main__ - Step 25864: {'lr': 0.0001998474603936301, 'samples': 827648, 'steps': 1616, 'loss/train': 3.163684129714966} -09/20/2021 20:05:21 - INFO - __main__ - Step 25865: {'lr': 0.0001998474603936301, 'samples': 827680, 'steps': 1616, 'loss/train': 2.4110145568847656} -09/20/2021 20:05:21 - INFO - __main__ - Step 25866: {'lr': 0.0001998474603936301, 'samples': 827712, 'steps': 1616, 'loss/train': 1.93986177444458} -09/20/2021 20:05:22 - INFO - __main__ - Step 25867: {'lr': 0.0001998474603936301, 'samples': 827744, 'steps': 1616, 'loss/train': 1.9897565841674805} -09/20/2021 20:05:23 - INFO - __main__ - Step 25868: {'lr': 0.0001998474603936301, 'samples': 827776, 'steps': 1616, 'loss/train': 2.8933699131011963} -09/20/2021 20:05:24 - INFO - __main__ - Step 25869: {'lr': 0.0001998474603936301, 'samples': 827808, 'steps': 1616, 'loss/train': 2.187138080596924} -09/20/2021 20:05:24 - INFO - __main__ - Step 25870: {'lr': 0.0001998474603936301, 'samples': 827840, 'steps': 1616, 'loss/train': 2.182220935821533} -09/20/2021 20:05:26 - INFO - __main__ - Step 25871: {'lr': 0.0001998474603936301, 'samples': 827872, 'steps': 1616, 'loss/train': 3.034173011779785} -09/20/2021 20:05:26 - INFO - __main__ - Step 25872: {'lr': 0.0001998474603936301, 'samples': 827904, 'steps': 1616, 'loss/train': 2.6166062355041504} -09/20/2021 20:05:27 - INFO - __main__ - Step 25873: {'lr': 0.00019984710799461562, 'samples': 827936, 'steps': 1617, 'loss/train': 2.8523733615875244} -09/20/2021 20:05:28 - INFO - __main__ - Step 25874: {'lr': 0.00019984710799461562, 'samples': 827968, 'steps': 1617, 'loss/train': 2.93757700920105} -09/20/2021 20:05:29 - INFO - __main__ - Step 25875: {'lr': 0.00019984710799461562, 'samples': 828000, 'steps': 1617, 'loss/train': 2.6328699588775635} -09/20/2021 20:05:30 - INFO - __main__ - Step 25876: {'lr': 0.00019984710799461562, 'samples': 828032, 'steps': 1617, 'loss/train': 3.2269814014434814} -09/20/2021 20:05:30 - INFO - __main__ - Step 25877: {'lr': 0.00019984710799461562, 'samples': 828064, 'steps': 1617, 'loss/train': 2.353245496749878} -09/20/2021 20:05:31 - INFO - __main__ - Step 25878: {'lr': 0.00019984710799461562, 'samples': 828096, 'steps': 1617, 'loss/train': 3.791546583175659} -09/20/2021 20:05:32 - INFO - __main__ - Step 25879: {'lr': 0.00019984710799461562, 'samples': 828128, 'steps': 1617, 'loss/train': 2.9540536403656006} -09/20/2021 20:05:33 - INFO - __main__ - Step 25880: {'lr': 0.00019984710799461562, 'samples': 828160, 'steps': 1617, 'loss/train': 2.527986764907837} -09/20/2021 20:05:33 - INFO - __main__ - Step 25881: {'lr': 0.00019984710799461562, 'samples': 828192, 'steps': 1617, 'loss/train': 2.8551249504089355} -09/20/2021 20:05:34 - INFO - __main__ - Step 25882: {'lr': 0.00019984710799461562, 'samples': 828224, 'steps': 1617, 'loss/train': 3.0391685962677} -09/20/2021 20:05:35 - INFO - __main__ - Step 25883: {'lr': 0.00019984710799461562, 'samples': 828256, 'steps': 1617, 'loss/train': 2.5567939281463623} -09/20/2021 20:05:36 - INFO - __main__ - Step 25884: {'lr': 0.00019984710799461562, 'samples': 828288, 'steps': 1617, 'loss/train': 2.7716708183288574} -09/20/2021 20:05:36 - INFO - __main__ - Step 25885: {'lr': 0.00019984710799461562, 'samples': 828320, 'steps': 1617, 'loss/train': 2.9834513664245605} -09/20/2021 20:05:37 - INFO - __main__ - Step 25886: {'lr': 0.00019984710799461562, 'samples': 828352, 'steps': 1617, 'loss/train': 2.4525306224823} -09/20/2021 20:05:38 - INFO - __main__ - Step 25887: {'lr': 0.00019984710799461562, 'samples': 828384, 'steps': 1617, 'loss/train': 3.445801019668579} -09/20/2021 20:05:39 - INFO - __main__ - Step 25888: {'lr': 0.00019984710799461562, 'samples': 828416, 'steps': 1617, 'loss/train': 2.751390218734741} -09/20/2021 20:05:39 - INFO - __main__ - Step 25889: {'lr': 0.00019984675518932367, 'samples': 828448, 'steps': 1618, 'loss/train': 2.3896114826202393} -09/20/2021 20:05:40 - INFO - __main__ - Step 25890: {'lr': 0.00019984675518932367, 'samples': 828480, 'steps': 1618, 'loss/train': 1.9063071012496948} -09/20/2021 20:05:41 - INFO - __main__ - Step 25891: {'lr': 0.00019984675518932367, 'samples': 828512, 'steps': 1618, 'loss/train': 1.4419670104980469} -09/20/2021 20:05:42 - INFO - __main__ - Step 25892: {'lr': 0.00019984675518932367, 'samples': 828544, 'steps': 1618, 'loss/train': 3.7118775844573975} -09/20/2021 20:05:42 - INFO - __main__ - Step 25893: {'lr': 0.00019984675518932367, 'samples': 828576, 'steps': 1618, 'loss/train': 3.0880162715911865} -09/20/2021 20:05:43 - INFO - __main__ - Step 25894: {'lr': 0.00019984675518932367, 'samples': 828608, 'steps': 1618, 'loss/train': 2.551393747329712} -09/20/2021 20:05:44 - INFO - __main__ - Step 25895: {'lr': 0.00019984675518932367, 'samples': 828640, 'steps': 1618, 'loss/train': 2.1834475994110107} -09/20/2021 20:05:45 - INFO - __main__ - Step 25896: {'lr': 0.00019984675518932367, 'samples': 828672, 'steps': 1618, 'loss/train': 3.261498212814331} -09/20/2021 20:05:45 - INFO - __main__ - Step 25897: {'lr': 0.00019984675518932367, 'samples': 828704, 'steps': 1618, 'loss/train': 3.1678059101104736} -09/20/2021 20:05:46 - INFO - __main__ - Step 25898: {'lr': 0.00019984675518932367, 'samples': 828736, 'steps': 1618, 'loss/train': 2.7219414710998535} -09/20/2021 20:05:47 - INFO - __main__ - Step 25899: {'lr': 0.00019984675518932367, 'samples': 828768, 'steps': 1618, 'loss/train': 2.3065919876098633} -09/20/2021 20:05:48 - INFO - __main__ - Step 25900: {'lr': 0.00019984675518932367, 'samples': 828800, 'steps': 1618, 'loss/train': 2.6547842025756836} -09/20/2021 20:05:48 - INFO - __main__ - Step 25901: {'lr': 0.00019984675518932367, 'samples': 828832, 'steps': 1618, 'loss/train': 2.4690914154052734} -09/20/2021 20:05:50 - INFO - __main__ - Step 25902: {'lr': 0.00019984675518932367, 'samples': 828864, 'steps': 1618, 'loss/train': 2.9472713470458984} -09/20/2021 20:05:51 - INFO - __main__ - Step 25903: {'lr': 0.00019984675518932367, 'samples': 828896, 'steps': 1618, 'loss/train': 2.7934865951538086} -09/20/2021 20:05:52 - INFO - __main__ - Step 25904: {'lr': 0.00019984675518932367, 'samples': 828928, 'steps': 1618, 'loss/train': 2.8229825496673584} -09/20/2021 20:05:52 - INFO - __main__ - Step 25905: {'lr': 0.00019984640197775563, 'samples': 828960, 'steps': 1619, 'loss/train': 2.420229434967041} -09/20/2021 20:05:53 - INFO - __main__ - Step 25906: {'lr': 0.00019984640197775563, 'samples': 828992, 'steps': 1619, 'loss/train': 2.713066339492798} -09/20/2021 20:05:54 - INFO - __main__ - Step 25907: {'lr': 0.00019984640197775563, 'samples': 829024, 'steps': 1619, 'loss/train': 2.143711566925049} -09/20/2021 20:05:55 - INFO - __main__ - Step 25908: {'lr': 0.00019984640197775563, 'samples': 829056, 'steps': 1619, 'loss/train': 3.7214486598968506} -09/20/2021 20:05:55 - INFO - __main__ - Step 25909: {'lr': 0.00019984640197775563, 'samples': 829088, 'steps': 1619, 'loss/train': 2.817680835723877} -09/20/2021 20:05:56 - INFO - __main__ - Step 25910: {'lr': 0.00019984640197775563, 'samples': 829120, 'steps': 1619, 'loss/train': 2.7107059955596924} -09/20/2021 20:05:57 - INFO - __main__ - Step 25911: {'lr': 0.00019984640197775563, 'samples': 829152, 'steps': 1619, 'loss/train': 3.035400152206421} -09/20/2021 20:05:58 - INFO - __main__ - Step 25912: {'lr': 0.00019984640197775563, 'samples': 829184, 'steps': 1619, 'loss/train': 2.4799246788024902} -09/20/2021 20:05:58 - INFO - __main__ - Step 25913: {'lr': 0.00019984640197775563, 'samples': 829216, 'steps': 1619, 'loss/train': 1.3452883958816528} -09/20/2021 20:05:59 - INFO - __main__ - Step 25914: {'lr': 0.00019984640197775563, 'samples': 829248, 'steps': 1619, 'loss/train': 4.228282451629639} -09/20/2021 20:06:00 - INFO - __main__ - Step 25915: {'lr': 0.00019984640197775563, 'samples': 829280, 'steps': 1619, 'loss/train': 2.7963881492614746} -09/20/2021 20:06:01 - INFO - __main__ - Step 25916: {'lr': 0.00019984640197775563, 'samples': 829312, 'steps': 1619, 'loss/train': 3.691453456878662} -09/20/2021 20:06:01 - INFO - __main__ - Step 25917: {'lr': 0.00019984640197775563, 'samples': 829344, 'steps': 1619, 'loss/train': 2.167510509490967} -09/20/2021 20:06:02 - INFO - __main__ - Step 25918: {'lr': 0.00019984640197775563, 'samples': 829376, 'steps': 1619, 'loss/train': 1.9513521194458008} -09/20/2021 20:06:03 - INFO - __main__ - Step 25919: {'lr': 0.00019984640197775563, 'samples': 829408, 'steps': 1619, 'loss/train': 1.532435417175293} -09/20/2021 20:06:04 - INFO - __main__ - Step 25920: {'lr': 0.00019984640197775563, 'samples': 829440, 'steps': 1619, 'loss/train': 2.4624526500701904} -09/20/2021 20:06:05 - INFO - __main__ - Step 25921: {'lr': 0.000199846048359913, 'samples': 829472, 'steps': 1620, 'loss/train': 1.854828119277954} -09/20/2021 20:06:05 - INFO - __main__ - Step 25922: {'lr': 0.000199846048359913, 'samples': 829504, 'steps': 1620, 'loss/train': 2.5174038410186768} -09/20/2021 20:06:06 - INFO - __main__ - Step 25923: {'lr': 0.000199846048359913, 'samples': 829536, 'steps': 1620, 'loss/train': 2.9992191791534424} -09/20/2021 20:06:07 - INFO - __main__ - Step 25924: {'lr': 0.000199846048359913, 'samples': 829568, 'steps': 1620, 'loss/train': 3.1155645847320557} -09/20/2021 20:06:08 - INFO - __main__ - Step 25925: {'lr': 0.000199846048359913, 'samples': 829600, 'steps': 1620, 'loss/train': 2.825596332550049} -09/20/2021 20:06:08 - INFO - __main__ - Step 25926: {'lr': 0.000199846048359913, 'samples': 829632, 'steps': 1620, 'loss/train': 2.345719337463379} -09/20/2021 20:06:09 - INFO - __main__ - Step 25927: {'lr': 0.000199846048359913, 'samples': 829664, 'steps': 1620, 'loss/train': 2.748473644256592} -09/20/2021 20:06:10 - INFO - __main__ - Step 25928: {'lr': 0.000199846048359913, 'samples': 829696, 'steps': 1620, 'loss/train': 2.1857640743255615} -09/20/2021 20:06:11 - INFO - __main__ - Step 25929: {'lr': 0.000199846048359913, 'samples': 829728, 'steps': 1620, 'loss/train': 3.0623905658721924} -09/20/2021 20:06:11 - INFO - __main__ - Step 25930: {'lr': 0.000199846048359913, 'samples': 829760, 'steps': 1620, 'loss/train': 3.243497133255005} -09/20/2021 20:06:12 - INFO - __main__ - Step 25931: {'lr': 0.000199846048359913, 'samples': 829792, 'steps': 1620, 'loss/train': 1.2093324661254883} -09/20/2021 20:06:13 - INFO - __main__ - Step 25932: {'lr': 0.000199846048359913, 'samples': 829824, 'steps': 1620, 'loss/train': 1.2275480031967163} -09/20/2021 20:06:14 - INFO - __main__ - Step 25933: {'lr': 0.000199846048359913, 'samples': 829856, 'steps': 1620, 'loss/train': 1.4612070322036743} -09/20/2021 20:06:14 - INFO - __main__ - Step 25934: {'lr': 0.000199846048359913, 'samples': 829888, 'steps': 1620, 'loss/train': 1.4736897945404053} -09/20/2021 20:06:15 - INFO - __main__ - Step 25935: {'lr': 0.000199846048359913, 'samples': 829920, 'steps': 1620, 'loss/train': 1.246653437614441} -09/20/2021 20:06:16 - INFO - __main__ - Step 25936: {'lr': 0.000199846048359913, 'samples': 829952, 'steps': 1620, 'loss/train': 1.2518112659454346} -09/20/2021 20:06:17 - INFO - __main__ - Step 25937: {'lr': 0.00019984569433579717, 'samples': 829984, 'steps': 1621, 'loss/train': 1.0938396453857422} -09/20/2021 20:06:18 - INFO - __main__ - Step 25938: {'lr': 0.00019984569433579717, 'samples': 830016, 'steps': 1621, 'loss/train': 1.5681633949279785} -09/20/2021 20:06:18 - INFO - __main__ - Step 25939: {'lr': 0.00019984569433579717, 'samples': 830048, 'steps': 1621, 'loss/train': 4.034658432006836} -09/20/2021 20:06:20 - INFO - __main__ - Step 25940: {'lr': 0.00019984569433579717, 'samples': 830080, 'steps': 1621, 'loss/train': 3.216266632080078} -09/20/2021 20:06:20 - INFO - __main__ - Step 25941: {'lr': 0.00019984569433579717, 'samples': 830112, 'steps': 1621, 'loss/train': 3.2483410835266113} -09/20/2021 20:06:21 - INFO - __main__ - Step 25942: {'lr': 0.00019984569433579717, 'samples': 830144, 'steps': 1621, 'loss/train': 3.1443679332733154} -09/20/2021 20:06:22 - INFO - __main__ - Step 25943: {'lr': 0.00019984569433579717, 'samples': 830176, 'steps': 1621, 'loss/train': 2.4395246505737305} -09/20/2021 20:06:23 - INFO - __main__ - Step 25944: {'lr': 0.00019984569433579717, 'samples': 830208, 'steps': 1621, 'loss/train': 5.531432628631592} -09/20/2021 20:06:23 - INFO - __main__ - Step 25945: {'lr': 0.00019984569433579717, 'samples': 830240, 'steps': 1621, 'loss/train': 2.633622169494629} -09/20/2021 20:06:24 - INFO - __main__ - Step 25946: {'lr': 0.00019984569433579717, 'samples': 830272, 'steps': 1621, 'loss/train': 2.595784902572632} -09/20/2021 20:06:25 - INFO - __main__ - Step 25947: {'lr': 0.00019984569433579717, 'samples': 830304, 'steps': 1621, 'loss/train': 2.730729103088379} -09/20/2021 20:06:26 - INFO - __main__ - Step 25948: {'lr': 0.00019984569433579717, 'samples': 830336, 'steps': 1621, 'loss/train': 0.5480495095252991} -09/20/2021 20:06:26 - INFO - __main__ - Step 25949: {'lr': 0.00019984569433579717, 'samples': 830368, 'steps': 1621, 'loss/train': 0.619307279586792} -09/20/2021 20:06:27 - INFO - __main__ - Step 25950: {'lr': 0.00019984569433579717, 'samples': 830400, 'steps': 1621, 'loss/train': 2.2579405307769775} -09/20/2021 20:06:28 - INFO - __main__ - Step 25951: {'lr': 0.00019984569433579717, 'samples': 830432, 'steps': 1621, 'loss/train': 3.2239205837249756} -09/20/2021 20:06:29 - INFO - __main__ - Step 25952: {'lr': 0.00019984569433579717, 'samples': 830464, 'steps': 1621, 'loss/train': 3.126932144165039} -09/20/2021 20:06:30 - INFO - __main__ - Step 25953: {'lr': 0.0001998453399054096, 'samples': 830496, 'steps': 1622, 'loss/train': 3.060866117477417} -09/20/2021 20:06:30 - INFO - __main__ - Step 25954: {'lr': 0.0001998453399054096, 'samples': 830528, 'steps': 1622, 'loss/train': 2.258563280105591} -09/20/2021 20:06:31 - INFO - __main__ - Step 25955: {'lr': 0.0001998453399054096, 'samples': 830560, 'steps': 1622, 'loss/train': 1.9922930002212524} -09/20/2021 20:06:32 - INFO - __main__ - Step 25956: {'lr': 0.0001998453399054096, 'samples': 830592, 'steps': 1622, 'loss/train': 1.844631314277649} -09/20/2021 20:06:33 - INFO - __main__ - Step 25957: {'lr': 0.0001998453399054096, 'samples': 830624, 'steps': 1622, 'loss/train': 2.465841293334961} -09/20/2021 20:06:33 - INFO - __main__ - Step 25958: {'lr': 0.0001998453399054096, 'samples': 830656, 'steps': 1622, 'loss/train': 5.642001152038574} -09/20/2021 20:06:34 - INFO - __main__ - Step 25959: {'lr': 0.0001998453399054096, 'samples': 830688, 'steps': 1622, 'loss/train': 2.693399429321289} -09/20/2021 20:06:35 - INFO - __main__ - Step 25960: {'lr': 0.0001998453399054096, 'samples': 830720, 'steps': 1622, 'loss/train': 4.246277809143066} -09/20/2021 20:06:36 - INFO - __main__ - Step 25961: {'lr': 0.0001998453399054096, 'samples': 830752, 'steps': 1622, 'loss/train': 5.363094329833984} -09/20/2021 20:06:36 - INFO - __main__ - Step 25962: {'lr': 0.0001998453399054096, 'samples': 830784, 'steps': 1622, 'loss/train': 5.299304485321045} -09/20/2021 20:06:37 - INFO - __main__ - Step 25963: {'lr': 0.0001998453399054096, 'samples': 830816, 'steps': 1622, 'loss/train': 5.382992744445801} -09/20/2021 20:06:38 - INFO - __main__ - Step 25964: {'lr': 0.0001998453399054096, 'samples': 830848, 'steps': 1622, 'loss/train': 5.254169464111328} -09/20/2021 20:06:39 - INFO - __main__ - Step 25965: {'lr': 0.0001998453399054096, 'samples': 830880, 'steps': 1622, 'loss/train': 2.5009779930114746} -09/20/2021 20:06:39 - INFO - __main__ - Step 25966: {'lr': 0.0001998453399054096, 'samples': 830912, 'steps': 1622, 'loss/train': 3.143155097961426} -09/20/2021 20:06:40 - INFO - __main__ - Step 25967: {'lr': 0.0001998453399054096, 'samples': 830944, 'steps': 1622, 'loss/train': 3.467726230621338} -09/20/2021 20:06:41 - INFO - __main__ - Step 25968: {'lr': 0.0001998453399054096, 'samples': 830976, 'steps': 1622, 'loss/train': 2.6824123859405518} -09/20/2021 20:06:42 - INFO - __main__ - Step 25969: {'lr': 0.00019984498506875174, 'samples': 831008, 'steps': 1623, 'loss/train': 3.360866069793701} -09/20/2021 20:06:42 - INFO - __main__ - Step 25970: {'lr': 0.00019984498506875174, 'samples': 831040, 'steps': 1623, 'loss/train': 2.522866725921631} -09/20/2021 20:06:43 - INFO - __main__ - Step 25971: {'lr': 0.00019984498506875174, 'samples': 831072, 'steps': 1623, 'loss/train': 2.3921167850494385} -09/20/2021 20:06:44 - INFO - __main__ - Step 25972: {'lr': 0.00019984498506875174, 'samples': 831104, 'steps': 1623, 'loss/train': 2.4740710258483887} -09/20/2021 20:06:46 - INFO - __main__ - Step 25973: {'lr': 0.00019984498506875174, 'samples': 831136, 'steps': 1623, 'loss/train': 3.172869920730591} -09/20/2021 20:06:47 - INFO - __main__ - Step 25974: {'lr': 0.00019984498506875174, 'samples': 831168, 'steps': 1623, 'loss/train': 2.95424222946167} -09/20/2021 20:06:47 - INFO - __main__ - Step 25975: {'lr': 0.00019984498506875174, 'samples': 831200, 'steps': 1623, 'loss/train': 1.7941282987594604} -09/20/2021 20:06:48 - INFO - __main__ - Step 25976: {'lr': 0.00019984498506875174, 'samples': 831232, 'steps': 1623, 'loss/train': 2.328184127807617} -09/20/2021 20:06:49 - INFO - __main__ - Step 25977: {'lr': 0.00019984498506875174, 'samples': 831264, 'steps': 1623, 'loss/train': 3.865015745162964} -09/20/2021 20:06:50 - INFO - __main__ - Step 25978: {'lr': 0.00019984498506875174, 'samples': 831296, 'steps': 1623, 'loss/train': 2.0392794609069824} -09/20/2021 20:06:50 - INFO - __main__ - Step 25979: {'lr': 0.00019984498506875174, 'samples': 831328, 'steps': 1623, 'loss/train': 2.614100933074951} -09/20/2021 20:06:51 - INFO - __main__ - Step 25980: {'lr': 0.00019984498506875174, 'samples': 831360, 'steps': 1623, 'loss/train': 3.1275012493133545} -09/20/2021 20:06:52 - INFO - __main__ - Step 25981: {'lr': 0.00019984498506875174, 'samples': 831392, 'steps': 1623, 'loss/train': 2.8754489421844482} -09/20/2021 20:06:53 - INFO - __main__ - Step 25982: {'lr': 0.00019984498506875174, 'samples': 831424, 'steps': 1623, 'loss/train': 1.9416050910949707} -09/20/2021 20:06:53 - INFO - __main__ - Step 25983: {'lr': 0.00019984498506875174, 'samples': 831456, 'steps': 1623, 'loss/train': 2.30981183052063} -09/20/2021 20:06:54 - INFO - __main__ - Step 25984: {'lr': 0.00019984498506875174, 'samples': 831488, 'steps': 1623, 'loss/train': 2.960763454437256} -09/20/2021 20:06:55 - INFO - __main__ - Step 25985: {'lr': 0.000199844629825825, 'samples': 831520, 'steps': 1624, 'loss/train': 2.654473066329956} -09/20/2021 20:06:56 - INFO - __main__ - Step 25986: {'lr': 0.000199844629825825, 'samples': 831552, 'steps': 1624, 'loss/train': 3.0956783294677734} -09/20/2021 20:06:56 - INFO - __main__ - Step 25987: {'lr': 0.000199844629825825, 'samples': 831584, 'steps': 1624, 'loss/train': 2.5632636547088623} -09/20/2021 20:06:57 - INFO - __main__ - Step 25988: {'lr': 0.000199844629825825, 'samples': 831616, 'steps': 1624, 'loss/train': 2.608992576599121} -09/20/2021 20:06:58 - INFO - __main__ - Step 25989: {'lr': 0.000199844629825825, 'samples': 831648, 'steps': 1624, 'loss/train': 2.113369941711426} -09/20/2021 20:06:59 - INFO - __main__ - Step 25990: {'lr': 0.000199844629825825, 'samples': 831680, 'steps': 1624, 'loss/train': 1.8686347007751465} -09/20/2021 20:06:59 - INFO - __main__ - Step 25991: {'lr': 0.000199844629825825, 'samples': 831712, 'steps': 1624, 'loss/train': 3.0267632007598877} -09/20/2021 20:07:00 - INFO - __main__ - Step 25992: {'lr': 0.000199844629825825, 'samples': 831744, 'steps': 1624, 'loss/train': 2.6172800064086914} -09/20/2021 20:07:01 - INFO - __main__ - Step 25993: {'lr': 0.000199844629825825, 'samples': 831776, 'steps': 1624, 'loss/train': 2.023955821990967} -09/20/2021 20:07:02 - INFO - __main__ - Step 25994: {'lr': 0.000199844629825825, 'samples': 831808, 'steps': 1624, 'loss/train': 2.1416728496551514} -09/20/2021 20:07:02 - INFO - __main__ - Step 25995: {'lr': 0.000199844629825825, 'samples': 831840, 'steps': 1624, 'loss/train': 2.9094319343566895} -09/20/2021 20:07:03 - INFO - __main__ - Step 25996: {'lr': 0.000199844629825825, 'samples': 831872, 'steps': 1624, 'loss/train': 2.4043197631835938} -09/20/2021 20:07:04 - INFO - __main__ - Step 25997: {'lr': 0.000199844629825825, 'samples': 831904, 'steps': 1624, 'loss/train': 2.7886993885040283} -09/20/2021 20:07:05 - INFO - __main__ - Step 25998: {'lr': 0.000199844629825825, 'samples': 831936, 'steps': 1624, 'loss/train': 2.9171674251556396} -09/20/2021 20:07:05 - INFO - __main__ - Step 25999: {'lr': 0.000199844629825825, 'samples': 831968, 'steps': 1624, 'loss/train': 2.7286629676818848} -09/20/2021 20:07:06 - INFO - __main__ - Step 26000: {'lr': 0.000199844629825825, 'samples': 832000, 'steps': 1624, 'loss/train': 2.688143014907837} -09/20/2021 20:07:07 - INFO - __main__ - Step 26001: {'lr': 0.00019984427417663085, 'samples': 832032, 'steps': 1625, 'loss/train': 2.4146862030029297} -09/20/2021 20:07:08 - INFO - __main__ - Step 26002: {'lr': 0.00019984427417663085, 'samples': 832064, 'steps': 1625, 'loss/train': 2.7486515045166016} -09/20/2021 20:07:09 - INFO - __main__ - Step 26003: {'lr': 0.00019984427417663085, 'samples': 832096, 'steps': 1625, 'loss/train': 2.8883087635040283} -09/20/2021 20:07:09 - INFO - __main__ - Step 26004: {'lr': 0.00019984427417663085, 'samples': 832128, 'steps': 1625, 'loss/train': 2.5252490043640137} -09/20/2021 20:07:10 - INFO - __main__ - Step 26005: {'lr': 0.00019984427417663085, 'samples': 832160, 'steps': 1625, 'loss/train': 2.617474317550659} -09/20/2021 20:07:12 - INFO - __main__ - Step 26006: {'lr': 0.00019984427417663085, 'samples': 832192, 'steps': 1625, 'loss/train': 2.4238953590393066} -09/20/2021 20:07:12 - INFO - __main__ - Step 26007: {'lr': 0.00019984427417663085, 'samples': 832224, 'steps': 1625, 'loss/train': 2.6628425121307373} -09/20/2021 20:07:13 - INFO - __main__ - Step 26008: {'lr': 0.00019984427417663085, 'samples': 832256, 'steps': 1625, 'loss/train': 1.8677029609680176} -09/20/2021 20:07:14 - INFO - __main__ - Step 26009: {'lr': 0.00019984427417663085, 'samples': 832288, 'steps': 1625, 'loss/train': 0.839942455291748} -09/20/2021 20:07:15 - INFO - __main__ - Step 26010: {'lr': 0.00019984427417663085, 'samples': 832320, 'steps': 1625, 'loss/train': 0.33347466588020325} -09/20/2021 20:07:15 - INFO - __main__ - Step 26011: {'lr': 0.00019984427417663085, 'samples': 832352, 'steps': 1625, 'loss/train': 0.5277794599533081} -09/20/2021 20:07:16 - INFO - __main__ - Step 26012: {'lr': 0.00019984427417663085, 'samples': 832384, 'steps': 1625, 'loss/train': 0.3558429479598999} -09/20/2021 20:07:17 - INFO - __main__ - Step 26013: {'lr': 0.00019984427417663085, 'samples': 832416, 'steps': 1625, 'loss/train': 0.645267903804779} -09/20/2021 20:07:18 - INFO - __main__ - Step 26014: {'lr': 0.00019984427417663085, 'samples': 832448, 'steps': 1625, 'loss/train': 2.8516147136688232} -09/20/2021 20:07:18 - INFO - __main__ - Step 26015: {'lr': 0.00019984427417663085, 'samples': 832480, 'steps': 1625, 'loss/train': 0.76413494348526} -09/20/2021 20:07:19 - INFO - __main__ - Step 26016: {'lr': 0.00019984427417663085, 'samples': 832512, 'steps': 1625, 'loss/train': 2.1170952320098877} -09/20/2021 20:07:20 - INFO - __main__ - Step 26017: {'lr': 0.00019984391812117073, 'samples': 832544, 'steps': 1626, 'loss/train': 3.1039490699768066} -09/20/2021 20:07:21 - INFO - __main__ - Step 26018: {'lr': 0.00019984391812117073, 'samples': 832576, 'steps': 1626, 'loss/train': 2.970160484313965} -09/20/2021 20:07:21 - INFO - __main__ - Step 26019: {'lr': 0.00019984391812117073, 'samples': 832608, 'steps': 1626, 'loss/train': 2.862374782562256} -09/20/2021 20:07:22 - INFO - __main__ - Step 26020: {'lr': 0.00019984391812117073, 'samples': 832640, 'steps': 1626, 'loss/train': 2.794700860977173} -09/20/2021 20:07:23 - INFO - __main__ - Step 26021: {'lr': 0.00019984391812117073, 'samples': 832672, 'steps': 1626, 'loss/train': 3.723008632659912} -09/20/2021 20:07:24 - INFO - __main__ - Step 26022: {'lr': 0.00019984391812117073, 'samples': 832704, 'steps': 1626, 'loss/train': 1.5614690780639648} -09/20/2021 20:07:24 - INFO - __main__ - Step 26023: {'lr': 0.00019984391812117073, 'samples': 832736, 'steps': 1626, 'loss/train': 3.297694206237793} -09/20/2021 20:07:25 - INFO - __main__ - Step 26024: {'lr': 0.00019984391812117073, 'samples': 832768, 'steps': 1626, 'loss/train': 3.125704288482666} -09/20/2021 20:07:26 - INFO - __main__ - Step 26025: {'lr': 0.00019984391812117073, 'samples': 832800, 'steps': 1626, 'loss/train': 3.2452197074890137} -09/20/2021 20:07:27 - INFO - __main__ - Step 26026: {'lr': 0.00019984391812117073, 'samples': 832832, 'steps': 1626, 'loss/train': 3.2178516387939453} -09/20/2021 20:07:27 - INFO - __main__ - Step 26027: {'lr': 0.00019984391812117073, 'samples': 832864, 'steps': 1626, 'loss/train': 1.3023571968078613} -09/20/2021 20:07:28 - INFO - __main__ - Step 26028: {'lr': 0.00019984391812117073, 'samples': 832896, 'steps': 1626, 'loss/train': 2.502855062484741} -09/20/2021 20:07:29 - INFO - __main__ - Step 26029: {'lr': 0.00019984391812117073, 'samples': 832928, 'steps': 1626, 'loss/train': 2.7105445861816406} -09/20/2021 20:07:30 - INFO - __main__ - Step 26030: {'lr': 0.00019984391812117073, 'samples': 832960, 'steps': 1626, 'loss/train': 2.961491823196411} -09/20/2021 20:07:30 - INFO - __main__ - Step 26031: {'lr': 0.00019984391812117073, 'samples': 832992, 'steps': 1626, 'loss/train': 2.9976844787597656} -09/20/2021 20:07:31 - INFO - __main__ - Step 26032: {'lr': 0.00019984391812117073, 'samples': 833024, 'steps': 1626, 'loss/train': 2.983365774154663} -09/20/2021 20:07:32 - INFO - __main__ - Step 26033: {'lr': 0.00019984356165944614, 'samples': 833056, 'steps': 1627, 'loss/train': 1.8897041082382202} -09/20/2021 20:07:33 - INFO - __main__ - Step 26034: {'lr': 0.00019984356165944614, 'samples': 833088, 'steps': 1627, 'loss/train': 2.730454683303833} -09/20/2021 20:07:34 - INFO - __main__ - Step 26035: {'lr': 0.00019984356165944614, 'samples': 833120, 'steps': 1627, 'loss/train': 2.4742157459259033} -09/20/2021 20:07:35 - INFO - __main__ - Step 26036: {'lr': 0.00019984356165944614, 'samples': 833152, 'steps': 1627, 'loss/train': 2.3786087036132812} -09/20/2021 20:07:36 - INFO - __main__ - Step 26037: {'lr': 0.00019984356165944614, 'samples': 833184, 'steps': 1627, 'loss/train': 2.422685384750366} -09/20/2021 20:07:36 - INFO - __main__ - Step 26038: {'lr': 0.00019984356165944614, 'samples': 833216, 'steps': 1627, 'loss/train': 2.8081347942352295} -09/20/2021 20:07:37 - INFO - __main__ - Step 26039: {'lr': 0.00019984356165944614, 'samples': 833248, 'steps': 1627, 'loss/train': 2.927694797515869} -09/20/2021 20:07:38 - INFO - __main__ - Step 26040: {'lr': 0.00019984356165944614, 'samples': 833280, 'steps': 1627, 'loss/train': 3.0848639011383057} -09/20/2021 20:07:39 - INFO - __main__ - Step 26041: {'lr': 0.00019984356165944614, 'samples': 833312, 'steps': 1627, 'loss/train': 3.018171548843384} -09/20/2021 20:07:39 - INFO - __main__ - Step 26042: {'lr': 0.00019984356165944614, 'samples': 833344, 'steps': 1627, 'loss/train': 3.1947479248046875} -09/20/2021 20:07:40 - INFO - __main__ - Step 26043: {'lr': 0.00019984356165944614, 'samples': 833376, 'steps': 1627, 'loss/train': 2.2108254432678223} -09/20/2021 20:07:41 - INFO - __main__ - Step 26044: {'lr': 0.00019984356165944614, 'samples': 833408, 'steps': 1627, 'loss/train': 2.986135482788086} -09/20/2021 20:07:42 - INFO - __main__ - Step 26045: {'lr': 0.00019984356165944614, 'samples': 833440, 'steps': 1627, 'loss/train': 2.589695930480957} -09/20/2021 20:07:42 - INFO - __main__ - Step 26046: {'lr': 0.00019984356165944614, 'samples': 833472, 'steps': 1627, 'loss/train': 2.9285590648651123} -09/20/2021 20:07:43 - INFO - __main__ - Step 26047: {'lr': 0.00019984356165944614, 'samples': 833504, 'steps': 1627, 'loss/train': 2.4077954292297363} -09/20/2021 20:07:44 - INFO - __main__ - Step 26048: {'lr': 0.00019984356165944614, 'samples': 833536, 'steps': 1627, 'loss/train': 2.085362195968628} -09/20/2021 20:07:45 - INFO - __main__ - Step 26049: {'lr': 0.00019984320479145845, 'samples': 833568, 'steps': 1628, 'loss/train': 3.615125894546509} -09/20/2021 20:07:45 - INFO - __main__ - Step 26050: {'lr': 0.00019984320479145845, 'samples': 833600, 'steps': 1628, 'loss/train': 1.412235975265503} -09/20/2021 20:07:46 - INFO - __main__ - Step 26051: {'lr': 0.00019984320479145845, 'samples': 833632, 'steps': 1628, 'loss/train': 2.6858251094818115} -09/20/2021 20:07:47 - INFO - __main__ - Step 26052: {'lr': 0.00019984320479145845, 'samples': 833664, 'steps': 1628, 'loss/train': 2.8197340965270996} -09/20/2021 20:07:48 - INFO - __main__ - Step 26053: {'lr': 0.00019984320479145845, 'samples': 833696, 'steps': 1628, 'loss/train': 2.72988224029541} -09/20/2021 20:07:48 - INFO - __main__ - Step 26054: {'lr': 0.00019984320479145845, 'samples': 833728, 'steps': 1628, 'loss/train': 3.1351094245910645} -09/20/2021 20:07:49 - INFO - __main__ - Step 26055: {'lr': 0.00019984320479145845, 'samples': 833760, 'steps': 1628, 'loss/train': 2.636902093887329} -09/20/2021 20:07:50 - INFO - __main__ - Step 26056: {'lr': 0.00019984320479145845, 'samples': 833792, 'steps': 1628, 'loss/train': 2.3250694274902344} -09/20/2021 20:07:51 - INFO - __main__ - Step 26057: {'lr': 0.00019984320479145845, 'samples': 833824, 'steps': 1628, 'loss/train': 2.7506988048553467} -09/20/2021 20:07:51 - INFO - __main__ - Step 26058: {'lr': 0.00019984320479145845, 'samples': 833856, 'steps': 1628, 'loss/train': 3.6462910175323486} -09/20/2021 20:07:52 - INFO - __main__ - Step 26059: {'lr': 0.00019984320479145845, 'samples': 833888, 'steps': 1628, 'loss/train': 0.7993593811988831} -09/20/2021 20:07:53 - INFO - __main__ - Step 26060: {'lr': 0.00019984320479145845, 'samples': 833920, 'steps': 1628, 'loss/train': 2.7480082511901855} -09/20/2021 20:07:54 - INFO - __main__ - Step 26061: {'lr': 0.00019984320479145845, 'samples': 833952, 'steps': 1628, 'loss/train': 1.610601782798767} -09/20/2021 20:07:54 - INFO - __main__ - Step 26062: {'lr': 0.00019984320479145845, 'samples': 833984, 'steps': 1628, 'loss/train': 2.02302885055542} -09/20/2021 20:07:55 - INFO - __main__ - Step 26063: {'lr': 0.00019984320479145845, 'samples': 834016, 'steps': 1628, 'loss/train': 2.2983388900756836} -09/20/2021 20:07:56 - INFO - __main__ - Step 26064: {'lr': 0.00019984320479145845, 'samples': 834048, 'steps': 1628, 'loss/train': 1.444457769393921} -09/20/2021 20:07:57 - INFO - __main__ - Step 26065: {'lr': 0.00019984284751720915, 'samples': 834080, 'steps': 1629, 'loss/train': 2.951932191848755} -09/20/2021 20:07:59 - INFO - __main__ - Step 26066: {'lr': 0.00019984284751720915, 'samples': 834112, 'steps': 1629, 'loss/train': 2.9440133571624756} -09/20/2021 20:07:59 - INFO - __main__ - Step 26067: {'lr': 0.00019984284751720915, 'samples': 834144, 'steps': 1629, 'loss/train': 3.0468788146972656} -09/20/2021 20:08:00 - INFO - __main__ - Step 26068: {'lr': 0.00019984284751720915, 'samples': 834176, 'steps': 1629, 'loss/train': 2.5444583892822266} -09/20/2021 20:08:01 - INFO - __main__ - Step 26069: {'lr': 0.00019984284751720915, 'samples': 834208, 'steps': 1629, 'loss/train': 1.8698419332504272} -09/20/2021 20:08:02 - INFO - __main__ - Step 26070: {'lr': 0.00019984284751720915, 'samples': 834240, 'steps': 1629, 'loss/train': 2.229440450668335} -09/20/2021 20:08:02 - INFO - __main__ - Step 26071: {'lr': 0.00019984284751720915, 'samples': 834272, 'steps': 1629, 'loss/train': 3.014529228210449} -09/20/2021 20:08:03 - INFO - __main__ - Step 26072: {'lr': 0.00019984284751720915, 'samples': 834304, 'steps': 1629, 'loss/train': 2.5367555618286133} -09/20/2021 20:08:04 - INFO - __main__ - Step 26073: {'lr': 0.00019984284751720915, 'samples': 834336, 'steps': 1629, 'loss/train': 3.4898478984832764} -09/20/2021 20:08:05 - INFO - __main__ - Step 26074: {'lr': 0.00019984284751720915, 'samples': 834368, 'steps': 1629, 'loss/train': 1.9399465322494507} -09/20/2021 20:08:05 - INFO - __main__ - Step 26075: {'lr': 0.00019984284751720915, 'samples': 834400, 'steps': 1629, 'loss/train': 3.124877452850342} -09/20/2021 20:08:06 - INFO - __main__ - Step 26076: {'lr': 0.00019984284751720915, 'samples': 834432, 'steps': 1629, 'loss/train': 2.8799731731414795} -09/20/2021 20:08:07 - INFO - __main__ - Step 26077: {'lr': 0.00019984284751720915, 'samples': 834464, 'steps': 1629, 'loss/train': 2.3704707622528076} -09/20/2021 20:08:08 - INFO - __main__ - Step 26078: {'lr': 0.00019984284751720915, 'samples': 834496, 'steps': 1629, 'loss/train': 2.1438210010528564} -09/20/2021 20:08:08 - INFO - __main__ - Step 26079: {'lr': 0.00019984284751720915, 'samples': 834528, 'steps': 1629, 'loss/train': 2.7327511310577393} -09/20/2021 20:08:09 - INFO - __main__ - Step 26080: {'lr': 0.00019984284751720915, 'samples': 834560, 'steps': 1629, 'loss/train': 2.517522096633911} -09/20/2021 20:08:10 - INFO - __main__ - Step 26081: {'lr': 0.00019984248983669967, 'samples': 834592, 'steps': 1630, 'loss/train': 3.745002269744873} -09/20/2021 20:08:11 - INFO - __main__ - Step 26082: {'lr': 0.00019984248983669967, 'samples': 834624, 'steps': 1630, 'loss/train': 3.488328218460083} -09/20/2021 20:08:11 - INFO - __main__ - Step 26083: {'lr': 0.00019984248983669967, 'samples': 834656, 'steps': 1630, 'loss/train': 2.197441339492798} -09/20/2021 20:08:12 - INFO - __main__ - Step 26084: {'lr': 0.00019984248983669967, 'samples': 834688, 'steps': 1630, 'loss/train': 1.2537107467651367} -09/20/2021 20:08:13 - INFO - __main__ - Step 26085: {'lr': 0.00019984248983669967, 'samples': 834720, 'steps': 1630, 'loss/train': 1.1821476221084595} -09/20/2021 20:08:14 - INFO - __main__ - Step 26086: {'lr': 0.00019984248983669967, 'samples': 834752, 'steps': 1630, 'loss/train': 1.1251063346862793} -09/20/2021 20:08:14 - INFO - __main__ - Step 26087: {'lr': 0.00019984248983669967, 'samples': 834784, 'steps': 1630, 'loss/train': 1.4275919198989868} -09/20/2021 20:08:15 - INFO - __main__ - Step 26088: {'lr': 0.00019984248983669967, 'samples': 834816, 'steps': 1630, 'loss/train': 1.237856149673462} -09/20/2021 20:08:16 - INFO - __main__ - Step 26089: {'lr': 0.00019984248983669967, 'samples': 834848, 'steps': 1630, 'loss/train': 1.2139121294021606} -09/20/2021 20:08:17 - INFO - __main__ - Step 26090: {'lr': 0.00019984248983669967, 'samples': 834880, 'steps': 1630, 'loss/train': 1.2311710119247437} -09/20/2021 20:08:17 - INFO - __main__ - Step 26091: {'lr': 0.00019984248983669967, 'samples': 834912, 'steps': 1630, 'loss/train': 1.1168826818466187} -09/20/2021 20:08:18 - INFO - __main__ - Step 26092: {'lr': 0.00019984248983669967, 'samples': 834944, 'steps': 1630, 'loss/train': 1.350211262702942} -09/20/2021 20:08:19 - INFO - __main__ - Step 26093: {'lr': 0.00019984248983669967, 'samples': 834976, 'steps': 1630, 'loss/train': 1.4441355466842651} -09/20/2021 20:08:20 - INFO - __main__ - Step 26094: {'lr': 0.00019984248983669967, 'samples': 835008, 'steps': 1630, 'loss/train': 2.7020010948181152} -09/20/2021 20:08:20 - INFO - __main__ - Step 26095: {'lr': 0.00019984248983669967, 'samples': 835040, 'steps': 1630, 'loss/train': 1.7539267539978027} -09/20/2021 20:08:21 - INFO - __main__ - Step 26096: {'lr': 0.00019984248983669967, 'samples': 835072, 'steps': 1630, 'loss/train': 2.7819912433624268} -09/20/2021 20:08:22 - INFO - __main__ - Step 26097: {'lr': 0.00019984213174993154, 'samples': 835104, 'steps': 1631, 'loss/train': 2.9662046432495117} -09/20/2021 20:08:23 - INFO - __main__ - Step 26098: {'lr': 0.00019984213174993154, 'samples': 835136, 'steps': 1631, 'loss/train': 2.7107207775115967} -09/20/2021 20:08:24 - INFO - __main__ - Step 26099: {'lr': 0.00019984213174993154, 'samples': 835168, 'steps': 1631, 'loss/train': 3.3000473976135254} -09/20/2021 20:08:24 - INFO - __main__ - Step 26100: {'lr': 0.00019984213174993154, 'samples': 835200, 'steps': 1631, 'loss/train': 2.1744985580444336} -09/20/2021 20:08:25 - INFO - __main__ - Step 26101: {'lr': 0.00019984213174993154, 'samples': 835232, 'steps': 1631, 'loss/train': 2.7226433753967285} -09/20/2021 20:08:26 - INFO - __main__ - Step 26102: {'lr': 0.00019984213174993154, 'samples': 835264, 'steps': 1631, 'loss/train': 2.785047769546509} -09/20/2021 20:08:27 - INFO - __main__ - Step 26103: {'lr': 0.00019984213174993154, 'samples': 835296, 'steps': 1631, 'loss/train': 2.655454397201538} -09/20/2021 20:08:28 - INFO - __main__ - Step 26104: {'lr': 0.00019984213174993154, 'samples': 835328, 'steps': 1631, 'loss/train': 3.47882080078125} -09/20/2021 20:08:29 - INFO - __main__ - Step 26105: {'lr': 0.00019984213174993154, 'samples': 835360, 'steps': 1631, 'loss/train': 2.862440586090088} -09/20/2021 20:08:29 - INFO - __main__ - Step 26106: {'lr': 0.00019984213174993154, 'samples': 835392, 'steps': 1631, 'loss/train': 3.3955061435699463} -09/20/2021 20:08:30 - INFO - __main__ - Step 26107: {'lr': 0.00019984213174993154, 'samples': 835424, 'steps': 1631, 'loss/train': 3.2420613765716553} -09/20/2021 20:08:31 - INFO - __main__ - Step 26108: {'lr': 0.00019984213174993154, 'samples': 835456, 'steps': 1631, 'loss/train': 2.3080670833587646} -09/20/2021 20:08:32 - INFO - __main__ - Step 26109: {'lr': 0.00019984213174993154, 'samples': 835488, 'steps': 1631, 'loss/train': 1.3592729568481445} -09/20/2021 20:08:32 - INFO - __main__ - Step 26110: {'lr': 0.00019984213174993154, 'samples': 835520, 'steps': 1631, 'loss/train': 3.3253579139709473} -09/20/2021 20:08:33 - INFO - __main__ - Step 26111: {'lr': 0.00019984213174993154, 'samples': 835552, 'steps': 1631, 'loss/train': 2.6480274200439453} -09/20/2021 20:08:34 - INFO - __main__ - Step 26112: {'lr': 0.00019984213174993154, 'samples': 835584, 'steps': 1631, 'loss/train': 2.3767244815826416} -09/20/2021 20:08:35 - INFO - __main__ - Step 26113: {'lr': 0.00019984177325690612, 'samples': 835616, 'steps': 1632, 'loss/train': 3.525519609451294} -09/20/2021 20:08:35 - INFO - __main__ - Step 26114: {'lr': 0.00019984177325690612, 'samples': 835648, 'steps': 1632, 'loss/train': 3.103785753250122} -09/20/2021 20:08:36 - INFO - __main__ - Step 26115: {'lr': 0.00019984177325690612, 'samples': 835680, 'steps': 1632, 'loss/train': 2.470386505126953} -09/20/2021 20:08:37 - INFO - __main__ - Step 26116: {'lr': 0.00019984177325690612, 'samples': 835712, 'steps': 1632, 'loss/train': 3.3809924125671387} -09/20/2021 20:08:38 - INFO - __main__ - Step 26117: {'lr': 0.00019984177325690612, 'samples': 835744, 'steps': 1632, 'loss/train': 2.7962794303894043} -09/20/2021 20:08:38 - INFO - __main__ - Step 26118: {'lr': 0.00019984177325690612, 'samples': 835776, 'steps': 1632, 'loss/train': 2.0041897296905518} -09/20/2021 20:08:39 - INFO - __main__ - Step 26119: {'lr': 0.00019984177325690612, 'samples': 835808, 'steps': 1632, 'loss/train': 3.3195693492889404} -09/20/2021 20:08:40 - INFO - __main__ - Step 26120: {'lr': 0.00019984177325690612, 'samples': 835840, 'steps': 1632, 'loss/train': 1.902234435081482} -09/20/2021 20:08:41 - INFO - __main__ - Step 26121: {'lr': 0.00019984177325690612, 'samples': 835872, 'steps': 1632, 'loss/train': 2.6260628700256348} -09/20/2021 20:08:41 - INFO - __main__ - Step 26122: {'lr': 0.00019984177325690612, 'samples': 835904, 'steps': 1632, 'loss/train': 2.5418176651000977} -09/20/2021 20:08:42 - INFO - __main__ - Step 26123: {'lr': 0.00019984177325690612, 'samples': 835936, 'steps': 1632, 'loss/train': 1.7811912298202515} -09/20/2021 20:08:43 - INFO - __main__ - Step 26124: {'lr': 0.00019984177325690612, 'samples': 835968, 'steps': 1632, 'loss/train': 2.4141526222229004} -09/20/2021 20:08:44 - INFO - __main__ - Step 26125: {'lr': 0.00019984177325690612, 'samples': 836000, 'steps': 1632, 'loss/train': 3.1753416061401367} -09/20/2021 20:08:44 - INFO - __main__ - Step 26126: {'lr': 0.00019984177325690612, 'samples': 836032, 'steps': 1632, 'loss/train': 2.4361469745635986} -09/20/2021 20:08:45 - INFO - __main__ - Step 26127: {'lr': 0.00019984177325690612, 'samples': 836064, 'steps': 1632, 'loss/train': 2.6440787315368652} -09/20/2021 20:08:46 - INFO - __main__ - Step 26128: {'lr': 0.00019984177325690612, 'samples': 836096, 'steps': 1632, 'loss/train': 2.029524087905884} -09/20/2021 20:08:47 - INFO - __main__ - Step 26129: {'lr': 0.0001998414143576249, 'samples': 836128, 'steps': 1633, 'loss/train': 2.975564479827881} -09/20/2021 20:08:48 - INFO - __main__ - Step 26130: {'lr': 0.0001998414143576249, 'samples': 836160, 'steps': 1633, 'loss/train': 2.826554298400879} -09/20/2021 20:08:48 - INFO - __main__ - Step 26131: {'lr': 0.0001998414143576249, 'samples': 836192, 'steps': 1633, 'loss/train': 2.696401357650757} -09/20/2021 20:08:49 - INFO - __main__ - Step 26132: {'lr': 0.0001998414143576249, 'samples': 836224, 'steps': 1633, 'loss/train': 3.4992308616638184} -09/20/2021 20:08:50 - INFO - __main__ - Step 26133: {'lr': 0.0001998414143576249, 'samples': 836256, 'steps': 1633, 'loss/train': 3.3128137588500977} -09/20/2021 20:08:52 - INFO - __main__ - Step 26134: {'lr': 0.0001998414143576249, 'samples': 836288, 'steps': 1633, 'loss/train': 2.0218591690063477} -09/20/2021 20:08:52 - INFO - __main__ - Step 26135: {'lr': 0.0001998414143576249, 'samples': 836320, 'steps': 1633, 'loss/train': 2.1418871879577637} -09/20/2021 20:08:53 - INFO - __main__ - Step 26136: {'lr': 0.0001998414143576249, 'samples': 836352, 'steps': 1633, 'loss/train': 2.5305607318878174} -09/20/2021 20:08:54 - INFO - __main__ - Step 26137: {'lr': 0.0001998414143576249, 'samples': 836384, 'steps': 1633, 'loss/train': 2.4784059524536133} -09/20/2021 20:08:55 - INFO - __main__ - Step 26138: {'lr': 0.0001998414143576249, 'samples': 836416, 'steps': 1633, 'loss/train': 3.4923243522644043} -09/20/2021 20:08:55 - INFO - __main__ - Step 26139: {'lr': 0.0001998414143576249, 'samples': 836448, 'steps': 1633, 'loss/train': 3.308863878250122} -09/20/2021 20:08:56 - INFO - __main__ - Step 26140: {'lr': 0.0001998414143576249, 'samples': 836480, 'steps': 1633, 'loss/train': 3.5492799282073975} -09/20/2021 20:08:57 - INFO - __main__ - Step 26141: {'lr': 0.0001998414143576249, 'samples': 836512, 'steps': 1633, 'loss/train': 3.279271125793457} -09/20/2021 20:08:58 - INFO - __main__ - Step 26142: {'lr': 0.0001998414143576249, 'samples': 836544, 'steps': 1633, 'loss/train': 3.600522041320801} -09/20/2021 20:08:58 - INFO - __main__ - Step 26143: {'lr': 0.0001998414143576249, 'samples': 836576, 'steps': 1633, 'loss/train': 3.55436110496521} -09/20/2021 20:08:59 - INFO - __main__ - Step 26144: {'lr': 0.0001998414143576249, 'samples': 836608, 'steps': 1633, 'loss/train': 3.5602943897247314} -09/20/2021 20:09:00 - INFO - __main__ - Step 26145: {'lr': 0.0001998410550520894, 'samples': 836640, 'steps': 1634, 'loss/train': 2.32774019241333} -09/20/2021 20:09:01 - INFO - __main__ - Step 26146: {'lr': 0.0001998410550520894, 'samples': 836672, 'steps': 1634, 'loss/train': 2.2287943363189697} -09/20/2021 20:09:02 - INFO - __main__ - Step 26147: {'lr': 0.0001998410550520894, 'samples': 836704, 'steps': 1634, 'loss/train': 3.866619348526001} -09/20/2021 20:09:02 - INFO - __main__ - Step 26148: {'lr': 0.0001998410550520894, 'samples': 836736, 'steps': 1634, 'loss/train': 3.6364269256591797} -09/20/2021 20:09:03 - INFO - __main__ - Step 26149: {'lr': 0.0001998410550520894, 'samples': 836768, 'steps': 1634, 'loss/train': 2.9671599864959717} -09/20/2021 20:09:04 - INFO - __main__ - Step 26150: {'lr': 0.0001998410550520894, 'samples': 836800, 'steps': 1634, 'loss/train': 0.5391038656234741} -09/20/2021 20:09:05 - INFO - __main__ - Step 26151: {'lr': 0.0001998410550520894, 'samples': 836832, 'steps': 1634, 'loss/train': 3.643760919570923} -09/20/2021 20:09:05 - INFO - __main__ - Step 26152: {'lr': 0.0001998410550520894, 'samples': 836864, 'steps': 1634, 'loss/train': 2.0728280544281006} -09/20/2021 20:09:06 - INFO - __main__ - Step 26153: {'lr': 0.0001998410550520894, 'samples': 836896, 'steps': 1634, 'loss/train': 2.6563243865966797} -09/20/2021 20:09:07 - INFO - __main__ - Step 26154: {'lr': 0.0001998410550520894, 'samples': 836928, 'steps': 1634, 'loss/train': 2.0029633045196533} -09/20/2021 20:09:08 - INFO - __main__ - Step 26155: {'lr': 0.0001998410550520894, 'samples': 836960, 'steps': 1634, 'loss/train': 3.232152223587036} -09/20/2021 20:09:08 - INFO - __main__ - Step 26156: {'lr': 0.0001998410550520894, 'samples': 836992, 'steps': 1634, 'loss/train': 1.5329766273498535} -09/20/2021 20:09:09 - INFO - __main__ - Step 26157: {'lr': 0.0001998410550520894, 'samples': 837024, 'steps': 1634, 'loss/train': 2.0001730918884277} -09/20/2021 20:09:10 - INFO - __main__ - Step 26158: {'lr': 0.0001998410550520894, 'samples': 837056, 'steps': 1634, 'loss/train': 3.155362844467163} -09/20/2021 20:09:11 - INFO - __main__ - Step 26159: {'lr': 0.0001998410550520894, 'samples': 837088, 'steps': 1634, 'loss/train': 3.4169397354125977} -09/20/2021 20:09:11 - INFO - __main__ - Step 26160: {'lr': 0.0001998410550520894, 'samples': 837120, 'steps': 1634, 'loss/train': 1.747745394706726} -09/20/2021 20:09:12 - INFO - __main__ - Step 26161: {'lr': 0.000199840695340301, 'samples': 837152, 'steps': 1635, 'loss/train': 3.391477346420288} -09/20/2021 20:09:13 - INFO - __main__ - Step 26162: {'lr': 0.000199840695340301, 'samples': 837184, 'steps': 1635, 'loss/train': 1.6385198831558228} -09/20/2021 20:09:14 - INFO - __main__ - Step 26163: {'lr': 0.000199840695340301, 'samples': 837216, 'steps': 1635, 'loss/train': 2.3617334365844727} -09/20/2021 20:09:15 - INFO - __main__ - Step 26164: {'lr': 0.000199840695340301, 'samples': 837248, 'steps': 1635, 'loss/train': 3.2213897705078125} -09/20/2021 20:09:15 - INFO - __main__ - Step 26165: {'lr': 0.000199840695340301, 'samples': 837280, 'steps': 1635, 'loss/train': 3.600961446762085} -09/20/2021 20:09:16 - INFO - __main__ - Step 26166: {'lr': 0.000199840695340301, 'samples': 837312, 'steps': 1635, 'loss/train': 1.9710553884506226} -09/20/2021 20:09:17 - INFO - __main__ - Step 26167: {'lr': 0.000199840695340301, 'samples': 837344, 'steps': 1635, 'loss/train': 2.6530725955963135} -09/20/2021 20:09:18 - INFO - __main__ - Step 26168: {'lr': 0.000199840695340301, 'samples': 837376, 'steps': 1635, 'loss/train': 1.3109272718429565} -09/20/2021 20:09:18 - INFO - __main__ - Step 26169: {'lr': 0.000199840695340301, 'samples': 837408, 'steps': 1635, 'loss/train': 1.715951919555664} -09/20/2021 20:09:19 - INFO - __main__ - Step 26170: {'lr': 0.000199840695340301, 'samples': 837440, 'steps': 1635, 'loss/train': 2.7197976112365723} -09/20/2021 20:09:20 - INFO - __main__ - Step 26171: {'lr': 0.000199840695340301, 'samples': 837472, 'steps': 1635, 'loss/train': 3.0945825576782227} -09/20/2021 20:09:21 - INFO - __main__ - Step 26172: {'lr': 0.000199840695340301, 'samples': 837504, 'steps': 1635, 'loss/train': 2.778432607650757} -09/20/2021 20:09:22 - INFO - __main__ - Step 26173: {'lr': 0.000199840695340301, 'samples': 837536, 'steps': 1635, 'loss/train': 3.7713751792907715} -09/20/2021 20:09:23 - INFO - __main__ - Step 26174: {'lr': 0.000199840695340301, 'samples': 837568, 'steps': 1635, 'loss/train': 2.20363450050354} -09/20/2021 20:09:23 - INFO - __main__ - Step 26175: {'lr': 0.000199840695340301, 'samples': 837600, 'steps': 1635, 'loss/train': 3.4284143447875977} -09/20/2021 20:09:24 - INFO - __main__ - Step 26176: {'lr': 0.000199840695340301, 'samples': 837632, 'steps': 1635, 'loss/train': 0.705331027507782} -09/20/2021 20:09:25 - INFO - __main__ - Step 26177: {'lr': 0.00019984033522226123, 'samples': 837664, 'steps': 1636, 'loss/train': 2.9318747520446777} -09/20/2021 20:09:26 - INFO - __main__ - Step 26178: {'lr': 0.00019984033522226123, 'samples': 837696, 'steps': 1636, 'loss/train': 2.933387517929077} -09/20/2021 20:09:26 - INFO - __main__ - Step 26179: {'lr': 0.00019984033522226123, 'samples': 837728, 'steps': 1636, 'loss/train': 3.0595998764038086} -09/20/2021 20:09:27 - INFO - __main__ - Step 26180: {'lr': 0.00019984033522226123, 'samples': 837760, 'steps': 1636, 'loss/train': 3.5147359371185303} -09/20/2021 20:09:28 - INFO - __main__ - Step 26181: {'lr': 0.00019984033522226123, 'samples': 837792, 'steps': 1636, 'loss/train': 3.5010759830474854} -09/20/2021 20:09:29 - INFO - __main__ - Step 26182: {'lr': 0.00019984033522226123, 'samples': 837824, 'steps': 1636, 'loss/train': 2.290503978729248} -09/20/2021 20:09:29 - INFO - __main__ - Step 26183: {'lr': 0.00019984033522226123, 'samples': 837856, 'steps': 1636, 'loss/train': 2.233416795730591} -09/20/2021 20:09:30 - INFO - __main__ - Step 26184: {'lr': 0.00019984033522226123, 'samples': 837888, 'steps': 1636, 'loss/train': 2.466113805770874} -09/20/2021 20:09:31 - INFO - __main__ - Step 26185: {'lr': 0.00019984033522226123, 'samples': 837920, 'steps': 1636, 'loss/train': 2.7241101264953613} -09/20/2021 20:09:32 - INFO - __main__ - Step 26186: {'lr': 0.00019984033522226123, 'samples': 837952, 'steps': 1636, 'loss/train': 2.946199417114258} -09/20/2021 20:09:32 - INFO - __main__ - Step 26187: {'lr': 0.00019984033522226123, 'samples': 837984, 'steps': 1636, 'loss/train': 1.4125711917877197} -09/20/2021 20:09:33 - INFO - __main__ - Step 26188: {'lr': 0.00019984033522226123, 'samples': 838016, 'steps': 1636, 'loss/train': 2.896282434463501} -09/20/2021 20:09:34 - INFO - __main__ - Step 26189: {'lr': 0.00019984033522226123, 'samples': 838048, 'steps': 1636, 'loss/train': 3.1319363117218018} -09/20/2021 20:09:35 - INFO - __main__ - Step 26190: {'lr': 0.00019984033522226123, 'samples': 838080, 'steps': 1636, 'loss/train': 2.357131242752075} -09/20/2021 20:09:35 - INFO - __main__ - Step 26191: {'lr': 0.00019984033522226123, 'samples': 838112, 'steps': 1636, 'loss/train': 1.8936063051223755} -09/20/2021 20:09:36 - INFO - __main__ - Step 26192: {'lr': 0.00019984033522226123, 'samples': 838144, 'steps': 1636, 'loss/train': 2.5472123622894287} -09/20/2021 20:09:37 - INFO - __main__ - Step 26193: {'lr': 0.0001998399746979715, 'samples': 838176, 'steps': 1637, 'loss/train': 3.092688798904419} -09/20/2021 20:09:38 - INFO - __main__ - Step 26194: {'lr': 0.0001998399746979715, 'samples': 838208, 'steps': 1637, 'loss/train': 2.2502200603485107} -09/20/2021 20:09:39 - INFO - __main__ - Step 26195: {'lr': 0.0001998399746979715, 'samples': 838240, 'steps': 1637, 'loss/train': 3.8338325023651123} -09/20/2021 20:09:39 - INFO - __main__ - Step 26196: {'lr': 0.0001998399746979715, 'samples': 838272, 'steps': 1637, 'loss/train': 2.4602420330047607} -09/20/2021 20:09:40 - INFO - __main__ - Step 26197: {'lr': 0.0001998399746979715, 'samples': 838304, 'steps': 1637, 'loss/train': 2.734698534011841} -09/20/2021 20:09:41 - INFO - __main__ - Step 26198: {'lr': 0.0001998399746979715, 'samples': 838336, 'steps': 1637, 'loss/train': 3.731579303741455} -09/20/2021 20:09:42 - INFO - __main__ - Step 26199: {'lr': 0.0001998399746979715, 'samples': 838368, 'steps': 1637, 'loss/train': 2.966712236404419} -09/20/2021 20:09:42 - INFO - __main__ - Step 26200: {'lr': 0.0001998399746979715, 'samples': 838400, 'steps': 1637, 'loss/train': 2.3140923976898193} -09/20/2021 20:09:43 - INFO - __main__ - Step 26201: {'lr': 0.0001998399746979715, 'samples': 838432, 'steps': 1637, 'loss/train': 3.231081008911133} -09/20/2021 20:09:44 - INFO - __main__ - Step 26202: {'lr': 0.0001998399746979715, 'samples': 838464, 'steps': 1637, 'loss/train': 3.2007803916931152} -09/20/2021 20:09:45 - INFO - __main__ - Step 26203: {'lr': 0.0001998399746979715, 'samples': 838496, 'steps': 1637, 'loss/train': 3.271005392074585} -09/20/2021 20:09:46 - INFO - __main__ - Step 26204: {'lr': 0.0001998399746979715, 'samples': 838528, 'steps': 1637, 'loss/train': 1.438734531402588} -09/20/2021 20:09:47 - INFO - __main__ - Step 26205: {'lr': 0.0001998399746979715, 'samples': 838560, 'steps': 1637, 'loss/train': 2.9443347454071045} -09/20/2021 20:09:47 - INFO - __main__ - Step 26206: {'lr': 0.0001998399746979715, 'samples': 838592, 'steps': 1637, 'loss/train': 3.1598024368286133} -09/20/2021 20:09:48 - INFO - __main__ - Step 26207: {'lr': 0.0001998399746979715, 'samples': 838624, 'steps': 1637, 'loss/train': 1.0555442571640015} -09/20/2021 20:09:49 - INFO - __main__ - Step 26208: {'lr': 0.0001998399746979715, 'samples': 838656, 'steps': 1637, 'loss/train': 2.394224166870117} -09/20/2021 20:09:50 - INFO - __main__ - Step 26209: {'lr': 0.0001998396137674333, 'samples': 838688, 'steps': 1638, 'loss/train': 2.345004081726074} -09/20/2021 20:09:51 - INFO - __main__ - Step 26210: {'lr': 0.0001998396137674333, 'samples': 838720, 'steps': 1638, 'loss/train': 2.5729947090148926} -09/20/2021 20:09:51 - INFO - __main__ - Step 26211: {'lr': 0.0001998396137674333, 'samples': 838752, 'steps': 1638, 'loss/train': 2.7413344383239746} -09/20/2021 20:09:52 - INFO - __main__ - Step 26212: {'lr': 0.0001998396137674333, 'samples': 838784, 'steps': 1638, 'loss/train': 3.05185604095459} -09/20/2021 20:09:53 - INFO - __main__ - Step 26213: {'lr': 0.0001998396137674333, 'samples': 838816, 'steps': 1638, 'loss/train': 2.41182804107666} -09/20/2021 20:09:54 - INFO - __main__ - Step 26214: {'lr': 0.0001998396137674333, 'samples': 838848, 'steps': 1638, 'loss/train': 2.773237705230713} -09/20/2021 20:09:54 - INFO - __main__ - Step 26215: {'lr': 0.0001998396137674333, 'samples': 838880, 'steps': 1638, 'loss/train': 2.379784107208252} -09/20/2021 20:09:55 - INFO - __main__ - Step 26216: {'lr': 0.0001998396137674333, 'samples': 838912, 'steps': 1638, 'loss/train': 2.0157101154327393} -09/20/2021 20:09:56 - INFO - __main__ - Step 26217: {'lr': 0.0001998396137674333, 'samples': 838944, 'steps': 1638, 'loss/train': 2.4759514331817627} -09/20/2021 20:09:57 - INFO - __main__ - Step 26218: {'lr': 0.0001998396137674333, 'samples': 838976, 'steps': 1638, 'loss/train': 2.190865993499756} -09/20/2021 20:09:57 - INFO - __main__ - Step 26219: {'lr': 0.0001998396137674333, 'samples': 839008, 'steps': 1638, 'loss/train': 3.3333303928375244} -09/20/2021 20:09:58 - INFO - __main__ - Step 26220: {'lr': 0.0001998396137674333, 'samples': 839040, 'steps': 1638, 'loss/train': 3.792797327041626} -09/20/2021 20:09:59 - INFO - __main__ - Step 26221: {'lr': 0.0001998396137674333, 'samples': 839072, 'steps': 1638, 'loss/train': 2.4356982707977295} -09/20/2021 20:10:00 - INFO - __main__ - Step 26222: {'lr': 0.0001998396137674333, 'samples': 839104, 'steps': 1638, 'loss/train': 3.6254844665527344} -09/20/2021 20:10:00 - INFO - __main__ - Step 26223: {'lr': 0.0001998396137674333, 'samples': 839136, 'steps': 1638, 'loss/train': 2.8581390380859375} -09/20/2021 20:10:01 - INFO - __main__ - Step 26224: {'lr': 0.0001998396137674333, 'samples': 839168, 'steps': 1638, 'loss/train': 2.6887688636779785} -09/20/2021 20:10:02 - INFO - __main__ - Step 26225: {'lr': 0.0001998392524306481, 'samples': 839200, 'steps': 1639, 'loss/train': 1.7541546821594238} -09/20/2021 20:10:03 - INFO - __main__ - Step 26226: {'lr': 0.0001998392524306481, 'samples': 839232, 'steps': 1639, 'loss/train': 2.3227145671844482} -09/20/2021 20:10:03 - INFO - __main__ - Step 26227: {'lr': 0.0001998392524306481, 'samples': 839264, 'steps': 1639, 'loss/train': 1.3648887872695923} -09/20/2021 20:10:04 - INFO - __main__ - Step 26228: {'lr': 0.0001998392524306481, 'samples': 839296, 'steps': 1639, 'loss/train': 2.6399266719818115} -09/20/2021 20:10:05 - INFO - __main__ - Step 26229: {'lr': 0.0001998392524306481, 'samples': 839328, 'steps': 1639, 'loss/train': 2.523069381713867} -09/20/2021 20:10:06 - INFO - __main__ - Step 26230: {'lr': 0.0001998392524306481, 'samples': 839360, 'steps': 1639, 'loss/train': 2.0164260864257812} -09/20/2021 20:10:06 - INFO - __main__ - Step 26231: {'lr': 0.0001998392524306481, 'samples': 839392, 'steps': 1639, 'loss/train': 2.6959218978881836} -09/20/2021 20:10:07 - INFO - __main__ - Step 26232: {'lr': 0.0001998392524306481, 'samples': 839424, 'steps': 1639, 'loss/train': 2.911914587020874} -09/20/2021 20:10:09 - INFO - __main__ - Step 26233: {'lr': 0.0001998392524306481, 'samples': 839456, 'steps': 1639, 'loss/train': 3.2668213844299316} -09/20/2021 20:10:09 - INFO - __main__ - Step 26234: {'lr': 0.0001998392524306481, 'samples': 839488, 'steps': 1639, 'loss/train': 0.7217794060707092} -09/20/2021 20:10:10 - INFO - __main__ - Step 26235: {'lr': 0.0001998392524306481, 'samples': 839520, 'steps': 1639, 'loss/train': 2.768406391143799} -09/20/2021 20:10:11 - INFO - __main__ - Step 26236: {'lr': 0.0001998392524306481, 'samples': 839552, 'steps': 1639, 'loss/train': 1.3218052387237549} -09/20/2021 20:10:12 - INFO - __main__ - Step 26237: {'lr': 0.0001998392524306481, 'samples': 839584, 'steps': 1639, 'loss/train': 2.422173261642456} -09/20/2021 20:10:12 - INFO - __main__ - Step 26238: {'lr': 0.0001998392524306481, 'samples': 839616, 'steps': 1639, 'loss/train': 2.6622798442840576} -09/20/2021 20:10:13 - INFO - __main__ - Step 26239: {'lr': 0.0001998392524306481, 'samples': 839648, 'steps': 1639, 'loss/train': 1.8604353666305542} -09/20/2021 20:10:14 - INFO - __main__ - Step 26240: {'lr': 0.0001998392524306481, 'samples': 839680, 'steps': 1639, 'loss/train': 3.8544270992279053} -09/20/2021 20:10:15 - INFO - __main__ - Step 26241: {'lr': 0.00019983889068761736, 'samples': 839712, 'steps': 1640, 'loss/train': 2.1433401107788086} -09/20/2021 20:10:15 - INFO - __main__ - Step 26242: {'lr': 0.00019983889068761736, 'samples': 839744, 'steps': 1640, 'loss/train': 0.962614893913269} -09/20/2021 20:10:16 - INFO - __main__ - Step 26243: {'lr': 0.00019983889068761736, 'samples': 839776, 'steps': 1640, 'loss/train': 2.891535758972168} -09/20/2021 20:10:17 - INFO - __main__ - Step 26244: {'lr': 0.00019983889068761736, 'samples': 839808, 'steps': 1640, 'loss/train': 3.4712612628936768} -09/20/2021 20:10:18 - INFO - __main__ - Step 26245: {'lr': 0.00019983889068761736, 'samples': 839840, 'steps': 1640, 'loss/train': 2.5748231410980225} -09/20/2021 20:10:18 - INFO - __main__ - Step 26246: {'lr': 0.00019983889068761736, 'samples': 839872, 'steps': 1640, 'loss/train': 4.414223670959473} -09/20/2021 20:10:19 - INFO - __main__ - Step 26247: {'lr': 0.00019983889068761736, 'samples': 839904, 'steps': 1640, 'loss/train': 2.5999789237976074} -09/20/2021 20:10:20 - INFO - __main__ - Step 26248: {'lr': 0.00019983889068761736, 'samples': 839936, 'steps': 1640, 'loss/train': 2.031324863433838} -09/20/2021 20:10:21 - INFO - __main__ - Step 26249: {'lr': 0.00019983889068761736, 'samples': 839968, 'steps': 1640, 'loss/train': 2.99670147895813} -09/20/2021 20:10:21 - INFO - __main__ - Step 26250: {'lr': 0.00019983889068761736, 'samples': 840000, 'steps': 1640, 'loss/train': 2.416285991668701} -09/20/2021 20:10:22 - INFO - __main__ - Step 26251: {'lr': 0.00019983889068761736, 'samples': 840032, 'steps': 1640, 'loss/train': 2.8859899044036865} -09/20/2021 20:10:23 - INFO - __main__ - Step 26252: {'lr': 0.00019983889068761736, 'samples': 840064, 'steps': 1640, 'loss/train': 0.6340689063072205} -09/20/2021 20:10:24 - INFO - __main__ - Step 26253: {'lr': 0.00019983889068761736, 'samples': 840096, 'steps': 1640, 'loss/train': 2.6361424922943115} -09/20/2021 20:10:24 - INFO - __main__ - Step 26254: {'lr': 0.00019983889068761736, 'samples': 840128, 'steps': 1640, 'loss/train': 2.927589178085327} -09/20/2021 20:10:25 - INFO - __main__ - Step 26255: {'lr': 0.00019983889068761736, 'samples': 840160, 'steps': 1640, 'loss/train': 2.3849925994873047} -09/20/2021 20:10:26 - INFO - __main__ - Step 26256: {'lr': 0.00019983889068761736, 'samples': 840192, 'steps': 1640, 'loss/train': 2.4915072917938232} -09/20/2021 20:10:27 - INFO - __main__ - Step 26257: {'lr': 0.0001998385285383426, 'samples': 840224, 'steps': 1641, 'loss/train': 4.056159973144531} -09/20/2021 20:10:28 - INFO - __main__ - Step 26258: {'lr': 0.0001998385285383426, 'samples': 840256, 'steps': 1641, 'loss/train': 2.2865965366363525} -09/20/2021 20:10:28 - INFO - __main__ - Step 26259: {'lr': 0.0001998385285383426, 'samples': 840288, 'steps': 1641, 'loss/train': 0.9041846990585327} -09/20/2021 20:10:29 - INFO - __main__ - Step 26260: {'lr': 0.0001998385285383426, 'samples': 840320, 'steps': 1641, 'loss/train': 2.80637788772583} -09/20/2021 20:10:30 - INFO - __main__ - Step 26261: {'lr': 0.0001998385285383426, 'samples': 840352, 'steps': 1641, 'loss/train': 3.34932017326355} -09/20/2021 20:10:31 - INFO - __main__ - Step 26262: {'lr': 0.0001998385285383426, 'samples': 840384, 'steps': 1641, 'loss/train': 2.820539712905884} -09/20/2021 20:10:31 - INFO - __main__ - Step 26263: {'lr': 0.0001998385285383426, 'samples': 840416, 'steps': 1641, 'loss/train': 2.84098219871521} -09/20/2021 20:10:33 - INFO - __main__ - Step 26264: {'lr': 0.0001998385285383426, 'samples': 840448, 'steps': 1641, 'loss/train': 2.8080954551696777} -09/20/2021 20:10:33 - INFO - __main__ - Step 26265: {'lr': 0.0001998385285383426, 'samples': 840480, 'steps': 1641, 'loss/train': 3.479624032974243} -09/20/2021 20:10:34 - INFO - __main__ - Step 26266: {'lr': 0.0001998385285383426, 'samples': 840512, 'steps': 1641, 'loss/train': 3.1406381130218506} -09/20/2021 20:10:35 - INFO - __main__ - Step 26267: {'lr': 0.0001998385285383426, 'samples': 840544, 'steps': 1641, 'loss/train': 3.1245522499084473} -09/20/2021 20:10:36 - INFO - __main__ - Step 26268: {'lr': 0.0001998385285383426, 'samples': 840576, 'steps': 1641, 'loss/train': 3.04880690574646} -09/20/2021 20:10:36 - INFO - __main__ - Step 26269: {'lr': 0.0001998385285383426, 'samples': 840608, 'steps': 1641, 'loss/train': 1.798531174659729} -09/20/2021 20:10:37 - INFO - __main__ - Step 26270: {'lr': 0.0001998385285383426, 'samples': 840640, 'steps': 1641, 'loss/train': 2.432431697845459} -09/20/2021 20:10:38 - INFO - __main__ - Step 26271: {'lr': 0.0001998385285383426, 'samples': 840672, 'steps': 1641, 'loss/train': 2.8857674598693848} -09/20/2021 20:10:39 - INFO - __main__ - Step 26272: {'lr': 0.0001998385285383426, 'samples': 840704, 'steps': 1641, 'loss/train': 1.6897215843200684} -09/20/2021 20:10:40 - INFO - __main__ - Step 26273: {'lr': 0.00019983816598282523, 'samples': 840736, 'steps': 1642, 'loss/train': 2.264961004257202} -09/20/2021 20:10:40 - INFO - __main__ - Step 26274: {'lr': 0.00019983816598282523, 'samples': 840768, 'steps': 1642, 'loss/train': 2.0903189182281494} -09/20/2021 20:10:41 - INFO - __main__ - Step 26275: {'lr': 0.00019983816598282523, 'samples': 840800, 'steps': 1642, 'loss/train': 1.5287175178527832} -09/20/2021 20:10:42 - INFO - __main__ - Step 26276: {'lr': 0.00019983816598282523, 'samples': 840832, 'steps': 1642, 'loss/train': 2.4447920322418213} -09/20/2021 20:10:43 - INFO - __main__ - Step 26277: {'lr': 0.00019983816598282523, 'samples': 840864, 'steps': 1642, 'loss/train': 2.9741458892822266} -09/20/2021 20:10:43 - INFO - __main__ - Step 26278: {'lr': 0.00019983816598282523, 'samples': 840896, 'steps': 1642, 'loss/train': 2.8171393871307373} -09/20/2021 20:10:44 - INFO - __main__ - Step 26279: {'lr': 0.00019983816598282523, 'samples': 840928, 'steps': 1642, 'loss/train': 3.311988353729248} -09/20/2021 20:10:45 - INFO - __main__ - Step 26280: {'lr': 0.00019983816598282523, 'samples': 840960, 'steps': 1642, 'loss/train': 2.8787314891815186} -09/20/2021 20:10:46 - INFO - __main__ - Step 26281: {'lr': 0.00019983816598282523, 'samples': 840992, 'steps': 1642, 'loss/train': 3.6911275386810303} -09/20/2021 20:10:46 - INFO - __main__ - Step 26282: {'lr': 0.00019983816598282523, 'samples': 841024, 'steps': 1642, 'loss/train': 2.206862449645996} -09/20/2021 20:10:47 - INFO - __main__ - Step 26283: {'lr': 0.00019983816598282523, 'samples': 841056, 'steps': 1642, 'loss/train': 2.4336280822753906} -09/20/2021 20:10:48 - INFO - __main__ - Step 26284: {'lr': 0.00019983816598282523, 'samples': 841088, 'steps': 1642, 'loss/train': 2.3179638385772705} -09/20/2021 20:10:49 - INFO - __main__ - Step 26285: {'lr': 0.00019983816598282523, 'samples': 841120, 'steps': 1642, 'loss/train': 3.0087454319000244} -09/20/2021 20:10:49 - INFO - __main__ - Step 26286: {'lr': 0.00019983816598282523, 'samples': 841152, 'steps': 1642, 'loss/train': 2.602214813232422} -09/20/2021 20:10:50 - INFO - __main__ - Step 26287: {'lr': 0.00019983816598282523, 'samples': 841184, 'steps': 1642, 'loss/train': 2.6998727321624756} -09/20/2021 20:10:51 - INFO - __main__ - Step 26288: {'lr': 0.00019983816598282523, 'samples': 841216, 'steps': 1642, 'loss/train': 3.1649832725524902} -09/20/2021 20:10:52 - INFO - __main__ - Step 26289: {'lr': 0.00019983780302106673, 'samples': 841248, 'steps': 1643, 'loss/train': 2.564171552658081} -09/20/2021 20:10:52 - INFO - __main__ - Step 26290: {'lr': 0.00019983780302106673, 'samples': 841280, 'steps': 1643, 'loss/train': 3.3648202419281006} -09/20/2021 20:10:53 - INFO - __main__ - Step 26291: {'lr': 0.00019983780302106673, 'samples': 841312, 'steps': 1643, 'loss/train': 1.916944146156311} -09/20/2021 20:10:54 - INFO - __main__ - Step 26292: {'lr': 0.00019983780302106673, 'samples': 841344, 'steps': 1643, 'loss/train': 2.9309329986572266} -09/20/2021 20:10:55 - INFO - __main__ - Step 26293: {'lr': 0.00019983780302106673, 'samples': 841376, 'steps': 1643, 'loss/train': 2.3965871334075928} -09/20/2021 20:10:55 - INFO - __main__ - Step 26294: {'lr': 0.00019983780302106673, 'samples': 841408, 'steps': 1643, 'loss/train': 2.885108709335327} -09/20/2021 20:10:57 - INFO - __main__ - Step 26295: {'lr': 0.00019983780302106673, 'samples': 841440, 'steps': 1643, 'loss/train': 2.2781083583831787} -09/20/2021 20:10:58 - INFO - __main__ - Step 26296: {'lr': 0.00019983780302106673, 'samples': 841472, 'steps': 1643, 'loss/train': 2.4903969764709473} -09/20/2021 20:10:58 - INFO - __main__ - Step 26297: {'lr': 0.00019983780302106673, 'samples': 841504, 'steps': 1643, 'loss/train': 2.1374638080596924} -09/20/2021 20:10:59 - INFO - __main__ - Step 26298: {'lr': 0.00019983780302106673, 'samples': 841536, 'steps': 1643, 'loss/train': 2.1250410079956055} -09/20/2021 20:11:00 - INFO - __main__ - Step 26299: {'lr': 0.00019983780302106673, 'samples': 841568, 'steps': 1643, 'loss/train': 3.01649808883667} -09/20/2021 20:11:01 - INFO - __main__ - Step 26300: {'lr': 0.00019983780302106673, 'samples': 841600, 'steps': 1643, 'loss/train': 2.7001149654388428} -09/20/2021 20:11:01 - INFO - __main__ - Step 26301: {'lr': 0.00019983780302106673, 'samples': 841632, 'steps': 1643, 'loss/train': 3.3854501247406006} -09/20/2021 20:11:02 - INFO - __main__ - Step 26302: {'lr': 0.00019983780302106673, 'samples': 841664, 'steps': 1643, 'loss/train': 2.133415460586548} -09/20/2021 20:11:03 - INFO - __main__ - Step 26303: {'lr': 0.00019983780302106673, 'samples': 841696, 'steps': 1643, 'loss/train': 1.8582360744476318} -09/20/2021 20:11:04 - INFO - __main__ - Step 26304: {'lr': 0.00019983780302106673, 'samples': 841728, 'steps': 1643, 'loss/train': 3.026453971862793} -09/20/2021 20:11:04 - INFO - __main__ - Step 26305: {'lr': 0.00019983743965306864, 'samples': 841760, 'steps': 1644, 'loss/train': 2.9216132164001465} -09/20/2021 20:11:05 - INFO - __main__ - Step 26306: {'lr': 0.00019983743965306864, 'samples': 841792, 'steps': 1644, 'loss/train': 2.4134390354156494} -09/20/2021 20:11:06 - INFO - __main__ - Step 26307: {'lr': 0.00019983743965306864, 'samples': 841824, 'steps': 1644, 'loss/train': 2.038738965988159} -09/20/2021 20:11:07 - INFO - __main__ - Step 26308: {'lr': 0.00019983743965306864, 'samples': 841856, 'steps': 1644, 'loss/train': 3.0436389446258545} -09/20/2021 20:11:07 - INFO - __main__ - Step 26309: {'lr': 0.00019983743965306864, 'samples': 841888, 'steps': 1644, 'loss/train': 4.992988586425781} -09/20/2021 20:11:08 - INFO - __main__ - Step 26310: {'lr': 0.00019983743965306864, 'samples': 841920, 'steps': 1644, 'loss/train': 2.2603094577789307} -09/20/2021 20:11:09 - INFO - __main__ - Step 26311: {'lr': 0.00019983743965306864, 'samples': 841952, 'steps': 1644, 'loss/train': 2.756256103515625} -09/20/2021 20:11:10 - INFO - __main__ - Step 26312: {'lr': 0.00019983743965306864, 'samples': 841984, 'steps': 1644, 'loss/train': 3.187565565109253} -09/20/2021 20:11:10 - INFO - __main__ - Step 26313: {'lr': 0.00019983743965306864, 'samples': 842016, 'steps': 1644, 'loss/train': 3.295358896255493} -09/20/2021 20:11:11 - INFO - __main__ - Step 26314: {'lr': 0.00019983743965306864, 'samples': 842048, 'steps': 1644, 'loss/train': 1.9637635946273804} -09/20/2021 20:11:12 - INFO - __main__ - Step 26315: {'lr': 0.00019983743965306864, 'samples': 842080, 'steps': 1644, 'loss/train': 1.8881261348724365} -09/20/2021 20:11:13 - INFO - __main__ - Step 26316: {'lr': 0.00019983743965306864, 'samples': 842112, 'steps': 1644, 'loss/train': 2.58305025100708} -09/20/2021 20:11:13 - INFO - __main__ - Step 26317: {'lr': 0.00019983743965306864, 'samples': 842144, 'steps': 1644, 'loss/train': 1.870381474494934} -09/20/2021 20:11:14 - INFO - __main__ - Step 26318: {'lr': 0.00019983743965306864, 'samples': 842176, 'steps': 1644, 'loss/train': 2.0613205432891846} -09/20/2021 20:11:15 - INFO - __main__ - Step 26319: {'lr': 0.00019983743965306864, 'samples': 842208, 'steps': 1644, 'loss/train': 2.689241886138916} -09/20/2021 20:11:16 - INFO - __main__ - Step 26320: {'lr': 0.00019983743965306864, 'samples': 842240, 'steps': 1644, 'loss/train': 3.281999349594116} -09/20/2021 20:11:17 - INFO - __main__ - Step 26321: {'lr': 0.00019983707587883237, 'samples': 842272, 'steps': 1645, 'loss/train': 2.8106319904327393} -09/20/2021 20:11:17 - INFO - __main__ - Step 26322: {'lr': 0.00019983707587883237, 'samples': 842304, 'steps': 1645, 'loss/train': 2.5464766025543213} -09/20/2021 20:11:18 - INFO - __main__ - Step 26323: {'lr': 0.00019983707587883237, 'samples': 842336, 'steps': 1645, 'loss/train': 3.6964757442474365} -09/20/2021 20:11:19 - INFO - __main__ - Step 26324: {'lr': 0.00019983707587883237, 'samples': 842368, 'steps': 1645, 'loss/train': 2.5762526988983154} -09/20/2021 20:11:21 - INFO - __main__ - Step 26325: {'lr': 0.00019983707587883237, 'samples': 842400, 'steps': 1645, 'loss/train': 2.3251256942749023} -09/20/2021 20:11:22 - INFO - __main__ - Step 26326: {'lr': 0.00019983707587883237, 'samples': 842432, 'steps': 1645, 'loss/train': 2.890550136566162} -09/20/2021 20:11:22 - INFO - __main__ - Step 26327: {'lr': 0.00019983707587883237, 'samples': 842464, 'steps': 1645, 'loss/train': 2.9354348182678223} -09/20/2021 20:11:23 - INFO - __main__ - Step 26328: {'lr': 0.00019983707587883237, 'samples': 842496, 'steps': 1645, 'loss/train': 2.8521130084991455} -09/20/2021 20:11:24 - INFO - __main__ - Step 26329: {'lr': 0.00019983707587883237, 'samples': 842528, 'steps': 1645, 'loss/train': 2.035203695297241} -09/20/2021 20:11:25 - INFO - __main__ - Step 26330: {'lr': 0.00019983707587883237, 'samples': 842560, 'steps': 1645, 'loss/train': 3.2312166690826416} -09/20/2021 20:11:25 - INFO - __main__ - Step 26331: {'lr': 0.00019983707587883237, 'samples': 842592, 'steps': 1645, 'loss/train': 1.6243846416473389} -09/20/2021 20:11:26 - INFO - __main__ - Step 26332: {'lr': 0.00019983707587883237, 'samples': 842624, 'steps': 1645, 'loss/train': 1.8468018770217896} -09/20/2021 20:11:27 - INFO - __main__ - Step 26333: {'lr': 0.00019983707587883237, 'samples': 842656, 'steps': 1645, 'loss/train': 1.7005974054336548} -09/20/2021 20:11:28 - INFO - __main__ - Step 26334: {'lr': 0.00019983707587883237, 'samples': 842688, 'steps': 1645, 'loss/train': 1.793036699295044} -09/20/2021 20:11:28 - INFO - __main__ - Step 26335: {'lr': 0.00019983707587883237, 'samples': 842720, 'steps': 1645, 'loss/train': 2.147348165512085} -09/20/2021 20:11:29 - INFO - __main__ - Step 26336: {'lr': 0.00019983707587883237, 'samples': 842752, 'steps': 1645, 'loss/train': 2.0850462913513184} -09/20/2021 20:11:30 - INFO - __main__ - Step 26337: {'lr': 0.0001998367116983594, 'samples': 842784, 'steps': 1646, 'loss/train': 2.5056450366973877} -09/20/2021 20:11:31 - INFO - __main__ - Step 26338: {'lr': 0.0001998367116983594, 'samples': 842816, 'steps': 1646, 'loss/train': 2.3738677501678467} -09/20/2021 20:11:32 - INFO - __main__ - Step 26339: {'lr': 0.0001998367116983594, 'samples': 842848, 'steps': 1646, 'loss/train': 2.5336008071899414} -09/20/2021 20:11:32 - INFO - __main__ - Step 26340: {'lr': 0.0001998367116983594, 'samples': 842880, 'steps': 1646, 'loss/train': 0.5271092653274536} -09/20/2021 20:11:33 - INFO - __main__ - Step 26341: {'lr': 0.0001998367116983594, 'samples': 842912, 'steps': 1646, 'loss/train': 2.9026615619659424} -09/20/2021 20:11:34 - INFO - __main__ - Step 26342: {'lr': 0.0001998367116983594, 'samples': 842944, 'steps': 1646, 'loss/train': 3.1264071464538574} -09/20/2021 20:11:35 - INFO - __main__ - Step 26343: {'lr': 0.0001998367116983594, 'samples': 842976, 'steps': 1646, 'loss/train': 2.2559103965759277} -09/20/2021 20:11:35 - INFO - __main__ - Step 26344: {'lr': 0.0001998367116983594, 'samples': 843008, 'steps': 1646, 'loss/train': 2.5472404956817627} -09/20/2021 20:11:36 - INFO - __main__ - Step 26345: {'lr': 0.0001998367116983594, 'samples': 843040, 'steps': 1646, 'loss/train': 2.3598453998565674} -09/20/2021 20:11:37 - INFO - __main__ - Step 26346: {'lr': 0.0001998367116983594, 'samples': 843072, 'steps': 1646, 'loss/train': 2.0118515491485596} -09/20/2021 20:11:38 - INFO - __main__ - Step 26347: {'lr': 0.0001998367116983594, 'samples': 843104, 'steps': 1646, 'loss/train': 2.819377899169922} -09/20/2021 20:11:38 - INFO - __main__ - Step 26348: {'lr': 0.0001998367116983594, 'samples': 843136, 'steps': 1646, 'loss/train': 2.7703664302825928} -09/20/2021 20:11:39 - INFO - __main__ - Step 26349: {'lr': 0.0001998367116983594, 'samples': 843168, 'steps': 1646, 'loss/train': 1.8571836948394775} -09/20/2021 20:11:40 - INFO - __main__ - Step 26350: {'lr': 0.0001998367116983594, 'samples': 843200, 'steps': 1646, 'loss/train': 2.7404398918151855} -09/20/2021 20:11:41 - INFO - __main__ - Step 26351: {'lr': 0.0001998367116983594, 'samples': 843232, 'steps': 1646, 'loss/train': 4.182501316070557} -09/20/2021 20:11:41 - INFO - __main__ - Step 26352: {'lr': 0.0001998367116983594, 'samples': 843264, 'steps': 1646, 'loss/train': 2.6151540279388428} -09/20/2021 20:11:42 - INFO - __main__ - Step 26353: {'lr': 0.0001998363471116513, 'samples': 843296, 'steps': 1647, 'loss/train': 2.425910234451294} -09/20/2021 20:11:43 - INFO - __main__ - Step 26354: {'lr': 0.0001998363471116513, 'samples': 843328, 'steps': 1647, 'loss/train': 2.6368868350982666} -09/20/2021 20:11:44 - INFO - __main__ - Step 26355: {'lr': 0.0001998363471116513, 'samples': 843360, 'steps': 1647, 'loss/train': 2.5931167602539062} -09/20/2021 20:11:45 - INFO - __main__ - Step 26356: {'lr': 0.0001998363471116513, 'samples': 843392, 'steps': 1647, 'loss/train': 1.0595674514770508} -09/20/2021 20:11:46 - INFO - __main__ - Step 26357: {'lr': 0.0001998363471116513, 'samples': 843424, 'steps': 1647, 'loss/train': 3.107424020767212} -09/20/2021 20:11:47 - INFO - __main__ - Step 26358: {'lr': 0.0001998363471116513, 'samples': 843456, 'steps': 1647, 'loss/train': 3.0594115257263184} -09/20/2021 20:11:47 - INFO - __main__ - Step 26359: {'lr': 0.0001998363471116513, 'samples': 843488, 'steps': 1647, 'loss/train': 3.786937952041626} -09/20/2021 20:11:48 - INFO - __main__ - Step 26360: {'lr': 0.0001998363471116513, 'samples': 843520, 'steps': 1647, 'loss/train': 3.211509943008423} -09/20/2021 20:11:49 - INFO - __main__ - Step 26361: {'lr': 0.0001998363471116513, 'samples': 843552, 'steps': 1647, 'loss/train': 3.248751401901245} -09/20/2021 20:11:50 - INFO - __main__ - Step 26362: {'lr': 0.0001998363471116513, 'samples': 843584, 'steps': 1647, 'loss/train': 3.2342913150787354} -09/20/2021 20:11:50 - INFO - __main__ - Step 26363: {'lr': 0.0001998363471116513, 'samples': 843616, 'steps': 1647, 'loss/train': 2.685828924179077} -09/20/2021 20:11:51 - INFO - __main__ - Step 26364: {'lr': 0.0001998363471116513, 'samples': 843648, 'steps': 1647, 'loss/train': 2.652070999145508} -09/20/2021 20:11:52 - INFO - __main__ - Step 26365: {'lr': 0.0001998363471116513, 'samples': 843680, 'steps': 1647, 'loss/train': 2.291590929031372} -09/20/2021 20:11:53 - INFO - __main__ - Step 26366: {'lr': 0.0001998363471116513, 'samples': 843712, 'steps': 1647, 'loss/train': 2.3676013946533203} -09/20/2021 20:11:53 - INFO - __main__ - Step 26367: {'lr': 0.0001998363471116513, 'samples': 843744, 'steps': 1647, 'loss/train': 1.027701497077942} -09/20/2021 20:11:54 - INFO - __main__ - Step 26368: {'lr': 0.0001998363471116513, 'samples': 843776, 'steps': 1647, 'loss/train': 2.4814445972442627} -09/20/2021 20:11:55 - INFO - __main__ - Step 26369: {'lr': 0.00019983598211870945, 'samples': 843808, 'steps': 1648, 'loss/train': 2.6642849445343018} -09/20/2021 20:11:56 - INFO - __main__ - Step 26370: {'lr': 0.00019983598211870945, 'samples': 843840, 'steps': 1648, 'loss/train': 2.5185158252716064} -09/20/2021 20:11:56 - INFO - __main__ - Step 26371: {'lr': 0.00019983598211870945, 'samples': 843872, 'steps': 1648, 'loss/train': 2.588371753692627} -09/20/2021 20:11:57 - INFO - __main__ - Step 26372: {'lr': 0.00019983598211870945, 'samples': 843904, 'steps': 1648, 'loss/train': 3.3856558799743652} -09/20/2021 20:11:58 - INFO - __main__ - Step 26373: {'lr': 0.00019983598211870945, 'samples': 843936, 'steps': 1648, 'loss/train': 2.990528106689453} -09/20/2021 20:11:59 - INFO - __main__ - Step 26374: {'lr': 0.00019983598211870945, 'samples': 843968, 'steps': 1648, 'loss/train': 3.0191714763641357} -09/20/2021 20:11:59 - INFO - __main__ - Step 26375: {'lr': 0.00019983598211870945, 'samples': 844000, 'steps': 1648, 'loss/train': 0.4762190580368042} -09/20/2021 20:12:00 - INFO - __main__ - Step 26376: {'lr': 0.00019983598211870945, 'samples': 844032, 'steps': 1648, 'loss/train': 0.46812117099761963} -09/20/2021 20:12:01 - INFO - __main__ - Step 26377: {'lr': 0.00019983598211870945, 'samples': 844064, 'steps': 1648, 'loss/train': 0.410677433013916} -09/20/2021 20:12:02 - INFO - __main__ - Step 26378: {'lr': 0.00019983598211870945, 'samples': 844096, 'steps': 1648, 'loss/train': 2.708143711090088} -09/20/2021 20:12:02 - INFO - __main__ - Step 26379: {'lr': 0.00019983598211870945, 'samples': 844128, 'steps': 1648, 'loss/train': 4.272956371307373} -09/20/2021 20:12:03 - INFO - __main__ - Step 26380: {'lr': 0.00019983598211870945, 'samples': 844160, 'steps': 1648, 'loss/train': 0.5698131918907166} -09/20/2021 20:12:04 - INFO - __main__ - Step 26381: {'lr': 0.00019983598211870945, 'samples': 844192, 'steps': 1648, 'loss/train': 1.8328901529312134} -09/20/2021 20:12:05 - INFO - __main__ - Step 26382: {'lr': 0.00019983598211870945, 'samples': 844224, 'steps': 1648, 'loss/train': 2.914828300476074} -09/20/2021 20:12:05 - INFO - __main__ - Step 26383: {'lr': 0.00019983598211870945, 'samples': 844256, 'steps': 1648, 'loss/train': 2.9870331287384033} -09/20/2021 20:12:06 - INFO - __main__ - Step 26384: {'lr': 0.00019983598211870945, 'samples': 844288, 'steps': 1648, 'loss/train': 3.1253814697265625} -09/20/2021 20:12:07 - INFO - __main__ - Step 26385: {'lr': 0.00019983561671953537, 'samples': 844320, 'steps': 1649, 'loss/train': 3.1319825649261475} -09/20/2021 20:12:08 - INFO - __main__ - Step 26386: {'lr': 0.00019983561671953537, 'samples': 844352, 'steps': 1649, 'loss/train': 3.4537670612335205} -09/20/2021 20:12:09 - INFO - __main__ - Step 26387: {'lr': 0.00019983561671953537, 'samples': 844384, 'steps': 1649, 'loss/train': 2.748106002807617} -09/20/2021 20:12:10 - INFO - __main__ - Step 26388: {'lr': 0.00019983561671953537, 'samples': 844416, 'steps': 1649, 'loss/train': 2.2835440635681152} -09/20/2021 20:12:11 - INFO - __main__ - Step 26389: {'lr': 0.00019983561671953537, 'samples': 844448, 'steps': 1649, 'loss/train': 3.8658604621887207} -09/20/2021 20:12:11 - INFO - __main__ - Step 26390: {'lr': 0.00019983561671953537, 'samples': 844480, 'steps': 1649, 'loss/train': 0.5745031237602234} -09/20/2021 20:12:12 - INFO - __main__ - Step 26391: {'lr': 0.00019983561671953537, 'samples': 844512, 'steps': 1649, 'loss/train': 2.4370627403259277} -09/20/2021 20:12:13 - INFO - __main__ - Step 26392: {'lr': 0.00019983561671953537, 'samples': 844544, 'steps': 1649, 'loss/train': 1.6739228963851929} -09/20/2021 20:12:14 - INFO - __main__ - Step 26393: {'lr': 0.00019983561671953537, 'samples': 844576, 'steps': 1649, 'loss/train': 4.055569171905518} -09/20/2021 20:12:14 - INFO - __main__ - Step 26394: {'lr': 0.00019983561671953537, 'samples': 844608, 'steps': 1649, 'loss/train': 2.895179033279419} -09/20/2021 20:12:15 - INFO - __main__ - Step 26395: {'lr': 0.00019983561671953537, 'samples': 844640, 'steps': 1649, 'loss/train': 2.973257064819336} -09/20/2021 20:12:16 - INFO - __main__ - Step 26396: {'lr': 0.00019983561671953537, 'samples': 844672, 'steps': 1649, 'loss/train': 2.4739491939544678} -09/20/2021 20:12:17 - INFO - __main__ - Step 26397: {'lr': 0.00019983561671953537, 'samples': 844704, 'steps': 1649, 'loss/train': 2.6292877197265625} -09/20/2021 20:12:17 - INFO - __main__ - Step 26398: {'lr': 0.00019983561671953537, 'samples': 844736, 'steps': 1649, 'loss/train': 3.052520990371704} -09/20/2021 20:12:18 - INFO - __main__ - Step 26399: {'lr': 0.00019983561671953537, 'samples': 844768, 'steps': 1649, 'loss/train': 3.2393999099731445} -09/20/2021 20:12:19 - INFO - __main__ - Step 26400: {'lr': 0.00019983561671953537, 'samples': 844800, 'steps': 1649, 'loss/train': 2.3161423206329346} -09/20/2021 20:12:20 - INFO - __main__ - Step 26401: {'lr': 0.00019983525091413058, 'samples': 844832, 'steps': 1650, 'loss/train': 3.7499477863311768} -09/20/2021 20:12:21 - INFO - __main__ - Step 26402: {'lr': 0.00019983525091413058, 'samples': 844864, 'steps': 1650, 'loss/train': 2.2070508003234863} -09/20/2021 20:12:21 - INFO - __main__ - Step 26403: {'lr': 0.00019983525091413058, 'samples': 844896, 'steps': 1650, 'loss/train': 3.112889289855957} -09/20/2021 20:12:22 - INFO - __main__ - Step 26404: {'lr': 0.00019983525091413058, 'samples': 844928, 'steps': 1650, 'loss/train': 2.6582887172698975} -09/20/2021 20:12:23 - INFO - __main__ - Step 26405: {'lr': 0.00019983525091413058, 'samples': 844960, 'steps': 1650, 'loss/train': 3.586115837097168} -09/20/2021 20:12:24 - INFO - __main__ - Step 26406: {'lr': 0.00019983525091413058, 'samples': 844992, 'steps': 1650, 'loss/train': 3.8811466693878174} -09/20/2021 20:12:24 - INFO - __main__ - Step 26407: {'lr': 0.00019983525091413058, 'samples': 845024, 'steps': 1650, 'loss/train': 2.8742687702178955} -09/20/2021 20:12:25 - INFO - __main__ - Step 26408: {'lr': 0.00019983525091413058, 'samples': 845056, 'steps': 1650, 'loss/train': 2.7319588661193848} -09/20/2021 20:12:26 - INFO - __main__ - Step 26409: {'lr': 0.00019983525091413058, 'samples': 845088, 'steps': 1650, 'loss/train': 3.352959156036377} -09/20/2021 20:12:27 - INFO - __main__ - Step 26410: {'lr': 0.00019983525091413058, 'samples': 845120, 'steps': 1650, 'loss/train': 2.8409879207611084} -09/20/2021 20:12:27 - INFO - __main__ - Step 26411: {'lr': 0.00019983525091413058, 'samples': 845152, 'steps': 1650, 'loss/train': 2.9880826473236084} -09/20/2021 20:12:28 - INFO - __main__ - Step 26412: {'lr': 0.00019983525091413058, 'samples': 845184, 'steps': 1650, 'loss/train': 2.9285330772399902} -09/20/2021 20:12:29 - INFO - __main__ - Step 26413: {'lr': 0.00019983525091413058, 'samples': 845216, 'steps': 1650, 'loss/train': 3.471025228500366} -09/20/2021 20:12:30 - INFO - __main__ - Step 26414: {'lr': 0.00019983525091413058, 'samples': 845248, 'steps': 1650, 'loss/train': 3.4934866428375244} -09/20/2021 20:12:30 - INFO - __main__ - Step 26415: {'lr': 0.00019983525091413058, 'samples': 845280, 'steps': 1650, 'loss/train': 2.6064682006835938} -09/20/2021 20:12:31 - INFO - __main__ - Step 26416: {'lr': 0.00019983525091413058, 'samples': 845312, 'steps': 1650, 'loss/train': 1.5612967014312744} -09/20/2021 20:12:32 - INFO - __main__ - Step 26417: {'lr': 0.00019983488470249648, 'samples': 845344, 'steps': 1651, 'loss/train': 2.5364506244659424} -09/20/2021 20:12:33 - INFO - __main__ - Step 26418: {'lr': 0.00019983488470249648, 'samples': 845376, 'steps': 1651, 'loss/train': 2.1044859886169434} -09/20/2021 20:12:34 - INFO - __main__ - Step 26419: {'lr': 0.00019983488470249648, 'samples': 845408, 'steps': 1651, 'loss/train': 2.953850030899048} -09/20/2021 20:12:35 - INFO - __main__ - Step 26420: {'lr': 0.00019983488470249648, 'samples': 845440, 'steps': 1651, 'loss/train': 3.0221073627471924} -09/20/2021 20:12:35 - INFO - __main__ - Step 26421: {'lr': 0.00019983488470249648, 'samples': 845472, 'steps': 1651, 'loss/train': 3.4602572917938232} -09/20/2021 20:12:36 - INFO - __main__ - Step 26422: {'lr': 0.00019983488470249648, 'samples': 845504, 'steps': 1651, 'loss/train': 1.5057538747787476} -09/20/2021 20:12:37 - INFO - __main__ - Step 26423: {'lr': 0.00019983488470249648, 'samples': 845536, 'steps': 1651, 'loss/train': 1.863347053527832} -09/20/2021 20:12:38 - INFO - __main__ - Step 26424: {'lr': 0.00019983488470249648, 'samples': 845568, 'steps': 1651, 'loss/train': 2.8099417686462402} -09/20/2021 20:12:38 - INFO - __main__ - Step 26425: {'lr': 0.00019983488470249648, 'samples': 845600, 'steps': 1651, 'loss/train': 4.159984111785889} -09/20/2021 20:12:39 - INFO - __main__ - Step 26426: {'lr': 0.00019983488470249648, 'samples': 845632, 'steps': 1651, 'loss/train': 2.751988649368286} -09/20/2021 20:12:40 - INFO - __main__ - Step 26427: {'lr': 0.00019983488470249648, 'samples': 845664, 'steps': 1651, 'loss/train': 3.2487523555755615} -09/20/2021 20:12:41 - INFO - __main__ - Step 26428: {'lr': 0.00019983488470249648, 'samples': 845696, 'steps': 1651, 'loss/train': 3.38248348236084} -09/20/2021 20:12:41 - INFO - __main__ - Step 26429: {'lr': 0.00019983488470249648, 'samples': 845728, 'steps': 1651, 'loss/train': 2.342910051345825} -09/20/2021 20:12:42 - INFO - __main__ - Step 26430: {'lr': 0.00019983488470249648, 'samples': 845760, 'steps': 1651, 'loss/train': 2.7289233207702637} -09/20/2021 20:12:43 - INFO - __main__ - Step 26431: {'lr': 0.00019983488470249648, 'samples': 845792, 'steps': 1651, 'loss/train': 3.1480743885040283} -09/20/2021 20:12:44 - INFO - __main__ - Step 26432: {'lr': 0.00019983488470249648, 'samples': 845824, 'steps': 1651, 'loss/train': 2.4675729274749756} -09/20/2021 20:12:45 - INFO - __main__ - Step 26433: {'lr': 0.00019983451808463468, 'samples': 845856, 'steps': 1652, 'loss/train': 2.9750444889068604} -09/20/2021 20:12:45 - INFO - __main__ - Step 26434: {'lr': 0.00019983451808463468, 'samples': 845888, 'steps': 1652, 'loss/train': 3.586238384246826} -09/20/2021 20:12:46 - INFO - __main__ - Step 26435: {'lr': 0.00019983451808463468, 'samples': 845920, 'steps': 1652, 'loss/train': 3.522520065307617} -09/20/2021 20:12:47 - INFO - __main__ - Step 26436: {'lr': 0.00019983451808463468, 'samples': 845952, 'steps': 1652, 'loss/train': 2.135934352874756} -09/20/2021 20:12:48 - INFO - __main__ - Step 26437: {'lr': 0.00019983451808463468, 'samples': 845984, 'steps': 1652, 'loss/train': 3.3610615730285645} -09/20/2021 20:12:48 - INFO - __main__ - Step 26438: {'lr': 0.00019983451808463468, 'samples': 846016, 'steps': 1652, 'loss/train': 2.155480146408081} -09/20/2021 20:12:49 - INFO - __main__ - Step 26439: {'lr': 0.00019983451808463468, 'samples': 846048, 'steps': 1652, 'loss/train': 2.5826597213745117} -09/20/2021 20:12:50 - INFO - __main__ - Step 26440: {'lr': 0.00019983451808463468, 'samples': 846080, 'steps': 1652, 'loss/train': 3.3081166744232178} -09/20/2021 20:12:51 - INFO - __main__ - Step 26441: {'lr': 0.00019983451808463468, 'samples': 846112, 'steps': 1652, 'loss/train': 3.7047598361968994} -09/20/2021 20:12:51 - INFO - __main__ - Step 26442: {'lr': 0.00019983451808463468, 'samples': 846144, 'steps': 1652, 'loss/train': 3.1546361446380615} -09/20/2021 20:12:52 - INFO - __main__ - Step 26443: {'lr': 0.00019983451808463468, 'samples': 846176, 'steps': 1652, 'loss/train': 2.6982812881469727} -09/20/2021 20:12:53 - INFO - __main__ - Step 26444: {'lr': 0.00019983451808463468, 'samples': 846208, 'steps': 1652, 'loss/train': 2.0149238109588623} -09/20/2021 20:12:54 - INFO - __main__ - Step 26445: {'lr': 0.00019983451808463468, 'samples': 846240, 'steps': 1652, 'loss/train': 2.9273722171783447} -09/20/2021 20:12:54 - INFO - __main__ - Step 26446: {'lr': 0.00019983451808463468, 'samples': 846272, 'steps': 1652, 'loss/train': 2.5432236194610596} -09/20/2021 20:12:55 - INFO - __main__ - Step 26447: {'lr': 0.00019983451808463468, 'samples': 846304, 'steps': 1652, 'loss/train': 2.4141485691070557} -09/20/2021 20:12:56 - INFO - __main__ - Step 26448: {'lr': 0.00019983451808463468, 'samples': 846336, 'steps': 1652, 'loss/train': 2.3331172466278076} -09/20/2021 20:12:57 - INFO - __main__ - Step 26449: {'lr': 0.00019983415106054664, 'samples': 846368, 'steps': 1653, 'loss/train': 2.5213069915771484} -09/20/2021 20:12:58 - INFO - __main__ - Step 26450: {'lr': 0.00019983415106054664, 'samples': 846400, 'steps': 1653, 'loss/train': 2.307919979095459} -09/20/2021 20:12:59 - INFO - __main__ - Step 26451: {'lr': 0.00019983415106054664, 'samples': 846432, 'steps': 1653, 'loss/train': 2.7201805114746094} -09/20/2021 20:12:59 - INFO - __main__ - Step 26452: {'lr': 0.00019983415106054664, 'samples': 846464, 'steps': 1653, 'loss/train': 3.401550769805908} -09/20/2021 20:13:00 - INFO - __main__ - Step 26453: {'lr': 0.00019983415106054664, 'samples': 846496, 'steps': 1653, 'loss/train': 3.762312412261963} -09/20/2021 20:13:01 - INFO - __main__ - Step 26454: {'lr': 0.00019983415106054664, 'samples': 846528, 'steps': 1653, 'loss/train': 2.323119878768921} -09/20/2021 20:13:02 - INFO - __main__ - Step 26455: {'lr': 0.00019983415106054664, 'samples': 846560, 'steps': 1653, 'loss/train': 2.88197660446167} -09/20/2021 20:13:02 - INFO - __main__ - Step 26456: {'lr': 0.00019983415106054664, 'samples': 846592, 'steps': 1653, 'loss/train': 3.2909274101257324} -09/20/2021 20:13:03 - INFO - __main__ - Step 26457: {'lr': 0.00019983415106054664, 'samples': 846624, 'steps': 1653, 'loss/train': 2.8034486770629883} -09/20/2021 20:13:04 - INFO - __main__ - Step 26458: {'lr': 0.00019983415106054664, 'samples': 846656, 'steps': 1653, 'loss/train': 2.9350125789642334} -09/20/2021 20:13:05 - INFO - __main__ - Step 26459: {'lr': 0.00019983415106054664, 'samples': 846688, 'steps': 1653, 'loss/train': 2.1955385208129883} -09/20/2021 20:13:05 - INFO - __main__ - Step 26460: {'lr': 0.00019983415106054664, 'samples': 846720, 'steps': 1653, 'loss/train': 1.9574912786483765} -09/20/2021 20:13:06 - INFO - __main__ - Step 26461: {'lr': 0.00019983415106054664, 'samples': 846752, 'steps': 1653, 'loss/train': 2.5451316833496094} -09/20/2021 20:13:07 - INFO - __main__ - Step 26462: {'lr': 0.00019983415106054664, 'samples': 846784, 'steps': 1653, 'loss/train': 3.360661029815674} -09/20/2021 20:13:08 - INFO - __main__ - Step 26463: {'lr': 0.00019983415106054664, 'samples': 846816, 'steps': 1653, 'loss/train': 3.0008485317230225} -09/20/2021 20:13:08 - INFO - __main__ - Step 26464: {'lr': 0.00019983415106054664, 'samples': 846848, 'steps': 1653, 'loss/train': 2.4146344661712646} -09/20/2021 20:13:09 - INFO - __main__ - Step 26465: {'lr': 0.00019983378363023376, 'samples': 846880, 'steps': 1654, 'loss/train': 2.7065699100494385} -09/20/2021 20:13:10 - INFO - __main__ - Step 26466: {'lr': 0.00019983378363023376, 'samples': 846912, 'steps': 1654, 'loss/train': 1.557321548461914} -09/20/2021 20:13:11 - INFO - __main__ - Step 26467: {'lr': 0.00019983378363023376, 'samples': 846944, 'steps': 1654, 'loss/train': 2.979710340499878} -09/20/2021 20:13:12 - INFO - __main__ - Step 26468: {'lr': 0.00019983378363023376, 'samples': 846976, 'steps': 1654, 'loss/train': 2.765944004058838} -09/20/2021 20:13:12 - INFO - __main__ - Step 26469: {'lr': 0.00019983378363023376, 'samples': 847008, 'steps': 1654, 'loss/train': 2.629793405532837} -09/20/2021 20:13:13 - INFO - __main__ - Step 26470: {'lr': 0.00019983378363023376, 'samples': 847040, 'steps': 1654, 'loss/train': 2.0907506942749023} -09/20/2021 20:13:14 - INFO - __main__ - Step 26471: {'lr': 0.00019983378363023376, 'samples': 847072, 'steps': 1654, 'loss/train': 2.603693962097168} -09/20/2021 20:13:15 - INFO - __main__ - Step 26472: {'lr': 0.00019983378363023376, 'samples': 847104, 'steps': 1654, 'loss/train': 1.857800006866455} -09/20/2021 20:13:15 - INFO - __main__ - Step 26473: {'lr': 0.00019983378363023376, 'samples': 847136, 'steps': 1654, 'loss/train': 2.0746426582336426} -09/20/2021 20:13:16 - INFO - __main__ - Step 26474: {'lr': 0.00019983378363023376, 'samples': 847168, 'steps': 1654, 'loss/train': 2.7358431816101074} -09/20/2021 20:13:17 - INFO - __main__ - Step 26475: {'lr': 0.00019983378363023376, 'samples': 847200, 'steps': 1654, 'loss/train': 3.1457972526550293} -09/20/2021 20:13:18 - INFO - __main__ - Step 26476: {'lr': 0.00019983378363023376, 'samples': 847232, 'steps': 1654, 'loss/train': 2.1304845809936523} -09/20/2021 20:13:18 - INFO - __main__ - Step 26477: {'lr': 0.00019983378363023376, 'samples': 847264, 'steps': 1654, 'loss/train': 2.3815629482269287} -09/20/2021 20:13:19 - INFO - __main__ - Step 26478: {'lr': 0.00019983378363023376, 'samples': 847296, 'steps': 1654, 'loss/train': 0.5333482027053833} -09/20/2021 20:13:20 - INFO - __main__ - Step 26479: {'lr': 0.00019983378363023376, 'samples': 847328, 'steps': 1654, 'loss/train': 1.7742570638656616} -09/20/2021 20:13:21 - INFO - __main__ - Step 26480: {'lr': 0.00019983378363023376, 'samples': 847360, 'steps': 1654, 'loss/train': 3.136242628097534} -09/20/2021 20:13:22 - INFO - __main__ - Step 26481: {'lr': 0.00019983341579369763, 'samples': 847392, 'steps': 1655, 'loss/train': 2.846858501434326} -09/20/2021 20:13:23 - INFO - __main__ - Step 26482: {'lr': 0.00019983341579369763, 'samples': 847424, 'steps': 1655, 'loss/train': 2.4839048385620117} -09/20/2021 20:13:24 - INFO - __main__ - Step 26483: {'lr': 0.00019983341579369763, 'samples': 847456, 'steps': 1655, 'loss/train': 3.1010451316833496} -09/20/2021 20:13:25 - INFO - __main__ - Step 26484: {'lr': 0.00019983341579369763, 'samples': 847488, 'steps': 1655, 'loss/train': 3.0053701400756836} -09/20/2021 20:13:26 - INFO - __main__ - Step 26485: {'lr': 0.00019983341579369763, 'samples': 847520, 'steps': 1655, 'loss/train': 3.1694350242614746} -09/20/2021 20:13:26 - INFO - __main__ - Step 26486: {'lr': 0.00019983341579369763, 'samples': 847552, 'steps': 1655, 'loss/train': 3.3262248039245605} -09/20/2021 20:13:27 - INFO - __main__ - Step 26487: {'lr': 0.00019983341579369763, 'samples': 847584, 'steps': 1655, 'loss/train': 2.0956239700317383} -09/20/2021 20:13:28 - INFO - __main__ - Step 26488: {'lr': 0.00019983341579369763, 'samples': 847616, 'steps': 1655, 'loss/train': 1.6526278257369995} -09/20/2021 20:13:29 - INFO - __main__ - Step 26489: {'lr': 0.00019983341579369763, 'samples': 847648, 'steps': 1655, 'loss/train': 2.304658889770508} -09/20/2021 20:13:29 - INFO - __main__ - Step 26490: {'lr': 0.00019983341579369763, 'samples': 847680, 'steps': 1655, 'loss/train': 2.3463175296783447} -09/20/2021 20:13:30 - INFO - __main__ - Step 26491: {'lr': 0.00019983341579369763, 'samples': 847712, 'steps': 1655, 'loss/train': 1.6445785760879517} -09/20/2021 20:13:31 - INFO - __main__ - Step 26492: {'lr': 0.00019983341579369763, 'samples': 847744, 'steps': 1655, 'loss/train': 2.9952027797698975} -09/20/2021 20:13:32 - INFO - __main__ - Step 26493: {'lr': 0.00019983341579369763, 'samples': 847776, 'steps': 1655, 'loss/train': 1.385063648223877} -09/20/2021 20:13:32 - INFO - __main__ - Step 26494: {'lr': 0.00019983341579369763, 'samples': 847808, 'steps': 1655, 'loss/train': 2.7903661727905273} -09/20/2021 20:13:33 - INFO - __main__ - Step 26495: {'lr': 0.00019983341579369763, 'samples': 847840, 'steps': 1655, 'loss/train': 3.2034473419189453} -09/20/2021 20:13:34 - INFO - __main__ - Step 26496: {'lr': 0.00019983341579369763, 'samples': 847872, 'steps': 1655, 'loss/train': 2.3231654167175293} -09/20/2021 20:13:35 - INFO - __main__ - Step 26497: {'lr': 0.00019983304755093976, 'samples': 847904, 'steps': 1656, 'loss/train': 3.2037644386291504} -09/20/2021 20:13:35 - INFO - __main__ - Step 26498: {'lr': 0.00019983304755093976, 'samples': 847936, 'steps': 1656, 'loss/train': 2.1438753604888916} -09/20/2021 20:13:36 - INFO - __main__ - Step 26499: {'lr': 0.00019983304755093976, 'samples': 847968, 'steps': 1656, 'loss/train': 2.6028287410736084} -09/20/2021 20:13:37 - INFO - __main__ - Step 26500: {'lr': 0.00019983304755093976, 'samples': 848000, 'steps': 1656, 'loss/train': 2.584048271179199} -09/20/2021 20:13:38 - INFO - __main__ - Step 26501: {'lr': 0.00019983304755093976, 'samples': 848032, 'steps': 1656, 'loss/train': 3.4307146072387695} -09/20/2021 20:13:38 - INFO - __main__ - Step 26502: {'lr': 0.00019983304755093976, 'samples': 848064, 'steps': 1656, 'loss/train': 1.3528895378112793} -09/20/2021 20:13:39 - INFO - __main__ - Step 26503: {'lr': 0.00019983304755093976, 'samples': 848096, 'steps': 1656, 'loss/train': 2.4228289127349854} -09/20/2021 20:13:40 - INFO - __main__ - Step 26504: {'lr': 0.00019983304755093976, 'samples': 848128, 'steps': 1656, 'loss/train': 2.001821279525757} -09/20/2021 20:13:41 - INFO - __main__ - Step 26505: {'lr': 0.00019983304755093976, 'samples': 848160, 'steps': 1656, 'loss/train': 0.8246767520904541} -09/20/2021 20:13:41 - INFO - __main__ - Step 26506: {'lr': 0.00019983304755093976, 'samples': 848192, 'steps': 1656, 'loss/train': 0.6323815584182739} -09/20/2021 20:13:42 - INFO - __main__ - Step 26507: {'lr': 0.00019983304755093976, 'samples': 848224, 'steps': 1656, 'loss/train': 0.435173898935318} -09/20/2021 20:13:43 - INFO - __main__ - Step 26508: {'lr': 0.00019983304755093976, 'samples': 848256, 'steps': 1656, 'loss/train': 0.33501172065734863} -09/20/2021 20:13:44 - INFO - __main__ - Step 26509: {'lr': 0.00019983304755093976, 'samples': 848288, 'steps': 1656, 'loss/train': 1.0445160865783691} -09/20/2021 20:13:44 - INFO - __main__ - Step 26510: {'lr': 0.00019983304755093976, 'samples': 848320, 'steps': 1656, 'loss/train': 0.42587220668792725} -09/20/2021 20:13:45 - INFO - __main__ - Step 26511: {'lr': 0.00019983304755093976, 'samples': 848352, 'steps': 1656, 'loss/train': 0.7564611434936523} -09/20/2021 20:13:46 - INFO - __main__ - Step 26512: {'lr': 0.00019983304755093976, 'samples': 848384, 'steps': 1656, 'loss/train': 1.2034251689910889} -09/20/2021 20:13:47 - INFO - __main__ - Step 26513: {'lr': 0.00019983267890196152, 'samples': 848416, 'steps': 1657, 'loss/train': 2.4567477703094482} -09/20/2021 20:13:48 - INFO - __main__ - Step 26514: {'lr': 0.00019983267890196152, 'samples': 848448, 'steps': 1657, 'loss/train': 0.897108793258667} -09/20/2021 20:13:49 - INFO - __main__ - Step 26515: {'lr': 0.00019983267890196152, 'samples': 848480, 'steps': 1657, 'loss/train': 3.4569108486175537} -09/20/2021 20:13:50 - INFO - __main__ - Step 26516: {'lr': 0.00019983267890196152, 'samples': 848512, 'steps': 1657, 'loss/train': 2.0810904502868652} -09/20/2021 20:13:50 - INFO - __main__ - Step 26517: {'lr': 0.00019983267890196152, 'samples': 848544, 'steps': 1657, 'loss/train': 0.8881075382232666} -09/20/2021 20:13:51 - INFO - __main__ - Step 26518: {'lr': 0.00019983267890196152, 'samples': 848576, 'steps': 1657, 'loss/train': 3.085432767868042} -09/20/2021 20:13:52 - INFO - __main__ - Step 26519: {'lr': 0.00019983267890196152, 'samples': 848608, 'steps': 1657, 'loss/train': 2.6150407791137695} -09/20/2021 20:13:53 - INFO - __main__ - Step 26520: {'lr': 0.00019983267890196152, 'samples': 848640, 'steps': 1657, 'loss/train': 2.5411622524261475} -09/20/2021 20:13:53 - INFO - __main__ - Step 26521: {'lr': 0.00019983267890196152, 'samples': 848672, 'steps': 1657, 'loss/train': 2.0756332874298096} -09/20/2021 20:13:54 - INFO - __main__ - Step 26522: {'lr': 0.00019983267890196152, 'samples': 848704, 'steps': 1657, 'loss/train': 1.9972044229507446} -09/20/2021 20:13:55 - INFO - __main__ - Step 26523: {'lr': 0.00019983267890196152, 'samples': 848736, 'steps': 1657, 'loss/train': 2.752906322479248} -09/20/2021 20:13:56 - INFO - __main__ - Step 26524: {'lr': 0.00019983267890196152, 'samples': 848768, 'steps': 1657, 'loss/train': 2.715369939804077} -09/20/2021 20:13:56 - INFO - __main__ - Step 26525: {'lr': 0.00019983267890196152, 'samples': 848800, 'steps': 1657, 'loss/train': 2.523263931274414} -09/20/2021 20:13:57 - INFO - __main__ - Step 26526: {'lr': 0.00019983267890196152, 'samples': 848832, 'steps': 1657, 'loss/train': 3.163163185119629} -09/20/2021 20:13:58 - INFO - __main__ - Step 26527: {'lr': 0.00019983267890196152, 'samples': 848864, 'steps': 1657, 'loss/train': 2.4035651683807373} -09/20/2021 20:13:59 - INFO - __main__ - Step 26528: {'lr': 0.00019983267890196152, 'samples': 848896, 'steps': 1657, 'loss/train': 2.252556085586548} -09/20/2021 20:13:59 - INFO - __main__ - Step 26529: {'lr': 0.00019983230984676459, 'samples': 848928, 'steps': 1658, 'loss/train': 2.835726499557495} -09/20/2021 20:14:00 - INFO - __main__ - Step 26530: {'lr': 0.00019983230984676459, 'samples': 848960, 'steps': 1658, 'loss/train': 2.895460367202759} -09/20/2021 20:14:01 - INFO - __main__ - Step 26531: {'lr': 0.00019983230984676459, 'samples': 848992, 'steps': 1658, 'loss/train': 2.9943127632141113} -09/20/2021 20:14:02 - INFO - __main__ - Step 26532: {'lr': 0.00019983230984676459, 'samples': 849024, 'steps': 1658, 'loss/train': 2.7230305671691895} -09/20/2021 20:14:02 - INFO - __main__ - Step 26533: {'lr': 0.00019983230984676459, 'samples': 849056, 'steps': 1658, 'loss/train': 3.3242576122283936} -09/20/2021 20:14:03 - INFO - __main__ - Step 26534: {'lr': 0.00019983230984676459, 'samples': 849088, 'steps': 1658, 'loss/train': 0.9769387245178223} -09/20/2021 20:14:04 - INFO - __main__ - Step 26535: {'lr': 0.00019983230984676459, 'samples': 849120, 'steps': 1658, 'loss/train': 3.185932159423828} -09/20/2021 20:14:05 - INFO - __main__ - Step 26536: {'lr': 0.00019983230984676459, 'samples': 849152, 'steps': 1658, 'loss/train': 2.180652618408203} -09/20/2021 20:14:05 - INFO - __main__ - Step 26537: {'lr': 0.00019983230984676459, 'samples': 849184, 'steps': 1658, 'loss/train': 2.356522798538208} -09/20/2021 20:14:06 - INFO - __main__ - Step 26538: {'lr': 0.00019983230984676459, 'samples': 849216, 'steps': 1658, 'loss/train': 2.973972797393799} -09/20/2021 20:14:07 - INFO - __main__ - Step 26539: {'lr': 0.00019983230984676459, 'samples': 849248, 'steps': 1658, 'loss/train': 2.254831075668335} -09/20/2021 20:14:08 - INFO - __main__ - Step 26540: {'lr': 0.00019983230984676459, 'samples': 849280, 'steps': 1658, 'loss/train': 2.8632049560546875} -09/20/2021 20:14:08 - INFO - __main__ - Step 26541: {'lr': 0.00019983230984676459, 'samples': 849312, 'steps': 1658, 'loss/train': 2.4951024055480957} -09/20/2021 20:14:09 - INFO - __main__ - Step 26542: {'lr': 0.00019983230984676459, 'samples': 849344, 'steps': 1658, 'loss/train': 1.9968856573104858} -09/20/2021 20:14:10 - INFO - __main__ - Step 26543: {'lr': 0.00019983230984676459, 'samples': 849376, 'steps': 1658, 'loss/train': 2.926527738571167} -09/20/2021 20:14:11 - INFO - __main__ - Step 26544: {'lr': 0.00019983230984676459, 'samples': 849408, 'steps': 1658, 'loss/train': 2.3062543869018555} -09/20/2021 20:14:12 - INFO - __main__ - Step 26545: {'lr': 0.00019983194038535032, 'samples': 849440, 'steps': 1659, 'loss/train': 2.847620725631714} -09/20/2021 20:14:13 - INFO - __main__ - Step 26546: {'lr': 0.00019983194038535032, 'samples': 849472, 'steps': 1659, 'loss/train': 1.9076199531555176} -09/20/2021 20:14:14 - INFO - __main__ - Step 26547: {'lr': 0.00019983194038535032, 'samples': 849504, 'steps': 1659, 'loss/train': 2.5153963565826416} -09/20/2021 20:14:14 - INFO - __main__ - Step 26548: {'lr': 0.00019983194038535032, 'samples': 849536, 'steps': 1659, 'loss/train': 1.100888967514038} -09/20/2021 20:14:15 - INFO - __main__ - Step 26549: {'lr': 0.00019983194038535032, 'samples': 849568, 'steps': 1659, 'loss/train': 2.142155170440674} -09/20/2021 20:14:16 - INFO - __main__ - Step 26550: {'lr': 0.00019983194038535032, 'samples': 849600, 'steps': 1659, 'loss/train': 2.410637855529785} -09/20/2021 20:14:17 - INFO - __main__ - Step 26551: {'lr': 0.00019983194038535032, 'samples': 849632, 'steps': 1659, 'loss/train': 3.2093894481658936} -09/20/2021 20:14:17 - INFO - __main__ - Step 26552: {'lr': 0.00019983194038535032, 'samples': 849664, 'steps': 1659, 'loss/train': 3.106851100921631} -09/20/2021 20:14:18 - INFO - __main__ - Step 26553: {'lr': 0.00019983194038535032, 'samples': 849696, 'steps': 1659, 'loss/train': 2.493795871734619} -09/20/2021 20:14:19 - INFO - __main__ - Step 26554: {'lr': 0.00019983194038535032, 'samples': 849728, 'steps': 1659, 'loss/train': 2.6429595947265625} -09/20/2021 20:14:20 - INFO - __main__ - Step 26555: {'lr': 0.00019983194038535032, 'samples': 849760, 'steps': 1659, 'loss/train': 3.3986315727233887} -09/20/2021 20:14:20 - INFO - __main__ - Step 26556: {'lr': 0.00019983194038535032, 'samples': 849792, 'steps': 1659, 'loss/train': 2.1658284664154053} -09/20/2021 20:14:21 - INFO - __main__ - Step 26557: {'lr': 0.00019983194038535032, 'samples': 849824, 'steps': 1659, 'loss/train': 3.549179792404175} -09/20/2021 20:14:22 - INFO - __main__ - Step 26558: {'lr': 0.00019983194038535032, 'samples': 849856, 'steps': 1659, 'loss/train': 3.50836443901062} -09/20/2021 20:14:23 - INFO - __main__ - Step 26559: {'lr': 0.00019983194038535032, 'samples': 849888, 'steps': 1659, 'loss/train': 1.8294273614883423} -09/20/2021 20:14:23 - INFO - __main__ - Step 26560: {'lr': 0.00019983194038535032, 'samples': 849920, 'steps': 1659, 'loss/train': 2.447176933288574} -09/20/2021 20:14:24 - INFO - __main__ - Step 26561: {'lr': 0.00019983157051772028, 'samples': 849952, 'steps': 1660, 'loss/train': 2.6283376216888428} -09/20/2021 20:14:25 - INFO - __main__ - Step 26562: {'lr': 0.00019983157051772028, 'samples': 849984, 'steps': 1660, 'loss/train': 1.8004337549209595} -09/20/2021 20:14:26 - INFO - __main__ - Step 26563: {'lr': 0.00019983157051772028, 'samples': 850016, 'steps': 1660, 'loss/train': 2.0458996295928955} -09/20/2021 20:14:26 - INFO - __main__ - Step 26564: {'lr': 0.00019983157051772028, 'samples': 850048, 'steps': 1660, 'loss/train': 2.5211470127105713} -09/20/2021 20:14:27 - INFO - __main__ - Step 26565: {'lr': 0.00019983157051772028, 'samples': 850080, 'steps': 1660, 'loss/train': 2.5248422622680664} -09/20/2021 20:14:28 - INFO - __main__ - Step 26566: {'lr': 0.00019983157051772028, 'samples': 850112, 'steps': 1660, 'loss/train': 1.7350728511810303} -09/20/2021 20:14:29 - INFO - __main__ - Step 26567: {'lr': 0.00019983157051772028, 'samples': 850144, 'steps': 1660, 'loss/train': 2.542924642562866} -09/20/2021 20:14:29 - INFO - __main__ - Step 26568: {'lr': 0.00019983157051772028, 'samples': 850176, 'steps': 1660, 'loss/train': 2.284640073776245} -09/20/2021 20:14:30 - INFO - __main__ - Step 26569: {'lr': 0.00019983157051772028, 'samples': 850208, 'steps': 1660, 'loss/train': 2.1347665786743164} -09/20/2021 20:14:31 - INFO - __main__ - Step 26570: {'lr': 0.00019983157051772028, 'samples': 850240, 'steps': 1660, 'loss/train': 1.754157543182373} -09/20/2021 20:14:32 - INFO - __main__ - Step 26571: {'lr': 0.00019983157051772028, 'samples': 850272, 'steps': 1660, 'loss/train': 2.157439947128296} -09/20/2021 20:14:32 - INFO - __main__ - Step 26572: {'lr': 0.00019983157051772028, 'samples': 850304, 'steps': 1660, 'loss/train': 2.7918193340301514} -09/20/2021 20:14:33 - INFO - __main__ - Step 26573: {'lr': 0.00019983157051772028, 'samples': 850336, 'steps': 1660, 'loss/train': 1.6935572624206543} -09/20/2021 20:14:35 - INFO - __main__ - Step 26574: {'lr': 0.00019983157051772028, 'samples': 850368, 'steps': 1660, 'loss/train': 2.1635570526123047} -09/20/2021 20:14:35 - INFO - __main__ - Step 26575: {'lr': 0.00019983157051772028, 'samples': 850400, 'steps': 1660, 'loss/train': 1.8912254571914673} -09/20/2021 20:14:36 - INFO - __main__ - Step 26576: {'lr': 0.00019983157051772028, 'samples': 850432, 'steps': 1660, 'loss/train': 3.1831905841827393} -09/20/2021 20:14:37 - INFO - __main__ - Step 26577: {'lr': 0.00019983120024387596, 'samples': 850464, 'steps': 1661, 'loss/train': 2.007432699203491} -09/20/2021 20:14:38 - INFO - __main__ - Step 26578: {'lr': 0.00019983120024387596, 'samples': 850496, 'steps': 1661, 'loss/train': 2.9337384700775146} -09/20/2021 20:14:38 - INFO - __main__ - Step 26579: {'lr': 0.00019983120024387596, 'samples': 850528, 'steps': 1661, 'loss/train': 2.770155668258667} -09/20/2021 20:14:39 - INFO - __main__ - Step 26580: {'lr': 0.00019983120024387596, 'samples': 850560, 'steps': 1661, 'loss/train': 2.5506796836853027} -09/20/2021 20:14:40 - INFO - __main__ - Step 26581: {'lr': 0.00019983120024387596, 'samples': 850592, 'steps': 1661, 'loss/train': 2.499730348587036} -09/20/2021 20:14:41 - INFO - __main__ - Step 26582: {'lr': 0.00019983120024387596, 'samples': 850624, 'steps': 1661, 'loss/train': 2.5065834522247314} -09/20/2021 20:14:41 - INFO - __main__ - Step 26583: {'lr': 0.00019983120024387596, 'samples': 850656, 'steps': 1661, 'loss/train': 2.226559638977051} -09/20/2021 20:14:42 - INFO - __main__ - Step 26584: {'lr': 0.00019983120024387596, 'samples': 850688, 'steps': 1661, 'loss/train': 2.340244770050049} -09/20/2021 20:14:43 - INFO - __main__ - Step 26585: {'lr': 0.00019983120024387596, 'samples': 850720, 'steps': 1661, 'loss/train': 3.6903228759765625} -09/20/2021 20:14:44 - INFO - __main__ - Step 26586: {'lr': 0.00019983120024387596, 'samples': 850752, 'steps': 1661, 'loss/train': 2.9490959644317627} -09/20/2021 20:14:44 - INFO - __main__ - Step 26587: {'lr': 0.00019983120024387596, 'samples': 850784, 'steps': 1661, 'loss/train': 2.2360658645629883} -09/20/2021 20:14:45 - INFO - __main__ - Step 26588: {'lr': 0.00019983120024387596, 'samples': 850816, 'steps': 1661, 'loss/train': 3.04194974899292} -09/20/2021 20:14:46 - INFO - __main__ - Step 26589: {'lr': 0.00019983120024387596, 'samples': 850848, 'steps': 1661, 'loss/train': 2.1979329586029053} -09/20/2021 20:14:47 - INFO - __main__ - Step 26590: {'lr': 0.00019983120024387596, 'samples': 850880, 'steps': 1661, 'loss/train': 3.3116540908813477} -09/20/2021 20:14:47 - INFO - __main__ - Step 26591: {'lr': 0.00019983120024387596, 'samples': 850912, 'steps': 1661, 'loss/train': 2.304070234298706} -09/20/2021 20:14:48 - INFO - __main__ - Step 26592: {'lr': 0.00019983120024387596, 'samples': 850944, 'steps': 1661, 'loss/train': 4.366553783416748} -09/20/2021 20:14:49 - INFO - __main__ - Step 26593: {'lr': 0.00019983082956381889, 'samples': 850976, 'steps': 1662, 'loss/train': 2.8508615493774414} -09/20/2021 20:14:50 - INFO - __main__ - Step 26594: {'lr': 0.00019983082956381889, 'samples': 851008, 'steps': 1662, 'loss/train': 3.957047700881958} -09/20/2021 20:14:51 - INFO - __main__ - Step 26595: {'lr': 0.00019983082956381889, 'samples': 851040, 'steps': 1662, 'loss/train': 2.4852240085601807} -09/20/2021 20:14:51 - INFO - __main__ - Step 26596: {'lr': 0.00019983082956381889, 'samples': 851072, 'steps': 1662, 'loss/train': 2.7680463790893555} -09/20/2021 20:14:52 - INFO - __main__ - Step 26597: {'lr': 0.00019983082956381889, 'samples': 851104, 'steps': 1662, 'loss/train': 3.0813417434692383} -09/20/2021 20:14:53 - INFO - __main__ - Step 26598: {'lr': 0.00019983082956381889, 'samples': 851136, 'steps': 1662, 'loss/train': 2.182861328125} -09/20/2021 20:14:54 - INFO - __main__ - Step 26599: {'lr': 0.00019983082956381889, 'samples': 851168, 'steps': 1662, 'loss/train': 3.0080010890960693} -09/20/2021 20:14:54 - INFO - __main__ - Step 26600: {'lr': 0.00019983082956381889, 'samples': 851200, 'steps': 1662, 'loss/train': 0.8310617804527283} -09/20/2021 20:14:55 - INFO - __main__ - Step 26601: {'lr': 0.00019983082956381889, 'samples': 851232, 'steps': 1662, 'loss/train': 2.1916451454162598} -09/20/2021 20:14:56 - INFO - __main__ - Step 26602: {'lr': 0.00019983082956381889, 'samples': 851264, 'steps': 1662, 'loss/train': 2.845663070678711} -09/20/2021 20:14:57 - INFO - __main__ - Step 26603: {'lr': 0.00019983082956381889, 'samples': 851296, 'steps': 1662, 'loss/train': 3.3621795177459717} -09/20/2021 20:14:57 - INFO - __main__ - Step 26604: {'lr': 0.00019983082956381889, 'samples': 851328, 'steps': 1662, 'loss/train': 2.117964267730713} -09/20/2021 20:14:59 - INFO - __main__ - Step 26605: {'lr': 0.00019983082956381889, 'samples': 851360, 'steps': 1662, 'loss/train': 2.2646803855895996} -09/20/2021 20:14:59 - INFO - __main__ - Step 26606: {'lr': 0.00019983082956381889, 'samples': 851392, 'steps': 1662, 'loss/train': 2.7366554737091064} -09/20/2021 20:15:00 - INFO - __main__ - Step 26607: {'lr': 0.00019983082956381889, 'samples': 851424, 'steps': 1662, 'loss/train': 2.9859864711761475} -09/20/2021 20:15:01 - INFO - __main__ - Step 26608: {'lr': 0.00019983082956381889, 'samples': 851456, 'steps': 1662, 'loss/train': 3.0167500972747803} -09/20/2021 20:15:02 - INFO - __main__ - Step 26609: {'lr': 0.00019983045847755056, 'samples': 851488, 'steps': 1663, 'loss/train': 2.5033388137817383} -09/20/2021 20:15:03 - INFO - __main__ - Step 26610: {'lr': 0.00019983045847755056, 'samples': 851520, 'steps': 1663, 'loss/train': 2.8469390869140625} -09/20/2021 20:15:03 - INFO - __main__ - Step 26611: {'lr': 0.00019983045847755056, 'samples': 851552, 'steps': 1663, 'loss/train': 3.0206093788146973} -09/20/2021 20:15:04 - INFO - __main__ - Step 26612: {'lr': 0.00019983045847755056, 'samples': 851584, 'steps': 1663, 'loss/train': 4.955907344818115} -09/20/2021 20:15:05 - INFO - __main__ - Step 26613: {'lr': 0.00019983045847755056, 'samples': 851616, 'steps': 1663, 'loss/train': 5.106747627258301} -09/20/2021 20:15:06 - INFO - __main__ - Step 26614: {'lr': 0.00019983045847755056, 'samples': 851648, 'steps': 1663, 'loss/train': 3.6402997970581055} -09/20/2021 20:15:06 - INFO - __main__ - Step 26615: {'lr': 0.00019983045847755056, 'samples': 851680, 'steps': 1663, 'loss/train': 3.238413095474243} -09/20/2021 20:15:07 - INFO - __main__ - Step 26616: {'lr': 0.00019983045847755056, 'samples': 851712, 'steps': 1663, 'loss/train': 2.4992198944091797} -09/20/2021 20:15:08 - INFO - __main__ - Step 26617: {'lr': 0.00019983045847755056, 'samples': 851744, 'steps': 1663, 'loss/train': 3.56882643699646} -09/20/2021 20:15:09 - INFO - __main__ - Step 26618: {'lr': 0.00019983045847755056, 'samples': 851776, 'steps': 1663, 'loss/train': 2.083939790725708} -09/20/2021 20:15:09 - INFO - __main__ - Step 26619: {'lr': 0.00019983045847755056, 'samples': 851808, 'steps': 1663, 'loss/train': 2.84470796585083} -09/20/2021 20:15:10 - INFO - __main__ - Step 26620: {'lr': 0.00019983045847755056, 'samples': 851840, 'steps': 1663, 'loss/train': 2.9613747596740723} -09/20/2021 20:15:11 - INFO - __main__ - Step 26621: {'lr': 0.00019983045847755056, 'samples': 851872, 'steps': 1663, 'loss/train': 2.9728386402130127} -09/20/2021 20:15:12 - INFO - __main__ - Step 26622: {'lr': 0.00019983045847755056, 'samples': 851904, 'steps': 1663, 'loss/train': 2.414292335510254} -09/20/2021 20:15:12 - INFO - __main__ - Step 26623: {'lr': 0.00019983045847755056, 'samples': 851936, 'steps': 1663, 'loss/train': 1.134325385093689} -09/20/2021 20:15:13 - INFO - __main__ - Step 26624: {'lr': 0.00019983045847755056, 'samples': 851968, 'steps': 1663, 'loss/train': 2.280332565307617} -09/20/2021 20:15:14 - INFO - __main__ - Step 26625: {'lr': 0.00019983008698507245, 'samples': 852000, 'steps': 1664, 'loss/train': 4.039471626281738} -09/20/2021 20:15:15 - INFO - __main__ - Step 26626: {'lr': 0.00019983008698507245, 'samples': 852032, 'steps': 1664, 'loss/train': 2.7928311824798584} -09/20/2021 20:15:15 - INFO - __main__ - Step 26627: {'lr': 0.00019983008698507245, 'samples': 852064, 'steps': 1664, 'loss/train': 2.452878713607788} -09/20/2021 20:15:16 - INFO - __main__ - Step 26628: {'lr': 0.00019983008698507245, 'samples': 852096, 'steps': 1664, 'loss/train': 2.0690808296203613} -09/20/2021 20:15:17 - INFO - __main__ - Step 26629: {'lr': 0.00019983008698507245, 'samples': 852128, 'steps': 1664, 'loss/train': 3.5058743953704834} -09/20/2021 20:15:18 - INFO - __main__ - Step 26630: {'lr': 0.00019983008698507245, 'samples': 852160, 'steps': 1664, 'loss/train': 2.512261390686035} -09/20/2021 20:15:18 - INFO - __main__ - Step 26631: {'lr': 0.00019983008698507245, 'samples': 852192, 'steps': 1664, 'loss/train': 1.8036893606185913} -09/20/2021 20:15:19 - INFO - __main__ - Step 26632: {'lr': 0.00019983008698507245, 'samples': 852224, 'steps': 1664, 'loss/train': 2.6337099075317383} -09/20/2021 20:15:20 - INFO - __main__ - Step 26633: {'lr': 0.00019983008698507245, 'samples': 852256, 'steps': 1664, 'loss/train': 4.6483683586120605} -09/20/2021 20:15:21 - INFO - __main__ - Step 26634: {'lr': 0.00019983008698507245, 'samples': 852288, 'steps': 1664, 'loss/train': 0.865789532661438} -09/20/2021 20:15:21 - INFO - __main__ - Step 26635: {'lr': 0.00019983008698507245, 'samples': 852320, 'steps': 1664, 'loss/train': 3.968973159790039} -09/20/2021 20:15:22 - INFO - __main__ - Step 26636: {'lr': 0.00019983008698507245, 'samples': 852352, 'steps': 1664, 'loss/train': 2.0131688117980957} -09/20/2021 20:15:23 - INFO - __main__ - Step 26637: {'lr': 0.00019983008698507245, 'samples': 852384, 'steps': 1664, 'loss/train': 2.040093421936035} -09/20/2021 20:15:25 - INFO - __main__ - Step 26638: {'lr': 0.00019983008698507245, 'samples': 852416, 'steps': 1664, 'loss/train': 2.3419978618621826} -09/20/2021 20:15:26 - INFO - __main__ - Step 26639: {'lr': 0.00019983008698507245, 'samples': 852448, 'steps': 1664, 'loss/train': 4.799551486968994} -09/20/2021 20:15:26 - INFO - __main__ - Step 26640: {'lr': 0.00019983008698507245, 'samples': 852480, 'steps': 1664, 'loss/train': 4.531083583831787} -09/20/2021 20:15:27 - INFO - __main__ - Step 26641: {'lr': 0.00019982971508638616, 'samples': 852512, 'steps': 1665, 'loss/train': 3.0773799419403076} -09/20/2021 20:15:28 - INFO - __main__ - Step 26642: {'lr': 0.00019982971508638616, 'samples': 852544, 'steps': 1665, 'loss/train': 2.1495983600616455} -09/20/2021 20:15:29 - INFO - __main__ - Step 26643: {'lr': 0.00019982971508638616, 'samples': 852576, 'steps': 1665, 'loss/train': 1.6108616590499878} -09/20/2021 20:15:29 - INFO - __main__ - Step 26644: {'lr': 0.00019982971508638616, 'samples': 852608, 'steps': 1665, 'loss/train': 2.0958375930786133} -09/20/2021 20:15:30 - INFO - __main__ - Step 26645: {'lr': 0.00019982971508638616, 'samples': 852640, 'steps': 1665, 'loss/train': 2.507776975631714} -09/20/2021 20:15:31 - INFO - __main__ - Step 26646: {'lr': 0.00019982971508638616, 'samples': 852672, 'steps': 1665, 'loss/train': 2.5543580055236816} -09/20/2021 20:15:32 - INFO - __main__ - Step 26647: {'lr': 0.00019982971508638616, 'samples': 852704, 'steps': 1665, 'loss/train': 3.5283100605010986} -09/20/2021 20:15:32 - INFO - __main__ - Step 26648: {'lr': 0.00019982971508638616, 'samples': 852736, 'steps': 1665, 'loss/train': 2.9242470264434814} -09/20/2021 20:15:33 - INFO - __main__ - Step 26649: {'lr': 0.00019982971508638616, 'samples': 852768, 'steps': 1665, 'loss/train': 3.53340482711792} -09/20/2021 20:15:34 - INFO - __main__ - Step 26650: {'lr': 0.00019982971508638616, 'samples': 852800, 'steps': 1665, 'loss/train': 3.1001644134521484} -09/20/2021 20:15:35 - INFO - __main__ - Step 26651: {'lr': 0.00019982971508638616, 'samples': 852832, 'steps': 1665, 'loss/train': 2.3159584999084473} -09/20/2021 20:15:35 - INFO - __main__ - Step 26652: {'lr': 0.00019982971508638616, 'samples': 852864, 'steps': 1665, 'loss/train': 2.288888692855835} -09/20/2021 20:15:36 - INFO - __main__ - Step 26653: {'lr': 0.00019982971508638616, 'samples': 852896, 'steps': 1665, 'loss/train': 2.7488834857940674} -09/20/2021 20:15:37 - INFO - __main__ - Step 26654: {'lr': 0.00019982971508638616, 'samples': 852928, 'steps': 1665, 'loss/train': 2.8871564865112305} -09/20/2021 20:15:38 - INFO - __main__ - Step 26655: {'lr': 0.00019982971508638616, 'samples': 852960, 'steps': 1665, 'loss/train': 2.5930111408233643} -09/20/2021 20:15:38 - INFO - __main__ - Step 26656: {'lr': 0.00019982971508638616, 'samples': 852992, 'steps': 1665, 'loss/train': 2.1018056869506836} -09/20/2021 20:15:39 - INFO - __main__ - Step 26657: {'lr': 0.0001998293427814931, 'samples': 853024, 'steps': 1666, 'loss/train': 2.8476853370666504} -09/20/2021 20:15:40 - INFO - __main__ - Step 26658: {'lr': 0.0001998293427814931, 'samples': 853056, 'steps': 1666, 'loss/train': 2.8126657009124756} -09/20/2021 20:15:41 - INFO - __main__ - Step 26659: {'lr': 0.0001998293427814931, 'samples': 853088, 'steps': 1666, 'loss/train': 3.1352314949035645} -09/20/2021 20:15:42 - INFO - __main__ - Step 26660: {'lr': 0.0001998293427814931, 'samples': 853120, 'steps': 1666, 'loss/train': 2.2450428009033203} -09/20/2021 20:15:42 - INFO - __main__ - Step 26661: {'lr': 0.0001998293427814931, 'samples': 853152, 'steps': 1666, 'loss/train': 3.1367409229278564} -09/20/2021 20:15:43 - INFO - __main__ - Step 26662: {'lr': 0.0001998293427814931, 'samples': 853184, 'steps': 1666, 'loss/train': 2.531846523284912} -09/20/2021 20:15:44 - INFO - __main__ - Step 26663: {'lr': 0.0001998293427814931, 'samples': 853216, 'steps': 1666, 'loss/train': 3.302232503890991} -09/20/2021 20:15:45 - INFO - __main__ - Step 26664: {'lr': 0.0001998293427814931, 'samples': 853248, 'steps': 1666, 'loss/train': 2.907672643661499} -09/20/2021 20:15:45 - INFO - __main__ - Step 26665: {'lr': 0.0001998293427814931, 'samples': 853280, 'steps': 1666, 'loss/train': 3.225318193435669} -09/20/2021 20:15:46 - INFO - __main__ - Step 26666: {'lr': 0.0001998293427814931, 'samples': 853312, 'steps': 1666, 'loss/train': 2.6965038776397705} -09/20/2021 20:15:47 - INFO - __main__ - Step 26667: {'lr': 0.0001998293427814931, 'samples': 853344, 'steps': 1666, 'loss/train': 3.4737181663513184} -09/20/2021 20:15:48 - INFO - __main__ - Step 26668: {'lr': 0.0001998293427814931, 'samples': 853376, 'steps': 1666, 'loss/train': 2.8677525520324707} -09/20/2021 20:15:49 - INFO - __main__ - Step 26669: {'lr': 0.0001998293427814931, 'samples': 853408, 'steps': 1666, 'loss/train': 3.357943296432495} -09/20/2021 20:15:50 - INFO - __main__ - Step 26670: {'lr': 0.0001998293427814931, 'samples': 853440, 'steps': 1666, 'loss/train': 2.265343189239502} -09/20/2021 20:15:51 - INFO - __main__ - Step 26671: {'lr': 0.0001998293427814931, 'samples': 853472, 'steps': 1666, 'loss/train': 2.747305154800415} -09/20/2021 20:15:51 - INFO - __main__ - Step 26672: {'lr': 0.0001998293427814931, 'samples': 853504, 'steps': 1666, 'loss/train': 3.417667865753174} -09/20/2021 20:15:52 - INFO - __main__ - Step 26673: {'lr': 0.00019982897007039485, 'samples': 853536, 'steps': 1667, 'loss/train': 0.6759858131408691} -09/20/2021 20:15:53 - INFO - __main__ - Step 26674: {'lr': 0.00019982897007039485, 'samples': 853568, 'steps': 1667, 'loss/train': 0.9643955826759338} -09/20/2021 20:15:54 - INFO - __main__ - Step 26675: {'lr': 0.00019982897007039485, 'samples': 853600, 'steps': 1667, 'loss/train': 0.4600178599357605} -09/20/2021 20:15:55 - INFO - __main__ - Step 26676: {'lr': 0.00019982897007039485, 'samples': 853632, 'steps': 1667, 'loss/train': 1.006337285041809} -09/20/2021 20:15:55 - INFO - __main__ - Step 26677: {'lr': 0.00019982897007039485, 'samples': 853664, 'steps': 1667, 'loss/train': 0.5262805223464966} -09/20/2021 20:15:56 - INFO - __main__ - Step 26678: {'lr': 0.00019982897007039485, 'samples': 853696, 'steps': 1667, 'loss/train': 1.1171363592147827} -09/20/2021 20:15:57 - INFO - __main__ - Step 26679: {'lr': 0.00019982897007039485, 'samples': 853728, 'steps': 1667, 'loss/train': 2.3733112812042236} -09/20/2021 20:15:58 - INFO - __main__ - Step 26680: {'lr': 0.00019982897007039485, 'samples': 853760, 'steps': 1667, 'loss/train': 2.999473810195923} -09/20/2021 20:15:58 - INFO - __main__ - Step 26681: {'lr': 0.00019982897007039485, 'samples': 853792, 'steps': 1667, 'loss/train': 1.4393913745880127} -09/20/2021 20:15:59 - INFO - __main__ - Step 26682: {'lr': 0.00019982897007039485, 'samples': 853824, 'steps': 1667, 'loss/train': 2.0970609188079834} -09/20/2021 20:16:00 - INFO - __main__ - Step 26683: {'lr': 0.00019982897007039485, 'samples': 853856, 'steps': 1667, 'loss/train': 2.6880171298980713} -09/20/2021 20:16:01 - INFO - __main__ - Step 26684: {'lr': 0.00019982897007039485, 'samples': 853888, 'steps': 1667, 'loss/train': 2.2971150875091553} -09/20/2021 20:16:01 - INFO - __main__ - Step 26685: {'lr': 0.00019982897007039485, 'samples': 853920, 'steps': 1667, 'loss/train': 4.091405391693115} -09/20/2021 20:16:02 - INFO - __main__ - Step 26686: {'lr': 0.00019982897007039485, 'samples': 853952, 'steps': 1667, 'loss/train': 2.9796206951141357} -09/20/2021 20:16:03 - INFO - __main__ - Step 26687: {'lr': 0.00019982897007039485, 'samples': 853984, 'steps': 1667, 'loss/train': 3.1614394187927246} -09/20/2021 20:16:04 - INFO - __main__ - Step 26688: {'lr': 0.00019982897007039485, 'samples': 854016, 'steps': 1667, 'loss/train': 2.708282470703125} -09/20/2021 20:16:05 - INFO - __main__ - Step 26689: {'lr': 0.0001998285969530929, 'samples': 854048, 'steps': 1668, 'loss/train': 2.425629138946533} -09/20/2021 20:16:05 - INFO - __main__ - Step 26690: {'lr': 0.0001998285969530929, 'samples': 854080, 'steps': 1668, 'loss/train': 2.8138880729675293} -09/20/2021 20:16:06 - INFO - __main__ - Step 26691: {'lr': 0.0001998285969530929, 'samples': 854112, 'steps': 1668, 'loss/train': 1.3485455513000488} -09/20/2021 20:16:07 - INFO - __main__ - Step 26692: {'lr': 0.0001998285969530929, 'samples': 854144, 'steps': 1668, 'loss/train': 2.965444803237915} -09/20/2021 20:16:08 - INFO - __main__ - Step 26693: {'lr': 0.0001998285969530929, 'samples': 854176, 'steps': 1668, 'loss/train': 2.976705551147461} -09/20/2021 20:16:08 - INFO - __main__ - Step 26694: {'lr': 0.0001998285969530929, 'samples': 854208, 'steps': 1668, 'loss/train': 4.2833123207092285} -09/20/2021 20:16:09 - INFO - __main__ - Step 26695: {'lr': 0.0001998285969530929, 'samples': 854240, 'steps': 1668, 'loss/train': 4.43766450881958} -09/20/2021 20:16:10 - INFO - __main__ - Step 26696: {'lr': 0.0001998285969530929, 'samples': 854272, 'steps': 1668, 'loss/train': 3.9214370250701904} -09/20/2021 20:16:11 - INFO - __main__ - Step 26697: {'lr': 0.0001998285969530929, 'samples': 854304, 'steps': 1668, 'loss/train': 1.7986729145050049} -09/20/2021 20:16:11 - INFO - __main__ - Step 26698: {'lr': 0.0001998285969530929, 'samples': 854336, 'steps': 1668, 'loss/train': 1.6652806997299194} -09/20/2021 20:16:12 - INFO - __main__ - Step 26699: {'lr': 0.0001998285969530929, 'samples': 854368, 'steps': 1668, 'loss/train': 2.270231246948242} -09/20/2021 20:16:13 - INFO - __main__ - Step 26700: {'lr': 0.0001998285969530929, 'samples': 854400, 'steps': 1668, 'loss/train': 3.8232028484344482} -09/20/2021 20:16:14 - INFO - __main__ - Step 26701: {'lr': 0.0001998285969530929, 'samples': 854432, 'steps': 1668, 'loss/train': 2.54594349861145} -09/20/2021 20:16:15 - INFO - __main__ - Step 26702: {'lr': 0.0001998285969530929, 'samples': 854464, 'steps': 1668, 'loss/train': 1.5744026899337769} -09/20/2021 20:16:16 - INFO - __main__ - Step 26703: {'lr': 0.0001998285969530929, 'samples': 854496, 'steps': 1668, 'loss/train': 2.880751609802246} -09/20/2021 20:16:17 - INFO - __main__ - Step 26704: {'lr': 0.0001998285969530929, 'samples': 854528, 'steps': 1668, 'loss/train': 3.4184203147888184} -09/20/2021 20:16:18 - INFO - __main__ - Step 26705: {'lr': 0.0001998282234295888, 'samples': 854560, 'steps': 1669, 'loss/train': 1.6220605373382568} -09/20/2021 20:16:18 - INFO - __main__ - Step 26706: {'lr': 0.0001998282234295888, 'samples': 854592, 'steps': 1669, 'loss/train': 3.0785531997680664} -09/20/2021 20:16:19 - INFO - __main__ - Step 26707: {'lr': 0.0001998282234295888, 'samples': 854624, 'steps': 1669, 'loss/train': 0.6589856743812561} -09/20/2021 20:16:20 - INFO - __main__ - Step 26708: {'lr': 0.0001998282234295888, 'samples': 854656, 'steps': 1669, 'loss/train': 3.0755386352539062} -09/20/2021 20:16:21 - INFO - __main__ - Step 26709: {'lr': 0.0001998282234295888, 'samples': 854688, 'steps': 1669, 'loss/train': 1.109899640083313} -09/20/2021 20:16:21 - INFO - __main__ - Step 26710: {'lr': 0.0001998282234295888, 'samples': 854720, 'steps': 1669, 'loss/train': 1.2752604484558105} -09/20/2021 20:16:22 - INFO - __main__ - Step 26711: {'lr': 0.0001998282234295888, 'samples': 854752, 'steps': 1669, 'loss/train': 1.434715986251831} -09/20/2021 20:16:23 - INFO - __main__ - Step 26712: {'lr': 0.0001998282234295888, 'samples': 854784, 'steps': 1669, 'loss/train': 1.1885849237442017} -09/20/2021 20:16:24 - INFO - __main__ - Step 26713: {'lr': 0.0001998282234295888, 'samples': 854816, 'steps': 1669, 'loss/train': 1.0922706127166748} -09/20/2021 20:16:24 - INFO - __main__ - Step 26714: {'lr': 0.0001998282234295888, 'samples': 854848, 'steps': 1669, 'loss/train': 1.2813441753387451} -09/20/2021 20:16:25 - INFO - __main__ - Step 26715: {'lr': 0.0001998282234295888, 'samples': 854880, 'steps': 1669, 'loss/train': 1.2345281839370728} -09/20/2021 20:16:26 - INFO - __main__ - Step 26716: {'lr': 0.0001998282234295888, 'samples': 854912, 'steps': 1669, 'loss/train': 1.359474778175354} -09/20/2021 20:16:27 - INFO - __main__ - Step 26717: {'lr': 0.0001998282234295888, 'samples': 854944, 'steps': 1669, 'loss/train': 2.6503279209136963} -09/20/2021 20:16:27 - INFO - __main__ - Step 26718: {'lr': 0.0001998282234295888, 'samples': 854976, 'steps': 1669, 'loss/train': 2.7158045768737793} -09/20/2021 20:16:28 - INFO - __main__ - Step 26719: {'lr': 0.0001998282234295888, 'samples': 855008, 'steps': 1669, 'loss/train': 2.952937126159668} -09/20/2021 20:16:29 - INFO - __main__ - Step 26720: {'lr': 0.0001998282234295888, 'samples': 855040, 'steps': 1669, 'loss/train': 2.0606138706207275} -09/20/2021 20:16:30 - INFO - __main__ - Step 26721: {'lr': 0.00019982784949988403, 'samples': 855072, 'steps': 1670, 'loss/train': 3.1958017349243164} -09/20/2021 20:16:30 - INFO - __main__ - Step 26722: {'lr': 0.00019982784949988403, 'samples': 855104, 'steps': 1670, 'loss/train': 2.930046319961548} -09/20/2021 20:16:31 - INFO - __main__ - Step 26723: {'lr': 0.00019982784949988403, 'samples': 855136, 'steps': 1670, 'loss/train': 1.6788185834884644} -09/20/2021 20:16:32 - INFO - __main__ - Step 26724: {'lr': 0.00019982784949988403, 'samples': 855168, 'steps': 1670, 'loss/train': 3.534412145614624} -09/20/2021 20:16:33 - INFO - __main__ - Step 26725: {'lr': 0.00019982784949988403, 'samples': 855200, 'steps': 1670, 'loss/train': 2.9224321842193604} -09/20/2021 20:16:33 - INFO - __main__ - Step 26726: {'lr': 0.00019982784949988403, 'samples': 855232, 'steps': 1670, 'loss/train': 1.7151579856872559} -09/20/2021 20:16:34 - INFO - __main__ - Step 26727: {'lr': 0.00019982784949988403, 'samples': 855264, 'steps': 1670, 'loss/train': 2.8622007369995117} -09/20/2021 20:16:35 - INFO - __main__ - Step 26728: {'lr': 0.00019982784949988403, 'samples': 855296, 'steps': 1670, 'loss/train': 2.0477819442749023} -09/20/2021 20:16:36 - INFO - __main__ - Step 26729: {'lr': 0.00019982784949988403, 'samples': 855328, 'steps': 1670, 'loss/train': 3.330031394958496} -09/20/2021 20:16:36 - INFO - __main__ - Step 26730: {'lr': 0.00019982784949988403, 'samples': 855360, 'steps': 1670, 'loss/train': 2.1753451824188232} -09/20/2021 20:16:37 - INFO - __main__ - Step 26731: {'lr': 0.00019982784949988403, 'samples': 855392, 'steps': 1670, 'loss/train': 1.6470987796783447} -09/20/2021 20:16:38 - INFO - __main__ - Step 26732: {'lr': 0.00019982784949988403, 'samples': 855424, 'steps': 1670, 'loss/train': 2.0633156299591064} -09/20/2021 20:16:39 - INFO - __main__ - Step 26733: {'lr': 0.00019982784949988403, 'samples': 855456, 'steps': 1670, 'loss/train': 2.685999631881714} -09/20/2021 20:16:39 - INFO - __main__ - Step 26734: {'lr': 0.00019982784949988403, 'samples': 855488, 'steps': 1670, 'loss/train': 2.9792466163635254} -09/20/2021 20:16:40 - INFO - __main__ - Step 26735: {'lr': 0.00019982784949988403, 'samples': 855520, 'steps': 1670, 'loss/train': 2.167997121810913} -09/20/2021 20:16:41 - INFO - __main__ - Step 26736: {'lr': 0.00019982784949988403, 'samples': 855552, 'steps': 1670, 'loss/train': 3.003520965576172} -09/20/2021 20:16:42 - INFO - __main__ - Step 26737: {'lr': 0.00019982747516398015, 'samples': 855584, 'steps': 1671, 'loss/train': 4.076963424682617} -09/20/2021 20:16:43 - INFO - __main__ - Step 26738: {'lr': 0.00019982747516398015, 'samples': 855616, 'steps': 1671, 'loss/train': 2.7490952014923096} -09/20/2021 20:16:44 - INFO - __main__ - Step 26739: {'lr': 0.00019982747516398015, 'samples': 855648, 'steps': 1671, 'loss/train': 2.5951766967773438} -09/20/2021 20:16:45 - INFO - __main__ - Step 26740: {'lr': 0.00019982747516398015, 'samples': 855680, 'steps': 1671, 'loss/train': 2.9760968685150146} -09/20/2021 20:16:45 - INFO - __main__ - Step 26741: {'lr': 0.00019982747516398015, 'samples': 855712, 'steps': 1671, 'loss/train': 3.933885097503662} -09/20/2021 20:16:46 - INFO - __main__ - Step 26742: {'lr': 0.00019982747516398015, 'samples': 855744, 'steps': 1671, 'loss/train': 4.142519474029541} -09/20/2021 20:16:47 - INFO - __main__ - Step 26743: {'lr': 0.00019982747516398015, 'samples': 855776, 'steps': 1671, 'loss/train': 3.2164950370788574} -09/20/2021 20:16:48 - INFO - __main__ - Step 26744: {'lr': 0.00019982747516398015, 'samples': 855808, 'steps': 1671, 'loss/train': 2.640918254852295} -09/20/2021 20:16:48 - INFO - __main__ - Step 26745: {'lr': 0.00019982747516398015, 'samples': 855840, 'steps': 1671, 'loss/train': 1.8970232009887695} -09/20/2021 20:16:49 - INFO - __main__ - Step 26746: {'lr': 0.00019982747516398015, 'samples': 855872, 'steps': 1671, 'loss/train': 1.2332388162612915} -09/20/2021 20:16:50 - INFO - __main__ - Step 26747: {'lr': 0.00019982747516398015, 'samples': 855904, 'steps': 1671, 'loss/train': 2.5981249809265137} -09/20/2021 20:16:51 - INFO - __main__ - Step 26748: {'lr': 0.00019982747516398015, 'samples': 855936, 'steps': 1671, 'loss/train': 3.0719735622406006} -09/20/2021 20:16:51 - INFO - __main__ - Step 26749: {'lr': 0.00019982747516398015, 'samples': 855968, 'steps': 1671, 'loss/train': 2.0757381916046143} -09/20/2021 20:16:52 - INFO - __main__ - Step 26750: {'lr': 0.00019982747516398015, 'samples': 856000, 'steps': 1671, 'loss/train': 2.84942889213562} -09/20/2021 20:16:53 - INFO - __main__ - Step 26751: {'lr': 0.00019982747516398015, 'samples': 856032, 'steps': 1671, 'loss/train': 2.020406723022461} -09/20/2021 20:16:54 - INFO - __main__ - Step 26752: {'lr': 0.00019982747516398015, 'samples': 856064, 'steps': 1671, 'loss/train': 2.7064244747161865} -09/20/2021 20:16:54 - INFO - __main__ - Step 26753: {'lr': 0.00019982710042187863, 'samples': 856096, 'steps': 1672, 'loss/train': 3.0468497276306152} -09/20/2021 20:16:55 - INFO - __main__ - Step 26754: {'lr': 0.00019982710042187863, 'samples': 856128, 'steps': 1672, 'loss/train': 2.8198230266571045} -09/20/2021 20:16:56 - INFO - __main__ - Step 26755: {'lr': 0.00019982710042187863, 'samples': 856160, 'steps': 1672, 'loss/train': 2.751654863357544} -09/20/2021 20:16:57 - INFO - __main__ - Step 26756: {'lr': 0.00019982710042187863, 'samples': 856192, 'steps': 1672, 'loss/train': 2.761503219604492} -09/20/2021 20:16:57 - INFO - __main__ - Step 26757: {'lr': 0.00019982710042187863, 'samples': 856224, 'steps': 1672, 'loss/train': 1.5478328466415405} -09/20/2021 20:16:58 - INFO - __main__ - Step 26758: {'lr': 0.00019982710042187863, 'samples': 856256, 'steps': 1672, 'loss/train': 3.578533411026001} -09/20/2021 20:16:59 - INFO - __main__ - Step 26759: {'lr': 0.00019982710042187863, 'samples': 856288, 'steps': 1672, 'loss/train': 3.3114101886749268} -09/20/2021 20:17:00 - INFO - __main__ - Step 26760: {'lr': 0.00019982710042187863, 'samples': 856320, 'steps': 1672, 'loss/train': 2.4480090141296387} -09/20/2021 20:17:00 - INFO - __main__ - Step 26761: {'lr': 0.00019982710042187863, 'samples': 856352, 'steps': 1672, 'loss/train': 3.1058311462402344} -09/20/2021 20:17:01 - INFO - __main__ - Step 26762: {'lr': 0.00019982710042187863, 'samples': 856384, 'steps': 1672, 'loss/train': 3.095628499984741} -09/20/2021 20:17:02 - INFO - __main__ - Step 26763: {'lr': 0.00019982710042187863, 'samples': 856416, 'steps': 1672, 'loss/train': 2.9493846893310547} -09/20/2021 20:17:03 - INFO - __main__ - Step 26764: {'lr': 0.00019982710042187863, 'samples': 856448, 'steps': 1672, 'loss/train': 2.9287033081054688} -09/20/2021 20:17:03 - INFO - __main__ - Step 26765: {'lr': 0.00019982710042187863, 'samples': 856480, 'steps': 1672, 'loss/train': 2.8618640899658203} -09/20/2021 20:17:04 - INFO - __main__ - Step 26766: {'lr': 0.00019982710042187863, 'samples': 856512, 'steps': 1672, 'loss/train': 2.763223886489868} -09/20/2021 20:17:05 - INFO - __main__ - Step 26767: {'lr': 0.00019982710042187863, 'samples': 856544, 'steps': 1672, 'loss/train': 2.7049524784088135} -09/20/2021 20:17:06 - INFO - __main__ - Step 26768: {'lr': 0.00019982710042187863, 'samples': 856576, 'steps': 1672, 'loss/train': 3.1575443744659424} -09/20/2021 20:17:07 - INFO - __main__ - Step 26769: {'lr': 0.00019982672527358103, 'samples': 856608, 'steps': 1673, 'loss/train': 2.9253275394439697} -09/20/2021 20:17:08 - INFO - __main__ - Step 26770: {'lr': 0.00019982672527358103, 'samples': 856640, 'steps': 1673, 'loss/train': 3.386444568634033} -09/20/2021 20:17:09 - INFO - __main__ - Step 26771: {'lr': 0.00019982672527358103, 'samples': 856672, 'steps': 1673, 'loss/train': 2.5405526161193848} -09/20/2021 20:17:09 - INFO - __main__ - Step 26772: {'lr': 0.00019982672527358103, 'samples': 856704, 'steps': 1673, 'loss/train': 2.4280989170074463} -09/20/2021 20:17:10 - INFO - __main__ - Step 26773: {'lr': 0.00019982672527358103, 'samples': 856736, 'steps': 1673, 'loss/train': 3.2294397354125977} -09/20/2021 20:17:11 - INFO - __main__ - Step 26774: {'lr': 0.00019982672527358103, 'samples': 856768, 'steps': 1673, 'loss/train': 2.697056293487549} -09/20/2021 20:17:12 - INFO - __main__ - Step 26775: {'lr': 0.00019982672527358103, 'samples': 856800, 'steps': 1673, 'loss/train': 3.4908673763275146} -09/20/2021 20:17:12 - INFO - __main__ - Step 26776: {'lr': 0.00019982672527358103, 'samples': 856832, 'steps': 1673, 'loss/train': 2.6358509063720703} -09/20/2021 20:17:13 - INFO - __main__ - Step 26777: {'lr': 0.00019982672527358103, 'samples': 856864, 'steps': 1673, 'loss/train': 3.0074381828308105} -09/20/2021 20:17:14 - INFO - __main__ - Step 26778: {'lr': 0.00019982672527358103, 'samples': 856896, 'steps': 1673, 'loss/train': 2.541494369506836} -09/20/2021 20:17:15 - INFO - __main__ - Step 26779: {'lr': 0.00019982672527358103, 'samples': 856928, 'steps': 1673, 'loss/train': 3.906188488006592} -09/20/2021 20:17:15 - INFO - __main__ - Step 26780: {'lr': 0.00019982672527358103, 'samples': 856960, 'steps': 1673, 'loss/train': 2.455409288406372} -09/20/2021 20:17:16 - INFO - __main__ - Step 26781: {'lr': 0.00019982672527358103, 'samples': 856992, 'steps': 1673, 'loss/train': 2.483429431915283} -09/20/2021 20:17:17 - INFO - __main__ - Step 26782: {'lr': 0.00019982672527358103, 'samples': 857024, 'steps': 1673, 'loss/train': 3.0041894912719727} -09/20/2021 20:17:18 - INFO - __main__ - Step 26783: {'lr': 0.00019982672527358103, 'samples': 857056, 'steps': 1673, 'loss/train': 2.8184804916381836} -09/20/2021 20:17:18 - INFO - __main__ - Step 26784: {'lr': 0.00019982672527358103, 'samples': 857088, 'steps': 1673, 'loss/train': 2.554499864578247} -09/20/2021 20:17:19 - INFO - __main__ - Step 26785: {'lr': 0.00019982634971908887, 'samples': 857120, 'steps': 1674, 'loss/train': 2.0793185234069824} -09/20/2021 20:17:20 - INFO - __main__ - Step 26786: {'lr': 0.00019982634971908887, 'samples': 857152, 'steps': 1674, 'loss/train': 3.2756283283233643} -09/20/2021 20:17:21 - INFO - __main__ - Step 26787: {'lr': 0.00019982634971908887, 'samples': 857184, 'steps': 1674, 'loss/train': 2.873056173324585} -09/20/2021 20:17:22 - INFO - __main__ - Step 26788: {'lr': 0.00019982634971908887, 'samples': 857216, 'steps': 1674, 'loss/train': 2.383152484893799} -09/20/2021 20:17:22 - INFO - __main__ - Step 26789: {'lr': 0.00019982634971908887, 'samples': 857248, 'steps': 1674, 'loss/train': 2.9644968509674072} -09/20/2021 20:17:23 - INFO - __main__ - Step 26790: {'lr': 0.00019982634971908887, 'samples': 857280, 'steps': 1674, 'loss/train': 1.0137114524841309} -09/20/2021 20:17:24 - INFO - __main__ - Step 26791: {'lr': 0.00019982634971908887, 'samples': 857312, 'steps': 1674, 'loss/train': 2.5809578895568848} -09/20/2021 20:17:25 - INFO - __main__ - Step 26792: {'lr': 0.00019982634971908887, 'samples': 857344, 'steps': 1674, 'loss/train': 2.983766555786133} -09/20/2021 20:17:25 - INFO - __main__ - Step 26793: {'lr': 0.00019982634971908887, 'samples': 857376, 'steps': 1674, 'loss/train': 2.891228199005127} -09/20/2021 20:17:26 - INFO - __main__ - Step 26794: {'lr': 0.00019982634971908887, 'samples': 857408, 'steps': 1674, 'loss/train': 2.62690806388855} -09/20/2021 20:17:27 - INFO - __main__ - Step 26795: {'lr': 0.00019982634971908887, 'samples': 857440, 'steps': 1674, 'loss/train': 2.880241632461548} -09/20/2021 20:17:28 - INFO - __main__ - Step 26796: {'lr': 0.00019982634971908887, 'samples': 857472, 'steps': 1674, 'loss/train': 2.8368842601776123} -09/20/2021 20:17:28 - INFO - __main__ - Step 26797: {'lr': 0.00019982634971908887, 'samples': 857504, 'steps': 1674, 'loss/train': 2.2941606044769287} -09/20/2021 20:17:29 - INFO - __main__ - Step 26798: {'lr': 0.00019982634971908887, 'samples': 857536, 'steps': 1674, 'loss/train': 2.642784357070923} -09/20/2021 20:17:30 - INFO - __main__ - Step 26799: {'lr': 0.00019982634971908887, 'samples': 857568, 'steps': 1674, 'loss/train': 2.2265214920043945} -09/20/2021 20:17:31 - INFO - __main__ - Step 26800: {'lr': 0.00019982634971908887, 'samples': 857600, 'steps': 1674, 'loss/train': 2.042165517807007} -09/20/2021 20:17:32 - INFO - __main__ - Step 26801: {'lr': 0.0001998259737584037, 'samples': 857632, 'steps': 1675, 'loss/train': 2.6624133586883545} -09/20/2021 20:17:33 - INFO - __main__ - Step 26802: {'lr': 0.0001998259737584037, 'samples': 857664, 'steps': 1675, 'loss/train': 1.9857103824615479} -09/20/2021 20:17:33 - INFO - __main__ - Step 26803: {'lr': 0.0001998259737584037, 'samples': 857696, 'steps': 1675, 'loss/train': 1.1726961135864258} -09/20/2021 20:17:34 - INFO - __main__ - Step 26804: {'lr': 0.0001998259737584037, 'samples': 857728, 'steps': 1675, 'loss/train': 1.099280595779419} -09/20/2021 20:17:35 - INFO - __main__ - Step 26805: {'lr': 0.0001998259737584037, 'samples': 857760, 'steps': 1675, 'loss/train': 2.81465744972229} -09/20/2021 20:17:36 - INFO - __main__ - Step 26806: {'lr': 0.0001998259737584037, 'samples': 857792, 'steps': 1675, 'loss/train': 2.5061097145080566} -09/20/2021 20:17:36 - INFO - __main__ - Step 26807: {'lr': 0.0001998259737584037, 'samples': 857824, 'steps': 1675, 'loss/train': 3.2429685592651367} -09/20/2021 20:17:37 - INFO - __main__ - Step 26808: {'lr': 0.0001998259737584037, 'samples': 857856, 'steps': 1675, 'loss/train': 2.5139055252075195} -09/20/2021 20:17:38 - INFO - __main__ - Step 26809: {'lr': 0.0001998259737584037, 'samples': 857888, 'steps': 1675, 'loss/train': 2.9033236503601074} -09/20/2021 20:17:39 - INFO - __main__ - Step 26810: {'lr': 0.0001998259737584037, 'samples': 857920, 'steps': 1675, 'loss/train': 2.26918888092041} -09/20/2021 20:17:40 - INFO - __main__ - Step 26811: {'lr': 0.0001998259737584037, 'samples': 857952, 'steps': 1675, 'loss/train': 2.1701231002807617} -09/20/2021 20:17:40 - INFO - __main__ - Step 26812: {'lr': 0.0001998259737584037, 'samples': 857984, 'steps': 1675, 'loss/train': 2.614428758621216} -09/20/2021 20:17:41 - INFO - __main__ - Step 26813: {'lr': 0.0001998259737584037, 'samples': 858016, 'steps': 1675, 'loss/train': 2.318603277206421} -09/20/2021 20:17:42 - INFO - __main__ - Step 26814: {'lr': 0.0001998259737584037, 'samples': 858048, 'steps': 1675, 'loss/train': 2.7118232250213623} -09/20/2021 20:17:43 - INFO - __main__ - Step 26815: {'lr': 0.0001998259737584037, 'samples': 858080, 'steps': 1675, 'loss/train': 3.3296425342559814} -09/20/2021 20:17:43 - INFO - __main__ - Step 26816: {'lr': 0.0001998259737584037, 'samples': 858112, 'steps': 1675, 'loss/train': 3.442215919494629} -09/20/2021 20:17:44 - INFO - __main__ - Step 26817: {'lr': 0.00019982559739152703, 'samples': 858144, 'steps': 1676, 'loss/train': 3.212026596069336} -09/20/2021 20:17:45 - INFO - __main__ - Step 26818: {'lr': 0.00019982559739152703, 'samples': 858176, 'steps': 1676, 'loss/train': 2.9857842922210693} -09/20/2021 20:17:46 - INFO - __main__ - Step 26819: {'lr': 0.00019982559739152703, 'samples': 858208, 'steps': 1676, 'loss/train': 3.9644486904144287} -09/20/2021 20:17:46 - INFO - __main__ - Step 26820: {'lr': 0.00019982559739152703, 'samples': 858240, 'steps': 1676, 'loss/train': 3.112011432647705} -09/20/2021 20:17:47 - INFO - __main__ - Step 26821: {'lr': 0.00019982559739152703, 'samples': 858272, 'steps': 1676, 'loss/train': 3.9139111042022705} -09/20/2021 20:17:48 - INFO - __main__ - Step 26822: {'lr': 0.00019982559739152703, 'samples': 858304, 'steps': 1676, 'loss/train': 2.2352333068847656} -09/20/2021 20:17:49 - INFO - __main__ - Step 26823: {'lr': 0.00019982559739152703, 'samples': 858336, 'steps': 1676, 'loss/train': 3.011655330657959} -09/20/2021 20:17:49 - INFO - __main__ - Step 26824: {'lr': 0.00019982559739152703, 'samples': 858368, 'steps': 1676, 'loss/train': 4.042206764221191} -09/20/2021 20:17:50 - INFO - __main__ - Step 26825: {'lr': 0.00019982559739152703, 'samples': 858400, 'steps': 1676, 'loss/train': 4.166642189025879} -09/20/2021 20:17:51 - INFO - __main__ - Step 26826: {'lr': 0.00019982559739152703, 'samples': 858432, 'steps': 1676, 'loss/train': 2.7929604053497314} -09/20/2021 20:17:52 - INFO - __main__ - Step 26827: {'lr': 0.00019982559739152703, 'samples': 858464, 'steps': 1676, 'loss/train': 1.579185128211975} -09/20/2021 20:17:52 - INFO - __main__ - Step 26828: {'lr': 0.00019982559739152703, 'samples': 858496, 'steps': 1676, 'loss/train': 1.5795167684555054} -09/20/2021 20:17:53 - INFO - __main__ - Step 26829: {'lr': 0.00019982559739152703, 'samples': 858528, 'steps': 1676, 'loss/train': 1.8564163446426392} -09/20/2021 20:17:54 - INFO - __main__ - Step 26830: {'lr': 0.00019982559739152703, 'samples': 858560, 'steps': 1676, 'loss/train': 2.909087657928467} -09/20/2021 20:17:56 - INFO - __main__ - Step 26831: {'lr': 0.00019982559739152703, 'samples': 858592, 'steps': 1676, 'loss/train': 3.3988633155822754} -09/20/2021 20:17:56 - INFO - __main__ - Step 26832: {'lr': 0.00019982559739152703, 'samples': 858624, 'steps': 1676, 'loss/train': 3.185614585876465} -09/20/2021 20:17:57 - INFO - __main__ - Step 26833: {'lr': 0.00019982522061846037, 'samples': 858656, 'steps': 1677, 'loss/train': 2.5356035232543945} -09/20/2021 20:17:58 - INFO - __main__ - Step 26834: {'lr': 0.00019982522061846037, 'samples': 858688, 'steps': 1677, 'loss/train': 2.3762528896331787} -09/20/2021 20:17:59 - INFO - __main__ - Step 26835: {'lr': 0.00019982522061846037, 'samples': 858720, 'steps': 1677, 'loss/train': 3.358039379119873} -09/20/2021 20:17:59 - INFO - __main__ - Step 26836: {'lr': 0.00019982522061846037, 'samples': 858752, 'steps': 1677, 'loss/train': 1.3780808448791504} -09/20/2021 20:18:00 - INFO - __main__ - Step 26837: {'lr': 0.00019982522061846037, 'samples': 858784, 'steps': 1677, 'loss/train': 2.6039135456085205} -09/20/2021 20:18:01 - INFO - __main__ - Step 26838: {'lr': 0.00019982522061846037, 'samples': 858816, 'steps': 1677, 'loss/train': 2.882657289505005} -09/20/2021 20:18:02 - INFO - __main__ - Step 26839: {'lr': 0.00019982522061846037, 'samples': 858848, 'steps': 1677, 'loss/train': 1.5015912055969238} -09/20/2021 20:18:02 - INFO - __main__ - Step 26840: {'lr': 0.00019982522061846037, 'samples': 858880, 'steps': 1677, 'loss/train': 1.0886719226837158} -09/20/2021 20:18:03 - INFO - __main__ - Step 26841: {'lr': 0.00019982522061846037, 'samples': 858912, 'steps': 1677, 'loss/train': 1.6489841938018799} -09/20/2021 20:18:04 - INFO - __main__ - Step 26842: {'lr': 0.00019982522061846037, 'samples': 858944, 'steps': 1677, 'loss/train': 1.5250316858291626} -09/20/2021 20:18:05 - INFO - __main__ - Step 26843: {'lr': 0.00019982522061846037, 'samples': 858976, 'steps': 1677, 'loss/train': 1.780761480331421} -09/20/2021 20:18:05 - INFO - __main__ - Step 26844: {'lr': 0.00019982522061846037, 'samples': 859008, 'steps': 1677, 'loss/train': 1.4889365434646606} -09/20/2021 20:18:06 - INFO - __main__ - Step 26845: {'lr': 0.00019982522061846037, 'samples': 859040, 'steps': 1677, 'loss/train': 1.3303008079528809} -09/20/2021 20:18:07 - INFO - __main__ - Step 26846: {'lr': 0.00019982522061846037, 'samples': 859072, 'steps': 1677, 'loss/train': 1.410526990890503} -09/20/2021 20:18:08 - INFO - __main__ - Step 26847: {'lr': 0.00019982522061846037, 'samples': 859104, 'steps': 1677, 'loss/train': 1.5974184274673462} -09/20/2021 20:18:08 - INFO - __main__ - Step 26848: {'lr': 0.00019982522061846037, 'samples': 859136, 'steps': 1677, 'loss/train': 2.5046470165252686} -09/20/2021 20:18:09 - INFO - __main__ - Step 26849: {'lr': 0.00019982484343920528, 'samples': 859168, 'steps': 1678, 'loss/train': 2.5328187942504883} -09/20/2021 20:18:10 - INFO - __main__ - Step 26850: {'lr': 0.00019982484343920528, 'samples': 859200, 'steps': 1678, 'loss/train': 2.518263339996338} -09/20/2021 20:18:11 - INFO - __main__ - Step 26851: {'lr': 0.00019982484343920528, 'samples': 859232, 'steps': 1678, 'loss/train': 3.3652992248535156} -09/20/2021 20:18:12 - INFO - __main__ - Step 26852: {'lr': 0.00019982484343920528, 'samples': 859264, 'steps': 1678, 'loss/train': 2.2144715785980225} -09/20/2021 20:18:12 - INFO - __main__ - Step 26853: {'lr': 0.00019982484343920528, 'samples': 859296, 'steps': 1678, 'loss/train': 3.1756703853607178} -09/20/2021 20:18:13 - INFO - __main__ - Step 26854: {'lr': 0.00019982484343920528, 'samples': 859328, 'steps': 1678, 'loss/train': 2.5894715785980225} -09/20/2021 20:18:14 - INFO - __main__ - Step 26855: {'lr': 0.00019982484343920528, 'samples': 859360, 'steps': 1678, 'loss/train': 1.3932700157165527} -09/20/2021 20:18:15 - INFO - __main__ - Step 26856: {'lr': 0.00019982484343920528, 'samples': 859392, 'steps': 1678, 'loss/train': 2.3757097721099854} -09/20/2021 20:18:15 - INFO - __main__ - Step 26857: {'lr': 0.00019982484343920528, 'samples': 859424, 'steps': 1678, 'loss/train': 2.863762140274048} -09/20/2021 20:18:16 - INFO - __main__ - Step 26858: {'lr': 0.00019982484343920528, 'samples': 859456, 'steps': 1678, 'loss/train': 2.511518955230713} -09/20/2021 20:18:17 - INFO - __main__ - Step 26859: {'lr': 0.00019982484343920528, 'samples': 859488, 'steps': 1678, 'loss/train': 1.9587411880493164} -09/20/2021 20:18:18 - INFO - __main__ - Step 26860: {'lr': 0.00019982484343920528, 'samples': 859520, 'steps': 1678, 'loss/train': 2.2961323261260986} -09/20/2021 20:18:18 - INFO - __main__ - Step 26861: {'lr': 0.00019982484343920528, 'samples': 859552, 'steps': 1678, 'loss/train': 0.9003371000289917} -09/20/2021 20:18:19 - INFO - __main__ - Step 26862: {'lr': 0.00019982484343920528, 'samples': 859584, 'steps': 1678, 'loss/train': 0.7365339398384094} -09/20/2021 20:18:20 - INFO - __main__ - Step 26863: {'lr': 0.00019982484343920528, 'samples': 859616, 'steps': 1678, 'loss/train': 0.5242576003074646} -09/20/2021 20:18:21 - INFO - __main__ - Step 26864: {'lr': 0.00019982484343920528, 'samples': 859648, 'steps': 1678, 'loss/train': 0.88947993516922} -09/20/2021 20:18:21 - INFO - __main__ - Step 26865: {'lr': 0.0001998244658537633, 'samples': 859680, 'steps': 1679, 'loss/train': 3.2252652645111084} -09/20/2021 20:18:23 - INFO - __main__ - Step 26866: {'lr': 0.0001998244658537633, 'samples': 859712, 'steps': 1679, 'loss/train': 2.8386166095733643} -09/20/2021 20:18:24 - INFO - __main__ - Step 26867: {'lr': 0.0001998244658537633, 'samples': 859744, 'steps': 1679, 'loss/train': 2.6900556087493896} -09/20/2021 20:18:24 - INFO - __main__ - Step 26868: {'lr': 0.0001998244658537633, 'samples': 859776, 'steps': 1679, 'loss/train': 2.3879804611206055} -09/20/2021 20:18:25 - INFO - __main__ - Step 26869: {'lr': 0.0001998244658537633, 'samples': 859808, 'steps': 1679, 'loss/train': 2.3362717628479004} -09/20/2021 20:18:26 - INFO - __main__ - Step 26870: {'lr': 0.0001998244658537633, 'samples': 859840, 'steps': 1679, 'loss/train': 2.984978437423706} -09/20/2021 20:18:27 - INFO - __main__ - Step 26871: {'lr': 0.0001998244658537633, 'samples': 859872, 'steps': 1679, 'loss/train': 2.195889711380005} -09/20/2021 20:18:27 - INFO - __main__ - Step 26872: {'lr': 0.0001998244658537633, 'samples': 859904, 'steps': 1679, 'loss/train': 2.88012957572937} -09/20/2021 20:18:28 - INFO - __main__ - Step 26873: {'lr': 0.0001998244658537633, 'samples': 859936, 'steps': 1679, 'loss/train': 2.357058048248291} -09/20/2021 20:18:29 - INFO - __main__ - Step 26874: {'lr': 0.0001998244658537633, 'samples': 859968, 'steps': 1679, 'loss/train': 0.675869882106781} -09/20/2021 20:18:30 - INFO - __main__ - Step 26875: {'lr': 0.0001998244658537633, 'samples': 860000, 'steps': 1679, 'loss/train': 1.2101666927337646} -09/20/2021 20:18:30 - INFO - __main__ - Step 26876: {'lr': 0.0001998244658537633, 'samples': 860032, 'steps': 1679, 'loss/train': 0.7402965426445007} -09/20/2021 20:18:31 - INFO - __main__ - Step 26877: {'lr': 0.0001998244658537633, 'samples': 860064, 'steps': 1679, 'loss/train': 0.6241810321807861} -09/20/2021 20:18:32 - INFO - __main__ - Step 26878: {'lr': 0.0001998244658537633, 'samples': 860096, 'steps': 1679, 'loss/train': 0.4844493567943573} -09/20/2021 20:18:33 - INFO - __main__ - Step 26879: {'lr': 0.0001998244658537633, 'samples': 860128, 'steps': 1679, 'loss/train': 2.2070415019989014} -09/20/2021 20:18:33 - INFO - __main__ - Step 26880: {'lr': 0.0001998244658537633, 'samples': 860160, 'steps': 1679, 'loss/train': 3.1343636512756348} -09/20/2021 20:18:34 - INFO - __main__ - Step 26881: {'lr': 0.00019982408786213595, 'samples': 860192, 'steps': 1680, 'loss/train': 2.9006214141845703} -09/20/2021 20:18:35 - INFO - __main__ - Step 26882: {'lr': 0.00019982408786213595, 'samples': 860224, 'steps': 1680, 'loss/train': 2.187589406967163} -09/20/2021 20:18:36 - INFO - __main__ - Step 26883: {'lr': 0.00019982408786213595, 'samples': 860256, 'steps': 1680, 'loss/train': 2.8779358863830566} -09/20/2021 20:18:37 - INFO - __main__ - Step 26884: {'lr': 0.00019982408786213595, 'samples': 860288, 'steps': 1680, 'loss/train': 2.088277816772461} -09/20/2021 20:18:37 - INFO - __main__ - Step 26885: {'lr': 0.00019982408786213595, 'samples': 860320, 'steps': 1680, 'loss/train': 3.1718311309814453} -09/20/2021 20:18:38 - INFO - __main__ - Step 26886: {'lr': 0.00019982408786213595, 'samples': 860352, 'steps': 1680, 'loss/train': 0.8047072887420654} -09/20/2021 20:18:39 - INFO - __main__ - Step 26887: {'lr': 0.00019982408786213595, 'samples': 860384, 'steps': 1680, 'loss/train': 2.4037418365478516} -09/20/2021 20:18:40 - INFO - __main__ - Step 26888: {'lr': 0.00019982408786213595, 'samples': 860416, 'steps': 1680, 'loss/train': 2.4525721073150635} -09/20/2021 20:18:40 - INFO - __main__ - Step 26889: {'lr': 0.00019982408786213595, 'samples': 860448, 'steps': 1680, 'loss/train': 2.6014513969421387} -09/20/2021 20:18:41 - INFO - __main__ - Step 26890: {'lr': 0.00019982408786213595, 'samples': 860480, 'steps': 1680, 'loss/train': 2.5350019931793213} -09/20/2021 20:18:42 - INFO - __main__ - Step 26891: {'lr': 0.00019982408786213595, 'samples': 860512, 'steps': 1680, 'loss/train': 2.8537235260009766} -09/20/2021 20:18:43 - INFO - __main__ - Step 26892: {'lr': 0.00019982408786213595, 'samples': 860544, 'steps': 1680, 'loss/train': 3.3576090335845947} -09/20/2021 20:18:43 - INFO - __main__ - Step 26893: {'lr': 0.00019982408786213595, 'samples': 860576, 'steps': 1680, 'loss/train': 2.481252908706665} -09/20/2021 20:18:44 - INFO - __main__ - Step 26894: {'lr': 0.00019982408786213595, 'samples': 860608, 'steps': 1680, 'loss/train': 3.7612338066101074} -09/20/2021 20:18:45 - INFO - __main__ - Step 26895: {'lr': 0.00019982408786213595, 'samples': 860640, 'steps': 1680, 'loss/train': 3.817445993423462} -09/20/2021 20:18:46 - INFO - __main__ - Step 26896: {'lr': 0.00019982408786213595, 'samples': 860672, 'steps': 1680, 'loss/train': 3.3768630027770996} -09/20/2021 20:18:47 - INFO - __main__ - Step 26897: {'lr': 0.0001998237094643248, 'samples': 860704, 'steps': 1681, 'loss/train': 2.779858350753784} -09/20/2021 20:18:48 - INFO - __main__ - Step 26898: {'lr': 0.0001998237094643248, 'samples': 860736, 'steps': 1681, 'loss/train': 3.0125322341918945} -09/20/2021 20:18:49 - INFO - __main__ - Step 26899: {'lr': 0.0001998237094643248, 'samples': 860768, 'steps': 1681, 'loss/train': 5.0245041847229} -09/20/2021 20:18:49 - INFO - __main__ - Step 26900: {'lr': 0.0001998237094643248, 'samples': 860800, 'steps': 1681, 'loss/train': 2.767012596130371} -09/20/2021 20:18:50 - INFO - __main__ - Step 26901: {'lr': 0.0001998237094643248, 'samples': 860832, 'steps': 1681, 'loss/train': 2.5050625801086426} -09/20/2021 20:18:51 - INFO - __main__ - Step 26902: {'lr': 0.0001998237094643248, 'samples': 860864, 'steps': 1681, 'loss/train': 3.82470440864563} -09/20/2021 20:18:52 - INFO - __main__ - Step 26903: {'lr': 0.0001998237094643248, 'samples': 860896, 'steps': 1681, 'loss/train': 2.806065559387207} -09/20/2021 20:18:52 - INFO - __main__ - Step 26904: {'lr': 0.0001998237094643248, 'samples': 860928, 'steps': 1681, 'loss/train': 2.6726057529449463} -09/20/2021 20:18:53 - INFO - __main__ - Step 26905: {'lr': 0.0001998237094643248, 'samples': 860960, 'steps': 1681, 'loss/train': 2.309321403503418} -09/20/2021 20:18:54 - INFO - __main__ - Step 26906: {'lr': 0.0001998237094643248, 'samples': 860992, 'steps': 1681, 'loss/train': 3.361605644226074} -09/20/2021 20:18:55 - INFO - __main__ - Step 26907: {'lr': 0.0001998237094643248, 'samples': 861024, 'steps': 1681, 'loss/train': 2.132136821746826} -09/20/2021 20:18:55 - INFO - __main__ - Step 26908: {'lr': 0.0001998237094643248, 'samples': 861056, 'steps': 1681, 'loss/train': 2.144346237182617} -09/20/2021 20:18:56 - INFO - __main__ - Step 26909: {'lr': 0.0001998237094643248, 'samples': 861088, 'steps': 1681, 'loss/train': 2.404594659805298} -09/20/2021 20:18:57 - INFO - __main__ - Step 26910: {'lr': 0.0001998237094643248, 'samples': 861120, 'steps': 1681, 'loss/train': 2.0097761154174805} -09/20/2021 20:18:58 - INFO - __main__ - Step 26911: {'lr': 0.0001998237094643248, 'samples': 861152, 'steps': 1681, 'loss/train': 2.2098805904388428} -09/20/2021 20:18:58 - INFO - __main__ - Step 26912: {'lr': 0.0001998237094643248, 'samples': 861184, 'steps': 1681, 'loss/train': 1.4720046520233154} -09/20/2021 20:18:59 - INFO - __main__ - Step 26913: {'lr': 0.00019982333066033132, 'samples': 861216, 'steps': 1682, 'loss/train': 4.154382228851318} -09/20/2021 20:19:00 - INFO - __main__ - Step 26914: {'lr': 0.00019982333066033132, 'samples': 861248, 'steps': 1682, 'loss/train': 3.123537302017212} -09/20/2021 20:19:01 - INFO - __main__ - Step 26915: {'lr': 0.00019982333066033132, 'samples': 861280, 'steps': 1682, 'loss/train': 2.5151729583740234} -09/20/2021 20:19:01 - INFO - __main__ - Step 26916: {'lr': 0.00019982333066033132, 'samples': 861312, 'steps': 1682, 'loss/train': 2.4394752979278564} -09/20/2021 20:19:02 - INFO - __main__ - Step 26917: {'lr': 0.00019982333066033132, 'samples': 861344, 'steps': 1682, 'loss/train': 2.7907817363739014} -09/20/2021 20:19:03 - INFO - __main__ - Step 26918: {'lr': 0.00019982333066033132, 'samples': 861376, 'steps': 1682, 'loss/train': 2.666492223739624} -09/20/2021 20:19:04 - INFO - __main__ - Step 26919: {'lr': 0.00019982333066033132, 'samples': 861408, 'steps': 1682, 'loss/train': 3.196382522583008} -09/20/2021 20:19:04 - INFO - __main__ - Step 26920: {'lr': 0.00019982333066033132, 'samples': 861440, 'steps': 1682, 'loss/train': 2.980665445327759} -09/20/2021 20:19:05 - INFO - __main__ - Step 26921: {'lr': 0.00019982333066033132, 'samples': 861472, 'steps': 1682, 'loss/train': 3.5653300285339355} -09/20/2021 20:19:06 - INFO - __main__ - Step 26922: {'lr': 0.00019982333066033132, 'samples': 861504, 'steps': 1682, 'loss/train': 3.0064942836761475} -09/20/2021 20:19:07 - INFO - __main__ - Step 26923: {'lr': 0.00019982333066033132, 'samples': 861536, 'steps': 1682, 'loss/train': 2.30938458442688} -09/20/2021 20:19:07 - INFO - __main__ - Step 26924: {'lr': 0.00019982333066033132, 'samples': 861568, 'steps': 1682, 'loss/train': 2.725277900695801} -09/20/2021 20:19:08 - INFO - __main__ - Step 26925: {'lr': 0.00019982333066033132, 'samples': 861600, 'steps': 1682, 'loss/train': 3.0892810821533203} -09/20/2021 20:19:09 - INFO - __main__ - Step 26926: {'lr': 0.00019982333066033132, 'samples': 861632, 'steps': 1682, 'loss/train': 3.2638325691223145} -09/20/2021 20:19:10 - INFO - __main__ - Step 26927: {'lr': 0.00019982333066033132, 'samples': 861664, 'steps': 1682, 'loss/train': 2.960038423538208} -09/20/2021 20:19:10 - INFO - __main__ - Step 26928: {'lr': 0.00019982333066033132, 'samples': 861696, 'steps': 1682, 'loss/train': 2.8220901489257812} -09/20/2021 20:19:12 - INFO - __main__ - Step 26929: {'lr': 0.0001998229514501571, 'samples': 861728, 'steps': 1683, 'loss/train': 2.3080506324768066} -09/20/2021 20:19:13 - INFO - __main__ - Step 26930: {'lr': 0.0001998229514501571, 'samples': 861760, 'steps': 1683, 'loss/train': 3.1151058673858643} -09/20/2021 20:19:14 - INFO - __main__ - Step 26931: {'lr': 0.0001998229514501571, 'samples': 861792, 'steps': 1683, 'loss/train': 3.267249822616577} -09/20/2021 20:19:14 - INFO - __main__ - Step 26932: {'lr': 0.0001998229514501571, 'samples': 861824, 'steps': 1683, 'loss/train': 2.679323196411133} -09/20/2021 20:19:15 - INFO - __main__ - Step 26933: {'lr': 0.0001998229514501571, 'samples': 861856, 'steps': 1683, 'loss/train': 2.762606620788574} -09/20/2021 20:19:16 - INFO - __main__ - Step 26934: {'lr': 0.0001998229514501571, 'samples': 861888, 'steps': 1683, 'loss/train': 2.5531833171844482} -09/20/2021 20:19:17 - INFO - __main__ - Step 26935: {'lr': 0.0001998229514501571, 'samples': 861920, 'steps': 1683, 'loss/train': 1.7119336128234863} -09/20/2021 20:19:17 - INFO - __main__ - Step 26936: {'lr': 0.0001998229514501571, 'samples': 861952, 'steps': 1683, 'loss/train': 1.6306331157684326} -09/20/2021 20:19:18 - INFO - __main__ - Step 26937: {'lr': 0.0001998229514501571, 'samples': 861984, 'steps': 1683, 'loss/train': 1.1926854848861694} -09/20/2021 20:19:19 - INFO - __main__ - Step 26938: {'lr': 0.0001998229514501571, 'samples': 862016, 'steps': 1683, 'loss/train': 2.8608148097991943} -09/20/2021 20:19:20 - INFO - __main__ - Step 26939: {'lr': 0.0001998229514501571, 'samples': 862048, 'steps': 1683, 'loss/train': 2.0070698261260986} -09/20/2021 20:19:20 - INFO - __main__ - Step 26940: {'lr': 0.0001998229514501571, 'samples': 862080, 'steps': 1683, 'loss/train': 1.7633082866668701} -09/20/2021 20:19:21 - INFO - __main__ - Step 26941: {'lr': 0.0001998229514501571, 'samples': 862112, 'steps': 1683, 'loss/train': 2.6187472343444824} -09/20/2021 20:19:22 - INFO - __main__ - Step 26942: {'lr': 0.0001998229514501571, 'samples': 862144, 'steps': 1683, 'loss/train': 3.2191431522369385} -09/20/2021 20:19:23 - INFO - __main__ - Step 26943: {'lr': 0.0001998229514501571, 'samples': 862176, 'steps': 1683, 'loss/train': 3.5581207275390625} -09/20/2021 20:19:23 - INFO - __main__ - Step 26944: {'lr': 0.0001998229514501571, 'samples': 862208, 'steps': 1683, 'loss/train': 2.9806158542633057} -09/20/2021 20:19:24 - INFO - __main__ - Step 26945: {'lr': 0.0001998225718338037, 'samples': 862240, 'steps': 1684, 'loss/train': 2.513852596282959} -09/20/2021 20:19:25 - INFO - __main__ - Step 26946: {'lr': 0.0001998225718338037, 'samples': 862272, 'steps': 1684, 'loss/train': 6.138484001159668} -09/20/2021 20:19:26 - INFO - __main__ - Step 26947: {'lr': 0.0001998225718338037, 'samples': 862304, 'steps': 1684, 'loss/train': 6.119961261749268} -09/20/2021 20:19:26 - INFO - __main__ - Step 26948: {'lr': 0.0001998225718338037, 'samples': 862336, 'steps': 1684, 'loss/train': 2.910728931427002} -09/20/2021 20:19:27 - INFO - __main__ - Step 26949: {'lr': 0.0001998225718338037, 'samples': 862368, 'steps': 1684, 'loss/train': 3.0709030628204346} -09/20/2021 20:19:28 - INFO - __main__ - Step 26950: {'lr': 0.0001998225718338037, 'samples': 862400, 'steps': 1684, 'loss/train': 3.6522233486175537} -09/20/2021 20:19:29 - INFO - __main__ - Step 26951: {'lr': 0.0001998225718338037, 'samples': 862432, 'steps': 1684, 'loss/train': 4.5104780197143555} -09/20/2021 20:19:29 - INFO - __main__ - Step 26952: {'lr': 0.0001998225718338037, 'samples': 862464, 'steps': 1684, 'loss/train': 3.33855938911438} -09/20/2021 20:19:30 - INFO - __main__ - Step 26953: {'lr': 0.0001998225718338037, 'samples': 862496, 'steps': 1684, 'loss/train': 0.4724116027355194} -09/20/2021 20:19:31 - INFO - __main__ - Step 26954: {'lr': 0.0001998225718338037, 'samples': 862528, 'steps': 1684, 'loss/train': 0.6962369084358215} -09/20/2021 20:19:32 - INFO - __main__ - Step 26955: {'lr': 0.0001998225718338037, 'samples': 862560, 'steps': 1684, 'loss/train': 0.7302082777023315} -09/20/2021 20:19:32 - INFO - __main__ - Step 26956: {'lr': 0.0001998225718338037, 'samples': 862592, 'steps': 1684, 'loss/train': 2.232618570327759} -09/20/2021 20:19:33 - INFO - __main__ - Step 26957: {'lr': 0.0001998225718338037, 'samples': 862624, 'steps': 1684, 'loss/train': 3.6382763385772705} -09/20/2021 20:19:34 - INFO - __main__ - Step 26958: {'lr': 0.0001998225718338037, 'samples': 862656, 'steps': 1684, 'loss/train': 2.594735860824585} -09/20/2021 20:19:35 - INFO - __main__ - Step 26959: {'lr': 0.0001998225718338037, 'samples': 862688, 'steps': 1684, 'loss/train': 3.0943193435668945} -09/20/2021 20:19:35 - INFO - __main__ - Step 26960: {'lr': 0.0001998225718338037, 'samples': 862720, 'steps': 1684, 'loss/train': 1.8686366081237793} -09/20/2021 20:19:36 - INFO - __main__ - Step 26961: {'lr': 0.00019982219181127265, 'samples': 862752, 'steps': 1685, 'loss/train': 3.631960391998291} -09/20/2021 20:19:38 - INFO - __main__ - Step 26962: {'lr': 0.00019982219181127265, 'samples': 862784, 'steps': 1685, 'loss/train': 2.858313798904419} -09/20/2021 20:19:39 - INFO - __main__ - Step 26963: {'lr': 0.00019982219181127265, 'samples': 862816, 'steps': 1685, 'loss/train': 2.175328493118286} -09/20/2021 20:19:40 - INFO - __main__ - Step 26964: {'lr': 0.00019982219181127265, 'samples': 862848, 'steps': 1685, 'loss/train': 2.455132246017456} -09/20/2021 20:19:40 - INFO - __main__ - Step 26965: {'lr': 0.00019982219181127265, 'samples': 862880, 'steps': 1685, 'loss/train': 2.681919574737549} -09/20/2021 20:19:41 - INFO - __main__ - Step 26966: {'lr': 0.00019982219181127265, 'samples': 862912, 'steps': 1685, 'loss/train': 3.23223614692688} -09/20/2021 20:19:42 - INFO - __main__ - Step 26967: {'lr': 0.00019982219181127265, 'samples': 862944, 'steps': 1685, 'loss/train': 2.2323684692382812} -09/20/2021 20:19:43 - INFO - __main__ - Step 26968: {'lr': 0.00019982219181127265, 'samples': 862976, 'steps': 1685, 'loss/train': 2.4792885780334473} -09/20/2021 20:19:43 - INFO - __main__ - Step 26969: {'lr': 0.00019982219181127265, 'samples': 863008, 'steps': 1685, 'loss/train': 2.7522246837615967} -09/20/2021 20:19:44 - INFO - __main__ - Step 26970: {'lr': 0.00019982219181127265, 'samples': 863040, 'steps': 1685, 'loss/train': 2.9288408756256104} -09/20/2021 20:19:45 - INFO - __main__ - Step 26971: {'lr': 0.00019982219181127265, 'samples': 863072, 'steps': 1685, 'loss/train': 2.113480806350708} -09/20/2021 20:19:46 - INFO - __main__ - Step 26972: {'lr': 0.00019982219181127265, 'samples': 863104, 'steps': 1685, 'loss/train': 3.3158228397369385} -09/20/2021 20:19:46 - INFO - __main__ - Step 26973: {'lr': 0.00019982219181127265, 'samples': 863136, 'steps': 1685, 'loss/train': 0.670512855052948} -09/20/2021 20:19:47 - INFO - __main__ - Step 26974: {'lr': 0.00019982219181127265, 'samples': 863168, 'steps': 1685, 'loss/train': 0.6211841106414795} -09/20/2021 20:19:48 - INFO - __main__ - Step 26975: {'lr': 0.00019982219181127265, 'samples': 863200, 'steps': 1685, 'loss/train': 0.4263523817062378} -09/20/2021 20:19:49 - INFO - __main__ - Step 26976: {'lr': 0.00019982219181127265, 'samples': 863232, 'steps': 1685, 'loss/train': 1.5314557552337646} -09/20/2021 20:19:50 - INFO - __main__ - Step 26977: {'lr': 0.00019982181138256547, 'samples': 863264, 'steps': 1686, 'loss/train': 1.6565260887145996} -09/20/2021 20:19:50 - INFO - __main__ - Step 26978: {'lr': 0.00019982181138256547, 'samples': 863296, 'steps': 1686, 'loss/train': 2.28337025642395} -09/20/2021 20:19:51 - INFO - __main__ - Step 26979: {'lr': 0.00019982181138256547, 'samples': 863328, 'steps': 1686, 'loss/train': 1.7147752046585083} -09/20/2021 20:19:52 - INFO - __main__ - Step 26980: {'lr': 0.00019982181138256547, 'samples': 863360, 'steps': 1686, 'loss/train': 1.4609662294387817} -09/20/2021 20:19:53 - INFO - __main__ - Step 26981: {'lr': 0.00019982181138256547, 'samples': 863392, 'steps': 1686, 'loss/train': 3.2990005016326904} -09/20/2021 20:19:53 - INFO - __main__ - Step 26982: {'lr': 0.00019982181138256547, 'samples': 863424, 'steps': 1686, 'loss/train': 2.761960983276367} -09/20/2021 20:19:54 - INFO - __main__ - Step 26983: {'lr': 0.00019982181138256547, 'samples': 863456, 'steps': 1686, 'loss/train': 3.742222785949707} -09/20/2021 20:19:55 - INFO - __main__ - Step 26984: {'lr': 0.00019982181138256547, 'samples': 863488, 'steps': 1686, 'loss/train': 4.424907684326172} -09/20/2021 20:19:56 - INFO - __main__ - Step 26985: {'lr': 0.00019982181138256547, 'samples': 863520, 'steps': 1686, 'loss/train': 2.422837734222412} -09/20/2021 20:19:56 - INFO - __main__ - Step 26986: {'lr': 0.00019982181138256547, 'samples': 863552, 'steps': 1686, 'loss/train': 2.41268253326416} -09/20/2021 20:19:57 - INFO - __main__ - Step 26987: {'lr': 0.00019982181138256547, 'samples': 863584, 'steps': 1686, 'loss/train': 1.8958125114440918} -09/20/2021 20:19:58 - INFO - __main__ - Step 26988: {'lr': 0.00019982181138256547, 'samples': 863616, 'steps': 1686, 'loss/train': 1.6139410734176636} -09/20/2021 20:19:59 - INFO - __main__ - Step 26989: {'lr': 0.00019982181138256547, 'samples': 863648, 'steps': 1686, 'loss/train': 2.0795843601226807} -09/20/2021 20:19:59 - INFO - __main__ - Step 26990: {'lr': 0.00019982181138256547, 'samples': 863680, 'steps': 1686, 'loss/train': 2.04014253616333} -09/20/2021 20:20:00 - INFO - __main__ - Step 26991: {'lr': 0.00019982181138256547, 'samples': 863712, 'steps': 1686, 'loss/train': 1.8325188159942627} -09/20/2021 20:20:01 - INFO - __main__ - Step 26992: {'lr': 0.00019982181138256547, 'samples': 863744, 'steps': 1686, 'loss/train': 2.688429832458496} -09/20/2021 20:20:02 - INFO - __main__ - Step 26993: {'lr': 0.00019982143054768372, 'samples': 863776, 'steps': 1687, 'loss/train': 1.0388007164001465} -09/20/2021 20:20:02 - INFO - __main__ - Step 26994: {'lr': 0.00019982143054768372, 'samples': 863808, 'steps': 1687, 'loss/train': 1.0249459743499756} -09/20/2021 20:20:03 - INFO - __main__ - Step 26995: {'lr': 0.00019982143054768372, 'samples': 863840, 'steps': 1687, 'loss/train': 1.1877962350845337} -09/20/2021 20:20:04 - INFO - __main__ - Step 26996: {'lr': 0.00019982143054768372, 'samples': 863872, 'steps': 1687, 'loss/train': 1.2153162956237793} -09/20/2021 20:20:05 - INFO - __main__ - Step 26997: {'lr': 0.00019982143054768372, 'samples': 863904, 'steps': 1687, 'loss/train': 1.2213916778564453} -09/20/2021 20:20:05 - INFO - __main__ - Step 26998: {'lr': 0.00019982143054768372, 'samples': 863936, 'steps': 1687, 'loss/train': 1.2238866090774536} -09/20/2021 20:20:06 - INFO - __main__ - Step 26999: {'lr': 0.00019982143054768372, 'samples': 863968, 'steps': 1687, 'loss/train': 1.170627236366272} -09/20/2021 20:20:07 - INFO - __main__ - Step 27000: {'lr': 0.00019982143054768372, 'samples': 864000, 'steps': 1687, 'loss/train': 2.62078595161438} -09/20/2021 20:20:09 - INFO - __main__ - Step 27001: {'lr': 0.00019982143054768372, 'samples': 864032, 'steps': 1687, 'loss/train': 3.7030787467956543} -09/20/2021 20:20:09 - INFO - __main__ - Step 27002: {'lr': 0.00019982143054768372, 'samples': 864064, 'steps': 1687, 'loss/train': 2.5546810626983643} -09/20/2021 20:20:10 - INFO - __main__ - Step 27003: {'lr': 0.00019982143054768372, 'samples': 864096, 'steps': 1687, 'loss/train': 2.625279664993286} -09/20/2021 20:20:11 - INFO - __main__ - Step 27004: {'lr': 0.00019982143054768372, 'samples': 864128, 'steps': 1687, 'loss/train': 3.0410192012786865} -09/20/2021 20:20:12 - INFO - __main__ - Step 27005: {'lr': 0.00019982143054768372, 'samples': 864160, 'steps': 1687, 'loss/train': 1.895371675491333} -09/20/2021 20:20:12 - INFO - __main__ - Step 27006: {'lr': 0.00019982143054768372, 'samples': 864192, 'steps': 1687, 'loss/train': 3.38742995262146} -09/20/2021 20:20:13 - INFO - __main__ - Step 27007: {'lr': 0.00019982143054768372, 'samples': 864224, 'steps': 1687, 'loss/train': 2.8321616649627686} -09/20/2021 20:20:14 - INFO - __main__ - Step 27008: {'lr': 0.00019982143054768372, 'samples': 864256, 'steps': 1687, 'loss/train': 3.5981595516204834} -09/20/2021 20:20:15 - INFO - __main__ - Step 27009: {'lr': 0.00019982104930662897, 'samples': 864288, 'steps': 1688, 'loss/train': 2.4325907230377197} -09/20/2021 20:20:16 - INFO - __main__ - Step 27010: {'lr': 0.00019982104930662897, 'samples': 864320, 'steps': 1688, 'loss/train': 2.790656566619873} -09/20/2021 20:20:16 - INFO - __main__ - Step 27011: {'lr': 0.00019982104930662897, 'samples': 864352, 'steps': 1688, 'loss/train': 2.7415964603424072} -09/20/2021 20:20:17 - INFO - __main__ - Step 27012: {'lr': 0.00019982104930662897, 'samples': 864384, 'steps': 1688, 'loss/train': 2.997072219848633} -09/20/2021 20:20:18 - INFO - __main__ - Step 27013: {'lr': 0.00019982104930662897, 'samples': 864416, 'steps': 1688, 'loss/train': 2.1923201084136963} -09/20/2021 20:20:19 - INFO - __main__ - Step 27014: {'lr': 0.00019982104930662897, 'samples': 864448, 'steps': 1688, 'loss/train': 2.4971721172332764} -09/20/2021 20:20:19 - INFO - __main__ - Step 27015: {'lr': 0.00019982104930662897, 'samples': 864480, 'steps': 1688, 'loss/train': 2.2078652381896973} -09/20/2021 20:20:20 - INFO - __main__ - Step 27016: {'lr': 0.00019982104930662897, 'samples': 864512, 'steps': 1688, 'loss/train': 2.564204454421997} -09/20/2021 20:20:21 - INFO - __main__ - Step 27017: {'lr': 0.00019982104930662897, 'samples': 864544, 'steps': 1688, 'loss/train': 1.287845492362976} -09/20/2021 20:20:22 - INFO - __main__ - Step 27018: {'lr': 0.00019982104930662897, 'samples': 864576, 'steps': 1688, 'loss/train': 3.275630235671997} -09/20/2021 20:20:22 - INFO - __main__ - Step 27019: {'lr': 0.00019982104930662897, 'samples': 864608, 'steps': 1688, 'loss/train': 3.0005249977111816} -09/20/2021 20:20:23 - INFO - __main__ - Step 27020: {'lr': 0.00019982104930662897, 'samples': 864640, 'steps': 1688, 'loss/train': 2.2480533123016357} -09/20/2021 20:20:24 - INFO - __main__ - Step 27021: {'lr': 0.00019982104930662897, 'samples': 864672, 'steps': 1688, 'loss/train': 3.0272724628448486} -09/20/2021 20:20:25 - INFO - __main__ - Step 27022: {'lr': 0.00019982104930662897, 'samples': 864704, 'steps': 1688, 'loss/train': 2.1405138969421387} -09/20/2021 20:20:25 - INFO - __main__ - Step 27023: {'lr': 0.00019982104930662897, 'samples': 864736, 'steps': 1688, 'loss/train': 2.54103422164917} -09/20/2021 20:20:26 - INFO - __main__ - Step 27024: {'lr': 0.00019982104930662897, 'samples': 864768, 'steps': 1688, 'loss/train': 2.758601665496826} -09/20/2021 20:20:27 - INFO - __main__ - Step 27025: {'lr': 0.00019982066765940277, 'samples': 864800, 'steps': 1689, 'loss/train': 2.8326172828674316} -09/20/2021 20:20:28 - INFO - __main__ - Step 27026: {'lr': 0.00019982066765940277, 'samples': 864832, 'steps': 1689, 'loss/train': 2.174656629562378} -09/20/2021 20:20:29 - INFO - __main__ - Step 27027: {'lr': 0.00019982066765940277, 'samples': 864864, 'steps': 1689, 'loss/train': 2.464683771133423} -09/20/2021 20:20:29 - INFO - __main__ - Step 27028: {'lr': 0.00019982066765940277, 'samples': 864896, 'steps': 1689, 'loss/train': 2.6592094898223877} -09/20/2021 20:20:30 - INFO - __main__ - Step 27029: {'lr': 0.00019982066765940277, 'samples': 864928, 'steps': 1689, 'loss/train': 3.444230794906616} -09/20/2021 20:20:31 - INFO - __main__ - Step 27030: {'lr': 0.00019982066765940277, 'samples': 864960, 'steps': 1689, 'loss/train': 3.3808321952819824} -09/20/2021 20:20:32 - INFO - __main__ - Step 27031: {'lr': 0.00019982066765940277, 'samples': 864992, 'steps': 1689, 'loss/train': 3.402117967605591} -09/20/2021 20:20:33 - INFO - __main__ - Step 27032: {'lr': 0.00019982066765940277, 'samples': 865024, 'steps': 1689, 'loss/train': 2.9809563159942627} -09/20/2021 20:20:34 - INFO - __main__ - Step 27033: {'lr': 0.00019982066765940277, 'samples': 865056, 'steps': 1689, 'loss/train': 3.443117380142212} -09/20/2021 20:20:34 - INFO - __main__ - Step 27034: {'lr': 0.00019982066765940277, 'samples': 865088, 'steps': 1689, 'loss/train': 2.7344810962677} -09/20/2021 20:20:35 - INFO - __main__ - Step 27035: {'lr': 0.00019982066765940277, 'samples': 865120, 'steps': 1689, 'loss/train': 2.1691904067993164} -09/20/2021 20:20:36 - INFO - __main__ - Step 27036: {'lr': 0.00019982066765940277, 'samples': 865152, 'steps': 1689, 'loss/train': 2.3708763122558594} -09/20/2021 20:20:37 - INFO - __main__ - Step 27037: {'lr': 0.00019982066765940277, 'samples': 865184, 'steps': 1689, 'loss/train': 2.3265435695648193} -09/20/2021 20:20:37 - INFO - __main__ - Step 27038: {'lr': 0.00019982066765940277, 'samples': 865216, 'steps': 1689, 'loss/train': 3.4419069290161133} -09/20/2021 20:20:38 - INFO - __main__ - Step 27039: {'lr': 0.00019982066765940277, 'samples': 865248, 'steps': 1689, 'loss/train': 3.2979941368103027} -09/20/2021 20:20:39 - INFO - __main__ - Step 27040: {'lr': 0.00019982066765940277, 'samples': 865280, 'steps': 1689, 'loss/train': 3.0823893547058105} -09/20/2021 20:20:40 - INFO - __main__ - Step 27041: {'lr': 0.00019982028560600664, 'samples': 865312, 'steps': 1690, 'loss/train': 2.8837037086486816} -09/20/2021 20:20:40 - INFO - __main__ - Step 27042: {'lr': 0.00019982028560600664, 'samples': 865344, 'steps': 1690, 'loss/train': 0.7767895460128784} -09/20/2021 20:20:41 - INFO - __main__ - Step 27043: {'lr': 0.00019982028560600664, 'samples': 865376, 'steps': 1690, 'loss/train': 2.2342171669006348} -09/20/2021 20:20:42 - INFO - __main__ - Step 27044: {'lr': 0.00019982028560600664, 'samples': 865408, 'steps': 1690, 'loss/train': 2.424877166748047} -09/20/2021 20:20:43 - INFO - __main__ - Step 27045: {'lr': 0.00019982028560600664, 'samples': 865440, 'steps': 1690, 'loss/train': 2.0015151500701904} -09/20/2021 20:20:43 - INFO - __main__ - Step 27046: {'lr': 0.00019982028560600664, 'samples': 865472, 'steps': 1690, 'loss/train': 5.281360626220703} -09/20/2021 20:20:44 - INFO - __main__ - Step 27047: {'lr': 0.00019982028560600664, 'samples': 865504, 'steps': 1690, 'loss/train': 2.3072452545166016} -09/20/2021 20:20:45 - INFO - __main__ - Step 27048: {'lr': 0.00019982028560600664, 'samples': 865536, 'steps': 1690, 'loss/train': 2.707972526550293} -09/20/2021 20:20:46 - INFO - __main__ - Step 27049: {'lr': 0.00019982028560600664, 'samples': 865568, 'steps': 1690, 'loss/train': 2.574923515319824} -09/20/2021 20:20:46 - INFO - __main__ - Step 27050: {'lr': 0.00019982028560600664, 'samples': 865600, 'steps': 1690, 'loss/train': 1.9687014818191528} -09/20/2021 20:20:47 - INFO - __main__ - Step 27051: {'lr': 0.00019982028560600664, 'samples': 865632, 'steps': 1690, 'loss/train': 3.21744966506958} -09/20/2021 20:20:48 - INFO - __main__ - Step 27052: {'lr': 0.00019982028560600664, 'samples': 865664, 'steps': 1690, 'loss/train': 2.214109420776367} -09/20/2021 20:20:49 - INFO - __main__ - Step 27053: {'lr': 0.00019982028560600664, 'samples': 865696, 'steps': 1690, 'loss/train': 2.5336754322052} -09/20/2021 20:20:49 - INFO - __main__ - Step 27054: {'lr': 0.00019982028560600664, 'samples': 865728, 'steps': 1690, 'loss/train': 3.3062589168548584} -09/20/2021 20:20:50 - INFO - __main__ - Step 27055: {'lr': 0.00019982028560600664, 'samples': 865760, 'steps': 1690, 'loss/train': 1.2399128675460815} -09/20/2021 20:20:51 - INFO - __main__ - Step 27056: {'lr': 0.00019982028560600664, 'samples': 865792, 'steps': 1690, 'loss/train': 2.827915668487549} -09/20/2021 20:20:52 - INFO - __main__ - Step 27057: {'lr': 0.00019981990314644213, 'samples': 865824, 'steps': 1691, 'loss/train': 2.5326478481292725} -09/20/2021 20:20:53 - INFO - __main__ - Step 27058: {'lr': 0.00019981990314644213, 'samples': 865856, 'steps': 1691, 'loss/train': 2.685990810394287} -09/20/2021 20:20:53 - INFO - __main__ - Step 27059: {'lr': 0.00019981990314644213, 'samples': 865888, 'steps': 1691, 'loss/train': 4.046982765197754} -09/20/2021 20:20:54 - INFO - __main__ - Step 27060: {'lr': 0.00019981990314644213, 'samples': 865920, 'steps': 1691, 'loss/train': 1.1119600534439087} -09/20/2021 20:20:55 - INFO - __main__ - Step 27061: {'lr': 0.00019981990314644213, 'samples': 865952, 'steps': 1691, 'loss/train': 2.095707893371582} -09/20/2021 20:20:56 - INFO - __main__ - Step 27062: {'lr': 0.00019981990314644213, 'samples': 865984, 'steps': 1691, 'loss/train': 3.763157367706299} -09/20/2021 20:20:57 - INFO - __main__ - Step 27063: {'lr': 0.00019981990314644213, 'samples': 866016, 'steps': 1691, 'loss/train': 2.7225875854492188} -09/20/2021 20:20:58 - INFO - __main__ - Step 27064: {'lr': 0.00019981990314644213, 'samples': 866048, 'steps': 1691, 'loss/train': 2.7507641315460205} -09/20/2021 20:20:58 - INFO - __main__ - Step 27065: {'lr': 0.00019981990314644213, 'samples': 866080, 'steps': 1691, 'loss/train': 2.448683261871338} -09/20/2021 20:20:59 - INFO - __main__ - Step 27066: {'lr': 0.00019981990314644213, 'samples': 866112, 'steps': 1691, 'loss/train': 3.4762611389160156} -09/20/2021 20:21:00 - INFO - __main__ - Step 27067: {'lr': 0.00019981990314644213, 'samples': 866144, 'steps': 1691, 'loss/train': 2.3286361694335938} -09/20/2021 20:21:01 - INFO - __main__ - Step 27068: {'lr': 0.00019981990314644213, 'samples': 866176, 'steps': 1691, 'loss/train': 2.803727626800537} -09/20/2021 20:21:01 - INFO - __main__ - Step 27069: {'lr': 0.00019981990314644213, 'samples': 866208, 'steps': 1691, 'loss/train': 2.26357364654541} -09/20/2021 20:21:02 - INFO - __main__ - Step 27070: {'lr': 0.00019981990314644213, 'samples': 866240, 'steps': 1691, 'loss/train': 2.2980756759643555} -09/20/2021 20:21:03 - INFO - __main__ - Step 27071: {'lr': 0.00019981990314644213, 'samples': 866272, 'steps': 1691, 'loss/train': 2.1823461055755615} -09/20/2021 20:21:04 - INFO - __main__ - Step 27072: {'lr': 0.00019981990314644213, 'samples': 866304, 'steps': 1691, 'loss/train': 2.242528200149536} -09/20/2021 20:21:05 - INFO - __main__ - Step 27073: {'lr': 0.00019981952028071088, 'samples': 866336, 'steps': 1692, 'loss/train': 2.269517660140991} -09/20/2021 20:21:05 - INFO - __main__ - Step 27074: {'lr': 0.00019981952028071088, 'samples': 866368, 'steps': 1692, 'loss/train': 2.8445420265197754} -09/20/2021 20:21:06 - INFO - __main__ - Step 27075: {'lr': 0.00019981952028071088, 'samples': 866400, 'steps': 1692, 'loss/train': 2.3262548446655273} -09/20/2021 20:21:07 - INFO - __main__ - Step 27076: {'lr': 0.00019981952028071088, 'samples': 866432, 'steps': 1692, 'loss/train': 2.8768112659454346} -09/20/2021 20:21:08 - INFO - __main__ - Step 27077: {'lr': 0.00019981952028071088, 'samples': 866464, 'steps': 1692, 'loss/train': 3.057638168334961} -09/20/2021 20:21:08 - INFO - __main__ - Step 27078: {'lr': 0.00019981952028071088, 'samples': 866496, 'steps': 1692, 'loss/train': 3.68322491645813} -09/20/2021 20:21:09 - INFO - __main__ - Step 27079: {'lr': 0.00019981952028071088, 'samples': 866528, 'steps': 1692, 'loss/train': 2.2129664421081543} -09/20/2021 20:21:10 - INFO - __main__ - Step 27080: {'lr': 0.00019981952028071088, 'samples': 866560, 'steps': 1692, 'loss/train': 3.586226463317871} -09/20/2021 20:21:11 - INFO - __main__ - Step 27081: {'lr': 0.00019981952028071088, 'samples': 866592, 'steps': 1692, 'loss/train': 2.448385238647461} -09/20/2021 20:21:11 - INFO - __main__ - Step 27082: {'lr': 0.00019981952028071088, 'samples': 866624, 'steps': 1692, 'loss/train': 2.364335298538208} -09/20/2021 20:21:12 - INFO - __main__ - Step 27083: {'lr': 0.00019981952028071088, 'samples': 866656, 'steps': 1692, 'loss/train': 2.7835264205932617} -09/20/2021 20:21:13 - INFO - __main__ - Step 27084: {'lr': 0.00019981952028071088, 'samples': 866688, 'steps': 1692, 'loss/train': 2.772705554962158} -09/20/2021 20:21:14 - INFO - __main__ - Step 27085: {'lr': 0.00019981952028071088, 'samples': 866720, 'steps': 1692, 'loss/train': 3.2553699016571045} -09/20/2021 20:21:14 - INFO - __main__ - Step 27086: {'lr': 0.00019981952028071088, 'samples': 866752, 'steps': 1692, 'loss/train': 2.9042510986328125} -09/20/2021 20:21:15 - INFO - __main__ - Step 27087: {'lr': 0.00019981952028071088, 'samples': 866784, 'steps': 1692, 'loss/train': 2.2727534770965576} -09/20/2021 20:21:16 - INFO - __main__ - Step 27088: {'lr': 0.00019981952028071088, 'samples': 866816, 'steps': 1692, 'loss/train': 4.01897668838501} -09/20/2021 20:21:17 - INFO - __main__ - Step 27089: {'lr': 0.00019981913700881437, 'samples': 866848, 'steps': 1693, 'loss/train': 1.4487653970718384} -09/20/2021 20:21:18 - INFO - __main__ - Step 27090: {'lr': 0.00019981913700881437, 'samples': 866880, 'steps': 1693, 'loss/train': 2.907602310180664} -09/20/2021 20:21:18 - INFO - __main__ - Step 27091: {'lr': 0.00019981913700881437, 'samples': 866912, 'steps': 1693, 'loss/train': 1.8279904127120972} -09/20/2021 20:21:19 - INFO - __main__ - Step 27092: {'lr': 0.00019981913700881437, 'samples': 866944, 'steps': 1693, 'loss/train': 2.809041976928711} -09/20/2021 20:21:20 - INFO - __main__ - Step 27093: {'lr': 0.00019981913700881437, 'samples': 866976, 'steps': 1693, 'loss/train': 3.533533811569214} -09/20/2021 20:21:21 - INFO - __main__ - Step 27094: {'lr': 0.00019981913700881437, 'samples': 867008, 'steps': 1693, 'loss/train': 2.886089324951172} -09/20/2021 20:21:21 - INFO - __main__ - Step 27095: {'lr': 0.00019981913700881437, 'samples': 867040, 'steps': 1693, 'loss/train': 4.062779426574707} -09/20/2021 20:21:22 - INFO - __main__ - Step 27096: {'lr': 0.00019981913700881437, 'samples': 867072, 'steps': 1693, 'loss/train': 3.2049918174743652} -09/20/2021 20:21:23 - INFO - __main__ - Step 27097: {'lr': 0.00019981913700881437, 'samples': 867104, 'steps': 1693, 'loss/train': 2.7229950428009033} -09/20/2021 20:21:24 - INFO - __main__ - Step 27098: {'lr': 0.00019981913700881437, 'samples': 867136, 'steps': 1693, 'loss/train': 2.0094985961914062} -09/20/2021 20:21:25 - INFO - __main__ - Step 27099: {'lr': 0.00019981913700881437, 'samples': 867168, 'steps': 1693, 'loss/train': 1.9784029722213745} -09/20/2021 20:21:26 - INFO - __main__ - Step 27100: {'lr': 0.00019981913700881437, 'samples': 867200, 'steps': 1693, 'loss/train': 2.3337152004241943} -09/20/2021 20:21:26 - INFO - __main__ - Step 27101: {'lr': 0.00019981913700881437, 'samples': 867232, 'steps': 1693, 'loss/train': 1.9841598272323608} -09/20/2021 20:21:27 - INFO - __main__ - Step 27102: {'lr': 0.00019981913700881437, 'samples': 867264, 'steps': 1693, 'loss/train': 0.9780791997909546} -09/20/2021 20:21:28 - INFO - __main__ - Step 27103: {'lr': 0.00019981913700881437, 'samples': 867296, 'steps': 1693, 'loss/train': 1.4442598819732666} -09/20/2021 20:21:29 - INFO - __main__ - Step 27104: {'lr': 0.00019981913700881437, 'samples': 867328, 'steps': 1693, 'loss/train': 2.917896032333374} -09/20/2021 20:21:30 - INFO - __main__ - Step 27105: {'lr': 0.00019981875333075416, 'samples': 867360, 'steps': 1694, 'loss/train': 3.600202798843384} -09/20/2021 20:21:30 - INFO - __main__ - Step 27106: {'lr': 0.00019981875333075416, 'samples': 867392, 'steps': 1694, 'loss/train': 2.4004061222076416} -09/20/2021 20:21:31 - INFO - __main__ - Step 27107: {'lr': 0.00019981875333075416, 'samples': 867424, 'steps': 1694, 'loss/train': 2.1118886470794678} -09/20/2021 20:21:32 - INFO - __main__ - Step 27108: {'lr': 0.00019981875333075416, 'samples': 867456, 'steps': 1694, 'loss/train': 4.461817264556885} -09/20/2021 20:21:33 - INFO - __main__ - Step 27109: {'lr': 0.00019981875333075416, 'samples': 867488, 'steps': 1694, 'loss/train': 3.9625539779663086} -09/20/2021 20:21:33 - INFO - __main__ - Step 27110: {'lr': 0.00019981875333075416, 'samples': 867520, 'steps': 1694, 'loss/train': 4.010652542114258} -09/20/2021 20:21:34 - INFO - __main__ - Step 27111: {'lr': 0.00019981875333075416, 'samples': 867552, 'steps': 1694, 'loss/train': 2.336920976638794} -09/20/2021 20:21:35 - INFO - __main__ - Step 27112: {'lr': 0.00019981875333075416, 'samples': 867584, 'steps': 1694, 'loss/train': 3.336394786834717} -09/20/2021 20:21:36 - INFO - __main__ - Step 27113: {'lr': 0.00019981875333075416, 'samples': 867616, 'steps': 1694, 'loss/train': 2.4004242420196533} -09/20/2021 20:21:36 - INFO - __main__ - Step 27114: {'lr': 0.00019981875333075416, 'samples': 867648, 'steps': 1694, 'loss/train': 3.1657116413116455} -09/20/2021 20:21:37 - INFO - __main__ - Step 27115: {'lr': 0.00019981875333075416, 'samples': 867680, 'steps': 1694, 'loss/train': 2.7740299701690674} -09/20/2021 20:21:38 - INFO - __main__ - Step 27116: {'lr': 0.00019981875333075416, 'samples': 867712, 'steps': 1694, 'loss/train': 3.195652961730957} -09/20/2021 20:21:39 - INFO - __main__ - Step 27117: {'lr': 0.00019981875333075416, 'samples': 867744, 'steps': 1694, 'loss/train': 2.641608476638794} -09/20/2021 20:21:39 - INFO - __main__ - Step 27118: {'lr': 0.00019981875333075416, 'samples': 867776, 'steps': 1694, 'loss/train': 2.0586953163146973} -09/20/2021 20:21:40 - INFO - __main__ - Step 27119: {'lr': 0.00019981875333075416, 'samples': 867808, 'steps': 1694, 'loss/train': 2.8157026767730713} -09/20/2021 20:21:41 - INFO - __main__ - Step 27120: {'lr': 0.00019981875333075416, 'samples': 867840, 'steps': 1694, 'loss/train': 2.69124436378479} -09/20/2021 20:21:42 - INFO - __main__ - Step 27121: {'lr': 0.00019981836924653186, 'samples': 867872, 'steps': 1695, 'loss/train': 2.778848648071289} -09/20/2021 20:21:42 - INFO - __main__ - Step 27122: {'lr': 0.00019981836924653186, 'samples': 867904, 'steps': 1695, 'loss/train': 2.6726388931274414} -09/20/2021 20:21:43 - INFO - __main__ - Step 27123: {'lr': 0.00019981836924653186, 'samples': 867936, 'steps': 1695, 'loss/train': 3.002122640609741} -09/20/2021 20:21:44 - INFO - __main__ - Step 27124: {'lr': 0.00019981836924653186, 'samples': 867968, 'steps': 1695, 'loss/train': 2.96799373626709} -09/20/2021 20:21:45 - INFO - __main__ - Step 27125: {'lr': 0.00019981836924653186, 'samples': 868000, 'steps': 1695, 'loss/train': 2.350724458694458} -09/20/2021 20:21:45 - INFO - __main__ - Step 27126: {'lr': 0.00019981836924653186, 'samples': 868032, 'steps': 1695, 'loss/train': 2.3515608310699463} -09/20/2021 20:21:46 - INFO - __main__ - Step 27127: {'lr': 0.00019981836924653186, 'samples': 868064, 'steps': 1695, 'loss/train': 2.4964022636413574} -09/20/2021 20:21:47 - INFO - __main__ - Step 27128: {'lr': 0.00019981836924653186, 'samples': 868096, 'steps': 1695, 'loss/train': 3.099700689315796} -09/20/2021 20:21:48 - INFO - __main__ - Step 27129: {'lr': 0.00019981836924653186, 'samples': 868128, 'steps': 1695, 'loss/train': 2.3601760864257812} -09/20/2021 20:21:49 - INFO - __main__ - Step 27130: {'lr': 0.00019981836924653186, 'samples': 868160, 'steps': 1695, 'loss/train': 3.2018861770629883} -09/20/2021 20:21:50 - INFO - __main__ - Step 27131: {'lr': 0.00019981836924653186, 'samples': 868192, 'steps': 1695, 'loss/train': 6.018471717834473} -09/20/2021 20:21:51 - INFO - __main__ - Step 27132: {'lr': 0.00019981836924653186, 'samples': 868224, 'steps': 1695, 'loss/train': 6.000485897064209} -09/20/2021 20:21:51 - INFO - __main__ - Step 27133: {'lr': 0.00019981836924653186, 'samples': 868256, 'steps': 1695, 'loss/train': 6.306305408477783} -09/20/2021 20:21:52 - INFO - __main__ - Step 27134: {'lr': 0.00019981836924653186, 'samples': 868288, 'steps': 1695, 'loss/train': 3.735006332397461} -09/20/2021 20:21:53 - INFO - __main__ - Step 27135: {'lr': 0.00019981836924653186, 'samples': 868320, 'steps': 1695, 'loss/train': 3.8681540489196777} -09/20/2021 20:21:54 - INFO - __main__ - Step 27136: {'lr': 0.00019981836924653186, 'samples': 868352, 'steps': 1695, 'loss/train': 3.5811331272125244} -09/20/2021 20:21:54 - INFO - __main__ - Step 27137: {'lr': 0.00019981798475614897, 'samples': 868384, 'steps': 1696, 'loss/train': 3.2720627784729004} -09/20/2021 20:21:55 - INFO - __main__ - Step 27138: {'lr': 0.00019981798475614897, 'samples': 868416, 'steps': 1696, 'loss/train': 2.9751479625701904} -09/20/2021 20:21:56 - INFO - __main__ - Step 27139: {'lr': 0.00019981798475614897, 'samples': 868448, 'steps': 1696, 'loss/train': 2.7085721492767334} -09/20/2021 20:21:57 - INFO - __main__ - Step 27140: {'lr': 0.00019981798475614897, 'samples': 868480, 'steps': 1696, 'loss/train': 3.2886438369750977} -09/20/2021 20:21:57 - INFO - __main__ - Step 27141: {'lr': 0.00019981798475614897, 'samples': 868512, 'steps': 1696, 'loss/train': 3.1078336238861084} -09/20/2021 20:21:58 - INFO - __main__ - Step 27142: {'lr': 0.00019981798475614897, 'samples': 868544, 'steps': 1696, 'loss/train': 2.513390064239502} -09/20/2021 20:21:59 - INFO - __main__ - Step 27143: {'lr': 0.00019981798475614897, 'samples': 868576, 'steps': 1696, 'loss/train': 2.597140312194824} -09/20/2021 20:22:00 - INFO - __main__ - Step 27144: {'lr': 0.00019981798475614897, 'samples': 868608, 'steps': 1696, 'loss/train': 2.197559356689453} -09/20/2021 20:22:00 - INFO - __main__ - Step 27145: {'lr': 0.00019981798475614897, 'samples': 868640, 'steps': 1696, 'loss/train': 3.44128680229187} -09/20/2021 20:22:01 - INFO - __main__ - Step 27146: {'lr': 0.00019981798475614897, 'samples': 868672, 'steps': 1696, 'loss/train': 3.00211763381958} -09/20/2021 20:22:02 - INFO - __main__ - Step 27147: {'lr': 0.00019981798475614897, 'samples': 868704, 'steps': 1696, 'loss/train': 2.5872340202331543} -09/20/2021 20:22:03 - INFO - __main__ - Step 27148: {'lr': 0.00019981798475614897, 'samples': 868736, 'steps': 1696, 'loss/train': 3.7220911979675293} -09/20/2021 20:22:03 - INFO - __main__ - Step 27149: {'lr': 0.00019981798475614897, 'samples': 868768, 'steps': 1696, 'loss/train': 2.1995532512664795} -09/20/2021 20:22:04 - INFO - __main__ - Step 27150: {'lr': 0.00019981798475614897, 'samples': 868800, 'steps': 1696, 'loss/train': 3.4996285438537598} -09/20/2021 20:22:05 - INFO - __main__ - Step 27151: {'lr': 0.00019981798475614897, 'samples': 868832, 'steps': 1696, 'loss/train': 2.507087469100952} -09/20/2021 20:22:06 - INFO - __main__ - Step 27152: {'lr': 0.00019981798475614897, 'samples': 868864, 'steps': 1696, 'loss/train': 3.0632803440093994} -09/20/2021 20:22:07 - INFO - __main__ - Step 27153: {'lr': 0.0001998175998596071, 'samples': 868896, 'steps': 1697, 'loss/train': 3.514273166656494} -09/20/2021 20:22:07 - INFO - __main__ - Step 27154: {'lr': 0.0001998175998596071, 'samples': 868928, 'steps': 1697, 'loss/train': 2.871851682662964} -09/20/2021 20:22:08 - INFO - __main__ - Step 27155: {'lr': 0.0001998175998596071, 'samples': 868960, 'steps': 1697, 'loss/train': 2.658554792404175} -09/20/2021 20:22:09 - INFO - __main__ - Step 27156: {'lr': 0.0001998175998596071, 'samples': 868992, 'steps': 1697, 'loss/train': 1.3640226125717163} -09/20/2021 20:22:10 - INFO - __main__ - Step 27157: {'lr': 0.0001998175998596071, 'samples': 869024, 'steps': 1697, 'loss/train': 1.5392658710479736} -09/20/2021 20:22:10 - INFO - __main__ - Step 27158: {'lr': 0.0001998175998596071, 'samples': 869056, 'steps': 1697, 'loss/train': 2.987741231918335} -09/20/2021 20:22:11 - INFO - __main__ - Step 27159: {'lr': 0.0001998175998596071, 'samples': 869088, 'steps': 1697, 'loss/train': 2.9620046615600586} -09/20/2021 20:22:12 - INFO - __main__ - Step 27160: {'lr': 0.0001998175998596071, 'samples': 869120, 'steps': 1697, 'loss/train': 2.9535133838653564} -09/20/2021 20:22:13 - INFO - __main__ - Step 27161: {'lr': 0.0001998175998596071, 'samples': 869152, 'steps': 1697, 'loss/train': 2.5481679439544678} -09/20/2021 20:22:13 - INFO - __main__ - Step 27162: {'lr': 0.0001998175998596071, 'samples': 869184, 'steps': 1697, 'loss/train': 3.1589839458465576} -09/20/2021 20:22:14 - INFO - __main__ - Step 27163: {'lr': 0.0001998175998596071, 'samples': 869216, 'steps': 1697, 'loss/train': 3.1724746227264404} -09/20/2021 20:22:15 - INFO - __main__ - Step 27164: {'lr': 0.0001998175998596071, 'samples': 869248, 'steps': 1697, 'loss/train': 2.8933234214782715} -09/20/2021 20:22:16 - INFO - __main__ - Step 27165: {'lr': 0.0001998175998596071, 'samples': 869280, 'steps': 1697, 'loss/train': 1.038644790649414} -09/20/2021 20:22:17 - INFO - __main__ - Step 27166: {'lr': 0.0001998175998596071, 'samples': 869312, 'steps': 1697, 'loss/train': 3.047743320465088} -09/20/2021 20:22:18 - INFO - __main__ - Step 27167: {'lr': 0.0001998175998596071, 'samples': 869344, 'steps': 1697, 'loss/train': 0.6900492310523987} -09/20/2021 20:22:18 - INFO - __main__ - Step 27168: {'lr': 0.0001998175998596071, 'samples': 869376, 'steps': 1697, 'loss/train': 2.7703254222869873} -09/20/2021 20:22:19 - INFO - __main__ - Step 27169: {'lr': 0.0001998172145569078, 'samples': 869408, 'steps': 1698, 'loss/train': 3.125065326690674} -09/20/2021 20:22:20 - INFO - __main__ - Step 27170: {'lr': 0.0001998172145569078, 'samples': 869440, 'steps': 1698, 'loss/train': 4.179402828216553} -09/20/2021 20:22:21 - INFO - __main__ - Step 27171: {'lr': 0.0001998172145569078, 'samples': 869472, 'steps': 1698, 'loss/train': 3.0282139778137207} -09/20/2021 20:22:22 - INFO - __main__ - Step 27172: {'lr': 0.0001998172145569078, 'samples': 869504, 'steps': 1698, 'loss/train': 2.779757261276245} -09/20/2021 20:22:22 - INFO - __main__ - Step 27173: {'lr': 0.0001998172145569078, 'samples': 869536, 'steps': 1698, 'loss/train': 2.5754787921905518} -09/20/2021 20:22:23 - INFO - __main__ - Step 27174: {'lr': 0.0001998172145569078, 'samples': 869568, 'steps': 1698, 'loss/train': 2.567739963531494} -09/20/2021 20:22:24 - INFO - __main__ - Step 27175: {'lr': 0.0001998172145569078, 'samples': 869600, 'steps': 1698, 'loss/train': 3.198359489440918} -09/20/2021 20:22:25 - INFO - __main__ - Step 27176: {'lr': 0.0001998172145569078, 'samples': 869632, 'steps': 1698, 'loss/train': 2.862372636795044} -09/20/2021 20:22:25 - INFO - __main__ - Step 27177: {'lr': 0.0001998172145569078, 'samples': 869664, 'steps': 1698, 'loss/train': 2.406611680984497} -09/20/2021 20:22:26 - INFO - __main__ - Step 27178: {'lr': 0.0001998172145569078, 'samples': 869696, 'steps': 1698, 'loss/train': 3.6397013664245605} -09/20/2021 20:22:27 - INFO - __main__ - Step 27179: {'lr': 0.0001998172145569078, 'samples': 869728, 'steps': 1698, 'loss/train': 2.431882381439209} -09/20/2021 20:22:28 - INFO - __main__ - Step 27180: {'lr': 0.0001998172145569078, 'samples': 869760, 'steps': 1698, 'loss/train': 3.288662910461426} -09/20/2021 20:22:28 - INFO - __main__ - Step 27181: {'lr': 0.0001998172145569078, 'samples': 869792, 'steps': 1698, 'loss/train': 2.5015151500701904} -09/20/2021 20:22:29 - INFO - __main__ - Step 27182: {'lr': 0.0001998172145569078, 'samples': 869824, 'steps': 1698, 'loss/train': 3.6160666942596436} -09/20/2021 20:22:30 - INFO - __main__ - Step 27183: {'lr': 0.0001998172145569078, 'samples': 869856, 'steps': 1698, 'loss/train': 2.7962892055511475} -09/20/2021 20:22:31 - INFO - __main__ - Step 27184: {'lr': 0.0001998172145569078, 'samples': 869888, 'steps': 1698, 'loss/train': 1.5143007040023804} -09/20/2021 20:22:31 - INFO - __main__ - Step 27185: {'lr': 0.00019981682884805265, 'samples': 869920, 'steps': 1699, 'loss/train': 4.074533939361572} -09/20/2021 20:22:32 - INFO - __main__ - Step 27186: {'lr': 0.00019981682884805265, 'samples': 869952, 'steps': 1699, 'loss/train': 2.2481138706207275} -09/20/2021 20:22:33 - INFO - __main__ - Step 27187: {'lr': 0.00019981682884805265, 'samples': 869984, 'steps': 1699, 'loss/train': 2.2993569374084473} -09/20/2021 20:22:34 - INFO - __main__ - Step 27188: {'lr': 0.00019981682884805265, 'samples': 870016, 'steps': 1699, 'loss/train': 1.9129465818405151} -09/20/2021 20:22:34 - INFO - __main__ - Step 27189: {'lr': 0.00019981682884805265, 'samples': 870048, 'steps': 1699, 'loss/train': 2.2288925647735596} -09/20/2021 20:22:35 - INFO - __main__ - Step 27190: {'lr': 0.00019981682884805265, 'samples': 870080, 'steps': 1699, 'loss/train': 2.5289876461029053} -09/20/2021 20:22:36 - INFO - __main__ - Step 27191: {'lr': 0.00019981682884805265, 'samples': 870112, 'steps': 1699, 'loss/train': 1.1338422298431396} -09/20/2021 20:22:37 - INFO - __main__ - Step 27192: {'lr': 0.00019981682884805265, 'samples': 870144, 'steps': 1699, 'loss/train': 3.1833391189575195} -09/20/2021 20:22:37 - INFO - __main__ - Step 27193: {'lr': 0.00019981682884805265, 'samples': 870176, 'steps': 1699, 'loss/train': 2.9589312076568604} -09/20/2021 20:22:38 - INFO - __main__ - Step 27194: {'lr': 0.00019981682884805265, 'samples': 870208, 'steps': 1699, 'loss/train': 2.8609609603881836} -09/20/2021 20:22:39 - INFO - __main__ - Step 27195: {'lr': 0.00019981682884805265, 'samples': 870240, 'steps': 1699, 'loss/train': 2.937018394470215} -09/20/2021 20:22:40 - INFO - __main__ - Step 27196: {'lr': 0.00019981682884805265, 'samples': 870272, 'steps': 1699, 'loss/train': 2.466038942337036} -09/20/2021 20:22:40 - INFO - __main__ - Step 27197: {'lr': 0.00019981682884805265, 'samples': 870304, 'steps': 1699, 'loss/train': 2.725161552429199} -09/20/2021 20:22:42 - INFO - __main__ - Step 27198: {'lr': 0.00019981682884805265, 'samples': 870336, 'steps': 1699, 'loss/train': 2.951072931289673} -09/20/2021 20:22:43 - INFO - __main__ - Step 27199: {'lr': 0.00019981682884805265, 'samples': 870368, 'steps': 1699, 'loss/train': 2.4532032012939453} -09/20/2021 20:22:43 - INFO - __main__ - Step 27200: {'lr': 0.00019981682884805265, 'samples': 870400, 'steps': 1699, 'loss/train': 2.4001243114471436} -09/20/2021 20:22:44 - INFO - __main__ - Step 27201: {'lr': 0.00019981644273304322, 'samples': 870432, 'steps': 1700, 'loss/train': 2.3626556396484375} -09/20/2021 20:22:45 - INFO - __main__ - Step 27202: {'lr': 0.00019981644273304322, 'samples': 870464, 'steps': 1700, 'loss/train': 3.6553940773010254} -09/20/2021 20:22:46 - INFO - __main__ - Step 27203: {'lr': 0.00019981644273304322, 'samples': 870496, 'steps': 1700, 'loss/train': 2.239748954772949} -09/20/2021 20:22:47 - INFO - __main__ - Step 27204: {'lr': 0.00019981644273304322, 'samples': 870528, 'steps': 1700, 'loss/train': 2.7272021770477295} -09/20/2021 20:22:47 - INFO - __main__ - Step 27205: {'lr': 0.00019981644273304322, 'samples': 870560, 'steps': 1700, 'loss/train': 2.274003028869629} -09/20/2021 20:22:48 - INFO - __main__ - Step 27206: {'lr': 0.00019981644273304322, 'samples': 870592, 'steps': 1700, 'loss/train': 3.9837756156921387} -09/20/2021 20:22:49 - INFO - __main__ - Step 27207: {'lr': 0.00019981644273304322, 'samples': 870624, 'steps': 1700, 'loss/train': 2.636730432510376} -09/20/2021 20:22:50 - INFO - __main__ - Step 27208: {'lr': 0.00019981644273304322, 'samples': 870656, 'steps': 1700, 'loss/train': 2.4846413135528564} -09/20/2021 20:22:50 - INFO - __main__ - Step 27209: {'lr': 0.00019981644273304322, 'samples': 870688, 'steps': 1700, 'loss/train': 3.4354841709136963} -09/20/2021 20:22:51 - INFO - __main__ - Step 27210: {'lr': 0.00019981644273304322, 'samples': 870720, 'steps': 1700, 'loss/train': 2.012289047241211} -09/20/2021 20:22:52 - INFO - __main__ - Step 27211: {'lr': 0.00019981644273304322, 'samples': 870752, 'steps': 1700, 'loss/train': 2.310668706893921} -09/20/2021 20:22:53 - INFO - __main__ - Step 27212: {'lr': 0.00019981644273304322, 'samples': 870784, 'steps': 1700, 'loss/train': 1.7811963558197021} -09/20/2021 20:22:53 - INFO - __main__ - Step 27213: {'lr': 0.00019981644273304322, 'samples': 870816, 'steps': 1700, 'loss/train': 2.8980634212493896} -09/20/2021 20:22:54 - INFO - __main__ - Step 27214: {'lr': 0.00019981644273304322, 'samples': 870848, 'steps': 1700, 'loss/train': 2.7028608322143555} -09/20/2021 20:22:55 - INFO - __main__ - Step 27215: {'lr': 0.00019981644273304322, 'samples': 870880, 'steps': 1700, 'loss/train': 2.379495620727539} -09/20/2021 20:22:56 - INFO - __main__ - Step 27216: {'lr': 0.00019981644273304322, 'samples': 870912, 'steps': 1700, 'loss/train': 3.672579526901245} -09/20/2021 20:22:56 - INFO - __main__ - Step 27217: {'lr': 0.00019981605621188106, 'samples': 870944, 'steps': 1701, 'loss/train': 3.0194504261016846} -09/20/2021 20:22:57 - INFO - __main__ - Step 27218: {'lr': 0.00019981605621188106, 'samples': 870976, 'steps': 1701, 'loss/train': 2.8996150493621826} -09/20/2021 20:22:58 - INFO - __main__ - Step 27219: {'lr': 0.00019981605621188106, 'samples': 871008, 'steps': 1701, 'loss/train': 3.2232089042663574} -09/20/2021 20:22:59 - INFO - __main__ - Step 27220: {'lr': 0.00019981605621188106, 'samples': 871040, 'steps': 1701, 'loss/train': 3.4603641033172607} -09/20/2021 20:22:59 - INFO - __main__ - Step 27221: {'lr': 0.00019981605621188106, 'samples': 871072, 'steps': 1701, 'loss/train': 3.03505539894104} -09/20/2021 20:23:00 - INFO - __main__ - Step 27222: {'lr': 0.00019981605621188106, 'samples': 871104, 'steps': 1701, 'loss/train': 3.6549251079559326} -09/20/2021 20:23:01 - INFO - __main__ - Step 27223: {'lr': 0.00019981605621188106, 'samples': 871136, 'steps': 1701, 'loss/train': 3.5903432369232178} -09/20/2021 20:23:02 - INFO - __main__ - Step 27224: {'lr': 0.00019981605621188106, 'samples': 871168, 'steps': 1701, 'loss/train': 3.838245153427124} -09/20/2021 20:23:02 - INFO - __main__ - Step 27225: {'lr': 0.00019981605621188106, 'samples': 871200, 'steps': 1701, 'loss/train': 2.6731343269348145} -09/20/2021 20:23:03 - INFO - __main__ - Step 27226: {'lr': 0.00019981605621188106, 'samples': 871232, 'steps': 1701, 'loss/train': 2.748828411102295} -09/20/2021 20:23:04 - INFO - __main__ - Step 27227: {'lr': 0.00019981605621188106, 'samples': 871264, 'steps': 1701, 'loss/train': 1.2734681367874146} -09/20/2021 20:23:05 - INFO - __main__ - Step 27228: {'lr': 0.00019981605621188106, 'samples': 871296, 'steps': 1701, 'loss/train': 2.710587501525879} -09/20/2021 20:23:06 - INFO - __main__ - Step 27229: {'lr': 0.00019981605621188106, 'samples': 871328, 'steps': 1701, 'loss/train': 3.136484384536743} -09/20/2021 20:23:07 - INFO - __main__ - Step 27230: {'lr': 0.00019981605621188106, 'samples': 871360, 'steps': 1701, 'loss/train': 2.598999261856079} -09/20/2021 20:23:07 - INFO - __main__ - Step 27231: {'lr': 0.00019981605621188106, 'samples': 871392, 'steps': 1701, 'loss/train': 3.2122297286987305} -09/20/2021 20:23:08 - INFO - __main__ - Step 27232: {'lr': 0.00019981605621188106, 'samples': 871424, 'steps': 1701, 'loss/train': 2.9405956268310547} -09/20/2021 20:23:09 - INFO - __main__ - Step 27233: {'lr': 0.00019981566928456773, 'samples': 871456, 'steps': 1702, 'loss/train': 2.374997138977051} -09/20/2021 20:23:10 - INFO - __main__ - Step 27234: {'lr': 0.00019981566928456773, 'samples': 871488, 'steps': 1702, 'loss/train': 2.688166856765747} -09/20/2021 20:23:11 - INFO - __main__ - Step 27235: {'lr': 0.00019981566928456773, 'samples': 871520, 'steps': 1702, 'loss/train': 2.5900394916534424} -09/20/2021 20:23:11 - INFO - __main__ - Step 27236: {'lr': 0.00019981566928456773, 'samples': 871552, 'steps': 1702, 'loss/train': 2.748692750930786} -09/20/2021 20:23:12 - INFO - __main__ - Step 27237: {'lr': 0.00019981566928456773, 'samples': 871584, 'steps': 1702, 'loss/train': 3.256671190261841} -09/20/2021 20:23:13 - INFO - __main__ - Step 27238: {'lr': 0.00019981566928456773, 'samples': 871616, 'steps': 1702, 'loss/train': 2.3001632690429688} -09/20/2021 20:23:14 - INFO - __main__ - Step 27239: {'lr': 0.00019981566928456773, 'samples': 871648, 'steps': 1702, 'loss/train': 2.7765960693359375} -09/20/2021 20:23:14 - INFO - __main__ - Step 27240: {'lr': 0.00019981566928456773, 'samples': 871680, 'steps': 1702, 'loss/train': 3.4377927780151367} -09/20/2021 20:23:15 - INFO - __main__ - Step 27241: {'lr': 0.00019981566928456773, 'samples': 871712, 'steps': 1702, 'loss/train': 2.6983532905578613} -09/20/2021 20:23:16 - INFO - __main__ - Step 27242: {'lr': 0.00019981566928456773, 'samples': 871744, 'steps': 1702, 'loss/train': 3.159761667251587} -09/20/2021 20:23:17 - INFO - __main__ - Step 27243: {'lr': 0.00019981566928456773, 'samples': 871776, 'steps': 1702, 'loss/train': 3.2216403484344482} -09/20/2021 20:23:17 - INFO - __main__ - Step 27244: {'lr': 0.00019981566928456773, 'samples': 871808, 'steps': 1702, 'loss/train': 2.70896577835083} -09/20/2021 20:23:18 - INFO - __main__ - Step 27245: {'lr': 0.00019981566928456773, 'samples': 871840, 'steps': 1702, 'loss/train': 2.4797520637512207} -09/20/2021 20:23:19 - INFO - __main__ - Step 27246: {'lr': 0.00019981566928456773, 'samples': 871872, 'steps': 1702, 'loss/train': 3.105456829071045} -09/20/2021 20:23:20 - INFO - __main__ - Step 27247: {'lr': 0.00019981566928456773, 'samples': 871904, 'steps': 1702, 'loss/train': 3.287012815475464} -09/20/2021 20:23:20 - INFO - __main__ - Step 27248: {'lr': 0.00019981566928456773, 'samples': 871936, 'steps': 1702, 'loss/train': 2.9844210147857666} -09/20/2021 20:23:21 - INFO - __main__ - Step 27249: {'lr': 0.00019981528195110485, 'samples': 871968, 'steps': 1703, 'loss/train': 1.6117584705352783} -09/20/2021 20:23:22 - INFO - __main__ - Step 27250: {'lr': 0.00019981528195110485, 'samples': 872000, 'steps': 1703, 'loss/train': 3.546898126602173} -09/20/2021 20:23:23 - INFO - __main__ - Step 27251: {'lr': 0.00019981528195110485, 'samples': 872032, 'steps': 1703, 'loss/train': 2.5277059078216553} -09/20/2021 20:23:23 - INFO - __main__ - Step 27252: {'lr': 0.00019981528195110485, 'samples': 872064, 'steps': 1703, 'loss/train': 2.7469871044158936} -09/20/2021 20:23:24 - INFO - __main__ - Step 27253: {'lr': 0.00019981528195110485, 'samples': 872096, 'steps': 1703, 'loss/train': 2.3546597957611084} -09/20/2021 20:23:25 - INFO - __main__ - Step 27254: {'lr': 0.00019981528195110485, 'samples': 872128, 'steps': 1703, 'loss/train': 3.291139602661133} -09/20/2021 20:23:26 - INFO - __main__ - Step 27255: {'lr': 0.00019981528195110485, 'samples': 872160, 'steps': 1703, 'loss/train': 3.227823257446289} -09/20/2021 20:23:26 - INFO - __main__ - Step 27256: {'lr': 0.00019981528195110485, 'samples': 872192, 'steps': 1703, 'loss/train': 2.6354458332061768} -09/20/2021 20:23:27 - INFO - __main__ - Step 27257: {'lr': 0.00019981528195110485, 'samples': 872224, 'steps': 1703, 'loss/train': 2.451195478439331} -09/20/2021 20:23:28 - INFO - __main__ - Step 27258: {'lr': 0.00019981528195110485, 'samples': 872256, 'steps': 1703, 'loss/train': 3.2640538215637207} -09/20/2021 20:23:29 - INFO - __main__ - Step 27259: {'lr': 0.00019981528195110485, 'samples': 872288, 'steps': 1703, 'loss/train': 3.50321626663208} -09/20/2021 20:23:30 - INFO - __main__ - Step 27260: {'lr': 0.00019981528195110485, 'samples': 872320, 'steps': 1703, 'loss/train': 3.633216142654419} -09/20/2021 20:23:31 - INFO - __main__ - Step 27261: {'lr': 0.00019981528195110485, 'samples': 872352, 'steps': 1703, 'loss/train': 2.539879560470581} -09/20/2021 20:23:32 - INFO - __main__ - Step 27262: {'lr': 0.00019981528195110485, 'samples': 872384, 'steps': 1703, 'loss/train': 3.8006670475006104} -09/20/2021 20:23:33 - INFO - __main__ - Step 27263: {'lr': 0.00019981528195110485, 'samples': 872416, 'steps': 1703, 'loss/train': 2.1060304641723633} -09/20/2021 20:23:33 - INFO - __main__ - Step 27264: {'lr': 0.00019981528195110485, 'samples': 872448, 'steps': 1703, 'loss/train': 2.5370190143585205} -09/20/2021 20:23:34 - INFO - __main__ - Step 27265: {'lr': 0.000199814894211494, 'samples': 872480, 'steps': 1704, 'loss/train': 3.6393990516662598} -09/20/2021 20:23:35 - INFO - __main__ - Step 27266: {'lr': 0.000199814894211494, 'samples': 872512, 'steps': 1704, 'loss/train': 1.8730309009552002} -09/20/2021 20:23:36 - INFO - __main__ - Step 27267: {'lr': 0.000199814894211494, 'samples': 872544, 'steps': 1704, 'loss/train': 2.8927013874053955} -09/20/2021 20:23:36 - INFO - __main__ - Step 27268: {'lr': 0.000199814894211494, 'samples': 872576, 'steps': 1704, 'loss/train': 2.6866466999053955} -09/20/2021 20:23:37 - INFO - __main__ - Step 27269: {'lr': 0.000199814894211494, 'samples': 872608, 'steps': 1704, 'loss/train': 1.8967338800430298} -09/20/2021 20:23:38 - INFO - __main__ - Step 27270: {'lr': 0.000199814894211494, 'samples': 872640, 'steps': 1704, 'loss/train': 2.5667076110839844} -09/20/2021 20:23:39 - INFO - __main__ - Step 27271: {'lr': 0.000199814894211494, 'samples': 872672, 'steps': 1704, 'loss/train': 1.7520592212677002} -09/20/2021 20:23:39 - INFO - __main__ - Step 27272: {'lr': 0.000199814894211494, 'samples': 872704, 'steps': 1704, 'loss/train': 2.2742867469787598} -09/20/2021 20:23:40 - INFO - __main__ - Step 27273: {'lr': 0.000199814894211494, 'samples': 872736, 'steps': 1704, 'loss/train': 3.083644390106201} -09/20/2021 20:23:41 - INFO - __main__ - Step 27274: {'lr': 0.000199814894211494, 'samples': 872768, 'steps': 1704, 'loss/train': 2.4333832263946533} -09/20/2021 20:23:42 - INFO - __main__ - Step 27275: {'lr': 0.000199814894211494, 'samples': 872800, 'steps': 1704, 'loss/train': 2.186960220336914} -09/20/2021 20:23:42 - INFO - __main__ - Step 27276: {'lr': 0.000199814894211494, 'samples': 872832, 'steps': 1704, 'loss/train': 2.7254958152770996} -09/20/2021 20:23:43 - INFO - __main__ - Step 27277: {'lr': 0.000199814894211494, 'samples': 872864, 'steps': 1704, 'loss/train': 2.440382957458496} -09/20/2021 20:23:44 - INFO - __main__ - Step 27278: {'lr': 0.000199814894211494, 'samples': 872896, 'steps': 1704, 'loss/train': 3.2311975955963135} -09/20/2021 20:23:45 - INFO - __main__ - Step 27279: {'lr': 0.000199814894211494, 'samples': 872928, 'steps': 1704, 'loss/train': 1.8097114562988281} -09/20/2021 20:23:45 - INFO - __main__ - Step 27280: {'lr': 0.000199814894211494, 'samples': 872960, 'steps': 1704, 'loss/train': 5.050098419189453} -09/20/2021 20:23:46 - INFO - __main__ - Step 27281: {'lr': 0.00019981450606573671, 'samples': 872992, 'steps': 1705, 'loss/train': 2.871762752532959} -09/20/2021 20:23:47 - INFO - __main__ - Step 27282: {'lr': 0.00019981450606573671, 'samples': 873024, 'steps': 1705, 'loss/train': 2.7656548023223877} -09/20/2021 20:23:48 - INFO - __main__ - Step 27283: {'lr': 0.00019981450606573671, 'samples': 873056, 'steps': 1705, 'loss/train': 1.5461708307266235} -09/20/2021 20:23:49 - INFO - __main__ - Step 27284: {'lr': 0.00019981450606573671, 'samples': 873088, 'steps': 1705, 'loss/train': 1.298852801322937} -09/20/2021 20:23:49 - INFO - __main__ - Step 27285: {'lr': 0.00019981450606573671, 'samples': 873120, 'steps': 1705, 'loss/train': 1.330500841140747} -09/20/2021 20:23:50 - INFO - __main__ - Step 27286: {'lr': 0.00019981450606573671, 'samples': 873152, 'steps': 1705, 'loss/train': 1.1796021461486816} -09/20/2021 20:23:51 - INFO - __main__ - Step 27287: {'lr': 0.00019981450606573671, 'samples': 873184, 'steps': 1705, 'loss/train': 1.9595133066177368} -09/20/2021 20:23:52 - INFO - __main__ - Step 27288: {'lr': 0.00019981450606573671, 'samples': 873216, 'steps': 1705, 'loss/train': 1.3267230987548828} -09/20/2021 20:23:52 - INFO - __main__ - Step 27289: {'lr': 0.00019981450606573671, 'samples': 873248, 'steps': 1705, 'loss/train': 1.525512933731079} -09/20/2021 20:23:53 - INFO - __main__ - Step 27290: {'lr': 0.00019981450606573671, 'samples': 873280, 'steps': 1705, 'loss/train': 2.324105978012085} -09/20/2021 20:23:54 - INFO - __main__ - Step 27291: {'lr': 0.00019981450606573671, 'samples': 873312, 'steps': 1705, 'loss/train': 2.5627758502960205} -09/20/2021 20:23:55 - INFO - __main__ - Step 27292: {'lr': 0.00019981450606573671, 'samples': 873344, 'steps': 1705, 'loss/train': 3.197892427444458} -09/20/2021 20:23:55 - INFO - __main__ - Step 27293: {'lr': 0.00019981450606573671, 'samples': 873376, 'steps': 1705, 'loss/train': 2.889270305633545} -09/20/2021 20:23:56 - INFO - __main__ - Step 27294: {'lr': 0.00019981450606573671, 'samples': 873408, 'steps': 1705, 'loss/train': 2.486388921737671} -09/20/2021 20:23:57 - INFO - __main__ - Step 27295: {'lr': 0.00019981450606573671, 'samples': 873440, 'steps': 1705, 'loss/train': 2.5243306159973145} -09/20/2021 20:23:58 - INFO - __main__ - Step 27296: {'lr': 0.00019981450606573671, 'samples': 873472, 'steps': 1705, 'loss/train': 3.4489808082580566} -09/20/2021 20:23:59 - INFO - __main__ - Step 27297: {'lr': 0.00019981411751383458, 'samples': 873504, 'steps': 1706, 'loss/train': 2.4540698528289795} -09/20/2021 20:24:00 - INFO - __main__ - Step 27298: {'lr': 0.00019981411751383458, 'samples': 873536, 'steps': 1706, 'loss/train': 1.6959915161132812} -09/20/2021 20:24:00 - INFO - __main__ - Step 27299: {'lr': 0.00019981411751383458, 'samples': 873568, 'steps': 1706, 'loss/train': 2.0884275436401367} -09/20/2021 20:24:01 - INFO - __main__ - Step 27300: {'lr': 0.00019981411751383458, 'samples': 873600, 'steps': 1706, 'loss/train': 3.130749464035034} -09/20/2021 20:24:02 - INFO - __main__ - Step 27301: {'lr': 0.00019981411751383458, 'samples': 873632, 'steps': 1706, 'loss/train': 2.851208448410034} -09/20/2021 20:24:03 - INFO - __main__ - Step 27302: {'lr': 0.00019981411751383458, 'samples': 873664, 'steps': 1706, 'loss/train': 3.3258750438690186} -09/20/2021 20:24:04 - INFO - __main__ - Step 27303: {'lr': 0.00019981411751383458, 'samples': 873696, 'steps': 1706, 'loss/train': 3.7912280559539795} -09/20/2021 20:24:04 - INFO - __main__ - Step 27304: {'lr': 0.00019981411751383458, 'samples': 873728, 'steps': 1706, 'loss/train': 2.2700889110565186} -09/20/2021 20:24:05 - INFO - __main__ - Step 27305: {'lr': 0.00019981411751383458, 'samples': 873760, 'steps': 1706, 'loss/train': 3.5956907272338867} -09/20/2021 20:24:06 - INFO - __main__ - Step 27306: {'lr': 0.00019981411751383458, 'samples': 873792, 'steps': 1706, 'loss/train': 3.1394739151000977} -09/20/2021 20:24:07 - INFO - __main__ - Step 27307: {'lr': 0.00019981411751383458, 'samples': 873824, 'steps': 1706, 'loss/train': 3.3232293128967285} -09/20/2021 20:24:07 - INFO - __main__ - Step 27308: {'lr': 0.00019981411751383458, 'samples': 873856, 'steps': 1706, 'loss/train': 3.5393295288085938} -09/20/2021 20:24:08 - INFO - __main__ - Step 27309: {'lr': 0.00019981411751383458, 'samples': 873888, 'steps': 1706, 'loss/train': 3.3094348907470703} -09/20/2021 20:24:09 - INFO - __main__ - Step 27310: {'lr': 0.00019981411751383458, 'samples': 873920, 'steps': 1706, 'loss/train': 2.813857316970825} -09/20/2021 20:24:10 - INFO - __main__ - Step 27311: {'lr': 0.00019981411751383458, 'samples': 873952, 'steps': 1706, 'loss/train': 2.3339788913726807} -09/20/2021 20:24:10 - INFO - __main__ - Step 27312: {'lr': 0.00019981411751383458, 'samples': 873984, 'steps': 1706, 'loss/train': 2.9656670093536377} -09/20/2021 20:24:11 - INFO - __main__ - Step 27313: {'lr': 0.0001998137285557892, 'samples': 874016, 'steps': 1707, 'loss/train': 3.0877368450164795} -09/20/2021 20:24:12 - INFO - __main__ - Step 27314: {'lr': 0.0001998137285557892, 'samples': 874048, 'steps': 1707, 'loss/train': 2.342784881591797} -09/20/2021 20:24:13 - INFO - __main__ - Step 27315: {'lr': 0.0001998137285557892, 'samples': 874080, 'steps': 1707, 'loss/train': 2.3904824256896973} -09/20/2021 20:24:13 - INFO - __main__ - Step 27316: {'lr': 0.0001998137285557892, 'samples': 874112, 'steps': 1707, 'loss/train': 2.1226487159729004} -09/20/2021 20:24:14 - INFO - __main__ - Step 27317: {'lr': 0.0001998137285557892, 'samples': 874144, 'steps': 1707, 'loss/train': 2.6737451553344727} -09/20/2021 20:24:15 - INFO - __main__ - Step 27318: {'lr': 0.0001998137285557892, 'samples': 874176, 'steps': 1707, 'loss/train': 2.934999942779541} -09/20/2021 20:24:16 - INFO - __main__ - Step 27319: {'lr': 0.0001998137285557892, 'samples': 874208, 'steps': 1707, 'loss/train': 3.303380250930786} -09/20/2021 20:24:16 - INFO - __main__ - Step 27320: {'lr': 0.0001998137285557892, 'samples': 874240, 'steps': 1707, 'loss/train': 2.68395733833313} -09/20/2021 20:24:17 - INFO - __main__ - Step 27321: {'lr': 0.0001998137285557892, 'samples': 874272, 'steps': 1707, 'loss/train': 2.643263578414917} -09/20/2021 20:24:18 - INFO - __main__ - Step 27322: {'lr': 0.0001998137285557892, 'samples': 874304, 'steps': 1707, 'loss/train': 1.7364838123321533} -09/20/2021 20:24:19 - INFO - __main__ - Step 27323: {'lr': 0.0001998137285557892, 'samples': 874336, 'steps': 1707, 'loss/train': 3.0268661975860596} -09/20/2021 20:24:19 - INFO - __main__ - Step 27324: {'lr': 0.0001998137285557892, 'samples': 874368, 'steps': 1707, 'loss/train': 2.443357229232788} -09/20/2021 20:24:20 - INFO - __main__ - Step 27325: {'lr': 0.0001998137285557892, 'samples': 874400, 'steps': 1707, 'loss/train': 2.7985951900482178} -09/20/2021 20:24:22 - INFO - __main__ - Step 27326: {'lr': 0.0001998137285557892, 'samples': 874432, 'steps': 1707, 'loss/train': 2.6349587440490723} -09/20/2021 20:24:22 - INFO - __main__ - Step 27327: {'lr': 0.0001998137285557892, 'samples': 874464, 'steps': 1707, 'loss/train': 2.324913740158081} -09/20/2021 20:24:23 - INFO - __main__ - Step 27328: {'lr': 0.0001998137285557892, 'samples': 874496, 'steps': 1707, 'loss/train': 2.84261417388916} -09/20/2021 20:24:24 - INFO - __main__ - Step 27329: {'lr': 0.00019981333919160215, 'samples': 874528, 'steps': 1708, 'loss/train': 2.610506296157837} -09/20/2021 20:24:25 - INFO - __main__ - Step 27330: {'lr': 0.00019981333919160215, 'samples': 874560, 'steps': 1708, 'loss/train': 2.6534361839294434} -09/20/2021 20:24:25 - INFO - __main__ - Step 27331: {'lr': 0.00019981333919160215, 'samples': 874592, 'steps': 1708, 'loss/train': 2.799665689468384} -09/20/2021 20:24:26 - INFO - __main__ - Step 27332: {'lr': 0.00019981333919160215, 'samples': 874624, 'steps': 1708, 'loss/train': 2.2325119972229004} -09/20/2021 20:24:27 - INFO - __main__ - Step 27333: {'lr': 0.00019981333919160215, 'samples': 874656, 'steps': 1708, 'loss/train': 3.3665382862091064} -09/20/2021 20:24:28 - INFO - __main__ - Step 27334: {'lr': 0.00019981333919160215, 'samples': 874688, 'steps': 1708, 'loss/train': 2.997678756713867} -09/20/2021 20:24:28 - INFO - __main__ - Step 27335: {'lr': 0.00019981333919160215, 'samples': 874720, 'steps': 1708, 'loss/train': 2.6618573665618896} -09/20/2021 20:24:29 - INFO - __main__ - Step 27336: {'lr': 0.00019981333919160215, 'samples': 874752, 'steps': 1708, 'loss/train': 1.9122190475463867} -09/20/2021 20:24:30 - INFO - __main__ - Step 27337: {'lr': 0.00019981333919160215, 'samples': 874784, 'steps': 1708, 'loss/train': 2.774423360824585} -09/20/2021 20:24:31 - INFO - __main__ - Step 27338: {'lr': 0.00019981333919160215, 'samples': 874816, 'steps': 1708, 'loss/train': 3.0615651607513428} -09/20/2021 20:24:31 - INFO - __main__ - Step 27339: {'lr': 0.00019981333919160215, 'samples': 874848, 'steps': 1708, 'loss/train': 1.8153367042541504} -09/20/2021 20:24:32 - INFO - __main__ - Step 27340: {'lr': 0.00019981333919160215, 'samples': 874880, 'steps': 1708, 'loss/train': 2.9155519008636475} -09/20/2021 20:24:33 - INFO - __main__ - Step 27341: {'lr': 0.00019981333919160215, 'samples': 874912, 'steps': 1708, 'loss/train': 0.697174608707428} -09/20/2021 20:24:34 - INFO - __main__ - Step 27342: {'lr': 0.00019981333919160215, 'samples': 874944, 'steps': 1708, 'loss/train': 0.6721359491348267} -09/20/2021 20:24:34 - INFO - __main__ - Step 27343: {'lr': 0.00019981333919160215, 'samples': 874976, 'steps': 1708, 'loss/train': 3.244933605194092} -09/20/2021 20:24:35 - INFO - __main__ - Step 27344: {'lr': 0.00019981333919160215, 'samples': 875008, 'steps': 1708, 'loss/train': 1.8427834510803223} -09/20/2021 20:24:36 - INFO - __main__ - Step 27345: {'lr': 0.000199812949421275, 'samples': 875040, 'steps': 1709, 'loss/train': 1.3744850158691406} -09/20/2021 20:24:37 - INFO - __main__ - Step 27346: {'lr': 0.000199812949421275, 'samples': 875072, 'steps': 1709, 'loss/train': 2.7523629665374756} -09/20/2021 20:24:38 - INFO - __main__ - Step 27347: {'lr': 0.000199812949421275, 'samples': 875104, 'steps': 1709, 'loss/train': 1.8193176984786987} -09/20/2021 20:24:38 - INFO - __main__ - Step 27348: {'lr': 0.000199812949421275, 'samples': 875136, 'steps': 1709, 'loss/train': 3.2294154167175293} -09/20/2021 20:24:39 - INFO - __main__ - Step 27349: {'lr': 0.000199812949421275, 'samples': 875168, 'steps': 1709, 'loss/train': 3.085282564163208} -09/20/2021 20:24:40 - INFO - __main__ - Step 27350: {'lr': 0.000199812949421275, 'samples': 875200, 'steps': 1709, 'loss/train': 2.3452322483062744} -09/20/2021 20:24:41 - INFO - __main__ - Step 27351: {'lr': 0.000199812949421275, 'samples': 875232, 'steps': 1709, 'loss/train': 1.485935926437378} -09/20/2021 20:24:41 - INFO - __main__ - Step 27352: {'lr': 0.000199812949421275, 'samples': 875264, 'steps': 1709, 'loss/train': 4.186635494232178} -09/20/2021 20:24:42 - INFO - __main__ - Step 27353: {'lr': 0.000199812949421275, 'samples': 875296, 'steps': 1709, 'loss/train': 3.9947426319122314} -09/20/2021 20:24:43 - INFO - __main__ - Step 27354: {'lr': 0.000199812949421275, 'samples': 875328, 'steps': 1709, 'loss/train': 3.646233320236206} -09/20/2021 20:24:44 - INFO - __main__ - Step 27355: {'lr': 0.000199812949421275, 'samples': 875360, 'steps': 1709, 'loss/train': 2.501530170440674} -09/20/2021 20:24:44 - INFO - __main__ - Step 27356: {'lr': 0.000199812949421275, 'samples': 875392, 'steps': 1709, 'loss/train': 2.4511311054229736} -09/20/2021 20:24:46 - INFO - __main__ - Step 27357: {'lr': 0.000199812949421275, 'samples': 875424, 'steps': 1709, 'loss/train': 0.5346351861953735} -09/20/2021 20:24:47 - INFO - __main__ - Step 27358: {'lr': 0.000199812949421275, 'samples': 875456, 'steps': 1709, 'loss/train': 3.3081068992614746} -09/20/2021 20:24:48 - INFO - __main__ - Step 27359: {'lr': 0.000199812949421275, 'samples': 875488, 'steps': 1709, 'loss/train': 2.015547275543213} -09/20/2021 20:24:48 - INFO - __main__ - Step 27360: {'lr': 0.000199812949421275, 'samples': 875520, 'steps': 1709, 'loss/train': 2.344912052154541} -09/20/2021 20:24:49 - INFO - __main__ - Step 27361: {'lr': 0.00019981255924480935, 'samples': 875552, 'steps': 1710, 'loss/train': 2.9765260219573975} -09/20/2021 20:24:50 - INFO - __main__ - Step 27362: {'lr': 0.00019981255924480935, 'samples': 875584, 'steps': 1710, 'loss/train': 3.102125883102417} -09/20/2021 20:24:51 - INFO - __main__ - Step 27363: {'lr': 0.00019981255924480935, 'samples': 875616, 'steps': 1710, 'loss/train': 4.494601249694824} -09/20/2021 20:24:51 - INFO - __main__ - Step 27364: {'lr': 0.00019981255924480935, 'samples': 875648, 'steps': 1710, 'loss/train': 2.5439107418060303} -09/20/2021 20:24:52 - INFO - __main__ - Step 27365: {'lr': 0.00019981255924480935, 'samples': 875680, 'steps': 1710, 'loss/train': 2.556699514389038} -09/20/2021 20:24:53 - INFO - __main__ - Step 27366: {'lr': 0.00019981255924480935, 'samples': 875712, 'steps': 1710, 'loss/train': 2.754397392272949} -09/20/2021 20:24:54 - INFO - __main__ - Step 27367: {'lr': 0.00019981255924480935, 'samples': 875744, 'steps': 1710, 'loss/train': 2.2847342491149902} -09/20/2021 20:24:54 - INFO - __main__ - Step 27368: {'lr': 0.00019981255924480935, 'samples': 875776, 'steps': 1710, 'loss/train': 3.7155747413635254} -09/20/2021 20:24:55 - INFO - __main__ - Step 27369: {'lr': 0.00019981255924480935, 'samples': 875808, 'steps': 1710, 'loss/train': 3.1405155658721924} -09/20/2021 20:24:56 - INFO - __main__ - Step 27370: {'lr': 0.00019981255924480935, 'samples': 875840, 'steps': 1710, 'loss/train': 3.06445574760437} -09/20/2021 20:24:57 - INFO - __main__ - Step 27371: {'lr': 0.00019981255924480935, 'samples': 875872, 'steps': 1710, 'loss/train': 2.8229026794433594} -09/20/2021 20:24:57 - INFO - __main__ - Step 27372: {'lr': 0.00019981255924480935, 'samples': 875904, 'steps': 1710, 'loss/train': 2.3659234046936035} -09/20/2021 20:24:58 - INFO - __main__ - Step 27373: {'lr': 0.00019981255924480935, 'samples': 875936, 'steps': 1710, 'loss/train': 2.504753351211548} -09/20/2021 20:24:59 - INFO - __main__ - Step 27374: {'lr': 0.00019981255924480935, 'samples': 875968, 'steps': 1710, 'loss/train': 1.5848122835159302} -09/20/2021 20:25:00 - INFO - __main__ - Step 27375: {'lr': 0.00019981255924480935, 'samples': 876000, 'steps': 1710, 'loss/train': 2.3286612033843994} -09/20/2021 20:25:00 - INFO - __main__ - Step 27376: {'lr': 0.00019981255924480935, 'samples': 876032, 'steps': 1710, 'loss/train': 2.457231283187866} -09/20/2021 20:25:01 - INFO - __main__ - Step 27377: {'lr': 0.0001998121686622068, 'samples': 876064, 'steps': 1711, 'loss/train': 3.682325839996338} -09/20/2021 20:25:02 - INFO - __main__ - Step 27378: {'lr': 0.0001998121686622068, 'samples': 876096, 'steps': 1711, 'loss/train': 0.7088771462440491} -09/20/2021 20:25:03 - INFO - __main__ - Step 27379: {'lr': 0.0001998121686622068, 'samples': 876128, 'steps': 1711, 'loss/train': 2.468496322631836} -09/20/2021 20:25:04 - INFO - __main__ - Step 27380: {'lr': 0.0001998121686622068, 'samples': 876160, 'steps': 1711, 'loss/train': 2.883901596069336} -09/20/2021 20:25:04 - INFO - __main__ - Step 27381: {'lr': 0.0001998121686622068, 'samples': 876192, 'steps': 1711, 'loss/train': 3.3939530849456787} -09/20/2021 20:25:05 - INFO - __main__ - Step 27382: {'lr': 0.0001998121686622068, 'samples': 876224, 'steps': 1711, 'loss/train': 2.588838577270508} -09/20/2021 20:25:06 - INFO - __main__ - Step 27383: {'lr': 0.0001998121686622068, 'samples': 876256, 'steps': 1711, 'loss/train': 2.7555692195892334} -09/20/2021 20:25:07 - INFO - __main__ - Step 27384: {'lr': 0.0001998121686622068, 'samples': 876288, 'steps': 1711, 'loss/train': 2.966312885284424} -09/20/2021 20:25:07 - INFO - __main__ - Step 27385: {'lr': 0.0001998121686622068, 'samples': 876320, 'steps': 1711, 'loss/train': 2.3065223693847656} -09/20/2021 20:25:08 - INFO - __main__ - Step 27386: {'lr': 0.0001998121686622068, 'samples': 876352, 'steps': 1711, 'loss/train': 2.9684364795684814} -09/20/2021 20:25:09 - INFO - __main__ - Step 27387: {'lr': 0.0001998121686622068, 'samples': 876384, 'steps': 1711, 'loss/train': 2.619671106338501} -09/20/2021 20:25:10 - INFO - __main__ - Step 27388: {'lr': 0.0001998121686622068, 'samples': 876416, 'steps': 1711, 'loss/train': 1.4588522911071777} -09/20/2021 20:25:11 - INFO - __main__ - Step 27389: {'lr': 0.0001998121686622068, 'samples': 876448, 'steps': 1711, 'loss/train': 1.5318409204483032} -09/20/2021 20:25:12 - INFO - __main__ - Step 27390: {'lr': 0.0001998121686622068, 'samples': 876480, 'steps': 1711, 'loss/train': 3.27148699760437} -09/20/2021 20:25:12 - INFO - __main__ - Step 27391: {'lr': 0.0001998121686622068, 'samples': 876512, 'steps': 1711, 'loss/train': 2.32529878616333} -09/20/2021 20:25:13 - INFO - __main__ - Step 27392: {'lr': 0.0001998121686622068, 'samples': 876544, 'steps': 1711, 'loss/train': 2.737178087234497} -09/20/2021 20:25:14 - INFO - __main__ - Step 27393: {'lr': 0.00019981177767346888, 'samples': 876576, 'steps': 1712, 'loss/train': 3.4313554763793945} -09/20/2021 20:25:15 - INFO - __main__ - Step 27394: {'lr': 0.00019981177767346888, 'samples': 876608, 'steps': 1712, 'loss/train': 3.0892484188079834} -09/20/2021 20:25:16 - INFO - __main__ - Step 27395: {'lr': 0.00019981177767346888, 'samples': 876640, 'steps': 1712, 'loss/train': 2.1364264488220215} -09/20/2021 20:25:16 - INFO - __main__ - Step 27396: {'lr': 0.00019981177767346888, 'samples': 876672, 'steps': 1712, 'loss/train': 2.542137861251831} -09/20/2021 20:25:17 - INFO - __main__ - Step 27397: {'lr': 0.00019981177767346888, 'samples': 876704, 'steps': 1712, 'loss/train': 2.08296275138855} -09/20/2021 20:25:18 - INFO - __main__ - Step 27398: {'lr': 0.00019981177767346888, 'samples': 876736, 'steps': 1712, 'loss/train': 2.618795156478882} -09/20/2021 20:25:19 - INFO - __main__ - Step 27399: {'lr': 0.00019981177767346888, 'samples': 876768, 'steps': 1712, 'loss/train': 3.499312162399292} -09/20/2021 20:25:19 - INFO - __main__ - Step 27400: {'lr': 0.00019981177767346888, 'samples': 876800, 'steps': 1712, 'loss/train': 2.9405083656311035} -09/20/2021 20:25:20 - INFO - __main__ - Step 27401: {'lr': 0.00019981177767346888, 'samples': 876832, 'steps': 1712, 'loss/train': 2.6913628578186035} -09/20/2021 20:25:21 - INFO - __main__ - Step 27402: {'lr': 0.00019981177767346888, 'samples': 876864, 'steps': 1712, 'loss/train': 2.8490400314331055} -09/20/2021 20:25:22 - INFO - __main__ - Step 27403: {'lr': 0.00019981177767346888, 'samples': 876896, 'steps': 1712, 'loss/train': 2.6000497341156006} -09/20/2021 20:25:22 - INFO - __main__ - Step 27404: {'lr': 0.00019981177767346888, 'samples': 876928, 'steps': 1712, 'loss/train': 4.4176506996154785} -09/20/2021 20:25:23 - INFO - __main__ - Step 27405: {'lr': 0.00019981177767346888, 'samples': 876960, 'steps': 1712, 'loss/train': 3.887096881866455} -09/20/2021 20:25:24 - INFO - __main__ - Step 27406: {'lr': 0.00019981177767346888, 'samples': 876992, 'steps': 1712, 'loss/train': 2.5004169940948486} -09/20/2021 20:25:25 - INFO - __main__ - Step 27407: {'lr': 0.00019981177767346888, 'samples': 877024, 'steps': 1712, 'loss/train': 3.061410665512085} -09/20/2021 20:25:25 - INFO - __main__ - Step 27408: {'lr': 0.00019981177767346888, 'samples': 877056, 'steps': 1712, 'loss/train': 2.423996686935425} -09/20/2021 20:25:26 - INFO - __main__ - Step 27409: {'lr': 0.00019981138627859726, 'samples': 877088, 'steps': 1713, 'loss/train': 3.2895071506500244} -09/20/2021 20:25:27 - INFO - __main__ - Step 27410: {'lr': 0.00019981138627859726, 'samples': 877120, 'steps': 1713, 'loss/train': 3.404839038848877} -09/20/2021 20:25:28 - INFO - __main__ - Step 27411: {'lr': 0.00019981138627859726, 'samples': 877152, 'steps': 1713, 'loss/train': 1.8945772647857666} -09/20/2021 20:25:28 - INFO - __main__ - Step 27412: {'lr': 0.00019981138627859726, 'samples': 877184, 'steps': 1713, 'loss/train': 3.042207717895508} -09/20/2021 20:25:29 - INFO - __main__ - Step 27413: {'lr': 0.00019981138627859726, 'samples': 877216, 'steps': 1713, 'loss/train': 2.404618501663208} -09/20/2021 20:25:30 - INFO - __main__ - Step 27414: {'lr': 0.00019981138627859726, 'samples': 877248, 'steps': 1713, 'loss/train': 2.544801950454712} -09/20/2021 20:25:31 - INFO - __main__ - Step 27415: {'lr': 0.00019981138627859726, 'samples': 877280, 'steps': 1713, 'loss/train': 2.608888626098633} -09/20/2021 20:25:31 - INFO - __main__ - Step 27416: {'lr': 0.00019981138627859726, 'samples': 877312, 'steps': 1713, 'loss/train': 0.772748589515686} -09/20/2021 20:25:32 - INFO - __main__ - Step 27417: {'lr': 0.00019981138627859726, 'samples': 877344, 'steps': 1713, 'loss/train': 3.104557514190674} -09/20/2021 20:25:33 - INFO - __main__ - Step 27418: {'lr': 0.00019981138627859726, 'samples': 877376, 'steps': 1713, 'loss/train': 2.8813412189483643} -09/20/2021 20:25:34 - INFO - __main__ - Step 27419: {'lr': 0.00019981138627859726, 'samples': 877408, 'steps': 1713, 'loss/train': 1.9262748956680298} -09/20/2021 20:25:35 - INFO - __main__ - Step 27420: {'lr': 0.00019981138627859726, 'samples': 877440, 'steps': 1713, 'loss/train': 2.6779046058654785} -09/20/2021 20:25:36 - INFO - __main__ - Step 27421: {'lr': 0.00019981138627859726, 'samples': 877472, 'steps': 1713, 'loss/train': 2.3810250759124756} -09/20/2021 20:25:37 - INFO - __main__ - Step 27422: {'lr': 0.00019981138627859726, 'samples': 877504, 'steps': 1713, 'loss/train': 2.7316553592681885} -09/20/2021 20:25:38 - INFO - __main__ - Step 27423: {'lr': 0.00019981138627859726, 'samples': 877536, 'steps': 1713, 'loss/train': 0.465859979391098} -09/20/2021 20:25:38 - INFO - __main__ - Step 27424: {'lr': 0.00019981138627859726, 'samples': 877568, 'steps': 1713, 'loss/train': 0.8230252861976624} -09/20/2021 20:25:39 - INFO - __main__ - Step 27425: {'lr': 0.00019981099447759348, 'samples': 877600, 'steps': 1714, 'loss/train': 2.407297372817993} -09/20/2021 20:25:40 - INFO - __main__ - Step 27426: {'lr': 0.00019981099447759348, 'samples': 877632, 'steps': 1714, 'loss/train': 2.8782529830932617} -09/20/2021 20:25:41 - INFO - __main__ - Step 27427: {'lr': 0.00019981099447759348, 'samples': 877664, 'steps': 1714, 'loss/train': 2.641833782196045} -09/20/2021 20:25:41 - INFO - __main__ - Step 27428: {'lr': 0.00019981099447759348, 'samples': 877696, 'steps': 1714, 'loss/train': 2.205803155899048} -09/20/2021 20:25:42 - INFO - __main__ - Step 27429: {'lr': 0.00019981099447759348, 'samples': 877728, 'steps': 1714, 'loss/train': 1.8126153945922852} -09/20/2021 20:25:43 - INFO - __main__ - Step 27430: {'lr': 0.00019981099447759348, 'samples': 877760, 'steps': 1714, 'loss/train': 2.096464157104492} -09/20/2021 20:25:44 - INFO - __main__ - Step 27431: {'lr': 0.00019981099447759348, 'samples': 877792, 'steps': 1714, 'loss/train': 3.2972214221954346} -09/20/2021 20:25:44 - INFO - __main__ - Step 27432: {'lr': 0.00019981099447759348, 'samples': 877824, 'steps': 1714, 'loss/train': 2.115347385406494} -09/20/2021 20:25:45 - INFO - __main__ - Step 27433: {'lr': 0.00019981099447759348, 'samples': 877856, 'steps': 1714, 'loss/train': 2.725633382797241} -09/20/2021 20:25:46 - INFO - __main__ - Step 27434: {'lr': 0.00019981099447759348, 'samples': 877888, 'steps': 1714, 'loss/train': 2.822892189025879} -09/20/2021 20:25:47 - INFO - __main__ - Step 27435: {'lr': 0.00019981099447759348, 'samples': 877920, 'steps': 1714, 'loss/train': 2.550755262374878} -09/20/2021 20:25:47 - INFO - __main__ - Step 27436: {'lr': 0.00019981099447759348, 'samples': 877952, 'steps': 1714, 'loss/train': 1.7101860046386719} -09/20/2021 20:25:48 - INFO - __main__ - Step 27437: {'lr': 0.00019981099447759348, 'samples': 877984, 'steps': 1714, 'loss/train': 2.2632617950439453} -09/20/2021 20:25:49 - INFO - __main__ - Step 27438: {'lr': 0.00019981099447759348, 'samples': 878016, 'steps': 1714, 'loss/train': 2.990176200866699} -09/20/2021 20:25:50 - INFO - __main__ - Step 27439: {'lr': 0.00019981099447759348, 'samples': 878048, 'steps': 1714, 'loss/train': 3.409128427505493} -09/20/2021 20:25:50 - INFO - __main__ - Step 27440: {'lr': 0.00019981099447759348, 'samples': 878080, 'steps': 1714, 'loss/train': 2.8078396320343018} -09/20/2021 20:25:51 - INFO - __main__ - Step 27441: {'lr': 0.00019981060227045914, 'samples': 878112, 'steps': 1715, 'loss/train': 2.054628610610962} -09/20/2021 20:25:52 - INFO - __main__ - Step 27442: {'lr': 0.00019981060227045914, 'samples': 878144, 'steps': 1715, 'loss/train': 2.2054905891418457} -09/20/2021 20:25:53 - INFO - __main__ - Step 27443: {'lr': 0.00019981060227045914, 'samples': 878176, 'steps': 1715, 'loss/train': 1.7458150386810303} -09/20/2021 20:25:54 - INFO - __main__ - Step 27444: {'lr': 0.00019981060227045914, 'samples': 878208, 'steps': 1715, 'loss/train': 2.030092477798462} -09/20/2021 20:25:54 - INFO - __main__ - Step 27445: {'lr': 0.00019981060227045914, 'samples': 878240, 'steps': 1715, 'loss/train': 2.116722345352173} -09/20/2021 20:25:55 - INFO - __main__ - Step 27446: {'lr': 0.00019981060227045914, 'samples': 878272, 'steps': 1715, 'loss/train': 2.0315964221954346} -09/20/2021 20:25:56 - INFO - __main__ - Step 27447: {'lr': 0.00019981060227045914, 'samples': 878304, 'steps': 1715, 'loss/train': 2.349506139755249} -09/20/2021 20:25:57 - INFO - __main__ - Step 27448: {'lr': 0.00019981060227045914, 'samples': 878336, 'steps': 1715, 'loss/train': 2.538654327392578} -09/20/2021 20:25:58 - INFO - __main__ - Step 27449: {'lr': 0.00019981060227045914, 'samples': 878368, 'steps': 1715, 'loss/train': 2.9514098167419434} -09/20/2021 20:25:59 - INFO - __main__ - Step 27450: {'lr': 0.00019981060227045914, 'samples': 878400, 'steps': 1715, 'loss/train': 3.7534873485565186} -09/20/2021 20:25:59 - INFO - __main__ - Step 27451: {'lr': 0.00019981060227045914, 'samples': 878432, 'steps': 1715, 'loss/train': 2.158909320831299} -09/20/2021 20:26:00 - INFO - __main__ - Step 27452: {'lr': 0.00019981060227045914, 'samples': 878464, 'steps': 1715, 'loss/train': 3.235741376876831} -09/20/2021 20:26:01 - INFO - __main__ - Step 27453: {'lr': 0.00019981060227045914, 'samples': 878496, 'steps': 1715, 'loss/train': 2.6022465229034424} -09/20/2021 20:26:02 - INFO - __main__ - Step 27454: {'lr': 0.00019981060227045914, 'samples': 878528, 'steps': 1715, 'loss/train': 3.7195794582366943} -09/20/2021 20:26:02 - INFO - __main__ - Step 27455: {'lr': 0.00019981060227045914, 'samples': 878560, 'steps': 1715, 'loss/train': 3.5753471851348877} -09/20/2021 20:26:03 - INFO - __main__ - Step 27456: {'lr': 0.00019981060227045914, 'samples': 878592, 'steps': 1715, 'loss/train': 2.561886787414551} -09/20/2021 20:26:04 - INFO - __main__ - Step 27457: {'lr': 0.00019981020965719587, 'samples': 878624, 'steps': 1716, 'loss/train': 3.10129714012146} -09/20/2021 20:26:05 - INFO - __main__ - Step 27458: {'lr': 0.00019981020965719587, 'samples': 878656, 'steps': 1716, 'loss/train': 2.860645294189453} -09/20/2021 20:26:05 - INFO - __main__ - Step 27459: {'lr': 0.00019981020965719587, 'samples': 878688, 'steps': 1716, 'loss/train': 2.041116952896118} -09/20/2021 20:26:06 - INFO - __main__ - Step 27460: {'lr': 0.00019981020965719587, 'samples': 878720, 'steps': 1716, 'loss/train': 2.817221164703369} -09/20/2021 20:26:07 - INFO - __main__ - Step 27461: {'lr': 0.00019981020965719587, 'samples': 878752, 'steps': 1716, 'loss/train': 3.0442514419555664} -09/20/2021 20:26:08 - INFO - __main__ - Step 27462: {'lr': 0.00019981020965719587, 'samples': 878784, 'steps': 1716, 'loss/train': 3.038489580154419} -09/20/2021 20:26:08 - INFO - __main__ - Step 27463: {'lr': 0.00019981020965719587, 'samples': 878816, 'steps': 1716, 'loss/train': 2.069553852081299} -09/20/2021 20:26:09 - INFO - __main__ - Step 27464: {'lr': 0.00019981020965719587, 'samples': 878848, 'steps': 1716, 'loss/train': 4.4097981452941895} -09/20/2021 20:26:10 - INFO - __main__ - Step 27465: {'lr': 0.00019981020965719587, 'samples': 878880, 'steps': 1716, 'loss/train': 2.739280939102173} -09/20/2021 20:26:11 - INFO - __main__ - Step 27466: {'lr': 0.00019981020965719587, 'samples': 878912, 'steps': 1716, 'loss/train': 3.586542844772339} -09/20/2021 20:26:11 - INFO - __main__ - Step 27467: {'lr': 0.00019981020965719587, 'samples': 878944, 'steps': 1716, 'loss/train': 2.2535712718963623} -09/20/2021 20:26:12 - INFO - __main__ - Step 27468: {'lr': 0.00019981020965719587, 'samples': 878976, 'steps': 1716, 'loss/train': 2.591163158416748} -09/20/2021 20:26:13 - INFO - __main__ - Step 27469: {'lr': 0.00019981020965719587, 'samples': 879008, 'steps': 1716, 'loss/train': 1.9863773584365845} -09/20/2021 20:26:14 - INFO - __main__ - Step 27470: {'lr': 0.00019981020965719587, 'samples': 879040, 'steps': 1716, 'loss/train': 1.5903302431106567} -09/20/2021 20:26:14 - INFO - __main__ - Step 27471: {'lr': 0.00019981020965719587, 'samples': 879072, 'steps': 1716, 'loss/train': 2.3122451305389404} -09/20/2021 20:26:15 - INFO - __main__ - Step 27472: {'lr': 0.00019981020965719587, 'samples': 879104, 'steps': 1716, 'loss/train': 2.8679678440093994} -09/20/2021 20:26:16 - INFO - __main__ - Step 27473: {'lr': 0.00019980981663780524, 'samples': 879136, 'steps': 1717, 'loss/train': 2.330051898956299} -09/20/2021 20:26:17 - INFO - __main__ - Step 27474: {'lr': 0.00019980981663780524, 'samples': 879168, 'steps': 1717, 'loss/train': 3.391582489013672} -09/20/2021 20:26:18 - INFO - __main__ - Step 27475: {'lr': 0.00019980981663780524, 'samples': 879200, 'steps': 1717, 'loss/train': 3.1693508625030518} -09/20/2021 20:26:18 - INFO - __main__ - Step 27476: {'lr': 0.00019980981663780524, 'samples': 879232, 'steps': 1717, 'loss/train': 1.9825087785720825} -09/20/2021 20:26:19 - INFO - __main__ - Step 27477: {'lr': 0.00019980981663780524, 'samples': 879264, 'steps': 1717, 'loss/train': 3.317617893218994} -09/20/2021 20:26:20 - INFO - __main__ - Step 27478: {'lr': 0.00019980981663780524, 'samples': 879296, 'steps': 1717, 'loss/train': 2.6340553760528564} -09/20/2021 20:26:21 - INFO - __main__ - Step 27479: {'lr': 0.00019980981663780524, 'samples': 879328, 'steps': 1717, 'loss/train': 2.9070780277252197} -09/20/2021 20:26:22 - INFO - __main__ - Step 27480: {'lr': 0.00019980981663780524, 'samples': 879360, 'steps': 1717, 'loss/train': 2.848769187927246} -09/20/2021 20:26:23 - INFO - __main__ - Step 27481: {'lr': 0.00019980981663780524, 'samples': 879392, 'steps': 1717, 'loss/train': 1.756775975227356} -09/20/2021 20:26:23 - INFO - __main__ - Step 27482: {'lr': 0.00019980981663780524, 'samples': 879424, 'steps': 1717, 'loss/train': 0.61907958984375} -09/20/2021 20:26:24 - INFO - __main__ - Step 27483: {'lr': 0.00019980981663780524, 'samples': 879456, 'steps': 1717, 'loss/train': 1.3286488056182861} -09/20/2021 20:26:25 - INFO - __main__ - Step 27484: {'lr': 0.00019980981663780524, 'samples': 879488, 'steps': 1717, 'loss/train': 3.033919334411621} -09/20/2021 20:26:26 - INFO - __main__ - Step 27485: {'lr': 0.00019980981663780524, 'samples': 879520, 'steps': 1717, 'loss/train': 3.085740804672241} -09/20/2021 20:26:26 - INFO - __main__ - Step 27486: {'lr': 0.00019980981663780524, 'samples': 879552, 'steps': 1717, 'loss/train': 3.3756344318389893} -09/20/2021 20:26:27 - INFO - __main__ - Step 27487: {'lr': 0.00019980981663780524, 'samples': 879584, 'steps': 1717, 'loss/train': 3.7309069633483887} -09/20/2021 20:26:28 - INFO - __main__ - Step 27488: {'lr': 0.00019980981663780524, 'samples': 879616, 'steps': 1717, 'loss/train': 2.4905893802642822} -09/20/2021 20:26:29 - INFO - __main__ - Step 27489: {'lr': 0.00019980942321228885, 'samples': 879648, 'steps': 1718, 'loss/train': 4.136690616607666} -09/20/2021 20:26:29 - INFO - __main__ - Step 27490: {'lr': 0.00019980942321228885, 'samples': 879680, 'steps': 1718, 'loss/train': 2.768828868865967} -09/20/2021 20:26:30 - INFO - __main__ - Step 27491: {'lr': 0.00019980942321228885, 'samples': 879712, 'steps': 1718, 'loss/train': 3.091073989868164} -09/20/2021 20:26:31 - INFO - __main__ - Step 27492: {'lr': 0.00019980942321228885, 'samples': 879744, 'steps': 1718, 'loss/train': 2.6603896617889404} -09/20/2021 20:26:32 - INFO - __main__ - Step 27493: {'lr': 0.00019980942321228885, 'samples': 879776, 'steps': 1718, 'loss/train': 3.1987640857696533} -09/20/2021 20:26:32 - INFO - __main__ - Step 27494: {'lr': 0.00019980942321228885, 'samples': 879808, 'steps': 1718, 'loss/train': 1.7250440120697021} -09/20/2021 20:26:33 - INFO - __main__ - Step 27495: {'lr': 0.00019980942321228885, 'samples': 879840, 'steps': 1718, 'loss/train': 3.0808677673339844} -09/20/2021 20:26:34 - INFO - __main__ - Step 27496: {'lr': 0.00019980942321228885, 'samples': 879872, 'steps': 1718, 'loss/train': 2.8717405796051025} -09/20/2021 20:26:35 - INFO - __main__ - Step 27497: {'lr': 0.00019980942321228885, 'samples': 879904, 'steps': 1718, 'loss/train': 2.802001476287842} -09/20/2021 20:26:35 - INFO - __main__ - Step 27498: {'lr': 0.00019980942321228885, 'samples': 879936, 'steps': 1718, 'loss/train': 3.0924980640411377} -09/20/2021 20:26:36 - INFO - __main__ - Step 27499: {'lr': 0.00019980942321228885, 'samples': 879968, 'steps': 1718, 'loss/train': 2.4991672039031982} -09/20/2021 20:26:37 - INFO - __main__ - Step 27500: {'lr': 0.00019980942321228885, 'samples': 880000, 'steps': 1718, 'loss/train': 2.479139566421509} -09/20/2021 20:26:38 - INFO - __main__ - Step 27501: {'lr': 0.00019980942321228885, 'samples': 880032, 'steps': 1718, 'loss/train': 2.907670497894287} -09/20/2021 20:26:38 - INFO - __main__ - Step 27502: {'lr': 0.00019980942321228885, 'samples': 880064, 'steps': 1718, 'loss/train': 2.718517303466797} -09/20/2021 20:26:39 - INFO - __main__ - Step 27503: {'lr': 0.00019980942321228885, 'samples': 880096, 'steps': 1718, 'loss/train': 3.283475160598755} -09/20/2021 20:26:40 - INFO - __main__ - Step 27504: {'lr': 0.00019980942321228885, 'samples': 880128, 'steps': 1718, 'loss/train': 2.304297924041748} -09/20/2021 20:26:41 - INFO - __main__ - Step 27505: {'lr': 0.00019980902938064832, 'samples': 880160, 'steps': 1719, 'loss/train': 0.9794718027114868} -09/20/2021 20:26:42 - INFO - __main__ - Step 27506: {'lr': 0.00019980902938064832, 'samples': 880192, 'steps': 1719, 'loss/train': 2.624551773071289} -09/20/2021 20:26:42 - INFO - __main__ - Step 27507: {'lr': 0.00019980902938064832, 'samples': 880224, 'steps': 1719, 'loss/train': 3.400700330734253} -09/20/2021 20:26:43 - INFO - __main__ - Step 27508: {'lr': 0.00019980902938064832, 'samples': 880256, 'steps': 1719, 'loss/train': 3.5495519638061523} -09/20/2021 20:26:44 - INFO - __main__ - Step 27509: {'lr': 0.00019980902938064832, 'samples': 880288, 'steps': 1719, 'loss/train': 2.610046625137329} -09/20/2021 20:26:45 - INFO - __main__ - Step 27510: {'lr': 0.00019980902938064832, 'samples': 880320, 'steps': 1719, 'loss/train': 1.0225542783737183} -09/20/2021 20:26:46 - INFO - __main__ - Step 27511: {'lr': 0.00019980902938064832, 'samples': 880352, 'steps': 1719, 'loss/train': 2.4009382724761963} -09/20/2021 20:26:47 - INFO - __main__ - Step 27512: {'lr': 0.00019980902938064832, 'samples': 880384, 'steps': 1719, 'loss/train': 2.541320323944092} -09/20/2021 20:26:47 - INFO - __main__ - Step 27513: {'lr': 0.00019980902938064832, 'samples': 880416, 'steps': 1719, 'loss/train': 2.023280620574951} -09/20/2021 20:26:48 - INFO - __main__ - Step 27514: {'lr': 0.00019980902938064832, 'samples': 880448, 'steps': 1719, 'loss/train': 2.856656551361084} -09/20/2021 20:26:49 - INFO - __main__ - Step 27515: {'lr': 0.00019980902938064832, 'samples': 880480, 'steps': 1719, 'loss/train': 2.5679068565368652} -09/20/2021 20:26:50 - INFO - __main__ - Step 27516: {'lr': 0.00019980902938064832, 'samples': 880512, 'steps': 1719, 'loss/train': 2.1181859970092773} -09/20/2021 20:26:50 - INFO - __main__ - Step 27517: {'lr': 0.00019980902938064832, 'samples': 880544, 'steps': 1719, 'loss/train': 3.146364450454712} -09/20/2021 20:26:51 - INFO - __main__ - Step 27518: {'lr': 0.00019980902938064832, 'samples': 880576, 'steps': 1719, 'loss/train': 1.9772738218307495} -09/20/2021 20:26:52 - INFO - __main__ - Step 27519: {'lr': 0.00019980902938064832, 'samples': 880608, 'steps': 1719, 'loss/train': 2.901902198791504} -09/20/2021 20:26:53 - INFO - __main__ - Step 27520: {'lr': 0.00019980902938064832, 'samples': 880640, 'steps': 1719, 'loss/train': 2.998060464859009} -09/20/2021 20:26:54 - INFO - __main__ - Step 27521: {'lr': 0.00019980863514288522, 'samples': 880672, 'steps': 1720, 'loss/train': 3.2955853939056396} -09/20/2021 20:26:54 - INFO - __main__ - Step 27522: {'lr': 0.00019980863514288522, 'samples': 880704, 'steps': 1720, 'loss/train': 3.535930633544922} -09/20/2021 20:26:55 - INFO - __main__ - Step 27523: {'lr': 0.00019980863514288522, 'samples': 880736, 'steps': 1720, 'loss/train': 2.063048839569092} -09/20/2021 20:26:56 - INFO - __main__ - Step 27524: {'lr': 0.00019980863514288522, 'samples': 880768, 'steps': 1720, 'loss/train': 3.0076868534088135} -09/20/2021 20:26:57 - INFO - __main__ - Step 27525: {'lr': 0.00019980863514288522, 'samples': 880800, 'steps': 1720, 'loss/train': 3.5624618530273438} -09/20/2021 20:26:57 - INFO - __main__ - Step 27526: {'lr': 0.00019980863514288522, 'samples': 880832, 'steps': 1720, 'loss/train': 2.9052419662475586} -09/20/2021 20:26:58 - INFO - __main__ - Step 27527: {'lr': 0.00019980863514288522, 'samples': 880864, 'steps': 1720, 'loss/train': 3.5513739585876465} -09/20/2021 20:26:59 - INFO - __main__ - Step 27528: {'lr': 0.00019980863514288522, 'samples': 880896, 'steps': 1720, 'loss/train': 3.177281618118286} -09/20/2021 20:27:00 - INFO - __main__ - Step 27529: {'lr': 0.00019980863514288522, 'samples': 880928, 'steps': 1720, 'loss/train': 2.1119027137756348} -09/20/2021 20:27:00 - INFO - __main__ - Step 27530: {'lr': 0.00019980863514288522, 'samples': 880960, 'steps': 1720, 'loss/train': 3.2767066955566406} -09/20/2021 20:27:01 - INFO - __main__ - Step 27531: {'lr': 0.00019980863514288522, 'samples': 880992, 'steps': 1720, 'loss/train': 2.5516505241394043} -09/20/2021 20:27:02 - INFO - __main__ - Step 27532: {'lr': 0.00019980863514288522, 'samples': 881024, 'steps': 1720, 'loss/train': 1.0017093420028687} -09/20/2021 20:27:03 - INFO - __main__ - Step 27533: {'lr': 0.00019980863514288522, 'samples': 881056, 'steps': 1720, 'loss/train': 2.836387872695923} -09/20/2021 20:27:03 - INFO - __main__ - Step 27534: {'lr': 0.00019980863514288522, 'samples': 881088, 'steps': 1720, 'loss/train': 3.284881114959717} -09/20/2021 20:27:04 - INFO - __main__ - Step 27535: {'lr': 0.00019980863514288522, 'samples': 881120, 'steps': 1720, 'loss/train': 2.4830751419067383} -09/20/2021 20:27:05 - INFO - __main__ - Step 27536: {'lr': 0.00019980863514288522, 'samples': 881152, 'steps': 1720, 'loss/train': 2.9043774604797363} -09/20/2021 20:27:06 - INFO - __main__ - Step 27537: {'lr': 0.0001998082404990012, 'samples': 881184, 'steps': 1721, 'loss/train': 3.3533742427825928} -09/20/2021 20:27:06 - INFO - __main__ - Step 27538: {'lr': 0.0001998082404990012, 'samples': 881216, 'steps': 1721, 'loss/train': 2.8073132038116455} -09/20/2021 20:27:07 - INFO - __main__ - Step 27539: {'lr': 0.0001998082404990012, 'samples': 881248, 'steps': 1721, 'loss/train': 2.937584161758423} -09/20/2021 20:27:08 - INFO - __main__ - Step 27540: {'lr': 0.0001998082404990012, 'samples': 881280, 'steps': 1721, 'loss/train': 2.253566026687622} -09/20/2021 20:27:09 - INFO - __main__ - Step 27541: {'lr': 0.0001998082404990012, 'samples': 881312, 'steps': 1721, 'loss/train': 1.2587053775787354} -09/20/2021 20:27:09 - INFO - __main__ - Step 27542: {'lr': 0.0001998082404990012, 'samples': 881344, 'steps': 1721, 'loss/train': 0.5421027541160583} -09/20/2021 20:27:10 - INFO - __main__ - Step 27543: {'lr': 0.0001998082404990012, 'samples': 881376, 'steps': 1721, 'loss/train': 2.560616970062256} -09/20/2021 20:27:12 - INFO - __main__ - Step 27544: {'lr': 0.0001998082404990012, 'samples': 881408, 'steps': 1721, 'loss/train': 3.3112831115722656} -09/20/2021 20:27:12 - INFO - __main__ - Step 27545: {'lr': 0.0001998082404990012, 'samples': 881440, 'steps': 1721, 'loss/train': 2.135758876800537} -09/20/2021 20:27:13 - INFO - __main__ - Step 27546: {'lr': 0.0001998082404990012, 'samples': 881472, 'steps': 1721, 'loss/train': 3.35105299949646} -09/20/2021 20:27:14 - INFO - __main__ - Step 27547: {'lr': 0.0001998082404990012, 'samples': 881504, 'steps': 1721, 'loss/train': 2.8017797470092773} -09/20/2021 20:27:15 - INFO - __main__ - Step 27548: {'lr': 0.0001998082404990012, 'samples': 881536, 'steps': 1721, 'loss/train': 2.3123021125793457} -09/20/2021 20:27:15 - INFO - __main__ - Step 27549: {'lr': 0.0001998082404990012, 'samples': 881568, 'steps': 1721, 'loss/train': 2.7130446434020996} -09/20/2021 20:27:16 - INFO - __main__ - Step 27550: {'lr': 0.0001998082404990012, 'samples': 881600, 'steps': 1721, 'loss/train': 2.113348960876465} -09/20/2021 20:27:17 - INFO - __main__ - Step 27551: {'lr': 0.0001998082404990012, 'samples': 881632, 'steps': 1721, 'loss/train': 2.609204053878784} -09/20/2021 20:27:18 - INFO - __main__ - Step 27552: {'lr': 0.0001998082404990012, 'samples': 881664, 'steps': 1721, 'loss/train': 3.0263407230377197} -09/20/2021 20:27:18 - INFO - __main__ - Step 27553: {'lr': 0.0001998078454489978, 'samples': 881696, 'steps': 1722, 'loss/train': 2.4237565994262695} -09/20/2021 20:27:19 - INFO - __main__ - Step 27554: {'lr': 0.0001998078454489978, 'samples': 881728, 'steps': 1722, 'loss/train': 2.0349082946777344} -09/20/2021 20:27:20 - INFO - __main__ - Step 27555: {'lr': 0.0001998078454489978, 'samples': 881760, 'steps': 1722, 'loss/train': 2.2136194705963135} -09/20/2021 20:27:21 - INFO - __main__ - Step 27556: {'lr': 0.0001998078454489978, 'samples': 881792, 'steps': 1722, 'loss/train': 2.9992361068725586} -09/20/2021 20:27:21 - INFO - __main__ - Step 27557: {'lr': 0.0001998078454489978, 'samples': 881824, 'steps': 1722, 'loss/train': 2.836191177368164} -09/20/2021 20:27:22 - INFO - __main__ - Step 27558: {'lr': 0.0001998078454489978, 'samples': 881856, 'steps': 1722, 'loss/train': 3.3752429485321045} -09/20/2021 20:27:23 - INFO - __main__ - Step 27559: {'lr': 0.0001998078454489978, 'samples': 881888, 'steps': 1722, 'loss/train': 2.471524715423584} -09/20/2021 20:27:24 - INFO - __main__ - Step 27560: {'lr': 0.0001998078454489978, 'samples': 881920, 'steps': 1722, 'loss/train': 1.8450464010238647} -09/20/2021 20:27:24 - INFO - __main__ - Step 27561: {'lr': 0.0001998078454489978, 'samples': 881952, 'steps': 1722, 'loss/train': 2.533616304397583} -09/20/2021 20:27:25 - INFO - __main__ - Step 27562: {'lr': 0.0001998078454489978, 'samples': 881984, 'steps': 1722, 'loss/train': 3.349712610244751} -09/20/2021 20:27:26 - INFO - __main__ - Step 27563: {'lr': 0.0001998078454489978, 'samples': 882016, 'steps': 1722, 'loss/train': 2.9129891395568848} -09/20/2021 20:27:27 - INFO - __main__ - Step 27564: {'lr': 0.0001998078454489978, 'samples': 882048, 'steps': 1722, 'loss/train': 3.219257116317749} -09/20/2021 20:27:27 - INFO - __main__ - Step 27565: {'lr': 0.0001998078454489978, 'samples': 882080, 'steps': 1722, 'loss/train': 2.004934787750244} -09/20/2021 20:27:28 - INFO - __main__ - Step 27566: {'lr': 0.0001998078454489978, 'samples': 882112, 'steps': 1722, 'loss/train': 2.6800858974456787} -09/20/2021 20:27:29 - INFO - __main__ - Step 27567: {'lr': 0.0001998078454489978, 'samples': 882144, 'steps': 1722, 'loss/train': 1.7404496669769287} -09/20/2021 20:27:30 - INFO - __main__ - Step 27568: {'lr': 0.0001998078454489978, 'samples': 882176, 'steps': 1722, 'loss/train': 2.953263521194458} -09/20/2021 20:27:31 - INFO - __main__ - Step 27569: {'lr': 0.00019980744999287668, 'samples': 882208, 'steps': 1723, 'loss/train': 1.6451154947280884} -09/20/2021 20:27:31 - INFO - __main__ - Step 27570: {'lr': 0.00019980744999287668, 'samples': 882240, 'steps': 1723, 'loss/train': 1.8622410297393799} -09/20/2021 20:27:32 - INFO - __main__ - Step 27571: {'lr': 0.00019980744999287668, 'samples': 882272, 'steps': 1723, 'loss/train': 2.533127784729004} -09/20/2021 20:27:33 - INFO - __main__ - Step 27572: {'lr': 0.00019980744999287668, 'samples': 882304, 'steps': 1723, 'loss/train': 1.701709270477295} -09/20/2021 20:27:34 - INFO - __main__ - Step 27573: {'lr': 0.00019980744999287668, 'samples': 882336, 'steps': 1723, 'loss/train': 2.5079903602600098} -09/20/2021 20:27:35 - INFO - __main__ - Step 27574: {'lr': 0.00019980744999287668, 'samples': 882368, 'steps': 1723, 'loss/train': 2.2905209064483643} -09/20/2021 20:27:36 - INFO - __main__ - Step 27575: {'lr': 0.00019980744999287668, 'samples': 882400, 'steps': 1723, 'loss/train': 2.284107208251953} -09/20/2021 20:27:36 - INFO - __main__ - Step 27576: {'lr': 0.00019980744999287668, 'samples': 882432, 'steps': 1723, 'loss/train': 1.4255547523498535} -09/20/2021 20:27:37 - INFO - __main__ - Step 27577: {'lr': 0.00019980744999287668, 'samples': 882464, 'steps': 1723, 'loss/train': 2.905123233795166} -09/20/2021 20:27:38 - INFO - __main__ - Step 27578: {'lr': 0.00019980744999287668, 'samples': 882496, 'steps': 1723, 'loss/train': 1.5258803367614746} -09/20/2021 20:27:39 - INFO - __main__ - Step 27579: {'lr': 0.00019980744999287668, 'samples': 882528, 'steps': 1723, 'loss/train': 2.302851676940918} -09/20/2021 20:27:39 - INFO - __main__ - Step 27580: {'lr': 0.00019980744999287668, 'samples': 882560, 'steps': 1723, 'loss/train': 2.648763418197632} -09/20/2021 20:27:40 - INFO - __main__ - Step 27581: {'lr': 0.00019980744999287668, 'samples': 882592, 'steps': 1723, 'loss/train': 2.373080253601074} -09/20/2021 20:27:41 - INFO - __main__ - Step 27582: {'lr': 0.00019980744999287668, 'samples': 882624, 'steps': 1723, 'loss/train': 2.225609540939331} -09/20/2021 20:27:42 - INFO - __main__ - Step 27583: {'lr': 0.00019980744999287668, 'samples': 882656, 'steps': 1723, 'loss/train': 2.6832497119903564} -09/20/2021 20:27:42 - INFO - __main__ - Step 27584: {'lr': 0.00019980744999287668, 'samples': 882688, 'steps': 1723, 'loss/train': 2.6297240257263184} -09/20/2021 20:27:43 - INFO - __main__ - Step 27585: {'lr': 0.00019980705413063943, 'samples': 882720, 'steps': 1724, 'loss/train': 3.0633020401000977} -09/20/2021 20:27:44 - INFO - __main__ - Step 27586: {'lr': 0.00019980705413063943, 'samples': 882752, 'steps': 1724, 'loss/train': 2.8427414894104004} -09/20/2021 20:27:45 - INFO - __main__ - Step 27587: {'lr': 0.00019980705413063943, 'samples': 882784, 'steps': 1724, 'loss/train': 2.5917680263519287} -09/20/2021 20:27:46 - INFO - __main__ - Step 27588: {'lr': 0.00019980705413063943, 'samples': 882816, 'steps': 1724, 'loss/train': 5.359700679779053} -09/20/2021 20:27:46 - INFO - __main__ - Step 27589: {'lr': 0.00019980705413063943, 'samples': 882848, 'steps': 1724, 'loss/train': 2.8508212566375732} -09/20/2021 20:27:47 - INFO - __main__ - Step 27590: {'lr': 0.00019980705413063943, 'samples': 882880, 'steps': 1724, 'loss/train': 2.044595956802368} -09/20/2021 20:27:48 - INFO - __main__ - Step 27591: {'lr': 0.00019980705413063943, 'samples': 882912, 'steps': 1724, 'loss/train': 3.214808702468872} -09/20/2021 20:27:49 - INFO - __main__ - Step 27592: {'lr': 0.00019980705413063943, 'samples': 882944, 'steps': 1724, 'loss/train': 1.4518306255340576} -09/20/2021 20:27:49 - INFO - __main__ - Step 27593: {'lr': 0.00019980705413063943, 'samples': 882976, 'steps': 1724, 'loss/train': 2.826462745666504} -09/20/2021 20:27:50 - INFO - __main__ - Step 27594: {'lr': 0.00019980705413063943, 'samples': 883008, 'steps': 1724, 'loss/train': 3.8938632011413574} -09/20/2021 20:27:51 - INFO - __main__ - Step 27595: {'lr': 0.00019980705413063943, 'samples': 883040, 'steps': 1724, 'loss/train': 1.963646650314331} -09/20/2021 20:27:52 - INFO - __main__ - Step 27596: {'lr': 0.00019980705413063943, 'samples': 883072, 'steps': 1724, 'loss/train': 3.0037899017333984} -09/20/2021 20:27:52 - INFO - __main__ - Step 27597: {'lr': 0.00019980705413063943, 'samples': 883104, 'steps': 1724, 'loss/train': 2.9827959537506104} -09/20/2021 20:27:53 - INFO - __main__ - Step 27598: {'lr': 0.00019980705413063943, 'samples': 883136, 'steps': 1724, 'loss/train': 2.1242544651031494} -09/20/2021 20:27:54 - INFO - __main__ - Step 27599: {'lr': 0.00019980705413063943, 'samples': 883168, 'steps': 1724, 'loss/train': 3.599092483520508} -09/20/2021 20:27:55 - INFO - __main__ - Step 27600: {'lr': 0.00019980705413063943, 'samples': 883200, 'steps': 1724, 'loss/train': 2.348365306854248} -09/20/2021 20:27:55 - INFO - __main__ - Step 27601: {'lr': 0.00019980665786228764, 'samples': 883232, 'steps': 1725, 'loss/train': 1.994882583618164} -09/20/2021 20:27:56 - INFO - __main__ - Step 27602: {'lr': 0.00019980665786228764, 'samples': 883264, 'steps': 1725, 'loss/train': 2.317762613296509} -09/20/2021 20:27:57 - INFO - __main__ - Step 27603: {'lr': 0.00019980665786228764, 'samples': 883296, 'steps': 1725, 'loss/train': 2.7458889484405518} -09/20/2021 20:27:58 - INFO - __main__ - Step 27604: {'lr': 0.00019980665786228764, 'samples': 883328, 'steps': 1725, 'loss/train': 2.1308367252349854} -09/20/2021 20:28:00 - INFO - __main__ - Step 27605: {'lr': 0.00019980665786228764, 'samples': 883360, 'steps': 1725, 'loss/train': 2.115403413772583} -09/20/2021 20:28:00 - INFO - __main__ - Step 27606: {'lr': 0.00019980665786228764, 'samples': 883392, 'steps': 1725, 'loss/train': 2.889296770095825} -09/20/2021 20:28:01 - INFO - __main__ - Step 27607: {'lr': 0.00019980665786228764, 'samples': 883424, 'steps': 1725, 'loss/train': 2.8462648391723633} -09/20/2021 20:28:02 - INFO - __main__ - Step 27608: {'lr': 0.00019980665786228764, 'samples': 883456, 'steps': 1725, 'loss/train': 2.7720725536346436} -09/20/2021 20:28:03 - INFO - __main__ - Step 27609: {'lr': 0.00019980665786228764, 'samples': 883488, 'steps': 1725, 'loss/train': 3.830810308456421} -09/20/2021 20:28:03 - INFO - __main__ - Step 27610: {'lr': 0.00019980665786228764, 'samples': 883520, 'steps': 1725, 'loss/train': 2.600175619125366} -09/20/2021 20:28:04 - INFO - __main__ - Step 27611: {'lr': 0.00019980665786228764, 'samples': 883552, 'steps': 1725, 'loss/train': 2.2280054092407227} -09/20/2021 20:28:05 - INFO - __main__ - Step 27612: {'lr': 0.00019980665786228764, 'samples': 883584, 'steps': 1725, 'loss/train': 3.1653382778167725} -09/20/2021 20:28:06 - INFO - __main__ - Step 27613: {'lr': 0.00019980665786228764, 'samples': 883616, 'steps': 1725, 'loss/train': 2.6074821949005127} -09/20/2021 20:28:06 - INFO - __main__ - Step 27614: {'lr': 0.00019980665786228764, 'samples': 883648, 'steps': 1725, 'loss/train': 2.621600389480591} -09/20/2021 20:28:07 - INFO - __main__ - Step 27615: {'lr': 0.00019980665786228764, 'samples': 883680, 'steps': 1725, 'loss/train': 3.5825634002685547} -09/20/2021 20:28:08 - INFO - __main__ - Step 27616: {'lr': 0.00019980665786228764, 'samples': 883712, 'steps': 1725, 'loss/train': 3.4635257720947266} -09/20/2021 20:28:09 - INFO - __main__ - Step 27617: {'lr': 0.000199806261187823, 'samples': 883744, 'steps': 1726, 'loss/train': 2.5788283348083496} -09/20/2021 20:28:09 - INFO - __main__ - Step 27618: {'lr': 0.000199806261187823, 'samples': 883776, 'steps': 1726, 'loss/train': 3.2650015354156494} -09/20/2021 20:28:10 - INFO - __main__ - Step 27619: {'lr': 0.000199806261187823, 'samples': 883808, 'steps': 1726, 'loss/train': 3.4175610542297363} -09/20/2021 20:28:11 - INFO - __main__ - Step 27620: {'lr': 0.000199806261187823, 'samples': 883840, 'steps': 1726, 'loss/train': 3.2541747093200684} -09/20/2021 20:28:12 - INFO - __main__ - Step 27621: {'lr': 0.000199806261187823, 'samples': 883872, 'steps': 1726, 'loss/train': 3.0863943099975586} -09/20/2021 20:28:12 - INFO - __main__ - Step 27622: {'lr': 0.000199806261187823, 'samples': 883904, 'steps': 1726, 'loss/train': 3.4200196266174316} -09/20/2021 20:28:13 - INFO - __main__ - Step 27623: {'lr': 0.000199806261187823, 'samples': 883936, 'steps': 1726, 'loss/train': 3.442808151245117} -09/20/2021 20:28:14 - INFO - __main__ - Step 27624: {'lr': 0.000199806261187823, 'samples': 883968, 'steps': 1726, 'loss/train': 3.384282112121582} -09/20/2021 20:28:15 - INFO - __main__ - Step 27625: {'lr': 0.000199806261187823, 'samples': 884000, 'steps': 1726, 'loss/train': 3.3420562744140625} -09/20/2021 20:28:15 - INFO - __main__ - Step 27626: {'lr': 0.000199806261187823, 'samples': 884032, 'steps': 1726, 'loss/train': 2.7684733867645264} -09/20/2021 20:28:16 - INFO - __main__ - Step 27627: {'lr': 0.000199806261187823, 'samples': 884064, 'steps': 1726, 'loss/train': 3.5358996391296387} -09/20/2021 20:28:17 - INFO - __main__ - Step 27628: {'lr': 0.000199806261187823, 'samples': 884096, 'steps': 1726, 'loss/train': 1.7698513269424438} -09/20/2021 20:28:18 - INFO - __main__ - Step 27629: {'lr': 0.000199806261187823, 'samples': 884128, 'steps': 1726, 'loss/train': 2.735319137573242} -09/20/2021 20:28:18 - INFO - __main__ - Step 27630: {'lr': 0.000199806261187823, 'samples': 884160, 'steps': 1726, 'loss/train': 4.634904861450195} -09/20/2021 20:28:19 - INFO - __main__ - Step 27631: {'lr': 0.000199806261187823, 'samples': 884192, 'steps': 1726, 'loss/train': 2.8469879627227783} -09/20/2021 20:28:20 - INFO - __main__ - Step 27632: {'lr': 0.000199806261187823, 'samples': 884224, 'steps': 1726, 'loss/train': 1.7072447538375854} -09/20/2021 20:28:21 - INFO - __main__ - Step 27633: {'lr': 0.00019980586410724702, 'samples': 884256, 'steps': 1727, 'loss/train': 1.3992598056793213} -09/20/2021 20:28:22 - INFO - __main__ - Step 27634: {'lr': 0.00019980586410724702, 'samples': 884288, 'steps': 1727, 'loss/train': 2.111525774002075} -09/20/2021 20:28:22 - INFO - __main__ - Step 27635: {'lr': 0.00019980586410724702, 'samples': 884320, 'steps': 1727, 'loss/train': 1.7705705165863037} -09/20/2021 20:28:23 - INFO - __main__ - Step 27636: {'lr': 0.00019980586410724702, 'samples': 884352, 'steps': 1727, 'loss/train': 2.2731313705444336} -09/20/2021 20:28:24 - INFO - __main__ - Step 27637: {'lr': 0.00019980586410724702, 'samples': 884384, 'steps': 1727, 'loss/train': 2.0856423377990723} -09/20/2021 20:28:25 - INFO - __main__ - Step 27638: {'lr': 0.00019980586410724702, 'samples': 884416, 'steps': 1727, 'loss/train': 2.0275957584381104} -09/20/2021 20:28:25 - INFO - __main__ - Step 27639: {'lr': 0.00019980586410724702, 'samples': 884448, 'steps': 1727, 'loss/train': 2.455686330795288} -09/20/2021 20:28:26 - INFO - __main__ - Step 27640: {'lr': 0.00019980586410724702, 'samples': 884480, 'steps': 1727, 'loss/train': 3.0559730529785156} -09/20/2021 20:28:27 - INFO - __main__ - Step 27641: {'lr': 0.00019980586410724702, 'samples': 884512, 'steps': 1727, 'loss/train': 2.5723226070404053} -09/20/2021 20:28:28 - INFO - __main__ - Step 27642: {'lr': 0.00019980586410724702, 'samples': 884544, 'steps': 1727, 'loss/train': 2.602908134460449} -09/20/2021 20:28:29 - INFO - __main__ - Step 27643: {'lr': 0.00019980586410724702, 'samples': 884576, 'steps': 1727, 'loss/train': 3.1439931392669678} -09/20/2021 20:28:30 - INFO - __main__ - Step 27644: {'lr': 0.00019980586410724702, 'samples': 884608, 'steps': 1727, 'loss/train': 1.7898845672607422} -09/20/2021 20:28:31 - INFO - __main__ - Step 27645: {'lr': 0.00019980586410724702, 'samples': 884640, 'steps': 1727, 'loss/train': 2.213801383972168} -09/20/2021 20:28:32 - INFO - __main__ - Step 27646: {'lr': 0.00019980586410724702, 'samples': 884672, 'steps': 1727, 'loss/train': 2.7264182567596436} -09/20/2021 20:28:32 - INFO - __main__ - Step 27647: {'lr': 0.00019980586410724702, 'samples': 884704, 'steps': 1727, 'loss/train': 2.7973804473876953} -09/20/2021 20:28:33 - INFO - __main__ - Step 27648: {'lr': 0.00019980586410724702, 'samples': 884736, 'steps': 1727, 'loss/train': 3.233375072479248} -09/20/2021 20:28:34 - INFO - __main__ - Step 27649: {'lr': 0.0001998054666205614, 'samples': 884768, 'steps': 1728, 'loss/train': 2.981635093688965} -09/20/2021 20:28:35 - INFO - __main__ - Step 27650: {'lr': 0.0001998054666205614, 'samples': 884800, 'steps': 1728, 'loss/train': 2.854053497314453} -09/20/2021 20:28:36 - INFO - __main__ - Step 27651: {'lr': 0.0001998054666205614, 'samples': 884832, 'steps': 1728, 'loss/train': 2.7896344661712646} -09/20/2021 20:28:36 - INFO - __main__ - Step 27652: {'lr': 0.0001998054666205614, 'samples': 884864, 'steps': 1728, 'loss/train': 2.4094998836517334} -09/20/2021 20:28:37 - INFO - __main__ - Step 27653: {'lr': 0.0001998054666205614, 'samples': 884896, 'steps': 1728, 'loss/train': 2.7809951305389404} -09/20/2021 20:28:38 - INFO - __main__ - Step 27654: {'lr': 0.0001998054666205614, 'samples': 884928, 'steps': 1728, 'loss/train': 1.764034628868103} -09/20/2021 20:28:39 - INFO - __main__ - Step 27655: {'lr': 0.0001998054666205614, 'samples': 884960, 'steps': 1728, 'loss/train': 2.699500322341919} -09/20/2021 20:28:39 - INFO - __main__ - Step 27656: {'lr': 0.0001998054666205614, 'samples': 884992, 'steps': 1728, 'loss/train': 2.355893611907959} -09/20/2021 20:28:40 - INFO - __main__ - Step 27657: {'lr': 0.0001998054666205614, 'samples': 885024, 'steps': 1728, 'loss/train': 2.563345432281494} -09/20/2021 20:28:41 - INFO - __main__ - Step 27658: {'lr': 0.0001998054666205614, 'samples': 885056, 'steps': 1728, 'loss/train': 2.504776954650879} -09/20/2021 20:28:42 - INFO - __main__ - Step 27659: {'lr': 0.0001998054666205614, 'samples': 885088, 'steps': 1728, 'loss/train': 2.0857889652252197} -09/20/2021 20:28:42 - INFO - __main__ - Step 27660: {'lr': 0.0001998054666205614, 'samples': 885120, 'steps': 1728, 'loss/train': 4.297728061676025} -09/20/2021 20:28:43 - INFO - __main__ - Step 27661: {'lr': 0.0001998054666205614, 'samples': 885152, 'steps': 1728, 'loss/train': 2.2990121841430664} -09/20/2021 20:28:44 - INFO - __main__ - Step 27662: {'lr': 0.0001998054666205614, 'samples': 885184, 'steps': 1728, 'loss/train': 2.016998052597046} -09/20/2021 20:28:45 - INFO - __main__ - Step 27663: {'lr': 0.0001998054666205614, 'samples': 885216, 'steps': 1728, 'loss/train': 2.647614002227783} -09/20/2021 20:28:45 - INFO - __main__ - Step 27664: {'lr': 0.0001998054666205614, 'samples': 885248, 'steps': 1728, 'loss/train': 1.9574686288833618} -09/20/2021 20:28:46 - INFO - __main__ - Step 27665: {'lr': 0.00019980506872776773, 'samples': 885280, 'steps': 1729, 'loss/train': 2.6970276832580566} -09/20/2021 20:28:47 - INFO - __main__ - Step 27666: {'lr': 0.00019980506872776773, 'samples': 885312, 'steps': 1729, 'loss/train': 2.7151200771331787} -09/20/2021 20:28:48 - INFO - __main__ - Step 27667: {'lr': 0.00019980506872776773, 'samples': 885344, 'steps': 1729, 'loss/train': 1.6287287473678589} -09/20/2021 20:28:48 - INFO - __main__ - Step 27668: {'lr': 0.00019980506872776773, 'samples': 885376, 'steps': 1729, 'loss/train': 3.630676746368408} -09/20/2021 20:28:49 - INFO - __main__ - Step 27669: {'lr': 0.00019980506872776773, 'samples': 885408, 'steps': 1729, 'loss/train': 2.097261428833008} -09/20/2021 20:28:50 - INFO - __main__ - Step 27670: {'lr': 0.00019980506872776773, 'samples': 885440, 'steps': 1729, 'loss/train': 9.108383178710938} -09/20/2021 20:28:51 - INFO - __main__ - Step 27671: {'lr': 0.00019980506872776773, 'samples': 885472, 'steps': 1729, 'loss/train': 3.1353187561035156} -09/20/2021 20:28:51 - INFO - __main__ - Step 27672: {'lr': 0.00019980506872776773, 'samples': 885504, 'steps': 1729, 'loss/train': 3.190915822982788} -09/20/2021 20:28:52 - INFO - __main__ - Step 27673: {'lr': 0.00019980506872776773, 'samples': 885536, 'steps': 1729, 'loss/train': 1.837921142578125} -09/20/2021 20:28:53 - INFO - __main__ - Step 27674: {'lr': 0.00019980506872776773, 'samples': 885568, 'steps': 1729, 'loss/train': 3.4347832202911377} -09/20/2021 20:28:54 - INFO - __main__ - Step 27675: {'lr': 0.00019980506872776773, 'samples': 885600, 'steps': 1729, 'loss/train': 3.0106592178344727} -09/20/2021 20:28:55 - INFO - __main__ - Step 27676: {'lr': 0.00019980506872776773, 'samples': 885632, 'steps': 1729, 'loss/train': 3.21760630607605} -09/20/2021 20:28:56 - INFO - __main__ - Step 27677: {'lr': 0.00019980506872776773, 'samples': 885664, 'steps': 1729, 'loss/train': 2.8806591033935547} -09/20/2021 20:28:57 - INFO - __main__ - Step 27678: {'lr': 0.00019980506872776773, 'samples': 885696, 'steps': 1729, 'loss/train': 2.64339280128479} -09/20/2021 20:28:57 - INFO - __main__ - Step 27679: {'lr': 0.00019980506872776773, 'samples': 885728, 'steps': 1729, 'loss/train': 4.166584014892578} -09/20/2021 20:28:58 - INFO - __main__ - Step 27680: {'lr': 0.00019980506872776773, 'samples': 885760, 'steps': 1729, 'loss/train': 2.109304428100586} -09/20/2021 20:28:59 - INFO - __main__ - Step 27681: {'lr': 0.0001998046704288676, 'samples': 885792, 'steps': 1730, 'loss/train': 1.8911939859390259} -09/20/2021 20:29:00 - INFO - __main__ - Step 27682: {'lr': 0.0001998046704288676, 'samples': 885824, 'steps': 1730, 'loss/train': 2.8168416023254395} -09/20/2021 20:29:00 - INFO - __main__ - Step 27683: {'lr': 0.0001998046704288676, 'samples': 885856, 'steps': 1730, 'loss/train': 2.835642099380493} -09/20/2021 20:29:01 - INFO - __main__ - Step 27684: {'lr': 0.0001998046704288676, 'samples': 885888, 'steps': 1730, 'loss/train': 2.595592737197876} -09/20/2021 20:29:02 - INFO - __main__ - Step 27685: {'lr': 0.0001998046704288676, 'samples': 885920, 'steps': 1730, 'loss/train': 2.235761880874634} -09/20/2021 20:29:03 - INFO - __main__ - Step 27686: {'lr': 0.0001998046704288676, 'samples': 885952, 'steps': 1730, 'loss/train': 2.4449076652526855} -09/20/2021 20:29:03 - INFO - __main__ - Step 27687: {'lr': 0.0001998046704288676, 'samples': 885984, 'steps': 1730, 'loss/train': 2.827946186065674} -09/20/2021 20:29:04 - INFO - __main__ - Step 27688: {'lr': 0.0001998046704288676, 'samples': 886016, 'steps': 1730, 'loss/train': 2.0481739044189453} -09/20/2021 20:29:05 - INFO - __main__ - Step 27689: {'lr': 0.0001998046704288676, 'samples': 886048, 'steps': 1730, 'loss/train': 3.3582091331481934} -09/20/2021 20:29:06 - INFO - __main__ - Step 27690: {'lr': 0.0001998046704288676, 'samples': 886080, 'steps': 1730, 'loss/train': 2.670424222946167} -09/20/2021 20:29:06 - INFO - __main__ - Step 27691: {'lr': 0.0001998046704288676, 'samples': 886112, 'steps': 1730, 'loss/train': 3.158456563949585} -09/20/2021 20:29:07 - INFO - __main__ - Step 27692: {'lr': 0.0001998046704288676, 'samples': 886144, 'steps': 1730, 'loss/train': 2.48738169670105} -09/20/2021 20:29:08 - INFO - __main__ - Step 27693: {'lr': 0.0001998046704288676, 'samples': 886176, 'steps': 1730, 'loss/train': 2.4543232917785645} -09/20/2021 20:29:09 - INFO - __main__ - Step 27694: {'lr': 0.0001998046704288676, 'samples': 886208, 'steps': 1730, 'loss/train': 1.7729988098144531} -09/20/2021 20:29:09 - INFO - __main__ - Step 27695: {'lr': 0.0001998046704288676, 'samples': 886240, 'steps': 1730, 'loss/train': 3.0500447750091553} -09/20/2021 20:29:10 - INFO - __main__ - Step 27696: {'lr': 0.0001998046704288676, 'samples': 886272, 'steps': 1730, 'loss/train': 2.927621603012085} -09/20/2021 20:29:11 - INFO - __main__ - Step 27697: {'lr': 0.00019980427172386264, 'samples': 886304, 'steps': 1731, 'loss/train': 2.99658203125} -09/20/2021 20:29:12 - INFO - __main__ - Step 27698: {'lr': 0.00019980427172386264, 'samples': 886336, 'steps': 1731, 'loss/train': 2.955624580383301} -09/20/2021 20:29:13 - INFO - __main__ - Step 27699: {'lr': 0.00019980427172386264, 'samples': 886368, 'steps': 1731, 'loss/train': 2.52154803276062} -09/20/2021 20:29:13 - INFO - __main__ - Step 27700: {'lr': 0.00019980427172386264, 'samples': 886400, 'steps': 1731, 'loss/train': 2.8908956050872803} -09/20/2021 20:29:14 - INFO - __main__ - Step 27701: {'lr': 0.00019980427172386264, 'samples': 886432, 'steps': 1731, 'loss/train': 3.053846836090088} -09/20/2021 20:29:15 - INFO - __main__ - Step 27702: {'lr': 0.00019980427172386264, 'samples': 886464, 'steps': 1731, 'loss/train': 2.1123435497283936} -09/20/2021 20:29:16 - INFO - __main__ - Step 27703: {'lr': 0.00019980427172386264, 'samples': 886496, 'steps': 1731, 'loss/train': 2.0888867378234863} -09/20/2021 20:29:16 - INFO - __main__ - Step 27704: {'lr': 0.00019980427172386264, 'samples': 886528, 'steps': 1731, 'loss/train': 0.7350143194198608} -09/20/2021 20:29:17 - INFO - __main__ - Step 27705: {'lr': 0.00019980427172386264, 'samples': 886560, 'steps': 1731, 'loss/train': 2.0399670600891113} -09/20/2021 20:29:18 - INFO - __main__ - Step 27706: {'lr': 0.00019980427172386264, 'samples': 886592, 'steps': 1731, 'loss/train': 1.961281418800354} -09/20/2021 20:29:19 - INFO - __main__ - Step 27707: {'lr': 0.00019980427172386264, 'samples': 886624, 'steps': 1731, 'loss/train': 1.0539271831512451} -09/20/2021 20:29:20 - INFO - __main__ - Step 27708: {'lr': 0.00019980427172386264, 'samples': 886656, 'steps': 1731, 'loss/train': 2.333949565887451} -09/20/2021 20:29:21 - INFO - __main__ - Step 27709: {'lr': 0.00019980427172386264, 'samples': 886688, 'steps': 1731, 'loss/train': 1.554529070854187} -09/20/2021 20:29:21 - INFO - __main__ - Step 27710: {'lr': 0.00019980427172386264, 'samples': 886720, 'steps': 1731, 'loss/train': 2.463787317276001} -09/20/2021 20:29:22 - INFO - __main__ - Step 27711: {'lr': 0.00019980427172386264, 'samples': 886752, 'steps': 1731, 'loss/train': 1.387638807296753} -09/20/2021 20:29:23 - INFO - __main__ - Step 27712: {'lr': 0.00019980427172386264, 'samples': 886784, 'steps': 1731, 'loss/train': 3.219444990158081} -09/20/2021 20:29:24 - INFO - __main__ - Step 27713: {'lr': 0.0001998038726127545, 'samples': 886816, 'steps': 1732, 'loss/train': 2.93569016456604} -09/20/2021 20:29:25 - INFO - __main__ - Step 27714: {'lr': 0.0001998038726127545, 'samples': 886848, 'steps': 1732, 'loss/train': 2.821859121322632} -09/20/2021 20:29:25 - INFO - __main__ - Step 27715: {'lr': 0.0001998038726127545, 'samples': 886880, 'steps': 1732, 'loss/train': 3.2214338779449463} -09/20/2021 20:29:26 - INFO - __main__ - Step 27716: {'lr': 0.0001998038726127545, 'samples': 886912, 'steps': 1732, 'loss/train': 2.6663079261779785} -09/20/2021 20:29:27 - INFO - __main__ - Step 27717: {'lr': 0.0001998038726127545, 'samples': 886944, 'steps': 1732, 'loss/train': 3.4141459465026855} -09/20/2021 20:29:28 - INFO - __main__ - Step 27718: {'lr': 0.0001998038726127545, 'samples': 886976, 'steps': 1732, 'loss/train': 3.7252132892608643} -09/20/2021 20:29:28 - INFO - __main__ - Step 27719: {'lr': 0.0001998038726127545, 'samples': 887008, 'steps': 1732, 'loss/train': 2.644113779067993} -09/20/2021 20:29:29 - INFO - __main__ - Step 27720: {'lr': 0.0001998038726127545, 'samples': 887040, 'steps': 1732, 'loss/train': 2.335972547531128} -09/20/2021 20:29:30 - INFO - __main__ - Step 27721: {'lr': 0.0001998038726127545, 'samples': 887072, 'steps': 1732, 'loss/train': 1.8691775798797607} -09/20/2021 20:29:31 - INFO - __main__ - Step 27722: {'lr': 0.0001998038726127545, 'samples': 887104, 'steps': 1732, 'loss/train': 2.487840414047241} -09/20/2021 20:29:31 - INFO - __main__ - Step 27723: {'lr': 0.0001998038726127545, 'samples': 887136, 'steps': 1732, 'loss/train': 3.0541532039642334} -09/20/2021 20:29:32 - INFO - __main__ - Step 27724: {'lr': 0.0001998038726127545, 'samples': 887168, 'steps': 1732, 'loss/train': 0.8146301507949829} -09/20/2021 20:29:33 - INFO - __main__ - Step 27725: {'lr': 0.0001998038726127545, 'samples': 887200, 'steps': 1732, 'loss/train': 2.4920663833618164} -09/20/2021 20:29:34 - INFO - __main__ - Step 27726: {'lr': 0.0001998038726127545, 'samples': 887232, 'steps': 1732, 'loss/train': 2.931216239929199} -09/20/2021 20:29:34 - INFO - __main__ - Step 27727: {'lr': 0.0001998038726127545, 'samples': 887264, 'steps': 1732, 'loss/train': 2.434234380722046} -09/20/2021 20:29:35 - INFO - __main__ - Step 27728: {'lr': 0.0001998038726127545, 'samples': 887296, 'steps': 1732, 'loss/train': 3.0315299034118652} -09/20/2021 20:29:36 - INFO - __main__ - Step 27729: {'lr': 0.00019980347309554478, 'samples': 887328, 'steps': 1733, 'loss/train': 2.4998507499694824} -09/20/2021 20:29:37 - INFO - __main__ - Step 27730: {'lr': 0.00019980347309554478, 'samples': 887360, 'steps': 1733, 'loss/train': 2.011986494064331} -09/20/2021 20:29:37 - INFO - __main__ - Step 27731: {'lr': 0.00019980347309554478, 'samples': 887392, 'steps': 1733, 'loss/train': 2.81091046333313} -09/20/2021 20:29:38 - INFO - __main__ - Step 27732: {'lr': 0.00019980347309554478, 'samples': 887424, 'steps': 1733, 'loss/train': 2.6356093883514404} -09/20/2021 20:29:39 - INFO - __main__ - Step 27733: {'lr': 0.00019980347309554478, 'samples': 887456, 'steps': 1733, 'loss/train': 2.6369307041168213} -09/20/2021 20:29:40 - INFO - __main__ - Step 27734: {'lr': 0.00019980347309554478, 'samples': 887488, 'steps': 1733, 'loss/train': 3.5686159133911133} -09/20/2021 20:29:40 - INFO - __main__ - Step 27735: {'lr': 0.00019980347309554478, 'samples': 887520, 'steps': 1733, 'loss/train': 3.627720832824707} -09/20/2021 20:29:41 - INFO - __main__ - Step 27736: {'lr': 0.00019980347309554478, 'samples': 887552, 'steps': 1733, 'loss/train': 2.5645055770874023} -09/20/2021 20:29:43 - INFO - __main__ - Step 27737: {'lr': 0.00019980347309554478, 'samples': 887584, 'steps': 1733, 'loss/train': 2.7715375423431396} -09/20/2021 20:29:44 - INFO - __main__ - Step 27738: {'lr': 0.00019980347309554478, 'samples': 887616, 'steps': 1733, 'loss/train': 2.7169249057769775} -09/20/2021 20:29:44 - INFO - __main__ - Step 27739: {'lr': 0.00019980347309554478, 'samples': 887648, 'steps': 1733, 'loss/train': 1.0212318897247314} -09/20/2021 20:29:45 - INFO - __main__ - Step 27740: {'lr': 0.00019980347309554478, 'samples': 887680, 'steps': 1733, 'loss/train': 1.5788910388946533} -09/20/2021 20:29:46 - INFO - __main__ - Step 27741: {'lr': 0.00019980347309554478, 'samples': 887712, 'steps': 1733, 'loss/train': 3.132303237915039} -09/20/2021 20:29:47 - INFO - __main__ - Step 27742: {'lr': 0.00019980347309554478, 'samples': 887744, 'steps': 1733, 'loss/train': 2.6241698265075684} -09/20/2021 20:29:47 - INFO - __main__ - Step 27743: {'lr': 0.00019980347309554478, 'samples': 887776, 'steps': 1733, 'loss/train': 1.690719485282898} -09/20/2021 20:29:48 - INFO - __main__ - Step 27744: {'lr': 0.00019980347309554478, 'samples': 887808, 'steps': 1733, 'loss/train': 1.9264051914215088} -09/20/2021 20:29:49 - INFO - __main__ - Step 27745: {'lr': 0.00019980307317223511, 'samples': 887840, 'steps': 1734, 'loss/train': 2.2750132083892822} -09/20/2021 20:29:50 - INFO - __main__ - Step 27746: {'lr': 0.00019980307317223511, 'samples': 887872, 'steps': 1734, 'loss/train': 2.3192479610443115} -09/20/2021 20:29:50 - INFO - __main__ - Step 27747: {'lr': 0.00019980307317223511, 'samples': 887904, 'steps': 1734, 'loss/train': 0.6404913663864136} -09/20/2021 20:29:51 - INFO - __main__ - Step 27748: {'lr': 0.00019980307317223511, 'samples': 887936, 'steps': 1734, 'loss/train': 2.784801959991455} -09/20/2021 20:29:52 - INFO - __main__ - Step 27749: {'lr': 0.00019980307317223511, 'samples': 887968, 'steps': 1734, 'loss/train': 2.452094078063965} -09/20/2021 20:29:53 - INFO - __main__ - Step 27750: {'lr': 0.00019980307317223511, 'samples': 888000, 'steps': 1734, 'loss/train': 3.049114227294922} -09/20/2021 20:29:53 - INFO - __main__ - Step 27751: {'lr': 0.00019980307317223511, 'samples': 888032, 'steps': 1734, 'loss/train': 2.3238625526428223} -09/20/2021 20:29:54 - INFO - __main__ - Step 27752: {'lr': 0.00019980307317223511, 'samples': 888064, 'steps': 1734, 'loss/train': 2.3123481273651123} -09/20/2021 20:29:55 - INFO - __main__ - Step 27753: {'lr': 0.00019980307317223511, 'samples': 888096, 'steps': 1734, 'loss/train': 2.7510037422180176} -09/20/2021 20:29:56 - INFO - __main__ - Step 27754: {'lr': 0.00019980307317223511, 'samples': 888128, 'steps': 1734, 'loss/train': 2.471644639968872} -09/20/2021 20:29:56 - INFO - __main__ - Step 27755: {'lr': 0.00019980307317223511, 'samples': 888160, 'steps': 1734, 'loss/train': 0.46484893560409546} -09/20/2021 20:29:57 - INFO - __main__ - Step 27756: {'lr': 0.00019980307317223511, 'samples': 888192, 'steps': 1734, 'loss/train': 0.3611500561237335} -09/20/2021 20:29:58 - INFO - __main__ - Step 27757: {'lr': 0.00019980307317223511, 'samples': 888224, 'steps': 1734, 'loss/train': 0.4917001724243164} -09/20/2021 20:29:59 - INFO - __main__ - Step 27758: {'lr': 0.00019980307317223511, 'samples': 888256, 'steps': 1734, 'loss/train': 0.3839399516582489} -09/20/2021 20:29:59 - INFO - __main__ - Step 27759: {'lr': 0.00019980307317223511, 'samples': 888288, 'steps': 1734, 'loss/train': 0.5904985070228577} -09/20/2021 20:30:00 - INFO - __main__ - Step 27760: {'lr': 0.00019980307317223511, 'samples': 888320, 'steps': 1734, 'loss/train': 2.4175825119018555} -09/20/2021 20:30:01 - INFO - __main__ - Step 27761: {'lr': 0.00019980267284282717, 'samples': 888352, 'steps': 1735, 'loss/train': 2.628603219985962} -09/20/2021 20:30:02 - INFO - __main__ - Step 27762: {'lr': 0.00019980267284282717, 'samples': 888384, 'steps': 1735, 'loss/train': 3.7539050579071045} -09/20/2021 20:30:03 - INFO - __main__ - Step 27763: {'lr': 0.00019980267284282717, 'samples': 888416, 'steps': 1735, 'loss/train': 2.9478442668914795} -09/20/2021 20:30:03 - INFO - __main__ - Step 27764: {'lr': 0.00019980267284282717, 'samples': 888448, 'steps': 1735, 'loss/train': 2.2832157611846924} -09/20/2021 20:30:04 - INFO - __main__ - Step 27765: {'lr': 0.00019980267284282717, 'samples': 888480, 'steps': 1735, 'loss/train': 2.5581891536712646} -09/20/2021 20:30:05 - INFO - __main__ - Step 27766: {'lr': 0.00019980267284282717, 'samples': 888512, 'steps': 1735, 'loss/train': 2.684445858001709} -09/20/2021 20:30:06 - INFO - __main__ - Step 27767: {'lr': 0.00019980267284282717, 'samples': 888544, 'steps': 1735, 'loss/train': 3.2414777278900146} -09/20/2021 20:30:07 - INFO - __main__ - Step 27768: {'lr': 0.00019980267284282717, 'samples': 888576, 'steps': 1735, 'loss/train': 2.482184886932373} -09/20/2021 20:30:08 - INFO - __main__ - Step 27769: {'lr': 0.00019980267284282717, 'samples': 888608, 'steps': 1735, 'loss/train': 3.263150930404663} -09/20/2021 20:30:08 - INFO - __main__ - Step 27770: {'lr': 0.00019980267284282717, 'samples': 888640, 'steps': 1735, 'loss/train': 3.977440118789673} -09/20/2021 20:30:09 - INFO - __main__ - Step 27771: {'lr': 0.00019980267284282717, 'samples': 888672, 'steps': 1735, 'loss/train': 2.53584623336792} -09/20/2021 20:30:10 - INFO - __main__ - Step 27772: {'lr': 0.00019980267284282717, 'samples': 888704, 'steps': 1735, 'loss/train': 2.5301172733306885} -09/20/2021 20:30:11 - INFO - __main__ - Step 27773: {'lr': 0.00019980267284282717, 'samples': 888736, 'steps': 1735, 'loss/train': 2.9989516735076904} -09/20/2021 20:30:11 - INFO - __main__ - Step 27774: {'lr': 0.00019980267284282717, 'samples': 888768, 'steps': 1735, 'loss/train': 2.528653860092163} -09/20/2021 20:30:12 - INFO - __main__ - Step 27775: {'lr': 0.00019980267284282717, 'samples': 888800, 'steps': 1735, 'loss/train': 2.1390297412872314} -09/20/2021 20:30:13 - INFO - __main__ - Step 27776: {'lr': 0.00019980267284282717, 'samples': 888832, 'steps': 1735, 'loss/train': 3.0724728107452393} -09/20/2021 20:30:14 - INFO - __main__ - Step 27777: {'lr': 0.0001998022721073225, 'samples': 888864, 'steps': 1736, 'loss/train': 2.8529269695281982} -09/20/2021 20:30:15 - INFO - __main__ - Step 27778: {'lr': 0.0001998022721073225, 'samples': 888896, 'steps': 1736, 'loss/train': 2.5107173919677734} -09/20/2021 20:30:15 - INFO - __main__ - Step 27779: {'lr': 0.0001998022721073225, 'samples': 888928, 'steps': 1736, 'loss/train': 4.225265979766846} -09/20/2021 20:30:16 - INFO - __main__ - Step 27780: {'lr': 0.0001998022721073225, 'samples': 888960, 'steps': 1736, 'loss/train': 2.365288019180298} -09/20/2021 20:30:17 - INFO - __main__ - Step 27781: {'lr': 0.0001998022721073225, 'samples': 888992, 'steps': 1736, 'loss/train': 1.7204735279083252} -09/20/2021 20:30:18 - INFO - __main__ - Step 27782: {'lr': 0.0001998022721073225, 'samples': 889024, 'steps': 1736, 'loss/train': 1.92604660987854} -09/20/2021 20:30:18 - INFO - __main__ - Step 27783: {'lr': 0.0001998022721073225, 'samples': 889056, 'steps': 1736, 'loss/train': 2.4574267864227295} -09/20/2021 20:30:19 - INFO - __main__ - Step 27784: {'lr': 0.0001998022721073225, 'samples': 889088, 'steps': 1736, 'loss/train': 3.5862395763397217} -09/20/2021 20:30:20 - INFO - __main__ - Step 27785: {'lr': 0.0001998022721073225, 'samples': 889120, 'steps': 1736, 'loss/train': 2.9425976276397705} -09/20/2021 20:30:21 - INFO - __main__ - Step 27786: {'lr': 0.0001998022721073225, 'samples': 889152, 'steps': 1736, 'loss/train': 3.346203088760376} -09/20/2021 20:30:21 - INFO - __main__ - Step 27787: {'lr': 0.0001998022721073225, 'samples': 889184, 'steps': 1736, 'loss/train': 1.9156932830810547} -09/20/2021 20:30:22 - INFO - __main__ - Step 27788: {'lr': 0.0001998022721073225, 'samples': 889216, 'steps': 1736, 'loss/train': 3.1993908882141113} -09/20/2021 20:30:23 - INFO - __main__ - Step 27789: {'lr': 0.0001998022721073225, 'samples': 889248, 'steps': 1736, 'loss/train': 2.8492071628570557} -09/20/2021 20:30:24 - INFO - __main__ - Step 27790: {'lr': 0.0001998022721073225, 'samples': 889280, 'steps': 1736, 'loss/train': 2.181053638458252} -09/20/2021 20:30:24 - INFO - __main__ - Step 27791: {'lr': 0.0001998022721073225, 'samples': 889312, 'steps': 1736, 'loss/train': 2.4584145545959473} -09/20/2021 20:30:25 - INFO - __main__ - Step 27792: {'lr': 0.0001998022721073225, 'samples': 889344, 'steps': 1736, 'loss/train': 2.6243040561676025} -09/20/2021 20:30:26 - INFO - __main__ - Step 27793: {'lr': 0.00019980187096572277, 'samples': 889376, 'steps': 1737, 'loss/train': 2.3692240715026855} -09/20/2021 20:30:27 - INFO - __main__ - Step 27794: {'lr': 0.00019980187096572277, 'samples': 889408, 'steps': 1737, 'loss/train': 3.820424795150757} -09/20/2021 20:30:27 - INFO - __main__ - Step 27795: {'lr': 0.00019980187096572277, 'samples': 889440, 'steps': 1737, 'loss/train': 3.087045192718506} -09/20/2021 20:30:28 - INFO - __main__ - Step 27796: {'lr': 0.00019980187096572277, 'samples': 889472, 'steps': 1737, 'loss/train': 2.8228490352630615} -09/20/2021 20:30:29 - INFO - __main__ - Step 27797: {'lr': 0.00019980187096572277, 'samples': 889504, 'steps': 1737, 'loss/train': 3.412393808364868} -09/20/2021 20:30:30 - INFO - __main__ - Step 27798: {'lr': 0.00019980187096572277, 'samples': 889536, 'steps': 1737, 'loss/train': 1.2418442964553833} -09/20/2021 20:30:30 - INFO - __main__ - Step 27799: {'lr': 0.00019980187096572277, 'samples': 889568, 'steps': 1737, 'loss/train': 3.444979667663574} -09/20/2021 20:30:32 - INFO - __main__ - Step 27800: {'lr': 0.00019980187096572277, 'samples': 889600, 'steps': 1737, 'loss/train': 3.143648862838745} -09/20/2021 20:30:32 - INFO - __main__ - Step 27801: {'lr': 0.00019980187096572277, 'samples': 889632, 'steps': 1737, 'loss/train': 3.2899398803710938} -09/20/2021 20:30:33 - INFO - __main__ - Step 27802: {'lr': 0.00019980187096572277, 'samples': 889664, 'steps': 1737, 'loss/train': 2.9898762702941895} -09/20/2021 20:30:34 - INFO - __main__ - Step 27803: {'lr': 0.00019980187096572277, 'samples': 889696, 'steps': 1737, 'loss/train': 2.192835569381714} -09/20/2021 20:30:35 - INFO - __main__ - Step 27804: {'lr': 0.00019980187096572277, 'samples': 889728, 'steps': 1737, 'loss/train': 4.1201863288879395} -09/20/2021 20:30:35 - INFO - __main__ - Step 27805: {'lr': 0.00019980187096572277, 'samples': 889760, 'steps': 1737, 'loss/train': 2.517284393310547} -09/20/2021 20:30:36 - INFO - __main__ - Step 27806: {'lr': 0.00019980187096572277, 'samples': 889792, 'steps': 1737, 'loss/train': 2.7389187812805176} -09/20/2021 20:30:37 - INFO - __main__ - Step 27807: {'lr': 0.00019980187096572277, 'samples': 889824, 'steps': 1737, 'loss/train': 2.965000629425049} -09/20/2021 20:30:38 - INFO - __main__ - Step 27808: {'lr': 0.00019980187096572277, 'samples': 889856, 'steps': 1737, 'loss/train': 2.621912717819214} -09/20/2021 20:30:39 - INFO - __main__ - Step 27809: {'lr': 0.00019980146941802964, 'samples': 889888, 'steps': 1738, 'loss/train': 2.2675628662109375} -09/20/2021 20:30:39 - INFO - __main__ - Step 27810: {'lr': 0.00019980146941802964, 'samples': 889920, 'steps': 1738, 'loss/train': 2.5053977966308594} -09/20/2021 20:30:40 - INFO - __main__ - Step 27811: {'lr': 0.00019980146941802964, 'samples': 889952, 'steps': 1738, 'loss/train': 3.0822174549102783} -09/20/2021 20:30:41 - INFO - __main__ - Step 27812: {'lr': 0.00019980146941802964, 'samples': 889984, 'steps': 1738, 'loss/train': 1.9711449146270752} -09/20/2021 20:30:42 - INFO - __main__ - Step 27813: {'lr': 0.00019980146941802964, 'samples': 890016, 'steps': 1738, 'loss/train': 2.2380142211914062} -09/20/2021 20:30:42 - INFO - __main__ - Step 27814: {'lr': 0.00019980146941802964, 'samples': 890048, 'steps': 1738, 'loss/train': 2.410938024520874} -09/20/2021 20:30:43 - INFO - __main__ - Step 27815: {'lr': 0.00019980146941802964, 'samples': 890080, 'steps': 1738, 'loss/train': 2.3320178985595703} -09/20/2021 20:30:44 - INFO - __main__ - Step 27816: {'lr': 0.00019980146941802964, 'samples': 890112, 'steps': 1738, 'loss/train': 3.8321967124938965} -09/20/2021 20:30:45 - INFO - __main__ - Step 27817: {'lr': 0.00019980146941802964, 'samples': 890144, 'steps': 1738, 'loss/train': 3.0435285568237305} -09/20/2021 20:30:45 - INFO - __main__ - Step 27818: {'lr': 0.00019980146941802964, 'samples': 890176, 'steps': 1738, 'loss/train': 2.872526168823242} -09/20/2021 20:30:46 - INFO - __main__ - Step 27819: {'lr': 0.00019980146941802964, 'samples': 890208, 'steps': 1738, 'loss/train': 2.5482585430145264} -09/20/2021 20:30:47 - INFO - __main__ - Step 27820: {'lr': 0.00019980146941802964, 'samples': 890240, 'steps': 1738, 'loss/train': 2.3957760334014893} -09/20/2021 20:30:48 - INFO - __main__ - Step 27821: {'lr': 0.00019980146941802964, 'samples': 890272, 'steps': 1738, 'loss/train': 2.2377285957336426} -09/20/2021 20:30:48 - INFO - __main__ - Step 27822: {'lr': 0.00019980146941802964, 'samples': 890304, 'steps': 1738, 'loss/train': 1.945857048034668} -09/20/2021 20:30:49 - INFO - __main__ - Step 27823: {'lr': 0.00019980146941802964, 'samples': 890336, 'steps': 1738, 'loss/train': 2.4884674549102783} -09/20/2021 20:30:50 - INFO - __main__ - Step 27824: {'lr': 0.00019980146941802964, 'samples': 890368, 'steps': 1738, 'loss/train': 1.958808183670044} -09/20/2021 20:30:51 - INFO - __main__ - Step 27825: {'lr': 0.00019980106746424471, 'samples': 890400, 'steps': 1739, 'loss/train': 1.7533812522888184} -09/20/2021 20:30:51 - INFO - __main__ - Step 27826: {'lr': 0.00019980106746424471, 'samples': 890432, 'steps': 1739, 'loss/train': 2.0820722579956055} -09/20/2021 20:30:52 - INFO - __main__ - Step 27827: {'lr': 0.00019980106746424471, 'samples': 890464, 'steps': 1739, 'loss/train': 2.453000783920288} -09/20/2021 20:30:53 - INFO - __main__ - Step 27828: {'lr': 0.00019980106746424471, 'samples': 890496, 'steps': 1739, 'loss/train': 3.028701066970825} -09/20/2021 20:30:54 - INFO - __main__ - Step 27829: {'lr': 0.00019980106746424471, 'samples': 890528, 'steps': 1739, 'loss/train': 2.964245319366455} -09/20/2021 20:30:54 - INFO - __main__ - Step 27830: {'lr': 0.00019980106746424471, 'samples': 890560, 'steps': 1739, 'loss/train': 2.1614716053009033} -09/20/2021 20:30:56 - INFO - __main__ - Step 27831: {'lr': 0.00019980106746424471, 'samples': 890592, 'steps': 1739, 'loss/train': 2.1114394664764404} -09/20/2021 20:30:57 - INFO - __main__ - Step 27832: {'lr': 0.00019980106746424471, 'samples': 890624, 'steps': 1739, 'loss/train': 2.3658554553985596} -09/20/2021 20:30:57 - INFO - __main__ - Step 27833: {'lr': 0.00019980106746424471, 'samples': 890656, 'steps': 1739, 'loss/train': 1.9276565313339233} -09/20/2021 20:30:58 - INFO - __main__ - Step 27834: {'lr': 0.00019980106746424471, 'samples': 890688, 'steps': 1739, 'loss/train': 3.1237101554870605} -09/20/2021 20:30:59 - INFO - __main__ - Step 27835: {'lr': 0.00019980106746424471, 'samples': 890720, 'steps': 1739, 'loss/train': 2.881577730178833} -09/20/2021 20:31:00 - INFO - __main__ - Step 27836: {'lr': 0.00019980106746424471, 'samples': 890752, 'steps': 1739, 'loss/train': 2.603299140930176} -09/20/2021 20:31:00 - INFO - __main__ - Step 27837: {'lr': 0.00019980106746424471, 'samples': 890784, 'steps': 1739, 'loss/train': 2.595541477203369} -09/20/2021 20:31:01 - INFO - __main__ - Step 27838: {'lr': 0.00019980106746424471, 'samples': 890816, 'steps': 1739, 'loss/train': 3.1725404262542725} -09/20/2021 20:31:02 - INFO - __main__ - Step 27839: {'lr': 0.00019980106746424471, 'samples': 890848, 'steps': 1739, 'loss/train': 2.442979574203491} -09/20/2021 20:31:03 - INFO - __main__ - Step 27840: {'lr': 0.00019980106746424471, 'samples': 890880, 'steps': 1739, 'loss/train': 2.864614248275757} -09/20/2021 20:31:03 - INFO - __main__ - Step 27841: {'lr': 0.00019980066510436964, 'samples': 890912, 'steps': 1740, 'loss/train': 2.714672327041626} -09/20/2021 20:31:04 - INFO - __main__ - Step 27842: {'lr': 0.00019980066510436964, 'samples': 890944, 'steps': 1740, 'loss/train': 3.332345485687256} -09/20/2021 20:31:05 - INFO - __main__ - Step 27843: {'lr': 0.00019980066510436964, 'samples': 890976, 'steps': 1740, 'loss/train': 2.5251803398132324} -09/20/2021 20:31:06 - INFO - __main__ - Step 27844: {'lr': 0.00019980066510436964, 'samples': 891008, 'steps': 1740, 'loss/train': 2.612224578857422} -09/20/2021 20:31:06 - INFO - __main__ - Step 27845: {'lr': 0.00019980066510436964, 'samples': 891040, 'steps': 1740, 'loss/train': 2.4953927993774414} -09/20/2021 20:31:07 - INFO - __main__ - Step 27846: {'lr': 0.00019980066510436964, 'samples': 891072, 'steps': 1740, 'loss/train': 2.9003496170043945} -09/20/2021 20:31:08 - INFO - __main__ - Step 27847: {'lr': 0.00019980066510436964, 'samples': 891104, 'steps': 1740, 'loss/train': 3.094026803970337} -09/20/2021 20:31:09 - INFO - __main__ - Step 27848: {'lr': 0.00019980066510436964, 'samples': 891136, 'steps': 1740, 'loss/train': 2.504493474960327} -09/20/2021 20:31:09 - INFO - __main__ - Step 27849: {'lr': 0.00019980066510436964, 'samples': 891168, 'steps': 1740, 'loss/train': 2.047065496444702} -09/20/2021 20:31:10 - INFO - __main__ - Step 27850: {'lr': 0.00019980066510436964, 'samples': 891200, 'steps': 1740, 'loss/train': 3.2867445945739746} -09/20/2021 20:31:11 - INFO - __main__ - Step 27851: {'lr': 0.00019980066510436964, 'samples': 891232, 'steps': 1740, 'loss/train': 2.6658034324645996} -09/20/2021 20:31:12 - INFO - __main__ - Step 27852: {'lr': 0.00019980066510436964, 'samples': 891264, 'steps': 1740, 'loss/train': 2.615105628967285} -09/20/2021 20:31:12 - INFO - __main__ - Step 27853: {'lr': 0.00019980066510436964, 'samples': 891296, 'steps': 1740, 'loss/train': 2.581477403640747} -09/20/2021 20:31:13 - INFO - __main__ - Step 27854: {'lr': 0.00019980066510436964, 'samples': 891328, 'steps': 1740, 'loss/train': 2.929527759552002} -09/20/2021 20:31:14 - INFO - __main__ - Step 27855: {'lr': 0.00019980066510436964, 'samples': 891360, 'steps': 1740, 'loss/train': 2.230929374694824} -09/20/2021 20:31:15 - INFO - __main__ - Step 27856: {'lr': 0.00019980066510436964, 'samples': 891392, 'steps': 1740, 'loss/train': 2.617967367172241} -09/20/2021 20:31:16 - INFO - __main__ - Step 27857: {'lr': 0.000199800262338406, 'samples': 891424, 'steps': 1741, 'loss/train': 1.7575187683105469} -09/20/2021 20:31:16 - INFO - __main__ - Step 27858: {'lr': 0.000199800262338406, 'samples': 891456, 'steps': 1741, 'loss/train': 2.6717312335968018} -09/20/2021 20:31:17 - INFO - __main__ - Step 27859: {'lr': 0.000199800262338406, 'samples': 891488, 'steps': 1741, 'loss/train': 2.969449281692505} -09/20/2021 20:31:18 - INFO - __main__ - Step 27860: {'lr': 0.000199800262338406, 'samples': 891520, 'steps': 1741, 'loss/train': 2.5704047679901123} -09/20/2021 20:31:19 - INFO - __main__ - Step 27861: {'lr': 0.000199800262338406, 'samples': 891552, 'steps': 1741, 'loss/train': 2.16501522064209} -09/20/2021 20:31:20 - INFO - __main__ - Step 27862: {'lr': 0.000199800262338406, 'samples': 891584, 'steps': 1741, 'loss/train': 2.622279405593872} -09/20/2021 20:31:21 - INFO - __main__ - Step 27863: {'lr': 0.000199800262338406, 'samples': 891616, 'steps': 1741, 'loss/train': 2.5779194831848145} -09/20/2021 20:31:21 - INFO - __main__ - Step 27864: {'lr': 0.000199800262338406, 'samples': 891648, 'steps': 1741, 'loss/train': 2.5181939601898193} -09/20/2021 20:31:22 - INFO - __main__ - Step 27865: {'lr': 0.000199800262338406, 'samples': 891680, 'steps': 1741, 'loss/train': 2.752824306488037} -09/20/2021 20:31:23 - INFO - __main__ - Step 27866: {'lr': 0.000199800262338406, 'samples': 891712, 'steps': 1741, 'loss/train': 4.078419208526611} -09/20/2021 20:31:24 - INFO - __main__ - Step 27867: {'lr': 0.000199800262338406, 'samples': 891744, 'steps': 1741, 'loss/train': 2.9646689891815186} -09/20/2021 20:31:24 - INFO - __main__ - Step 27868: {'lr': 0.000199800262338406, 'samples': 891776, 'steps': 1741, 'loss/train': 2.6641271114349365} -09/20/2021 20:31:25 - INFO - __main__ - Step 27869: {'lr': 0.000199800262338406, 'samples': 891808, 'steps': 1741, 'loss/train': 2.7454190254211426} -09/20/2021 20:31:26 - INFO - __main__ - Step 27870: {'lr': 0.000199800262338406, 'samples': 891840, 'steps': 1741, 'loss/train': 2.9575536251068115} -09/20/2021 20:31:27 - INFO - __main__ - Step 27871: {'lr': 0.000199800262338406, 'samples': 891872, 'steps': 1741, 'loss/train': 2.43519926071167} -09/20/2021 20:31:27 - INFO - __main__ - Step 27872: {'lr': 0.000199800262338406, 'samples': 891904, 'steps': 1741, 'loss/train': 2.887906074523926} -09/20/2021 20:31:28 - INFO - __main__ - Step 27873: {'lr': 0.00019979985916635554, 'samples': 891936, 'steps': 1742, 'loss/train': 2.481365203857422} -09/20/2021 20:31:29 - INFO - __main__ - Step 27874: {'lr': 0.00019979985916635554, 'samples': 891968, 'steps': 1742, 'loss/train': 2.8328752517700195} -09/20/2021 20:31:30 - INFO - __main__ - Step 27875: {'lr': 0.00019979985916635554, 'samples': 892000, 'steps': 1742, 'loss/train': 1.5266615152359009} -09/20/2021 20:31:30 - INFO - __main__ - Step 27876: {'lr': 0.00019979985916635554, 'samples': 892032, 'steps': 1742, 'loss/train': 2.1790406703948975} -09/20/2021 20:31:31 - INFO - __main__ - Step 27877: {'lr': 0.00019979985916635554, 'samples': 892064, 'steps': 1742, 'loss/train': 2.8304097652435303} -09/20/2021 20:31:32 - INFO - __main__ - Step 27878: {'lr': 0.00019979985916635554, 'samples': 892096, 'steps': 1742, 'loss/train': 2.278486490249634} -09/20/2021 20:31:33 - INFO - __main__ - Step 27879: {'lr': 0.00019979985916635554, 'samples': 892128, 'steps': 1742, 'loss/train': 2.4384825229644775} -09/20/2021 20:31:33 - INFO - __main__ - Step 27880: {'lr': 0.00019979985916635554, 'samples': 892160, 'steps': 1742, 'loss/train': 2.7883119583129883} -09/20/2021 20:31:34 - INFO - __main__ - Step 27881: {'lr': 0.00019979985916635554, 'samples': 892192, 'steps': 1742, 'loss/train': 2.6498844623565674} -09/20/2021 20:31:35 - INFO - __main__ - Step 27882: {'lr': 0.00019979985916635554, 'samples': 892224, 'steps': 1742, 'loss/train': 2.518885612487793} -09/20/2021 20:31:36 - INFO - __main__ - Step 27883: {'lr': 0.00019979985916635554, 'samples': 892256, 'steps': 1742, 'loss/train': 2.4347434043884277} -09/20/2021 20:31:36 - INFO - __main__ - Step 27884: {'lr': 0.00019979985916635554, 'samples': 892288, 'steps': 1742, 'loss/train': 3.068002462387085} -09/20/2021 20:31:37 - INFO - __main__ - Step 27885: {'lr': 0.00019979985916635554, 'samples': 892320, 'steps': 1742, 'loss/train': 3.0542781352996826} -09/20/2021 20:31:38 - INFO - __main__ - Step 27886: {'lr': 0.00019979985916635554, 'samples': 892352, 'steps': 1742, 'loss/train': 2.456712007522583} -09/20/2021 20:31:39 - INFO - __main__ - Step 27887: {'lr': 0.00019979985916635554, 'samples': 892384, 'steps': 1742, 'loss/train': 2.373990297317505} -09/20/2021 20:31:39 - INFO - __main__ - Step 27888: {'lr': 0.00019979985916635554, 'samples': 892416, 'steps': 1742, 'loss/train': 2.596428632736206} -09/20/2021 20:31:40 - INFO - __main__ - Step 27889: {'lr': 0.0001997994555882198, 'samples': 892448, 'steps': 1743, 'loss/train': 2.2947449684143066} -09/20/2021 20:31:41 - INFO - __main__ - Step 27890: {'lr': 0.0001997994555882198, 'samples': 892480, 'steps': 1743, 'loss/train': 2.336334466934204} -09/20/2021 20:31:42 - INFO - __main__ - Step 27891: {'lr': 0.0001997994555882198, 'samples': 892512, 'steps': 1743, 'loss/train': 2.9976043701171875} -09/20/2021 20:31:43 - INFO - __main__ - Step 27892: {'lr': 0.0001997994555882198, 'samples': 892544, 'steps': 1743, 'loss/train': 2.7236289978027344} -09/20/2021 20:31:44 - INFO - __main__ - Step 27893: {'lr': 0.0001997994555882198, 'samples': 892576, 'steps': 1743, 'loss/train': 3.3573641777038574} -09/20/2021 20:31:45 - INFO - __main__ - Step 27894: {'lr': 0.0001997994555882198, 'samples': 892608, 'steps': 1743, 'loss/train': 2.445533514022827} -09/20/2021 20:31:45 - INFO - __main__ - Step 27895: {'lr': 0.0001997994555882198, 'samples': 892640, 'steps': 1743, 'loss/train': 4.17313814163208} -09/20/2021 20:31:46 - INFO - __main__ - Step 27896: {'lr': 0.0001997994555882198, 'samples': 892672, 'steps': 1743, 'loss/train': 2.6000304222106934} -09/20/2021 20:31:47 - INFO - __main__ - Step 27897: {'lr': 0.0001997994555882198, 'samples': 892704, 'steps': 1743, 'loss/train': 2.7193360328674316} -09/20/2021 20:31:48 - INFO - __main__ - Step 27898: {'lr': 0.0001997994555882198, 'samples': 892736, 'steps': 1743, 'loss/train': 2.764486312866211} -09/20/2021 20:31:48 - INFO - __main__ - Step 27899: {'lr': 0.0001997994555882198, 'samples': 892768, 'steps': 1743, 'loss/train': 2.832204580307007} -09/20/2021 20:31:49 - INFO - __main__ - Step 27900: {'lr': 0.0001997994555882198, 'samples': 892800, 'steps': 1743, 'loss/train': 2.845134973526001} -09/20/2021 20:31:50 - INFO - __main__ - Step 27901: {'lr': 0.0001997994555882198, 'samples': 892832, 'steps': 1743, 'loss/train': 2.110861301422119} -09/20/2021 20:31:51 - INFO - __main__ - Step 27902: {'lr': 0.0001997994555882198, 'samples': 892864, 'steps': 1743, 'loss/train': 2.036975145339966} -09/20/2021 20:31:51 - INFO - __main__ - Step 27903: {'lr': 0.0001997994555882198, 'samples': 892896, 'steps': 1743, 'loss/train': 3.1958272457122803} -09/20/2021 20:31:52 - INFO - __main__ - Step 27904: {'lr': 0.0001997994555882198, 'samples': 892928, 'steps': 1743, 'loss/train': 2.4376025199890137} -09/20/2021 20:31:53 - INFO - __main__ - Step 27905: {'lr': 0.00019979905160400047, 'samples': 892960, 'steps': 1744, 'loss/train': 2.7650461196899414} -09/20/2021 20:31:54 - INFO - __main__ - Step 27906: {'lr': 0.00019979905160400047, 'samples': 892992, 'steps': 1744, 'loss/train': 2.654446840286255} -09/20/2021 20:31:54 - INFO - __main__ - Step 27907: {'lr': 0.00019979905160400047, 'samples': 893024, 'steps': 1744, 'loss/train': 2.685080051422119} -09/20/2021 20:31:55 - INFO - __main__ - Step 27908: {'lr': 0.00019979905160400047, 'samples': 893056, 'steps': 1744, 'loss/train': 2.555762767791748} -09/20/2021 20:31:56 - INFO - __main__ - Step 27909: {'lr': 0.00019979905160400047, 'samples': 893088, 'steps': 1744, 'loss/train': 3.2701210975646973} -09/20/2021 20:31:57 - INFO - __main__ - Step 27910: {'lr': 0.00019979905160400047, 'samples': 893120, 'steps': 1744, 'loss/train': 3.446192502975464} -09/20/2021 20:31:57 - INFO - __main__ - Step 27911: {'lr': 0.00019979905160400047, 'samples': 893152, 'steps': 1744, 'loss/train': 2.5143728256225586} -09/20/2021 20:31:58 - INFO - __main__ - Step 27912: {'lr': 0.00019979905160400047, 'samples': 893184, 'steps': 1744, 'loss/train': 1.5726385116577148} -09/20/2021 20:31:59 - INFO - __main__ - Step 27913: {'lr': 0.00019979905160400047, 'samples': 893216, 'steps': 1744, 'loss/train': 2.913257122039795} -09/20/2021 20:32:00 - INFO - __main__ - Step 27914: {'lr': 0.00019979905160400047, 'samples': 893248, 'steps': 1744, 'loss/train': 1.223887324333191} -09/20/2021 20:32:00 - INFO - __main__ - Step 27915: {'lr': 0.00019979905160400047, 'samples': 893280, 'steps': 1744, 'loss/train': 2.6894731521606445} -09/20/2021 20:32:01 - INFO - __main__ - Step 27916: {'lr': 0.00019979905160400047, 'samples': 893312, 'steps': 1744, 'loss/train': 1.9657710790634155} -09/20/2021 20:32:02 - INFO - __main__ - Step 27917: {'lr': 0.00019979905160400047, 'samples': 893344, 'steps': 1744, 'loss/train': 2.3652124404907227} -09/20/2021 20:32:03 - INFO - __main__ - Step 27918: {'lr': 0.00019979905160400047, 'samples': 893376, 'steps': 1744, 'loss/train': 2.451272964477539} -09/20/2021 20:32:03 - INFO - __main__ - Step 27919: {'lr': 0.00019979905160400047, 'samples': 893408, 'steps': 1744, 'loss/train': 0.5674018263816833} -09/20/2021 20:32:04 - INFO - __main__ - Step 27920: {'lr': 0.00019979905160400047, 'samples': 893440, 'steps': 1744, 'loss/train': 2.7801928520202637} -09/20/2021 20:32:05 - INFO - __main__ - Step 27921: {'lr': 0.0001997986472136992, 'samples': 893472, 'steps': 1745, 'loss/train': 2.7647454738616943} -09/20/2021 20:32:06 - INFO - __main__ - Step 27922: {'lr': 0.0001997986472136992, 'samples': 893504, 'steps': 1745, 'loss/train': 2.3364624977111816} -09/20/2021 20:32:07 - INFO - __main__ - Step 27923: {'lr': 0.0001997986472136992, 'samples': 893536, 'steps': 1745, 'loss/train': 2.756709337234497} -09/20/2021 20:32:08 - INFO - __main__ - Step 27924: {'lr': 0.0001997986472136992, 'samples': 893568, 'steps': 1745, 'loss/train': 2.4084253311157227} -09/20/2021 20:32:09 - INFO - __main__ - Step 27925: {'lr': 0.0001997986472136992, 'samples': 893600, 'steps': 1745, 'loss/train': 2.9691364765167236} -09/20/2021 20:32:09 - INFO - __main__ - Step 27926: {'lr': 0.0001997986472136992, 'samples': 893632, 'steps': 1745, 'loss/train': 3.1740550994873047} -09/20/2021 20:32:10 - INFO - __main__ - Step 27927: {'lr': 0.0001997986472136992, 'samples': 893664, 'steps': 1745, 'loss/train': 2.673508644104004} -09/20/2021 20:32:11 - INFO - __main__ - Step 27928: {'lr': 0.0001997986472136992, 'samples': 893696, 'steps': 1745, 'loss/train': 1.9320780038833618} -09/20/2021 20:32:12 - INFO - __main__ - Step 27929: {'lr': 0.0001997986472136992, 'samples': 893728, 'steps': 1745, 'loss/train': 2.153947353363037} -09/20/2021 20:32:12 - INFO - __main__ - Step 27930: {'lr': 0.0001997986472136992, 'samples': 893760, 'steps': 1745, 'loss/train': 3.6913468837738037} -09/20/2021 20:32:13 - INFO - __main__ - Step 27931: {'lr': 0.0001997986472136992, 'samples': 893792, 'steps': 1745, 'loss/train': 2.9901583194732666} -09/20/2021 20:32:14 - INFO - __main__ - Step 27932: {'lr': 0.0001997986472136992, 'samples': 893824, 'steps': 1745, 'loss/train': 2.5829317569732666} -09/20/2021 20:32:15 - INFO - __main__ - Step 27933: {'lr': 0.0001997986472136992, 'samples': 893856, 'steps': 1745, 'loss/train': 2.2552382946014404} -09/20/2021 20:32:15 - INFO - __main__ - Step 27934: {'lr': 0.0001997986472136992, 'samples': 893888, 'steps': 1745, 'loss/train': 2.8799996376037598} -09/20/2021 20:32:16 - INFO - __main__ - Step 27935: {'lr': 0.0001997986472136992, 'samples': 893920, 'steps': 1745, 'loss/train': 2.469036102294922} -09/20/2021 20:32:17 - INFO - __main__ - Step 27936: {'lr': 0.0001997986472136992, 'samples': 893952, 'steps': 1745, 'loss/train': 2.7360870838165283} -09/20/2021 20:32:18 - INFO - __main__ - Step 27937: {'lr': 0.0001997982424173176, 'samples': 893984, 'steps': 1746, 'loss/train': 2.619537115097046} -09/20/2021 20:32:19 - INFO - __main__ - Step 27938: {'lr': 0.0001997982424173176, 'samples': 894016, 'steps': 1746, 'loss/train': 1.8414130210876465} -09/20/2021 20:32:19 - INFO - __main__ - Step 27939: {'lr': 0.0001997982424173176, 'samples': 894048, 'steps': 1746, 'loss/train': 2.9188761711120605} -09/20/2021 20:32:20 - INFO - __main__ - Step 27940: {'lr': 0.0001997982424173176, 'samples': 894080, 'steps': 1746, 'loss/train': 2.700486183166504} -09/20/2021 20:32:21 - INFO - __main__ - Step 27941: {'lr': 0.0001997982424173176, 'samples': 894112, 'steps': 1746, 'loss/train': 2.7736899852752686} -09/20/2021 20:32:22 - INFO - __main__ - Step 27942: {'lr': 0.0001997982424173176, 'samples': 894144, 'steps': 1746, 'loss/train': 3.3182973861694336} -09/20/2021 20:32:22 - INFO - __main__ - Step 27943: {'lr': 0.0001997982424173176, 'samples': 894176, 'steps': 1746, 'loss/train': 2.0282201766967773} -09/20/2021 20:32:23 - INFO - __main__ - Step 27944: {'lr': 0.0001997982424173176, 'samples': 894208, 'steps': 1746, 'loss/train': 2.319084405899048} -09/20/2021 20:32:24 - INFO - __main__ - Step 27945: {'lr': 0.0001997982424173176, 'samples': 894240, 'steps': 1746, 'loss/train': 2.570681095123291} -09/20/2021 20:32:25 - INFO - __main__ - Step 27946: {'lr': 0.0001997982424173176, 'samples': 894272, 'steps': 1746, 'loss/train': 2.6562323570251465} -09/20/2021 20:32:25 - INFO - __main__ - Step 27947: {'lr': 0.0001997982424173176, 'samples': 894304, 'steps': 1746, 'loss/train': 2.5270490646362305} -09/20/2021 20:32:26 - INFO - __main__ - Step 27948: {'lr': 0.0001997982424173176, 'samples': 894336, 'steps': 1746, 'loss/train': 2.4960901737213135} -09/20/2021 20:32:27 - INFO - __main__ - Step 27949: {'lr': 0.0001997982424173176, 'samples': 894368, 'steps': 1746, 'loss/train': 3.1844334602355957} -09/20/2021 20:32:28 - INFO - __main__ - Step 27950: {'lr': 0.0001997982424173176, 'samples': 894400, 'steps': 1746, 'loss/train': 2.379324436187744} -09/20/2021 20:32:28 - INFO - __main__ - Step 27951: {'lr': 0.0001997982424173176, 'samples': 894432, 'steps': 1746, 'loss/train': 2.846717357635498} -09/20/2021 20:32:29 - INFO - __main__ - Step 27952: {'lr': 0.0001997982424173176, 'samples': 894464, 'steps': 1746, 'loss/train': 2.583115339279175} -09/20/2021 20:32:30 - INFO - __main__ - Step 27953: {'lr': 0.00019979783721485738, 'samples': 894496, 'steps': 1747, 'loss/train': 2.8863260746002197} -09/20/2021 20:32:31 - INFO - __main__ - Step 27954: {'lr': 0.00019979783721485738, 'samples': 894528, 'steps': 1747, 'loss/train': 2.883821964263916} -09/20/2021 20:32:32 - INFO - __main__ - Step 27955: {'lr': 0.00019979783721485738, 'samples': 894560, 'steps': 1747, 'loss/train': 2.7507386207580566} -09/20/2021 20:32:33 - INFO - __main__ - Step 27956: {'lr': 0.00019979783721485738, 'samples': 894592, 'steps': 1747, 'loss/train': 3.1072194576263428} -09/20/2021 20:32:33 - INFO - __main__ - Step 27957: {'lr': 0.00019979783721485738, 'samples': 894624, 'steps': 1747, 'loss/train': 2.617480516433716} -09/20/2021 20:32:34 - INFO - __main__ - Step 27958: {'lr': 0.00019979783721485738, 'samples': 894656, 'steps': 1747, 'loss/train': 3.376570463180542} -09/20/2021 20:32:35 - INFO - __main__ - Step 27959: {'lr': 0.00019979783721485738, 'samples': 894688, 'steps': 1747, 'loss/train': 0.36073851585388184} -09/20/2021 20:32:36 - INFO - __main__ - Step 27960: {'lr': 0.00019979783721485738, 'samples': 894720, 'steps': 1747, 'loss/train': 3.4539058208465576} -09/20/2021 20:32:36 - INFO - __main__ - Step 27961: {'lr': 0.00019979783721485738, 'samples': 894752, 'steps': 1747, 'loss/train': 2.7348058223724365} -09/20/2021 20:32:37 - INFO - __main__ - Step 27962: {'lr': 0.00019979783721485738, 'samples': 894784, 'steps': 1747, 'loss/train': 2.600759744644165} -09/20/2021 20:32:38 - INFO - __main__ - Step 27963: {'lr': 0.00019979783721485738, 'samples': 894816, 'steps': 1747, 'loss/train': 3.7143683433532715} -09/20/2021 20:32:39 - INFO - __main__ - Step 27964: {'lr': 0.00019979783721485738, 'samples': 894848, 'steps': 1747, 'loss/train': 2.406815528869629} -09/20/2021 20:32:39 - INFO - __main__ - Step 27965: {'lr': 0.00019979783721485738, 'samples': 894880, 'steps': 1747, 'loss/train': 2.841235399246216} -09/20/2021 20:32:40 - INFO - __main__ - Step 27966: {'lr': 0.00019979783721485738, 'samples': 894912, 'steps': 1747, 'loss/train': 2.8912084102630615} -09/20/2021 20:32:41 - INFO - __main__ - Step 27967: {'lr': 0.00019979783721485738, 'samples': 894944, 'steps': 1747, 'loss/train': 2.5182368755340576} -09/20/2021 20:32:42 - INFO - __main__ - Step 27968: {'lr': 0.00019979783721485738, 'samples': 894976, 'steps': 1747, 'loss/train': 2.65814471244812} -09/20/2021 20:32:43 - INFO - __main__ - Step 27969: {'lr': 0.0001997974316063201, 'samples': 895008, 'steps': 1748, 'loss/train': 2.3244168758392334} -09/20/2021 20:32:43 - INFO - __main__ - Step 27970: {'lr': 0.0001997974316063201, 'samples': 895040, 'steps': 1748, 'loss/train': 2.274543523788452} -09/20/2021 20:32:44 - INFO - __main__ - Step 27971: {'lr': 0.0001997974316063201, 'samples': 895072, 'steps': 1748, 'loss/train': 2.814584493637085} -09/20/2021 20:32:45 - INFO - __main__ - Step 27972: {'lr': 0.0001997974316063201, 'samples': 895104, 'steps': 1748, 'loss/train': 2.9677000045776367} -09/20/2021 20:32:46 - INFO - __main__ - Step 27973: {'lr': 0.0001997974316063201, 'samples': 895136, 'steps': 1748, 'loss/train': 2.0653629302978516} -09/20/2021 20:32:46 - INFO - __main__ - Step 27974: {'lr': 0.0001997974316063201, 'samples': 895168, 'steps': 1748, 'loss/train': 2.9289283752441406} -09/20/2021 20:32:47 - INFO - __main__ - Step 27975: {'lr': 0.0001997974316063201, 'samples': 895200, 'steps': 1748, 'loss/train': 3.668696880340576} -09/20/2021 20:32:48 - INFO - __main__ - Step 27976: {'lr': 0.0001997974316063201, 'samples': 895232, 'steps': 1748, 'loss/train': 1.7419404983520508} -09/20/2021 20:32:49 - INFO - __main__ - Step 27977: {'lr': 0.0001997974316063201, 'samples': 895264, 'steps': 1748, 'loss/train': 2.762225866317749} -09/20/2021 20:32:49 - INFO - __main__ - Step 27978: {'lr': 0.0001997974316063201, 'samples': 895296, 'steps': 1748, 'loss/train': 2.026782512664795} -09/20/2021 20:32:50 - INFO - __main__ - Step 27979: {'lr': 0.0001997974316063201, 'samples': 895328, 'steps': 1748, 'loss/train': 2.5268406867980957} -09/20/2021 20:32:51 - INFO - __main__ - Step 27980: {'lr': 0.0001997974316063201, 'samples': 895360, 'steps': 1748, 'loss/train': 2.797053098678589} -09/20/2021 20:32:52 - INFO - __main__ - Step 27981: {'lr': 0.0001997974316063201, 'samples': 895392, 'steps': 1748, 'loss/train': 3.1988742351531982} -09/20/2021 20:32:52 - INFO - __main__ - Step 27982: {'lr': 0.0001997974316063201, 'samples': 895424, 'steps': 1748, 'loss/train': 2.384319543838501} -09/20/2021 20:32:53 - INFO - __main__ - Step 27983: {'lr': 0.0001997974316063201, 'samples': 895456, 'steps': 1748, 'loss/train': 2.208719253540039} -09/20/2021 20:32:55 - INFO - __main__ - Step 27984: {'lr': 0.0001997974316063201, 'samples': 895488, 'steps': 1748, 'loss/train': 1.7341573238372803} -09/20/2021 20:32:56 - INFO - __main__ - Step 27985: {'lr': 0.00019979702559170748, 'samples': 895520, 'steps': 1749, 'loss/train': 2.9562876224517822} -09/20/2021 20:32:57 - INFO - __main__ - Step 27986: {'lr': 0.00019979702559170748, 'samples': 895552, 'steps': 1749, 'loss/train': 2.471949338912964} -09/20/2021 20:32:57 - INFO - __main__ - Step 27987: {'lr': 0.00019979702559170748, 'samples': 895584, 'steps': 1749, 'loss/train': 2.0826921463012695} -09/20/2021 20:32:58 - INFO - __main__ - Step 27988: {'lr': 0.00019979702559170748, 'samples': 895616, 'steps': 1749, 'loss/train': 3.365178108215332} -09/20/2021 20:32:59 - INFO - __main__ - Step 27989: {'lr': 0.00019979702559170748, 'samples': 895648, 'steps': 1749, 'loss/train': 3.0490150451660156} -09/20/2021 20:33:00 - INFO - __main__ - Step 27990: {'lr': 0.00019979702559170748, 'samples': 895680, 'steps': 1749, 'loss/train': 3.137660026550293} -09/20/2021 20:33:00 - INFO - __main__ - Step 27991: {'lr': 0.00019979702559170748, 'samples': 895712, 'steps': 1749, 'loss/train': 2.8316240310668945} -09/20/2021 20:33:01 - INFO - __main__ - Step 27992: {'lr': 0.00019979702559170748, 'samples': 895744, 'steps': 1749, 'loss/train': 1.8742483854293823} -09/20/2021 20:33:02 - INFO - __main__ - Step 27993: {'lr': 0.00019979702559170748, 'samples': 895776, 'steps': 1749, 'loss/train': 2.528691530227661} -09/20/2021 20:33:03 - INFO - __main__ - Step 27994: {'lr': 0.00019979702559170748, 'samples': 895808, 'steps': 1749, 'loss/train': 2.8578226566314697} -09/20/2021 20:33:03 - INFO - __main__ - Step 27995: {'lr': 0.00019979702559170748, 'samples': 895840, 'steps': 1749, 'loss/train': 3.052037239074707} -09/20/2021 20:33:04 - INFO - __main__ - Step 27996: {'lr': 0.00019979702559170748, 'samples': 895872, 'steps': 1749, 'loss/train': 3.342806339263916} -09/20/2021 20:33:05 - INFO - __main__ - Step 27997: {'lr': 0.00019979702559170748, 'samples': 895904, 'steps': 1749, 'loss/train': 2.588944435119629} -09/20/2021 20:33:06 - INFO - __main__ - Step 27998: {'lr': 0.00019979702559170748, 'samples': 895936, 'steps': 1749, 'loss/train': 3.057393789291382} -09/20/2021 20:33:06 - INFO - __main__ - Step 27999: {'lr': 0.00019979702559170748, 'samples': 895968, 'steps': 1749, 'loss/train': 2.7109158039093018} -09/20/2021 20:33:07 - INFO - __main__ - Step 28000: {'lr': 0.00019979702559170748, 'samples': 896000, 'steps': 1749, 'loss/train': 1.861201286315918} -09/20/2021 20:33:08 - INFO - __main__ - Step 28001: {'lr': 0.00019979661917102115, 'samples': 896032, 'steps': 1750, 'loss/train': 3.0945382118225098} -09/20/2021 20:33:09 - INFO - __main__ - Step 28002: {'lr': 0.00019979661917102115, 'samples': 896064, 'steps': 1750, 'loss/train': 2.6922178268432617} -09/20/2021 20:33:09 - INFO - __main__ - Step 28003: {'lr': 0.00019979661917102115, 'samples': 896096, 'steps': 1750, 'loss/train': 0.9108004570007324} -09/20/2021 20:33:10 - INFO - __main__ - Step 28004: {'lr': 0.00019979661917102115, 'samples': 896128, 'steps': 1750, 'loss/train': 2.565216302871704} -09/20/2021 20:33:11 - INFO - __main__ - Step 28005: {'lr': 0.00019979661917102115, 'samples': 896160, 'steps': 1750, 'loss/train': 2.867853879928589} -09/20/2021 20:33:12 - INFO - __main__ - Step 28006: {'lr': 0.00019979661917102115, 'samples': 896192, 'steps': 1750, 'loss/train': 2.4526891708374023} -09/20/2021 20:33:12 - INFO - __main__ - Step 28007: {'lr': 0.00019979661917102115, 'samples': 896224, 'steps': 1750, 'loss/train': 2.70796799659729} -09/20/2021 20:33:13 - INFO - __main__ - Step 28008: {'lr': 0.00019979661917102115, 'samples': 896256, 'steps': 1750, 'loss/train': 1.0057350397109985} -09/20/2021 20:33:14 - INFO - __main__ - Step 28009: {'lr': 0.00019979661917102115, 'samples': 896288, 'steps': 1750, 'loss/train': 2.4675259590148926} -09/20/2021 20:33:15 - INFO - __main__ - Step 28010: {'lr': 0.00019979661917102115, 'samples': 896320, 'steps': 1750, 'loss/train': 2.6283371448516846} -09/20/2021 20:33:15 - INFO - __main__ - Step 28011: {'lr': 0.00019979661917102115, 'samples': 896352, 'steps': 1750, 'loss/train': 2.4758336544036865} -09/20/2021 20:33:16 - INFO - __main__ - Step 28012: {'lr': 0.00019979661917102115, 'samples': 896384, 'steps': 1750, 'loss/train': 1.7643293142318726} -09/20/2021 20:33:17 - INFO - __main__ - Step 28013: {'lr': 0.00019979661917102115, 'samples': 896416, 'steps': 1750, 'loss/train': 3.126307964324951} -09/20/2021 20:33:18 - INFO - __main__ - Step 28014: {'lr': 0.00019979661917102115, 'samples': 896448, 'steps': 1750, 'loss/train': 3.2814109325408936} -09/20/2021 20:33:19 - INFO - __main__ - Step 28015: {'lr': 0.00019979661917102115, 'samples': 896480, 'steps': 1750, 'loss/train': 3.5926353931427} -09/20/2021 20:33:20 - INFO - __main__ - Step 28016: {'lr': 0.00019979661917102115, 'samples': 896512, 'steps': 1750, 'loss/train': 2.243364095687866} -09/20/2021 20:33:21 - INFO - __main__ - Step 28017: {'lr': 0.00019979621234426275, 'samples': 896544, 'steps': 1751, 'loss/train': 2.1546075344085693} -09/20/2021 20:33:21 - INFO - __main__ - Step 28018: {'lr': 0.00019979621234426275, 'samples': 896576, 'steps': 1751, 'loss/train': 3.512578248977661} -09/20/2021 20:33:22 - INFO - __main__ - Step 28019: {'lr': 0.00019979621234426275, 'samples': 896608, 'steps': 1751, 'loss/train': 3.126143455505371} -09/20/2021 20:33:23 - INFO - __main__ - Step 28020: {'lr': 0.00019979621234426275, 'samples': 896640, 'steps': 1751, 'loss/train': 2.927661418914795} -09/20/2021 20:33:24 - INFO - __main__ - Step 28021: {'lr': 0.00019979621234426275, 'samples': 896672, 'steps': 1751, 'loss/train': 3.1542587280273438} -09/20/2021 20:33:24 - INFO - __main__ - Step 28022: {'lr': 0.00019979621234426275, 'samples': 896704, 'steps': 1751, 'loss/train': 2.3882195949554443} -09/20/2021 20:33:25 - INFO - __main__ - Step 28023: {'lr': 0.00019979621234426275, 'samples': 896736, 'steps': 1751, 'loss/train': 2.5315465927124023} -09/20/2021 20:33:26 - INFO - __main__ - Step 28024: {'lr': 0.00019979621234426275, 'samples': 896768, 'steps': 1751, 'loss/train': 2.546692132949829} -09/20/2021 20:33:27 - INFO - __main__ - Step 28025: {'lr': 0.00019979621234426275, 'samples': 896800, 'steps': 1751, 'loss/train': 2.9977667331695557} -09/20/2021 20:33:27 - INFO - __main__ - Step 28026: {'lr': 0.00019979621234426275, 'samples': 896832, 'steps': 1751, 'loss/train': 1.9795805215835571} -09/20/2021 20:33:28 - INFO - __main__ - Step 28027: {'lr': 0.00019979621234426275, 'samples': 896864, 'steps': 1751, 'loss/train': 2.8306286334991455} -09/20/2021 20:33:29 - INFO - __main__ - Step 28028: {'lr': 0.00019979621234426275, 'samples': 896896, 'steps': 1751, 'loss/train': 1.9857804775238037} -09/20/2021 20:33:30 - INFO - __main__ - Step 28029: {'lr': 0.00019979621234426275, 'samples': 896928, 'steps': 1751, 'loss/train': 2.256288528442383} -09/20/2021 20:33:30 - INFO - __main__ - Step 28030: {'lr': 0.00019979621234426275, 'samples': 896960, 'steps': 1751, 'loss/train': 2.9996895790100098} -09/20/2021 20:33:31 - INFO - __main__ - Step 28031: {'lr': 0.00019979621234426275, 'samples': 896992, 'steps': 1751, 'loss/train': 2.5366671085357666} -09/20/2021 20:33:32 - INFO - __main__ - Step 28032: {'lr': 0.00019979621234426275, 'samples': 897024, 'steps': 1751, 'loss/train': 2.8115034103393555} -09/20/2021 20:33:33 - INFO - __main__ - Step 28033: {'lr': 0.00019979580511143396, 'samples': 897056, 'steps': 1752, 'loss/train': 2.779857873916626} -09/20/2021 20:33:34 - INFO - __main__ - Step 28034: {'lr': 0.00019979580511143396, 'samples': 897088, 'steps': 1752, 'loss/train': 2.804535388946533} -09/20/2021 20:33:34 - INFO - __main__ - Step 28035: {'lr': 0.00019979580511143396, 'samples': 897120, 'steps': 1752, 'loss/train': 2.1509928703308105} -09/20/2021 20:33:35 - INFO - __main__ - Step 28036: {'lr': 0.00019979580511143396, 'samples': 897152, 'steps': 1752, 'loss/train': 2.5373613834381104} -09/20/2021 20:33:36 - INFO - __main__ - Step 28037: {'lr': 0.00019979580511143396, 'samples': 897184, 'steps': 1752, 'loss/train': 2.811671018600464} -09/20/2021 20:33:37 - INFO - __main__ - Step 28038: {'lr': 0.00019979580511143396, 'samples': 897216, 'steps': 1752, 'loss/train': 2.8903684616088867} -09/20/2021 20:33:37 - INFO - __main__ - Step 28039: {'lr': 0.00019979580511143396, 'samples': 897248, 'steps': 1752, 'loss/train': 2.6041226387023926} -09/20/2021 20:33:38 - INFO - __main__ - Step 28040: {'lr': 0.00019979580511143396, 'samples': 897280, 'steps': 1752, 'loss/train': 1.7091654539108276} -09/20/2021 20:33:39 - INFO - __main__ - Step 28041: {'lr': 0.00019979580511143396, 'samples': 897312, 'steps': 1752, 'loss/train': 2.578552722930908} -09/20/2021 20:33:40 - INFO - __main__ - Step 28042: {'lr': 0.00019979580511143396, 'samples': 897344, 'steps': 1752, 'loss/train': 1.4839953184127808} -09/20/2021 20:33:40 - INFO - __main__ - Step 28043: {'lr': 0.00019979580511143396, 'samples': 897376, 'steps': 1752, 'loss/train': 2.244556427001953} -09/20/2021 20:33:41 - INFO - __main__ - Step 28044: {'lr': 0.00019979580511143396, 'samples': 897408, 'steps': 1752, 'loss/train': 3.0313496589660645} -09/20/2021 20:33:42 - INFO - __main__ - Step 28045: {'lr': 0.00019979580511143396, 'samples': 897440, 'steps': 1752, 'loss/train': 2.5341904163360596} -09/20/2021 20:33:44 - INFO - __main__ - Step 28046: {'lr': 0.00019979580511143396, 'samples': 897472, 'steps': 1752, 'loss/train': 2.560354471206665} -09/20/2021 20:33:44 - INFO - __main__ - Step 28047: {'lr': 0.00019979580511143396, 'samples': 897504, 'steps': 1752, 'loss/train': 2.9866440296173096} -09/20/2021 20:33:45 - INFO - __main__ - Step 28048: {'lr': 0.00019979580511143396, 'samples': 897536, 'steps': 1752, 'loss/train': 2.095975399017334} -09/20/2021 20:33:46 - INFO - __main__ - Step 28049: {'lr': 0.00019979539747253645, 'samples': 897568, 'steps': 1753, 'loss/train': 3.1071040630340576} -09/20/2021 20:33:47 - INFO - __main__ - Step 28050: {'lr': 0.00019979539747253645, 'samples': 897600, 'steps': 1753, 'loss/train': 2.6489648818969727} -09/20/2021 20:33:48 - INFO - __main__ - Step 28051: {'lr': 0.00019979539747253645, 'samples': 897632, 'steps': 1753, 'loss/train': 2.2073135375976562} -09/20/2021 20:33:48 - INFO - __main__ - Step 28052: {'lr': 0.00019979539747253645, 'samples': 897664, 'steps': 1753, 'loss/train': 2.9074859619140625} -09/20/2021 20:33:49 - INFO - __main__ - Step 28053: {'lr': 0.00019979539747253645, 'samples': 897696, 'steps': 1753, 'loss/train': 2.8654062747955322} -09/20/2021 20:33:50 - INFO - __main__ - Step 28054: {'lr': 0.00019979539747253645, 'samples': 897728, 'steps': 1753, 'loss/train': 2.640582323074341} -09/20/2021 20:33:51 - INFO - __main__ - Step 28055: {'lr': 0.00019979539747253645, 'samples': 897760, 'steps': 1753, 'loss/train': 2.361933469772339} -09/20/2021 20:33:51 - INFO - __main__ - Step 28056: {'lr': 0.00019979539747253645, 'samples': 897792, 'steps': 1753, 'loss/train': 2.0241858959198} -09/20/2021 20:33:52 - INFO - __main__ - Step 28057: {'lr': 0.00019979539747253645, 'samples': 897824, 'steps': 1753, 'loss/train': 4.025968074798584} -09/20/2021 20:33:53 - INFO - __main__ - Step 28058: {'lr': 0.00019979539747253645, 'samples': 897856, 'steps': 1753, 'loss/train': 2.68397855758667} -09/20/2021 20:33:54 - INFO - __main__ - Step 28059: {'lr': 0.00019979539747253645, 'samples': 897888, 'steps': 1753, 'loss/train': 2.4074459075927734} -09/20/2021 20:33:54 - INFO - __main__ - Step 28060: {'lr': 0.00019979539747253645, 'samples': 897920, 'steps': 1753, 'loss/train': 2.620675802230835} -09/20/2021 20:33:55 - INFO - __main__ - Step 28061: {'lr': 0.00019979539747253645, 'samples': 897952, 'steps': 1753, 'loss/train': 2.3433196544647217} -09/20/2021 20:33:56 - INFO - __main__ - Step 28062: {'lr': 0.00019979539747253645, 'samples': 897984, 'steps': 1753, 'loss/train': 2.77524471282959} -09/20/2021 20:33:57 - INFO - __main__ - Step 28063: {'lr': 0.00019979539747253645, 'samples': 898016, 'steps': 1753, 'loss/train': 1.8044410943984985} -09/20/2021 20:33:57 - INFO - __main__ - Step 28064: {'lr': 0.00019979539747253645, 'samples': 898048, 'steps': 1753, 'loss/train': 2.653111696243286} -09/20/2021 20:33:58 - INFO - __main__ - Step 28065: {'lr': 0.00019979498942757182, 'samples': 898080, 'steps': 1754, 'loss/train': 2.634122610092163} -09/20/2021 20:33:59 - INFO - __main__ - Step 28066: {'lr': 0.00019979498942757182, 'samples': 898112, 'steps': 1754, 'loss/train': 2.4754343032836914} -09/20/2021 20:34:00 - INFO - __main__ - Step 28067: {'lr': 0.00019979498942757182, 'samples': 898144, 'steps': 1754, 'loss/train': 2.5632846355438232} -09/20/2021 20:34:01 - INFO - __main__ - Step 28068: {'lr': 0.00019979498942757182, 'samples': 898176, 'steps': 1754, 'loss/train': 0.8360360264778137} -09/20/2021 20:34:01 - INFO - __main__ - Step 28069: {'lr': 0.00019979498942757182, 'samples': 898208, 'steps': 1754, 'loss/train': 2.6781678199768066} -09/20/2021 20:34:02 - INFO - __main__ - Step 28070: {'lr': 0.00019979498942757182, 'samples': 898240, 'steps': 1754, 'loss/train': 2.4666779041290283} -09/20/2021 20:34:03 - INFO - __main__ - Step 28071: {'lr': 0.00019979498942757182, 'samples': 898272, 'steps': 1754, 'loss/train': 1.2930561304092407} -09/20/2021 20:34:04 - INFO - __main__ - Step 28072: {'lr': 0.00019979498942757182, 'samples': 898304, 'steps': 1754, 'loss/train': 2.8773040771484375} -09/20/2021 20:34:04 - INFO - __main__ - Step 28073: {'lr': 0.00019979498942757182, 'samples': 898336, 'steps': 1754, 'loss/train': 2.5428786277770996} -09/20/2021 20:34:05 - INFO - __main__ - Step 28074: {'lr': 0.00019979498942757182, 'samples': 898368, 'steps': 1754, 'loss/train': 2.275949478149414} -09/20/2021 20:34:06 - INFO - __main__ - Step 28075: {'lr': 0.00019979498942757182, 'samples': 898400, 'steps': 1754, 'loss/train': 2.0236570835113525} -09/20/2021 20:34:07 - INFO - __main__ - Step 28076: {'lr': 0.00019979498942757182, 'samples': 898432, 'steps': 1754, 'loss/train': 1.2960354089736938} -09/20/2021 20:34:07 - INFO - __main__ - Step 28077: {'lr': 0.00019979498942757182, 'samples': 898464, 'steps': 1754, 'loss/train': 0.7467934489250183} -09/20/2021 20:34:08 - INFO - __main__ - Step 28078: {'lr': 0.00019979498942757182, 'samples': 898496, 'steps': 1754, 'loss/train': 0.4370272159576416} -09/20/2021 20:34:09 - INFO - __main__ - Step 28079: {'lr': 0.00019979498942757182, 'samples': 898528, 'steps': 1754, 'loss/train': 1.0253078937530518} -09/20/2021 20:34:10 - INFO - __main__ - Step 28080: {'lr': 0.00019979498942757182, 'samples': 898560, 'steps': 1754, 'loss/train': 0.7539458870887756} -09/20/2021 20:34:10 - INFO - __main__ - Step 28081: {'lr': 0.00019979458097654177, 'samples': 898592, 'steps': 1755, 'loss/train': 0.34997543692588806} -09/20/2021 20:34:11 - INFO - __main__ - Step 28082: {'lr': 0.00019979458097654177, 'samples': 898624, 'steps': 1755, 'loss/train': 0.3975237011909485} -09/20/2021 20:34:12 - INFO - __main__ - Step 28083: {'lr': 0.00019979458097654177, 'samples': 898656, 'steps': 1755, 'loss/train': 0.7996476292610168} -09/20/2021 20:34:13 - INFO - __main__ - Step 28084: {'lr': 0.00019979458097654177, 'samples': 898688, 'steps': 1755, 'loss/train': 0.5341813564300537} -09/20/2021 20:34:14 - INFO - __main__ - Step 28085: {'lr': 0.00019979458097654177, 'samples': 898720, 'steps': 1755, 'loss/train': 0.8720182180404663} -09/20/2021 20:34:15 - INFO - __main__ - Step 28086: {'lr': 0.00019979458097654177, 'samples': 898752, 'steps': 1755, 'loss/train': 2.4749584197998047} -09/20/2021 20:34:15 - INFO - __main__ - Step 28087: {'lr': 0.00019979458097654177, 'samples': 898784, 'steps': 1755, 'loss/train': 1.6858679056167603} -09/20/2021 20:34:16 - INFO - __main__ - Step 28088: {'lr': 0.00019979458097654177, 'samples': 898816, 'steps': 1755, 'loss/train': 2.8897807598114014} -09/20/2021 20:34:17 - INFO - __main__ - Step 28089: {'lr': 0.00019979458097654177, 'samples': 898848, 'steps': 1755, 'loss/train': 2.4568870067596436} -09/20/2021 20:34:18 - INFO - __main__ - Step 28090: {'lr': 0.00019979458097654177, 'samples': 898880, 'steps': 1755, 'loss/train': 2.9535293579101562} -09/20/2021 20:34:18 - INFO - __main__ - Step 28091: {'lr': 0.00019979458097654177, 'samples': 898912, 'steps': 1755, 'loss/train': 2.7098827362060547} -09/20/2021 20:34:19 - INFO - __main__ - Step 28092: {'lr': 0.00019979458097654177, 'samples': 898944, 'steps': 1755, 'loss/train': 2.3276607990264893} -09/20/2021 20:34:20 - INFO - __main__ - Step 28093: {'lr': 0.00019979458097654177, 'samples': 898976, 'steps': 1755, 'loss/train': 1.9887230396270752} -09/20/2021 20:34:21 - INFO - __main__ - Step 28094: {'lr': 0.00019979458097654177, 'samples': 899008, 'steps': 1755, 'loss/train': 3.244741916656494} -09/20/2021 20:34:21 - INFO - __main__ - Step 28095: {'lr': 0.00019979458097654177, 'samples': 899040, 'steps': 1755, 'loss/train': 2.3525288105010986} -09/20/2021 20:34:22 - INFO - __main__ - Step 28096: {'lr': 0.00019979458097654177, 'samples': 899072, 'steps': 1755, 'loss/train': 2.475829839706421} -09/20/2021 20:34:23 - INFO - __main__ - Step 28097: {'lr': 0.00019979417211944797, 'samples': 899104, 'steps': 1756, 'loss/train': 1.627610445022583} -09/20/2021 20:34:24 - INFO - __main__ - Step 28098: {'lr': 0.00019979417211944797, 'samples': 899136, 'steps': 1756, 'loss/train': 2.1259498596191406} -09/20/2021 20:34:25 - INFO - __main__ - Step 28099: {'lr': 0.00019979417211944797, 'samples': 899168, 'steps': 1756, 'loss/train': 1.424021601676941} -09/20/2021 20:34:25 - INFO - __main__ - Step 28100: {'lr': 0.00019979417211944797, 'samples': 899200, 'steps': 1756, 'loss/train': 2.8982250690460205} -09/20/2021 20:34:26 - INFO - __main__ - Step 28101: {'lr': 0.00019979417211944797, 'samples': 899232, 'steps': 1756, 'loss/train': 2.627575397491455} -09/20/2021 20:34:27 - INFO - __main__ - Step 28102: {'lr': 0.00019979417211944797, 'samples': 899264, 'steps': 1756, 'loss/train': 2.0342764854431152} -09/20/2021 20:34:28 - INFO - __main__ - Step 28103: {'lr': 0.00019979417211944797, 'samples': 899296, 'steps': 1756, 'loss/train': 2.2061076164245605} -09/20/2021 20:34:28 - INFO - __main__ - Step 28104: {'lr': 0.00019979417211944797, 'samples': 899328, 'steps': 1756, 'loss/train': 3.155565023422241} -09/20/2021 20:34:29 - INFO - __main__ - Step 28105: {'lr': 0.00019979417211944797, 'samples': 899360, 'steps': 1756, 'loss/train': 2.806299924850464} -09/20/2021 20:34:30 - INFO - __main__ - Step 28106: {'lr': 0.00019979417211944797, 'samples': 899392, 'steps': 1756, 'loss/train': 1.3397513628005981} -09/20/2021 20:34:31 - INFO - __main__ - Step 28107: {'lr': 0.00019979417211944797, 'samples': 899424, 'steps': 1756, 'loss/train': 2.227240562438965} -09/20/2021 20:34:31 - INFO - __main__ - Step 28108: {'lr': 0.00019979417211944797, 'samples': 899456, 'steps': 1756, 'loss/train': 2.209224224090576} -09/20/2021 20:34:32 - INFO - __main__ - Step 28109: {'lr': 0.00019979417211944797, 'samples': 899488, 'steps': 1756, 'loss/train': 3.2279772758483887} -09/20/2021 20:34:33 - INFO - __main__ - Step 28110: {'lr': 0.00019979417211944797, 'samples': 899520, 'steps': 1756, 'loss/train': 2.1135661602020264} -09/20/2021 20:34:34 - INFO - __main__ - Step 28111: {'lr': 0.00019979417211944797, 'samples': 899552, 'steps': 1756, 'loss/train': 1.4468944072723389} -09/20/2021 20:34:34 - INFO - __main__ - Step 28112: {'lr': 0.00019979417211944797, 'samples': 899584, 'steps': 1756, 'loss/train': 2.3355345726013184} -09/20/2021 20:34:35 - INFO - __main__ - Step 28113: {'lr': 0.00019979376285629208, 'samples': 899616, 'steps': 1757, 'loss/train': 4.043959617614746} -09/20/2021 20:34:36 - INFO - __main__ - Step 28114: {'lr': 0.00019979376285629208, 'samples': 899648, 'steps': 1757, 'loss/train': 2.7171006202697754} -09/20/2021 20:34:37 - INFO - __main__ - Step 28115: {'lr': 0.00019979376285629208, 'samples': 899680, 'steps': 1757, 'loss/train': 3.2187883853912354} -09/20/2021 20:34:38 - INFO - __main__ - Step 28116: {'lr': 0.00019979376285629208, 'samples': 899712, 'steps': 1757, 'loss/train': 2.115828514099121} -09/20/2021 20:34:39 - INFO - __main__ - Step 28117: {'lr': 0.00019979376285629208, 'samples': 899744, 'steps': 1757, 'loss/train': 3.3327598571777344} -09/20/2021 20:34:40 - INFO - __main__ - Step 28118: {'lr': 0.00019979376285629208, 'samples': 899776, 'steps': 1757, 'loss/train': 2.2575981616973877} -09/20/2021 20:34:40 - INFO - __main__ - Step 28119: {'lr': 0.00019979376285629208, 'samples': 899808, 'steps': 1757, 'loss/train': 2.759697198867798} -09/20/2021 20:34:41 - INFO - __main__ - Step 28120: {'lr': 0.00019979376285629208, 'samples': 899840, 'steps': 1757, 'loss/train': 2.721691370010376} -09/20/2021 20:34:42 - INFO - __main__ - Step 28121: {'lr': 0.00019979376285629208, 'samples': 899872, 'steps': 1757, 'loss/train': 2.615340232849121} -09/20/2021 20:34:43 - INFO - __main__ - Step 28122: {'lr': 0.00019979376285629208, 'samples': 899904, 'steps': 1757, 'loss/train': 2.0939505100250244} -09/20/2021 20:34:43 - INFO - __main__ - Step 28123: {'lr': 0.00019979376285629208, 'samples': 899936, 'steps': 1757, 'loss/train': 3.0250751972198486} -09/20/2021 20:34:44 - INFO - __main__ - Step 28124: {'lr': 0.00019979376285629208, 'samples': 899968, 'steps': 1757, 'loss/train': 2.2685227394104004} -09/20/2021 20:34:45 - INFO - __main__ - Step 28125: {'lr': 0.00019979376285629208, 'samples': 900000, 'steps': 1757, 'loss/train': 2.5029942989349365} -09/20/2021 20:34:46 - INFO - __main__ - Step 28126: {'lr': 0.00019979376285629208, 'samples': 900032, 'steps': 1757, 'loss/train': 0.6026774644851685} -09/20/2021 20:34:46 - INFO - __main__ - Step 28127: {'lr': 0.00019979376285629208, 'samples': 900064, 'steps': 1757, 'loss/train': 2.653587818145752} -09/20/2021 20:34:47 - INFO - __main__ - Step 28128: {'lr': 0.00019979376285629208, 'samples': 900096, 'steps': 1757, 'loss/train': 2.7721502780914307} -09/20/2021 20:34:48 - INFO - __main__ - Step 28129: {'lr': 0.00019979335318707575, 'samples': 900128, 'steps': 1758, 'loss/train': 2.7289316654205322} -09/20/2021 20:34:49 - INFO - __main__ - Step 28130: {'lr': 0.00019979335318707575, 'samples': 900160, 'steps': 1758, 'loss/train': 2.3855533599853516} -09/20/2021 20:34:49 - INFO - __main__ - Step 28131: {'lr': 0.00019979335318707575, 'samples': 900192, 'steps': 1758, 'loss/train': 2.8048129081726074} -09/20/2021 20:34:50 - INFO - __main__ - Step 28132: {'lr': 0.00019979335318707575, 'samples': 900224, 'steps': 1758, 'loss/train': 2.3562510013580322} -09/20/2021 20:34:51 - INFO - __main__ - Step 28133: {'lr': 0.00019979335318707575, 'samples': 900256, 'steps': 1758, 'loss/train': 1.9893136024475098} -09/20/2021 20:34:52 - INFO - __main__ - Step 28134: {'lr': 0.00019979335318707575, 'samples': 900288, 'steps': 1758, 'loss/train': 2.456252098083496} -09/20/2021 20:34:52 - INFO - __main__ - Step 28135: {'lr': 0.00019979335318707575, 'samples': 900320, 'steps': 1758, 'loss/train': 2.4712679386138916} -09/20/2021 20:34:53 - INFO - __main__ - Step 28136: {'lr': 0.00019979335318707575, 'samples': 900352, 'steps': 1758, 'loss/train': 1.76068913936615} -09/20/2021 20:34:54 - INFO - __main__ - Step 28137: {'lr': 0.00019979335318707575, 'samples': 900384, 'steps': 1758, 'loss/train': 2.3548803329467773} -09/20/2021 20:34:55 - INFO - __main__ - Step 28138: {'lr': 0.00019979335318707575, 'samples': 900416, 'steps': 1758, 'loss/train': 1.7171542644500732} -09/20/2021 20:34:55 - INFO - __main__ - Step 28139: {'lr': 0.00019979335318707575, 'samples': 900448, 'steps': 1758, 'loss/train': 5.9084954261779785} -09/20/2021 20:34:56 - INFO - __main__ - Step 28140: {'lr': 0.00019979335318707575, 'samples': 900480, 'steps': 1758, 'loss/train': 5.810564994812012} -09/20/2021 20:34:57 - INFO - __main__ - Step 28141: {'lr': 0.00019979335318707575, 'samples': 900512, 'steps': 1758, 'loss/train': 5.861917972564697} -09/20/2021 20:34:58 - INFO - __main__ - Step 28142: {'lr': 0.00019979335318707575, 'samples': 900544, 'steps': 1758, 'loss/train': 2.951885461807251} -09/20/2021 20:34:58 - INFO - __main__ - Step 28143: {'lr': 0.00019979335318707575, 'samples': 900576, 'steps': 1758, 'loss/train': 2.6020243167877197} -09/20/2021 20:34:59 - INFO - __main__ - Step 28144: {'lr': 0.00019979335318707575, 'samples': 900608, 'steps': 1758, 'loss/train': 2.5162882804870605} -09/20/2021 20:35:00 - INFO - __main__ - Step 28145: {'lr': 0.00019979294311180064, 'samples': 900640, 'steps': 1759, 'loss/train': 2.728667974472046} -09/20/2021 20:35:02 - INFO - __main__ - Step 28146: {'lr': 0.00019979294311180064, 'samples': 900672, 'steps': 1759, 'loss/train': 2.2550883293151855} -09/20/2021 20:35:02 - INFO - __main__ - Step 28147: {'lr': 0.00019979294311180064, 'samples': 900704, 'steps': 1759, 'loss/train': 2.890990972518921} -09/20/2021 20:35:03 - INFO - __main__ - Step 28148: {'lr': 0.00019979294311180064, 'samples': 900736, 'steps': 1759, 'loss/train': 3.07580828666687} -09/20/2021 20:35:04 - INFO - __main__ - Step 28149: {'lr': 0.00019979294311180064, 'samples': 900768, 'steps': 1759, 'loss/train': 2.763589859008789} -09/20/2021 20:35:05 - INFO - __main__ - Step 28150: {'lr': 0.00019979294311180064, 'samples': 900800, 'steps': 1759, 'loss/train': 2.7156505584716797} -09/20/2021 20:35:05 - INFO - __main__ - Step 28151: {'lr': 0.00019979294311180064, 'samples': 900832, 'steps': 1759, 'loss/train': 2.2872819900512695} -09/20/2021 20:35:06 - INFO - __main__ - Step 28152: {'lr': 0.00019979294311180064, 'samples': 900864, 'steps': 1759, 'loss/train': 2.906797409057617} -09/20/2021 20:35:07 - INFO - __main__ - Step 28153: {'lr': 0.00019979294311180064, 'samples': 900896, 'steps': 1759, 'loss/train': 2.364910125732422} -09/20/2021 20:35:08 - INFO - __main__ - Step 28154: {'lr': 0.00019979294311180064, 'samples': 900928, 'steps': 1759, 'loss/train': 2.4977610111236572} -09/20/2021 20:35:08 - INFO - __main__ - Step 28155: {'lr': 0.00019979294311180064, 'samples': 900960, 'steps': 1759, 'loss/train': 1.9782623052597046} -09/20/2021 20:35:09 - INFO - __main__ - Step 28156: {'lr': 0.00019979294311180064, 'samples': 900992, 'steps': 1759, 'loss/train': 2.3402292728424072} -09/20/2021 20:35:10 - INFO - __main__ - Step 28157: {'lr': 0.00019979294311180064, 'samples': 901024, 'steps': 1759, 'loss/train': 3.5994725227355957} -09/20/2021 20:35:11 - INFO - __main__ - Step 28158: {'lr': 0.00019979294311180064, 'samples': 901056, 'steps': 1759, 'loss/train': 2.11305832862854} -09/20/2021 20:35:11 - INFO - __main__ - Step 28159: {'lr': 0.00019979294311180064, 'samples': 901088, 'steps': 1759, 'loss/train': 2.059142589569092} -09/20/2021 20:35:12 - INFO - __main__ - Step 28160: {'lr': 0.00019979294311180064, 'samples': 901120, 'steps': 1759, 'loss/train': 2.070884943008423} -09/20/2021 20:35:13 - INFO - __main__ - Step 28161: {'lr': 0.00019979253263046842, 'samples': 901152, 'steps': 1760, 'loss/train': 2.809056282043457} -09/20/2021 20:35:14 - INFO - __main__ - Step 28162: {'lr': 0.00019979253263046842, 'samples': 901184, 'steps': 1760, 'loss/train': 2.7182278633117676} -09/20/2021 20:35:15 - INFO - __main__ - Step 28163: {'lr': 0.00019979253263046842, 'samples': 901216, 'steps': 1760, 'loss/train': 2.616732120513916} -09/20/2021 20:35:15 - INFO - __main__ - Step 28164: {'lr': 0.00019979253263046842, 'samples': 901248, 'steps': 1760, 'loss/train': 1.0152652263641357} -09/20/2021 20:35:16 - INFO - __main__ - Step 28165: {'lr': 0.00019979253263046842, 'samples': 901280, 'steps': 1760, 'loss/train': 2.9522018432617188} -09/20/2021 20:35:17 - INFO - __main__ - Step 28166: {'lr': 0.00019979253263046842, 'samples': 901312, 'steps': 1760, 'loss/train': 2.8321008682250977} -09/20/2021 20:35:18 - INFO - __main__ - Step 28167: {'lr': 0.00019979253263046842, 'samples': 901344, 'steps': 1760, 'loss/train': 2.46675705909729} -09/20/2021 20:35:18 - INFO - __main__ - Step 28168: {'lr': 0.00019979253263046842, 'samples': 901376, 'steps': 1760, 'loss/train': 1.4550012350082397} -09/20/2021 20:35:19 - INFO - __main__ - Step 28169: {'lr': 0.00019979253263046842, 'samples': 901408, 'steps': 1760, 'loss/train': 3.297431468963623} -09/20/2021 20:35:20 - INFO - __main__ - Step 28170: {'lr': 0.00019979253263046842, 'samples': 901440, 'steps': 1760, 'loss/train': 1.9436793327331543} -09/20/2021 20:35:21 - INFO - __main__ - Step 28171: {'lr': 0.00019979253263046842, 'samples': 901472, 'steps': 1760, 'loss/train': 1.2926827669143677} -09/20/2021 20:35:21 - INFO - __main__ - Step 28172: {'lr': 0.00019979253263046842, 'samples': 901504, 'steps': 1760, 'loss/train': 0.9827225804328918} -09/20/2021 20:35:22 - INFO - __main__ - Step 28173: {'lr': 0.00019979253263046842, 'samples': 901536, 'steps': 1760, 'loss/train': 0.6452434659004211} -09/20/2021 20:35:23 - INFO - __main__ - Step 28174: {'lr': 0.00019979253263046842, 'samples': 901568, 'steps': 1760, 'loss/train': 0.7080342173576355} -09/20/2021 20:35:24 - INFO - __main__ - Step 28175: {'lr': 0.00019979253263046842, 'samples': 901600, 'steps': 1760, 'loss/train': 1.0054655075073242} -09/20/2021 20:35:24 - INFO - __main__ - Step 28176: {'lr': 0.00019979253263046842, 'samples': 901632, 'steps': 1760, 'loss/train': 1.1514489650726318} -09/20/2021 20:35:25 - INFO - __main__ - Step 28177: {'lr': 0.0001997921217430808, 'samples': 901664, 'steps': 1761, 'loss/train': 2.061115264892578} -09/20/2021 20:35:27 - INFO - __main__ - Step 28178: {'lr': 0.0001997921217430808, 'samples': 901696, 'steps': 1761, 'loss/train': 2.8011412620544434} -09/20/2021 20:35:28 - INFO - __main__ - Step 28179: {'lr': 0.0001997921217430808, 'samples': 901728, 'steps': 1761, 'loss/train': 2.4475913047790527} -09/20/2021 20:35:28 - INFO - __main__ - Step 28180: {'lr': 0.0001997921217430808, 'samples': 901760, 'steps': 1761, 'loss/train': 0.8820478916168213} -09/20/2021 20:35:29 - INFO - __main__ - Step 28181: {'lr': 0.0001997921217430808, 'samples': 901792, 'steps': 1761, 'loss/train': 2.069678544998169} -09/20/2021 20:35:30 - INFO - __main__ - Step 28182: {'lr': 0.0001997921217430808, 'samples': 901824, 'steps': 1761, 'loss/train': 2.8230528831481934} -09/20/2021 20:35:31 - INFO - __main__ - Step 28183: {'lr': 0.0001997921217430808, 'samples': 901856, 'steps': 1761, 'loss/train': 2.3229434490203857} -09/20/2021 20:35:31 - INFO - __main__ - Step 28184: {'lr': 0.0001997921217430808, 'samples': 901888, 'steps': 1761, 'loss/train': 2.1416327953338623} -09/20/2021 20:35:32 - INFO - __main__ - Step 28185: {'lr': 0.0001997921217430808, 'samples': 901920, 'steps': 1761, 'loss/train': 2.5305726528167725} -09/20/2021 20:35:33 - INFO - __main__ - Step 28186: {'lr': 0.0001997921217430808, 'samples': 901952, 'steps': 1761, 'loss/train': 3.1857099533081055} -09/20/2021 20:35:34 - INFO - __main__ - Step 28187: {'lr': 0.0001997921217430808, 'samples': 901984, 'steps': 1761, 'loss/train': 2.62170147895813} -09/20/2021 20:35:34 - INFO - __main__ - Step 28188: {'lr': 0.0001997921217430808, 'samples': 902016, 'steps': 1761, 'loss/train': 2.5579018592834473} -09/20/2021 20:35:35 - INFO - __main__ - Step 28189: {'lr': 0.0001997921217430808, 'samples': 902048, 'steps': 1761, 'loss/train': 2.078190326690674} -09/20/2021 20:35:36 - INFO - __main__ - Step 28190: {'lr': 0.0001997921217430808, 'samples': 902080, 'steps': 1761, 'loss/train': 2.634021282196045} -09/20/2021 20:35:37 - INFO - __main__ - Step 28191: {'lr': 0.0001997921217430808, 'samples': 902112, 'steps': 1761, 'loss/train': 1.9614628553390503} -09/20/2021 20:35:37 - INFO - __main__ - Step 28192: {'lr': 0.0001997921217430808, 'samples': 902144, 'steps': 1761, 'loss/train': 2.285010814666748} -09/20/2021 20:35:38 - INFO - __main__ - Step 28193: {'lr': 0.0001997917104496394, 'samples': 902176, 'steps': 1762, 'loss/train': 2.4956042766571045} -09/20/2021 20:35:39 - INFO - __main__ - Step 28194: {'lr': 0.0001997917104496394, 'samples': 902208, 'steps': 1762, 'loss/train': 2.0663816928863525} -09/20/2021 20:35:40 - INFO - __main__ - Step 28195: {'lr': 0.0001997917104496394, 'samples': 902240, 'steps': 1762, 'loss/train': 4.11752986907959} -09/20/2021 20:35:40 - INFO - __main__ - Step 28196: {'lr': 0.0001997917104496394, 'samples': 902272, 'steps': 1762, 'loss/train': 2.440152406692505} -09/20/2021 20:35:41 - INFO - __main__ - Step 28197: {'lr': 0.0001997917104496394, 'samples': 902304, 'steps': 1762, 'loss/train': 3.0113723278045654} -09/20/2021 20:35:42 - INFO - __main__ - Step 28198: {'lr': 0.0001997917104496394, 'samples': 902336, 'steps': 1762, 'loss/train': 3.0055909156799316} -09/20/2021 20:35:43 - INFO - __main__ - Step 28199: {'lr': 0.0001997917104496394, 'samples': 902368, 'steps': 1762, 'loss/train': 2.5878231525421143} -09/20/2021 20:35:43 - INFO - __main__ - Step 28200: {'lr': 0.0001997917104496394, 'samples': 902400, 'steps': 1762, 'loss/train': 3.736072063446045} -09/20/2021 20:35:44 - INFO - __main__ - Step 28201: {'lr': 0.0001997917104496394, 'samples': 902432, 'steps': 1762, 'loss/train': 3.031174659729004} -09/20/2021 20:35:45 - INFO - __main__ - Step 28202: {'lr': 0.0001997917104496394, 'samples': 902464, 'steps': 1762, 'loss/train': 2.5098063945770264} -09/20/2021 20:35:46 - INFO - __main__ - Step 28203: {'lr': 0.0001997917104496394, 'samples': 902496, 'steps': 1762, 'loss/train': 2.7553207874298096} -09/20/2021 20:35:46 - INFO - __main__ - Step 28204: {'lr': 0.0001997917104496394, 'samples': 902528, 'steps': 1762, 'loss/train': 3.9302186965942383} -09/20/2021 20:35:47 - INFO - __main__ - Step 28205: {'lr': 0.0001997917104496394, 'samples': 902560, 'steps': 1762, 'loss/train': 2.4979054927825928} -09/20/2021 20:35:48 - INFO - __main__ - Step 28206: {'lr': 0.0001997917104496394, 'samples': 902592, 'steps': 1762, 'loss/train': 2.068418025970459} -09/20/2021 20:35:49 - INFO - __main__ - Step 28207: {'lr': 0.0001997917104496394, 'samples': 902624, 'steps': 1762, 'loss/train': 2.329430103302002} -09/20/2021 20:35:49 - INFO - __main__ - Step 28208: {'lr': 0.0001997917104496394, 'samples': 902656, 'steps': 1762, 'loss/train': 2.201005697250366} -09/20/2021 20:35:50 - INFO - __main__ - Step 28209: {'lr': 0.00019979129875014593, 'samples': 902688, 'steps': 1763, 'loss/train': 2.291069746017456} -09/20/2021 20:35:52 - INFO - __main__ - Step 28210: {'lr': 0.00019979129875014593, 'samples': 902720, 'steps': 1763, 'loss/train': 3.6354496479034424} -09/20/2021 20:35:52 - INFO - __main__ - Step 28211: {'lr': 0.00019979129875014593, 'samples': 902752, 'steps': 1763, 'loss/train': 3.6367218494415283} -09/20/2021 20:35:53 - INFO - __main__ - Step 28212: {'lr': 0.00019979129875014593, 'samples': 902784, 'steps': 1763, 'loss/train': 2.1638898849487305} -09/20/2021 20:35:54 - INFO - __main__ - Step 28213: {'lr': 0.00019979129875014593, 'samples': 902816, 'steps': 1763, 'loss/train': 2.658881902694702} -09/20/2021 20:35:55 - INFO - __main__ - Step 28214: {'lr': 0.00019979129875014593, 'samples': 902848, 'steps': 1763, 'loss/train': 3.088853359222412} -09/20/2021 20:35:55 - INFO - __main__ - Step 28215: {'lr': 0.00019979129875014593, 'samples': 902880, 'steps': 1763, 'loss/train': 2.1240198612213135} -09/20/2021 20:35:56 - INFO - __main__ - Step 28216: {'lr': 0.00019979129875014593, 'samples': 902912, 'steps': 1763, 'loss/train': 2.3814949989318848} -09/20/2021 20:35:57 - INFO - __main__ - Step 28217: {'lr': 0.00019979129875014593, 'samples': 902944, 'steps': 1763, 'loss/train': 1.9340929985046387} -09/20/2021 20:35:58 - INFO - __main__ - Step 28218: {'lr': 0.00019979129875014593, 'samples': 902976, 'steps': 1763, 'loss/train': 3.067795991897583} -09/20/2021 20:35:58 - INFO - __main__ - Step 28219: {'lr': 0.00019979129875014593, 'samples': 903008, 'steps': 1763, 'loss/train': 2.457982301712036} -09/20/2021 20:35:59 - INFO - __main__ - Step 28220: {'lr': 0.00019979129875014593, 'samples': 903040, 'steps': 1763, 'loss/train': 2.3532657623291016} -09/20/2021 20:36:00 - INFO - __main__ - Step 28221: {'lr': 0.00019979129875014593, 'samples': 903072, 'steps': 1763, 'loss/train': 3.0924394130706787} -09/20/2021 20:36:01 - INFO - __main__ - Step 28222: {'lr': 0.00019979129875014593, 'samples': 903104, 'steps': 1763, 'loss/train': 3.1846084594726562} -09/20/2021 20:36:01 - INFO - __main__ - Step 28223: {'lr': 0.00019979129875014593, 'samples': 903136, 'steps': 1763, 'loss/train': 2.2844693660736084} -09/20/2021 20:36:02 - INFO - __main__ - Step 28224: {'lr': 0.00019979129875014593, 'samples': 903168, 'steps': 1763, 'loss/train': 2.167422294616699} -09/20/2021 20:36:03 - INFO - __main__ - Step 28225: {'lr': 0.00019979088664460207, 'samples': 903200, 'steps': 1764, 'loss/train': 2.155677080154419} -09/20/2021 20:36:04 - INFO - __main__ - Step 28226: {'lr': 0.00019979088664460207, 'samples': 903232, 'steps': 1764, 'loss/train': 2.694291830062866} -09/20/2021 20:36:05 - INFO - __main__ - Step 28227: {'lr': 0.00019979088664460207, 'samples': 903264, 'steps': 1764, 'loss/train': 2.510540008544922} -09/20/2021 20:36:05 - INFO - __main__ - Step 28228: {'lr': 0.00019979088664460207, 'samples': 903296, 'steps': 1764, 'loss/train': 1.7053604125976562} -09/20/2021 20:36:06 - INFO - __main__ - Step 28229: {'lr': 0.00019979088664460207, 'samples': 903328, 'steps': 1764, 'loss/train': 3.304295539855957} -09/20/2021 20:36:07 - INFO - __main__ - Step 28230: {'lr': 0.00019979088664460207, 'samples': 903360, 'steps': 1764, 'loss/train': 3.2440502643585205} -09/20/2021 20:36:08 - INFO - __main__ - Step 28231: {'lr': 0.00019979088664460207, 'samples': 903392, 'steps': 1764, 'loss/train': 0.5495918989181519} -09/20/2021 20:36:08 - INFO - __main__ - Step 28232: {'lr': 0.00019979088664460207, 'samples': 903424, 'steps': 1764, 'loss/train': 2.7635412216186523} -09/20/2021 20:36:09 - INFO - __main__ - Step 28233: {'lr': 0.00019979088664460207, 'samples': 903456, 'steps': 1764, 'loss/train': 1.5013015270233154} -09/20/2021 20:36:10 - INFO - __main__ - Step 28234: {'lr': 0.00019979088664460207, 'samples': 903488, 'steps': 1764, 'loss/train': 2.0601396560668945} -09/20/2021 20:36:11 - INFO - __main__ - Step 28235: {'lr': 0.00019979088664460207, 'samples': 903520, 'steps': 1764, 'loss/train': 1.8319275379180908} -09/20/2021 20:36:11 - INFO - __main__ - Step 28236: {'lr': 0.00019979088664460207, 'samples': 903552, 'steps': 1764, 'loss/train': 2.018950939178467} -09/20/2021 20:36:12 - INFO - __main__ - Step 28237: {'lr': 0.00019979088664460207, 'samples': 903584, 'steps': 1764, 'loss/train': 1.3200757503509521} -09/20/2021 20:36:13 - INFO - __main__ - Step 28238: {'lr': 0.00019979088664460207, 'samples': 903616, 'steps': 1764, 'loss/train': 2.753514289855957} -09/20/2021 20:36:14 - INFO - __main__ - Step 28239: {'lr': 0.00019979088664460207, 'samples': 903648, 'steps': 1764, 'loss/train': 2.6515865325927734} -09/20/2021 20:36:15 - INFO - __main__ - Step 28240: {'lr': 0.00019979088664460207, 'samples': 903680, 'steps': 1764, 'loss/train': 2.327197790145874} -09/20/2021 20:36:16 - INFO - __main__ - Step 28241: {'lr': 0.00019979047413300947, 'samples': 903712, 'steps': 1765, 'loss/train': 2.5824859142303467} -09/20/2021 20:36:16 - INFO - __main__ - Step 28242: {'lr': 0.00019979047413300947, 'samples': 903744, 'steps': 1765, 'loss/train': 1.7955029010772705} -09/20/2021 20:36:17 - INFO - __main__ - Step 28243: {'lr': 0.00019979047413300947, 'samples': 903776, 'steps': 1765, 'loss/train': 3.089315891265869} -09/20/2021 20:36:18 - INFO - __main__ - Step 28244: {'lr': 0.00019979047413300947, 'samples': 903808, 'steps': 1765, 'loss/train': 5.2030839920043945} -09/20/2021 20:36:19 - INFO - __main__ - Step 28245: {'lr': 0.00019979047413300947, 'samples': 903840, 'steps': 1765, 'loss/train': 3.7095754146575928} -09/20/2021 20:36:19 - INFO - __main__ - Step 28246: {'lr': 0.00019979047413300947, 'samples': 903872, 'steps': 1765, 'loss/train': 2.641775608062744} -09/20/2021 20:36:20 - INFO - __main__ - Step 28247: {'lr': 0.00019979047413300947, 'samples': 903904, 'steps': 1765, 'loss/train': 3.0481951236724854} -09/20/2021 20:36:21 - INFO - __main__ - Step 28248: {'lr': 0.00019979047413300947, 'samples': 903936, 'steps': 1765, 'loss/train': 3.4531400203704834} -09/20/2021 20:36:22 - INFO - __main__ - Step 28249: {'lr': 0.00019979047413300947, 'samples': 903968, 'steps': 1765, 'loss/train': 3.1833114624023438} -09/20/2021 20:36:22 - INFO - __main__ - Step 28250: {'lr': 0.00019979047413300947, 'samples': 904000, 'steps': 1765, 'loss/train': 0.613858699798584} -09/20/2021 20:36:23 - INFO - __main__ - Step 28251: {'lr': 0.00019979047413300947, 'samples': 904032, 'steps': 1765, 'loss/train': 3.5755951404571533} -09/20/2021 20:36:24 - INFO - __main__ - Step 28252: {'lr': 0.00019979047413300947, 'samples': 904064, 'steps': 1765, 'loss/train': 1.9345872402191162} -09/20/2021 20:36:25 - INFO - __main__ - Step 28253: {'lr': 0.00019979047413300947, 'samples': 904096, 'steps': 1765, 'loss/train': 2.7377612590789795} -09/20/2021 20:36:25 - INFO - __main__ - Step 28254: {'lr': 0.00019979047413300947, 'samples': 904128, 'steps': 1765, 'loss/train': 3.3759002685546875} -09/20/2021 20:36:26 - INFO - __main__ - Step 28255: {'lr': 0.00019979047413300947, 'samples': 904160, 'steps': 1765, 'loss/train': 2.2509567737579346} -09/20/2021 20:36:27 - INFO - __main__ - Step 28256: {'lr': 0.00019979047413300947, 'samples': 904192, 'steps': 1765, 'loss/train': 0.6272528171539307} -09/20/2021 20:36:28 - INFO - __main__ - Step 28257: {'lr': 0.0001997900612153698, 'samples': 904224, 'steps': 1766, 'loss/train': 2.6718993186950684} -09/20/2021 20:36:29 - INFO - __main__ - Step 28258: {'lr': 0.0001997900612153698, 'samples': 904256, 'steps': 1766, 'loss/train': 2.7577404975891113} -09/20/2021 20:36:29 - INFO - __main__ - Step 28259: {'lr': 0.0001997900612153698, 'samples': 904288, 'steps': 1766, 'loss/train': 3.376685619354248} -09/20/2021 20:36:30 - INFO - __main__ - Step 28260: {'lr': 0.0001997900612153698, 'samples': 904320, 'steps': 1766, 'loss/train': 2.0571653842926025} -09/20/2021 20:36:31 - INFO - __main__ - Step 28261: {'lr': 0.0001997900612153698, 'samples': 904352, 'steps': 1766, 'loss/train': 1.408764362335205} -09/20/2021 20:36:32 - INFO - __main__ - Step 28262: {'lr': 0.0001997900612153698, 'samples': 904384, 'steps': 1766, 'loss/train': 2.0089964866638184} -09/20/2021 20:36:32 - INFO - __main__ - Step 28263: {'lr': 0.0001997900612153698, 'samples': 904416, 'steps': 1766, 'loss/train': 6.743584632873535} -09/20/2021 20:36:33 - INFO - __main__ - Step 28264: {'lr': 0.0001997900612153698, 'samples': 904448, 'steps': 1766, 'loss/train': 1.9176408052444458} -09/20/2021 20:36:34 - INFO - __main__ - Step 28265: {'lr': 0.0001997900612153698, 'samples': 904480, 'steps': 1766, 'loss/train': 2.549044370651245} -09/20/2021 20:36:35 - INFO - __main__ - Step 28266: {'lr': 0.0001997900612153698, 'samples': 904512, 'steps': 1766, 'loss/train': 2.6993284225463867} -09/20/2021 20:36:35 - INFO - __main__ - Step 28267: {'lr': 0.0001997900612153698, 'samples': 904544, 'steps': 1766, 'loss/train': 3.001816749572754} -09/20/2021 20:36:36 - INFO - __main__ - Step 28268: {'lr': 0.0001997900612153698, 'samples': 904576, 'steps': 1766, 'loss/train': 2.0555903911590576} -09/20/2021 20:36:37 - INFO - __main__ - Step 28269: {'lr': 0.0001997900612153698, 'samples': 904608, 'steps': 1766, 'loss/train': 2.671504497528076} -09/20/2021 20:36:38 - INFO - __main__ - Step 28270: {'lr': 0.0001997900612153698, 'samples': 904640, 'steps': 1766, 'loss/train': 2.1083414554595947} -09/20/2021 20:36:38 - INFO - __main__ - Step 28271: {'lr': 0.0001997900612153698, 'samples': 904672, 'steps': 1766, 'loss/train': 2.594205379486084} -09/20/2021 20:36:40 - INFO - __main__ - Step 28272: {'lr': 0.0001997900612153698, 'samples': 904704, 'steps': 1766, 'loss/train': 1.9184527397155762} -09/20/2021 20:36:41 - INFO - __main__ - Step 28273: {'lr': 0.00019978964789168477, 'samples': 904736, 'steps': 1767, 'loss/train': 2.7516870498657227} -09/20/2021 20:36:41 - INFO - __main__ - Step 28274: {'lr': 0.00019978964789168477, 'samples': 904768, 'steps': 1767, 'loss/train': 3.0608527660369873} -09/20/2021 20:36:42 - INFO - __main__ - Step 28275: {'lr': 0.00019978964789168477, 'samples': 904800, 'steps': 1767, 'loss/train': 2.2661149501800537} -09/20/2021 20:36:43 - INFO - __main__ - Step 28276: {'lr': 0.00019978964789168477, 'samples': 904832, 'steps': 1767, 'loss/train': 2.4725563526153564} -09/20/2021 20:36:44 - INFO - __main__ - Step 28277: {'lr': 0.00019978964789168477, 'samples': 904864, 'steps': 1767, 'loss/train': 2.389389991760254} -09/20/2021 20:36:44 - INFO - __main__ - Step 28278: {'lr': 0.00019978964789168477, 'samples': 904896, 'steps': 1767, 'loss/train': 4.629029750823975} -09/20/2021 20:36:45 - INFO - __main__ - Step 28279: {'lr': 0.00019978964789168477, 'samples': 904928, 'steps': 1767, 'loss/train': 2.7902204990386963} -09/20/2021 20:36:46 - INFO - __main__ - Step 28280: {'lr': 0.00019978964789168477, 'samples': 904960, 'steps': 1767, 'loss/train': 2.621123790740967} -09/20/2021 20:36:47 - INFO - __main__ - Step 28281: {'lr': 0.00019978964789168477, 'samples': 904992, 'steps': 1767, 'loss/train': 2.1972386837005615} -09/20/2021 20:36:47 - INFO - __main__ - Step 28282: {'lr': 0.00019978964789168477, 'samples': 905024, 'steps': 1767, 'loss/train': 2.110652208328247} -09/20/2021 20:36:48 - INFO - __main__ - Step 28283: {'lr': 0.00019978964789168477, 'samples': 905056, 'steps': 1767, 'loss/train': 2.7672622203826904} -09/20/2021 20:36:49 - INFO - __main__ - Step 28284: {'lr': 0.00019978964789168477, 'samples': 905088, 'steps': 1767, 'loss/train': 2.295140027999878} -09/20/2021 20:36:50 - INFO - __main__ - Step 28285: {'lr': 0.00019978964789168477, 'samples': 905120, 'steps': 1767, 'loss/train': 2.887678384780884} -09/20/2021 20:36:50 - INFO - __main__ - Step 28286: {'lr': 0.00019978964789168477, 'samples': 905152, 'steps': 1767, 'loss/train': 3.0905990600585938} -09/20/2021 20:36:51 - INFO - __main__ - Step 28287: {'lr': 0.00019978964789168477, 'samples': 905184, 'steps': 1767, 'loss/train': 2.6912803649902344} -09/20/2021 20:36:52 - INFO - __main__ - Step 28288: {'lr': 0.00019978964789168477, 'samples': 905216, 'steps': 1767, 'loss/train': 2.966423988342285} -09/20/2021 20:36:53 - INFO - __main__ - Step 28289: {'lr': 0.00019978923416195604, 'samples': 905248, 'steps': 1768, 'loss/train': 3.122843027114868} -09/20/2021 20:36:54 - INFO - __main__ - Step 28290: {'lr': 0.00019978923416195604, 'samples': 905280, 'steps': 1768, 'loss/train': 2.6181304454803467} -09/20/2021 20:36:54 - INFO - __main__ - Step 28291: {'lr': 0.00019978923416195604, 'samples': 905312, 'steps': 1768, 'loss/train': 2.7030837535858154} -09/20/2021 20:36:55 - INFO - __main__ - Step 28292: {'lr': 0.00019978923416195604, 'samples': 905344, 'steps': 1768, 'loss/train': 2.656982421875} -09/20/2021 20:36:56 - INFO - __main__ - Step 28293: {'lr': 0.00019978923416195604, 'samples': 905376, 'steps': 1768, 'loss/train': 2.779158353805542} -09/20/2021 20:36:57 - INFO - __main__ - Step 28294: {'lr': 0.00019978923416195604, 'samples': 905408, 'steps': 1768, 'loss/train': 2.139402151107788} -09/20/2021 20:36:57 - INFO - __main__ - Step 28295: {'lr': 0.00019978923416195604, 'samples': 905440, 'steps': 1768, 'loss/train': 2.455437421798706} -09/20/2021 20:36:58 - INFO - __main__ - Step 28296: {'lr': 0.00019978923416195604, 'samples': 905472, 'steps': 1768, 'loss/train': 2.5315682888031006} -09/20/2021 20:36:59 - INFO - __main__ - Step 28297: {'lr': 0.00019978923416195604, 'samples': 905504, 'steps': 1768, 'loss/train': 1.7075265645980835} -09/20/2021 20:37:00 - INFO - __main__ - Step 28298: {'lr': 0.00019978923416195604, 'samples': 905536, 'steps': 1768, 'loss/train': 6.4022626876831055} -09/20/2021 20:37:00 - INFO - __main__ - Step 28299: {'lr': 0.00019978923416195604, 'samples': 905568, 'steps': 1768, 'loss/train': 6.396364212036133} -09/20/2021 20:37:01 - INFO - __main__ - Step 28300: {'lr': 0.00019978923416195604, 'samples': 905600, 'steps': 1768, 'loss/train': 6.399734020233154} -09/20/2021 20:37:02 - INFO - __main__ - Step 28301: {'lr': 0.00019978923416195604, 'samples': 905632, 'steps': 1768, 'loss/train': 6.483792781829834} -09/20/2021 20:37:03 - INFO - __main__ - Step 28302: {'lr': 0.00019978923416195604, 'samples': 905664, 'steps': 1768, 'loss/train': 6.460859298706055} -09/20/2021 20:37:03 - INFO - __main__ - Step 28303: {'lr': 0.00019978923416195604, 'samples': 905696, 'steps': 1768, 'loss/train': 6.373241424560547} -09/20/2021 20:37:04 - INFO - __main__ - Step 28304: {'lr': 0.00019978923416195604, 'samples': 905728, 'steps': 1768, 'loss/train': 2.6894114017486572} -09/20/2021 20:37:05 - INFO - __main__ - Step 28305: {'lr': 0.00019978882002618533, 'samples': 905760, 'steps': 1769, 'loss/train': 3.004258155822754} -09/20/2021 20:37:07 - INFO - __main__ - Step 28306: {'lr': 0.00019978882002618533, 'samples': 905792, 'steps': 1769, 'loss/train': 2.7906296253204346} -09/20/2021 20:37:08 - INFO - __main__ - Step 28307: {'lr': 0.00019978882002618533, 'samples': 905824, 'steps': 1769, 'loss/train': 2.9658122062683105} -09/20/2021 20:37:08 - INFO - __main__ - Step 28308: {'lr': 0.00019978882002618533, 'samples': 905856, 'steps': 1769, 'loss/train': 2.5452396869659424} -09/20/2021 20:37:09 - INFO - __main__ - Step 28309: {'lr': 0.00019978882002618533, 'samples': 905888, 'steps': 1769, 'loss/train': 3.10207462310791} -09/20/2021 20:37:10 - INFO - __main__ - Step 28310: {'lr': 0.00019978882002618533, 'samples': 905920, 'steps': 1769, 'loss/train': 2.430584192276001} -09/20/2021 20:37:11 - INFO - __main__ - Step 28311: {'lr': 0.00019978882002618533, 'samples': 905952, 'steps': 1769, 'loss/train': 2.7782528400421143} -09/20/2021 20:37:11 - INFO - __main__ - Step 28312: {'lr': 0.00019978882002618533, 'samples': 905984, 'steps': 1769, 'loss/train': 2.385645627975464} -09/20/2021 20:37:12 - INFO - __main__ - Step 28313: {'lr': 0.00019978882002618533, 'samples': 906016, 'steps': 1769, 'loss/train': 5.430466175079346} -09/20/2021 20:37:13 - INFO - __main__ - Step 28314: {'lr': 0.00019978882002618533, 'samples': 906048, 'steps': 1769, 'loss/train': 2.892117738723755} -09/20/2021 20:37:14 - INFO - __main__ - Step 28315: {'lr': 0.00019978882002618533, 'samples': 906080, 'steps': 1769, 'loss/train': 2.739129066467285} -09/20/2021 20:37:14 - INFO - __main__ - Step 28316: {'lr': 0.00019978882002618533, 'samples': 906112, 'steps': 1769, 'loss/train': 1.9744879007339478} -09/20/2021 20:37:15 - INFO - __main__ - Step 28317: {'lr': 0.00019978882002618533, 'samples': 906144, 'steps': 1769, 'loss/train': 2.8447933197021484} -09/20/2021 20:37:16 - INFO - __main__ - Step 28318: {'lr': 0.00019978882002618533, 'samples': 906176, 'steps': 1769, 'loss/train': 2.9366064071655273} -09/20/2021 20:37:17 - INFO - __main__ - Step 28319: {'lr': 0.00019978882002618533, 'samples': 906208, 'steps': 1769, 'loss/train': 2.2532782554626465} -09/20/2021 20:37:17 - INFO - __main__ - Step 28320: {'lr': 0.00019978882002618533, 'samples': 906240, 'steps': 1769, 'loss/train': 2.837160110473633} -09/20/2021 20:37:18 - INFO - __main__ - Step 28321: {'lr': 0.00019978840548437427, 'samples': 906272, 'steps': 1770, 'loss/train': 2.2979483604431152} -09/20/2021 20:37:19 - INFO - __main__ - Step 28322: {'lr': 0.00019978840548437427, 'samples': 906304, 'steps': 1770, 'loss/train': 2.247183084487915} -09/20/2021 20:37:20 - INFO - __main__ - Step 28323: {'lr': 0.00019978840548437427, 'samples': 906336, 'steps': 1770, 'loss/train': 0.6994745135307312} -09/20/2021 20:37:20 - INFO - __main__ - Step 28324: {'lr': 0.00019978840548437427, 'samples': 906368, 'steps': 1770, 'loss/train': 0.3871310353279114} -09/20/2021 20:37:21 - INFO - __main__ - Step 28325: {'lr': 0.00019978840548437427, 'samples': 906400, 'steps': 1770, 'loss/train': 0.9912471175193787} -09/20/2021 20:37:22 - INFO - __main__ - Step 28326: {'lr': 0.00019978840548437427, 'samples': 906432, 'steps': 1770, 'loss/train': 2.3857083320617676} -09/20/2021 20:37:23 - INFO - __main__ - Step 28327: {'lr': 0.00019978840548437427, 'samples': 906464, 'steps': 1770, 'loss/train': 3.418423891067505} -09/20/2021 20:37:23 - INFO - __main__ - Step 28328: {'lr': 0.00019978840548437427, 'samples': 906496, 'steps': 1770, 'loss/train': 2.2577805519104004} -09/20/2021 20:37:24 - INFO - __main__ - Step 28329: {'lr': 0.00019978840548437427, 'samples': 906528, 'steps': 1770, 'loss/train': 2.5424933433532715} -09/20/2021 20:37:25 - INFO - __main__ - Step 28330: {'lr': 0.00019978840548437427, 'samples': 906560, 'steps': 1770, 'loss/train': 2.7582743167877197} -09/20/2021 20:37:26 - INFO - __main__ - Step 28331: {'lr': 0.00019978840548437427, 'samples': 906592, 'steps': 1770, 'loss/train': 3.6591320037841797} -09/20/2021 20:37:26 - INFO - __main__ - Step 28332: {'lr': 0.00019978840548437427, 'samples': 906624, 'steps': 1770, 'loss/train': 2.128662347793579} -09/20/2021 20:37:27 - INFO - __main__ - Step 28333: {'lr': 0.00019978840548437427, 'samples': 906656, 'steps': 1770, 'loss/train': 2.830766439437866} -09/20/2021 20:37:28 - INFO - __main__ - Step 28334: {'lr': 0.00019978840548437427, 'samples': 906688, 'steps': 1770, 'loss/train': 2.0165274143218994} -09/20/2021 20:37:29 - INFO - __main__ - Step 28335: {'lr': 0.00019978840548437427, 'samples': 906720, 'steps': 1770, 'loss/train': 2.360882043838501} -09/20/2021 20:37:29 - INFO - __main__ - Step 28336: {'lr': 0.00019978840548437427, 'samples': 906752, 'steps': 1770, 'loss/train': 2.3086483478546143} -09/20/2021 20:37:31 - INFO - __main__ - Step 28337: {'lr': 0.0001997879905365246, 'samples': 906784, 'steps': 1771, 'loss/train': 3.337717056274414} -09/20/2021 20:37:32 - INFO - __main__ - Step 28338: {'lr': 0.0001997879905365246, 'samples': 906816, 'steps': 1771, 'loss/train': 2.587951421737671} -09/20/2021 20:37:32 - INFO - __main__ - Step 28339: {'lr': 0.0001997879905365246, 'samples': 906848, 'steps': 1771, 'loss/train': 2.8037402629852295} -09/20/2021 20:37:33 - INFO - __main__ - Step 28340: {'lr': 0.0001997879905365246, 'samples': 906880, 'steps': 1771, 'loss/train': 2.7023327350616455} -09/20/2021 20:37:34 - INFO - __main__ - Step 28341: {'lr': 0.0001997879905365246, 'samples': 906912, 'steps': 1771, 'loss/train': 2.349876880645752} -09/20/2021 20:37:35 - INFO - __main__ - Step 28342: {'lr': 0.0001997879905365246, 'samples': 906944, 'steps': 1771, 'loss/train': 0.7008247375488281} -09/20/2021 20:37:35 - INFO - __main__ - Step 28343: {'lr': 0.0001997879905365246, 'samples': 906976, 'steps': 1771, 'loss/train': 2.4505038261413574} -09/20/2021 20:37:36 - INFO - __main__ - Step 28344: {'lr': 0.0001997879905365246, 'samples': 907008, 'steps': 1771, 'loss/train': 2.9076244831085205} -09/20/2021 20:37:37 - INFO - __main__ - Step 28345: {'lr': 0.0001997879905365246, 'samples': 907040, 'steps': 1771, 'loss/train': 1.6787304878234863} -09/20/2021 20:37:38 - INFO - __main__ - Step 28346: {'lr': 0.0001997879905365246, 'samples': 907072, 'steps': 1771, 'loss/train': 2.2596566677093506} -09/20/2021 20:37:38 - INFO - __main__ - Step 28347: {'lr': 0.0001997879905365246, 'samples': 907104, 'steps': 1771, 'loss/train': 2.991365671157837} -09/20/2021 20:37:39 - INFO - __main__ - Step 28348: {'lr': 0.0001997879905365246, 'samples': 907136, 'steps': 1771, 'loss/train': 2.7205209732055664} -09/20/2021 20:37:40 - INFO - __main__ - Step 28349: {'lr': 0.0001997879905365246, 'samples': 907168, 'steps': 1771, 'loss/train': 3.4584550857543945} -09/20/2021 20:37:41 - INFO - __main__ - Step 28350: {'lr': 0.0001997879905365246, 'samples': 907200, 'steps': 1771, 'loss/train': 2.1003365516662598} -09/20/2021 20:37:41 - INFO - __main__ - Step 28351: {'lr': 0.0001997879905365246, 'samples': 907232, 'steps': 1771, 'loss/train': 3.3217110633850098} -09/20/2021 20:37:42 - INFO - __main__ - Step 28352: {'lr': 0.0001997879905365246, 'samples': 907264, 'steps': 1771, 'loss/train': 1.800117015838623} -09/20/2021 20:37:43 - INFO - __main__ - Step 28353: {'lr': 0.00019978757518263794, 'samples': 907296, 'steps': 1772, 'loss/train': 1.60886812210083} -09/20/2021 20:37:44 - INFO - __main__ - Step 28354: {'lr': 0.00019978757518263794, 'samples': 907328, 'steps': 1772, 'loss/train': 2.8094098567962646} -09/20/2021 20:37:45 - INFO - __main__ - Step 28355: {'lr': 0.00019978757518263794, 'samples': 907360, 'steps': 1772, 'loss/train': 1.7466435432434082} -09/20/2021 20:37:45 - INFO - __main__ - Step 28356: {'lr': 0.00019978757518263794, 'samples': 907392, 'steps': 1772, 'loss/train': 2.3972880840301514} -09/20/2021 20:37:46 - INFO - __main__ - Step 28357: {'lr': 0.00019978757518263794, 'samples': 907424, 'steps': 1772, 'loss/train': 2.306229591369629} -09/20/2021 20:37:47 - INFO - __main__ - Step 28358: {'lr': 0.00019978757518263794, 'samples': 907456, 'steps': 1772, 'loss/train': 2.663254976272583} -09/20/2021 20:37:48 - INFO - __main__ - Step 28359: {'lr': 0.00019978757518263794, 'samples': 907488, 'steps': 1772, 'loss/train': 0.9708133339881897} -09/20/2021 20:37:48 - INFO - __main__ - Step 28360: {'lr': 0.00019978757518263794, 'samples': 907520, 'steps': 1772, 'loss/train': 3.00893497467041} -09/20/2021 20:37:49 - INFO - __main__ - Step 28361: {'lr': 0.00019978757518263794, 'samples': 907552, 'steps': 1772, 'loss/train': 3.203914165496826} -09/20/2021 20:37:50 - INFO - __main__ - Step 28362: {'lr': 0.00019978757518263794, 'samples': 907584, 'steps': 1772, 'loss/train': 1.857620358467102} -09/20/2021 20:37:51 - INFO - __main__ - Step 28363: {'lr': 0.00019978757518263794, 'samples': 907616, 'steps': 1772, 'loss/train': 1.9373464584350586} -09/20/2021 20:37:51 - INFO - __main__ - Step 28364: {'lr': 0.00019978757518263794, 'samples': 907648, 'steps': 1772, 'loss/train': 2.3578758239746094} -09/20/2021 20:37:52 - INFO - __main__ - Step 28365: {'lr': 0.00019978757518263794, 'samples': 907680, 'steps': 1772, 'loss/train': 3.8264060020446777} -09/20/2021 20:37:53 - INFO - __main__ - Step 28366: {'lr': 0.00019978757518263794, 'samples': 907712, 'steps': 1772, 'loss/train': 1.9780848026275635} -09/20/2021 20:37:54 - INFO - __main__ - Step 28367: {'lr': 0.00019978757518263794, 'samples': 907744, 'steps': 1772, 'loss/train': 3.133559465408325} -09/20/2021 20:37:55 - INFO - __main__ - Step 28368: {'lr': 0.00019978757518263794, 'samples': 907776, 'steps': 1772, 'loss/train': 2.2657768726348877} -09/20/2021 20:37:56 - INFO - __main__ - Step 28369: {'lr': 0.0001997871594227161, 'samples': 907808, 'steps': 1773, 'loss/train': 1.7223128080368042} -09/20/2021 20:37:57 - INFO - __main__ - Step 28370: {'lr': 0.0001997871594227161, 'samples': 907840, 'steps': 1773, 'loss/train': 2.4007787704467773} -09/20/2021 20:37:58 - INFO - __main__ - Step 28371: {'lr': 0.0001997871594227161, 'samples': 907872, 'steps': 1773, 'loss/train': 2.392078399658203} -09/20/2021 20:37:58 - INFO - __main__ - Step 28372: {'lr': 0.0001997871594227161, 'samples': 907904, 'steps': 1773, 'loss/train': 3.3231234550476074} -09/20/2021 20:37:59 - INFO - __main__ - Step 28373: {'lr': 0.0001997871594227161, 'samples': 907936, 'steps': 1773, 'loss/train': 3.0570027828216553} -09/20/2021 20:38:00 - INFO - __main__ - Step 28374: {'lr': 0.0001997871594227161, 'samples': 907968, 'steps': 1773, 'loss/train': 2.7886505126953125} -09/20/2021 20:38:01 - INFO - __main__ - Step 28375: {'lr': 0.0001997871594227161, 'samples': 908000, 'steps': 1773, 'loss/train': 3.0497426986694336} -09/20/2021 20:38:01 - INFO - __main__ - Step 28376: {'lr': 0.0001997871594227161, 'samples': 908032, 'steps': 1773, 'loss/train': 3.2698237895965576} -09/20/2021 20:38:02 - INFO - __main__ - Step 28377: {'lr': 0.0001997871594227161, 'samples': 908064, 'steps': 1773, 'loss/train': 3.200284004211426} -09/20/2021 20:38:03 - INFO - __main__ - Step 28378: {'lr': 0.0001997871594227161, 'samples': 908096, 'steps': 1773, 'loss/train': 2.9423768520355225} -09/20/2021 20:38:04 - INFO - __main__ - Step 28379: {'lr': 0.0001997871594227161, 'samples': 908128, 'steps': 1773, 'loss/train': 1.6462337970733643} -09/20/2021 20:38:04 - INFO - __main__ - Step 28380: {'lr': 0.0001997871594227161, 'samples': 908160, 'steps': 1773, 'loss/train': 3.225259304046631} -09/20/2021 20:38:05 - INFO - __main__ - Step 28381: {'lr': 0.0001997871594227161, 'samples': 908192, 'steps': 1773, 'loss/train': 2.7226195335388184} -09/20/2021 20:38:06 - INFO - __main__ - Step 28382: {'lr': 0.0001997871594227161, 'samples': 908224, 'steps': 1773, 'loss/train': 3.1801249980926514} -09/20/2021 20:38:07 - INFO - __main__ - Step 28383: {'lr': 0.0001997871594227161, 'samples': 908256, 'steps': 1773, 'loss/train': 2.3570239543914795} -09/20/2021 20:38:07 - INFO - __main__ - Step 28384: {'lr': 0.0001997871594227161, 'samples': 908288, 'steps': 1773, 'loss/train': 0.6695912480354309} -09/20/2021 20:38:08 - INFO - __main__ - Step 28385: {'lr': 0.00019978674325676064, 'samples': 908320, 'steps': 1774, 'loss/train': 0.38568949699401855} -09/20/2021 20:38:09 - INFO - __main__ - Step 28386: {'lr': 0.00019978674325676064, 'samples': 908352, 'steps': 1774, 'loss/train': 0.38724812865257263} -09/20/2021 20:38:10 - INFO - __main__ - Step 28387: {'lr': 0.00019978674325676064, 'samples': 908384, 'steps': 1774, 'loss/train': 0.6511082053184509} -09/20/2021 20:38:10 - INFO - __main__ - Step 28388: {'lr': 0.00019978674325676064, 'samples': 908416, 'steps': 1774, 'loss/train': 0.5317159295082092} -09/20/2021 20:38:11 - INFO - __main__ - Step 28389: {'lr': 0.00019978674325676064, 'samples': 908448, 'steps': 1774, 'loss/train': 0.3661177456378937} -09/20/2021 20:38:12 - INFO - __main__ - Step 28390: {'lr': 0.00019978674325676064, 'samples': 908480, 'steps': 1774, 'loss/train': 2.463141679763794} -09/20/2021 20:38:13 - INFO - __main__ - Step 28391: {'lr': 0.00019978674325676064, 'samples': 908512, 'steps': 1774, 'loss/train': 3.1057260036468506} -09/20/2021 20:38:13 - INFO - __main__ - Step 28392: {'lr': 0.00019978674325676064, 'samples': 908544, 'steps': 1774, 'loss/train': 2.7118453979492188} -09/20/2021 20:38:14 - INFO - __main__ - Step 28393: {'lr': 0.00019978674325676064, 'samples': 908576, 'steps': 1774, 'loss/train': 2.537097454071045} -09/20/2021 20:38:15 - INFO - __main__ - Step 28394: {'lr': 0.00019978674325676064, 'samples': 908608, 'steps': 1774, 'loss/train': 3.4307773113250732} -09/20/2021 20:38:16 - INFO - __main__ - Step 28395: {'lr': 0.00019978674325676064, 'samples': 908640, 'steps': 1774, 'loss/train': 2.266470432281494} -09/20/2021 20:38:16 - INFO - __main__ - Step 28396: {'lr': 0.00019978674325676064, 'samples': 908672, 'steps': 1774, 'loss/train': 3.434494733810425} -09/20/2021 20:38:17 - INFO - __main__ - Step 28397: {'lr': 0.00019978674325676064, 'samples': 908704, 'steps': 1774, 'loss/train': 2.9977378845214844} -09/20/2021 20:38:18 - INFO - __main__ - Step 28398: {'lr': 0.00019978674325676064, 'samples': 908736, 'steps': 1774, 'loss/train': 2.5227437019348145} -09/20/2021 20:38:19 - INFO - __main__ - Step 28399: {'lr': 0.00019978674325676064, 'samples': 908768, 'steps': 1774, 'loss/train': 3.2351677417755127} -09/20/2021 20:38:20 - INFO - __main__ - Step 28400: {'lr': 0.00019978674325676064, 'samples': 908800, 'steps': 1774, 'loss/train': 3.127466917037964} -09/20/2021 20:38:21 - INFO - __main__ - Step 28401: {'lr': 0.0001997863266847733, 'samples': 908832, 'steps': 1775, 'loss/train': 3.4580163955688477} -09/20/2021 20:38:22 - INFO - __main__ - Step 28402: {'lr': 0.0001997863266847733, 'samples': 908864, 'steps': 1775, 'loss/train': 2.156916379928589} -09/20/2021 20:38:22 - INFO - __main__ - Step 28403: {'lr': 0.0001997863266847733, 'samples': 908896, 'steps': 1775, 'loss/train': 2.3001208305358887} -09/20/2021 20:38:23 - INFO - __main__ - Step 28404: {'lr': 0.0001997863266847733, 'samples': 908928, 'steps': 1775, 'loss/train': 2.5853404998779297} -09/20/2021 20:38:24 - INFO - __main__ - Step 28405: {'lr': 0.0001997863266847733, 'samples': 908960, 'steps': 1775, 'loss/train': 2.5707788467407227} -09/20/2021 20:38:25 - INFO - __main__ - Step 28406: {'lr': 0.0001997863266847733, 'samples': 908992, 'steps': 1775, 'loss/train': 2.510624647140503} -09/20/2021 20:38:25 - INFO - __main__ - Step 28407: {'lr': 0.0001997863266847733, 'samples': 909024, 'steps': 1775, 'loss/train': 3.020961284637451} -09/20/2021 20:38:26 - INFO - __main__ - Step 28408: {'lr': 0.0001997863266847733, 'samples': 909056, 'steps': 1775, 'loss/train': 2.2937171459198} -09/20/2021 20:38:27 - INFO - __main__ - Step 28409: {'lr': 0.0001997863266847733, 'samples': 909088, 'steps': 1775, 'loss/train': 2.3618321418762207} -09/20/2021 20:38:28 - INFO - __main__ - Step 28410: {'lr': 0.0001997863266847733, 'samples': 909120, 'steps': 1775, 'loss/train': 2.27347469329834} -09/20/2021 20:38:28 - INFO - __main__ - Step 28411: {'lr': 0.0001997863266847733, 'samples': 909152, 'steps': 1775, 'loss/train': 2.5246663093566895} -09/20/2021 20:38:29 - INFO - __main__ - Step 28412: {'lr': 0.0001997863266847733, 'samples': 909184, 'steps': 1775, 'loss/train': 1.9114488363265991} -09/20/2021 20:38:30 - INFO - __main__ - Step 28413: {'lr': 0.0001997863266847733, 'samples': 909216, 'steps': 1775, 'loss/train': 2.9510116577148438} -09/20/2021 20:38:31 - INFO - __main__ - Step 28414: {'lr': 0.0001997863266847733, 'samples': 909248, 'steps': 1775, 'loss/train': 2.0989983081817627} -09/20/2021 20:38:31 - INFO - __main__ - Step 28415: {'lr': 0.0001997863266847733, 'samples': 909280, 'steps': 1775, 'loss/train': 2.808621644973755} -09/20/2021 20:38:32 - INFO - __main__ - Step 28416: {'lr': 0.0001997863266847733, 'samples': 909312, 'steps': 1775, 'loss/train': 2.8204500675201416} -09/20/2021 20:38:33 - INFO - __main__ - Step 28417: {'lr': 0.00019978590970675582, 'samples': 909344, 'steps': 1776, 'loss/train': 2.94442081451416} -09/20/2021 20:38:34 - INFO - __main__ - Step 28418: {'lr': 0.00019978590970675582, 'samples': 909376, 'steps': 1776, 'loss/train': 2.489363670349121} -09/20/2021 20:38:34 - INFO - __main__ - Step 28419: {'lr': 0.00019978590970675582, 'samples': 909408, 'steps': 1776, 'loss/train': 3.330028533935547} -09/20/2021 20:38:35 - INFO - __main__ - Step 28420: {'lr': 0.00019978590970675582, 'samples': 909440, 'steps': 1776, 'loss/train': 2.6147775650024414} -09/20/2021 20:38:36 - INFO - __main__ - Step 28421: {'lr': 0.00019978590970675582, 'samples': 909472, 'steps': 1776, 'loss/train': 1.309133768081665} -09/20/2021 20:38:37 - INFO - __main__ - Step 28422: {'lr': 0.00019978590970675582, 'samples': 909504, 'steps': 1776, 'loss/train': 2.2782928943634033} -09/20/2021 20:38:37 - INFO - __main__ - Step 28423: {'lr': 0.00019978590970675582, 'samples': 909536, 'steps': 1776, 'loss/train': 2.2704110145568848} -09/20/2021 20:38:38 - INFO - __main__ - Step 28424: {'lr': 0.00019978590970675582, 'samples': 909568, 'steps': 1776, 'loss/train': 2.8990418910980225} -09/20/2021 20:38:39 - INFO - __main__ - Step 28425: {'lr': 0.00019978590970675582, 'samples': 909600, 'steps': 1776, 'loss/train': 2.6090869903564453} -09/20/2021 20:38:40 - INFO - __main__ - Step 28426: {'lr': 0.00019978590970675582, 'samples': 909632, 'steps': 1776, 'loss/train': 1.6463110446929932} -09/20/2021 20:38:40 - INFO - __main__ - Step 28427: {'lr': 0.00019978590970675582, 'samples': 909664, 'steps': 1776, 'loss/train': 1.8386310338974} -09/20/2021 20:38:41 - INFO - __main__ - Step 28428: {'lr': 0.00019978590970675582, 'samples': 909696, 'steps': 1776, 'loss/train': 2.6751065254211426} -09/20/2021 20:38:42 - INFO - __main__ - Step 28429: {'lr': 0.00019978590970675582, 'samples': 909728, 'steps': 1776, 'loss/train': 2.926044225692749} -09/20/2021 20:38:43 - INFO - __main__ - Step 28430: {'lr': 0.00019978590970675582, 'samples': 909760, 'steps': 1776, 'loss/train': 2.367914915084839} -09/20/2021 20:38:44 - INFO - __main__ - Step 28431: {'lr': 0.00019978590970675582, 'samples': 909792, 'steps': 1776, 'loss/train': 0.7200709581375122} -09/20/2021 20:38:45 - INFO - __main__ - Step 28432: {'lr': 0.00019978590970675582, 'samples': 909824, 'steps': 1776, 'loss/train': 1.9824882745742798} -09/20/2021 20:38:46 - INFO - __main__ - Step 28433: {'lr': 0.00019978549232270985, 'samples': 909856, 'steps': 1777, 'loss/train': 2.0762691497802734} -09/20/2021 20:38:46 - INFO - __main__ - Step 28434: {'lr': 0.00019978549232270985, 'samples': 909888, 'steps': 1777, 'loss/train': 2.6234138011932373} -09/20/2021 20:38:47 - INFO - __main__ - Step 28435: {'lr': 0.00019978549232270985, 'samples': 909920, 'steps': 1777, 'loss/train': 2.6522176265716553} -09/20/2021 20:38:48 - INFO - __main__ - Step 28436: {'lr': 0.00019978549232270985, 'samples': 909952, 'steps': 1777, 'loss/train': 2.0929274559020996} -09/20/2021 20:38:49 - INFO - __main__ - Step 28437: {'lr': 0.00019978549232270985, 'samples': 909984, 'steps': 1777, 'loss/train': 2.141685962677002} -09/20/2021 20:38:49 - INFO - __main__ - Step 28438: {'lr': 0.00019978549232270985, 'samples': 910016, 'steps': 1777, 'loss/train': 2.6091878414154053} -09/20/2021 20:38:50 - INFO - __main__ - Step 28439: {'lr': 0.00019978549232270985, 'samples': 910048, 'steps': 1777, 'loss/train': 3.232046604156494} -09/20/2021 20:38:51 - INFO - __main__ - Step 28440: {'lr': 0.00019978549232270985, 'samples': 910080, 'steps': 1777, 'loss/train': 2.6853020191192627} -09/20/2021 20:38:52 - INFO - __main__ - Step 28441: {'lr': 0.00019978549232270985, 'samples': 910112, 'steps': 1777, 'loss/train': 2.178529739379883} -09/20/2021 20:38:52 - INFO - __main__ - Step 28442: {'lr': 0.00019978549232270985, 'samples': 910144, 'steps': 1777, 'loss/train': 2.8326451778411865} -09/20/2021 20:38:53 - INFO - __main__ - Step 28443: {'lr': 0.00019978549232270985, 'samples': 910176, 'steps': 1777, 'loss/train': 2.3918581008911133} -09/20/2021 20:38:54 - INFO - __main__ - Step 28444: {'lr': 0.00019978549232270985, 'samples': 910208, 'steps': 1777, 'loss/train': 3.2718849182128906} -09/20/2021 20:38:55 - INFO - __main__ - Step 28445: {'lr': 0.00019978549232270985, 'samples': 910240, 'steps': 1777, 'loss/train': 3.035372734069824} -09/20/2021 20:38:55 - INFO - __main__ - Step 28446: {'lr': 0.00019978549232270985, 'samples': 910272, 'steps': 1777, 'loss/train': 3.6519722938537598} -09/20/2021 20:38:56 - INFO - __main__ - Step 28447: {'lr': 0.00019978549232270985, 'samples': 910304, 'steps': 1777, 'loss/train': 2.2249233722686768} -09/20/2021 20:38:57 - INFO - __main__ - Step 28448: {'lr': 0.00019978549232270985, 'samples': 910336, 'steps': 1777, 'loss/train': 2.02944016456604} -09/20/2021 20:38:58 - INFO - __main__ - Step 28449: {'lr': 0.00019978507453263707, 'samples': 910368, 'steps': 1778, 'loss/train': 2.413020133972168} -09/20/2021 20:38:58 - INFO - __main__ - Step 28450: {'lr': 0.00019978507453263707, 'samples': 910400, 'steps': 1778, 'loss/train': 2.496825695037842} -09/20/2021 20:38:59 - INFO - __main__ - Step 28451: {'lr': 0.00019978507453263707, 'samples': 910432, 'steps': 1778, 'loss/train': 1.9501153230667114} -09/20/2021 20:39:00 - INFO - __main__ - Step 28452: {'lr': 0.00019978507453263707, 'samples': 910464, 'steps': 1778, 'loss/train': 2.080437183380127} -09/20/2021 20:39:01 - INFO - __main__ - Step 28453: {'lr': 0.00019978507453263707, 'samples': 910496, 'steps': 1778, 'loss/train': 3.3378915786743164} -09/20/2021 20:39:01 - INFO - __main__ - Step 28454: {'lr': 0.00019978507453263707, 'samples': 910528, 'steps': 1778, 'loss/train': 1.54012131690979} -09/20/2021 20:39:02 - INFO - __main__ - Step 28455: {'lr': 0.00019978507453263707, 'samples': 910560, 'steps': 1778, 'loss/train': 3.0269315242767334} -09/20/2021 20:39:03 - INFO - __main__ - Step 28456: {'lr': 0.00019978507453263707, 'samples': 910592, 'steps': 1778, 'loss/train': 2.513538360595703} -09/20/2021 20:39:04 - INFO - __main__ - Step 28457: {'lr': 0.00019978507453263707, 'samples': 910624, 'steps': 1778, 'loss/train': 2.676740884780884} -09/20/2021 20:39:04 - INFO - __main__ - Step 28458: {'lr': 0.00019978507453263707, 'samples': 910656, 'steps': 1778, 'loss/train': 3.1714906692504883} -09/20/2021 20:39:05 - INFO - __main__ - Step 28459: {'lr': 0.00019978507453263707, 'samples': 910688, 'steps': 1778, 'loss/train': 2.8217644691467285} -09/20/2021 20:39:06 - INFO - __main__ - Step 28460: {'lr': 0.00019978507453263707, 'samples': 910720, 'steps': 1778, 'loss/train': 3.7178568840026855} -09/20/2021 20:39:07 - INFO - __main__ - Step 28461: {'lr': 0.00019978507453263707, 'samples': 910752, 'steps': 1778, 'loss/train': 3.2069144248962402} -09/20/2021 20:39:08 - INFO - __main__ - Step 28462: {'lr': 0.00019978507453263707, 'samples': 910784, 'steps': 1778, 'loss/train': 2.9458906650543213} -09/20/2021 20:39:09 - INFO - __main__ - Step 28463: {'lr': 0.00019978507453263707, 'samples': 910816, 'steps': 1778, 'loss/train': 0.4932063817977905} -09/20/2021 20:39:09 - INFO - __main__ - Step 28464: {'lr': 0.00019978507453263707, 'samples': 910848, 'steps': 1778, 'loss/train': 2.9866580963134766} -09/20/2021 20:39:10 - INFO - __main__ - Step 28465: {'lr': 0.00019978465633653923, 'samples': 910880, 'steps': 1779, 'loss/train': 2.429462194442749} -09/20/2021 20:39:11 - INFO - __main__ - Step 28466: {'lr': 0.00019978465633653923, 'samples': 910912, 'steps': 1779, 'loss/train': 2.449634552001953} -09/20/2021 20:39:12 - INFO - __main__ - Step 28467: {'lr': 0.00019978465633653923, 'samples': 910944, 'steps': 1779, 'loss/train': 0.45011746883392334} -09/20/2021 20:39:13 - INFO - __main__ - Step 28468: {'lr': 0.00019978465633653923, 'samples': 910976, 'steps': 1779, 'loss/train': 2.688293218612671} -09/20/2021 20:39:13 - INFO - __main__ - Step 28469: {'lr': 0.00019978465633653923, 'samples': 911008, 'steps': 1779, 'loss/train': 2.2997093200683594} -09/20/2021 20:39:14 - INFO - __main__ - Step 28470: {'lr': 0.00019978465633653923, 'samples': 911040, 'steps': 1779, 'loss/train': 2.911067247390747} -09/20/2021 20:39:15 - INFO - __main__ - Step 28471: {'lr': 0.00019978465633653923, 'samples': 911072, 'steps': 1779, 'loss/train': 2.5873565673828125} -09/20/2021 20:39:16 - INFO - __main__ - Step 28472: {'lr': 0.00019978465633653923, 'samples': 911104, 'steps': 1779, 'loss/train': 1.6480772495269775} -09/20/2021 20:39:16 - INFO - __main__ - Step 28473: {'lr': 0.00019978465633653923, 'samples': 911136, 'steps': 1779, 'loss/train': 3.2723028659820557} -09/20/2021 20:39:17 - INFO - __main__ - Step 28474: {'lr': 0.00019978465633653923, 'samples': 911168, 'steps': 1779, 'loss/train': 1.0038989782333374} -09/20/2021 20:39:18 - INFO - __main__ - Step 28475: {'lr': 0.00019978465633653923, 'samples': 911200, 'steps': 1779, 'loss/train': 2.091477394104004} -09/20/2021 20:39:19 - INFO - __main__ - Step 28476: {'lr': 0.00019978465633653923, 'samples': 911232, 'steps': 1779, 'loss/train': 2.4434144496917725} -09/20/2021 20:39:19 - INFO - __main__ - Step 28477: {'lr': 0.00019978465633653923, 'samples': 911264, 'steps': 1779, 'loss/train': 0.9082856774330139} -09/20/2021 20:39:20 - INFO - __main__ - Step 28478: {'lr': 0.00019978465633653923, 'samples': 911296, 'steps': 1779, 'loss/train': 0.5984295010566711} -09/20/2021 20:39:21 - INFO - __main__ - Step 28479: {'lr': 0.00019978465633653923, 'samples': 911328, 'steps': 1779, 'loss/train': 2.0949487686157227} -09/20/2021 20:39:22 - INFO - __main__ - Step 28480: {'lr': 0.00019978465633653923, 'samples': 911360, 'steps': 1779, 'loss/train': 1.9001367092132568} -09/20/2021 20:39:23 - INFO - __main__ - Step 28481: {'lr': 0.00019978423773441803, 'samples': 911392, 'steps': 1780, 'loss/train': 0.5796273350715637} -09/20/2021 20:39:23 - INFO - __main__ - Step 28482: {'lr': 0.00019978423773441803, 'samples': 911424, 'steps': 1780, 'loss/train': 1.8142411708831787} -09/20/2021 20:39:24 - INFO - __main__ - Step 28483: {'lr': 0.00019978423773441803, 'samples': 911456, 'steps': 1780, 'loss/train': 0.6119629740715027} -09/20/2021 20:39:25 - INFO - __main__ - Step 28484: {'lr': 0.00019978423773441803, 'samples': 911488, 'steps': 1780, 'loss/train': 2.0591881275177} -09/20/2021 20:39:26 - INFO - __main__ - Step 28485: {'lr': 0.00019978423773441803, 'samples': 911520, 'steps': 1780, 'loss/train': 2.747934579849243} -09/20/2021 20:39:26 - INFO - __main__ - Step 28486: {'lr': 0.00019978423773441803, 'samples': 911552, 'steps': 1780, 'loss/train': 3.7708921432495117} -09/20/2021 20:39:27 - INFO - __main__ - Step 28487: {'lr': 0.00019978423773441803, 'samples': 911584, 'steps': 1780, 'loss/train': 2.0843966007232666} -09/20/2021 20:39:28 - INFO - __main__ - Step 28488: {'lr': 0.00019978423773441803, 'samples': 911616, 'steps': 1780, 'loss/train': 2.3641467094421387} -09/20/2021 20:39:29 - INFO - __main__ - Step 28489: {'lr': 0.00019978423773441803, 'samples': 911648, 'steps': 1780, 'loss/train': 2.2958226203918457} -09/20/2021 20:39:29 - INFO - __main__ - Step 28490: {'lr': 0.00019978423773441803, 'samples': 911680, 'steps': 1780, 'loss/train': 2.873983860015869} -09/20/2021 20:39:30 - INFO - __main__ - Step 28491: {'lr': 0.00019978423773441803, 'samples': 911712, 'steps': 1780, 'loss/train': 2.526397466659546} -09/20/2021 20:39:31 - INFO - __main__ - Step 28492: {'lr': 0.00019978423773441803, 'samples': 911744, 'steps': 1780, 'loss/train': 2.097538948059082} -09/20/2021 20:39:32 - INFO - __main__ - Step 28493: {'lr': 0.00019978423773441803, 'samples': 911776, 'steps': 1780, 'loss/train': 2.6699624061584473} -09/20/2021 20:39:33 - INFO - __main__ - Step 28494: {'lr': 0.00019978423773441803, 'samples': 911808, 'steps': 1780, 'loss/train': 1.2649967670440674} -09/20/2021 20:39:34 - INFO - __main__ - Step 28495: {'lr': 0.00019978423773441803, 'samples': 911840, 'steps': 1780, 'loss/train': 2.034303665161133} -09/20/2021 20:39:34 - INFO - __main__ - Step 28496: {'lr': 0.00019978423773441803, 'samples': 911872, 'steps': 1780, 'loss/train': 1.3830657005310059} -09/20/2021 20:39:35 - INFO - __main__ - Step 28497: {'lr': 0.00019978381872627515, 'samples': 911904, 'steps': 1781, 'loss/train': 3.0171892642974854} -09/20/2021 20:39:36 - INFO - __main__ - Step 28498: {'lr': 0.00019978381872627515, 'samples': 911936, 'steps': 1781, 'loss/train': 2.8891477584838867} -09/20/2021 20:39:37 - INFO - __main__ - Step 28499: {'lr': 0.00019978381872627515, 'samples': 911968, 'steps': 1781, 'loss/train': 1.551985740661621} -09/20/2021 20:39:38 - INFO - __main__ - Step 28500: {'lr': 0.00019978381872627515, 'samples': 912000, 'steps': 1781, 'loss/train': 1.805639386177063} -09/20/2021 20:39:38 - INFO - __main__ - Step 28501: {'lr': 0.00019978381872627515, 'samples': 912032, 'steps': 1781, 'loss/train': 1.872816562652588} -09/20/2021 20:39:39 - INFO - __main__ - Step 28502: {'lr': 0.00019978381872627515, 'samples': 912064, 'steps': 1781, 'loss/train': 1.7262603044509888} -09/20/2021 20:39:40 - INFO - __main__ - Step 28503: {'lr': 0.00019978381872627515, 'samples': 912096, 'steps': 1781, 'loss/train': 1.8592106103897095} -09/20/2021 20:39:41 - INFO - __main__ - Step 28504: {'lr': 0.00019978381872627515, 'samples': 912128, 'steps': 1781, 'loss/train': 3.0269875526428223} -09/20/2021 20:39:41 - INFO - __main__ - Step 28505: {'lr': 0.00019978381872627515, 'samples': 912160, 'steps': 1781, 'loss/train': 2.475105047225952} -09/20/2021 20:39:42 - INFO - __main__ - Step 28506: {'lr': 0.00019978381872627515, 'samples': 912192, 'steps': 1781, 'loss/train': 2.961094379425049} -09/20/2021 20:39:43 - INFO - __main__ - Step 28507: {'lr': 0.00019978381872627515, 'samples': 912224, 'steps': 1781, 'loss/train': 2.2131290435791016} -09/20/2021 20:39:44 - INFO - __main__ - Step 28508: {'lr': 0.00019978381872627515, 'samples': 912256, 'steps': 1781, 'loss/train': 2.319488048553467} -09/20/2021 20:39:44 - INFO - __main__ - Step 28509: {'lr': 0.00019978381872627515, 'samples': 912288, 'steps': 1781, 'loss/train': 1.8564093112945557} -09/20/2021 20:39:45 - INFO - __main__ - Step 28510: {'lr': 0.00019978381872627515, 'samples': 912320, 'steps': 1781, 'loss/train': 2.0463037490844727} -09/20/2021 20:39:46 - INFO - __main__ - Step 28511: {'lr': 0.00019978381872627515, 'samples': 912352, 'steps': 1781, 'loss/train': 2.8092362880706787} -09/20/2021 20:39:47 - INFO - __main__ - Step 28512: {'lr': 0.00019978381872627515, 'samples': 912384, 'steps': 1781, 'loss/train': 2.3838210105895996} -09/20/2021 20:39:47 - INFO - __main__ - Step 28513: {'lr': 0.00019978339931211227, 'samples': 912416, 'steps': 1782, 'loss/train': 2.7725677490234375} -09/20/2021 20:39:48 - INFO - __main__ - Step 28514: {'lr': 0.00019978339931211227, 'samples': 912448, 'steps': 1782, 'loss/train': 3.704435110092163} -09/20/2021 20:39:49 - INFO - __main__ - Step 28515: {'lr': 0.00019978339931211227, 'samples': 912480, 'steps': 1782, 'loss/train': 2.0918378829956055} -09/20/2021 20:39:50 - INFO - __main__ - Step 28516: {'lr': 0.00019978339931211227, 'samples': 912512, 'steps': 1782, 'loss/train': 2.806859254837036} -09/20/2021 20:39:50 - INFO - __main__ - Step 28517: {'lr': 0.00019978339931211227, 'samples': 912544, 'steps': 1782, 'loss/train': 3.497791290283203} -09/20/2021 20:39:51 - INFO - __main__ - Step 28518: {'lr': 0.00019978339931211227, 'samples': 912576, 'steps': 1782, 'loss/train': 1.3278008699417114} -09/20/2021 20:39:52 - INFO - __main__ - Step 28519: {'lr': 0.00019978339931211227, 'samples': 912608, 'steps': 1782, 'loss/train': 2.0374250411987305} -09/20/2021 20:39:53 - INFO - __main__ - Step 28520: {'lr': 0.00019978339931211227, 'samples': 912640, 'steps': 1782, 'loss/train': 0.4540654420852661} -09/20/2021 20:39:53 - INFO - __main__ - Step 28521: {'lr': 0.00019978339931211227, 'samples': 912672, 'steps': 1782, 'loss/train': 2.2492058277130127} -09/20/2021 20:39:54 - INFO - __main__ - Step 28522: {'lr': 0.00019978339931211227, 'samples': 912704, 'steps': 1782, 'loss/train': 1.934531807899475} -09/20/2021 20:39:55 - INFO - __main__ - Step 28523: {'lr': 0.00019978339931211227, 'samples': 912736, 'steps': 1782, 'loss/train': 1.4780173301696777} -09/20/2021 20:39:56 - INFO - __main__ - Step 28524: {'lr': 0.00019978339931211227, 'samples': 912768, 'steps': 1782, 'loss/train': 3.625054359436035} -09/20/2021 20:39:57 - INFO - __main__ - Step 28525: {'lr': 0.00019978339931211227, 'samples': 912800, 'steps': 1782, 'loss/train': 3.083350658416748} -09/20/2021 20:39:58 - INFO - __main__ - Step 28526: {'lr': 0.00019978339931211227, 'samples': 912832, 'steps': 1782, 'loss/train': 2.9294016361236572} -09/20/2021 20:39:58 - INFO - __main__ - Step 28527: {'lr': 0.00019978339931211227, 'samples': 912864, 'steps': 1782, 'loss/train': 3.3132970333099365} -09/20/2021 20:39:59 - INFO - __main__ - Step 28528: {'lr': 0.00019978339931211227, 'samples': 912896, 'steps': 1782, 'loss/train': 2.5201432704925537} -09/20/2021 20:40:00 - INFO - __main__ - Step 28529: {'lr': 0.00019978297949193113, 'samples': 912928, 'steps': 1783, 'loss/train': 2.939345359802246} -09/20/2021 20:40:01 - INFO - __main__ - Step 28530: {'lr': 0.00019978297949193113, 'samples': 912960, 'steps': 1783, 'loss/train': 2.1816065311431885} -09/20/2021 20:40:02 - INFO - __main__ - Step 28531: {'lr': 0.00019978297949193113, 'samples': 912992, 'steps': 1783, 'loss/train': 1.41914963722229} -09/20/2021 20:40:02 - INFO - __main__ - Step 28532: {'lr': 0.00019978297949193113, 'samples': 913024, 'steps': 1783, 'loss/train': 2.673027515411377} -09/20/2021 20:40:03 - INFO - __main__ - Step 28533: {'lr': 0.00019978297949193113, 'samples': 913056, 'steps': 1783, 'loss/train': 2.0896034240722656} -09/20/2021 20:40:04 - INFO - __main__ - Step 28534: {'lr': 0.00019978297949193113, 'samples': 913088, 'steps': 1783, 'loss/train': 2.7015299797058105} -09/20/2021 20:40:05 - INFO - __main__ - Step 28535: {'lr': 0.00019978297949193113, 'samples': 913120, 'steps': 1783, 'loss/train': 2.0026042461395264} -09/20/2021 20:40:05 - INFO - __main__ - Step 28536: {'lr': 0.00019978297949193113, 'samples': 913152, 'steps': 1783, 'loss/train': 3.322045087814331} -09/20/2021 20:40:06 - INFO - __main__ - Step 28537: {'lr': 0.00019978297949193113, 'samples': 913184, 'steps': 1783, 'loss/train': 0.8046040534973145} -09/20/2021 20:40:07 - INFO - __main__ - Step 28538: {'lr': 0.00019978297949193113, 'samples': 913216, 'steps': 1783, 'loss/train': 2.5126476287841797} -09/20/2021 20:40:08 - INFO - __main__ - Step 28539: {'lr': 0.00019978297949193113, 'samples': 913248, 'steps': 1783, 'loss/train': 2.770256757736206} -09/20/2021 20:40:08 - INFO - __main__ - Step 28540: {'lr': 0.00019978297949193113, 'samples': 913280, 'steps': 1783, 'loss/train': 2.6771323680877686} -09/20/2021 20:40:09 - INFO - __main__ - Step 28541: {'lr': 0.00019978297949193113, 'samples': 913312, 'steps': 1783, 'loss/train': 2.447845220565796} -09/20/2021 20:40:10 - INFO - __main__ - Step 28542: {'lr': 0.00019978297949193113, 'samples': 913344, 'steps': 1783, 'loss/train': 0.7132733464241028} -09/20/2021 20:40:11 - INFO - __main__ - Step 28543: {'lr': 0.00019978297949193113, 'samples': 913376, 'steps': 1783, 'loss/train': 1.8535236120224} -09/20/2021 20:40:11 - INFO - __main__ - Step 28544: {'lr': 0.00019978297949193113, 'samples': 913408, 'steps': 1783, 'loss/train': 3.261218547821045} -09/20/2021 20:40:12 - INFO - __main__ - Step 28545: {'lr': 0.00019978255926573346, 'samples': 913440, 'steps': 1784, 'loss/train': 2.2305915355682373} -09/20/2021 20:40:13 - INFO - __main__ - Step 28546: {'lr': 0.00019978255926573346, 'samples': 913472, 'steps': 1784, 'loss/train': 2.7501180171966553} -09/20/2021 20:40:14 - INFO - __main__ - Step 28547: {'lr': 0.00019978255926573346, 'samples': 913504, 'steps': 1784, 'loss/train': 2.6103310585021973} -09/20/2021 20:40:14 - INFO - __main__ - Step 28548: {'lr': 0.00019978255926573346, 'samples': 913536, 'steps': 1784, 'loss/train': 2.6392786502838135} -09/20/2021 20:40:15 - INFO - __main__ - Step 28549: {'lr': 0.00019978255926573346, 'samples': 913568, 'steps': 1784, 'loss/train': 3.0612049102783203} -09/20/2021 20:40:16 - INFO - __main__ - Step 28550: {'lr': 0.00019978255926573346, 'samples': 913600, 'steps': 1784, 'loss/train': 2.01735520362854} -09/20/2021 20:40:17 - INFO - __main__ - Step 28551: {'lr': 0.00019978255926573346, 'samples': 913632, 'steps': 1784, 'loss/train': 2.707587242126465} -09/20/2021 20:40:17 - INFO - __main__ - Step 28552: {'lr': 0.00019978255926573346, 'samples': 913664, 'steps': 1784, 'loss/train': 2.3870458602905273} -09/20/2021 20:40:18 - INFO - __main__ - Step 28553: {'lr': 0.00019978255926573346, 'samples': 913696, 'steps': 1784, 'loss/train': 0.4825453460216522} -09/20/2021 20:40:19 - INFO - __main__ - Step 28554: {'lr': 0.00019978255926573346, 'samples': 913728, 'steps': 1784, 'loss/train': 2.433385133743286} -09/20/2021 20:40:20 - INFO - __main__ - Step 28555: {'lr': 0.00019978255926573346, 'samples': 913760, 'steps': 1784, 'loss/train': 1.9169985055923462} -09/20/2021 20:40:21 - INFO - __main__ - Step 28556: {'lr': 0.00019978255926573346, 'samples': 913792, 'steps': 1784, 'loss/train': 2.7424795627593994} -09/20/2021 20:40:22 - INFO - __main__ - Step 28557: {'lr': 0.00019978255926573346, 'samples': 913824, 'steps': 1784, 'loss/train': 3.0045981407165527} -09/20/2021 20:40:23 - INFO - __main__ - Step 28558: {'lr': 0.00019978255926573346, 'samples': 913856, 'steps': 1784, 'loss/train': 1.6399173736572266} -09/20/2021 20:40:23 - INFO - __main__ - Step 28559: {'lr': 0.00019978255926573346, 'samples': 913888, 'steps': 1784, 'loss/train': 2.2463972568511963} -09/20/2021 20:40:24 - INFO - __main__ - Step 28560: {'lr': 0.00019978255926573346, 'samples': 913920, 'steps': 1784, 'loss/train': 1.2318753004074097} -09/20/2021 20:40:25 - INFO - __main__ - Step 28561: {'lr': 0.00019978213863352094, 'samples': 913952, 'steps': 1785, 'loss/train': 1.809181809425354} -09/20/2021 20:40:26 - INFO - __main__ - Step 28562: {'lr': 0.00019978213863352094, 'samples': 913984, 'steps': 1785, 'loss/train': 2.8935275077819824} -09/20/2021 20:40:27 - INFO - __main__ - Step 28563: {'lr': 0.00019978213863352094, 'samples': 914016, 'steps': 1785, 'loss/train': 2.062944173812866} -09/20/2021 20:40:27 - INFO - __main__ - Step 28564: {'lr': 0.00019978213863352094, 'samples': 914048, 'steps': 1785, 'loss/train': 3.098449468612671} -09/20/2021 20:40:28 - INFO - __main__ - Step 28565: {'lr': 0.00019978213863352094, 'samples': 914080, 'steps': 1785, 'loss/train': 2.4465067386627197} -09/20/2021 20:40:29 - INFO - __main__ - Step 28566: {'lr': 0.00019978213863352094, 'samples': 914112, 'steps': 1785, 'loss/train': 2.5173943042755127} -09/20/2021 20:40:30 - INFO - __main__ - Step 28567: {'lr': 0.00019978213863352094, 'samples': 914144, 'steps': 1785, 'loss/train': 2.3691062927246094} -09/20/2021 20:40:30 - INFO - __main__ - Step 28568: {'lr': 0.00019978213863352094, 'samples': 914176, 'steps': 1785, 'loss/train': 2.8640897274017334} -09/20/2021 20:40:31 - INFO - __main__ - Step 28569: {'lr': 0.00019978213863352094, 'samples': 914208, 'steps': 1785, 'loss/train': 1.7509081363677979} -09/20/2021 20:40:32 - INFO - __main__ - Step 28570: {'lr': 0.00019978213863352094, 'samples': 914240, 'steps': 1785, 'loss/train': 3.056396961212158} -09/20/2021 20:40:33 - INFO - __main__ - Step 28571: {'lr': 0.00019978213863352094, 'samples': 914272, 'steps': 1785, 'loss/train': 1.7637633085250854} -09/20/2021 20:40:33 - INFO - __main__ - Step 28572: {'lr': 0.00019978213863352094, 'samples': 914304, 'steps': 1785, 'loss/train': 1.947911024093628} -09/20/2021 20:40:34 - INFO - __main__ - Step 28573: {'lr': 0.00019978213863352094, 'samples': 914336, 'steps': 1785, 'loss/train': 3.7684998512268066} -09/20/2021 20:40:35 - INFO - __main__ - Step 28574: {'lr': 0.00019978213863352094, 'samples': 914368, 'steps': 1785, 'loss/train': 3.7228565216064453} -09/20/2021 20:40:36 - INFO - __main__ - Step 28575: {'lr': 0.00019978213863352094, 'samples': 914400, 'steps': 1785, 'loss/train': 3.6300132274627686} -09/20/2021 20:40:36 - INFO - __main__ - Step 28576: {'lr': 0.00019978213863352094, 'samples': 914432, 'steps': 1785, 'loss/train': 2.1363468170166016} -09/20/2021 20:40:37 - INFO - __main__ - Step 28577: {'lr': 0.00019978171759529528, 'samples': 914464, 'steps': 1786, 'loss/train': 4.644251346588135} -09/20/2021 20:40:38 - INFO - __main__ - Step 28578: {'lr': 0.00019978171759529528, 'samples': 914496, 'steps': 1786, 'loss/train': 3.5343570709228516} -09/20/2021 20:40:39 - INFO - __main__ - Step 28579: {'lr': 0.00019978171759529528, 'samples': 914528, 'steps': 1786, 'loss/train': 2.3348567485809326} -09/20/2021 20:40:39 - INFO - __main__ - Step 28580: {'lr': 0.00019978171759529528, 'samples': 914560, 'steps': 1786, 'loss/train': 2.8999111652374268} -09/20/2021 20:40:40 - INFO - __main__ - Step 28581: {'lr': 0.00019978171759529528, 'samples': 914592, 'steps': 1786, 'loss/train': 2.6064441204071045} -09/20/2021 20:40:41 - INFO - __main__ - Step 28582: {'lr': 0.00019978171759529528, 'samples': 914624, 'steps': 1786, 'loss/train': 1.7409826517105103} -09/20/2021 20:40:42 - INFO - __main__ - Step 28583: {'lr': 0.00019978171759529528, 'samples': 914656, 'steps': 1786, 'loss/train': 2.973228931427002} -09/20/2021 20:40:42 - INFO - __main__ - Step 28584: {'lr': 0.00019978171759529528, 'samples': 914688, 'steps': 1786, 'loss/train': 2.743119716644287} -09/20/2021 20:40:43 - INFO - __main__ - Step 28585: {'lr': 0.00019978171759529528, 'samples': 914720, 'steps': 1786, 'loss/train': 3.172459363937378} -09/20/2021 20:40:44 - INFO - __main__ - Step 28586: {'lr': 0.00019978171759529528, 'samples': 914752, 'steps': 1786, 'loss/train': 2.965963125228882} -09/20/2021 20:40:45 - INFO - __main__ - Step 28587: {'lr': 0.00019978171759529528, 'samples': 914784, 'steps': 1786, 'loss/train': 2.0514180660247803} -09/20/2021 20:40:46 - INFO - __main__ - Step 28588: {'lr': 0.00019978171759529528, 'samples': 914816, 'steps': 1786, 'loss/train': 2.2922310829162598} -09/20/2021 20:40:47 - INFO - __main__ - Step 28589: {'lr': 0.00019978171759529528, 'samples': 914848, 'steps': 1786, 'loss/train': 1.790147066116333} -09/20/2021 20:40:47 - INFO - __main__ - Step 28590: {'lr': 0.00019978171759529528, 'samples': 914880, 'steps': 1786, 'loss/train': 2.9404773712158203} -09/20/2021 20:40:48 - INFO - __main__ - Step 28591: {'lr': 0.00019978171759529528, 'samples': 914912, 'steps': 1786, 'loss/train': 2.4624247550964355} -09/20/2021 20:40:49 - INFO - __main__ - Step 28592: {'lr': 0.00019978171759529528, 'samples': 914944, 'steps': 1786, 'loss/train': 2.704238176345825} -09/20/2021 20:40:50 - INFO - __main__ - Step 28593: {'lr': 0.0001997812961510582, 'samples': 914976, 'steps': 1787, 'loss/train': 2.7807679176330566} -09/20/2021 20:40:51 - INFO - __main__ - Step 28594: {'lr': 0.0001997812961510582, 'samples': 915008, 'steps': 1787, 'loss/train': 3.5137693881988525} -09/20/2021 20:40:51 - INFO - __main__ - Step 28595: {'lr': 0.0001997812961510582, 'samples': 915040, 'steps': 1787, 'loss/train': 2.530547618865967} -09/20/2021 20:40:52 - INFO - __main__ - Step 28596: {'lr': 0.0001997812961510582, 'samples': 915072, 'steps': 1787, 'loss/train': 1.98014497756958} -09/20/2021 20:40:53 - INFO - __main__ - Step 28597: {'lr': 0.0001997812961510582, 'samples': 915104, 'steps': 1787, 'loss/train': 2.911353349685669} -09/20/2021 20:40:54 - INFO - __main__ - Step 28598: {'lr': 0.0001997812961510582, 'samples': 915136, 'steps': 1787, 'loss/train': 1.9326574802398682} -09/20/2021 20:40:54 - INFO - __main__ - Step 28599: {'lr': 0.0001997812961510582, 'samples': 915168, 'steps': 1787, 'loss/train': 4.035880088806152} -09/20/2021 20:40:55 - INFO - __main__ - Step 28600: {'lr': 0.0001997812961510582, 'samples': 915200, 'steps': 1787, 'loss/train': 1.42741858959198} -09/20/2021 20:40:56 - INFO - __main__ - Step 28601: {'lr': 0.0001997812961510582, 'samples': 915232, 'steps': 1787, 'loss/train': 1.8351150751113892} -09/20/2021 20:40:57 - INFO - __main__ - Step 28602: {'lr': 0.0001997812961510582, 'samples': 915264, 'steps': 1787, 'loss/train': 2.3258743286132812} -09/20/2021 20:40:57 - INFO - __main__ - Step 28603: {'lr': 0.0001997812961510582, 'samples': 915296, 'steps': 1787, 'loss/train': 2.565426826477051} -09/20/2021 20:40:58 - INFO - __main__ - Step 28604: {'lr': 0.0001997812961510582, 'samples': 915328, 'steps': 1787, 'loss/train': 2.883683919906616} -09/20/2021 20:40:59 - INFO - __main__ - Step 28605: {'lr': 0.0001997812961510582, 'samples': 915360, 'steps': 1787, 'loss/train': 1.9125932455062866} -09/20/2021 20:41:00 - INFO - __main__ - Step 28606: {'lr': 0.0001997812961510582, 'samples': 915392, 'steps': 1787, 'loss/train': 2.6051595211029053} -09/20/2021 20:41:00 - INFO - __main__ - Step 28607: {'lr': 0.0001997812961510582, 'samples': 915424, 'steps': 1787, 'loss/train': 1.7734853029251099} -09/20/2021 20:41:01 - INFO - __main__ - Step 28608: {'lr': 0.0001997812961510582, 'samples': 915456, 'steps': 1787, 'loss/train': 3.135920524597168} -09/20/2021 20:41:02 - INFO - __main__ - Step 28609: {'lr': 0.00019978087430081137, 'samples': 915488, 'steps': 1788, 'loss/train': 1.4189900159835815} -09/20/2021 20:41:03 - INFO - __main__ - Step 28610: {'lr': 0.00019978087430081137, 'samples': 915520, 'steps': 1788, 'loss/train': 2.3081135749816895} -09/20/2021 20:41:03 - INFO - __main__ - Step 28611: {'lr': 0.00019978087430081137, 'samples': 915552, 'steps': 1788, 'loss/train': 2.089952230453491} -09/20/2021 20:41:04 - INFO - __main__ - Step 28612: {'lr': 0.00019978087430081137, 'samples': 915584, 'steps': 1788, 'loss/train': 2.432366132736206} -09/20/2021 20:41:05 - INFO - __main__ - Step 28613: {'lr': 0.00019978087430081137, 'samples': 915616, 'steps': 1788, 'loss/train': 3.343268871307373} -09/20/2021 20:41:06 - INFO - __main__ - Step 28614: {'lr': 0.00019978087430081137, 'samples': 915648, 'steps': 1788, 'loss/train': 1.9778432846069336} -09/20/2021 20:41:06 - INFO - __main__ - Step 28615: {'lr': 0.00019978087430081137, 'samples': 915680, 'steps': 1788, 'loss/train': 3.1076862812042236} -09/20/2021 20:41:07 - INFO - __main__ - Step 28616: {'lr': 0.00019978087430081137, 'samples': 915712, 'steps': 1788, 'loss/train': 4.076054573059082} -09/20/2021 20:41:09 - INFO - __main__ - Step 28617: {'lr': 0.00019978087430081137, 'samples': 915744, 'steps': 1788, 'loss/train': 2.3942737579345703} -09/20/2021 20:41:09 - INFO - __main__ - Step 28618: {'lr': 0.00019978087430081137, 'samples': 915776, 'steps': 1788, 'loss/train': 1.7721407413482666} -09/20/2021 20:41:10 - INFO - __main__ - Step 28619: {'lr': 0.00019978087430081137, 'samples': 915808, 'steps': 1788, 'loss/train': 2.0592286586761475} -09/20/2021 20:41:11 - INFO - __main__ - Step 28620: {'lr': 0.00019978087430081137, 'samples': 915840, 'steps': 1788, 'loss/train': 1.960841417312622} -09/20/2021 20:41:12 - INFO - __main__ - Step 28621: {'lr': 0.00019978087430081137, 'samples': 915872, 'steps': 1788, 'loss/train': 1.6771246194839478} -09/20/2021 20:41:12 - INFO - __main__ - Step 28622: {'lr': 0.00019978087430081137, 'samples': 915904, 'steps': 1788, 'loss/train': 2.4785470962524414} -09/20/2021 20:41:13 - INFO - __main__ - Step 28623: {'lr': 0.00019978087430081137, 'samples': 915936, 'steps': 1788, 'loss/train': 2.7159016132354736} -09/20/2021 20:41:14 - INFO - __main__ - Step 28624: {'lr': 0.00019978087430081137, 'samples': 915968, 'steps': 1788, 'loss/train': 2.148099422454834} -09/20/2021 20:41:15 - INFO - __main__ - Step 28625: {'lr': 0.0001997804520445566, 'samples': 916000, 'steps': 1789, 'loss/train': 1.367034673690796} -09/20/2021 20:41:15 - INFO - __main__ - Step 28626: {'lr': 0.0001997804520445566, 'samples': 916032, 'steps': 1789, 'loss/train': 2.302476644515991} -09/20/2021 20:41:16 - INFO - __main__ - Step 28627: {'lr': 0.0001997804520445566, 'samples': 916064, 'steps': 1789, 'loss/train': 2.503885269165039} -09/20/2021 20:41:17 - INFO - __main__ - Step 28628: {'lr': 0.0001997804520445566, 'samples': 916096, 'steps': 1789, 'loss/train': 1.9258785247802734} -09/20/2021 20:41:18 - INFO - __main__ - Step 28629: {'lr': 0.0001997804520445566, 'samples': 916128, 'steps': 1789, 'loss/train': 2.784658432006836} -09/20/2021 20:41:18 - INFO - __main__ - Step 28630: {'lr': 0.0001997804520445566, 'samples': 916160, 'steps': 1789, 'loss/train': 2.424095392227173} -09/20/2021 20:41:19 - INFO - __main__ - Step 28631: {'lr': 0.0001997804520445566, 'samples': 916192, 'steps': 1789, 'loss/train': 2.8435165882110596} -09/20/2021 20:41:20 - INFO - __main__ - Step 28632: {'lr': 0.0001997804520445566, 'samples': 916224, 'steps': 1789, 'loss/train': 0.4797658324241638} -09/20/2021 20:41:21 - INFO - __main__ - Step 28633: {'lr': 0.0001997804520445566, 'samples': 916256, 'steps': 1789, 'loss/train': 1.7819899320602417} -09/20/2021 20:41:21 - INFO - __main__ - Step 28634: {'lr': 0.0001997804520445566, 'samples': 916288, 'steps': 1789, 'loss/train': 3.059177875518799} -09/20/2021 20:41:22 - INFO - __main__ - Step 28635: {'lr': 0.0001997804520445566, 'samples': 916320, 'steps': 1789, 'loss/train': 2.4500668048858643} -09/20/2021 20:41:23 - INFO - __main__ - Step 28636: {'lr': 0.0001997804520445566, 'samples': 916352, 'steps': 1789, 'loss/train': 3.055549383163452} -09/20/2021 20:41:24 - INFO - __main__ - Step 28637: {'lr': 0.0001997804520445566, 'samples': 916384, 'steps': 1789, 'loss/train': 2.6711058616638184} -09/20/2021 20:41:24 - INFO - __main__ - Step 28638: {'lr': 0.0001997804520445566, 'samples': 916416, 'steps': 1789, 'loss/train': 2.8188774585723877} -09/20/2021 20:41:25 - INFO - __main__ - Step 28639: {'lr': 0.0001997804520445566, 'samples': 916448, 'steps': 1789, 'loss/train': 1.5209462642669678} -09/20/2021 20:41:26 - INFO - __main__ - Step 28640: {'lr': 0.0001997804520445566, 'samples': 916480, 'steps': 1789, 'loss/train': 0.9997690320014954} -09/20/2021 20:41:27 - INFO - __main__ - Step 28641: {'lr': 0.00019978002938229555, 'samples': 916512, 'steps': 1790, 'loss/train': 2.3064687252044678} -09/20/2021 20:41:28 - INFO - __main__ - Step 28642: {'lr': 0.00019978002938229555, 'samples': 916544, 'steps': 1790, 'loss/train': 2.5850112438201904} -09/20/2021 20:41:28 - INFO - __main__ - Step 28643: {'lr': 0.00019978002938229555, 'samples': 916576, 'steps': 1790, 'loss/train': 2.016955614089966} -09/20/2021 20:41:29 - INFO - __main__ - Step 28644: {'lr': 0.00019978002938229555, 'samples': 916608, 'steps': 1790, 'loss/train': 2.899754047393799} -09/20/2021 20:41:30 - INFO - __main__ - Step 28645: {'lr': 0.00019978002938229555, 'samples': 916640, 'steps': 1790, 'loss/train': 0.862207293510437} -09/20/2021 20:41:31 - INFO - __main__ - Step 28646: {'lr': 0.00019978002938229555, 'samples': 916672, 'steps': 1790, 'loss/train': 2.625051498413086} -09/20/2021 20:41:31 - INFO - __main__ - Step 28647: {'lr': 0.00019978002938229555, 'samples': 916704, 'steps': 1790, 'loss/train': 2.1443276405334473} -09/20/2021 20:41:32 - INFO - __main__ - Step 28648: {'lr': 0.00019978002938229555, 'samples': 916736, 'steps': 1790, 'loss/train': 3.306771755218506} -09/20/2021 20:41:33 - INFO - __main__ - Step 28649: {'lr': 0.00019978002938229555, 'samples': 916768, 'steps': 1790, 'loss/train': 1.9675341844558716} -09/20/2021 20:41:35 - INFO - __main__ - Step 28650: {'lr': 0.00019978002938229555, 'samples': 916800, 'steps': 1790, 'loss/train': 1.8786771297454834} -09/20/2021 20:41:35 - INFO - __main__ - Step 28651: {'lr': 0.00019978002938229555, 'samples': 916832, 'steps': 1790, 'loss/train': 1.8109816312789917} -09/20/2021 20:41:36 - INFO - __main__ - Step 28652: {'lr': 0.00019978002938229555, 'samples': 916864, 'steps': 1790, 'loss/train': 3.503925323486328} -09/20/2021 20:41:37 - INFO - __main__ - Step 28653: {'lr': 0.00019978002938229555, 'samples': 916896, 'steps': 1790, 'loss/train': 2.8022069931030273} -09/20/2021 20:41:38 - INFO - __main__ - Step 28654: {'lr': 0.00019978002938229555, 'samples': 916928, 'steps': 1790, 'loss/train': 3.9873220920562744} -09/20/2021 20:41:38 - INFO - __main__ - Step 28655: {'lr': 0.00019978002938229555, 'samples': 916960, 'steps': 1790, 'loss/train': 1.0337307453155518} -09/20/2021 20:41:39 - INFO - __main__ - Step 28656: {'lr': 0.00019978002938229555, 'samples': 916992, 'steps': 1790, 'loss/train': 2.0862669944763184} -09/20/2021 20:41:40 - INFO - __main__ - Step 28657: {'lr': 0.00019977960631402993, 'samples': 917024, 'steps': 1791, 'loss/train': 2.4074337482452393} -09/20/2021 20:41:41 - INFO - __main__ - Step 28658: {'lr': 0.00019977960631402993, 'samples': 917056, 'steps': 1791, 'loss/train': 1.6692174673080444} -09/20/2021 20:41:42 - INFO - __main__ - Step 28659: {'lr': 0.00019977960631402993, 'samples': 917088, 'steps': 1791, 'loss/train': 2.515155553817749} -09/20/2021 20:41:42 - INFO - __main__ - Step 28660: {'lr': 0.00019977960631402993, 'samples': 917120, 'steps': 1791, 'loss/train': 2.462944269180298} -09/20/2021 20:41:43 - INFO - __main__ - Step 28661: {'lr': 0.00019977960631402993, 'samples': 917152, 'steps': 1791, 'loss/train': 2.416250705718994} -09/20/2021 20:41:44 - INFO - __main__ - Step 28662: {'lr': 0.00019977960631402993, 'samples': 917184, 'steps': 1791, 'loss/train': 2.411961793899536} -09/20/2021 20:41:45 - INFO - __main__ - Step 28663: {'lr': 0.00019977960631402993, 'samples': 917216, 'steps': 1791, 'loss/train': 2.631370782852173} -09/20/2021 20:41:45 - INFO - __main__ - Step 28664: {'lr': 0.00019977960631402993, 'samples': 917248, 'steps': 1791, 'loss/train': 2.697821855545044} -09/20/2021 20:41:46 - INFO - __main__ - Step 28665: {'lr': 0.00019977960631402993, 'samples': 917280, 'steps': 1791, 'loss/train': 3.2275943756103516} -09/20/2021 20:41:47 - INFO - __main__ - Step 28666: {'lr': 0.00019977960631402993, 'samples': 917312, 'steps': 1791, 'loss/train': 2.5683932304382324} -09/20/2021 20:41:48 - INFO - __main__ - Step 28667: {'lr': 0.00019977960631402993, 'samples': 917344, 'steps': 1791, 'loss/train': 3.246119260787964} -09/20/2021 20:41:48 - INFO - __main__ - Step 28668: {'lr': 0.00019977960631402993, 'samples': 917376, 'steps': 1791, 'loss/train': 2.9289019107818604} -09/20/2021 20:41:49 - INFO - __main__ - Step 28669: {'lr': 0.00019977960631402993, 'samples': 917408, 'steps': 1791, 'loss/train': 2.6734654903411865} -09/20/2021 20:41:50 - INFO - __main__ - Step 28670: {'lr': 0.00019977960631402993, 'samples': 917440, 'steps': 1791, 'loss/train': 1.9198193550109863} -09/20/2021 20:41:51 - INFO - __main__ - Step 28671: {'lr': 0.00019977960631402993, 'samples': 917472, 'steps': 1791, 'loss/train': 1.3654755353927612} -09/20/2021 20:41:51 - INFO - __main__ - Step 28672: {'lr': 0.00019977960631402993, 'samples': 917504, 'steps': 1791, 'loss/train': 2.5323872566223145} -09/20/2021 20:41:52 - INFO - __main__ - Step 28673: {'lr': 0.00019977918283976148, 'samples': 917536, 'steps': 1792, 'loss/train': 2.618530750274658} -09/20/2021 20:41:53 - INFO - __main__ - Step 28674: {'lr': 0.00019977918283976148, 'samples': 917568, 'steps': 1792, 'loss/train': 3.0010199546813965} -09/20/2021 20:41:54 - INFO - __main__ - Step 28675: {'lr': 0.00019977918283976148, 'samples': 917600, 'steps': 1792, 'loss/train': 1.4905654191970825} -09/20/2021 20:41:54 - INFO - __main__ - Step 28676: {'lr': 0.00019977918283976148, 'samples': 917632, 'steps': 1792, 'loss/train': 4.2973103523254395} -09/20/2021 20:41:55 - INFO - __main__ - Step 28677: {'lr': 0.00019977918283976148, 'samples': 917664, 'steps': 1792, 'loss/train': 2.5906975269317627} -09/20/2021 20:41:56 - INFO - __main__ - Step 28678: {'lr': 0.00019977918283976148, 'samples': 917696, 'steps': 1792, 'loss/train': 2.1313083171844482} -09/20/2021 20:41:57 - INFO - __main__ - Step 28679: {'lr': 0.00019977918283976148, 'samples': 917728, 'steps': 1792, 'loss/train': 1.6528034210205078} -09/20/2021 20:41:58 - INFO - __main__ - Step 28680: {'lr': 0.00019977918283976148, 'samples': 917760, 'steps': 1792, 'loss/train': 2.2950985431671143} -09/20/2021 20:41:59 - INFO - __main__ - Step 28681: {'lr': 0.00019977918283976148, 'samples': 917792, 'steps': 1792, 'loss/train': 2.1315701007843018} -09/20/2021 20:41:59 - INFO - __main__ - Step 28682: {'lr': 0.00019977918283976148, 'samples': 917824, 'steps': 1792, 'loss/train': 2.325124979019165} -09/20/2021 20:42:00 - INFO - __main__ - Step 28683: {'lr': 0.00019977918283976148, 'samples': 917856, 'steps': 1792, 'loss/train': 3.0917983055114746} -09/20/2021 20:42:01 - INFO - __main__ - Step 28684: {'lr': 0.00019977918283976148, 'samples': 917888, 'steps': 1792, 'loss/train': 2.5415265560150146} -09/20/2021 20:42:02 - INFO - __main__ - Step 28685: {'lr': 0.00019977918283976148, 'samples': 917920, 'steps': 1792, 'loss/train': 3.6225028038024902} -09/20/2021 20:42:02 - INFO - __main__ - Step 28686: {'lr': 0.00019977918283976148, 'samples': 917952, 'steps': 1792, 'loss/train': 3.2434589862823486} -09/20/2021 20:42:03 - INFO - __main__ - Step 28687: {'lr': 0.00019977918283976148, 'samples': 917984, 'steps': 1792, 'loss/train': 2.1545751094818115} -09/20/2021 20:42:04 - INFO - __main__ - Step 28688: {'lr': 0.00019977918283976148, 'samples': 918016, 'steps': 1792, 'loss/train': 2.5970358848571777} -09/20/2021 20:42:05 - INFO - __main__ - Step 28689: {'lr': 0.00019977875895949194, 'samples': 918048, 'steps': 1793, 'loss/train': 2.8857882022857666} -09/20/2021 20:42:06 - INFO - __main__ - Step 28690: {'lr': 0.00019977875895949194, 'samples': 918080, 'steps': 1793, 'loss/train': 3.277876615524292} -09/20/2021 20:42:06 - INFO - __main__ - Step 28691: {'lr': 0.00019977875895949194, 'samples': 918112, 'steps': 1793, 'loss/train': 2.2351465225219727} -09/20/2021 20:42:07 - INFO - __main__ - Step 28692: {'lr': 0.00019977875895949194, 'samples': 918144, 'steps': 1793, 'loss/train': 1.7488071918487549} -09/20/2021 20:42:08 - INFO - __main__ - Step 28693: {'lr': 0.00019977875895949194, 'samples': 918176, 'steps': 1793, 'loss/train': 1.8610411882400513} -09/20/2021 20:42:09 - INFO - __main__ - Step 28694: {'lr': 0.00019977875895949194, 'samples': 918208, 'steps': 1793, 'loss/train': 2.5939362049102783} -09/20/2021 20:42:09 - INFO - __main__ - Step 28695: {'lr': 0.00019977875895949194, 'samples': 918240, 'steps': 1793, 'loss/train': 2.9059321880340576} -09/20/2021 20:42:10 - INFO - __main__ - Step 28696: {'lr': 0.00019977875895949194, 'samples': 918272, 'steps': 1793, 'loss/train': 1.825380802154541} -09/20/2021 20:42:11 - INFO - __main__ - Step 28697: {'lr': 0.00019977875895949194, 'samples': 918304, 'steps': 1793, 'loss/train': 3.554042100906372} -09/20/2021 20:42:12 - INFO - __main__ - Step 28698: {'lr': 0.00019977875895949194, 'samples': 918336, 'steps': 1793, 'loss/train': 2.336444854736328} -09/20/2021 20:42:12 - INFO - __main__ - Step 28699: {'lr': 0.00019977875895949194, 'samples': 918368, 'steps': 1793, 'loss/train': 2.1275031566619873} -09/20/2021 20:42:13 - INFO - __main__ - Step 28700: {'lr': 0.00019977875895949194, 'samples': 918400, 'steps': 1793, 'loss/train': 2.7521355152130127} -09/20/2021 20:42:14 - INFO - __main__ - Step 28701: {'lr': 0.00019977875895949194, 'samples': 918432, 'steps': 1793, 'loss/train': 3.575164794921875} -09/20/2021 20:42:15 - INFO - __main__ - Step 28702: {'lr': 0.00019977875895949194, 'samples': 918464, 'steps': 1793, 'loss/train': 2.3663582801818848} -09/20/2021 20:42:15 - INFO - __main__ - Step 28703: {'lr': 0.00019977875895949194, 'samples': 918496, 'steps': 1793, 'loss/train': 2.8360345363616943} -09/20/2021 20:42:16 - INFO - __main__ - Step 28704: {'lr': 0.00019977875895949194, 'samples': 918528, 'steps': 1793, 'loss/train': 2.439610481262207} -09/20/2021 20:42:17 - INFO - __main__ - Step 28705: {'lr': 0.000199778334673223, 'samples': 918560, 'steps': 1794, 'loss/train': 1.9306946992874146} -09/20/2021 20:42:18 - INFO - __main__ - Step 28706: {'lr': 0.000199778334673223, 'samples': 918592, 'steps': 1794, 'loss/train': 3.0974667072296143} -09/20/2021 20:42:18 - INFO - __main__ - Step 28707: {'lr': 0.000199778334673223, 'samples': 918624, 'steps': 1794, 'loss/train': 5.381501197814941} -09/20/2021 20:42:19 - INFO - __main__ - Step 28708: {'lr': 0.000199778334673223, 'samples': 918656, 'steps': 1794, 'loss/train': 3.0485570430755615} -09/20/2021 20:42:20 - INFO - __main__ - Step 28709: {'lr': 0.000199778334673223, 'samples': 918688, 'steps': 1794, 'loss/train': 3.0574169158935547} -09/20/2021 20:42:21 - INFO - __main__ - Step 28710: {'lr': 0.000199778334673223, 'samples': 918720, 'steps': 1794, 'loss/train': 2.5167198181152344} -09/20/2021 20:42:22 - INFO - __main__ - Step 28711: {'lr': 0.000199778334673223, 'samples': 918752, 'steps': 1794, 'loss/train': 2.5495760440826416} -09/20/2021 20:42:23 - INFO - __main__ - Step 28712: {'lr': 0.000199778334673223, 'samples': 918784, 'steps': 1794, 'loss/train': 2.727464437484741} -09/20/2021 20:42:24 - INFO - __main__ - Step 28713: {'lr': 0.000199778334673223, 'samples': 918816, 'steps': 1794, 'loss/train': 0.46667173504829407} -09/20/2021 20:42:24 - INFO - __main__ - Step 28714: {'lr': 0.000199778334673223, 'samples': 918848, 'steps': 1794, 'loss/train': 2.071491241455078} -09/20/2021 20:42:25 - INFO - __main__ - Step 28715: {'lr': 0.000199778334673223, 'samples': 918880, 'steps': 1794, 'loss/train': 3.1354939937591553} -09/20/2021 20:42:26 - INFO - __main__ - Step 28716: {'lr': 0.000199778334673223, 'samples': 918912, 'steps': 1794, 'loss/train': 3.0637259483337402} -09/20/2021 20:42:27 - INFO - __main__ - Step 28717: {'lr': 0.000199778334673223, 'samples': 918944, 'steps': 1794, 'loss/train': 2.3422470092773438} -09/20/2021 20:42:27 - INFO - __main__ - Step 28718: {'lr': 0.000199778334673223, 'samples': 918976, 'steps': 1794, 'loss/train': 3.738424062728882} -09/20/2021 20:42:28 - INFO - __main__ - Step 28719: {'lr': 0.000199778334673223, 'samples': 919008, 'steps': 1794, 'loss/train': 2.740622043609619} -09/20/2021 20:42:29 - INFO - __main__ - Step 28720: {'lr': 0.000199778334673223, 'samples': 919040, 'steps': 1794, 'loss/train': 3.000629186630249} -09/20/2021 20:42:30 - INFO - __main__ - Step 28721: {'lr': 0.0001997779099809564, 'samples': 919072, 'steps': 1795, 'loss/train': 2.3125662803649902} -09/20/2021 20:42:31 - INFO - __main__ - Step 28722: {'lr': 0.0001997779099809564, 'samples': 919104, 'steps': 1795, 'loss/train': 1.3857804536819458} -09/20/2021 20:42:31 - INFO - __main__ - Step 28723: {'lr': 0.0001997779099809564, 'samples': 919136, 'steps': 1795, 'loss/train': 2.4738292694091797} -09/20/2021 20:42:32 - INFO - __main__ - Step 28724: {'lr': 0.0001997779099809564, 'samples': 919168, 'steps': 1795, 'loss/train': 1.711998462677002} -09/20/2021 20:42:33 - INFO - __main__ - Step 28725: {'lr': 0.0001997779099809564, 'samples': 919200, 'steps': 1795, 'loss/train': 1.5864572525024414} -09/20/2021 20:42:34 - INFO - __main__ - Step 28726: {'lr': 0.0001997779099809564, 'samples': 919232, 'steps': 1795, 'loss/train': 1.731096625328064} -09/20/2021 20:42:34 - INFO - __main__ - Step 28727: {'lr': 0.0001997779099809564, 'samples': 919264, 'steps': 1795, 'loss/train': 3.4738974571228027} -09/20/2021 20:42:35 - INFO - __main__ - Step 28728: {'lr': 0.0001997779099809564, 'samples': 919296, 'steps': 1795, 'loss/train': 1.467104196548462} -09/20/2021 20:42:36 - INFO - __main__ - Step 28729: {'lr': 0.0001997779099809564, 'samples': 919328, 'steps': 1795, 'loss/train': 2.4658491611480713} -09/20/2021 20:42:37 - INFO - __main__ - Step 28730: {'lr': 0.0001997779099809564, 'samples': 919360, 'steps': 1795, 'loss/train': 2.61594557762146} -09/20/2021 20:42:37 - INFO - __main__ - Step 28731: {'lr': 0.0001997779099809564, 'samples': 919392, 'steps': 1795, 'loss/train': 2.761320114135742} -09/20/2021 20:42:38 - INFO - __main__ - Step 28732: {'lr': 0.0001997779099809564, 'samples': 919424, 'steps': 1795, 'loss/train': 3.014275074005127} -09/20/2021 20:42:39 - INFO - __main__ - Step 28733: {'lr': 0.0001997779099809564, 'samples': 919456, 'steps': 1795, 'loss/train': 1.6879541873931885} -09/20/2021 20:42:40 - INFO - __main__ - Step 28734: {'lr': 0.0001997779099809564, 'samples': 919488, 'steps': 1795, 'loss/train': 1.0663865804672241} -09/20/2021 20:42:40 - INFO - __main__ - Step 28735: {'lr': 0.0001997779099809564, 'samples': 919520, 'steps': 1795, 'loss/train': 2.0422048568725586} -09/20/2021 20:42:41 - INFO - __main__ - Step 28736: {'lr': 0.0001997779099809564, 'samples': 919552, 'steps': 1795, 'loss/train': 1.956183671951294} -09/20/2021 20:42:42 - INFO - __main__ - Step 28737: {'lr': 0.00019977748488269391, 'samples': 919584, 'steps': 1796, 'loss/train': 2.3388326168060303} -09/20/2021 20:42:43 - INFO - __main__ - Step 28738: {'lr': 0.00019977748488269391, 'samples': 919616, 'steps': 1796, 'loss/train': 2.648308515548706} -09/20/2021 20:42:43 - INFO - __main__ - Step 28739: {'lr': 0.00019977748488269391, 'samples': 919648, 'steps': 1796, 'loss/train': 2.7179832458496094} -09/20/2021 20:42:44 - INFO - __main__ - Step 28740: {'lr': 0.00019977748488269391, 'samples': 919680, 'steps': 1796, 'loss/train': 2.7158396244049072} -09/20/2021 20:42:46 - INFO - __main__ - Step 28741: {'lr': 0.00019977748488269391, 'samples': 919712, 'steps': 1796, 'loss/train': 2.564042091369629} -09/20/2021 20:42:46 - INFO - __main__ - Step 28742: {'lr': 0.00019977748488269391, 'samples': 919744, 'steps': 1796, 'loss/train': 0.675998866558075} -09/20/2021 20:42:47 - INFO - __main__ - Step 28743: {'lr': 0.00019977748488269391, 'samples': 919776, 'steps': 1796, 'loss/train': 0.48876953125} -09/20/2021 20:42:48 - INFO - __main__ - Step 28744: {'lr': 0.00019977748488269391, 'samples': 919808, 'steps': 1796, 'loss/train': 0.4666619896888733} -09/20/2021 20:42:49 - INFO - __main__ - Step 28745: {'lr': 0.00019977748488269391, 'samples': 919840, 'steps': 1796, 'loss/train': 0.5885902047157288} -09/20/2021 20:42:49 - INFO - __main__ - Step 28746: {'lr': 0.00019977748488269391, 'samples': 919872, 'steps': 1796, 'loss/train': 3.5815794467926025} -09/20/2021 20:42:50 - INFO - __main__ - Step 28747: {'lr': 0.00019977748488269391, 'samples': 919904, 'steps': 1796, 'loss/train': 3.5097086429595947} -09/20/2021 20:42:51 - INFO - __main__ - Step 28748: {'lr': 0.00019977748488269391, 'samples': 919936, 'steps': 1796, 'loss/train': 2.3529319763183594} -09/20/2021 20:42:52 - INFO - __main__ - Step 28749: {'lr': 0.00019977748488269391, 'samples': 919968, 'steps': 1796, 'loss/train': 1.9824705123901367} -09/20/2021 20:42:52 - INFO - __main__ - Step 28750: {'lr': 0.00019977748488269391, 'samples': 920000, 'steps': 1796, 'loss/train': 0.8714020252227783} -09/20/2021 20:42:53 - INFO - __main__ - Step 28751: {'lr': 0.00019977748488269391, 'samples': 920032, 'steps': 1796, 'loss/train': 2.418260335922241} -09/20/2021 20:42:54 - INFO - __main__ - Step 28752: {'lr': 0.00019977748488269391, 'samples': 920064, 'steps': 1796, 'loss/train': 1.9685847759246826} -09/20/2021 20:42:55 - INFO - __main__ - Step 28753: {'lr': 0.0001997770593784372, 'samples': 920096, 'steps': 1797, 'loss/train': 2.2727129459381104} -09/20/2021 20:42:55 - INFO - __main__ - Step 28754: {'lr': 0.0001997770593784372, 'samples': 920128, 'steps': 1797, 'loss/train': 3.223332166671753} -09/20/2021 20:42:56 - INFO - __main__ - Step 28755: {'lr': 0.0001997770593784372, 'samples': 920160, 'steps': 1797, 'loss/train': 2.1856281757354736} -09/20/2021 20:42:57 - INFO - __main__ - Step 28756: {'lr': 0.0001997770593784372, 'samples': 920192, 'steps': 1797, 'loss/train': 3.2447047233581543} -09/20/2021 20:42:58 - INFO - __main__ - Step 28757: {'lr': 0.0001997770593784372, 'samples': 920224, 'steps': 1797, 'loss/train': 2.336745023727417} -09/20/2021 20:42:58 - INFO - __main__ - Step 28758: {'lr': 0.0001997770593784372, 'samples': 920256, 'steps': 1797, 'loss/train': 2.934619903564453} -09/20/2021 20:42:59 - INFO - __main__ - Step 28759: {'lr': 0.0001997770593784372, 'samples': 920288, 'steps': 1797, 'loss/train': 3.0274717807769775} -09/20/2021 20:43:00 - INFO - __main__ - Step 28760: {'lr': 0.0001997770593784372, 'samples': 920320, 'steps': 1797, 'loss/train': 2.494089126586914} -09/20/2021 20:43:01 - INFO - __main__ - Step 28761: {'lr': 0.0001997770593784372, 'samples': 920352, 'steps': 1797, 'loss/train': 2.6709115505218506} -09/20/2021 20:43:01 - INFO - __main__ - Step 28762: {'lr': 0.0001997770593784372, 'samples': 920384, 'steps': 1797, 'loss/train': 2.081606388092041} -09/20/2021 20:43:02 - INFO - __main__ - Step 28763: {'lr': 0.0001997770593784372, 'samples': 920416, 'steps': 1797, 'loss/train': 3.061211585998535} -09/20/2021 20:43:03 - INFO - __main__ - Step 28764: {'lr': 0.0001997770593784372, 'samples': 920448, 'steps': 1797, 'loss/train': 2.2873971462249756} -09/20/2021 20:43:04 - INFO - __main__ - Step 28765: {'lr': 0.0001997770593784372, 'samples': 920480, 'steps': 1797, 'loss/train': 1.047554850578308} -09/20/2021 20:43:04 - INFO - __main__ - Step 28766: {'lr': 0.0001997770593784372, 'samples': 920512, 'steps': 1797, 'loss/train': 2.7576746940612793} -09/20/2021 20:43:05 - INFO - __main__ - Step 28767: {'lr': 0.0001997770593784372, 'samples': 920544, 'steps': 1797, 'loss/train': 2.4729793071746826} -09/20/2021 20:43:06 - INFO - __main__ - Step 28768: {'lr': 0.0001997770593784372, 'samples': 920576, 'steps': 1797, 'loss/train': 2.1853675842285156} -09/20/2021 20:43:07 - INFO - __main__ - Step 28769: {'lr': 0.000199776633468188, 'samples': 920608, 'steps': 1798, 'loss/train': 1.8271784782409668} -09/20/2021 20:43:08 - INFO - __main__ - Step 28770: {'lr': 0.000199776633468188, 'samples': 920640, 'steps': 1798, 'loss/train': 2.7937581539154053} -09/20/2021 20:43:08 - INFO - __main__ - Step 28771: {'lr': 0.000199776633468188, 'samples': 920672, 'steps': 1798, 'loss/train': 2.932248592376709} -09/20/2021 20:43:09 - INFO - __main__ - Step 28772: {'lr': 0.000199776633468188, 'samples': 920704, 'steps': 1798, 'loss/train': 2.399888277053833} -09/20/2021 20:43:11 - INFO - __main__ - Step 28773: {'lr': 0.000199776633468188, 'samples': 920736, 'steps': 1798, 'loss/train': 1.550405740737915} -09/20/2021 20:43:12 - INFO - __main__ - Step 28774: {'lr': 0.000199776633468188, 'samples': 920768, 'steps': 1798, 'loss/train': 2.7450435161590576} -09/20/2021 20:43:12 - INFO - __main__ - Step 28775: {'lr': 0.000199776633468188, 'samples': 920800, 'steps': 1798, 'loss/train': 1.0596290826797485} -09/20/2021 20:43:13 - INFO - __main__ - Step 28776: {'lr': 0.000199776633468188, 'samples': 920832, 'steps': 1798, 'loss/train': 2.497225522994995} -09/20/2021 20:43:14 - INFO - __main__ - Step 28777: {'lr': 0.000199776633468188, 'samples': 920864, 'steps': 1798, 'loss/train': 2.284324884414673} -09/20/2021 20:43:15 - INFO - __main__ - Step 28778: {'lr': 0.000199776633468188, 'samples': 920896, 'steps': 1798, 'loss/train': 3.24560809135437} -09/20/2021 20:43:15 - INFO - __main__ - Step 28779: {'lr': 0.000199776633468188, 'samples': 920928, 'steps': 1798, 'loss/train': 2.7499892711639404} -09/20/2021 20:43:16 - INFO - __main__ - Step 28780: {'lr': 0.000199776633468188, 'samples': 920960, 'steps': 1798, 'loss/train': 2.585392475128174} -09/20/2021 20:43:17 - INFO - __main__ - Step 28781: {'lr': 0.000199776633468188, 'samples': 920992, 'steps': 1798, 'loss/train': 0.8296481370925903} -09/20/2021 20:43:18 - INFO - __main__ - Step 28782: {'lr': 0.000199776633468188, 'samples': 921024, 'steps': 1798, 'loss/train': 2.8689446449279785} -09/20/2021 20:43:18 - INFO - __main__ - Step 28783: {'lr': 0.000199776633468188, 'samples': 921056, 'steps': 1798, 'loss/train': 2.556842565536499} -09/20/2021 20:43:19 - INFO - __main__ - Step 28784: {'lr': 0.000199776633468188, 'samples': 921088, 'steps': 1798, 'loss/train': 2.212113857269287} -09/20/2021 20:43:20 - INFO - __main__ - Step 28785: {'lr': 0.0001997762071519481, 'samples': 921120, 'steps': 1799, 'loss/train': 3.4023637771606445} -09/20/2021 20:43:21 - INFO - __main__ - Step 28786: {'lr': 0.0001997762071519481, 'samples': 921152, 'steps': 1799, 'loss/train': 3.3080952167510986} -09/20/2021 20:43:21 - INFO - __main__ - Step 28787: {'lr': 0.0001997762071519481, 'samples': 921184, 'steps': 1799, 'loss/train': 2.8362042903900146} -09/20/2021 20:43:22 - INFO - __main__ - Step 28788: {'lr': 0.0001997762071519481, 'samples': 921216, 'steps': 1799, 'loss/train': 1.7692381143569946} -09/20/2021 20:43:23 - INFO - __main__ - Step 28789: {'lr': 0.0001997762071519481, 'samples': 921248, 'steps': 1799, 'loss/train': 2.193486213684082} -09/20/2021 20:43:24 - INFO - __main__ - Step 28790: {'lr': 0.0001997762071519481, 'samples': 921280, 'steps': 1799, 'loss/train': 2.526155471801758} -09/20/2021 20:43:24 - INFO - __main__ - Step 28791: {'lr': 0.0001997762071519481, 'samples': 921312, 'steps': 1799, 'loss/train': 1.098882794380188} -09/20/2021 20:43:25 - INFO - __main__ - Step 28792: {'lr': 0.0001997762071519481, 'samples': 921344, 'steps': 1799, 'loss/train': 1.2055906057357788} -09/20/2021 20:43:26 - INFO - __main__ - Step 28793: {'lr': 0.0001997762071519481, 'samples': 921376, 'steps': 1799, 'loss/train': 1.145068645477295} -09/20/2021 20:43:27 - INFO - __main__ - Step 28794: {'lr': 0.0001997762071519481, 'samples': 921408, 'steps': 1799, 'loss/train': 0.9238439202308655} -09/20/2021 20:43:27 - INFO - __main__ - Step 28795: {'lr': 0.0001997762071519481, 'samples': 921440, 'steps': 1799, 'loss/train': 1.0034481287002563} -09/20/2021 20:43:28 - INFO - __main__ - Step 28796: {'lr': 0.0001997762071519481, 'samples': 921472, 'steps': 1799, 'loss/train': 1.15377676486969} -09/20/2021 20:43:29 - INFO - __main__ - Step 28797: {'lr': 0.0001997762071519481, 'samples': 921504, 'steps': 1799, 'loss/train': 1.2094172239303589} -09/20/2021 20:43:30 - INFO - __main__ - Step 28798: {'lr': 0.0001997762071519481, 'samples': 921536, 'steps': 1799, 'loss/train': 1.4067233800888062} -09/20/2021 20:43:30 - INFO - __main__ - Step 28799: {'lr': 0.0001997762071519481, 'samples': 921568, 'steps': 1799, 'loss/train': 2.6914961338043213} -09/20/2021 20:43:31 - INFO - __main__ - Step 28800: {'lr': 0.0001997762071519481, 'samples': 921600, 'steps': 1799, 'loss/train': 2.619086742401123} -09/20/2021 20:43:32 - INFO - __main__ - Step 28801: {'lr': 0.0001997757804297192, 'samples': 921632, 'steps': 1800, 'loss/train': 3.2198166847229004} -09/20/2021 20:43:33 - INFO - __main__ - Step 28802: {'lr': 0.0001997757804297192, 'samples': 921664, 'steps': 1800, 'loss/train': 2.421985149383545} -09/20/2021 20:43:34 - INFO - __main__ - Step 28803: {'lr': 0.0001997757804297192, 'samples': 921696, 'steps': 1800, 'loss/train': 2.7120914459228516} -09/20/2021 20:43:34 - INFO - __main__ - Step 28804: {'lr': 0.0001997757804297192, 'samples': 921728, 'steps': 1800, 'loss/train': 1.4499115943908691} -09/20/2021 20:43:35 - INFO - __main__ - Step 28805: {'lr': 0.0001997757804297192, 'samples': 921760, 'steps': 1800, 'loss/train': 3.1573452949523926} -09/20/2021 20:43:36 - INFO - __main__ - Step 28806: {'lr': 0.0001997757804297192, 'samples': 921792, 'steps': 1800, 'loss/train': 2.619974374771118} -09/20/2021 20:43:37 - INFO - __main__ - Step 28807: {'lr': 0.0001997757804297192, 'samples': 921824, 'steps': 1800, 'loss/train': 2.47245717048645} -09/20/2021 20:43:37 - INFO - __main__ - Step 28808: {'lr': 0.0001997757804297192, 'samples': 921856, 'steps': 1800, 'loss/train': 0.6898397207260132} -09/20/2021 20:43:39 - INFO - __main__ - Step 28809: {'lr': 0.0001997757804297192, 'samples': 921888, 'steps': 1800, 'loss/train': 1.8638383150100708} -09/20/2021 20:43:39 - INFO - __main__ - Step 28810: {'lr': 0.0001997757804297192, 'samples': 921920, 'steps': 1800, 'loss/train': 1.8908811807632446} -09/20/2021 20:43:40 - INFO - __main__ - Step 28811: {'lr': 0.0001997757804297192, 'samples': 921952, 'steps': 1800, 'loss/train': 2.858945369720459} -09/20/2021 20:43:41 - INFO - __main__ - Step 28812: {'lr': 0.0001997757804297192, 'samples': 921984, 'steps': 1800, 'loss/train': 3.4741859436035156} -09/20/2021 20:43:42 - INFO - __main__ - Step 28813: {'lr': 0.0001997757804297192, 'samples': 922016, 'steps': 1800, 'loss/train': 2.5328528881073} -09/20/2021 20:43:42 - INFO - __main__ - Step 28814: {'lr': 0.0001997757804297192, 'samples': 922048, 'steps': 1800, 'loss/train': 2.6772053241729736} -09/20/2021 20:43:43 - INFO - __main__ - Step 28815: {'lr': 0.0001997757804297192, 'samples': 922080, 'steps': 1800, 'loss/train': 3.4355878829956055} -09/20/2021 20:43:44 - INFO - __main__ - Step 28816: {'lr': 0.0001997757804297192, 'samples': 922112, 'steps': 1800, 'loss/train': 2.6131975650787354} -09/20/2021 20:43:45 - INFO - __main__ - Step 28817: {'lr': 0.00019977535330150303, 'samples': 922144, 'steps': 1801, 'loss/train': 2.876591920852661} -09/20/2021 20:43:46 - INFO - __main__ - Step 28818: {'lr': 0.00019977535330150303, 'samples': 922176, 'steps': 1801, 'loss/train': 3.6384949684143066} -09/20/2021 20:43:46 - INFO - __main__ - Step 28819: {'lr': 0.00019977535330150303, 'samples': 922208, 'steps': 1801, 'loss/train': 2.182194232940674} -09/20/2021 20:43:47 - INFO - __main__ - Step 28820: {'lr': 0.00019977535330150303, 'samples': 922240, 'steps': 1801, 'loss/train': 3.34492826461792} -09/20/2021 20:43:48 - INFO - __main__ - Step 28821: {'lr': 0.00019977535330150303, 'samples': 922272, 'steps': 1801, 'loss/train': 2.38830304145813} -09/20/2021 20:43:49 - INFO - __main__ - Step 28822: {'lr': 0.00019977535330150303, 'samples': 922304, 'steps': 1801, 'loss/train': 2.705486536026001} -09/20/2021 20:43:49 - INFO - __main__ - Step 28823: {'lr': 0.00019977535330150303, 'samples': 922336, 'steps': 1801, 'loss/train': 2.8386964797973633} -09/20/2021 20:43:50 - INFO - __main__ - Step 28824: {'lr': 0.00019977535330150303, 'samples': 922368, 'steps': 1801, 'loss/train': 1.8401917219161987} -09/20/2021 20:43:51 - INFO - __main__ - Step 28825: {'lr': 0.00019977535330150303, 'samples': 922400, 'steps': 1801, 'loss/train': 2.333193302154541} -09/20/2021 20:43:52 - INFO - __main__ - Step 28826: {'lr': 0.00019977535330150303, 'samples': 922432, 'steps': 1801, 'loss/train': 2.3664729595184326} -09/20/2021 20:43:52 - INFO - __main__ - Step 28827: {'lr': 0.00019977535330150303, 'samples': 922464, 'steps': 1801, 'loss/train': 3.2806918621063232} -09/20/2021 20:43:53 - INFO - __main__ - Step 28828: {'lr': 0.00019977535330150303, 'samples': 922496, 'steps': 1801, 'loss/train': 3.325839042663574} -09/20/2021 20:43:54 - INFO - __main__ - Step 28829: {'lr': 0.00019977535330150303, 'samples': 922528, 'steps': 1801, 'loss/train': 2.5987985134124756} -09/20/2021 20:43:55 - INFO - __main__ - Step 28830: {'lr': 0.00019977535330150303, 'samples': 922560, 'steps': 1801, 'loss/train': 3.0923006534576416} -09/20/2021 20:43:55 - INFO - __main__ - Step 28831: {'lr': 0.00019977535330150303, 'samples': 922592, 'steps': 1801, 'loss/train': 2.560485363006592} -09/20/2021 20:43:56 - INFO - __main__ - Step 28832: {'lr': 0.00019977535330150303, 'samples': 922624, 'steps': 1801, 'loss/train': 2.9249444007873535} -09/20/2021 20:43:57 - INFO - __main__ - Step 28833: {'lr': 0.0001997749257673013, 'samples': 922656, 'steps': 1802, 'loss/train': 2.64068341255188} -09/20/2021 20:43:58 - INFO - __main__ - Step 28834: {'lr': 0.0001997749257673013, 'samples': 922688, 'steps': 1802, 'loss/train': 2.9346296787261963} -09/20/2021 20:43:58 - INFO - __main__ - Step 28835: {'lr': 0.0001997749257673013, 'samples': 922720, 'steps': 1802, 'loss/train': 1.7272318601608276} -09/20/2021 20:43:59 - INFO - __main__ - Step 28836: {'lr': 0.0001997749257673013, 'samples': 922752, 'steps': 1802, 'loss/train': 3.158095359802246} -09/20/2021 20:44:00 - INFO - __main__ - Step 28837: {'lr': 0.0001997749257673013, 'samples': 922784, 'steps': 1802, 'loss/train': 2.3938896656036377} -09/20/2021 20:44:01 - INFO - __main__ - Step 28838: {'lr': 0.0001997749257673013, 'samples': 922816, 'steps': 1802, 'loss/train': 2.3944900035858154} -09/20/2021 20:44:01 - INFO - __main__ - Step 28839: {'lr': 0.0001997749257673013, 'samples': 922848, 'steps': 1802, 'loss/train': 0.3750227987766266} -09/20/2021 20:44:02 - INFO - __main__ - Step 28840: {'lr': 0.0001997749257673013, 'samples': 922880, 'steps': 1802, 'loss/train': 0.47639453411102295} -09/20/2021 20:44:04 - INFO - __main__ - Step 28841: {'lr': 0.0001997749257673013, 'samples': 922912, 'steps': 1802, 'loss/train': 0.3447372317314148} -09/20/2021 20:44:04 - INFO - __main__ - Step 28842: {'lr': 0.0001997749257673013, 'samples': 922944, 'steps': 1802, 'loss/train': 3.458461046218872} -09/20/2021 20:44:05 - INFO - __main__ - Step 28843: {'lr': 0.0001997749257673013, 'samples': 922976, 'steps': 1802, 'loss/train': 1.8536659479141235} -09/20/2021 20:44:06 - INFO - __main__ - Step 28844: {'lr': 0.0001997749257673013, 'samples': 923008, 'steps': 1802, 'loss/train': 2.902179002761841} -09/20/2021 20:44:07 - INFO - __main__ - Step 28845: {'lr': 0.0001997749257673013, 'samples': 923040, 'steps': 1802, 'loss/train': 2.4647769927978516} -09/20/2021 20:44:07 - INFO - __main__ - Step 28846: {'lr': 0.0001997749257673013, 'samples': 923072, 'steps': 1802, 'loss/train': 3.40977144241333} -09/20/2021 20:44:08 - INFO - __main__ - Step 28847: {'lr': 0.0001997749257673013, 'samples': 923104, 'steps': 1802, 'loss/train': 2.490175485610962} -09/20/2021 20:44:09 - INFO - __main__ - Step 28848: {'lr': 0.0001997749257673013, 'samples': 923136, 'steps': 1802, 'loss/train': 1.961765170097351} -09/20/2021 20:44:10 - INFO - __main__ - Step 28849: {'lr': 0.00019977449782711582, 'samples': 923168, 'steps': 1803, 'loss/train': 2.93572735786438} -09/20/2021 20:44:11 - INFO - __main__ - Step 28850: {'lr': 0.00019977449782711582, 'samples': 923200, 'steps': 1803, 'loss/train': 3.2339494228363037} -09/20/2021 20:44:11 - INFO - __main__ - Step 28851: {'lr': 0.00019977449782711582, 'samples': 923232, 'steps': 1803, 'loss/train': 2.2069039344787598} -09/20/2021 20:44:12 - INFO - __main__ - Step 28852: {'lr': 0.00019977449782711582, 'samples': 923264, 'steps': 1803, 'loss/train': 1.8081927299499512} -09/20/2021 20:44:13 - INFO - __main__ - Step 28853: {'lr': 0.00019977449782711582, 'samples': 923296, 'steps': 1803, 'loss/train': 3.2010419368743896} -09/20/2021 20:44:14 - INFO - __main__ - Step 28854: {'lr': 0.00019977449782711582, 'samples': 923328, 'steps': 1803, 'loss/train': 1.6866965293884277} -09/20/2021 20:44:14 - INFO - __main__ - Step 28855: {'lr': 0.00019977449782711582, 'samples': 923360, 'steps': 1803, 'loss/train': 2.332596778869629} -09/20/2021 20:44:15 - INFO - __main__ - Step 28856: {'lr': 0.00019977449782711582, 'samples': 923392, 'steps': 1803, 'loss/train': 6.0340576171875} -09/20/2021 20:44:16 - INFO - __main__ - Step 28857: {'lr': 0.00019977449782711582, 'samples': 923424, 'steps': 1803, 'loss/train': 2.3622472286224365} -09/20/2021 20:44:17 - INFO - __main__ - Step 28858: {'lr': 0.00019977449782711582, 'samples': 923456, 'steps': 1803, 'loss/train': 2.414498805999756} -09/20/2021 20:44:17 - INFO - __main__ - Step 28859: {'lr': 0.00019977449782711582, 'samples': 923488, 'steps': 1803, 'loss/train': 3.6093740463256836} -09/20/2021 20:44:18 - INFO - __main__ - Step 28860: {'lr': 0.00019977449782711582, 'samples': 923520, 'steps': 1803, 'loss/train': 2.778679370880127} -09/20/2021 20:44:19 - INFO - __main__ - Step 28861: {'lr': 0.00019977449782711582, 'samples': 923552, 'steps': 1803, 'loss/train': 2.610707998275757} -09/20/2021 20:44:20 - INFO - __main__ - Step 28862: {'lr': 0.00019977449782711582, 'samples': 923584, 'steps': 1803, 'loss/train': 2.9587700366973877} -09/20/2021 20:44:20 - INFO - __main__ - Step 28863: {'lr': 0.00019977449782711582, 'samples': 923616, 'steps': 1803, 'loss/train': 3.2647860050201416} -09/20/2021 20:44:21 - INFO - __main__ - Step 28864: {'lr': 0.00019977449782711582, 'samples': 923648, 'steps': 1803, 'loss/train': 2.442779064178467} -09/20/2021 20:44:22 - INFO - __main__ - Step 28865: {'lr': 0.00019977406948094829, 'samples': 923680, 'steps': 1804, 'loss/train': 2.209360361099243} -09/20/2021 20:44:23 - INFO - __main__ - Step 28866: {'lr': 0.00019977406948094829, 'samples': 923712, 'steps': 1804, 'loss/train': 2.352404832839966} -09/20/2021 20:44:23 - INFO - __main__ - Step 28867: {'lr': 0.00019977406948094829, 'samples': 923744, 'steps': 1804, 'loss/train': 0.4575144052505493} -09/20/2021 20:44:24 - INFO - __main__ - Step 28868: {'lr': 0.00019977406948094829, 'samples': 923776, 'steps': 1804, 'loss/train': 1.5745983123779297} -09/20/2021 20:44:25 - INFO - __main__ - Step 28869: {'lr': 0.00019977406948094829, 'samples': 923808, 'steps': 1804, 'loss/train': 2.9295761585235596} -09/20/2021 20:44:26 - INFO - __main__ - Step 28870: {'lr': 0.00019977406948094829, 'samples': 923840, 'steps': 1804, 'loss/train': 2.410189628601074} -09/20/2021 20:44:26 - INFO - __main__ - Step 28871: {'lr': 0.00019977406948094829, 'samples': 923872, 'steps': 1804, 'loss/train': 4.139418125152588} -09/20/2021 20:44:27 - INFO - __main__ - Step 28872: {'lr': 0.00019977406948094829, 'samples': 923904, 'steps': 1804, 'loss/train': 4.240849494934082} -09/20/2021 20:44:29 - INFO - __main__ - Step 28873: {'lr': 0.00019977406948094829, 'samples': 923936, 'steps': 1804, 'loss/train': 4.109306335449219} -09/20/2021 20:44:29 - INFO - __main__ - Step 28874: {'lr': 0.00019977406948094829, 'samples': 923968, 'steps': 1804, 'loss/train': 3.1539463996887207} -09/20/2021 20:44:30 - INFO - __main__ - Step 28875: {'lr': 0.00019977406948094829, 'samples': 924000, 'steps': 1804, 'loss/train': 2.7794055938720703} -09/20/2021 20:44:31 - INFO - __main__ - Step 28876: {'lr': 0.00019977406948094829, 'samples': 924032, 'steps': 1804, 'loss/train': 1.8070948123931885} -09/20/2021 20:44:32 - INFO - __main__ - Step 28877: {'lr': 0.00019977406948094829, 'samples': 924064, 'steps': 1804, 'loss/train': 2.038393020629883} -09/20/2021 20:44:32 - INFO - __main__ - Step 28878: {'lr': 0.00019977406948094829, 'samples': 924096, 'steps': 1804, 'loss/train': 2.861680746078491} -09/20/2021 20:44:33 - INFO - __main__ - Step 28879: {'lr': 0.00019977406948094829, 'samples': 924128, 'steps': 1804, 'loss/train': 1.3544458150863647} -09/20/2021 20:44:34 - INFO - __main__ - Step 28880: {'lr': 0.00019977406948094829, 'samples': 924160, 'steps': 1804, 'loss/train': 2.7752230167388916} -09/20/2021 20:44:35 - INFO - __main__ - Step 28881: {'lr': 0.00019977364072880046, 'samples': 924192, 'steps': 1805, 'loss/train': 2.9729092121124268} -09/20/2021 20:44:36 - INFO - __main__ - Step 28882: {'lr': 0.00019977364072880046, 'samples': 924224, 'steps': 1805, 'loss/train': 3.4572155475616455} -09/20/2021 20:44:36 - INFO - __main__ - Step 28883: {'lr': 0.00019977364072880046, 'samples': 924256, 'steps': 1805, 'loss/train': 3.31559157371521} -09/20/2021 20:44:37 - INFO - __main__ - Step 28884: {'lr': 0.00019977364072880046, 'samples': 924288, 'steps': 1805, 'loss/train': 2.4540724754333496} -09/20/2021 20:44:38 - INFO - __main__ - Step 28885: {'lr': 0.00019977364072880046, 'samples': 924320, 'steps': 1805, 'loss/train': 0.9744234085083008} -09/20/2021 20:44:39 - INFO - __main__ - Step 28886: {'lr': 0.00019977364072880046, 'samples': 924352, 'steps': 1805, 'loss/train': 3.0439109802246094} -09/20/2021 20:44:39 - INFO - __main__ - Step 28887: {'lr': 0.00019977364072880046, 'samples': 924384, 'steps': 1805, 'loss/train': 2.4777133464813232} -09/20/2021 20:44:40 - INFO - __main__ - Step 28888: {'lr': 0.00019977364072880046, 'samples': 924416, 'steps': 1805, 'loss/train': 2.4641551971435547} -09/20/2021 20:44:41 - INFO - __main__ - Step 28889: {'lr': 0.00019977364072880046, 'samples': 924448, 'steps': 1805, 'loss/train': 2.152686357498169} -09/20/2021 20:44:42 - INFO - __main__ - Step 28890: {'lr': 0.00019977364072880046, 'samples': 924480, 'steps': 1805, 'loss/train': 1.1814860105514526} -09/20/2021 20:44:42 - INFO - __main__ - Step 28891: {'lr': 0.00019977364072880046, 'samples': 924512, 'steps': 1805, 'loss/train': 2.9997828006744385} -09/20/2021 20:44:43 - INFO - __main__ - Step 28892: {'lr': 0.00019977364072880046, 'samples': 924544, 'steps': 1805, 'loss/train': 1.8076233863830566} -09/20/2021 20:44:44 - INFO - __main__ - Step 28893: {'lr': 0.00019977364072880046, 'samples': 924576, 'steps': 1805, 'loss/train': 2.7421469688415527} -09/20/2021 20:44:45 - INFO - __main__ - Step 28894: {'lr': 0.00019977364072880046, 'samples': 924608, 'steps': 1805, 'loss/train': 3.274005174636841} -09/20/2021 20:44:45 - INFO - __main__ - Step 28895: {'lr': 0.00019977364072880046, 'samples': 924640, 'steps': 1805, 'loss/train': 0.6757150888442993} -09/20/2021 20:44:46 - INFO - __main__ - Step 28896: {'lr': 0.00019977364072880046, 'samples': 924672, 'steps': 1805, 'loss/train': 2.63541841506958} -09/20/2021 20:44:47 - INFO - __main__ - Step 28897: {'lr': 0.00019977321157067408, 'samples': 924704, 'steps': 1806, 'loss/train': 1.8570002317428589} -09/20/2021 20:44:48 - INFO - __main__ - Step 28898: {'lr': 0.00019977321157067408, 'samples': 924736, 'steps': 1806, 'loss/train': 2.179490566253662} -09/20/2021 20:44:48 - INFO - __main__ - Step 28899: {'lr': 0.00019977321157067408, 'samples': 924768, 'steps': 1806, 'loss/train': 2.592911958694458} -09/20/2021 20:44:49 - INFO - __main__ - Step 28900: {'lr': 0.00019977321157067408, 'samples': 924800, 'steps': 1806, 'loss/train': 3.3186402320861816} -09/20/2021 20:44:50 - INFO - __main__ - Step 28901: {'lr': 0.00019977321157067408, 'samples': 924832, 'steps': 1806, 'loss/train': 2.1713130474090576} -09/20/2021 20:44:51 - INFO - __main__ - Step 28902: {'lr': 0.00019977321157067408, 'samples': 924864, 'steps': 1806, 'loss/train': 2.332348108291626} -09/20/2021 20:44:51 - INFO - __main__ - Step 28903: {'lr': 0.00019977321157067408, 'samples': 924896, 'steps': 1806, 'loss/train': 2.1678802967071533} -09/20/2021 20:44:52 - INFO - __main__ - Step 28904: {'lr': 0.00019977321157067408, 'samples': 924928, 'steps': 1806, 'loss/train': 0.8390363454818726} -09/20/2021 20:44:53 - INFO - __main__ - Step 28905: {'lr': 0.00019977321157067408, 'samples': 924960, 'steps': 1806, 'loss/train': 0.6929572820663452} -09/20/2021 20:44:54 - INFO - __main__ - Step 28906: {'lr': 0.00019977321157067408, 'samples': 924992, 'steps': 1806, 'loss/train': 0.6407752633094788} -09/20/2021 20:44:55 - INFO - __main__ - Step 28907: {'lr': 0.00019977321157067408, 'samples': 925024, 'steps': 1806, 'loss/train': 0.41614633798599243} -09/20/2021 20:44:56 - INFO - __main__ - Step 28908: {'lr': 0.00019977321157067408, 'samples': 925056, 'steps': 1806, 'loss/train': 3.4930548667907715} -09/20/2021 20:44:57 - INFO - __main__ - Step 28909: {'lr': 0.00019977321157067408, 'samples': 925088, 'steps': 1806, 'loss/train': 2.920374870300293} -09/20/2021 20:44:57 - INFO - __main__ - Step 28910: {'lr': 0.00019977321157067408, 'samples': 925120, 'steps': 1806, 'loss/train': 2.876452922821045} -09/20/2021 20:44:58 - INFO - __main__ - Step 28911: {'lr': 0.00019977321157067408, 'samples': 925152, 'steps': 1806, 'loss/train': 2.899778127670288} -09/20/2021 20:44:59 - INFO - __main__ - Step 28912: {'lr': 0.00019977321157067408, 'samples': 925184, 'steps': 1806, 'loss/train': 2.937042236328125} -09/20/2021 20:45:00 - INFO - __main__ - Step 28913: {'lr': 0.00019977278200657085, 'samples': 925216, 'steps': 1807, 'loss/train': 2.8943347930908203} -09/20/2021 20:45:01 - INFO - __main__ - Step 28914: {'lr': 0.00019977278200657085, 'samples': 925248, 'steps': 1807, 'loss/train': 2.5001142024993896} -09/20/2021 20:45:01 - INFO - __main__ - Step 28915: {'lr': 0.00019977278200657085, 'samples': 925280, 'steps': 1807, 'loss/train': 2.20819354057312} -09/20/2021 20:45:02 - INFO - __main__ - Step 28916: {'lr': 0.00019977278200657085, 'samples': 925312, 'steps': 1807, 'loss/train': 2.949368715286255} -09/20/2021 20:45:03 - INFO - __main__ - Step 28917: {'lr': 0.00019977278200657085, 'samples': 925344, 'steps': 1807, 'loss/train': 2.84165358543396} -09/20/2021 20:45:04 - INFO - __main__ - Step 28918: {'lr': 0.00019977278200657085, 'samples': 925376, 'steps': 1807, 'loss/train': 2.533485174179077} -09/20/2021 20:45:04 - INFO - __main__ - Step 28919: {'lr': 0.00019977278200657085, 'samples': 925408, 'steps': 1807, 'loss/train': 2.5230753421783447} -09/20/2021 20:45:05 - INFO - __main__ - Step 28920: {'lr': 0.00019977278200657085, 'samples': 925440, 'steps': 1807, 'loss/train': 2.6855030059814453} -09/20/2021 20:45:06 - INFO - __main__ - Step 28921: {'lr': 0.00019977278200657085, 'samples': 925472, 'steps': 1807, 'loss/train': 2.341360330581665} -09/20/2021 20:45:07 - INFO - __main__ - Step 28922: {'lr': 0.00019977278200657085, 'samples': 925504, 'steps': 1807, 'loss/train': 3.2741451263427734} -09/20/2021 20:45:07 - INFO - __main__ - Step 28923: {'lr': 0.00019977278200657085, 'samples': 925536, 'steps': 1807, 'loss/train': 2.687069892883301} -09/20/2021 20:45:08 - INFO - __main__ - Step 28924: {'lr': 0.00019977278200657085, 'samples': 925568, 'steps': 1807, 'loss/train': 1.8978136777877808} -09/20/2021 20:45:09 - INFO - __main__ - Step 28925: {'lr': 0.00019977278200657085, 'samples': 925600, 'steps': 1807, 'loss/train': 2.85709285736084} -09/20/2021 20:45:10 - INFO - __main__ - Step 28926: {'lr': 0.00019977278200657085, 'samples': 925632, 'steps': 1807, 'loss/train': 3.010200023651123} -09/20/2021 20:45:10 - INFO - __main__ - Step 28927: {'lr': 0.00019977278200657085, 'samples': 925664, 'steps': 1807, 'loss/train': 3.4269914627075195} -09/20/2021 20:45:11 - INFO - __main__ - Step 28928: {'lr': 0.00019977278200657085, 'samples': 925696, 'steps': 1807, 'loss/train': 2.8249471187591553} -09/20/2021 20:45:12 - INFO - __main__ - Step 28929: {'lr': 0.0001997723520364926, 'samples': 925728, 'steps': 1808, 'loss/train': 1.936702013015747} -09/20/2021 20:45:13 - INFO - __main__ - Step 28930: {'lr': 0.0001997723520364926, 'samples': 925760, 'steps': 1808, 'loss/train': 1.7663089036941528} -09/20/2021 20:45:14 - INFO - __main__ - Step 28931: {'lr': 0.0001997723520364926, 'samples': 925792, 'steps': 1808, 'loss/train': 2.0767619609832764} -09/20/2021 20:45:14 - INFO - __main__ - Step 28932: {'lr': 0.0001997723520364926, 'samples': 925824, 'steps': 1808, 'loss/train': 2.7674362659454346} -09/20/2021 20:45:15 - INFO - __main__ - Step 28933: {'lr': 0.0001997723520364926, 'samples': 925856, 'steps': 1808, 'loss/train': 2.3812978267669678} -09/20/2021 20:45:16 - INFO - __main__ - Step 28934: {'lr': 0.0001997723520364926, 'samples': 925888, 'steps': 1808, 'loss/train': 2.5419094562530518} -09/20/2021 20:45:17 - INFO - __main__ - Step 28935: {'lr': 0.0001997723520364926, 'samples': 925920, 'steps': 1808, 'loss/train': 2.3671112060546875} -09/20/2021 20:45:17 - INFO - __main__ - Step 28936: {'lr': 0.0001997723520364926, 'samples': 925952, 'steps': 1808, 'loss/train': 2.4930784702301025} -09/20/2021 20:45:18 - INFO - __main__ - Step 28937: {'lr': 0.0001997723520364926, 'samples': 925984, 'steps': 1808, 'loss/train': 2.5779895782470703} -09/20/2021 20:45:19 - INFO - __main__ - Step 28938: {'lr': 0.0001997723520364926, 'samples': 926016, 'steps': 1808, 'loss/train': 2.496087074279785} -09/20/2021 20:45:20 - INFO - __main__ - Step 28939: {'lr': 0.0001997723520364926, 'samples': 926048, 'steps': 1808, 'loss/train': 2.8479747772216797} -09/20/2021 20:45:21 - INFO - __main__ - Step 28940: {'lr': 0.0001997723520364926, 'samples': 926080, 'steps': 1808, 'loss/train': 4.034645080566406} -09/20/2021 20:45:22 - INFO - __main__ - Step 28941: {'lr': 0.0001997723520364926, 'samples': 926112, 'steps': 1808, 'loss/train': 3.1167914867401123} -09/20/2021 20:45:22 - INFO - __main__ - Step 28942: {'lr': 0.0001997723520364926, 'samples': 926144, 'steps': 1808, 'loss/train': 2.5508830547332764} -09/20/2021 20:45:23 - INFO - __main__ - Step 28943: {'lr': 0.0001997723520364926, 'samples': 926176, 'steps': 1808, 'loss/train': 2.385521411895752} -09/20/2021 20:45:24 - INFO - __main__ - Step 28944: {'lr': 0.0001997723520364926, 'samples': 926208, 'steps': 1808, 'loss/train': 2.1547129154205322} -09/20/2021 20:45:25 - INFO - __main__ - Step 28945: {'lr': 0.000199771921660441, 'samples': 926240, 'steps': 1809, 'loss/train': 3.508937358856201} -09/20/2021 20:45:25 - INFO - __main__ - Step 28946: {'lr': 0.000199771921660441, 'samples': 926272, 'steps': 1809, 'loss/train': 1.9101113080978394} -09/20/2021 20:45:26 - INFO - __main__ - Step 28947: {'lr': 0.000199771921660441, 'samples': 926304, 'steps': 1809, 'loss/train': 2.3543643951416016} -09/20/2021 20:45:27 - INFO - __main__ - Step 28948: {'lr': 0.000199771921660441, 'samples': 926336, 'steps': 1809, 'loss/train': 3.214458703994751} -09/20/2021 20:45:28 - INFO - __main__ - Step 28949: {'lr': 0.000199771921660441, 'samples': 926368, 'steps': 1809, 'loss/train': 2.6260244846343994} -09/20/2021 20:45:28 - INFO - __main__ - Step 28950: {'lr': 0.000199771921660441, 'samples': 926400, 'steps': 1809, 'loss/train': 2.426175355911255} -09/20/2021 20:45:29 - INFO - __main__ - Step 28951: {'lr': 0.000199771921660441, 'samples': 926432, 'steps': 1809, 'loss/train': 2.704514741897583} -09/20/2021 20:45:30 - INFO - __main__ - Step 28952: {'lr': 0.000199771921660441, 'samples': 926464, 'steps': 1809, 'loss/train': 2.2716095447540283} -09/20/2021 20:45:31 - INFO - __main__ - Step 28953: {'lr': 0.000199771921660441, 'samples': 926496, 'steps': 1809, 'loss/train': 2.5073699951171875} -09/20/2021 20:45:31 - INFO - __main__ - Step 28954: {'lr': 0.000199771921660441, 'samples': 926528, 'steps': 1809, 'loss/train': 2.5463194847106934} -09/20/2021 20:45:32 - INFO - __main__ - Step 28955: {'lr': 0.000199771921660441, 'samples': 926560, 'steps': 1809, 'loss/train': 2.175711154937744} -09/20/2021 20:45:33 - INFO - __main__ - Step 28956: {'lr': 0.000199771921660441, 'samples': 926592, 'steps': 1809, 'loss/train': 2.5634803771972656} -09/20/2021 20:45:34 - INFO - __main__ - Step 28957: {'lr': 0.000199771921660441, 'samples': 926624, 'steps': 1809, 'loss/train': 1.1833447217941284} -09/20/2021 20:45:34 - INFO - __main__ - Step 28958: {'lr': 0.000199771921660441, 'samples': 926656, 'steps': 1809, 'loss/train': 2.5834689140319824} -09/20/2021 20:45:35 - INFO - __main__ - Step 28959: {'lr': 0.000199771921660441, 'samples': 926688, 'steps': 1809, 'loss/train': 3.946171283721924} -09/20/2021 20:45:36 - INFO - __main__ - Step 28960: {'lr': 0.000199771921660441, 'samples': 926720, 'steps': 1809, 'loss/train': 1.1554198265075684} -09/20/2021 20:45:37 - INFO - __main__ - Step 28961: {'lr': 0.0001997714908784179, 'samples': 926752, 'steps': 1810, 'loss/train': 2.2406859397888184} -09/20/2021 20:45:38 - INFO - __main__ - Step 28962: {'lr': 0.0001997714908784179, 'samples': 926784, 'steps': 1810, 'loss/train': 2.732429027557373} -09/20/2021 20:45:38 - INFO - __main__ - Step 28963: {'lr': 0.0001997714908784179, 'samples': 926816, 'steps': 1810, 'loss/train': 2.5695414543151855} -09/20/2021 20:45:39 - INFO - __main__ - Step 28964: {'lr': 0.0001997714908784179, 'samples': 926848, 'steps': 1810, 'loss/train': 1.597022294998169} -09/20/2021 20:45:40 - INFO - __main__ - Step 28965: {'lr': 0.0001997714908784179, 'samples': 926880, 'steps': 1810, 'loss/train': 3.5072824954986572} -09/20/2021 20:45:41 - INFO - __main__ - Step 28966: {'lr': 0.0001997714908784179, 'samples': 926912, 'steps': 1810, 'loss/train': 2.1590895652770996} -09/20/2021 20:45:41 - INFO - __main__ - Step 28967: {'lr': 0.0001997714908784179, 'samples': 926944, 'steps': 1810, 'loss/train': 3.0859432220458984} -09/20/2021 20:45:42 - INFO - __main__ - Step 28968: {'lr': 0.0001997714908784179, 'samples': 926976, 'steps': 1810, 'loss/train': 2.2631723880767822} -09/20/2021 20:45:43 - INFO - __main__ - Step 28969: {'lr': 0.0001997714908784179, 'samples': 927008, 'steps': 1810, 'loss/train': 3.152946949005127} -09/20/2021 20:45:44 - INFO - __main__ - Step 28970: {'lr': 0.0001997714908784179, 'samples': 927040, 'steps': 1810, 'loss/train': 3.3620502948760986} -09/20/2021 20:45:45 - INFO - __main__ - Step 28971: {'lr': 0.0001997714908784179, 'samples': 927072, 'steps': 1810, 'loss/train': 2.395002841949463} -09/20/2021 20:45:46 - INFO - __main__ - Step 28972: {'lr': 0.0001997714908784179, 'samples': 927104, 'steps': 1810, 'loss/train': 2.2456209659576416} -09/20/2021 20:45:47 - INFO - __main__ - Step 28973: {'lr': 0.0001997714908784179, 'samples': 927136, 'steps': 1810, 'loss/train': 2.6043283939361572} -09/20/2021 20:45:48 - INFO - __main__ - Step 28974: {'lr': 0.0001997714908784179, 'samples': 927168, 'steps': 1810, 'loss/train': 2.256119728088379} -09/20/2021 20:45:48 - INFO - __main__ - Step 28975: {'lr': 0.0001997714908784179, 'samples': 927200, 'steps': 1810, 'loss/train': 4.775822639465332} -09/20/2021 20:45:49 - INFO - __main__ - Step 28976: {'lr': 0.0001997714908784179, 'samples': 927232, 'steps': 1810, 'loss/train': 4.683933734893799} -09/20/2021 20:45:50 - INFO - __main__ - Step 28977: {'lr': 0.00019977105969042492, 'samples': 927264, 'steps': 1811, 'loss/train': 2.543773889541626} -09/20/2021 20:45:51 - INFO - __main__ - Step 28978: {'lr': 0.00019977105969042492, 'samples': 927296, 'steps': 1811, 'loss/train': 2.2436885833740234} -09/20/2021 20:45:52 - INFO - __main__ - Step 28979: {'lr': 0.00019977105969042492, 'samples': 927328, 'steps': 1811, 'loss/train': 0.9130746722221375} -09/20/2021 20:45:52 - INFO - __main__ - Step 28980: {'lr': 0.00019977105969042492, 'samples': 927360, 'steps': 1811, 'loss/train': 2.239738941192627} -09/20/2021 20:45:53 - INFO - __main__ - Step 28981: {'lr': 0.00019977105969042492, 'samples': 927392, 'steps': 1811, 'loss/train': 3.0084095001220703} -09/20/2021 20:45:54 - INFO - __main__ - Step 28982: {'lr': 0.00019977105969042492, 'samples': 927424, 'steps': 1811, 'loss/train': 2.3778226375579834} -09/20/2021 20:45:55 - INFO - __main__ - Step 28983: {'lr': 0.00019977105969042492, 'samples': 927456, 'steps': 1811, 'loss/train': 3.1245486736297607} -09/20/2021 20:45:55 - INFO - __main__ - Step 28984: {'lr': 0.00019977105969042492, 'samples': 927488, 'steps': 1811, 'loss/train': 3.285618782043457} -09/20/2021 20:45:56 - INFO - __main__ - Step 28985: {'lr': 0.00019977105969042492, 'samples': 927520, 'steps': 1811, 'loss/train': 3.209825277328491} -09/20/2021 20:45:57 - INFO - __main__ - Step 28986: {'lr': 0.00019977105969042492, 'samples': 927552, 'steps': 1811, 'loss/train': 2.3016254901885986} -09/20/2021 20:45:58 - INFO - __main__ - Step 28987: {'lr': 0.00019977105969042492, 'samples': 927584, 'steps': 1811, 'loss/train': 2.9163217544555664} -09/20/2021 20:45:58 - INFO - __main__ - Step 28988: {'lr': 0.00019977105969042492, 'samples': 927616, 'steps': 1811, 'loss/train': 3.0549323558807373} -09/20/2021 20:45:59 - INFO - __main__ - Step 28989: {'lr': 0.00019977105969042492, 'samples': 927648, 'steps': 1811, 'loss/train': 2.836576461791992} -09/20/2021 20:46:00 - INFO - __main__ - Step 28990: {'lr': 0.00019977105969042492, 'samples': 927680, 'steps': 1811, 'loss/train': 2.788257122039795} -09/20/2021 20:46:01 - INFO - __main__ - Step 28991: {'lr': 0.00019977105969042492, 'samples': 927712, 'steps': 1811, 'loss/train': 3.186304807662964} -09/20/2021 20:46:01 - INFO - __main__ - Step 28992: {'lr': 0.00019977105969042492, 'samples': 927744, 'steps': 1811, 'loss/train': 2.1146693229675293} -09/20/2021 20:46:02 - INFO - __main__ - Step 28993: {'lr': 0.0001997706280964639, 'samples': 927776, 'steps': 1812, 'loss/train': 0.6583606600761414} -09/20/2021 20:46:03 - INFO - __main__ - Step 28994: {'lr': 0.0001997706280964639, 'samples': 927808, 'steps': 1812, 'loss/train': 1.8020302057266235} -09/20/2021 20:46:04 - INFO - __main__ - Step 28995: {'lr': 0.0001997706280964639, 'samples': 927840, 'steps': 1812, 'loss/train': 3.1007044315338135} -09/20/2021 20:46:04 - INFO - __main__ - Step 28996: {'lr': 0.0001997706280964639, 'samples': 927872, 'steps': 1812, 'loss/train': 1.7072628736495972} -09/20/2021 20:46:05 - INFO - __main__ - Step 28997: {'lr': 0.0001997706280964639, 'samples': 927904, 'steps': 1812, 'loss/train': 2.726001262664795} -09/20/2021 20:46:06 - INFO - __main__ - Step 28998: {'lr': 0.0001997706280964639, 'samples': 927936, 'steps': 1812, 'loss/train': 3.2011160850524902} -09/20/2021 20:46:07 - INFO - __main__ - Step 28999: {'lr': 0.0001997706280964639, 'samples': 927968, 'steps': 1812, 'loss/train': 1.995944619178772} -09/20/2021 20:46:07 - INFO - __main__ - Step 29000: {'lr': 0.0001997706280964639, 'samples': 928000, 'steps': 1812, 'loss/train': 3.691669464111328} -09/20/2021 20:46:08 - INFO - __main__ - Step 29001: {'lr': 0.0001997706280964639, 'samples': 928032, 'steps': 1812, 'loss/train': 0.6245760321617126} -09/20/2021 20:46:10 - INFO - __main__ - Step 29002: {'lr': 0.0001997706280964639, 'samples': 928064, 'steps': 1812, 'loss/train': 1.7756699323654175} -09/20/2021 20:46:10 - INFO - __main__ - Step 29003: {'lr': 0.0001997706280964639, 'samples': 928096, 'steps': 1812, 'loss/train': 3.1551384925842285} -09/20/2021 20:46:11 - INFO - __main__ - Step 29004: {'lr': 0.0001997706280964639, 'samples': 928128, 'steps': 1812, 'loss/train': 3.153301477432251} -09/20/2021 20:46:12 - INFO - __main__ - Step 29005: {'lr': 0.0001997706280964639, 'samples': 928160, 'steps': 1812, 'loss/train': 2.6709649562835693} -09/20/2021 20:46:13 - INFO - __main__ - Step 29006: {'lr': 0.0001997706280964639, 'samples': 928192, 'steps': 1812, 'loss/train': 3.249016284942627} -09/20/2021 20:46:13 - INFO - __main__ - Step 29007: {'lr': 0.0001997706280964639, 'samples': 928224, 'steps': 1812, 'loss/train': 1.0593972206115723} -09/20/2021 20:46:14 - INFO - __main__ - Step 29008: {'lr': 0.0001997706280964639, 'samples': 928256, 'steps': 1812, 'loss/train': 1.1823619604110718} -09/20/2021 20:46:15 - INFO - __main__ - Step 29009: {'lr': 0.00019977019609653663, 'samples': 928288, 'steps': 1813, 'loss/train': 3.215909481048584} -09/20/2021 20:46:16 - INFO - __main__ - Step 29010: {'lr': 0.00019977019609653663, 'samples': 928320, 'steps': 1813, 'loss/train': 3.1992077827453613} -09/20/2021 20:46:17 - INFO - __main__ - Step 29011: {'lr': 0.00019977019609653663, 'samples': 928352, 'steps': 1813, 'loss/train': 1.1950891017913818} -09/20/2021 20:46:17 - INFO - __main__ - Step 29012: {'lr': 0.00019977019609653663, 'samples': 928384, 'steps': 1813, 'loss/train': 2.203911304473877} -09/20/2021 20:46:18 - INFO - __main__ - Step 29013: {'lr': 0.00019977019609653663, 'samples': 928416, 'steps': 1813, 'loss/train': 2.7100157737731934} -09/20/2021 20:46:19 - INFO - __main__ - Step 29014: {'lr': 0.00019977019609653663, 'samples': 928448, 'steps': 1813, 'loss/train': 2.537686824798584} -09/20/2021 20:46:20 - INFO - __main__ - Step 29015: {'lr': 0.00019977019609653663, 'samples': 928480, 'steps': 1813, 'loss/train': 1.3602948188781738} -09/20/2021 20:46:20 - INFO - __main__ - Step 29016: {'lr': 0.00019977019609653663, 'samples': 928512, 'steps': 1813, 'loss/train': 2.760834217071533} -09/20/2021 20:46:21 - INFO - __main__ - Step 29017: {'lr': 0.00019977019609653663, 'samples': 928544, 'steps': 1813, 'loss/train': 2.370290994644165} -09/20/2021 20:46:22 - INFO - __main__ - Step 29018: {'lr': 0.00019977019609653663, 'samples': 928576, 'steps': 1813, 'loss/train': 2.9757120609283447} -09/20/2021 20:46:23 - INFO - __main__ - Step 29019: {'lr': 0.00019977019609653663, 'samples': 928608, 'steps': 1813, 'loss/train': 3.0856831073760986} -09/20/2021 20:46:23 - INFO - __main__ - Step 29020: {'lr': 0.00019977019609653663, 'samples': 928640, 'steps': 1813, 'loss/train': 3.5127639770507812} -09/20/2021 20:46:24 - INFO - __main__ - Step 29021: {'lr': 0.00019977019609653663, 'samples': 928672, 'steps': 1813, 'loss/train': 4.068304538726807} -09/20/2021 20:46:25 - INFO - __main__ - Step 29022: {'lr': 0.00019977019609653663, 'samples': 928704, 'steps': 1813, 'loss/train': 3.552502155303955} -09/20/2021 20:46:26 - INFO - __main__ - Step 29023: {'lr': 0.00019977019609653663, 'samples': 928736, 'steps': 1813, 'loss/train': 2.8375322818756104} -09/20/2021 20:46:26 - INFO - __main__ - Step 29024: {'lr': 0.00019977019609653663, 'samples': 928768, 'steps': 1813, 'loss/train': 2.244553565979004} -09/20/2021 20:46:27 - INFO - __main__ - Step 29025: {'lr': 0.00019976976369064477, 'samples': 928800, 'steps': 1814, 'loss/train': 3.3671252727508545} -09/20/2021 20:46:28 - INFO - __main__ - Step 29026: {'lr': 0.00019976976369064477, 'samples': 928832, 'steps': 1814, 'loss/train': 1.6760995388031006} -09/20/2021 20:46:29 - INFO - __main__ - Step 29027: {'lr': 0.00019976976369064477, 'samples': 928864, 'steps': 1814, 'loss/train': 2.1153995990753174} -09/20/2021 20:46:29 - INFO - __main__ - Step 29028: {'lr': 0.00019976976369064477, 'samples': 928896, 'steps': 1814, 'loss/train': 2.0908665657043457} -09/20/2021 20:46:30 - INFO - __main__ - Step 29029: {'lr': 0.00019976976369064477, 'samples': 928928, 'steps': 1814, 'loss/train': 1.9244126081466675} -09/20/2021 20:46:31 - INFO - __main__ - Step 29030: {'lr': 0.00019976976369064477, 'samples': 928960, 'steps': 1814, 'loss/train': 2.271937608718872} -09/20/2021 20:46:32 - INFO - __main__ - Step 29031: {'lr': 0.00019976976369064477, 'samples': 928992, 'steps': 1814, 'loss/train': 2.6519572734832764} -09/20/2021 20:46:32 - INFO - __main__ - Step 29032: {'lr': 0.00019976976369064477, 'samples': 929024, 'steps': 1814, 'loss/train': 2.7001051902770996} -09/20/2021 20:46:33 - INFO - __main__ - Step 29033: {'lr': 0.00019976976369064477, 'samples': 929056, 'steps': 1814, 'loss/train': 2.1526966094970703} -09/20/2021 20:46:35 - INFO - __main__ - Step 29034: {'lr': 0.00019976976369064477, 'samples': 929088, 'steps': 1814, 'loss/train': 2.0385286808013916} -09/20/2021 20:46:35 - INFO - __main__ - Step 29035: {'lr': 0.00019976976369064477, 'samples': 929120, 'steps': 1814, 'loss/train': 2.610346555709839} -09/20/2021 20:46:36 - INFO - __main__ - Step 29036: {'lr': 0.00019976976369064477, 'samples': 929152, 'steps': 1814, 'loss/train': 2.452651262283325} -09/20/2021 20:46:37 - INFO - __main__ - Step 29037: {'lr': 0.00019976976369064477, 'samples': 929184, 'steps': 1814, 'loss/train': 2.562166452407837} -09/20/2021 20:46:38 - INFO - __main__ - Step 29038: {'lr': 0.00019976976369064477, 'samples': 929216, 'steps': 1814, 'loss/train': 2.75524640083313} -09/20/2021 20:46:38 - INFO - __main__ - Step 29039: {'lr': 0.00019976976369064477, 'samples': 929248, 'steps': 1814, 'loss/train': 2.3087055683135986} -09/20/2021 20:46:39 - INFO - __main__ - Step 29040: {'lr': 0.00019976976369064477, 'samples': 929280, 'steps': 1814, 'loss/train': 2.7732162475585938} -09/20/2021 20:46:40 - INFO - __main__ - Step 29041: {'lr': 0.00019976933087879014, 'samples': 929312, 'steps': 1815, 'loss/train': 3.240908622741699} -09/20/2021 20:46:41 - INFO - __main__ - Step 29042: {'lr': 0.00019976933087879014, 'samples': 929344, 'steps': 1815, 'loss/train': 2.1263656616210938} -09/20/2021 20:46:41 - INFO - __main__ - Step 29043: {'lr': 0.00019976933087879014, 'samples': 929376, 'steps': 1815, 'loss/train': 2.2986385822296143} -09/20/2021 20:46:42 - INFO - __main__ - Step 29044: {'lr': 0.00019976933087879014, 'samples': 929408, 'steps': 1815, 'loss/train': 1.7854335308074951} -09/20/2021 20:46:43 - INFO - __main__ - Step 29045: {'lr': 0.00019976933087879014, 'samples': 929440, 'steps': 1815, 'loss/train': 2.8887381553649902} -09/20/2021 20:46:44 - INFO - __main__ - Step 29046: {'lr': 0.00019976933087879014, 'samples': 929472, 'steps': 1815, 'loss/train': 2.2998313903808594} -09/20/2021 20:46:44 - INFO - __main__ - Step 29047: {'lr': 0.00019976933087879014, 'samples': 929504, 'steps': 1815, 'loss/train': 2.6489901542663574} -09/20/2021 20:46:45 - INFO - __main__ - Step 29048: {'lr': 0.00019976933087879014, 'samples': 929536, 'steps': 1815, 'loss/train': 2.9669923782348633} -09/20/2021 20:46:46 - INFO - __main__ - Step 29049: {'lr': 0.00019976933087879014, 'samples': 929568, 'steps': 1815, 'loss/train': 1.7018922567367554} -09/20/2021 20:46:47 - INFO - __main__ - Step 29050: {'lr': 0.00019976933087879014, 'samples': 929600, 'steps': 1815, 'loss/train': 2.665050983428955} -09/20/2021 20:46:47 - INFO - __main__ - Step 29051: {'lr': 0.00019976933087879014, 'samples': 929632, 'steps': 1815, 'loss/train': 2.852802038192749} -09/20/2021 20:46:48 - INFO - __main__ - Step 29052: {'lr': 0.00019976933087879014, 'samples': 929664, 'steps': 1815, 'loss/train': 2.5931904315948486} -09/20/2021 20:46:49 - INFO - __main__ - Step 29053: {'lr': 0.00019976933087879014, 'samples': 929696, 'steps': 1815, 'loss/train': 2.2509360313415527} -09/20/2021 20:46:50 - INFO - __main__ - Step 29054: {'lr': 0.00019976933087879014, 'samples': 929728, 'steps': 1815, 'loss/train': 2.913341760635376} -09/20/2021 20:46:50 - INFO - __main__ - Step 29055: {'lr': 0.00019976933087879014, 'samples': 929760, 'steps': 1815, 'loss/train': 2.5190658569335938} -09/20/2021 20:46:51 - INFO - __main__ - Step 29056: {'lr': 0.00019976933087879014, 'samples': 929792, 'steps': 1815, 'loss/train': 2.3812267780303955} -09/20/2021 20:46:52 - INFO - __main__ - Step 29057: {'lr': 0.0001997688976609745, 'samples': 929824, 'steps': 1816, 'loss/train': 2.699648380279541} -09/20/2021 20:46:53 - INFO - __main__ - Step 29058: {'lr': 0.0001997688976609745, 'samples': 929856, 'steps': 1816, 'loss/train': 3.0305378437042236} -09/20/2021 20:46:54 - INFO - __main__ - Step 29059: {'lr': 0.0001997688976609745, 'samples': 929888, 'steps': 1816, 'loss/train': 2.7991843223571777} -09/20/2021 20:46:54 - INFO - __main__ - Step 29060: {'lr': 0.0001997688976609745, 'samples': 929920, 'steps': 1816, 'loss/train': 2.910398244857788} -09/20/2021 20:46:55 - INFO - __main__ - Step 29061: {'lr': 0.0001997688976609745, 'samples': 929952, 'steps': 1816, 'loss/train': 1.294724941253662} -09/20/2021 20:46:56 - INFO - __main__ - Step 29062: {'lr': 0.0001997688976609745, 'samples': 929984, 'steps': 1816, 'loss/train': 2.2270915508270264} -09/20/2021 20:46:57 - INFO - __main__ - Step 29063: {'lr': 0.0001997688976609745, 'samples': 930016, 'steps': 1816, 'loss/train': 2.7425525188446045} -09/20/2021 20:46:57 - INFO - __main__ - Step 29064: {'lr': 0.0001997688976609745, 'samples': 930048, 'steps': 1816, 'loss/train': 3.1663200855255127} -09/20/2021 20:46:59 - INFO - __main__ - Step 29065: {'lr': 0.0001997688976609745, 'samples': 930080, 'steps': 1816, 'loss/train': 3.1520144939422607} -09/20/2021 20:46:59 - INFO - __main__ - Step 29066: {'lr': 0.0001997688976609745, 'samples': 930112, 'steps': 1816, 'loss/train': 3.0802700519561768} -09/20/2021 20:47:00 - INFO - __main__ - Step 29067: {'lr': 0.0001997688976609745, 'samples': 930144, 'steps': 1816, 'loss/train': 2.724024772644043} -09/20/2021 20:47:01 - INFO - __main__ - Step 29068: {'lr': 0.0001997688976609745, 'samples': 930176, 'steps': 1816, 'loss/train': 2.7890427112579346} -09/20/2021 20:47:02 - INFO - __main__ - Step 29069: {'lr': 0.0001997688976609745, 'samples': 930208, 'steps': 1816, 'loss/train': 2.7366433143615723} -09/20/2021 20:47:02 - INFO - __main__ - Step 29070: {'lr': 0.0001997688976609745, 'samples': 930240, 'steps': 1816, 'loss/train': 2.6875076293945312} -09/20/2021 20:47:03 - INFO - __main__ - Step 29071: {'lr': 0.0001997688976609745, 'samples': 930272, 'steps': 1816, 'loss/train': 2.2117464542388916} -09/20/2021 20:47:04 - INFO - __main__ - Step 29072: {'lr': 0.0001997688976609745, 'samples': 930304, 'steps': 1816, 'loss/train': 3.0160677433013916} -09/20/2021 20:47:05 - INFO - __main__ - Step 29073: {'lr': 0.0001997684640371996, 'samples': 930336, 'steps': 1817, 'loss/train': 2.9745380878448486} -09/20/2021 20:47:05 - INFO - __main__ - Step 29074: {'lr': 0.0001997684640371996, 'samples': 930368, 'steps': 1817, 'loss/train': 2.963496685028076} -09/20/2021 20:47:06 - INFO - __main__ - Step 29075: {'lr': 0.0001997684640371996, 'samples': 930400, 'steps': 1817, 'loss/train': 3.970613479614258} -09/20/2021 20:47:07 - INFO - __main__ - Step 29076: {'lr': 0.0001997684640371996, 'samples': 930432, 'steps': 1817, 'loss/train': 1.9498655796051025} -09/20/2021 20:47:08 - INFO - __main__ - Step 29077: {'lr': 0.0001997684640371996, 'samples': 930464, 'steps': 1817, 'loss/train': 1.9952248334884644} -09/20/2021 20:47:08 - INFO - __main__ - Step 29078: {'lr': 0.0001997684640371996, 'samples': 930496, 'steps': 1817, 'loss/train': 3.2687017917633057} -09/20/2021 20:47:09 - INFO - __main__ - Step 29079: {'lr': 0.0001997684640371996, 'samples': 930528, 'steps': 1817, 'loss/train': 2.240046262741089} -09/20/2021 20:47:10 - INFO - __main__ - Step 29080: {'lr': 0.0001997684640371996, 'samples': 930560, 'steps': 1817, 'loss/train': 2.9513230323791504} -09/20/2021 20:47:11 - INFO - __main__ - Step 29081: {'lr': 0.0001997684640371996, 'samples': 930592, 'steps': 1817, 'loss/train': 2.7809834480285645} -09/20/2021 20:47:11 - INFO - __main__ - Step 29082: {'lr': 0.0001997684640371996, 'samples': 930624, 'steps': 1817, 'loss/train': 3.2131192684173584} -09/20/2021 20:47:12 - INFO - __main__ - Step 29083: {'lr': 0.0001997684640371996, 'samples': 930656, 'steps': 1817, 'loss/train': 3.113373041152954} -09/20/2021 20:47:13 - INFO - __main__ - Step 29084: {'lr': 0.0001997684640371996, 'samples': 930688, 'steps': 1817, 'loss/train': 2.696681499481201} -09/20/2021 20:47:14 - INFO - __main__ - Step 29085: {'lr': 0.0001997684640371996, 'samples': 930720, 'steps': 1817, 'loss/train': 0.5921892523765564} -09/20/2021 20:47:14 - INFO - __main__ - Step 29086: {'lr': 0.0001997684640371996, 'samples': 930752, 'steps': 1817, 'loss/train': 1.8336223363876343} -09/20/2021 20:47:15 - INFO - __main__ - Step 29087: {'lr': 0.0001997684640371996, 'samples': 930784, 'steps': 1817, 'loss/train': 2.788241386413574} -09/20/2021 20:47:16 - INFO - __main__ - Step 29088: {'lr': 0.0001997684640371996, 'samples': 930816, 'steps': 1817, 'loss/train': 1.7143975496292114} -09/20/2021 20:47:17 - INFO - __main__ - Step 29089: {'lr': 0.00019976803000746723, 'samples': 930848, 'steps': 1818, 'loss/train': 1.9487483501434326} -09/20/2021 20:47:18 - INFO - __main__ - Step 29090: {'lr': 0.00019976803000746723, 'samples': 930880, 'steps': 1818, 'loss/train': 2.2548608779907227} -09/20/2021 20:47:18 - INFO - __main__ - Step 29091: {'lr': 0.00019976803000746723, 'samples': 930912, 'steps': 1818, 'loss/train': 3.056211471557617} -09/20/2021 20:47:19 - INFO - __main__ - Step 29092: {'lr': 0.00019976803000746723, 'samples': 930944, 'steps': 1818, 'loss/train': 1.5183686017990112} -09/20/2021 20:47:20 - INFO - __main__ - Step 29093: {'lr': 0.00019976803000746723, 'samples': 930976, 'steps': 1818, 'loss/train': 2.2357475757598877} -09/20/2021 20:47:21 - INFO - __main__ - Step 29094: {'lr': 0.00019976803000746723, 'samples': 931008, 'steps': 1818, 'loss/train': 2.928621768951416} -09/20/2021 20:47:21 - INFO - __main__ - Step 29095: {'lr': 0.00019976803000746723, 'samples': 931040, 'steps': 1818, 'loss/train': 2.3964412212371826} -09/20/2021 20:47:23 - INFO - __main__ - Step 29096: {'lr': 0.00019976803000746723, 'samples': 931072, 'steps': 1818, 'loss/train': 3.722714424133301} -09/20/2021 20:47:23 - INFO - __main__ - Step 29097: {'lr': 0.00019976803000746723, 'samples': 931104, 'steps': 1818, 'loss/train': 2.979370594024658} -09/20/2021 20:47:24 - INFO - __main__ - Step 29098: {'lr': 0.00019976803000746723, 'samples': 931136, 'steps': 1818, 'loss/train': 2.6160452365875244} -09/20/2021 20:47:25 - INFO - __main__ - Step 29099: {'lr': 0.00019976803000746723, 'samples': 931168, 'steps': 1818, 'loss/train': 2.469245433807373} -09/20/2021 20:47:26 - INFO - __main__ - Step 29100: {'lr': 0.00019976803000746723, 'samples': 931200, 'steps': 1818, 'loss/train': 2.903470516204834} -09/20/2021 20:47:26 - INFO - __main__ - Step 29101: {'lr': 0.00019976803000746723, 'samples': 931232, 'steps': 1818, 'loss/train': 2.4233622550964355} -09/20/2021 20:47:27 - INFO - __main__ - Step 29102: {'lr': 0.00019976803000746723, 'samples': 931264, 'steps': 1818, 'loss/train': 2.920682430267334} -09/20/2021 20:47:28 - INFO - __main__ - Step 29103: {'lr': 0.00019976803000746723, 'samples': 931296, 'steps': 1818, 'loss/train': 2.4184179306030273} -09/20/2021 20:47:29 - INFO - __main__ - Step 29104: {'lr': 0.00019976803000746723, 'samples': 931328, 'steps': 1818, 'loss/train': 0.385136216878891} -09/20/2021 20:47:30 - INFO - __main__ - Step 29105: {'lr': 0.0001997675955717791, 'samples': 931360, 'steps': 1819, 'loss/train': 0.557336151599884} -09/20/2021 20:47:30 - INFO - __main__ - Step 29106: {'lr': 0.0001997675955717791, 'samples': 931392, 'steps': 1819, 'loss/train': 1.7579309940338135} -09/20/2021 20:47:31 - INFO - __main__ - Step 29107: {'lr': 0.0001997675955717791, 'samples': 931424, 'steps': 1819, 'loss/train': 2.026275873184204} -09/20/2021 20:47:32 - INFO - __main__ - Step 29108: {'lr': 0.0001997675955717791, 'samples': 931456, 'steps': 1819, 'loss/train': 2.074570655822754} -09/20/2021 20:47:33 - INFO - __main__ - Step 29109: {'lr': 0.0001997675955717791, 'samples': 931488, 'steps': 1819, 'loss/train': 1.8349791765213013} -09/20/2021 20:47:33 - INFO - __main__ - Step 29110: {'lr': 0.0001997675955717791, 'samples': 931520, 'steps': 1819, 'loss/train': 1.4329490661621094} -09/20/2021 20:47:34 - INFO - __main__ - Step 29111: {'lr': 0.0001997675955717791, 'samples': 931552, 'steps': 1819, 'loss/train': 3.017859697341919} -09/20/2021 20:47:35 - INFO - __main__ - Step 29112: {'lr': 0.0001997675955717791, 'samples': 931584, 'steps': 1819, 'loss/train': 2.809134006500244} -09/20/2021 20:47:36 - INFO - __main__ - Step 29113: {'lr': 0.0001997675955717791, 'samples': 931616, 'steps': 1819, 'loss/train': 2.172612428665161} -09/20/2021 20:47:36 - INFO - __main__ - Step 29114: {'lr': 0.0001997675955717791, 'samples': 931648, 'steps': 1819, 'loss/train': 2.623884439468384} -09/20/2021 20:47:37 - INFO - __main__ - Step 29115: {'lr': 0.0001997675955717791, 'samples': 931680, 'steps': 1819, 'loss/train': 3.6741037368774414} -09/20/2021 20:47:38 - INFO - __main__ - Step 29116: {'lr': 0.0001997675955717791, 'samples': 931712, 'steps': 1819, 'loss/train': 1.948070764541626} -09/20/2021 20:47:39 - INFO - __main__ - Step 29117: {'lr': 0.0001997675955717791, 'samples': 931744, 'steps': 1819, 'loss/train': 2.889816999435425} -09/20/2021 20:47:39 - INFO - __main__ - Step 29118: {'lr': 0.0001997675955717791, 'samples': 931776, 'steps': 1819, 'loss/train': 2.7141776084899902} -09/20/2021 20:47:40 - INFO - __main__ - Step 29119: {'lr': 0.0001997675955717791, 'samples': 931808, 'steps': 1819, 'loss/train': 2.478421211242676} -09/20/2021 20:47:41 - INFO - __main__ - Step 29120: {'lr': 0.0001997675955717791, 'samples': 931840, 'steps': 1819, 'loss/train': 2.564854860305786} -09/20/2021 20:47:42 - INFO - __main__ - Step 29121: {'lr': 0.00019976716073013702, 'samples': 931872, 'steps': 1820, 'loss/train': 2.5903501510620117} -09/20/2021 20:47:42 - INFO - __main__ - Step 29122: {'lr': 0.00019976716073013702, 'samples': 931904, 'steps': 1820, 'loss/train': 2.4105613231658936} -09/20/2021 20:47:43 - INFO - __main__ - Step 29123: {'lr': 0.00019976716073013702, 'samples': 931936, 'steps': 1820, 'loss/train': 2.5938243865966797} -09/20/2021 20:47:44 - INFO - __main__ - Step 29124: {'lr': 0.00019976716073013702, 'samples': 931968, 'steps': 1820, 'loss/train': 3.0884759426116943} -09/20/2021 20:47:45 - INFO - __main__ - Step 29125: {'lr': 0.00019976716073013702, 'samples': 932000, 'steps': 1820, 'loss/train': 2.16943097114563} -09/20/2021 20:47:45 - INFO - __main__ - Step 29126: {'lr': 0.00019976716073013702, 'samples': 932032, 'steps': 1820, 'loss/train': 3.822097063064575} -09/20/2021 20:47:47 - INFO - __main__ - Step 29127: {'lr': 0.00019976716073013702, 'samples': 932064, 'steps': 1820, 'loss/train': 3.76992130279541} -09/20/2021 20:47:47 - INFO - __main__ - Step 29128: {'lr': 0.00019976716073013702, 'samples': 932096, 'steps': 1820, 'loss/train': 2.2041513919830322} -09/20/2021 20:47:48 - INFO - __main__ - Step 29129: {'lr': 0.00019976716073013702, 'samples': 932128, 'steps': 1820, 'loss/train': 2.199411392211914} -09/20/2021 20:47:49 - INFO - __main__ - Step 29130: {'lr': 0.00019976716073013702, 'samples': 932160, 'steps': 1820, 'loss/train': 2.02828049659729} -09/20/2021 20:47:50 - INFO - __main__ - Step 29131: {'lr': 0.00019976716073013702, 'samples': 932192, 'steps': 1820, 'loss/train': 2.7071332931518555} -09/20/2021 20:47:50 - INFO - __main__ - Step 29132: {'lr': 0.00019976716073013702, 'samples': 932224, 'steps': 1820, 'loss/train': 2.659963369369507} -09/20/2021 20:47:51 - INFO - __main__ - Step 29133: {'lr': 0.00019976716073013702, 'samples': 932256, 'steps': 1820, 'loss/train': 2.508237361907959} -09/20/2021 20:47:52 - INFO - __main__ - Step 29134: {'lr': 0.00019976716073013702, 'samples': 932288, 'steps': 1820, 'loss/train': 2.3703107833862305} -09/20/2021 20:47:53 - INFO - __main__ - Step 29135: {'lr': 0.00019976716073013702, 'samples': 932320, 'steps': 1820, 'loss/train': 2.667633295059204} -09/20/2021 20:47:53 - INFO - __main__ - Step 29136: {'lr': 0.00019976716073013702, 'samples': 932352, 'steps': 1820, 'loss/train': 3.2114038467407227} -09/20/2021 20:47:54 - INFO - __main__ - Step 29137: {'lr': 0.00019976672548254273, 'samples': 932384, 'steps': 1821, 'loss/train': 0.9777027368545532} -09/20/2021 20:47:55 - INFO - __main__ - Step 29138: {'lr': 0.00019976672548254273, 'samples': 932416, 'steps': 1821, 'loss/train': 2.783283233642578} -09/20/2021 20:47:56 - INFO - __main__ - Step 29139: {'lr': 0.00019976672548254273, 'samples': 932448, 'steps': 1821, 'loss/train': 1.9650254249572754} -09/20/2021 20:47:57 - INFO - __main__ - Step 29140: {'lr': 0.00019976672548254273, 'samples': 932480, 'steps': 1821, 'loss/train': 2.416274070739746} -09/20/2021 20:47:57 - INFO - __main__ - Step 29141: {'lr': 0.00019976672548254273, 'samples': 932512, 'steps': 1821, 'loss/train': 2.8863108158111572} -09/20/2021 20:47:58 - INFO - __main__ - Step 29142: {'lr': 0.00019976672548254273, 'samples': 932544, 'steps': 1821, 'loss/train': 2.189652919769287} -09/20/2021 20:47:59 - INFO - __main__ - Step 29143: {'lr': 0.00019976672548254273, 'samples': 932576, 'steps': 1821, 'loss/train': 3.168642520904541} -09/20/2021 20:48:00 - INFO - __main__ - Step 29144: {'lr': 0.00019976672548254273, 'samples': 932608, 'steps': 1821, 'loss/train': 3.5658750534057617} -09/20/2021 20:48:00 - INFO - __main__ - Step 29145: {'lr': 0.00019976672548254273, 'samples': 932640, 'steps': 1821, 'loss/train': 2.045623302459717} -09/20/2021 20:48:01 - INFO - __main__ - Step 29146: {'lr': 0.00019976672548254273, 'samples': 932672, 'steps': 1821, 'loss/train': 1.6119951009750366} -09/20/2021 20:48:02 - INFO - __main__ - Step 29147: {'lr': 0.00019976672548254273, 'samples': 932704, 'steps': 1821, 'loss/train': 3.0766680240631104} -09/20/2021 20:48:03 - INFO - __main__ - Step 29148: {'lr': 0.00019976672548254273, 'samples': 932736, 'steps': 1821, 'loss/train': 2.5002498626708984} -09/20/2021 20:48:03 - INFO - __main__ - Step 29149: {'lr': 0.00019976672548254273, 'samples': 932768, 'steps': 1821, 'loss/train': 2.5506227016448975} -09/20/2021 20:48:04 - INFO - __main__ - Step 29150: {'lr': 0.00019976672548254273, 'samples': 932800, 'steps': 1821, 'loss/train': 2.794890880584717} -09/20/2021 20:48:05 - INFO - __main__ - Step 29151: {'lr': 0.00019976672548254273, 'samples': 932832, 'steps': 1821, 'loss/train': 2.6442837715148926} -09/20/2021 20:48:06 - INFO - __main__ - Step 29152: {'lr': 0.00019976672548254273, 'samples': 932864, 'steps': 1821, 'loss/train': 2.5626978874206543} -09/20/2021 20:48:06 - INFO - __main__ - Step 29153: {'lr': 0.00019976628982899805, 'samples': 932896, 'steps': 1822, 'loss/train': 2.7602076530456543} -09/20/2021 20:48:07 - INFO - __main__ - Step 29154: {'lr': 0.00019976628982899805, 'samples': 932928, 'steps': 1822, 'loss/train': 2.713747978210449} -09/20/2021 20:48:08 - INFO - __main__ - Step 29155: {'lr': 0.00019976628982899805, 'samples': 932960, 'steps': 1822, 'loss/train': 2.462428569793701} -09/20/2021 20:48:09 - INFO - __main__ - Step 29156: {'lr': 0.00019976628982899805, 'samples': 932992, 'steps': 1822, 'loss/train': 2.2147135734558105} -09/20/2021 20:48:10 - INFO - __main__ - Step 29157: {'lr': 0.00019976628982899805, 'samples': 933024, 'steps': 1822, 'loss/train': 2.8065154552459717} -09/20/2021 20:48:11 - INFO - __main__ - Step 29158: {'lr': 0.00019976628982899805, 'samples': 933056, 'steps': 1822, 'loss/train': 2.747328996658325} -09/20/2021 20:48:11 - INFO - __main__ - Step 29159: {'lr': 0.00019976628982899805, 'samples': 933088, 'steps': 1822, 'loss/train': 1.87923264503479} -09/20/2021 20:48:12 - INFO - __main__ - Step 29160: {'lr': 0.00019976628982899805, 'samples': 933120, 'steps': 1822, 'loss/train': 1.7589788436889648} -09/20/2021 20:48:13 - INFO - __main__ - Step 29161: {'lr': 0.00019976628982899805, 'samples': 933152, 'steps': 1822, 'loss/train': 2.247407913208008} -09/20/2021 20:48:14 - INFO - __main__ - Step 29162: {'lr': 0.00019976628982899805, 'samples': 933184, 'steps': 1822, 'loss/train': 5.633066654205322} -09/20/2021 20:48:14 - INFO - __main__ - Step 29163: {'lr': 0.00019976628982899805, 'samples': 933216, 'steps': 1822, 'loss/train': 2.9221510887145996} -09/20/2021 20:48:15 - INFO - __main__ - Step 29164: {'lr': 0.00019976628982899805, 'samples': 933248, 'steps': 1822, 'loss/train': 2.4633371829986572} -09/20/2021 20:48:16 - INFO - __main__ - Step 29165: {'lr': 0.00019976628982899805, 'samples': 933280, 'steps': 1822, 'loss/train': 3.259049415588379} -09/20/2021 20:48:17 - INFO - __main__ - Step 29166: {'lr': 0.00019976628982899805, 'samples': 933312, 'steps': 1822, 'loss/train': 2.714125871658325} -09/20/2021 20:48:17 - INFO - __main__ - Step 29167: {'lr': 0.00019976628982899805, 'samples': 933344, 'steps': 1822, 'loss/train': 2.219489574432373} -09/20/2021 20:48:18 - INFO - __main__ - Step 29168: {'lr': 0.00019976628982899805, 'samples': 933376, 'steps': 1822, 'loss/train': 0.6690407991409302} -09/20/2021 20:48:19 - INFO - __main__ - Step 29169: {'lr': 0.00019976585376950472, 'samples': 933408, 'steps': 1823, 'loss/train': 2.197479486465454} -09/20/2021 20:48:20 - INFO - __main__ - Step 29170: {'lr': 0.00019976585376950472, 'samples': 933440, 'steps': 1823, 'loss/train': 2.1981358528137207} -09/20/2021 20:48:21 - INFO - __main__ - Step 29171: {'lr': 0.00019976585376950472, 'samples': 933472, 'steps': 1823, 'loss/train': 2.022244930267334} -09/20/2021 20:48:21 - INFO - __main__ - Step 29172: {'lr': 0.00019976585376950472, 'samples': 933504, 'steps': 1823, 'loss/train': 2.504115581512451} -09/20/2021 20:48:22 - INFO - __main__ - Step 29173: {'lr': 0.00019976585376950472, 'samples': 933536, 'steps': 1823, 'loss/train': 2.3021140098571777} -09/20/2021 20:48:23 - INFO - __main__ - Step 29174: {'lr': 0.00019976585376950472, 'samples': 933568, 'steps': 1823, 'loss/train': 2.6749050617218018} -09/20/2021 20:48:24 - INFO - __main__ - Step 29175: {'lr': 0.00019976585376950472, 'samples': 933600, 'steps': 1823, 'loss/train': 2.4105279445648193} -09/20/2021 20:48:24 - INFO - __main__ - Step 29176: {'lr': 0.00019976585376950472, 'samples': 933632, 'steps': 1823, 'loss/train': 0.7608739137649536} -09/20/2021 20:48:25 - INFO - __main__ - Step 29177: {'lr': 0.00019976585376950472, 'samples': 933664, 'steps': 1823, 'loss/train': 1.9567723274230957} -09/20/2021 20:48:26 - INFO - __main__ - Step 29178: {'lr': 0.00019976585376950472, 'samples': 933696, 'steps': 1823, 'loss/train': 1.968879222869873} -09/20/2021 20:48:27 - INFO - __main__ - Step 29179: {'lr': 0.00019976585376950472, 'samples': 933728, 'steps': 1823, 'loss/train': 2.3921566009521484} -09/20/2021 20:48:27 - INFO - __main__ - Step 29180: {'lr': 0.00019976585376950472, 'samples': 933760, 'steps': 1823, 'loss/train': 2.738917589187622} -09/20/2021 20:48:28 - INFO - __main__ - Step 29181: {'lr': 0.00019976585376950472, 'samples': 933792, 'steps': 1823, 'loss/train': 2.072214126586914} -09/20/2021 20:48:29 - INFO - __main__ - Step 29182: {'lr': 0.00019976585376950472, 'samples': 933824, 'steps': 1823, 'loss/train': 3.031325101852417} -09/20/2021 20:48:30 - INFO - __main__ - Step 29183: {'lr': 0.00019976585376950472, 'samples': 933856, 'steps': 1823, 'loss/train': 2.1388418674468994} -09/20/2021 20:48:30 - INFO - __main__ - Step 29184: {'lr': 0.00019976585376950472, 'samples': 933888, 'steps': 1823, 'loss/train': 2.706575393676758} -09/20/2021 20:48:31 - INFO - __main__ - Step 29185: {'lr': 0.0001997654173040645, 'samples': 933920, 'steps': 1824, 'loss/train': 3.8089230060577393} -09/20/2021 20:48:32 - INFO - __main__ - Step 29186: {'lr': 0.0001997654173040645, 'samples': 933952, 'steps': 1824, 'loss/train': 2.7822954654693604} -09/20/2021 20:48:33 - INFO - __main__ - Step 29187: {'lr': 0.0001997654173040645, 'samples': 933984, 'steps': 1824, 'loss/train': 3.237805128097534} -09/20/2021 20:48:33 - INFO - __main__ - Step 29188: {'lr': 0.0001997654173040645, 'samples': 934016, 'steps': 1824, 'loss/train': 2.4783775806427} -09/20/2021 20:48:35 - INFO - __main__ - Step 29189: {'lr': 0.0001997654173040645, 'samples': 934048, 'steps': 1824, 'loss/train': 3.098952054977417} -09/20/2021 20:48:36 - INFO - __main__ - Step 29190: {'lr': 0.0001997654173040645, 'samples': 934080, 'steps': 1824, 'loss/train': 0.2869201898574829} -09/20/2021 20:48:36 - INFO - __main__ - Step 29191: {'lr': 0.0001997654173040645, 'samples': 934112, 'steps': 1824, 'loss/train': 0.4843382239341736} -09/20/2021 20:48:37 - INFO - __main__ - Step 29192: {'lr': 0.0001997654173040645, 'samples': 934144, 'steps': 1824, 'loss/train': 0.5148805379867554} -09/20/2021 20:48:38 - INFO - __main__ - Step 29193: {'lr': 0.0001997654173040645, 'samples': 934176, 'steps': 1824, 'loss/train': 2.5803918838500977} -09/20/2021 20:48:39 - INFO - __main__ - Step 29194: {'lr': 0.0001997654173040645, 'samples': 934208, 'steps': 1824, 'loss/train': 2.6520490646362305} -09/20/2021 20:48:39 - INFO - __main__ - Step 29195: {'lr': 0.0001997654173040645, 'samples': 934240, 'steps': 1824, 'loss/train': 2.5744855403900146} -09/20/2021 20:48:40 - INFO - __main__ - Step 29196: {'lr': 0.0001997654173040645, 'samples': 934272, 'steps': 1824, 'loss/train': 2.9513347148895264} -09/20/2021 20:48:41 - INFO - __main__ - Step 29197: {'lr': 0.0001997654173040645, 'samples': 934304, 'steps': 1824, 'loss/train': 0.4295450448989868} -09/20/2021 20:48:42 - INFO - __main__ - Step 29198: {'lr': 0.0001997654173040645, 'samples': 934336, 'steps': 1824, 'loss/train': 1.6920732259750366} -09/20/2021 20:48:42 - INFO - __main__ - Step 29199: {'lr': 0.0001997654173040645, 'samples': 934368, 'steps': 1824, 'loss/train': 1.4041770696640015} -09/20/2021 20:48:43 - INFO - __main__ - Step 29200: {'lr': 0.0001997654173040645, 'samples': 934400, 'steps': 1824, 'loss/train': 2.683856964111328} -09/20/2021 20:48:44 - INFO - __main__ - Step 29201: {'lr': 0.0001997649804326792, 'samples': 934432, 'steps': 1825, 'loss/train': 2.5659594535827637} -09/20/2021 20:48:45 - INFO - __main__ - Step 29202: {'lr': 0.0001997649804326792, 'samples': 934464, 'steps': 1825, 'loss/train': 2.370882987976074} -09/20/2021 20:48:45 - INFO - __main__ - Step 29203: {'lr': 0.0001997649804326792, 'samples': 934496, 'steps': 1825, 'loss/train': 2.3313143253326416} -09/20/2021 20:48:46 - INFO - __main__ - Step 29204: {'lr': 0.0001997649804326792, 'samples': 934528, 'steps': 1825, 'loss/train': 1.9616148471832275} -09/20/2021 20:48:47 - INFO - __main__ - Step 29205: {'lr': 0.0001997649804326792, 'samples': 934560, 'steps': 1825, 'loss/train': 2.539764881134033} -09/20/2021 20:48:48 - INFO - __main__ - Step 29206: {'lr': 0.0001997649804326792, 'samples': 934592, 'steps': 1825, 'loss/train': 1.350483775138855} -09/20/2021 20:48:48 - INFO - __main__ - Step 29207: {'lr': 0.0001997649804326792, 'samples': 934624, 'steps': 1825, 'loss/train': 2.0321619510650635} -09/20/2021 20:48:49 - INFO - __main__ - Step 29208: {'lr': 0.0001997649804326792, 'samples': 934656, 'steps': 1825, 'loss/train': 2.185288667678833} -09/20/2021 20:48:50 - INFO - __main__ - Step 29209: {'lr': 0.0001997649804326792, 'samples': 934688, 'steps': 1825, 'loss/train': 2.9799647331237793} -09/20/2021 20:48:51 - INFO - __main__ - Step 29210: {'lr': 0.0001997649804326792, 'samples': 934720, 'steps': 1825, 'loss/train': 3.8004980087280273} -09/20/2021 20:48:51 - INFO - __main__ - Step 29211: {'lr': 0.0001997649804326792, 'samples': 934752, 'steps': 1825, 'loss/train': 2.1096572875976562} -09/20/2021 20:48:52 - INFO - __main__ - Step 29212: {'lr': 0.0001997649804326792, 'samples': 934784, 'steps': 1825, 'loss/train': 2.0451273918151855} -09/20/2021 20:48:53 - INFO - __main__ - Step 29213: {'lr': 0.0001997649804326792, 'samples': 934816, 'steps': 1825, 'loss/train': 1.5969817638397217} -09/20/2021 20:48:54 - INFO - __main__ - Step 29214: {'lr': 0.0001997649804326792, 'samples': 934848, 'steps': 1825, 'loss/train': 0.4919348955154419} -09/20/2021 20:48:54 - INFO - __main__ - Step 29215: {'lr': 0.0001997649804326792, 'samples': 934880, 'steps': 1825, 'loss/train': 3.0815093517303467} -09/20/2021 20:48:55 - INFO - __main__ - Step 29216: {'lr': 0.0001997649804326792, 'samples': 934912, 'steps': 1825, 'loss/train': 2.4936201572418213} -09/20/2021 20:48:56 - INFO - __main__ - Step 29217: {'lr': 0.0001997645431553506, 'samples': 934944, 'steps': 1826, 'loss/train': 2.2024571895599365} -09/20/2021 20:48:57 - INFO - __main__ - Step 29218: {'lr': 0.0001997645431553506, 'samples': 934976, 'steps': 1826, 'loss/train': 1.567006230354309} -09/20/2021 20:48:59 - INFO - __main__ - Step 29219: {'lr': 0.0001997645431553506, 'samples': 935008, 'steps': 1826, 'loss/train': 1.9360003471374512} -09/20/2021 20:48:59 - INFO - __main__ - Step 29220: {'lr': 0.0001997645431553506, 'samples': 935040, 'steps': 1826, 'loss/train': 2.23085618019104} -09/20/2021 20:49:00 - INFO - __main__ - Step 29221: {'lr': 0.0001997645431553506, 'samples': 935072, 'steps': 1826, 'loss/train': 2.573730945587158} -09/20/2021 20:49:01 - INFO - __main__ - Step 29222: {'lr': 0.0001997645431553506, 'samples': 935104, 'steps': 1826, 'loss/train': 1.5107131004333496} -09/20/2021 20:49:02 - INFO - __main__ - Step 29223: {'lr': 0.0001997645431553506, 'samples': 935136, 'steps': 1826, 'loss/train': 2.3736298084259033} -09/20/2021 20:49:02 - INFO - __main__ - Step 29224: {'lr': 0.0001997645431553506, 'samples': 935168, 'steps': 1826, 'loss/train': 2.8826868534088135} -09/20/2021 20:49:03 - INFO - __main__ - Step 29225: {'lr': 0.0001997645431553506, 'samples': 935200, 'steps': 1826, 'loss/train': 1.0422515869140625} -09/20/2021 20:49:04 - INFO - __main__ - Step 29226: {'lr': 0.0001997645431553506, 'samples': 935232, 'steps': 1826, 'loss/train': 1.2990846633911133} -09/20/2021 20:49:05 - INFO - __main__ - Step 29227: {'lr': 0.0001997645431553506, 'samples': 935264, 'steps': 1826, 'loss/train': 0.9499590396881104} -09/20/2021 20:49:05 - INFO - __main__ - Step 29228: {'lr': 0.0001997645431553506, 'samples': 935296, 'steps': 1826, 'loss/train': 0.8871707916259766} -09/20/2021 20:49:06 - INFO - __main__ - Step 29229: {'lr': 0.0001997645431553506, 'samples': 935328, 'steps': 1826, 'loss/train': 0.9514679312705994} -09/20/2021 20:49:07 - INFO - __main__ - Step 29230: {'lr': 0.0001997645431553506, 'samples': 935360, 'steps': 1826, 'loss/train': 1.052310824394226} -09/20/2021 20:49:08 - INFO - __main__ - Step 29231: {'lr': 0.0001997645431553506, 'samples': 935392, 'steps': 1826, 'loss/train': 0.8983493447303772} -09/20/2021 20:49:08 - INFO - __main__ - Step 29232: {'lr': 0.0001997645431553506, 'samples': 935424, 'steps': 1826, 'loss/train': 1.0243785381317139} -09/20/2021 20:49:09 - INFO - __main__ - Step 29233: {'lr': 0.00019976410547208043, 'samples': 935456, 'steps': 1827, 'loss/train': 1.4540133476257324} -09/20/2021 20:49:10 - INFO - __main__ - Step 29234: {'lr': 0.00019976410547208043, 'samples': 935488, 'steps': 1827, 'loss/train': 3.279047727584839} -09/20/2021 20:49:11 - INFO - __main__ - Step 29235: {'lr': 0.00019976410547208043, 'samples': 935520, 'steps': 1827, 'loss/train': 3.5920019149780273} -09/20/2021 20:49:11 - INFO - __main__ - Step 29236: {'lr': 0.00019976410547208043, 'samples': 935552, 'steps': 1827, 'loss/train': 2.063253879547119} -09/20/2021 20:49:12 - INFO - __main__ - Step 29237: {'lr': 0.00019976410547208043, 'samples': 935584, 'steps': 1827, 'loss/train': 2.3026235103607178} -09/20/2021 20:49:13 - INFO - __main__ - Step 29238: {'lr': 0.00019976410547208043, 'samples': 935616, 'steps': 1827, 'loss/train': 2.8966312408447266} -09/20/2021 20:49:14 - INFO - __main__ - Step 29239: {'lr': 0.00019976410547208043, 'samples': 935648, 'steps': 1827, 'loss/train': 2.609032392501831} -09/20/2021 20:49:14 - INFO - __main__ - Step 29240: {'lr': 0.00019976410547208043, 'samples': 935680, 'steps': 1827, 'loss/train': 2.588017702102661} -09/20/2021 20:49:15 - INFO - __main__ - Step 29241: {'lr': 0.00019976410547208043, 'samples': 935712, 'steps': 1827, 'loss/train': 2.601045846939087} -09/20/2021 20:49:16 - INFO - __main__ - Step 29242: {'lr': 0.00019976410547208043, 'samples': 935744, 'steps': 1827, 'loss/train': 3.6323251724243164} -09/20/2021 20:49:17 - INFO - __main__ - Step 29243: {'lr': 0.00019976410547208043, 'samples': 935776, 'steps': 1827, 'loss/train': 2.488830327987671} -09/20/2021 20:49:17 - INFO - __main__ - Step 29244: {'lr': 0.00019976410547208043, 'samples': 935808, 'steps': 1827, 'loss/train': 2.875720739364624} -09/20/2021 20:49:18 - INFO - __main__ - Step 29245: {'lr': 0.00019976410547208043, 'samples': 935840, 'steps': 1827, 'loss/train': 1.2072733640670776} -09/20/2021 20:49:19 - INFO - __main__ - Step 29246: {'lr': 0.00019976410547208043, 'samples': 935872, 'steps': 1827, 'loss/train': 2.711151599884033} -09/20/2021 20:49:20 - INFO - __main__ - Step 29247: {'lr': 0.00019976410547208043, 'samples': 935904, 'steps': 1827, 'loss/train': 3.5051355361938477} -09/20/2021 20:49:20 - INFO - __main__ - Step 29248: {'lr': 0.00019976410547208043, 'samples': 935936, 'steps': 1827, 'loss/train': 3.223330020904541} -09/20/2021 20:49:21 - INFO - __main__ - Step 29249: {'lr': 0.0001997636673828705, 'samples': 935968, 'steps': 1828, 'loss/train': 0.6673383712768555} -09/20/2021 20:49:22 - INFO - __main__ - Step 29250: {'lr': 0.0001997636673828705, 'samples': 936000, 'steps': 1828, 'loss/train': 0.2592417001724243} -09/20/2021 20:49:23 - INFO - __main__ - Step 29251: {'lr': 0.0001997636673828705, 'samples': 936032, 'steps': 1828, 'loss/train': 0.4602412283420563} -09/20/2021 20:49:24 - INFO - __main__ - Step 29252: {'lr': 0.0001997636673828705, 'samples': 936064, 'steps': 1828, 'loss/train': 0.2522432804107666} -09/20/2021 20:49:24 - INFO - __main__ - Step 29253: {'lr': 0.0001997636673828705, 'samples': 936096, 'steps': 1828, 'loss/train': 0.40312543511390686} -09/20/2021 20:49:25 - INFO - __main__ - Step 29254: {'lr': 0.0001997636673828705, 'samples': 936128, 'steps': 1828, 'loss/train': 0.6126739978790283} -09/20/2021 20:49:27 - INFO - __main__ - Step 29255: {'lr': 0.0001997636673828705, 'samples': 936160, 'steps': 1828, 'loss/train': 2.476687431335449} -09/20/2021 20:49:27 - INFO - __main__ - Step 29256: {'lr': 0.0001997636673828705, 'samples': 936192, 'steps': 1828, 'loss/train': 3.3165626525878906} -09/20/2021 20:49:28 - INFO - __main__ - Step 29257: {'lr': 0.0001997636673828705, 'samples': 936224, 'steps': 1828, 'loss/train': 2.3791253566741943} -09/20/2021 20:49:29 - INFO - __main__ - Step 29258: {'lr': 0.0001997636673828705, 'samples': 936256, 'steps': 1828, 'loss/train': 1.7014176845550537} -09/20/2021 20:49:30 - INFO - __main__ - Step 29259: {'lr': 0.0001997636673828705, 'samples': 936288, 'steps': 1828, 'loss/train': 2.3161404132843018} -09/20/2021 20:49:30 - INFO - __main__ - Step 29260: {'lr': 0.0001997636673828705, 'samples': 936320, 'steps': 1828, 'loss/train': 2.9616940021514893} -09/20/2021 20:49:31 - INFO - __main__ - Step 29261: {'lr': 0.0001997636673828705, 'samples': 936352, 'steps': 1828, 'loss/train': 2.613783597946167} -09/20/2021 20:49:32 - INFO - __main__ - Step 29262: {'lr': 0.0001997636673828705, 'samples': 936384, 'steps': 1828, 'loss/train': 2.673781394958496} -09/20/2021 20:49:33 - INFO - __main__ - Step 29263: {'lr': 0.0001997636673828705, 'samples': 936416, 'steps': 1828, 'loss/train': 3.0346992015838623} -09/20/2021 20:49:33 - INFO - __main__ - Step 29264: {'lr': 0.0001997636673828705, 'samples': 936448, 'steps': 1828, 'loss/train': 2.6494367122650146} -09/20/2021 20:49:34 - INFO - __main__ - Step 29265: {'lr': 0.0001997632288877226, 'samples': 936480, 'steps': 1829, 'loss/train': 2.689497470855713} -09/20/2021 20:49:35 - INFO - __main__ - Step 29266: {'lr': 0.0001997632288877226, 'samples': 936512, 'steps': 1829, 'loss/train': 1.6793239116668701} -09/20/2021 20:49:36 - INFO - __main__ - Step 29267: {'lr': 0.0001997632288877226, 'samples': 936544, 'steps': 1829, 'loss/train': 3.4957005977630615} -09/20/2021 20:49:36 - INFO - __main__ - Step 29268: {'lr': 0.0001997632288877226, 'samples': 936576, 'steps': 1829, 'loss/train': 0.44735342264175415} -09/20/2021 20:49:37 - INFO - __main__ - Step 29269: {'lr': 0.0001997632288877226, 'samples': 936608, 'steps': 1829, 'loss/train': 0.3300357758998871} -09/20/2021 20:49:38 - INFO - __main__ - Step 29270: {'lr': 0.0001997632288877226, 'samples': 936640, 'steps': 1829, 'loss/train': 2.023388624191284} -09/20/2021 20:49:39 - INFO - __main__ - Step 29271: {'lr': 0.0001997632288877226, 'samples': 936672, 'steps': 1829, 'loss/train': 2.5023059844970703} -09/20/2021 20:49:39 - INFO - __main__ - Step 29272: {'lr': 0.0001997632288877226, 'samples': 936704, 'steps': 1829, 'loss/train': 1.2237898111343384} -09/20/2021 20:49:40 - INFO - __main__ - Step 29273: {'lr': 0.0001997632288877226, 'samples': 936736, 'steps': 1829, 'loss/train': 2.5361082553863525} -09/20/2021 20:49:41 - INFO - __main__ - Step 29274: {'lr': 0.0001997632288877226, 'samples': 936768, 'steps': 1829, 'loss/train': 3.145437479019165} -09/20/2021 20:49:42 - INFO - __main__ - Step 29275: {'lr': 0.0001997632288877226, 'samples': 936800, 'steps': 1829, 'loss/train': 2.7597057819366455} -09/20/2021 20:49:42 - INFO - __main__ - Step 29276: {'lr': 0.0001997632288877226, 'samples': 936832, 'steps': 1829, 'loss/train': 2.8954482078552246} -09/20/2021 20:49:43 - INFO - __main__ - Step 29277: {'lr': 0.0001997632288877226, 'samples': 936864, 'steps': 1829, 'loss/train': 2.4595236778259277} -09/20/2021 20:49:44 - INFO - __main__ - Step 29278: {'lr': 0.0001997632288877226, 'samples': 936896, 'steps': 1829, 'loss/train': 4.071023941040039} -09/20/2021 20:49:45 - INFO - __main__ - Step 29279: {'lr': 0.0001997632288877226, 'samples': 936928, 'steps': 1829, 'loss/train': 2.8234124183654785} -09/20/2021 20:49:45 - INFO - __main__ - Step 29280: {'lr': 0.0001997632288877226, 'samples': 936960, 'steps': 1829, 'loss/train': 2.3683619499206543} -09/20/2021 20:49:46 - INFO - __main__ - Step 29281: {'lr': 0.00019976278998663853, 'samples': 936992, 'steps': 1830, 'loss/train': 2.702761173248291} -09/20/2021 20:49:47 - INFO - __main__ - Step 29282: {'lr': 0.00019976278998663853, 'samples': 937024, 'steps': 1830, 'loss/train': 1.7856147289276123} -09/20/2021 20:49:48 - INFO - __main__ - Step 29283: {'lr': 0.00019976278998663853, 'samples': 937056, 'steps': 1830, 'loss/train': 2.1176657676696777} -09/20/2021 20:49:49 - INFO - __main__ - Step 29284: {'lr': 0.00019976278998663853, 'samples': 937088, 'steps': 1830, 'loss/train': 2.573418617248535} -09/20/2021 20:49:49 - INFO - __main__ - Step 29285: {'lr': 0.00019976278998663853, 'samples': 937120, 'steps': 1830, 'loss/train': 2.449849843978882} -09/20/2021 20:49:50 - INFO - __main__ - Step 29286: {'lr': 0.00019976278998663853, 'samples': 937152, 'steps': 1830, 'loss/train': 1.5567028522491455} -09/20/2021 20:49:52 - INFO - __main__ - Step 29287: {'lr': 0.00019976278998663853, 'samples': 937184, 'steps': 1830, 'loss/train': 2.490109920501709} -09/20/2021 20:49:53 - INFO - __main__ - Step 29288: {'lr': 0.00019976278998663853, 'samples': 937216, 'steps': 1830, 'loss/train': 2.488450288772583} -09/20/2021 20:49:53 - INFO - __main__ - Step 29289: {'lr': 0.00019976278998663853, 'samples': 937248, 'steps': 1830, 'loss/train': 2.779944658279419} -09/20/2021 20:49:54 - INFO - __main__ - Step 29290: {'lr': 0.00019976278998663853, 'samples': 937280, 'steps': 1830, 'loss/train': 2.334059238433838} -09/20/2021 20:49:55 - INFO - __main__ - Step 29291: {'lr': 0.00019976278998663853, 'samples': 937312, 'steps': 1830, 'loss/train': 2.4178123474121094} -09/20/2021 20:49:56 - INFO - __main__ - Step 29292: {'lr': 0.00019976278998663853, 'samples': 937344, 'steps': 1830, 'loss/train': 3.650909900665283} -09/20/2021 20:49:56 - INFO - __main__ - Step 29293: {'lr': 0.00019976278998663853, 'samples': 937376, 'steps': 1830, 'loss/train': 2.679375410079956} -09/20/2021 20:49:57 - INFO - __main__ - Step 29294: {'lr': 0.00019976278998663853, 'samples': 937408, 'steps': 1830, 'loss/train': 2.5789172649383545} -09/20/2021 20:49:58 - INFO - __main__ - Step 29295: {'lr': 0.00019976278998663853, 'samples': 937440, 'steps': 1830, 'loss/train': 2.7040162086486816} -09/20/2021 20:49:59 - INFO - __main__ - Step 29296: {'lr': 0.00019976278998663853, 'samples': 937472, 'steps': 1830, 'loss/train': 2.4928019046783447} -09/20/2021 20:49:59 - INFO - __main__ - Step 29297: {'lr': 0.00019976235067962006, 'samples': 937504, 'steps': 1831, 'loss/train': 3.3274528980255127} -09/20/2021 20:50:00 - INFO - __main__ - Step 29298: {'lr': 0.00019976235067962006, 'samples': 937536, 'steps': 1831, 'loss/train': 1.8490240573883057} -09/20/2021 20:50:01 - INFO - __main__ - Step 29299: {'lr': 0.00019976235067962006, 'samples': 937568, 'steps': 1831, 'loss/train': 2.5240135192871094} -09/20/2021 20:50:02 - INFO - __main__ - Step 29300: {'lr': 0.00019976235067962006, 'samples': 937600, 'steps': 1831, 'loss/train': 3.289191484451294} -09/20/2021 20:50:02 - INFO - __main__ - Step 29301: {'lr': 0.00019976235067962006, 'samples': 937632, 'steps': 1831, 'loss/train': 2.479886054992676} -09/20/2021 20:50:03 - INFO - __main__ - Step 29302: {'lr': 0.00019976235067962006, 'samples': 937664, 'steps': 1831, 'loss/train': 1.9201115369796753} -09/20/2021 20:50:04 - INFO - __main__ - Step 29303: {'lr': 0.00019976235067962006, 'samples': 937696, 'steps': 1831, 'loss/train': 2.312143325805664} -09/20/2021 20:50:05 - INFO - __main__ - Step 29304: {'lr': 0.00019976235067962006, 'samples': 937728, 'steps': 1831, 'loss/train': 1.1393623352050781} -09/20/2021 20:50:05 - INFO - __main__ - Step 29305: {'lr': 0.00019976235067962006, 'samples': 937760, 'steps': 1831, 'loss/train': 2.0288002490997314} -09/20/2021 20:50:06 - INFO - __main__ - Step 29306: {'lr': 0.00019976235067962006, 'samples': 937792, 'steps': 1831, 'loss/train': 2.7394461631774902} -09/20/2021 20:50:07 - INFO - __main__ - Step 29307: {'lr': 0.00019976235067962006, 'samples': 937824, 'steps': 1831, 'loss/train': 2.9459922313690186} -09/20/2021 20:50:08 - INFO - __main__ - Step 29308: {'lr': 0.00019976235067962006, 'samples': 937856, 'steps': 1831, 'loss/train': 3.5805766582489014} -09/20/2021 20:50:08 - INFO - __main__ - Step 29309: {'lr': 0.00019976235067962006, 'samples': 937888, 'steps': 1831, 'loss/train': 2.833425283432007} -09/20/2021 20:50:09 - INFO - __main__ - Step 29310: {'lr': 0.00019976235067962006, 'samples': 937920, 'steps': 1831, 'loss/train': 3.2728235721588135} -09/20/2021 20:50:10 - INFO - __main__ - Step 29311: {'lr': 0.00019976235067962006, 'samples': 937952, 'steps': 1831, 'loss/train': 2.4783599376678467} -09/20/2021 20:50:11 - INFO - __main__ - Step 29312: {'lr': 0.00019976235067962006, 'samples': 937984, 'steps': 1831, 'loss/train': 2.3244078159332275} -09/20/2021 20:50:12 - INFO - __main__ - Step 29313: {'lr': 0.00019976191096666895, 'samples': 938016, 'steps': 1832, 'loss/train': 3.2685670852661133} -09/20/2021 20:50:12 - INFO - __main__ - Step 29314: {'lr': 0.00019976191096666895, 'samples': 938048, 'steps': 1832, 'loss/train': 2.7478761672973633} -09/20/2021 20:50:13 - INFO - __main__ - Step 29315: {'lr': 0.00019976191096666895, 'samples': 938080, 'steps': 1832, 'loss/train': 2.1783132553100586} -09/20/2021 20:50:14 - INFO - __main__ - Step 29316: {'lr': 0.00019976191096666895, 'samples': 938112, 'steps': 1832, 'loss/train': 1.75466787815094} -09/20/2021 20:50:15 - INFO - __main__ - Step 29317: {'lr': 0.00019976191096666895, 'samples': 938144, 'steps': 1832, 'loss/train': 2.164491653442383} -09/20/2021 20:50:16 - INFO - __main__ - Step 29318: {'lr': 0.00019976191096666895, 'samples': 938176, 'steps': 1832, 'loss/train': 2.2122817039489746} -09/20/2021 20:50:17 - INFO - __main__ - Step 29319: {'lr': 0.00019976191096666895, 'samples': 938208, 'steps': 1832, 'loss/train': 2.1574246883392334} -09/20/2021 20:50:17 - INFO - __main__ - Step 29320: {'lr': 0.00019976191096666895, 'samples': 938240, 'steps': 1832, 'loss/train': 1.8536546230316162} -09/20/2021 20:50:18 - INFO - __main__ - Step 29321: {'lr': 0.00019976191096666895, 'samples': 938272, 'steps': 1832, 'loss/train': 2.9134726524353027} -09/20/2021 20:50:19 - INFO - __main__ - Step 29322: {'lr': 0.00019976191096666895, 'samples': 938304, 'steps': 1832, 'loss/train': 2.9074292182922363} -09/20/2021 20:50:20 - INFO - __main__ - Step 29323: {'lr': 0.00019976191096666895, 'samples': 938336, 'steps': 1832, 'loss/train': 2.016908884048462} -09/20/2021 20:50:20 - INFO - __main__ - Step 29324: {'lr': 0.00019976191096666895, 'samples': 938368, 'steps': 1832, 'loss/train': 0.6882854700088501} -09/20/2021 20:50:21 - INFO - __main__ - Step 29325: {'lr': 0.00019976191096666895, 'samples': 938400, 'steps': 1832, 'loss/train': 2.7858219146728516} -09/20/2021 20:50:22 - INFO - __main__ - Step 29326: {'lr': 0.00019976191096666895, 'samples': 938432, 'steps': 1832, 'loss/train': 2.178713083267212} -09/20/2021 20:50:23 - INFO - __main__ - Step 29327: {'lr': 0.00019976191096666895, 'samples': 938464, 'steps': 1832, 'loss/train': 1.8022654056549072} -09/20/2021 20:50:23 - INFO - __main__ - Step 29328: {'lr': 0.00019976191096666895, 'samples': 938496, 'steps': 1832, 'loss/train': 1.4138703346252441} -09/20/2021 20:50:24 - INFO - __main__ - Step 29329: {'lr': 0.000199761470847787, 'samples': 938528, 'steps': 1833, 'loss/train': 2.068563222885132} -09/20/2021 20:50:25 - INFO - __main__ - Step 29330: {'lr': 0.000199761470847787, 'samples': 938560, 'steps': 1833, 'loss/train': 2.1432623863220215} -09/20/2021 20:50:26 - INFO - __main__ - Step 29331: {'lr': 0.000199761470847787, 'samples': 938592, 'steps': 1833, 'loss/train': 1.598812222480774} -09/20/2021 20:50:27 - INFO - __main__ - Step 29332: {'lr': 0.000199761470847787, 'samples': 938624, 'steps': 1833, 'loss/train': 2.0950570106506348} -09/20/2021 20:50:27 - INFO - __main__ - Step 29333: {'lr': 0.000199761470847787, 'samples': 938656, 'steps': 1833, 'loss/train': 2.1532630920410156} -09/20/2021 20:50:28 - INFO - __main__ - Step 29334: {'lr': 0.000199761470847787, 'samples': 938688, 'steps': 1833, 'loss/train': 1.8484797477722168} -09/20/2021 20:50:29 - INFO - __main__ - Step 29335: {'lr': 0.000199761470847787, 'samples': 938720, 'steps': 1833, 'loss/train': 1.6801868677139282} -09/20/2021 20:50:30 - INFO - __main__ - Step 29336: {'lr': 0.000199761470847787, 'samples': 938752, 'steps': 1833, 'loss/train': 2.028306722640991} -09/20/2021 20:50:30 - INFO - __main__ - Step 29337: {'lr': 0.000199761470847787, 'samples': 938784, 'steps': 1833, 'loss/train': 2.8674540519714355} -09/20/2021 20:50:31 - INFO - __main__ - Step 29338: {'lr': 0.000199761470847787, 'samples': 938816, 'steps': 1833, 'loss/train': 1.657637119293213} -09/20/2021 20:50:32 - INFO - __main__ - Step 29339: {'lr': 0.000199761470847787, 'samples': 938848, 'steps': 1833, 'loss/train': 2.744109869003296} -09/20/2021 20:50:33 - INFO - __main__ - Step 29340: {'lr': 0.000199761470847787, 'samples': 938880, 'steps': 1833, 'loss/train': 2.6183621883392334} -09/20/2021 20:50:33 - INFO - __main__ - Step 29341: {'lr': 0.000199761470847787, 'samples': 938912, 'steps': 1833, 'loss/train': 2.468050003051758} -09/20/2021 20:50:34 - INFO - __main__ - Step 29342: {'lr': 0.000199761470847787, 'samples': 938944, 'steps': 1833, 'loss/train': 2.34548282623291} -09/20/2021 20:50:35 - INFO - __main__ - Step 29343: {'lr': 0.000199761470847787, 'samples': 938976, 'steps': 1833, 'loss/train': 2.107872486114502} -09/20/2021 20:50:36 - INFO - __main__ - Step 29344: {'lr': 0.000199761470847787, 'samples': 939008, 'steps': 1833, 'loss/train': 2.509488582611084} -09/20/2021 20:50:36 - INFO - __main__ - Step 29345: {'lr': 0.00019976103032297605, 'samples': 939040, 'steps': 1834, 'loss/train': 2.2905969619750977} -09/20/2021 20:50:37 - INFO - __main__ - Step 29346: {'lr': 0.00019976103032297605, 'samples': 939072, 'steps': 1834, 'loss/train': 2.6089563369750977} -09/20/2021 20:50:38 - INFO - __main__ - Step 29347: {'lr': 0.00019976103032297605, 'samples': 939104, 'steps': 1834, 'loss/train': 2.407581329345703} -09/20/2021 20:50:39 - INFO - __main__ - Step 29348: {'lr': 0.00019976103032297605, 'samples': 939136, 'steps': 1834, 'loss/train': 1.8162609338760376} -09/20/2021 20:50:40 - INFO - __main__ - Step 29349: {'lr': 0.00019976103032297605, 'samples': 939168, 'steps': 1834, 'loss/train': 2.7764129638671875} -09/20/2021 20:50:41 - INFO - __main__ - Step 29350: {'lr': 0.00019976103032297605, 'samples': 939200, 'steps': 1834, 'loss/train': 2.8301503658294678} -09/20/2021 20:50:41 - INFO - __main__ - Step 29351: {'lr': 0.00019976103032297605, 'samples': 939232, 'steps': 1834, 'loss/train': 3.1532514095306396} -09/20/2021 20:50:42 - INFO - __main__ - Step 29352: {'lr': 0.00019976103032297605, 'samples': 939264, 'steps': 1834, 'loss/train': 3.1511764526367188} -09/20/2021 20:50:43 - INFO - __main__ - Step 29353: {'lr': 0.00019976103032297605, 'samples': 939296, 'steps': 1834, 'loss/train': 1.8277581930160522} -09/20/2021 20:50:44 - INFO - __main__ - Step 29354: {'lr': 0.00019976103032297605, 'samples': 939328, 'steps': 1834, 'loss/train': 1.8173811435699463} -09/20/2021 20:50:44 - INFO - __main__ - Step 29355: {'lr': 0.00019976103032297605, 'samples': 939360, 'steps': 1834, 'loss/train': 2.614321231842041} -09/20/2021 20:50:45 - INFO - __main__ - Step 29356: {'lr': 0.00019976103032297605, 'samples': 939392, 'steps': 1834, 'loss/train': 2.8402016162872314} -09/20/2021 20:50:46 - INFO - __main__ - Step 29357: {'lr': 0.00019976103032297605, 'samples': 939424, 'steps': 1834, 'loss/train': 2.956322431564331} -09/20/2021 20:50:47 - INFO - __main__ - Step 29358: {'lr': 0.00019976103032297605, 'samples': 939456, 'steps': 1834, 'loss/train': 1.5932263135910034} -09/20/2021 20:50:47 - INFO - __main__ - Step 29359: {'lr': 0.00019976103032297605, 'samples': 939488, 'steps': 1834, 'loss/train': 2.683847188949585} -09/20/2021 20:50:48 - INFO - __main__ - Step 29360: {'lr': 0.00019976103032297605, 'samples': 939520, 'steps': 1834, 'loss/train': 2.480515956878662} -09/20/2021 20:50:49 - INFO - __main__ - Step 29361: {'lr': 0.0001997605893922378, 'samples': 939552, 'steps': 1835, 'loss/train': 2.6977148056030273} -09/20/2021 20:50:50 - INFO - __main__ - Step 29362: {'lr': 0.0001997605893922378, 'samples': 939584, 'steps': 1835, 'loss/train': 2.1429951190948486} -09/20/2021 20:50:51 - INFO - __main__ - Step 29363: {'lr': 0.0001997605893922378, 'samples': 939616, 'steps': 1835, 'loss/train': 3.040372848510742} -09/20/2021 20:50:51 - INFO - __main__ - Step 29364: {'lr': 0.0001997605893922378, 'samples': 939648, 'steps': 1835, 'loss/train': 3.0048675537109375} -09/20/2021 20:50:52 - INFO - __main__ - Step 29365: {'lr': 0.0001997605893922378, 'samples': 939680, 'steps': 1835, 'loss/train': 2.4757862091064453} -09/20/2021 20:50:53 - INFO - __main__ - Step 29366: {'lr': 0.0001997605893922378, 'samples': 939712, 'steps': 1835, 'loss/train': 2.748789072036743} -09/20/2021 20:50:54 - INFO - __main__ - Step 29367: {'lr': 0.0001997605893922378, 'samples': 939744, 'steps': 1835, 'loss/train': 3.768001079559326} -09/20/2021 20:50:54 - INFO - __main__ - Step 29368: {'lr': 0.0001997605893922378, 'samples': 939776, 'steps': 1835, 'loss/train': 3.690941333770752} -09/20/2021 20:50:55 - INFO - __main__ - Step 29369: {'lr': 0.0001997605893922378, 'samples': 939808, 'steps': 1835, 'loss/train': 2.931164264678955} -09/20/2021 20:50:56 - INFO - __main__ - Step 29370: {'lr': 0.0001997605893922378, 'samples': 939840, 'steps': 1835, 'loss/train': 2.3574094772338867} -09/20/2021 20:50:57 - INFO - __main__ - Step 29371: {'lr': 0.0001997605893922378, 'samples': 939872, 'steps': 1835, 'loss/train': 2.534374237060547} -09/20/2021 20:50:57 - INFO - __main__ - Step 29372: {'lr': 0.0001997605893922378, 'samples': 939904, 'steps': 1835, 'loss/train': 2.7085583209991455} -09/20/2021 20:50:58 - INFO - __main__ - Step 29373: {'lr': 0.0001997605893922378, 'samples': 939936, 'steps': 1835, 'loss/train': 1.4067984819412231} -09/20/2021 20:50:59 - INFO - __main__ - Step 29374: {'lr': 0.0001997605893922378, 'samples': 939968, 'steps': 1835, 'loss/train': 2.8071351051330566} -09/20/2021 20:51:00 - INFO - __main__ - Step 29375: {'lr': 0.0001997605893922378, 'samples': 940000, 'steps': 1835, 'loss/train': 2.5129168033599854} -09/20/2021 20:51:00 - INFO - __main__ - Step 29376: {'lr': 0.0001997605893922378, 'samples': 940032, 'steps': 1835, 'loss/train': 2.4185469150543213} -09/20/2021 20:51:01 - INFO - __main__ - Step 29377: {'lr': 0.00019976014805557415, 'samples': 940064, 'steps': 1836, 'loss/train': 3.4833061695098877} -09/20/2021 20:51:02 - INFO - __main__ - Step 29378: {'lr': 0.00019976014805557415, 'samples': 940096, 'steps': 1836, 'loss/train': 2.246187448501587} -09/20/2021 20:51:03 - INFO - __main__ - Step 29379: {'lr': 0.00019976014805557415, 'samples': 940128, 'steps': 1836, 'loss/train': 2.8869802951812744} -09/20/2021 20:51:04 - INFO - __main__ - Step 29380: {'lr': 0.00019976014805557415, 'samples': 940160, 'steps': 1836, 'loss/train': 1.9319435358047485} -09/20/2021 20:51:05 - INFO - __main__ - Step 29381: {'lr': 0.00019976014805557415, 'samples': 940192, 'steps': 1836, 'loss/train': 3.296565532684326} -09/20/2021 20:51:06 - INFO - __main__ - Step 29382: {'lr': 0.00019976014805557415, 'samples': 940224, 'steps': 1836, 'loss/train': 3.959063768386841} -09/20/2021 20:51:06 - INFO - __main__ - Step 29383: {'lr': 0.00019976014805557415, 'samples': 940256, 'steps': 1836, 'loss/train': 2.803668975830078} -09/20/2021 20:51:07 - INFO - __main__ - Step 29384: {'lr': 0.00019976014805557415, 'samples': 940288, 'steps': 1836, 'loss/train': 1.716361403465271} -09/20/2021 20:51:08 - INFO - __main__ - Step 29385: {'lr': 0.00019976014805557415, 'samples': 940320, 'steps': 1836, 'loss/train': 0.8769187331199646} -09/20/2021 20:51:09 - INFO - __main__ - Step 29386: {'lr': 0.00019976014805557415, 'samples': 940352, 'steps': 1836, 'loss/train': 2.6390044689178467} -09/20/2021 20:51:09 - INFO - __main__ - Step 29387: {'lr': 0.00019976014805557415, 'samples': 940384, 'steps': 1836, 'loss/train': 2.4195761680603027} -09/20/2021 20:51:10 - INFO - __main__ - Step 29388: {'lr': 0.00019976014805557415, 'samples': 940416, 'steps': 1836, 'loss/train': 3.338467836380005} -09/20/2021 20:51:11 - INFO - __main__ - Step 29389: {'lr': 0.00019976014805557415, 'samples': 940448, 'steps': 1836, 'loss/train': 3.604020118713379} -09/20/2021 20:51:12 - INFO - __main__ - Step 29390: {'lr': 0.00019976014805557415, 'samples': 940480, 'steps': 1836, 'loss/train': 2.3840324878692627} -09/20/2021 20:51:12 - INFO - __main__ - Step 29391: {'lr': 0.00019976014805557415, 'samples': 940512, 'steps': 1836, 'loss/train': 2.4427614212036133} -09/20/2021 20:51:13 - INFO - __main__ - Step 29392: {'lr': 0.00019976014805557415, 'samples': 940544, 'steps': 1836, 'loss/train': 1.7724111080169678} -09/20/2021 20:51:14 - INFO - __main__ - Step 29393: {'lr': 0.0001997597063129868, 'samples': 940576, 'steps': 1837, 'loss/train': 2.2862846851348877} -09/20/2021 20:51:15 - INFO - __main__ - Step 29394: {'lr': 0.0001997597063129868, 'samples': 940608, 'steps': 1837, 'loss/train': 2.9920294284820557} -09/20/2021 20:51:15 - INFO - __main__ - Step 29395: {'lr': 0.0001997597063129868, 'samples': 940640, 'steps': 1837, 'loss/train': 3.3923442363739014} -09/20/2021 20:51:16 - INFO - __main__ - Step 29396: {'lr': 0.0001997597063129868, 'samples': 940672, 'steps': 1837, 'loss/train': 3.0030055046081543} -09/20/2021 20:51:17 - INFO - __main__ - Step 29397: {'lr': 0.0001997597063129868, 'samples': 940704, 'steps': 1837, 'loss/train': 2.955777645111084} -09/20/2021 20:51:18 - INFO - __main__ - Step 29398: {'lr': 0.0001997597063129868, 'samples': 940736, 'steps': 1837, 'loss/train': 2.979018211364746} -09/20/2021 20:51:18 - INFO - __main__ - Step 29399: {'lr': 0.0001997597063129868, 'samples': 940768, 'steps': 1837, 'loss/train': 3.086519718170166} -09/20/2021 20:51:19 - INFO - __main__ - Step 29400: {'lr': 0.0001997597063129868, 'samples': 940800, 'steps': 1837, 'loss/train': 3.0374224185943604} -09/20/2021 20:51:20 - INFO - __main__ - Step 29401: {'lr': 0.0001997597063129868, 'samples': 940832, 'steps': 1837, 'loss/train': 2.44107985496521} -09/20/2021 20:51:21 - INFO - __main__ - Step 29402: {'lr': 0.0001997597063129868, 'samples': 940864, 'steps': 1837, 'loss/train': 3.6651830673217773} -09/20/2021 20:51:21 - INFO - __main__ - Step 29403: {'lr': 0.0001997597063129868, 'samples': 940896, 'steps': 1837, 'loss/train': 3.487973213195801} -09/20/2021 20:51:22 - INFO - __main__ - Step 29404: {'lr': 0.0001997597063129868, 'samples': 940928, 'steps': 1837, 'loss/train': 3.59315824508667} -09/20/2021 20:51:23 - INFO - __main__ - Step 29405: {'lr': 0.0001997597063129868, 'samples': 940960, 'steps': 1837, 'loss/train': 2.9020144939422607} -09/20/2021 20:51:24 - INFO - __main__ - Step 29406: {'lr': 0.0001997597063129868, 'samples': 940992, 'steps': 1837, 'loss/train': 3.1193177700042725} -09/20/2021 20:51:24 - INFO - __main__ - Step 29407: {'lr': 0.0001997597063129868, 'samples': 941024, 'steps': 1837, 'loss/train': 2.9559731483459473} -09/20/2021 20:51:25 - INFO - __main__ - Step 29408: {'lr': 0.0001997597063129868, 'samples': 941056, 'steps': 1837, 'loss/train': 2.4607057571411133} -09/20/2021 20:51:26 - INFO - __main__ - Step 29409: {'lr': 0.00019975926416447763, 'samples': 941088, 'steps': 1838, 'loss/train': 2.7596042156219482} -09/20/2021 20:51:27 - INFO - __main__ - Step 29410: {'lr': 0.00019975926416447763, 'samples': 941120, 'steps': 1838, 'loss/train': 2.074587345123291} -09/20/2021 20:51:28 - INFO - __main__ - Step 29411: {'lr': 0.00019975926416447763, 'samples': 941152, 'steps': 1838, 'loss/train': 2.5350966453552246} -09/20/2021 20:51:29 - INFO - __main__ - Step 29412: {'lr': 0.00019975926416447763, 'samples': 941184, 'steps': 1838, 'loss/train': 2.67691707611084} -09/20/2021 20:51:30 - INFO - __main__ - Step 29413: {'lr': 0.00019975926416447763, 'samples': 941216, 'steps': 1838, 'loss/train': 2.8200669288635254} -09/20/2021 20:51:30 - INFO - __main__ - Step 29414: {'lr': 0.00019975926416447763, 'samples': 941248, 'steps': 1838, 'loss/train': 1.0920971632003784} -09/20/2021 20:51:31 - INFO - __main__ - Step 29415: {'lr': 0.00019975926416447763, 'samples': 941280, 'steps': 1838, 'loss/train': 3.880044937133789} -09/20/2021 20:51:32 - INFO - __main__ - Step 29416: {'lr': 0.00019975926416447763, 'samples': 941312, 'steps': 1838, 'loss/train': 2.3870015144348145} -09/20/2021 20:51:33 - INFO - __main__ - Step 29417: {'lr': 0.00019975926416447763, 'samples': 941344, 'steps': 1838, 'loss/train': 2.5180373191833496} -09/20/2021 20:51:33 - INFO - __main__ - Step 29418: {'lr': 0.00019975926416447763, 'samples': 941376, 'steps': 1838, 'loss/train': 3.0336251258850098} -09/20/2021 20:51:34 - INFO - __main__ - Step 29419: {'lr': 0.00019975926416447763, 'samples': 941408, 'steps': 1838, 'loss/train': 2.538968563079834} -09/20/2021 20:51:35 - INFO - __main__ - Step 29420: {'lr': 0.00019975926416447763, 'samples': 941440, 'steps': 1838, 'loss/train': 2.9654221534729004} -09/20/2021 20:51:36 - INFO - __main__ - Step 29421: {'lr': 0.00019975926416447763, 'samples': 941472, 'steps': 1838, 'loss/train': 2.389765739440918} -09/20/2021 20:51:36 - INFO - __main__ - Step 29422: {'lr': 0.00019975926416447763, 'samples': 941504, 'steps': 1838, 'loss/train': 2.3534743785858154} -09/20/2021 20:51:37 - INFO - __main__ - Step 29423: {'lr': 0.00019975926416447763, 'samples': 941536, 'steps': 1838, 'loss/train': 0.9803080558776855} -09/20/2021 20:51:38 - INFO - __main__ - Step 29424: {'lr': 0.00019975926416447763, 'samples': 941568, 'steps': 1838, 'loss/train': 0.9162583351135254} -09/20/2021 20:51:39 - INFO - __main__ - Step 29425: {'lr': 0.00019975882161004838, 'samples': 941600, 'steps': 1839, 'loss/train': 2.726172924041748} -09/20/2021 20:51:40 - INFO - __main__ - Step 29426: {'lr': 0.00019975882161004838, 'samples': 941632, 'steps': 1839, 'loss/train': 3.7662463188171387} -09/20/2021 20:51:40 - INFO - __main__ - Step 29427: {'lr': 0.00019975882161004838, 'samples': 941664, 'steps': 1839, 'loss/train': 1.5817512273788452} -09/20/2021 20:51:41 - INFO - __main__ - Step 29428: {'lr': 0.00019975882161004838, 'samples': 941696, 'steps': 1839, 'loss/train': 2.1695966720581055} -09/20/2021 20:51:42 - INFO - __main__ - Step 29429: {'lr': 0.00019975882161004838, 'samples': 941728, 'steps': 1839, 'loss/train': 2.0059261322021484} -09/20/2021 20:51:43 - INFO - __main__ - Step 29430: {'lr': 0.00019975882161004838, 'samples': 941760, 'steps': 1839, 'loss/train': 1.1852729320526123} -09/20/2021 20:51:43 - INFO - __main__ - Step 29431: {'lr': 0.00019975882161004838, 'samples': 941792, 'steps': 1839, 'loss/train': 2.0619068145751953} -09/20/2021 20:51:44 - INFO - __main__ - Step 29432: {'lr': 0.00019975882161004838, 'samples': 941824, 'steps': 1839, 'loss/train': 2.2940173149108887} -09/20/2021 20:51:45 - INFO - __main__ - Step 29433: {'lr': 0.00019975882161004838, 'samples': 941856, 'steps': 1839, 'loss/train': 2.3049325942993164} -09/20/2021 20:51:46 - INFO - __main__ - Step 29434: {'lr': 0.00019975882161004838, 'samples': 941888, 'steps': 1839, 'loss/train': 2.292675733566284} -09/20/2021 20:51:46 - INFO - __main__ - Step 29435: {'lr': 0.00019975882161004838, 'samples': 941920, 'steps': 1839, 'loss/train': 2.9710774421691895} -09/20/2021 20:51:47 - INFO - __main__ - Step 29436: {'lr': 0.00019975882161004838, 'samples': 941952, 'steps': 1839, 'loss/train': 2.2231574058532715} -09/20/2021 20:51:48 - INFO - __main__ - Step 29437: {'lr': 0.00019975882161004838, 'samples': 941984, 'steps': 1839, 'loss/train': 2.893602132797241} -09/20/2021 20:51:49 - INFO - __main__ - Step 29438: {'lr': 0.00019975882161004838, 'samples': 942016, 'steps': 1839, 'loss/train': 2.636289119720459} -09/20/2021 20:51:49 - INFO - __main__ - Step 29439: {'lr': 0.00019975882161004838, 'samples': 942048, 'steps': 1839, 'loss/train': 3.048495292663574} -09/20/2021 20:51:50 - INFO - __main__ - Step 29440: {'lr': 0.00019975882161004838, 'samples': 942080, 'steps': 1839, 'loss/train': 2.9103479385375977} -09/20/2021 20:51:51 - INFO - __main__ - Step 29441: {'lr': 0.00019975837864970092, 'samples': 942112, 'steps': 1840, 'loss/train': 1.2441000938415527} -09/20/2021 20:51:52 - INFO - __main__ - Step 29442: {'lr': 0.00019975837864970092, 'samples': 942144, 'steps': 1840, 'loss/train': 6.479910373687744} -09/20/2021 20:51:52 - INFO - __main__ - Step 29443: {'lr': 0.00019975837864970092, 'samples': 942176, 'steps': 1840, 'loss/train': 6.390378475189209} -09/20/2021 20:51:53 - INFO - __main__ - Step 29444: {'lr': 0.00019975837864970092, 'samples': 942208, 'steps': 1840, 'loss/train': 6.564370155334473} -09/20/2021 20:51:54 - INFO - __main__ - Step 29445: {'lr': 0.00019975837864970092, 'samples': 942240, 'steps': 1840, 'loss/train': 6.499022483825684} -09/20/2021 20:51:55 - INFO - __main__ - Step 29446: {'lr': 0.00019975837864970092, 'samples': 942272, 'steps': 1840, 'loss/train': 2.641328811645508} -09/20/2021 20:51:56 - INFO - __main__ - Step 29447: {'lr': 0.00019975837864970092, 'samples': 942304, 'steps': 1840, 'loss/train': 3.612820625305176} -09/20/2021 20:51:57 - INFO - __main__ - Step 29448: {'lr': 0.00019975837864970092, 'samples': 942336, 'steps': 1840, 'loss/train': 2.199638605117798} -09/20/2021 20:51:57 - INFO - __main__ - Step 29449: {'lr': 0.00019975837864970092, 'samples': 942368, 'steps': 1840, 'loss/train': 0.39924901723861694} -09/20/2021 20:51:58 - INFO - __main__ - Step 29450: {'lr': 0.00019975837864970092, 'samples': 942400, 'steps': 1840, 'loss/train': 2.6506543159484863} -09/20/2021 20:51:59 - INFO - __main__ - Step 29451: {'lr': 0.00019975837864970092, 'samples': 942432, 'steps': 1840, 'loss/train': 2.2247419357299805} -09/20/2021 20:52:00 - INFO - __main__ - Step 29452: {'lr': 0.00019975837864970092, 'samples': 942464, 'steps': 1840, 'loss/train': 2.164644479751587} -09/20/2021 20:52:00 - INFO - __main__ - Step 29453: {'lr': 0.00019975837864970092, 'samples': 942496, 'steps': 1840, 'loss/train': 2.0198705196380615} -09/20/2021 20:52:01 - INFO - __main__ - Step 29454: {'lr': 0.00019975837864970092, 'samples': 942528, 'steps': 1840, 'loss/train': 2.883810520172119} -09/20/2021 20:52:02 - INFO - __main__ - Step 29455: {'lr': 0.00019975837864970092, 'samples': 942560, 'steps': 1840, 'loss/train': 3.48584246635437} -09/20/2021 20:52:03 - INFO - __main__ - Step 29456: {'lr': 0.00019975837864970092, 'samples': 942592, 'steps': 1840, 'loss/train': 1.5666441917419434} -09/20/2021 20:52:04 - INFO - __main__ - Step 29457: {'lr': 0.00019975793528343694, 'samples': 942624, 'steps': 1841, 'loss/train': 2.37367844581604} -09/20/2021 20:52:04 - INFO - __main__ - Step 29458: {'lr': 0.00019975793528343694, 'samples': 942656, 'steps': 1841, 'loss/train': 2.332071542739868} -09/20/2021 20:52:05 - INFO - __main__ - Step 29459: {'lr': 0.00019975793528343694, 'samples': 942688, 'steps': 1841, 'loss/train': 3.4252617359161377} -09/20/2021 20:52:06 - INFO - __main__ - Step 29460: {'lr': 0.00019975793528343694, 'samples': 942720, 'steps': 1841, 'loss/train': 2.307555913925171} -09/20/2021 20:52:07 - INFO - __main__ - Step 29461: {'lr': 0.00019975793528343694, 'samples': 942752, 'steps': 1841, 'loss/train': 2.8322396278381348} -09/20/2021 20:52:07 - INFO - __main__ - Step 29462: {'lr': 0.00019975793528343694, 'samples': 942784, 'steps': 1841, 'loss/train': 1.9147599935531616} -09/20/2021 20:52:08 - INFO - __main__ - Step 29463: {'lr': 0.00019975793528343694, 'samples': 942816, 'steps': 1841, 'loss/train': 2.458171844482422} -09/20/2021 20:52:09 - INFO - __main__ - Step 29464: {'lr': 0.00019975793528343694, 'samples': 942848, 'steps': 1841, 'loss/train': 2.7946038246154785} -09/20/2021 20:52:10 - INFO - __main__ - Step 29465: {'lr': 0.00019975793528343694, 'samples': 942880, 'steps': 1841, 'loss/train': 2.7930874824523926} -09/20/2021 20:52:10 - INFO - __main__ - Step 29466: {'lr': 0.00019975793528343694, 'samples': 942912, 'steps': 1841, 'loss/train': 1.6471805572509766} -09/20/2021 20:52:11 - INFO - __main__ - Step 29467: {'lr': 0.00019975793528343694, 'samples': 942944, 'steps': 1841, 'loss/train': 3.274182081222534} -09/20/2021 20:52:12 - INFO - __main__ - Step 29468: {'lr': 0.00019975793528343694, 'samples': 942976, 'steps': 1841, 'loss/train': 2.9061710834503174} -09/20/2021 20:52:13 - INFO - __main__ - Step 29469: {'lr': 0.00019975793528343694, 'samples': 943008, 'steps': 1841, 'loss/train': 2.8823049068450928} -09/20/2021 20:52:13 - INFO - __main__ - Step 29470: {'lr': 0.00019975793528343694, 'samples': 943040, 'steps': 1841, 'loss/train': 3.519038438796997} -09/20/2021 20:52:14 - INFO - __main__ - Step 29471: {'lr': 0.00019975793528343694, 'samples': 943072, 'steps': 1841, 'loss/train': 2.4864511489868164} -09/20/2021 20:52:15 - INFO - __main__ - Step 29472: {'lr': 0.00019975793528343694, 'samples': 943104, 'steps': 1841, 'loss/train': 1.474003791809082} -09/20/2021 20:52:16 - INFO - __main__ - Step 29473: {'lr': 0.00019975749151125832, 'samples': 943136, 'steps': 1842, 'loss/train': 3.4940855503082275} -09/20/2021 20:52:16 - INFO - __main__ - Step 29474: {'lr': 0.00019975749151125832, 'samples': 943168, 'steps': 1842, 'loss/train': 1.8912107944488525} -09/20/2021 20:52:17 - INFO - __main__ - Step 29475: {'lr': 0.00019975749151125832, 'samples': 943200, 'steps': 1842, 'loss/train': 1.9106240272521973} -09/20/2021 20:52:19 - INFO - __main__ - Step 29476: {'lr': 0.00019975749151125832, 'samples': 943232, 'steps': 1842, 'loss/train': 2.7027735710144043} -09/20/2021 20:52:19 - INFO - __main__ - Step 29477: {'lr': 0.00019975749151125832, 'samples': 943264, 'steps': 1842, 'loss/train': 2.632143020629883} -09/20/2021 20:52:20 - INFO - __main__ - Step 29478: {'lr': 0.00019975749151125832, 'samples': 943296, 'steps': 1842, 'loss/train': 2.305506944656372} -09/20/2021 20:52:21 - INFO - __main__ - Step 29479: {'lr': 0.00019975749151125832, 'samples': 943328, 'steps': 1842, 'loss/train': 2.864374876022339} -09/20/2021 20:52:21 - INFO - __main__ - Step 29480: {'lr': 0.00019975749151125832, 'samples': 943360, 'steps': 1842, 'loss/train': 2.0291645526885986} -09/20/2021 20:52:22 - INFO - __main__ - Step 29481: {'lr': 0.00019975749151125832, 'samples': 943392, 'steps': 1842, 'loss/train': 2.216878652572632} -09/20/2021 20:52:23 - INFO - __main__ - Step 29482: {'lr': 0.00019975749151125832, 'samples': 943424, 'steps': 1842, 'loss/train': 2.1364617347717285} -09/20/2021 20:52:24 - INFO - __main__ - Step 29483: {'lr': 0.00019975749151125832, 'samples': 943456, 'steps': 1842, 'loss/train': 2.295565128326416} -09/20/2021 20:52:24 - INFO - __main__ - Step 29484: {'lr': 0.00019975749151125832, 'samples': 943488, 'steps': 1842, 'loss/train': 2.7340548038482666} -09/20/2021 20:52:25 - INFO - __main__ - Step 29485: {'lr': 0.00019975749151125832, 'samples': 943520, 'steps': 1842, 'loss/train': 1.9064407348632812} -09/20/2021 20:52:26 - INFO - __main__ - Step 29486: {'lr': 0.00019975749151125832, 'samples': 943552, 'steps': 1842, 'loss/train': 2.002394676208496} -09/20/2021 20:52:27 - INFO - __main__ - Step 29487: {'lr': 0.00019975749151125832, 'samples': 943584, 'steps': 1842, 'loss/train': 2.845435380935669} -09/20/2021 20:52:27 - INFO - __main__ - Step 29488: {'lr': 0.00019975749151125832, 'samples': 943616, 'steps': 1842, 'loss/train': 2.467040538787842} -09/20/2021 20:52:28 - INFO - __main__ - Step 29489: {'lr': 0.00019975704733316688, 'samples': 943648, 'steps': 1843, 'loss/train': 2.110305070877075} -09/20/2021 20:52:29 - INFO - __main__ - Step 29490: {'lr': 0.00019975704733316688, 'samples': 943680, 'steps': 1843, 'loss/train': 2.3613367080688477} -09/20/2021 20:52:30 - INFO - __main__ - Step 29491: {'lr': 0.00019975704733316688, 'samples': 943712, 'steps': 1843, 'loss/train': 1.2101738452911377} -09/20/2021 20:52:31 - INFO - __main__ - Step 29492: {'lr': 0.00019975704733316688, 'samples': 943744, 'steps': 1843, 'loss/train': 2.620420455932617} -09/20/2021 20:52:31 - INFO - __main__ - Step 29493: {'lr': 0.00019975704733316688, 'samples': 943776, 'steps': 1843, 'loss/train': 3.854557514190674} -09/20/2021 20:52:32 - INFO - __main__ - Step 29494: {'lr': 0.00019975704733316688, 'samples': 943808, 'steps': 1843, 'loss/train': 2.8841264247894287} -09/20/2021 20:52:33 - INFO - __main__ - Step 29495: {'lr': 0.00019975704733316688, 'samples': 943840, 'steps': 1843, 'loss/train': 2.972966194152832} -09/20/2021 20:52:34 - INFO - __main__ - Step 29496: {'lr': 0.00019975704733316688, 'samples': 943872, 'steps': 1843, 'loss/train': 2.4642515182495117} -09/20/2021 20:52:34 - INFO - __main__ - Step 29497: {'lr': 0.00019975704733316688, 'samples': 943904, 'steps': 1843, 'loss/train': 0.655433714389801} -09/20/2021 20:52:35 - INFO - __main__ - Step 29498: {'lr': 0.00019975704733316688, 'samples': 943936, 'steps': 1843, 'loss/train': 2.9196319580078125} -09/20/2021 20:52:36 - INFO - __main__ - Step 29499: {'lr': 0.00019975704733316688, 'samples': 943968, 'steps': 1843, 'loss/train': 3.185805082321167} -09/20/2021 20:52:37 - INFO - __main__ - Step 29500: {'lr': 0.00019975704733316688, 'samples': 944000, 'steps': 1843, 'loss/train': 2.7359440326690674} -09/20/2021 20:52:37 - INFO - __main__ - Step 29501: {'lr': 0.00019975704733316688, 'samples': 944032, 'steps': 1843, 'loss/train': 1.8544566631317139} -09/20/2021 20:52:38 - INFO - __main__ - Step 29502: {'lr': 0.00019975704733316688, 'samples': 944064, 'steps': 1843, 'loss/train': 3.120868682861328} -09/20/2021 20:52:39 - INFO - __main__ - Step 29503: {'lr': 0.00019975704733316688, 'samples': 944096, 'steps': 1843, 'loss/train': 2.8314740657806396} -09/20/2021 20:52:40 - INFO - __main__ - Step 29504: {'lr': 0.00019975704733316688, 'samples': 944128, 'steps': 1843, 'loss/train': 2.2231783866882324} -09/20/2021 20:52:41 - INFO - __main__ - Step 29505: {'lr': 0.0001997566027491644, 'samples': 944160, 'steps': 1844, 'loss/train': 2.279350996017456} -09/20/2021 20:52:41 - INFO - __main__ - Step 29506: {'lr': 0.0001997566027491644, 'samples': 944192, 'steps': 1844, 'loss/train': 2.4669175148010254} -09/20/2021 20:52:42 - INFO - __main__ - Step 29507: {'lr': 0.0001997566027491644, 'samples': 944224, 'steps': 1844, 'loss/train': 3.287700653076172} -09/20/2021 20:52:43 - INFO - __main__ - Step 29508: {'lr': 0.0001997566027491644, 'samples': 944256, 'steps': 1844, 'loss/train': 2.206444263458252} -09/20/2021 20:52:44 - INFO - __main__ - Step 29509: {'lr': 0.0001997566027491644, 'samples': 944288, 'steps': 1844, 'loss/train': 1.778831958770752} -09/20/2021 20:52:45 - INFO - __main__ - Step 29510: {'lr': 0.0001997566027491644, 'samples': 944320, 'steps': 1844, 'loss/train': 2.103806495666504} -09/20/2021 20:52:45 - INFO - __main__ - Step 29511: {'lr': 0.0001997566027491644, 'samples': 944352, 'steps': 1844, 'loss/train': 2.1411375999450684} -09/20/2021 20:52:46 - INFO - __main__ - Step 29512: {'lr': 0.0001997566027491644, 'samples': 944384, 'steps': 1844, 'loss/train': 0.5806547999382019} -09/20/2021 20:52:47 - INFO - __main__ - Step 29513: {'lr': 0.0001997566027491644, 'samples': 944416, 'steps': 1844, 'loss/train': 2.0421931743621826} -09/20/2021 20:52:48 - INFO - __main__ - Step 29514: {'lr': 0.0001997566027491644, 'samples': 944448, 'steps': 1844, 'loss/train': 2.526278495788574} -09/20/2021 20:52:48 - INFO - __main__ - Step 29515: {'lr': 0.0001997566027491644, 'samples': 944480, 'steps': 1844, 'loss/train': 3.3628830909729004} -09/20/2021 20:52:49 - INFO - __main__ - Step 29516: {'lr': 0.0001997566027491644, 'samples': 944512, 'steps': 1844, 'loss/train': 2.0589609146118164} -09/20/2021 20:52:50 - INFO - __main__ - Step 29517: {'lr': 0.0001997566027491644, 'samples': 944544, 'steps': 1844, 'loss/train': 2.486453056335449} -09/20/2021 20:52:51 - INFO - __main__ - Step 29518: {'lr': 0.0001997566027491644, 'samples': 944576, 'steps': 1844, 'loss/train': 2.9167237281799316} -09/20/2021 20:52:51 - INFO - __main__ - Step 29519: {'lr': 0.0001997566027491644, 'samples': 944608, 'steps': 1844, 'loss/train': 2.2517364025115967} -09/20/2021 20:52:52 - INFO - __main__ - Step 29520: {'lr': 0.0001997566027491644, 'samples': 944640, 'steps': 1844, 'loss/train': 2.4068410396575928} -09/20/2021 20:52:53 - INFO - __main__ - Step 29521: {'lr': 0.00019975615775925267, 'samples': 944672, 'steps': 1845, 'loss/train': 2.347752332687378} -09/20/2021 20:52:54 - INFO - __main__ - Step 29522: {'lr': 0.00019975615775925267, 'samples': 944704, 'steps': 1845, 'loss/train': 1.6901788711547852} -09/20/2021 20:52:55 - INFO - __main__ - Step 29523: {'lr': 0.00019975615775925267, 'samples': 944736, 'steps': 1845, 'loss/train': 2.447422981262207} -09/20/2021 20:52:55 - INFO - __main__ - Step 29524: {'lr': 0.00019975615775925267, 'samples': 944768, 'steps': 1845, 'loss/train': 3.451293706893921} -09/20/2021 20:52:56 - INFO - __main__ - Step 29525: {'lr': 0.00019975615775925267, 'samples': 944800, 'steps': 1845, 'loss/train': 2.2889928817749023} -09/20/2021 20:52:57 - INFO - __main__ - Step 29526: {'lr': 0.00019975615775925267, 'samples': 944832, 'steps': 1845, 'loss/train': 2.277967929840088} -09/20/2021 20:52:58 - INFO - __main__ - Step 29527: {'lr': 0.00019975615775925267, 'samples': 944864, 'steps': 1845, 'loss/train': 3.0520389080047607} -09/20/2021 20:52:58 - INFO - __main__ - Step 29528: {'lr': 0.00019975615775925267, 'samples': 944896, 'steps': 1845, 'loss/train': 2.992295980453491} -09/20/2021 20:52:59 - INFO - __main__ - Step 29529: {'lr': 0.00019975615775925267, 'samples': 944928, 'steps': 1845, 'loss/train': 2.644596815109253} -09/20/2021 20:53:00 - INFO - __main__ - Step 29530: {'lr': 0.00019975615775925267, 'samples': 944960, 'steps': 1845, 'loss/train': 2.331263542175293} -09/20/2021 20:53:01 - INFO - __main__ - Step 29531: {'lr': 0.00019975615775925267, 'samples': 944992, 'steps': 1845, 'loss/train': 2.0837862491607666} -09/20/2021 20:53:01 - INFO - __main__ - Step 29532: {'lr': 0.00019975615775925267, 'samples': 945024, 'steps': 1845, 'loss/train': 2.6895625591278076} -09/20/2021 20:53:02 - INFO - __main__ - Step 29533: {'lr': 0.00019975615775925267, 'samples': 945056, 'steps': 1845, 'loss/train': 2.1715643405914307} -09/20/2021 20:53:03 - INFO - __main__ - Step 29534: {'lr': 0.00019975615775925267, 'samples': 945088, 'steps': 1845, 'loss/train': 2.2024950981140137} -09/20/2021 20:53:04 - INFO - __main__ - Step 29535: {'lr': 0.00019975615775925267, 'samples': 945120, 'steps': 1845, 'loss/train': 2.0284743309020996} -09/20/2021 20:53:04 - INFO - __main__ - Step 29536: {'lr': 0.00019975615775925267, 'samples': 945152, 'steps': 1845, 'loss/train': 2.063971996307373} -09/20/2021 20:53:05 - INFO - __main__ - Step 29537: {'lr': 0.00019975571236343354, 'samples': 945184, 'steps': 1846, 'loss/train': 2.085207939147949} -09/20/2021 20:53:07 - INFO - __main__ - Step 29538: {'lr': 0.00019975571236343354, 'samples': 945216, 'steps': 1846, 'loss/train': 2.723686456680298} -09/20/2021 20:53:07 - INFO - __main__ - Step 29539: {'lr': 0.00019975571236343354, 'samples': 945248, 'steps': 1846, 'loss/train': 1.7319411039352417} -09/20/2021 20:53:08 - INFO - __main__ - Step 29540: {'lr': 0.00019975571236343354, 'samples': 945280, 'steps': 1846, 'loss/train': 2.664851427078247} -09/20/2021 20:53:09 - INFO - __main__ - Step 29541: {'lr': 0.00019975571236343354, 'samples': 945312, 'steps': 1846, 'loss/train': 3.1346800327301025} -09/20/2021 20:53:10 - INFO - __main__ - Step 29542: {'lr': 0.00019975571236343354, 'samples': 945344, 'steps': 1846, 'loss/train': 1.743039846420288} -09/20/2021 20:53:10 - INFO - __main__ - Step 29543: {'lr': 0.00019975571236343354, 'samples': 945376, 'steps': 1846, 'loss/train': 2.8278985023498535} -09/20/2021 20:53:11 - INFO - __main__ - Step 29544: {'lr': 0.00019975571236343354, 'samples': 945408, 'steps': 1846, 'loss/train': 2.439211368560791} -09/20/2021 20:53:12 - INFO - __main__ - Step 29545: {'lr': 0.00019975571236343354, 'samples': 945440, 'steps': 1846, 'loss/train': 2.6049716472625732} -09/20/2021 20:53:13 - INFO - __main__ - Step 29546: {'lr': 0.00019975571236343354, 'samples': 945472, 'steps': 1846, 'loss/train': 0.6708889603614807} -09/20/2021 20:53:14 - INFO - __main__ - Step 29547: {'lr': 0.00019975571236343354, 'samples': 945504, 'steps': 1846, 'loss/train': 0.4528043568134308} -09/20/2021 20:53:14 - INFO - __main__ - Step 29548: {'lr': 0.00019975571236343354, 'samples': 945536, 'steps': 1846, 'loss/train': 0.651454508304596} -09/20/2021 20:53:15 - INFO - __main__ - Step 29549: {'lr': 0.00019975571236343354, 'samples': 945568, 'steps': 1846, 'loss/train': 0.4033169150352478} -09/20/2021 20:53:16 - INFO - __main__ - Step 29550: {'lr': 0.00019975571236343354, 'samples': 945600, 'steps': 1846, 'loss/train': 2.5765161514282227} -09/20/2021 20:53:17 - INFO - __main__ - Step 29551: {'lr': 0.00019975571236343354, 'samples': 945632, 'steps': 1846, 'loss/train': 2.8793110847473145} -09/20/2021 20:53:17 - INFO - __main__ - Step 29552: {'lr': 0.00019975571236343354, 'samples': 945664, 'steps': 1846, 'loss/train': 2.650031805038452} -09/20/2021 20:53:18 - INFO - __main__ - Step 29553: {'lr': 0.0001997552665617088, 'samples': 945696, 'steps': 1847, 'loss/train': 2.2095813751220703} -09/20/2021 20:53:19 - INFO - __main__ - Step 29554: {'lr': 0.0001997552665617088, 'samples': 945728, 'steps': 1847, 'loss/train': 2.101405620574951} -09/20/2021 20:53:20 - INFO - __main__ - Step 29555: {'lr': 0.0001997552665617088, 'samples': 945760, 'steps': 1847, 'loss/train': 2.618011951446533} -09/20/2021 20:53:20 - INFO - __main__ - Step 29556: {'lr': 0.0001997552665617088, 'samples': 945792, 'steps': 1847, 'loss/train': 2.326892375946045} -09/20/2021 20:53:21 - INFO - __main__ - Step 29557: {'lr': 0.0001997552665617088, 'samples': 945824, 'steps': 1847, 'loss/train': 3.322638988494873} -09/20/2021 20:53:22 - INFO - __main__ - Step 29558: {'lr': 0.0001997552665617088, 'samples': 945856, 'steps': 1847, 'loss/train': 3.7380852699279785} -09/20/2021 20:53:23 - INFO - __main__ - Step 29559: {'lr': 0.0001997552665617088, 'samples': 945888, 'steps': 1847, 'loss/train': 2.309014081954956} -09/20/2021 20:53:23 - INFO - __main__ - Step 29560: {'lr': 0.0001997552665617088, 'samples': 945920, 'steps': 1847, 'loss/train': 2.8766608238220215} -09/20/2021 20:53:24 - INFO - __main__ - Step 29561: {'lr': 0.0001997552665617088, 'samples': 945952, 'steps': 1847, 'loss/train': 2.029017686843872} -09/20/2021 20:53:25 - INFO - __main__ - Step 29562: {'lr': 0.0001997552665617088, 'samples': 945984, 'steps': 1847, 'loss/train': 2.484647035598755} -09/20/2021 20:53:26 - INFO - __main__ - Step 29563: {'lr': 0.0001997552665617088, 'samples': 946016, 'steps': 1847, 'loss/train': 3.497788906097412} -09/20/2021 20:53:26 - INFO - __main__ - Step 29564: {'lr': 0.0001997552665617088, 'samples': 946048, 'steps': 1847, 'loss/train': 2.644510507583618} -09/20/2021 20:53:27 - INFO - __main__ - Step 29565: {'lr': 0.0001997552665617088, 'samples': 946080, 'steps': 1847, 'loss/train': 2.904655694961548} -09/20/2021 20:53:28 - INFO - __main__ - Step 29566: {'lr': 0.0001997552665617088, 'samples': 946112, 'steps': 1847, 'loss/train': 0.5897837281227112} -09/20/2021 20:53:29 - INFO - __main__ - Step 29567: {'lr': 0.0001997552665617088, 'samples': 946144, 'steps': 1847, 'loss/train': 0.6307170391082764} -09/20/2021 20:53:30 - INFO - __main__ - Step 29568: {'lr': 0.0001997552665617088, 'samples': 946176, 'steps': 1847, 'loss/train': 3.277165174484253} -09/20/2021 20:53:31 - INFO - __main__ - Step 29569: {'lr': 0.00019975482035408025, 'samples': 946208, 'steps': 1848, 'loss/train': 2.443371295928955} -09/20/2021 20:53:32 - INFO - __main__ - Step 29570: {'lr': 0.00019975482035408025, 'samples': 946240, 'steps': 1848, 'loss/train': 2.3107502460479736} -09/20/2021 20:53:32 - INFO - __main__ - Step 29571: {'lr': 0.00019975482035408025, 'samples': 946272, 'steps': 1848, 'loss/train': 2.147120952606201} -09/20/2021 20:53:33 - INFO - __main__ - Step 29572: {'lr': 0.00019975482035408025, 'samples': 946304, 'steps': 1848, 'loss/train': 2.4493861198425293} -09/20/2021 20:53:34 - INFO - __main__ - Step 29573: {'lr': 0.00019975482035408025, 'samples': 946336, 'steps': 1848, 'loss/train': 2.3257391452789307} -09/20/2021 20:53:35 - INFO - __main__ - Step 29574: {'lr': 0.00019975482035408025, 'samples': 946368, 'steps': 1848, 'loss/train': 1.7837421894073486} -09/20/2021 20:53:35 - INFO - __main__ - Step 29575: {'lr': 0.00019975482035408025, 'samples': 946400, 'steps': 1848, 'loss/train': 2.973447799682617} -09/20/2021 20:53:36 - INFO - __main__ - Step 29576: {'lr': 0.00019975482035408025, 'samples': 946432, 'steps': 1848, 'loss/train': 2.292100429534912} -09/20/2021 20:53:37 - INFO - __main__ - Step 29577: {'lr': 0.00019975482035408025, 'samples': 946464, 'steps': 1848, 'loss/train': 3.1045455932617188} -09/20/2021 20:53:38 - INFO - __main__ - Step 29578: {'lr': 0.00019975482035408025, 'samples': 946496, 'steps': 1848, 'loss/train': 1.6867928504943848} -09/20/2021 20:53:38 - INFO - __main__ - Step 29579: {'lr': 0.00019975482035408025, 'samples': 946528, 'steps': 1848, 'loss/train': 2.5606603622436523} -09/20/2021 20:53:39 - INFO - __main__ - Step 29580: {'lr': 0.00019975482035408025, 'samples': 946560, 'steps': 1848, 'loss/train': 2.5673463344573975} -09/20/2021 20:53:40 - INFO - __main__ - Step 29581: {'lr': 0.00019975482035408025, 'samples': 946592, 'steps': 1848, 'loss/train': 2.6303608417510986} -09/20/2021 20:53:41 - INFO - __main__ - Step 29582: {'lr': 0.00019975482035408025, 'samples': 946624, 'steps': 1848, 'loss/train': 1.6777567863464355} -09/20/2021 20:53:41 - INFO - __main__ - Step 29583: {'lr': 0.00019975482035408025, 'samples': 946656, 'steps': 1848, 'loss/train': 2.9105308055877686} -09/20/2021 20:53:42 - INFO - __main__ - Step 29584: {'lr': 0.00019975482035408025, 'samples': 946688, 'steps': 1848, 'loss/train': 2.695284366607666} -09/20/2021 20:53:43 - INFO - __main__ - Step 29585: {'lr': 0.00019975437374054975, 'samples': 946720, 'steps': 1849, 'loss/train': 2.6578354835510254} -09/20/2021 20:53:44 - INFO - __main__ - Step 29586: {'lr': 0.00019975437374054975, 'samples': 946752, 'steps': 1849, 'loss/train': 2.4242162704467773} -09/20/2021 20:53:44 - INFO - __main__ - Step 29587: {'lr': 0.00019975437374054975, 'samples': 946784, 'steps': 1849, 'loss/train': 2.916717052459717} -09/20/2021 20:53:45 - INFO - __main__ - Step 29588: {'lr': 0.00019975437374054975, 'samples': 946816, 'steps': 1849, 'loss/train': 2.5811259746551514} -09/20/2021 20:53:46 - INFO - __main__ - Step 29589: {'lr': 0.00019975437374054975, 'samples': 946848, 'steps': 1849, 'loss/train': 2.468808889389038} -09/20/2021 20:53:47 - INFO - __main__ - Step 29590: {'lr': 0.00019975437374054975, 'samples': 946880, 'steps': 1849, 'loss/train': 2.3060779571533203} -09/20/2021 20:53:47 - INFO - __main__ - Step 29591: {'lr': 0.00019975437374054975, 'samples': 946912, 'steps': 1849, 'loss/train': 3.028102159500122} -09/20/2021 20:53:48 - INFO - __main__ - Step 29592: {'lr': 0.00019975437374054975, 'samples': 946944, 'steps': 1849, 'loss/train': 2.368166446685791} -09/20/2021 20:53:49 - INFO - __main__ - Step 29593: {'lr': 0.00019975437374054975, 'samples': 946976, 'steps': 1849, 'loss/train': 2.4534590244293213} -09/20/2021 20:53:50 - INFO - __main__ - Step 29594: {'lr': 0.00019975437374054975, 'samples': 947008, 'steps': 1849, 'loss/train': 2.5822980403900146} -09/20/2021 20:53:50 - INFO - __main__ - Step 29595: {'lr': 0.00019975437374054975, 'samples': 947040, 'steps': 1849, 'loss/train': 2.956860303878784} -09/20/2021 20:53:51 - INFO - __main__ - Step 29596: {'lr': 0.00019975437374054975, 'samples': 947072, 'steps': 1849, 'loss/train': 2.4210116863250732} -09/20/2021 20:53:52 - INFO - __main__ - Step 29597: {'lr': 0.00019975437374054975, 'samples': 947104, 'steps': 1849, 'loss/train': 1.9651051759719849} -09/20/2021 20:53:53 - INFO - __main__ - Step 29598: {'lr': 0.00019975437374054975, 'samples': 947136, 'steps': 1849, 'loss/train': 2.5526278018951416} -09/20/2021 20:53:54 - INFO - __main__ - Step 29599: {'lr': 0.00019975437374054975, 'samples': 947168, 'steps': 1849, 'loss/train': 2.0428669452667236} -09/20/2021 20:53:55 - INFO - __main__ - Step 29600: {'lr': 0.00019975437374054975, 'samples': 947200, 'steps': 1849, 'loss/train': 2.5425286293029785} -09/20/2021 20:53:56 - INFO - __main__ - Step 29601: {'lr': 0.00019975392672111908, 'samples': 947232, 'steps': 1850, 'loss/train': 2.614130735397339} -09/20/2021 20:53:56 - INFO - __main__ - Step 29602: {'lr': 0.00019975392672111908, 'samples': 947264, 'steps': 1850, 'loss/train': 2.604785919189453} -09/20/2021 20:53:57 - INFO - __main__ - Step 29603: {'lr': 0.00019975392672111908, 'samples': 947296, 'steps': 1850, 'loss/train': 0.2821338474750519} -09/20/2021 20:53:58 - INFO - __main__ - Step 29604: {'lr': 0.00019975392672111908, 'samples': 947328, 'steps': 1850, 'loss/train': 0.33066532015800476} -09/20/2021 20:53:59 - INFO - __main__ - Step 29605: {'lr': 0.00019975392672111908, 'samples': 947360, 'steps': 1850, 'loss/train': 3.2857632637023926} -09/20/2021 20:53:59 - INFO - __main__ - Step 29606: {'lr': 0.00019975392672111908, 'samples': 947392, 'steps': 1850, 'loss/train': 2.6803643703460693} -09/20/2021 20:54:00 - INFO - __main__ - Step 29607: {'lr': 0.00019975392672111908, 'samples': 947424, 'steps': 1850, 'loss/train': 0.4306938946247101} -09/20/2021 20:54:01 - INFO - __main__ - Step 29608: {'lr': 0.00019975392672111908, 'samples': 947456, 'steps': 1850, 'loss/train': 0.6514933705329895} -09/20/2021 20:54:02 - INFO - __main__ - Step 29609: {'lr': 0.00019975392672111908, 'samples': 947488, 'steps': 1850, 'loss/train': 0.34498533606529236} -09/20/2021 20:54:02 - INFO - __main__ - Step 29610: {'lr': 0.00019975392672111908, 'samples': 947520, 'steps': 1850, 'loss/train': 0.3258202075958252} -09/20/2021 20:54:03 - INFO - __main__ - Step 29611: {'lr': 0.00019975392672111908, 'samples': 947552, 'steps': 1850, 'loss/train': 3.4269731044769287} -09/20/2021 20:54:04 - INFO - __main__ - Step 29612: {'lr': 0.00019975392672111908, 'samples': 947584, 'steps': 1850, 'loss/train': 2.352379322052002} -09/20/2021 20:54:05 - INFO - __main__ - Step 29613: {'lr': 0.00019975392672111908, 'samples': 947616, 'steps': 1850, 'loss/train': 2.3295419216156006} -09/20/2021 20:54:05 - INFO - __main__ - Step 29614: {'lr': 0.00019975392672111908, 'samples': 947648, 'steps': 1850, 'loss/train': 3.0910816192626953} -09/20/2021 20:54:06 - INFO - __main__ - Step 29615: {'lr': 0.00019975392672111908, 'samples': 947680, 'steps': 1850, 'loss/train': 1.8711107969284058} -09/20/2021 20:54:07 - INFO - __main__ - Step 29616: {'lr': 0.00019975392672111908, 'samples': 947712, 'steps': 1850, 'loss/train': 2.4956841468811035} -09/20/2021 20:54:08 - INFO - __main__ - Step 29617: {'lr': 0.00019975347929579004, 'samples': 947744, 'steps': 1851, 'loss/train': 2.672039031982422} -09/20/2021 20:54:09 - INFO - __main__ - Step 29618: {'lr': 0.00019975347929579004, 'samples': 947776, 'steps': 1851, 'loss/train': 2.778397560119629} -09/20/2021 20:54:09 - INFO - __main__ - Step 29619: {'lr': 0.00019975347929579004, 'samples': 947808, 'steps': 1851, 'loss/train': 2.653230905532837} -09/20/2021 20:54:10 - INFO - __main__ - Step 29620: {'lr': 0.00019975347929579004, 'samples': 947840, 'steps': 1851, 'loss/train': 2.6354916095733643} -09/20/2021 20:54:11 - INFO - __main__ - Step 29621: {'lr': 0.00019975347929579004, 'samples': 947872, 'steps': 1851, 'loss/train': 2.129215955734253} -09/20/2021 20:54:12 - INFO - __main__ - Step 29622: {'lr': 0.00019975347929579004, 'samples': 947904, 'steps': 1851, 'loss/train': 2.586819648742676} -09/20/2021 20:54:12 - INFO - __main__ - Step 29623: {'lr': 0.00019975347929579004, 'samples': 947936, 'steps': 1851, 'loss/train': 2.4591867923736572} -09/20/2021 20:54:13 - INFO - __main__ - Step 29624: {'lr': 0.00019975347929579004, 'samples': 947968, 'steps': 1851, 'loss/train': 2.057203531265259} -09/20/2021 20:54:14 - INFO - __main__ - Step 29625: {'lr': 0.00019975347929579004, 'samples': 948000, 'steps': 1851, 'loss/train': 2.5556325912475586} -09/20/2021 20:54:15 - INFO - __main__ - Step 29626: {'lr': 0.00019975347929579004, 'samples': 948032, 'steps': 1851, 'loss/train': 0.28058284521102905} -09/20/2021 20:54:15 - INFO - __main__ - Step 29627: {'lr': 0.00019975347929579004, 'samples': 948064, 'steps': 1851, 'loss/train': 0.41631969809532166} -09/20/2021 20:54:16 - INFO - __main__ - Step 29628: {'lr': 0.00019975347929579004, 'samples': 948096, 'steps': 1851, 'loss/train': 0.26457422971725464} -09/20/2021 20:54:18 - INFO - __main__ - Step 29629: {'lr': 0.00019975347929579004, 'samples': 948128, 'steps': 1851, 'loss/train': 3.7807841300964355} -09/20/2021 20:54:19 - INFO - __main__ - Step 29630: {'lr': 0.00019975347929579004, 'samples': 948160, 'steps': 1851, 'loss/train': 2.4655325412750244} -09/20/2021 20:54:20 - INFO - __main__ - Step 29631: {'lr': 0.00019975347929579004, 'samples': 948192, 'steps': 1851, 'loss/train': 2.511967182159424} -09/20/2021 20:54:21 - INFO - __main__ - Step 29632: {'lr': 0.00019975347929579004, 'samples': 948224, 'steps': 1851, 'loss/train': 2.8158998489379883} -09/20/2021 20:54:21 - INFO - __main__ - Step 29633: {'lr': 0.0001997530314645645, 'samples': 948256, 'steps': 1852, 'loss/train': 2.210160732269287} -09/20/2021 20:54:22 - INFO - __main__ - Step 29634: {'lr': 0.0001997530314645645, 'samples': 948288, 'steps': 1852, 'loss/train': 2.158677577972412} -09/20/2021 20:54:23 - INFO - __main__ - Step 29635: {'lr': 0.0001997530314645645, 'samples': 948320, 'steps': 1852, 'loss/train': 2.02638578414917} -09/20/2021 20:54:24 - INFO - __main__ - Step 29636: {'lr': 0.0001997530314645645, 'samples': 948352, 'steps': 1852, 'loss/train': 2.1835134029388428} -09/20/2021 20:54:24 - INFO - __main__ - Step 29637: {'lr': 0.0001997530314645645, 'samples': 948384, 'steps': 1852, 'loss/train': 2.155994415283203} -09/20/2021 20:54:25 - INFO - __main__ - Step 29638: {'lr': 0.0001997530314645645, 'samples': 948416, 'steps': 1852, 'loss/train': 2.1720356941223145} -09/20/2021 20:54:26 - INFO - __main__ - Step 29639: {'lr': 0.0001997530314645645, 'samples': 948448, 'steps': 1852, 'loss/train': 2.1817805767059326} -09/20/2021 20:54:27 - INFO - __main__ - Step 29640: {'lr': 0.0001997530314645645, 'samples': 948480, 'steps': 1852, 'loss/train': 2.4530222415924072} -09/20/2021 20:54:27 - INFO - __main__ - Step 29641: {'lr': 0.0001997530314645645, 'samples': 948512, 'steps': 1852, 'loss/train': 2.102269411087036} -09/20/2021 20:54:28 - INFO - __main__ - Step 29642: {'lr': 0.0001997530314645645, 'samples': 948544, 'steps': 1852, 'loss/train': 2.828125} -09/20/2021 20:54:29 - INFO - __main__ - Step 29643: {'lr': 0.0001997530314645645, 'samples': 948576, 'steps': 1852, 'loss/train': 2.3457369804382324} -09/20/2021 20:54:30 - INFO - __main__ - Step 29644: {'lr': 0.0001997530314645645, 'samples': 948608, 'steps': 1852, 'loss/train': 1.28397798538208} -09/20/2021 20:54:30 - INFO - __main__ - Step 29645: {'lr': 0.0001997530314645645, 'samples': 948640, 'steps': 1852, 'loss/train': 2.0751848220825195} -09/20/2021 20:54:31 - INFO - __main__ - Step 29646: {'lr': 0.0001997530314645645, 'samples': 948672, 'steps': 1852, 'loss/train': 2.7970988750457764} -09/20/2021 20:54:32 - INFO - __main__ - Step 29647: {'lr': 0.0001997530314645645, 'samples': 948704, 'steps': 1852, 'loss/train': 2.283003330230713} -09/20/2021 20:54:33 - INFO - __main__ - Step 29648: {'lr': 0.0001997530314645645, 'samples': 948736, 'steps': 1852, 'loss/train': 1.9559392929077148} -09/20/2021 20:54:34 - INFO - __main__ - Step 29649: {'lr': 0.00019975258322744427, 'samples': 948768, 'steps': 1853, 'loss/train': 2.5572030544281006} -09/20/2021 20:54:34 - INFO - __main__ - Step 29650: {'lr': 0.00019975258322744427, 'samples': 948800, 'steps': 1853, 'loss/train': 2.937225341796875} -09/20/2021 20:54:35 - INFO - __main__ - Step 29651: {'lr': 0.00019975258322744427, 'samples': 948832, 'steps': 1853, 'loss/train': 1.9483437538146973} -09/20/2021 20:54:36 - INFO - __main__ - Step 29652: {'lr': 0.00019975258322744427, 'samples': 948864, 'steps': 1853, 'loss/train': 1.372946858406067} -09/20/2021 20:54:37 - INFO - __main__ - Step 29653: {'lr': 0.00019975258322744427, 'samples': 948896, 'steps': 1853, 'loss/train': 1.2078319787979126} -09/20/2021 20:54:37 - INFO - __main__ - Step 29654: {'lr': 0.00019975258322744427, 'samples': 948928, 'steps': 1853, 'loss/train': 1.1401772499084473} -09/20/2021 20:54:38 - INFO - __main__ - Step 29655: {'lr': 0.00019975258322744427, 'samples': 948960, 'steps': 1853, 'loss/train': 1.3728466033935547} -09/20/2021 20:54:39 - INFO - __main__ - Step 29656: {'lr': 0.00019975258322744427, 'samples': 948992, 'steps': 1853, 'loss/train': 1.2535712718963623} -09/20/2021 20:54:40 - INFO - __main__ - Step 29657: {'lr': 0.00019975258322744427, 'samples': 949024, 'steps': 1853, 'loss/train': 1.1020773649215698} -09/20/2021 20:54:40 - INFO - __main__ - Step 29658: {'lr': 0.00019975258322744427, 'samples': 949056, 'steps': 1853, 'loss/train': 1.3839868307113647} -09/20/2021 20:54:41 - INFO - __main__ - Step 29659: {'lr': 0.00019975258322744427, 'samples': 949088, 'steps': 1853, 'loss/train': 1.2850496768951416} -09/20/2021 20:54:42 - INFO - __main__ - Step 29660: {'lr': 0.00019975258322744427, 'samples': 949120, 'steps': 1853, 'loss/train': 2.0544145107269287} -09/20/2021 20:54:43 - INFO - __main__ - Step 29661: {'lr': 0.00019975258322744427, 'samples': 949152, 'steps': 1853, 'loss/train': 2.0441486835479736} -09/20/2021 20:54:43 - INFO - __main__ - Step 29662: {'lr': 0.00019975258322744427, 'samples': 949184, 'steps': 1853, 'loss/train': 2.9913320541381836} -09/20/2021 20:54:44 - INFO - __main__ - Step 29663: {'lr': 0.00019975258322744427, 'samples': 949216, 'steps': 1853, 'loss/train': 1.9906644821166992} -09/20/2021 20:54:45 - INFO - __main__ - Step 29664: {'lr': 0.00019975258322744427, 'samples': 949248, 'steps': 1853, 'loss/train': 0.6006546020507812} -09/20/2021 20:54:46 - INFO - __main__ - Step 29665: {'lr': 0.00019975213458443117, 'samples': 949280, 'steps': 1854, 'loss/train': 3.1731274127960205} -09/20/2021 20:54:46 - INFO - __main__ - Step 29666: {'lr': 0.00019975213458443117, 'samples': 949312, 'steps': 1854, 'loss/train': 2.4348206520080566} -09/20/2021 20:54:47 - INFO - __main__ - Step 29667: {'lr': 0.00019975213458443117, 'samples': 949344, 'steps': 1854, 'loss/train': 1.8638564348220825} -09/20/2021 20:54:48 - INFO - __main__ - Step 29668: {'lr': 0.00019975213458443117, 'samples': 949376, 'steps': 1854, 'loss/train': 2.371157646179199} -09/20/2021 20:54:49 - INFO - __main__ - Step 29669: {'lr': 0.00019975213458443117, 'samples': 949408, 'steps': 1854, 'loss/train': 2.6143949031829834} -09/20/2021 20:54:50 - INFO - __main__ - Step 29670: {'lr': 0.00019975213458443117, 'samples': 949440, 'steps': 1854, 'loss/train': 3.593780040740967} -09/20/2021 20:54:51 - INFO - __main__ - Step 29671: {'lr': 0.00019975213458443117, 'samples': 949472, 'steps': 1854, 'loss/train': 2.283935785293579} -09/20/2021 20:54:52 - INFO - __main__ - Step 29672: {'lr': 0.00019975213458443117, 'samples': 949504, 'steps': 1854, 'loss/train': 2.693314552307129} -09/20/2021 20:54:52 - INFO - __main__ - Step 29673: {'lr': 0.00019975213458443117, 'samples': 949536, 'steps': 1854, 'loss/train': 3.755103826522827} -09/20/2021 20:54:53 - INFO - __main__ - Step 29674: {'lr': 0.00019975213458443117, 'samples': 949568, 'steps': 1854, 'loss/train': 2.69559645652771} -09/20/2021 20:54:54 - INFO - __main__ - Step 29675: {'lr': 0.00019975213458443117, 'samples': 949600, 'steps': 1854, 'loss/train': 0.7913817763328552} -09/20/2021 20:54:55 - INFO - __main__ - Step 29676: {'lr': 0.00019975213458443117, 'samples': 949632, 'steps': 1854, 'loss/train': 0.6949607133865356} -09/20/2021 20:54:55 - INFO - __main__ - Step 29677: {'lr': 0.00019975213458443117, 'samples': 949664, 'steps': 1854, 'loss/train': 0.4798556864261627} -09/20/2021 20:54:56 - INFO - __main__ - Step 29678: {'lr': 0.00019975213458443117, 'samples': 949696, 'steps': 1854, 'loss/train': 0.24113090336322784} -09/20/2021 20:54:57 - INFO - __main__ - Step 29679: {'lr': 0.00019975213458443117, 'samples': 949728, 'steps': 1854, 'loss/train': 0.2952672243118286} -09/20/2021 20:54:58 - INFO - __main__ - Step 29680: {'lr': 0.00019975213458443117, 'samples': 949760, 'steps': 1854, 'loss/train': 0.8994714617729187} -09/20/2021 20:54:59 - INFO - __main__ - Step 29681: {'lr': 0.00019975168553552705, 'samples': 949792, 'steps': 1855, 'loss/train': 3.2595431804656982} -09/20/2021 20:54:59 - INFO - __main__ - Step 29682: {'lr': 0.00019975168553552705, 'samples': 949824, 'steps': 1855, 'loss/train': 2.152759552001953} -09/20/2021 20:55:00 - INFO - __main__ - Step 29683: {'lr': 0.00019975168553552705, 'samples': 949856, 'steps': 1855, 'loss/train': 2.059945583343506} -09/20/2021 20:55:01 - INFO - __main__ - Step 29684: {'lr': 0.00019975168553552705, 'samples': 949888, 'steps': 1855, 'loss/train': 1.6867947578430176} -09/20/2021 20:55:02 - INFO - __main__ - Step 29685: {'lr': 0.00019975168553552705, 'samples': 949920, 'steps': 1855, 'loss/train': 1.8423149585723877} -09/20/2021 20:55:02 - INFO - __main__ - Step 29686: {'lr': 0.00019975168553552705, 'samples': 949952, 'steps': 1855, 'loss/train': 2.7189269065856934} -09/20/2021 20:55:03 - INFO - __main__ - Step 29687: {'lr': 0.00019975168553552705, 'samples': 949984, 'steps': 1855, 'loss/train': 2.437289237976074} -09/20/2021 20:55:04 - INFO - __main__ - Step 29688: {'lr': 0.00019975168553552705, 'samples': 950016, 'steps': 1855, 'loss/train': 1.6837892532348633} -09/20/2021 20:55:05 - INFO - __main__ - Step 29689: {'lr': 0.00019975168553552705, 'samples': 950048, 'steps': 1855, 'loss/train': 2.83357834815979} -09/20/2021 20:55:05 - INFO - __main__ - Step 29690: {'lr': 0.00019975168553552705, 'samples': 950080, 'steps': 1855, 'loss/train': 2.6536827087402344} -09/20/2021 20:55:06 - INFO - __main__ - Step 29691: {'lr': 0.00019975168553552705, 'samples': 950112, 'steps': 1855, 'loss/train': 3.074357032775879} -09/20/2021 20:55:07 - INFO - __main__ - Step 29692: {'lr': 0.00019975168553552705, 'samples': 950144, 'steps': 1855, 'loss/train': 2.4182493686676025} -09/20/2021 20:55:08 - INFO - __main__ - Step 29693: {'lr': 0.00019975168553552705, 'samples': 950176, 'steps': 1855, 'loss/train': 2.7162208557128906} -09/20/2021 20:55:08 - INFO - __main__ - Step 29694: {'lr': 0.00019975168553552705, 'samples': 950208, 'steps': 1855, 'loss/train': 2.0071280002593994} -09/20/2021 20:55:09 - INFO - __main__ - Step 29695: {'lr': 0.00019975168553552705, 'samples': 950240, 'steps': 1855, 'loss/train': 2.9562149047851562} -09/20/2021 20:55:10 - INFO - __main__ - Step 29696: {'lr': 0.00019975168553552705, 'samples': 950272, 'steps': 1855, 'loss/train': 1.6002694368362427} -09/20/2021 20:55:11 - INFO - __main__ - Step 29697: {'lr': 0.00019975123608073365, 'samples': 950304, 'steps': 1856, 'loss/train': 2.128892660140991} -09/20/2021 20:55:11 - INFO - __main__ - Step 29698: {'lr': 0.00019975123608073365, 'samples': 950336, 'steps': 1856, 'loss/train': 2.330470561981201} -09/20/2021 20:55:12 - INFO - __main__ - Step 29699: {'lr': 0.00019975123608073365, 'samples': 950368, 'steps': 1856, 'loss/train': 2.9112606048583984} -09/20/2021 20:55:14 - INFO - __main__ - Step 29700: {'lr': 0.00019975123608073365, 'samples': 950400, 'steps': 1856, 'loss/train': 3.2083747386932373} -09/20/2021 20:55:14 - INFO - __main__ - Step 29701: {'lr': 0.00019975123608073365, 'samples': 950432, 'steps': 1856, 'loss/train': 2.422501802444458} -09/20/2021 20:55:15 - INFO - __main__ - Step 29702: {'lr': 0.00019975123608073365, 'samples': 950464, 'steps': 1856, 'loss/train': 2.4477992057800293} -09/20/2021 20:55:16 - INFO - __main__ - Step 29703: {'lr': 0.00019975123608073365, 'samples': 950496, 'steps': 1856, 'loss/train': 1.4095693826675415} -09/20/2021 20:55:17 - INFO - __main__ - Step 29704: {'lr': 0.00019975123608073365, 'samples': 950528, 'steps': 1856, 'loss/train': 2.884089231491089} -09/20/2021 20:55:17 - INFO - __main__ - Step 29705: {'lr': 0.00019975123608073365, 'samples': 950560, 'steps': 1856, 'loss/train': 2.44635272026062} -09/20/2021 20:55:18 - INFO - __main__ - Step 29706: {'lr': 0.00019975123608073365, 'samples': 950592, 'steps': 1856, 'loss/train': 3.005815029144287} -09/20/2021 20:55:19 - INFO - __main__ - Step 29707: {'lr': 0.00019975123608073365, 'samples': 950624, 'steps': 1856, 'loss/train': 2.7773990631103516} -09/20/2021 20:55:20 - INFO - __main__ - Step 29708: {'lr': 0.00019975123608073365, 'samples': 950656, 'steps': 1856, 'loss/train': 3.289989948272705} -09/20/2021 20:55:20 - INFO - __main__ - Step 29709: {'lr': 0.00019975123608073365, 'samples': 950688, 'steps': 1856, 'loss/train': 2.6462881565093994} -09/20/2021 20:55:21 - INFO - __main__ - Step 29710: {'lr': 0.00019975123608073365, 'samples': 950720, 'steps': 1856, 'loss/train': 2.599038600921631} -09/20/2021 20:55:22 - INFO - __main__ - Step 29711: {'lr': 0.00019975123608073365, 'samples': 950752, 'steps': 1856, 'loss/train': 2.3038549423217773} -09/20/2021 20:55:23 - INFO - __main__ - Step 29712: {'lr': 0.00019975123608073365, 'samples': 950784, 'steps': 1856, 'loss/train': 2.4878859519958496} -09/20/2021 20:55:24 - INFO - __main__ - Step 29713: {'lr': 0.00019975078622005288, 'samples': 950816, 'steps': 1857, 'loss/train': 2.7038662433624268} -09/20/2021 20:55:24 - INFO - __main__ - Step 29714: {'lr': 0.00019975078622005288, 'samples': 950848, 'steps': 1857, 'loss/train': 2.7002482414245605} -09/20/2021 20:55:25 - INFO - __main__ - Step 29715: {'lr': 0.00019975078622005288, 'samples': 950880, 'steps': 1857, 'loss/train': 2.253180980682373} -09/20/2021 20:55:26 - INFO - __main__ - Step 29716: {'lr': 0.00019975078622005288, 'samples': 950912, 'steps': 1857, 'loss/train': 3.6786844730377197} -09/20/2021 20:55:27 - INFO - __main__ - Step 29717: {'lr': 0.00019975078622005288, 'samples': 950944, 'steps': 1857, 'loss/train': 2.53359055519104} -09/20/2021 20:55:27 - INFO - __main__ - Step 29718: {'lr': 0.00019975078622005288, 'samples': 950976, 'steps': 1857, 'loss/train': 1.9735997915267944} -09/20/2021 20:55:28 - INFO - __main__ - Step 29719: {'lr': 0.00019975078622005288, 'samples': 951008, 'steps': 1857, 'loss/train': 2.8152830600738525} -09/20/2021 20:55:29 - INFO - __main__ - Step 29720: {'lr': 0.00019975078622005288, 'samples': 951040, 'steps': 1857, 'loss/train': 2.5729236602783203} -09/20/2021 20:55:30 - INFO - __main__ - Step 29721: {'lr': 0.00019975078622005288, 'samples': 951072, 'steps': 1857, 'loss/train': 2.7983343601226807} -09/20/2021 20:55:30 - INFO - __main__ - Step 29722: {'lr': 0.00019975078622005288, 'samples': 951104, 'steps': 1857, 'loss/train': 2.3877413272857666} -09/20/2021 20:55:31 - INFO - __main__ - Step 29723: {'lr': 0.00019975078622005288, 'samples': 951136, 'steps': 1857, 'loss/train': 1.5156350135803223} -09/20/2021 20:55:32 - INFO - __main__ - Step 29724: {'lr': 0.00019975078622005288, 'samples': 951168, 'steps': 1857, 'loss/train': 2.331099510192871} -09/20/2021 20:55:33 - INFO - __main__ - Step 29725: {'lr': 0.00019975078622005288, 'samples': 951200, 'steps': 1857, 'loss/train': 3.148420572280884} -09/20/2021 20:55:33 - INFO - __main__ - Step 29726: {'lr': 0.00019975078622005288, 'samples': 951232, 'steps': 1857, 'loss/train': 2.3895726203918457} -09/20/2021 20:55:34 - INFO - __main__ - Step 29727: {'lr': 0.00019975078622005288, 'samples': 951264, 'steps': 1857, 'loss/train': 2.032020092010498} -09/20/2021 20:55:35 - INFO - __main__ - Step 29728: {'lr': 0.00019975078622005288, 'samples': 951296, 'steps': 1857, 'loss/train': 2.3000566959381104} -09/20/2021 20:55:36 - INFO - __main__ - Step 29729: {'lr': 0.00019975033595348655, 'samples': 951328, 'steps': 1858, 'loss/train': 2.6322953701019287} -09/20/2021 20:55:37 - INFO - __main__ - Step 29730: {'lr': 0.00019975033595348655, 'samples': 951360, 'steps': 1858, 'loss/train': 2.2132716178894043} -09/20/2021 20:55:38 - INFO - __main__ - Step 29731: {'lr': 0.00019975033595348655, 'samples': 951392, 'steps': 1858, 'loss/train': 2.788104772567749} -09/20/2021 20:55:39 - INFO - __main__ - Step 29732: {'lr': 0.00019975033595348655, 'samples': 951424, 'steps': 1858, 'loss/train': 3.088118314743042} -09/20/2021 20:55:39 - INFO - __main__ - Step 29733: {'lr': 0.00019975033595348655, 'samples': 951456, 'steps': 1858, 'loss/train': 2.0392308235168457} -09/20/2021 20:55:40 - INFO - __main__ - Step 29734: {'lr': 0.00019975033595348655, 'samples': 951488, 'steps': 1858, 'loss/train': 1.9347054958343506} -09/20/2021 20:55:41 - INFO - __main__ - Step 29735: {'lr': 0.00019975033595348655, 'samples': 951520, 'steps': 1858, 'loss/train': 2.6800148487091064} -09/20/2021 20:55:42 - INFO - __main__ - Step 29736: {'lr': 0.00019975033595348655, 'samples': 951552, 'steps': 1858, 'loss/train': 2.32660174369812} -09/20/2021 20:55:42 - INFO - __main__ - Step 29737: {'lr': 0.00019975033595348655, 'samples': 951584, 'steps': 1858, 'loss/train': 1.9316779375076294} -09/20/2021 20:55:43 - INFO - __main__ - Step 29738: {'lr': 0.00019975033595348655, 'samples': 951616, 'steps': 1858, 'loss/train': 3.3049581050872803} -09/20/2021 20:55:44 - INFO - __main__ - Step 29739: {'lr': 0.00019975033595348655, 'samples': 951648, 'steps': 1858, 'loss/train': 2.397068500518799} -09/20/2021 20:55:45 - INFO - __main__ - Step 29740: {'lr': 0.00019975033595348655, 'samples': 951680, 'steps': 1858, 'loss/train': 3.103341817855835} -09/20/2021 20:55:45 - INFO - __main__ - Step 29741: {'lr': 0.00019975033595348655, 'samples': 951712, 'steps': 1858, 'loss/train': 2.131556272506714} -09/20/2021 20:55:46 - INFO - __main__ - Step 29742: {'lr': 0.00019975033595348655, 'samples': 951744, 'steps': 1858, 'loss/train': 3.836137533187866} -09/20/2021 20:55:47 - INFO - __main__ - Step 29743: {'lr': 0.00019975033595348655, 'samples': 951776, 'steps': 1858, 'loss/train': 2.5153017044067383} -09/20/2021 20:55:48 - INFO - __main__ - Step 29744: {'lr': 0.00019975033595348655, 'samples': 951808, 'steps': 1858, 'loss/train': 2.1204605102539062} -09/20/2021 20:55:49 - INFO - __main__ - Step 29745: {'lr': 0.00019974988528103648, 'samples': 951840, 'steps': 1859, 'loss/train': 2.4206995964050293} -09/20/2021 20:55:49 - INFO - __main__ - Step 29746: {'lr': 0.00019974988528103648, 'samples': 951872, 'steps': 1859, 'loss/train': 2.209775924682617} -09/20/2021 20:55:50 - INFO - __main__ - Step 29747: {'lr': 0.00019974988528103648, 'samples': 951904, 'steps': 1859, 'loss/train': 3.44096302986145} -09/20/2021 20:55:51 - INFO - __main__ - Step 29748: {'lr': 0.00019974988528103648, 'samples': 951936, 'steps': 1859, 'loss/train': 2.960059404373169} -09/20/2021 20:55:52 - INFO - __main__ - Step 29749: {'lr': 0.00019974988528103648, 'samples': 951968, 'steps': 1859, 'loss/train': 2.8590686321258545} -09/20/2021 20:55:52 - INFO - __main__ - Step 29750: {'lr': 0.00019974988528103648, 'samples': 952000, 'steps': 1859, 'loss/train': 2.292233467102051} -09/20/2021 20:55:53 - INFO - __main__ - Step 29751: {'lr': 0.00019974988528103648, 'samples': 952032, 'steps': 1859, 'loss/train': 3.4509024620056152} -09/20/2021 20:55:54 - INFO - __main__ - Step 29752: {'lr': 0.00019974988528103648, 'samples': 952064, 'steps': 1859, 'loss/train': 2.6453166007995605} -09/20/2021 20:55:55 - INFO - __main__ - Step 29753: {'lr': 0.00019974988528103648, 'samples': 952096, 'steps': 1859, 'loss/train': 1.5145357847213745} -09/20/2021 20:55:55 - INFO - __main__ - Step 29754: {'lr': 0.00019974988528103648, 'samples': 952128, 'steps': 1859, 'loss/train': 2.285238027572632} -09/20/2021 20:55:56 - INFO - __main__ - Step 29755: {'lr': 0.00019974988528103648, 'samples': 952160, 'steps': 1859, 'loss/train': 1.5022705793380737} -09/20/2021 20:55:57 - INFO - __main__ - Step 29756: {'lr': 0.00019974988528103648, 'samples': 952192, 'steps': 1859, 'loss/train': 1.8612464666366577} -09/20/2021 20:55:58 - INFO - __main__ - Step 29757: {'lr': 0.00019974988528103648, 'samples': 952224, 'steps': 1859, 'loss/train': 1.6936906576156616} -09/20/2021 20:55:58 - INFO - __main__ - Step 29758: {'lr': 0.00019974988528103648, 'samples': 952256, 'steps': 1859, 'loss/train': 1.6203802824020386} -09/20/2021 20:55:59 - INFO - __main__ - Step 29759: {'lr': 0.00019974988528103648, 'samples': 952288, 'steps': 1859, 'loss/train': 2.8835883140563965} -09/20/2021 20:56:00 - INFO - __main__ - Step 29760: {'lr': 0.00019974988528103648, 'samples': 952320, 'steps': 1859, 'loss/train': 1.8889507055282593} -09/20/2021 20:56:01 - INFO - __main__ - Step 29761: {'lr': 0.00019974943420270454, 'samples': 952352, 'steps': 1860, 'loss/train': 0.9732983112335205} -09/20/2021 20:56:02 - INFO - __main__ - Step 29762: {'lr': 0.00019974943420270454, 'samples': 952384, 'steps': 1860, 'loss/train': 2.648071765899658} -09/20/2021 20:56:03 - INFO - __main__ - Step 29763: {'lr': 0.00019974943420270454, 'samples': 952416, 'steps': 1860, 'loss/train': 3.0632100105285645} -09/20/2021 20:56:04 - INFO - __main__ - Step 29764: {'lr': 0.00019974943420270454, 'samples': 952448, 'steps': 1860, 'loss/train': 2.6095073223114014} -09/20/2021 20:56:04 - INFO - __main__ - Step 29765: {'lr': 0.00019974943420270454, 'samples': 952480, 'steps': 1860, 'loss/train': 2.6430957317352295} -09/20/2021 20:56:05 - INFO - __main__ - Step 29766: {'lr': 0.00019974943420270454, 'samples': 952512, 'steps': 1860, 'loss/train': 2.8498172760009766} -09/20/2021 20:56:06 - INFO - __main__ - Step 29767: {'lr': 0.00019974943420270454, 'samples': 952544, 'steps': 1860, 'loss/train': 2.6355655193328857} -09/20/2021 20:56:07 - INFO - __main__ - Step 29768: {'lr': 0.00019974943420270454, 'samples': 952576, 'steps': 1860, 'loss/train': 2.6237008571624756} -09/20/2021 20:56:07 - INFO - __main__ - Step 29769: {'lr': 0.00019974943420270454, 'samples': 952608, 'steps': 1860, 'loss/train': 1.948380708694458} -09/20/2021 20:56:08 - INFO - __main__ - Step 29770: {'lr': 0.00019974943420270454, 'samples': 952640, 'steps': 1860, 'loss/train': 3.089017868041992} -09/20/2021 20:56:09 - INFO - __main__ - Step 29771: {'lr': 0.00019974943420270454, 'samples': 952672, 'steps': 1860, 'loss/train': 2.6074635982513428} -09/20/2021 20:56:10 - INFO - __main__ - Step 29772: {'lr': 0.00019974943420270454, 'samples': 952704, 'steps': 1860, 'loss/train': 2.1033313274383545} -09/20/2021 20:56:10 - INFO - __main__ - Step 29773: {'lr': 0.00019974943420270454, 'samples': 952736, 'steps': 1860, 'loss/train': 1.0736507177352905} -09/20/2021 20:56:11 - INFO - __main__ - Step 29774: {'lr': 0.00019974943420270454, 'samples': 952768, 'steps': 1860, 'loss/train': 2.711193561553955} -09/20/2021 20:56:12 - INFO - __main__ - Step 29775: {'lr': 0.00019974943420270454, 'samples': 952800, 'steps': 1860, 'loss/train': 3.6094367504119873} -09/20/2021 20:56:13 - INFO - __main__ - Step 29776: {'lr': 0.00019974943420270454, 'samples': 952832, 'steps': 1860, 'loss/train': 2.201411724090576} -09/20/2021 20:56:13 - INFO - __main__ - Step 29777: {'lr': 0.00019974898271849252, 'samples': 952864, 'steps': 1861, 'loss/train': 2.804443836212158} -09/20/2021 20:56:14 - INFO - __main__ - Step 29778: {'lr': 0.00019974898271849252, 'samples': 952896, 'steps': 1861, 'loss/train': 2.1003332138061523} -09/20/2021 20:56:15 - INFO - __main__ - Step 29779: {'lr': 0.00019974898271849252, 'samples': 952928, 'steps': 1861, 'loss/train': 2.9363954067230225} -09/20/2021 20:56:16 - INFO - __main__ - Step 29780: {'lr': 0.00019974898271849252, 'samples': 952960, 'steps': 1861, 'loss/train': 3.89601993560791} -09/20/2021 20:56:16 - INFO - __main__ - Step 29781: {'lr': 0.00019974898271849252, 'samples': 952992, 'steps': 1861, 'loss/train': 1.8459668159484863} -09/20/2021 20:56:17 - INFO - __main__ - Step 29782: {'lr': 0.00019974898271849252, 'samples': 953024, 'steps': 1861, 'loss/train': 1.9597668647766113} -09/20/2021 20:56:18 - INFO - __main__ - Step 29783: {'lr': 0.00019974898271849252, 'samples': 953056, 'steps': 1861, 'loss/train': 2.994615077972412} -09/20/2021 20:56:19 - INFO - __main__ - Step 29784: {'lr': 0.00019974898271849252, 'samples': 953088, 'steps': 1861, 'loss/train': 3.12430477142334} -09/20/2021 20:56:19 - INFO - __main__ - Step 29785: {'lr': 0.00019974898271849252, 'samples': 953120, 'steps': 1861, 'loss/train': 2.064742088317871} -09/20/2021 20:56:20 - INFO - __main__ - Step 29786: {'lr': 0.00019974898271849252, 'samples': 953152, 'steps': 1861, 'loss/train': 2.391160011291504} -09/20/2021 20:56:21 - INFO - __main__ - Step 29787: {'lr': 0.00019974898271849252, 'samples': 953184, 'steps': 1861, 'loss/train': 2.744534969329834} -09/20/2021 20:56:22 - INFO - __main__ - Step 29788: {'lr': 0.00019974898271849252, 'samples': 953216, 'steps': 1861, 'loss/train': 2.9080026149749756} -09/20/2021 20:56:22 - INFO - __main__ - Step 29789: {'lr': 0.00019974898271849252, 'samples': 953248, 'steps': 1861, 'loss/train': 3.1208159923553467} -09/20/2021 20:56:23 - INFO - __main__ - Step 29790: {'lr': 0.00019974898271849252, 'samples': 953280, 'steps': 1861, 'loss/train': 0.9087362885475159} -09/20/2021 20:56:25 - INFO - __main__ - Step 29791: {'lr': 0.00019974898271849252, 'samples': 953312, 'steps': 1861, 'loss/train': 2.2683730125427246} -09/20/2021 20:56:26 - INFO - __main__ - Step 29792: {'lr': 0.00019974898271849252, 'samples': 953344, 'steps': 1861, 'loss/train': 2.2625064849853516} -09/20/2021 20:56:26 - INFO - __main__ - Step 29793: {'lr': 0.00019974853082840228, 'samples': 953376, 'steps': 1862, 'loss/train': 0.7284266948699951} -09/20/2021 20:56:27 - INFO - __main__ - Step 29794: {'lr': 0.00019974853082840228, 'samples': 953408, 'steps': 1862, 'loss/train': 0.5722255706787109} -09/20/2021 20:56:28 - INFO - __main__ - Step 29795: {'lr': 0.00019974853082840228, 'samples': 953440, 'steps': 1862, 'loss/train': 0.3361038565635681} -09/20/2021 20:56:29 - INFO - __main__ - Step 29796: {'lr': 0.00019974853082840228, 'samples': 953472, 'steps': 1862, 'loss/train': 0.4728751480579376} -09/20/2021 20:56:29 - INFO - __main__ - Step 29797: {'lr': 0.00019974853082840228, 'samples': 953504, 'steps': 1862, 'loss/train': 0.24958489835262299} -09/20/2021 20:56:30 - INFO - __main__ - Step 29798: {'lr': 0.00019974853082840228, 'samples': 953536, 'steps': 1862, 'loss/train': 0.5345953106880188} -09/20/2021 20:56:31 - INFO - __main__ - Step 29799: {'lr': 0.00019974853082840228, 'samples': 953568, 'steps': 1862, 'loss/train': 0.7211074233055115} -09/20/2021 20:56:32 - INFO - __main__ - Step 29800: {'lr': 0.00019974853082840228, 'samples': 953600, 'steps': 1862, 'loss/train': 1.6625659465789795} -09/20/2021 20:56:32 - INFO - __main__ - Step 29801: {'lr': 0.00019974853082840228, 'samples': 953632, 'steps': 1862, 'loss/train': 2.6794073581695557} -09/20/2021 20:56:33 - INFO - __main__ - Step 29802: {'lr': 0.00019974853082840228, 'samples': 953664, 'steps': 1862, 'loss/train': 1.7001845836639404} -09/20/2021 20:56:34 - INFO - __main__ - Step 29803: {'lr': 0.00019974853082840228, 'samples': 953696, 'steps': 1862, 'loss/train': 2.2194178104400635} -09/20/2021 20:56:35 - INFO - __main__ - Step 29804: {'lr': 0.00019974853082840228, 'samples': 953728, 'steps': 1862, 'loss/train': 2.133227825164795} -09/20/2021 20:56:35 - INFO - __main__ - Step 29805: {'lr': 0.00019974853082840228, 'samples': 953760, 'steps': 1862, 'loss/train': 2.152421712875366} -09/20/2021 20:56:36 - INFO - __main__ - Step 29806: {'lr': 0.00019974853082840228, 'samples': 953792, 'steps': 1862, 'loss/train': 2.691575050354004} -09/20/2021 20:56:37 - INFO - __main__ - Step 29807: {'lr': 0.00019974853082840228, 'samples': 953824, 'steps': 1862, 'loss/train': 2.846571683883667} -09/20/2021 20:56:38 - INFO - __main__ - Step 29808: {'lr': 0.00019974853082840228, 'samples': 953856, 'steps': 1862, 'loss/train': 2.8155007362365723} -09/20/2021 20:56:39 - INFO - __main__ - Step 29809: {'lr': 0.00019974807853243568, 'samples': 953888, 'steps': 1863, 'loss/train': 2.735652446746826} -09/20/2021 20:56:39 - INFO - __main__ - Step 29810: {'lr': 0.00019974807853243568, 'samples': 953920, 'steps': 1863, 'loss/train': 3.0105152130126953} -09/20/2021 20:56:40 - INFO - __main__ - Step 29811: {'lr': 0.00019974807853243568, 'samples': 953952, 'steps': 1863, 'loss/train': 1.9362705945968628} -09/20/2021 20:56:41 - INFO - __main__ - Step 29812: {'lr': 0.00019974807853243568, 'samples': 953984, 'steps': 1863, 'loss/train': 2.6386523246765137} -09/20/2021 20:56:42 - INFO - __main__ - Step 29813: {'lr': 0.00019974807853243568, 'samples': 954016, 'steps': 1863, 'loss/train': 1.843202829360962} -09/20/2021 20:56:42 - INFO - __main__ - Step 29814: {'lr': 0.00019974807853243568, 'samples': 954048, 'steps': 1863, 'loss/train': 2.7556111812591553} -09/20/2021 20:56:43 - INFO - __main__ - Step 29815: {'lr': 0.00019974807853243568, 'samples': 954080, 'steps': 1863, 'loss/train': 3.2125754356384277} -09/20/2021 20:56:44 - INFO - __main__ - Step 29816: {'lr': 0.00019974807853243568, 'samples': 954112, 'steps': 1863, 'loss/train': 2.506692886352539} -09/20/2021 20:56:45 - INFO - __main__ - Step 29817: {'lr': 0.00019974807853243568, 'samples': 954144, 'steps': 1863, 'loss/train': 2.9888174533843994} -09/20/2021 20:56:45 - INFO - __main__ - Step 29818: {'lr': 0.00019974807853243568, 'samples': 954176, 'steps': 1863, 'loss/train': 1.727858066558838} -09/20/2021 20:56:46 - INFO - __main__ - Step 29819: {'lr': 0.00019974807853243568, 'samples': 954208, 'steps': 1863, 'loss/train': 2.2848825454711914} -09/20/2021 20:56:47 - INFO - __main__ - Step 29820: {'lr': 0.00019974807853243568, 'samples': 954240, 'steps': 1863, 'loss/train': 2.382678985595703} -09/20/2021 20:56:48 - INFO - __main__ - Step 29821: {'lr': 0.00019974807853243568, 'samples': 954272, 'steps': 1863, 'loss/train': 2.389853000640869} -09/20/2021 20:56:49 - INFO - __main__ - Step 29822: {'lr': 0.00019974807853243568, 'samples': 954304, 'steps': 1863, 'loss/train': 2.1580724716186523} -09/20/2021 20:56:50 - INFO - __main__ - Step 29823: {'lr': 0.00019974807853243568, 'samples': 954336, 'steps': 1863, 'loss/train': 2.090066432952881} -09/20/2021 20:56:50 - INFO - __main__ - Step 29824: {'lr': 0.00019974807853243568, 'samples': 954368, 'steps': 1863, 'loss/train': 2.0888049602508545} -09/20/2021 20:56:51 - INFO - __main__ - Step 29825: {'lr': 0.0001997476258305945, 'samples': 954400, 'steps': 1864, 'loss/train': 0.22981767356395721} -09/20/2021 20:56:52 - INFO - __main__ - Step 29826: {'lr': 0.0001997476258305945, 'samples': 954432, 'steps': 1864, 'loss/train': 0.26596537232398987} -09/20/2021 20:56:53 - INFO - __main__ - Step 29827: {'lr': 0.0001997476258305945, 'samples': 954464, 'steps': 1864, 'loss/train': 2.675046920776367} -09/20/2021 20:56:54 - INFO - __main__ - Step 29828: {'lr': 0.0001997476258305945, 'samples': 954496, 'steps': 1864, 'loss/train': 1.8525404930114746} -09/20/2021 20:56:54 - INFO - __main__ - Step 29829: {'lr': 0.0001997476258305945, 'samples': 954528, 'steps': 1864, 'loss/train': 3.0110321044921875} -09/20/2021 20:56:55 - INFO - __main__ - Step 29830: {'lr': 0.0001997476258305945, 'samples': 954560, 'steps': 1864, 'loss/train': 1.9582189321517944} -09/20/2021 20:56:56 - INFO - __main__ - Step 29831: {'lr': 0.0001997476258305945, 'samples': 954592, 'steps': 1864, 'loss/train': 2.439453125} -09/20/2021 20:56:57 - INFO - __main__ - Step 29832: {'lr': 0.0001997476258305945, 'samples': 954624, 'steps': 1864, 'loss/train': 3.3459625244140625} -09/20/2021 20:56:57 - INFO - __main__ - Step 29833: {'lr': 0.0001997476258305945, 'samples': 954656, 'steps': 1864, 'loss/train': 3.2606844902038574} -09/20/2021 20:56:58 - INFO - __main__ - Step 29834: {'lr': 0.0001997476258305945, 'samples': 954688, 'steps': 1864, 'loss/train': 2.48101806640625} -09/20/2021 20:56:59 - INFO - __main__ - Step 29835: {'lr': 0.0001997476258305945, 'samples': 954720, 'steps': 1864, 'loss/train': 3.089425563812256} -09/20/2021 20:57:00 - INFO - __main__ - Step 29836: {'lr': 0.0001997476258305945, 'samples': 954752, 'steps': 1864, 'loss/train': 2.319553852081299} -09/20/2021 20:57:00 - INFO - __main__ - Step 29837: {'lr': 0.0001997476258305945, 'samples': 954784, 'steps': 1864, 'loss/train': 3.1427059173583984} -09/20/2021 20:57:01 - INFO - __main__ - Step 29838: {'lr': 0.0001997476258305945, 'samples': 954816, 'steps': 1864, 'loss/train': 2.991724729537964} -09/20/2021 20:57:02 - INFO - __main__ - Step 29839: {'lr': 0.0001997476258305945, 'samples': 954848, 'steps': 1864, 'loss/train': 2.389831304550171} -09/20/2021 20:57:03 - INFO - __main__ - Step 29840: {'lr': 0.0001997476258305945, 'samples': 954880, 'steps': 1864, 'loss/train': 2.276137351989746} -09/20/2021 20:57:03 - INFO - __main__ - Step 29841: {'lr': 0.0001997471727228806, 'samples': 954912, 'steps': 1865, 'loss/train': 2.793782949447632} -09/20/2021 20:57:04 - INFO - __main__ - Step 29842: {'lr': 0.0001997471727228806, 'samples': 954944, 'steps': 1865, 'loss/train': 2.9569451808929443} -09/20/2021 20:57:05 - INFO - __main__ - Step 29843: {'lr': 0.0001997471727228806, 'samples': 954976, 'steps': 1865, 'loss/train': 1.9546722173690796} -09/20/2021 20:57:06 - INFO - __main__ - Step 29844: {'lr': 0.0001997471727228806, 'samples': 955008, 'steps': 1865, 'loss/train': 2.2963144779205322} -09/20/2021 20:57:06 - INFO - __main__ - Step 29845: {'lr': 0.0001997471727228806, 'samples': 955040, 'steps': 1865, 'loss/train': 2.6911330223083496} -09/20/2021 20:57:07 - INFO - __main__ - Step 29846: {'lr': 0.0001997471727228806, 'samples': 955072, 'steps': 1865, 'loss/train': 2.196465492248535} -09/20/2021 20:57:08 - INFO - __main__ - Step 29847: {'lr': 0.0001997471727228806, 'samples': 955104, 'steps': 1865, 'loss/train': 2.6793360710144043} -09/20/2021 20:57:09 - INFO - __main__ - Step 29848: {'lr': 0.0001997471727228806, 'samples': 955136, 'steps': 1865, 'loss/train': 3.2424325942993164} -09/20/2021 20:57:09 - INFO - __main__ - Step 29849: {'lr': 0.0001997471727228806, 'samples': 955168, 'steps': 1865, 'loss/train': 1.05758535861969} -09/20/2021 20:57:10 - INFO - __main__ - Step 29850: {'lr': 0.0001997471727228806, 'samples': 955200, 'steps': 1865, 'loss/train': 1.7880220413208008} -09/20/2021 20:57:11 - INFO - __main__ - Step 29851: {'lr': 0.0001997471727228806, 'samples': 955232, 'steps': 1865, 'loss/train': 2.4138755798339844} -09/20/2021 20:57:12 - INFO - __main__ - Step 29852: {'lr': 0.0001997471727228806, 'samples': 955264, 'steps': 1865, 'loss/train': 2.0316128730773926} -09/20/2021 20:57:13 - INFO - __main__ - Step 29853: {'lr': 0.0001997471727228806, 'samples': 955296, 'steps': 1865, 'loss/train': 2.2115321159362793} -09/20/2021 20:57:14 - INFO - __main__ - Step 29854: {'lr': 0.0001997471727228806, 'samples': 955328, 'steps': 1865, 'loss/train': 2.5510473251342773} -09/20/2021 20:57:15 - INFO - __main__ - Step 29855: {'lr': 0.0001997471727228806, 'samples': 955360, 'steps': 1865, 'loss/train': 2.250619411468506} -09/20/2021 20:57:15 - INFO - __main__ - Step 29856: {'lr': 0.0001997471727228806, 'samples': 955392, 'steps': 1865, 'loss/train': 2.5978903770446777} -09/20/2021 20:57:16 - INFO - __main__ - Step 29857: {'lr': 0.00019974671920929587, 'samples': 955424, 'steps': 1866, 'loss/train': 2.037278652191162} -09/20/2021 20:57:17 - INFO - __main__ - Step 29858: {'lr': 0.00019974671920929587, 'samples': 955456, 'steps': 1866, 'loss/train': 2.7666845321655273} -09/20/2021 20:57:18 - INFO - __main__ - Step 29859: {'lr': 0.00019974671920929587, 'samples': 955488, 'steps': 1866, 'loss/train': 2.7238385677337646} -09/20/2021 20:57:18 - INFO - __main__ - Step 29860: {'lr': 0.00019974671920929587, 'samples': 955520, 'steps': 1866, 'loss/train': 2.1073215007781982} -09/20/2021 20:57:19 - INFO - __main__ - Step 29861: {'lr': 0.00019974671920929587, 'samples': 955552, 'steps': 1866, 'loss/train': 2.81734037399292} -09/20/2021 20:57:20 - INFO - __main__ - Step 29862: {'lr': 0.00019974671920929587, 'samples': 955584, 'steps': 1866, 'loss/train': 2.732330560684204} -09/20/2021 20:57:21 - INFO - __main__ - Step 29863: {'lr': 0.00019974671920929587, 'samples': 955616, 'steps': 1866, 'loss/train': 2.21462345123291} -09/20/2021 20:57:21 - INFO - __main__ - Step 29864: {'lr': 0.00019974671920929587, 'samples': 955648, 'steps': 1866, 'loss/train': 2.246041774749756} -09/20/2021 20:57:22 - INFO - __main__ - Step 29865: {'lr': 0.00019974671920929587, 'samples': 955680, 'steps': 1866, 'loss/train': 2.454345226287842} -09/20/2021 20:57:23 - INFO - __main__ - Step 29866: {'lr': 0.00019974671920929587, 'samples': 955712, 'steps': 1866, 'loss/train': 2.6633737087249756} -09/20/2021 20:57:24 - INFO - __main__ - Step 29867: {'lr': 0.00019974671920929587, 'samples': 955744, 'steps': 1866, 'loss/train': 3.2518179416656494} -09/20/2021 20:57:24 - INFO - __main__ - Step 29868: {'lr': 0.00019974671920929587, 'samples': 955776, 'steps': 1866, 'loss/train': 2.688228130340576} -09/20/2021 20:57:25 - INFO - __main__ - Step 29869: {'lr': 0.00019974671920929587, 'samples': 955808, 'steps': 1866, 'loss/train': 4.617205619812012} -09/20/2021 20:57:26 - INFO - __main__ - Step 29870: {'lr': 0.00019974671920929587, 'samples': 955840, 'steps': 1866, 'loss/train': 2.242912769317627} -09/20/2021 20:57:27 - INFO - __main__ - Step 29871: {'lr': 0.00019974671920929587, 'samples': 955872, 'steps': 1866, 'loss/train': 2.296149730682373} -09/20/2021 20:57:27 - INFO - __main__ - Step 29872: {'lr': 0.00019974671920929587, 'samples': 955904, 'steps': 1866, 'loss/train': 2.4322166442871094} -09/20/2021 20:57:28 - INFO - __main__ - Step 29873: {'lr': 0.00019974626528984212, 'samples': 955936, 'steps': 1867, 'loss/train': 2.065643072128296} -09/20/2021 20:57:29 - INFO - __main__ - Step 29874: {'lr': 0.00019974626528984212, 'samples': 955968, 'steps': 1867, 'loss/train': 2.7847723960876465} -09/20/2021 20:57:30 - INFO - __main__ - Step 29875: {'lr': 0.00019974626528984212, 'samples': 956000, 'steps': 1867, 'loss/train': 2.5296266078948975} -09/20/2021 20:57:31 - INFO - __main__ - Step 29876: {'lr': 0.00019974626528984212, 'samples': 956032, 'steps': 1867, 'loss/train': 1.8060911893844604} -09/20/2021 20:57:31 - INFO - __main__ - Step 29877: {'lr': 0.00019974626528984212, 'samples': 956064, 'steps': 1867, 'loss/train': 3.472208023071289} -09/20/2021 20:57:32 - INFO - __main__ - Step 29878: {'lr': 0.00019974626528984212, 'samples': 956096, 'steps': 1867, 'loss/train': 2.124056816101074} -09/20/2021 20:57:33 - INFO - __main__ - Step 29879: {'lr': 0.00019974626528984212, 'samples': 956128, 'steps': 1867, 'loss/train': 1.7691186666488647} -09/20/2021 20:57:34 - INFO - __main__ - Step 29880: {'lr': 0.00019974626528984212, 'samples': 956160, 'steps': 1867, 'loss/train': 1.9926267862319946} -09/20/2021 20:57:34 - INFO - __main__ - Step 29881: {'lr': 0.00019974626528984212, 'samples': 956192, 'steps': 1867, 'loss/train': 2.8331704139709473} -09/20/2021 20:57:35 - INFO - __main__ - Step 29882: {'lr': 0.00019974626528984212, 'samples': 956224, 'steps': 1867, 'loss/train': 3.2329959869384766} -09/20/2021 20:57:36 - INFO - __main__ - Step 29883: {'lr': 0.00019974626528984212, 'samples': 956256, 'steps': 1867, 'loss/train': 2.324129819869995} -09/20/2021 20:57:37 - INFO - __main__ - Step 29884: {'lr': 0.00019974626528984212, 'samples': 956288, 'steps': 1867, 'loss/train': 2.062694787979126} -09/20/2021 20:57:38 - INFO - __main__ - Step 29885: {'lr': 0.00019974626528984212, 'samples': 956320, 'steps': 1867, 'loss/train': 1.9917110204696655} -09/20/2021 20:57:39 - INFO - __main__ - Step 29886: {'lr': 0.00019974626528984212, 'samples': 956352, 'steps': 1867, 'loss/train': 2.8601505756378174} -09/20/2021 20:57:39 - INFO - __main__ - Step 29887: {'lr': 0.00019974626528984212, 'samples': 956384, 'steps': 1867, 'loss/train': 3.5281271934509277} -09/20/2021 20:57:40 - INFO - __main__ - Step 29888: {'lr': 0.00019974626528984212, 'samples': 956416, 'steps': 1867, 'loss/train': 2.599452257156372} -09/20/2021 20:57:41 - INFO - __main__ - Step 29889: {'lr': 0.00019974581096452124, 'samples': 956448, 'steps': 1868, 'loss/train': 4.468581199645996} -09/20/2021 20:57:42 - INFO - __main__ - Step 29890: {'lr': 0.00019974581096452124, 'samples': 956480, 'steps': 1868, 'loss/train': 2.389920949935913} -09/20/2021 20:57:42 - INFO - __main__ - Step 29891: {'lr': 0.00019974581096452124, 'samples': 956512, 'steps': 1868, 'loss/train': 2.396174192428589} -09/20/2021 20:57:43 - INFO - __main__ - Step 29892: {'lr': 0.00019974581096452124, 'samples': 956544, 'steps': 1868, 'loss/train': 2.9075591564178467} -09/20/2021 20:57:44 - INFO - __main__ - Step 29893: {'lr': 0.00019974581096452124, 'samples': 956576, 'steps': 1868, 'loss/train': 2.3270654678344727} -09/20/2021 20:57:45 - INFO - __main__ - Step 29894: {'lr': 0.00019974581096452124, 'samples': 956608, 'steps': 1868, 'loss/train': 2.490441083908081} -09/20/2021 20:57:45 - INFO - __main__ - Step 29895: {'lr': 0.00019974581096452124, 'samples': 956640, 'steps': 1868, 'loss/train': 2.5927844047546387} -09/20/2021 20:57:46 - INFO - __main__ - Step 29896: {'lr': 0.00019974581096452124, 'samples': 956672, 'steps': 1868, 'loss/train': 2.10015869140625} -09/20/2021 20:57:47 - INFO - __main__ - Step 29897: {'lr': 0.00019974581096452124, 'samples': 956704, 'steps': 1868, 'loss/train': 2.533686637878418} -09/20/2021 20:57:48 - INFO - __main__ - Step 29898: {'lr': 0.00019974581096452124, 'samples': 956736, 'steps': 1868, 'loss/train': 2.4243369102478027} -09/20/2021 20:57:48 - INFO - __main__ - Step 29899: {'lr': 0.00019974581096452124, 'samples': 956768, 'steps': 1868, 'loss/train': 1.8996126651763916} -09/20/2021 20:57:49 - INFO - __main__ - Step 29900: {'lr': 0.00019974581096452124, 'samples': 956800, 'steps': 1868, 'loss/train': 3.11442494392395} -09/20/2021 20:57:50 - INFO - __main__ - Step 29901: {'lr': 0.00019974581096452124, 'samples': 956832, 'steps': 1868, 'loss/train': 3.182028293609619} -09/20/2021 20:57:51 - INFO - __main__ - Step 29902: {'lr': 0.00019974581096452124, 'samples': 956864, 'steps': 1868, 'loss/train': 1.6699585914611816} -09/20/2021 20:57:51 - INFO - __main__ - Step 29903: {'lr': 0.00019974581096452124, 'samples': 956896, 'steps': 1868, 'loss/train': 2.730715274810791} -09/20/2021 20:57:52 - INFO - __main__ - Step 29904: {'lr': 0.00019974581096452124, 'samples': 956928, 'steps': 1868, 'loss/train': 1.6860145330429077} -09/20/2021 20:57:53 - INFO - __main__ - Step 29905: {'lr': 0.000199745356233335, 'samples': 956960, 'steps': 1869, 'loss/train': 2.3337740898132324} -09/20/2021 20:57:54 - INFO - __main__ - Step 29906: {'lr': 0.000199745356233335, 'samples': 956992, 'steps': 1869, 'loss/train': 2.322453022003174} -09/20/2021 20:57:55 - INFO - __main__ - Step 29907: {'lr': 0.000199745356233335, 'samples': 957024, 'steps': 1869, 'loss/train': 3.0359997749328613} -09/20/2021 20:57:55 - INFO - __main__ - Step 29908: {'lr': 0.000199745356233335, 'samples': 957056, 'steps': 1869, 'loss/train': 1.894990086555481} -09/20/2021 20:57:56 - INFO - __main__ - Step 29909: {'lr': 0.000199745356233335, 'samples': 957088, 'steps': 1869, 'loss/train': 0.9488861560821533} -09/20/2021 20:57:57 - INFO - __main__ - Step 29910: {'lr': 0.000199745356233335, 'samples': 957120, 'steps': 1869, 'loss/train': 2.554065465927124} -09/20/2021 20:57:58 - INFO - __main__ - Step 29911: {'lr': 0.000199745356233335, 'samples': 957152, 'steps': 1869, 'loss/train': 1.9753377437591553} -09/20/2021 20:57:58 - INFO - __main__ - Step 29912: {'lr': 0.000199745356233335, 'samples': 957184, 'steps': 1869, 'loss/train': 2.6108908653259277} -09/20/2021 20:57:59 - INFO - __main__ - Step 29913: {'lr': 0.000199745356233335, 'samples': 957216, 'steps': 1869, 'loss/train': 2.232410430908203} -09/20/2021 20:58:00 - INFO - __main__ - Step 29914: {'lr': 0.000199745356233335, 'samples': 957248, 'steps': 1869, 'loss/train': 2.016686201095581} -09/20/2021 20:58:01 - INFO - __main__ - Step 29915: {'lr': 0.000199745356233335, 'samples': 957280, 'steps': 1869, 'loss/train': 2.2818100452423096} -09/20/2021 20:58:02 - INFO - __main__ - Step 29916: {'lr': 0.000199745356233335, 'samples': 957312, 'steps': 1869, 'loss/train': 3.1168243885040283} -09/20/2021 20:58:03 - INFO - __main__ - Step 29917: {'lr': 0.000199745356233335, 'samples': 957344, 'steps': 1869, 'loss/train': 2.3569679260253906} -09/20/2021 20:58:04 - INFO - __main__ - Step 29918: {'lr': 0.000199745356233335, 'samples': 957376, 'steps': 1869, 'loss/train': 2.3326330184936523} -09/20/2021 20:58:05 - INFO - __main__ - Step 29919: {'lr': 0.000199745356233335, 'samples': 957408, 'steps': 1869, 'loss/train': 2.9377737045288086} -09/20/2021 20:58:05 - INFO - __main__ - Step 29920: {'lr': 0.000199745356233335, 'samples': 957440, 'steps': 1869, 'loss/train': 2.206143379211426} -09/20/2021 20:58:06 - INFO - __main__ - Step 29921: {'lr': 0.0001997449010962853, 'samples': 957472, 'steps': 1870, 'loss/train': 2.4451847076416016} -09/20/2021 20:58:07 - INFO - __main__ - Step 29922: {'lr': 0.0001997449010962853, 'samples': 957504, 'steps': 1870, 'loss/train': 0.7040741443634033} -09/20/2021 20:58:08 - INFO - __main__ - Step 29923: {'lr': 0.0001997449010962853, 'samples': 957536, 'steps': 1870, 'loss/train': 2.5510690212249756} -09/20/2021 20:58:08 - INFO - __main__ - Step 29924: {'lr': 0.0001997449010962853, 'samples': 957568, 'steps': 1870, 'loss/train': 3.851832628250122} -09/20/2021 20:58:09 - INFO - __main__ - Step 29925: {'lr': 0.0001997449010962853, 'samples': 957600, 'steps': 1870, 'loss/train': 2.283003330230713} -09/20/2021 20:58:10 - INFO - __main__ - Step 29926: {'lr': 0.0001997449010962853, 'samples': 957632, 'steps': 1870, 'loss/train': 2.789891242980957} -09/20/2021 20:58:11 - INFO - __main__ - Step 29927: {'lr': 0.0001997449010962853, 'samples': 957664, 'steps': 1870, 'loss/train': 2.0488016605377197} -09/20/2021 20:58:11 - INFO - __main__ - Step 29928: {'lr': 0.0001997449010962853, 'samples': 957696, 'steps': 1870, 'loss/train': 2.9434216022491455} -09/20/2021 20:58:12 - INFO - __main__ - Step 29929: {'lr': 0.0001997449010962853, 'samples': 957728, 'steps': 1870, 'loss/train': 2.4981961250305176} -09/20/2021 20:58:13 - INFO - __main__ - Step 29930: {'lr': 0.0001997449010962853, 'samples': 957760, 'steps': 1870, 'loss/train': 2.7490761280059814} -09/20/2021 20:58:14 - INFO - __main__ - Step 29931: {'lr': 0.0001997449010962853, 'samples': 957792, 'steps': 1870, 'loss/train': 2.6121556758880615} -09/20/2021 20:58:14 - INFO - __main__ - Step 29932: {'lr': 0.0001997449010962853, 'samples': 957824, 'steps': 1870, 'loss/train': 2.9428162574768066} -09/20/2021 20:58:15 - INFO - __main__ - Step 29933: {'lr': 0.0001997449010962853, 'samples': 957856, 'steps': 1870, 'loss/train': 2.6179709434509277} -09/20/2021 20:58:16 - INFO - __main__ - Step 29934: {'lr': 0.0001997449010962853, 'samples': 957888, 'steps': 1870, 'loss/train': 1.7625120878219604} -09/20/2021 20:58:17 - INFO - __main__ - Step 29935: {'lr': 0.0001997449010962853, 'samples': 957920, 'steps': 1870, 'loss/train': 2.089482307434082} -09/20/2021 20:58:17 - INFO - __main__ - Step 29936: {'lr': 0.0001997449010962853, 'samples': 957952, 'steps': 1870, 'loss/train': 3.0628321170806885} -09/20/2021 20:58:18 - INFO - __main__ - Step 29937: {'lr': 0.000199744445553374, 'samples': 957984, 'steps': 1871, 'loss/train': 3.089139461517334} -09/20/2021 20:58:19 - INFO - __main__ - Step 29938: {'lr': 0.000199744445553374, 'samples': 958016, 'steps': 1871, 'loss/train': 2.149994373321533} -09/20/2021 20:58:20 - INFO - __main__ - Step 29939: {'lr': 0.000199744445553374, 'samples': 958048, 'steps': 1871, 'loss/train': 2.0401663780212402} -09/20/2021 20:58:21 - INFO - __main__ - Step 29940: {'lr': 0.000199744445553374, 'samples': 958080, 'steps': 1871, 'loss/train': 2.0211620330810547} -09/20/2021 20:58:21 - INFO - __main__ - Step 29941: {'lr': 0.000199744445553374, 'samples': 958112, 'steps': 1871, 'loss/train': 2.360872268676758} -09/20/2021 20:58:22 - INFO - __main__ - Step 29942: {'lr': 0.000199744445553374, 'samples': 958144, 'steps': 1871, 'loss/train': 1.873211145401001} -09/20/2021 20:58:23 - INFO - __main__ - Step 29943: {'lr': 0.000199744445553374, 'samples': 958176, 'steps': 1871, 'loss/train': 1.5784605741500854} -09/20/2021 20:58:24 - INFO - __main__ - Step 29944: {'lr': 0.000199744445553374, 'samples': 958208, 'steps': 1871, 'loss/train': 2.112746477127075} -09/20/2021 20:58:24 - INFO - __main__ - Step 29945: {'lr': 0.000199744445553374, 'samples': 958240, 'steps': 1871, 'loss/train': 1.695739984512329} -09/20/2021 20:58:25 - INFO - __main__ - Step 29946: {'lr': 0.000199744445553374, 'samples': 958272, 'steps': 1871, 'loss/train': 1.8490689992904663} -09/20/2021 20:58:26 - INFO - __main__ - Step 29947: {'lr': 0.000199744445553374, 'samples': 958304, 'steps': 1871, 'loss/train': 2.5860795974731445} -09/20/2021 20:58:27 - INFO - __main__ - Step 29948: {'lr': 0.000199744445553374, 'samples': 958336, 'steps': 1871, 'loss/train': 2.971588134765625} -09/20/2021 20:58:28 - INFO - __main__ - Step 29949: {'lr': 0.000199744445553374, 'samples': 958368, 'steps': 1871, 'loss/train': 2.776492118835449} -09/20/2021 20:58:29 - INFO - __main__ - Step 29950: {'lr': 0.000199744445553374, 'samples': 958400, 'steps': 1871, 'loss/train': 2.45184063911438} -09/20/2021 20:58:30 - INFO - __main__ - Step 29951: {'lr': 0.000199744445553374, 'samples': 958432, 'steps': 1871, 'loss/train': 3.5244407653808594} -09/20/2021 20:58:31 - INFO - __main__ - Step 29952: {'lr': 0.000199744445553374, 'samples': 958464, 'steps': 1871, 'loss/train': 2.328861713409424} -09/20/2021 20:58:31 - INFO - __main__ - Step 29953: {'lr': 0.0001997439896046029, 'samples': 958496, 'steps': 1872, 'loss/train': 3.2187387943267822} -09/20/2021 20:58:32 - INFO - __main__ - Step 29954: {'lr': 0.0001997439896046029, 'samples': 958528, 'steps': 1872, 'loss/train': 4.264629364013672} -09/20/2021 20:58:33 - INFO - __main__ - Step 29955: {'lr': 0.0001997439896046029, 'samples': 958560, 'steps': 1872, 'loss/train': 3.0707430839538574} -09/20/2021 20:58:34 - INFO - __main__ - Step 29956: {'lr': 0.0001997439896046029, 'samples': 958592, 'steps': 1872, 'loss/train': 3.0091264247894287} -09/20/2021 20:58:34 - INFO - __main__ - Step 29957: {'lr': 0.0001997439896046029, 'samples': 958624, 'steps': 1872, 'loss/train': 2.578960418701172} -09/20/2021 20:58:35 - INFO - __main__ - Step 29958: {'lr': 0.0001997439896046029, 'samples': 958656, 'steps': 1872, 'loss/train': 3.4168739318847656} -09/20/2021 20:58:36 - INFO - __main__ - Step 29959: {'lr': 0.0001997439896046029, 'samples': 958688, 'steps': 1872, 'loss/train': 2.970334529876709} -09/20/2021 20:58:37 - INFO - __main__ - Step 29960: {'lr': 0.0001997439896046029, 'samples': 958720, 'steps': 1872, 'loss/train': 2.672093152999878} -09/20/2021 20:58:37 - INFO - __main__ - Step 29961: {'lr': 0.0001997439896046029, 'samples': 958752, 'steps': 1872, 'loss/train': 2.372884750366211} -09/20/2021 20:58:38 - INFO - __main__ - Step 29962: {'lr': 0.0001997439896046029, 'samples': 958784, 'steps': 1872, 'loss/train': 1.938959002494812} -09/20/2021 20:58:39 - INFO - __main__ - Step 29963: {'lr': 0.0001997439896046029, 'samples': 958816, 'steps': 1872, 'loss/train': 3.337381601333618} -09/20/2021 20:58:40 - INFO - __main__ - Step 29964: {'lr': 0.0001997439896046029, 'samples': 958848, 'steps': 1872, 'loss/train': 2.800705909729004} -09/20/2021 20:58:40 - INFO - __main__ - Step 29965: {'lr': 0.0001997439896046029, 'samples': 958880, 'steps': 1872, 'loss/train': 2.1912450790405273} -09/20/2021 20:58:41 - INFO - __main__ - Step 29966: {'lr': 0.0001997439896046029, 'samples': 958912, 'steps': 1872, 'loss/train': 2.545070171356201} -09/20/2021 20:58:42 - INFO - __main__ - Step 29967: {'lr': 0.0001997439896046029, 'samples': 958944, 'steps': 1872, 'loss/train': 2.386786937713623} -09/20/2021 20:58:43 - INFO - __main__ - Step 29968: {'lr': 0.0001997439896046029, 'samples': 958976, 'steps': 1872, 'loss/train': 1.6212514638900757} -09/20/2021 20:58:44 - INFO - __main__ - Step 29969: {'lr': 0.00019974353324997394, 'samples': 959008, 'steps': 1873, 'loss/train': 0.6389968395233154} -09/20/2021 20:58:44 - INFO - __main__ - Step 29970: {'lr': 0.00019974353324997394, 'samples': 959040, 'steps': 1873, 'loss/train': 3.3075149059295654} -09/20/2021 20:58:45 - INFO - __main__ - Step 29971: {'lr': 0.00019974353324997394, 'samples': 959072, 'steps': 1873, 'loss/train': 1.9629955291748047} -09/20/2021 20:58:46 - INFO - __main__ - Step 29972: {'lr': 0.00019974353324997394, 'samples': 959104, 'steps': 1873, 'loss/train': 3.2994747161865234} -09/20/2021 20:58:47 - INFO - __main__ - Step 29973: {'lr': 0.00019974353324997394, 'samples': 959136, 'steps': 1873, 'loss/train': 2.1909139156341553} -09/20/2021 20:58:47 - INFO - __main__ - Step 29974: {'lr': 0.00019974353324997394, 'samples': 959168, 'steps': 1873, 'loss/train': 2.343745708465576} -09/20/2021 20:58:48 - INFO - __main__ - Step 29975: {'lr': 0.00019974353324997394, 'samples': 959200, 'steps': 1873, 'loss/train': 3.4177939891815186} -09/20/2021 20:58:49 - INFO - __main__ - Step 29976: {'lr': 0.00019974353324997394, 'samples': 959232, 'steps': 1873, 'loss/train': 2.1660521030426025} -09/20/2021 20:58:50 - INFO - __main__ - Step 29977: {'lr': 0.00019974353324997394, 'samples': 959264, 'steps': 1873, 'loss/train': 3.338578701019287} -09/20/2021 20:58:50 - INFO - __main__ - Step 29978: {'lr': 0.00019974353324997394, 'samples': 959296, 'steps': 1873, 'loss/train': 2.282470941543579} -09/20/2021 20:58:52 - INFO - __main__ - Step 29979: {'lr': 0.00019974353324997394, 'samples': 959328, 'steps': 1873, 'loss/train': 2.430034875869751} -09/20/2021 20:58:52 - INFO - __main__ - Step 29980: {'lr': 0.00019974353324997394, 'samples': 959360, 'steps': 1873, 'loss/train': 2.986492156982422} -09/20/2021 20:58:53 - INFO - __main__ - Step 29981: {'lr': 0.00019974353324997394, 'samples': 959392, 'steps': 1873, 'loss/train': 3.013296365737915} -09/20/2021 20:58:54 - INFO - __main__ - Step 29982: {'lr': 0.00019974353324997394, 'samples': 959424, 'steps': 1873, 'loss/train': 3.2030162811279297} -09/20/2021 20:58:55 - INFO - __main__ - Step 29983: {'lr': 0.00019974353324997394, 'samples': 959456, 'steps': 1873, 'loss/train': 0.8725700974464417} -09/20/2021 20:58:55 - INFO - __main__ - Step 29984: {'lr': 0.00019974353324997394, 'samples': 959488, 'steps': 1873, 'loss/train': 2.452181577682495} -09/20/2021 20:58:56 - INFO - __main__ - Step 29985: {'lr': 0.00019974307648948893, 'samples': 959520, 'steps': 1874, 'loss/train': 2.98545241355896} -09/20/2021 20:58:57 - INFO - __main__ - Step 29986: {'lr': 0.00019974307648948893, 'samples': 959552, 'steps': 1874, 'loss/train': 2.477381944656372} -09/20/2021 20:58:58 - INFO - __main__ - Step 29987: {'lr': 0.00019974307648948893, 'samples': 959584, 'steps': 1874, 'loss/train': 2.1442134380340576} -09/20/2021 20:58:59 - INFO - __main__ - Step 29988: {'lr': 0.00019974307648948893, 'samples': 959616, 'steps': 1874, 'loss/train': 3.0312328338623047} -09/20/2021 20:58:59 - INFO - __main__ - Step 29989: {'lr': 0.00019974307648948893, 'samples': 959648, 'steps': 1874, 'loss/train': 2.1082935333251953} -09/20/2021 20:59:00 - INFO - __main__ - Step 29990: {'lr': 0.00019974307648948893, 'samples': 959680, 'steps': 1874, 'loss/train': 1.7982021570205688} -09/20/2021 20:59:01 - INFO - __main__ - Step 29991: {'lr': 0.00019974307648948893, 'samples': 959712, 'steps': 1874, 'loss/train': 2.206343412399292} -09/20/2021 20:59:02 - INFO - __main__ - Step 29992: {'lr': 0.00019974307648948893, 'samples': 959744, 'steps': 1874, 'loss/train': 1.9471170902252197} -09/20/2021 20:59:02 - INFO - __main__ - Step 29993: {'lr': 0.00019974307648948893, 'samples': 959776, 'steps': 1874, 'loss/train': 2.814849853515625} -09/20/2021 20:59:03 - INFO - __main__ - Step 29994: {'lr': 0.00019974307648948893, 'samples': 959808, 'steps': 1874, 'loss/train': 1.7712830305099487} -09/20/2021 20:59:04 - INFO - __main__ - Step 29995: {'lr': 0.00019974307648948893, 'samples': 959840, 'steps': 1874, 'loss/train': 2.9757022857666016} -09/20/2021 20:59:05 - INFO - __main__ - Step 29996: {'lr': 0.00019974307648948893, 'samples': 959872, 'steps': 1874, 'loss/train': 1.98823082447052} -09/20/2021 20:59:05 - INFO - __main__ - Step 29997: {'lr': 0.00019974307648948893, 'samples': 959904, 'steps': 1874, 'loss/train': 1.3344191312789917} -09/20/2021 20:59:06 - INFO - __main__ - Step 29998: {'lr': 0.00019974307648948893, 'samples': 959936, 'steps': 1874, 'loss/train': 1.9112184047698975} -09/20/2021 20:59:07 - INFO - __main__ - Step 29999: {'lr': 0.00019974307648948893, 'samples': 959968, 'steps': 1874, 'loss/train': 2.621112108230591} -09/20/2021 20:59:08 - INFO - __main__ - Step 30000: {'lr': 0.00019974307648948893, 'samples': 960000, 'steps': 1874, 'loss/train': 1.9625228643417358} -09/20/2021 20:59:08 - INFO - __main__ - Step 30001: {'lr': 0.00019974261932314972, 'samples': 960032, 'steps': 1875, 'loss/train': 3.924936056137085} -09/20/2021 20:59:09 - INFO - __main__ - Step 30002: {'lr': 0.00019974261932314972, 'samples': 960064, 'steps': 1875, 'loss/train': 1.866645097732544} -09/20/2021 20:59:10 - INFO - __main__ - Step 30003: {'lr': 0.00019974261932314972, 'samples': 960096, 'steps': 1875, 'loss/train': 2.564316987991333} -09/20/2021 20:59:11 - INFO - __main__ - Step 30004: {'lr': 0.00019974261932314972, 'samples': 960128, 'steps': 1875, 'loss/train': 1.4985822439193726} -09/20/2021 20:59:11 - INFO - __main__ - Step 30005: {'lr': 0.00019974261932314972, 'samples': 960160, 'steps': 1875, 'loss/train': 3.0571162700653076} -09/20/2021 20:59:12 - INFO - __main__ - Step 30006: {'lr': 0.00019974261932314972, 'samples': 960192, 'steps': 1875, 'loss/train': 2.543300151824951} -09/20/2021 20:59:13 - INFO - __main__ - Step 30007: {'lr': 0.00019974261932314972, 'samples': 960224, 'steps': 1875, 'loss/train': 3.074887990951538} -09/20/2021 20:59:14 - INFO - __main__ - Step 30008: {'lr': 0.00019974261932314972, 'samples': 960256, 'steps': 1875, 'loss/train': 2.701967239379883} -09/20/2021 20:59:14 - INFO - __main__ - Step 30009: {'lr': 0.00019974261932314972, 'samples': 960288, 'steps': 1875, 'loss/train': 2.4265170097351074} -09/20/2021 20:59:15 - INFO - __main__ - Step 30010: {'lr': 0.00019974261932314972, 'samples': 960320, 'steps': 1875, 'loss/train': 2.6188743114471436} -09/20/2021 20:59:16 - INFO - __main__ - Step 30011: {'lr': 0.00019974261932314972, 'samples': 960352, 'steps': 1875, 'loss/train': 1.579565405845642} -09/20/2021 20:59:17 - INFO - __main__ - Step 30012: {'lr': 0.00019974261932314972, 'samples': 960384, 'steps': 1875, 'loss/train': 0.8857768177986145} -09/20/2021 20:59:18 - INFO - __main__ - Step 30013: {'lr': 0.00019974261932314972, 'samples': 960416, 'steps': 1875, 'loss/train': 2.1547305583953857} -09/20/2021 20:59:19 - INFO - __main__ - Step 30014: {'lr': 0.00019974261932314972, 'samples': 960448, 'steps': 1875, 'loss/train': 2.281240940093994} -09/20/2021 20:59:19 - INFO - __main__ - Step 30015: {'lr': 0.00019974261932314972, 'samples': 960480, 'steps': 1875, 'loss/train': 1.8431997299194336} -09/20/2021 20:59:20 - INFO - __main__ - Step 30016: {'lr': 0.00019974261932314972, 'samples': 960512, 'steps': 1875, 'loss/train': 2.8947012424468994} -09/20/2021 20:59:21 - INFO - __main__ - Step 30017: {'lr': 0.00019974216175095815, 'samples': 960544, 'steps': 1876, 'loss/train': 2.7645647525787354} -09/20/2021 20:59:22 - INFO - __main__ - Step 30018: {'lr': 0.00019974216175095815, 'samples': 960576, 'steps': 1876, 'loss/train': 2.8297483921051025} -09/20/2021 20:59:23 - INFO - __main__ - Step 30019: {'lr': 0.00019974216175095815, 'samples': 960608, 'steps': 1876, 'loss/train': 3.0180881023406982} -09/20/2021 20:59:23 - INFO - __main__ - Step 30020: {'lr': 0.00019974216175095815, 'samples': 960640, 'steps': 1876, 'loss/train': 2.339970827102661} -09/20/2021 20:59:24 - INFO - __main__ - Step 30021: {'lr': 0.00019974216175095815, 'samples': 960672, 'steps': 1876, 'loss/train': 2.582740545272827} -09/20/2021 20:59:25 - INFO - __main__ - Step 30022: {'lr': 0.00019974216175095815, 'samples': 960704, 'steps': 1876, 'loss/train': 1.8622733354568481} -09/20/2021 20:59:26 - INFO - __main__ - Step 30023: {'lr': 0.00019974216175095815, 'samples': 960736, 'steps': 1876, 'loss/train': 2.720708131790161} -09/20/2021 20:59:26 - INFO - __main__ - Step 30024: {'lr': 0.00019974216175095815, 'samples': 960768, 'steps': 1876, 'loss/train': 2.6723525524139404} -09/20/2021 20:59:27 - INFO - __main__ - Step 30025: {'lr': 0.00019974216175095815, 'samples': 960800, 'steps': 1876, 'loss/train': 2.8623015880584717} -09/20/2021 20:59:28 - INFO - __main__ - Step 30026: {'lr': 0.00019974216175095815, 'samples': 960832, 'steps': 1876, 'loss/train': 2.4798460006713867} -09/20/2021 20:59:29 - INFO - __main__ - Step 30027: {'lr': 0.00019974216175095815, 'samples': 960864, 'steps': 1876, 'loss/train': 2.2694389820098877} -09/20/2021 20:59:29 - INFO - __main__ - Step 30028: {'lr': 0.00019974216175095815, 'samples': 960896, 'steps': 1876, 'loss/train': 3.550048828125} -09/20/2021 20:59:30 - INFO - __main__ - Step 30029: {'lr': 0.00019974216175095815, 'samples': 960928, 'steps': 1876, 'loss/train': 2.4266092777252197} -09/20/2021 20:59:31 - INFO - __main__ - Step 30030: {'lr': 0.00019974216175095815, 'samples': 960960, 'steps': 1876, 'loss/train': 2.1214091777801514} -09/20/2021 20:59:32 - INFO - __main__ - Step 30031: {'lr': 0.00019974216175095815, 'samples': 960992, 'steps': 1876, 'loss/train': 2.147456169128418} -09/20/2021 20:59:32 - INFO - __main__ - Step 30032: {'lr': 0.00019974216175095815, 'samples': 961024, 'steps': 1876, 'loss/train': 3.1009953022003174} -09/20/2021 20:59:33 - INFO - __main__ - Step 30033: {'lr': 0.00019974170377291614, 'samples': 961056, 'steps': 1877, 'loss/train': 2.4270858764648438} -09/20/2021 20:59:34 - INFO - __main__ - Step 30034: {'lr': 0.00019974170377291614, 'samples': 961088, 'steps': 1877, 'loss/train': 1.7652552127838135} -09/20/2021 20:59:35 - INFO - __main__ - Step 30035: {'lr': 0.00019974170377291614, 'samples': 961120, 'steps': 1877, 'loss/train': 2.4484410285949707} -09/20/2021 20:59:35 - INFO - __main__ - Step 30036: {'lr': 0.00019974170377291614, 'samples': 961152, 'steps': 1877, 'loss/train': 2.514688014984131} -09/20/2021 20:59:36 - INFO - __main__ - Step 30037: {'lr': 0.00019974170377291614, 'samples': 961184, 'steps': 1877, 'loss/train': 1.5911424160003662} -09/20/2021 20:59:37 - INFO - __main__ - Step 30038: {'lr': 0.00019974170377291614, 'samples': 961216, 'steps': 1877, 'loss/train': 1.5995967388153076} -09/20/2021 20:59:38 - INFO - __main__ - Step 30039: {'lr': 0.00019974170377291614, 'samples': 961248, 'steps': 1877, 'loss/train': 3.5336296558380127} -09/20/2021 20:59:38 - INFO - __main__ - Step 30040: {'lr': 0.00019974170377291614, 'samples': 961280, 'steps': 1877, 'loss/train': 2.572286605834961} -09/20/2021 20:59:39 - INFO - __main__ - Step 30041: {'lr': 0.00019974170377291614, 'samples': 961312, 'steps': 1877, 'loss/train': 2.0803918838500977} -09/20/2021 20:59:41 - INFO - __main__ - Step 30042: {'lr': 0.00019974170377291614, 'samples': 961344, 'steps': 1877, 'loss/train': 1.472565770149231} -09/20/2021 20:59:41 - INFO - __main__ - Step 30043: {'lr': 0.00019974170377291614, 'samples': 961376, 'steps': 1877, 'loss/train': 2.2917752265930176} -09/20/2021 20:59:42 - INFO - __main__ - Step 30044: {'lr': 0.00019974170377291614, 'samples': 961408, 'steps': 1877, 'loss/train': 2.578686237335205} -09/20/2021 20:59:43 - INFO - __main__ - Step 30045: {'lr': 0.00019974170377291614, 'samples': 961440, 'steps': 1877, 'loss/train': 0.5301979780197144} -09/20/2021 20:59:44 - INFO - __main__ - Step 30046: {'lr': 0.00019974170377291614, 'samples': 961472, 'steps': 1877, 'loss/train': 0.4123939871788025} -09/20/2021 20:59:44 - INFO - __main__ - Step 30047: {'lr': 0.00019974170377291614, 'samples': 961504, 'steps': 1877, 'loss/train': 2.225358247756958} -09/20/2021 20:59:45 - INFO - __main__ - Step 30048: {'lr': 0.00019974170377291614, 'samples': 961536, 'steps': 1877, 'loss/train': 3.136326789855957} -09/20/2021 20:59:46 - INFO - __main__ - Step 30049: {'lr': 0.0001997412453890255, 'samples': 961568, 'steps': 1878, 'loss/train': 2.1988844871520996} -09/20/2021 20:59:47 - INFO - __main__ - Step 30050: {'lr': 0.0001997412453890255, 'samples': 961600, 'steps': 1878, 'loss/train': 2.390824317932129} -09/20/2021 20:59:47 - INFO - __main__ - Step 30051: {'lr': 0.0001997412453890255, 'samples': 961632, 'steps': 1878, 'loss/train': 0.4915890097618103} -09/20/2021 20:59:48 - INFO - __main__ - Step 30052: {'lr': 0.0001997412453890255, 'samples': 961664, 'steps': 1878, 'loss/train': 0.5866619348526001} -09/20/2021 20:59:49 - INFO - __main__ - Step 30053: {'lr': 0.0001997412453890255, 'samples': 961696, 'steps': 1878, 'loss/train': 0.4100806415081024} -09/20/2021 20:59:50 - INFO - __main__ - Step 30054: {'lr': 0.0001997412453890255, 'samples': 961728, 'steps': 1878, 'loss/train': 2.7376716136932373} -09/20/2021 20:59:50 - INFO - __main__ - Step 30055: {'lr': 0.0001997412453890255, 'samples': 961760, 'steps': 1878, 'loss/train': 2.3434746265411377} -09/20/2021 20:59:51 - INFO - __main__ - Step 30056: {'lr': 0.0001997412453890255, 'samples': 961792, 'steps': 1878, 'loss/train': 2.411672592163086} -09/20/2021 20:59:52 - INFO - __main__ - Step 30057: {'lr': 0.0001997412453890255, 'samples': 961824, 'steps': 1878, 'loss/train': 2.6291661262512207} -09/20/2021 20:59:53 - INFO - __main__ - Step 30058: {'lr': 0.0001997412453890255, 'samples': 961856, 'steps': 1878, 'loss/train': 2.877042055130005} -09/20/2021 20:59:53 - INFO - __main__ - Step 30059: {'lr': 0.0001997412453890255, 'samples': 961888, 'steps': 1878, 'loss/train': 2.294872522354126} -09/20/2021 20:59:54 - INFO - __main__ - Step 30060: {'lr': 0.0001997412453890255, 'samples': 961920, 'steps': 1878, 'loss/train': 3.1295461654663086} -09/20/2021 20:59:55 - INFO - __main__ - Step 30061: {'lr': 0.0001997412453890255, 'samples': 961952, 'steps': 1878, 'loss/train': 2.069946527481079} -09/20/2021 20:59:56 - INFO - __main__ - Step 30062: {'lr': 0.0001997412453890255, 'samples': 961984, 'steps': 1878, 'loss/train': 1.9374393224716187} -09/20/2021 20:59:56 - INFO - __main__ - Step 30063: {'lr': 0.0001997412453890255, 'samples': 962016, 'steps': 1878, 'loss/train': 2.6062073707580566} -09/20/2021 20:59:57 - INFO - __main__ - Step 30064: {'lr': 0.0001997412453890255, 'samples': 962048, 'steps': 1878, 'loss/train': 2.1832218170166016} -09/20/2021 20:59:58 - INFO - __main__ - Step 30065: {'lr': 0.00019974078659928816, 'samples': 962080, 'steps': 1879, 'loss/train': 2.529730796813965} -09/20/2021 20:59:59 - INFO - __main__ - Step 30066: {'lr': 0.00019974078659928816, 'samples': 962112, 'steps': 1879, 'loss/train': 1.528885006904602} -09/20/2021 21:00:00 - INFO - __main__ - Step 30067: {'lr': 0.00019974078659928816, 'samples': 962144, 'steps': 1879, 'loss/train': 1.3761593103408813} -09/20/2021 21:00:00 - INFO - __main__ - Step 30068: {'lr': 0.00019974078659928816, 'samples': 962176, 'steps': 1879, 'loss/train': 2.6762702465057373} -09/20/2021 21:00:01 - INFO - __main__ - Step 30069: {'lr': 0.00019974078659928816, 'samples': 962208, 'steps': 1879, 'loss/train': 2.3822875022888184} -09/20/2021 21:00:02 - INFO - __main__ - Step 30070: {'lr': 0.00019974078659928816, 'samples': 962240, 'steps': 1879, 'loss/train': 3.286745071411133} -09/20/2021 21:00:03 - INFO - __main__ - Step 30071: {'lr': 0.00019974078659928816, 'samples': 962272, 'steps': 1879, 'loss/train': 2.071012020111084} -09/20/2021 21:00:04 - INFO - __main__ - Step 30072: {'lr': 0.00019974078659928816, 'samples': 962304, 'steps': 1879, 'loss/train': 1.9924787282943726} -09/20/2021 21:00:05 - INFO - __main__ - Step 30073: {'lr': 0.00019974078659928816, 'samples': 962336, 'steps': 1879, 'loss/train': 2.928849935531616} -09/20/2021 21:00:05 - INFO - __main__ - Step 30074: {'lr': 0.00019974078659928816, 'samples': 962368, 'steps': 1879, 'loss/train': 2.1221001148223877} -09/20/2021 21:00:06 - INFO - __main__ - Step 30075: {'lr': 0.00019974078659928816, 'samples': 962400, 'steps': 1879, 'loss/train': 2.5015780925750732} -09/20/2021 21:00:07 - INFO - __main__ - Step 30076: {'lr': 0.00019974078659928816, 'samples': 962432, 'steps': 1879, 'loss/train': 2.0204310417175293} -09/20/2021 21:00:08 - INFO - __main__ - Step 30077: {'lr': 0.00019974078659928816, 'samples': 962464, 'steps': 1879, 'loss/train': 3.8021061420440674} -09/20/2021 21:00:08 - INFO - __main__ - Step 30078: {'lr': 0.00019974078659928816, 'samples': 962496, 'steps': 1879, 'loss/train': 2.1512134075164795} -09/20/2021 21:00:09 - INFO - __main__ - Step 30079: {'lr': 0.00019974078659928816, 'samples': 962528, 'steps': 1879, 'loss/train': 2.6929047107696533} -09/20/2021 21:00:10 - INFO - __main__ - Step 30080: {'lr': 0.00019974078659928816, 'samples': 962560, 'steps': 1879, 'loss/train': 1.7839136123657227} -09/20/2021 21:00:11 - INFO - __main__ - Step 30081: {'lr': 0.0001997403274037059, 'samples': 962592, 'steps': 1880, 'loss/train': 2.3611366748809814} -09/20/2021 21:00:11 - INFO - __main__ - Step 30082: {'lr': 0.0001997403274037059, 'samples': 962624, 'steps': 1880, 'loss/train': 2.829349994659424} -09/20/2021 21:00:12 - INFO - __main__ - Step 30083: {'lr': 0.0001997403274037059, 'samples': 962656, 'steps': 1880, 'loss/train': 0.33957064151763916} -09/20/2021 21:00:13 - INFO - __main__ - Step 30084: {'lr': 0.0001997403274037059, 'samples': 962688, 'steps': 1880, 'loss/train': 0.3292071521282196} -09/20/2021 21:00:14 - INFO - __main__ - Step 30085: {'lr': 0.0001997403274037059, 'samples': 962720, 'steps': 1880, 'loss/train': 2.4188623428344727} -09/20/2021 21:00:14 - INFO - __main__ - Step 30086: {'lr': 0.0001997403274037059, 'samples': 962752, 'steps': 1880, 'loss/train': 0.8270019888877869} -09/20/2021 21:00:15 - INFO - __main__ - Step 30087: {'lr': 0.0001997403274037059, 'samples': 962784, 'steps': 1880, 'loss/train': 4.016932487487793} -09/20/2021 21:00:16 - INFO - __main__ - Step 30088: {'lr': 0.0001997403274037059, 'samples': 962816, 'steps': 1880, 'loss/train': 2.049971580505371} -09/20/2021 21:00:17 - INFO - __main__ - Step 30089: {'lr': 0.0001997403274037059, 'samples': 962848, 'steps': 1880, 'loss/train': 3.0852019786834717} -09/20/2021 21:00:17 - INFO - __main__ - Step 30090: {'lr': 0.0001997403274037059, 'samples': 962880, 'steps': 1880, 'loss/train': 2.3855931758880615} -09/20/2021 21:00:18 - INFO - __main__ - Step 30091: {'lr': 0.0001997403274037059, 'samples': 962912, 'steps': 1880, 'loss/train': 2.535163640975952} -09/20/2021 21:00:19 - INFO - __main__ - Step 30092: {'lr': 0.0001997403274037059, 'samples': 962944, 'steps': 1880, 'loss/train': 2.747154474258423} -09/20/2021 21:00:20 - INFO - __main__ - Step 30093: {'lr': 0.0001997403274037059, 'samples': 962976, 'steps': 1880, 'loss/train': 2.3118653297424316} -09/20/2021 21:00:20 - INFO - __main__ - Step 30094: {'lr': 0.0001997403274037059, 'samples': 963008, 'steps': 1880, 'loss/train': 2.4309446811676025} -09/20/2021 21:00:21 - INFO - __main__ - Step 30095: {'lr': 0.0001997403274037059, 'samples': 963040, 'steps': 1880, 'loss/train': 1.8596348762512207} -09/20/2021 21:00:22 - INFO - __main__ - Step 30096: {'lr': 0.0001997403274037059, 'samples': 963072, 'steps': 1880, 'loss/train': 2.9468636512756348} -09/20/2021 21:00:23 - INFO - __main__ - Step 30097: {'lr': 0.00019973986780228066, 'samples': 963104, 'steps': 1881, 'loss/train': 2.354750156402588} -09/20/2021 21:00:24 - INFO - __main__ - Step 30098: {'lr': 0.00019973986780228066, 'samples': 963136, 'steps': 1881, 'loss/train': 1.696028709411621} -09/20/2021 21:00:24 - INFO - __main__ - Step 30099: {'lr': 0.00019973986780228066, 'samples': 963168, 'steps': 1881, 'loss/train': 2.3815159797668457} -09/20/2021 21:00:25 - INFO - __main__ - Step 30100: {'lr': 0.00019973986780228066, 'samples': 963200, 'steps': 1881, 'loss/train': 2.5932929515838623} -09/20/2021 21:00:26 - INFO - __main__ - Step 30101: {'lr': 0.00019973986780228066, 'samples': 963232, 'steps': 1881, 'loss/train': 2.101423501968384} -09/20/2021 21:00:27 - INFO - __main__ - Step 30102: {'lr': 0.00019973986780228066, 'samples': 963264, 'steps': 1881, 'loss/train': 2.8991293907165527} -09/20/2021 21:00:27 - INFO - __main__ - Step 30103: {'lr': 0.00019973986780228066, 'samples': 963296, 'steps': 1881, 'loss/train': 2.4620440006256104} -09/20/2021 21:00:28 - INFO - __main__ - Step 30104: {'lr': 0.00019973986780228066, 'samples': 963328, 'steps': 1881, 'loss/train': 1.9806486368179321} -09/20/2021 21:00:29 - INFO - __main__ - Step 30105: {'lr': 0.00019973986780228066, 'samples': 963360, 'steps': 1881, 'loss/train': 2.7441818714141846} -09/20/2021 21:00:30 - INFO - __main__ - Step 30106: {'lr': 0.00019973986780228066, 'samples': 963392, 'steps': 1881, 'loss/train': 5.046632766723633} -09/20/2021 21:00:31 - INFO - __main__ - Step 30107: {'lr': 0.00019973986780228066, 'samples': 963424, 'steps': 1881, 'loss/train': 5.093359470367432} -09/20/2021 21:00:32 - INFO - __main__ - Step 30108: {'lr': 0.00019973986780228066, 'samples': 963456, 'steps': 1881, 'loss/train': 5.579679012298584} -09/20/2021 21:00:32 - INFO - __main__ - Step 30109: {'lr': 0.00019973986780228066, 'samples': 963488, 'steps': 1881, 'loss/train': 1.97396981716156} -09/20/2021 21:00:33 - INFO - __main__ - Step 30110: {'lr': 0.00019973986780228066, 'samples': 963520, 'steps': 1881, 'loss/train': 2.960719585418701} -09/20/2021 21:00:34 - INFO - __main__ - Step 30111: {'lr': 0.00019973986780228066, 'samples': 963552, 'steps': 1881, 'loss/train': 2.7229270935058594} -09/20/2021 21:00:35 - INFO - __main__ - Step 30112: {'lr': 0.00019973986780228066, 'samples': 963584, 'steps': 1881, 'loss/train': 2.4657692909240723} -09/20/2021 21:00:36 - INFO - __main__ - Step 30113: {'lr': 0.00019973940779501428, 'samples': 963616, 'steps': 1882, 'loss/train': 2.285543918609619} -09/20/2021 21:00:36 - INFO - __main__ - Step 30114: {'lr': 0.00019973940779501428, 'samples': 963648, 'steps': 1882, 'loss/train': 2.6947154998779297} -09/20/2021 21:00:37 - INFO - __main__ - Step 30115: {'lr': 0.00019973940779501428, 'samples': 963680, 'steps': 1882, 'loss/train': 2.2558794021606445} -09/20/2021 21:00:38 - INFO - __main__ - Step 30116: {'lr': 0.00019973940779501428, 'samples': 963712, 'steps': 1882, 'loss/train': 2.09887957572937} -09/20/2021 21:00:39 - INFO - __main__ - Step 30117: {'lr': 0.00019973940779501428, 'samples': 963744, 'steps': 1882, 'loss/train': 1.8156400918960571} -09/20/2021 21:00:39 - INFO - __main__ - Step 30118: {'lr': 0.00019973940779501428, 'samples': 963776, 'steps': 1882, 'loss/train': 2.249807596206665} -09/20/2021 21:00:40 - INFO - __main__ - Step 30119: {'lr': 0.00019973940779501428, 'samples': 963808, 'steps': 1882, 'loss/train': 1.9201098680496216} -09/20/2021 21:00:41 - INFO - __main__ - Step 30120: {'lr': 0.00019973940779501428, 'samples': 963840, 'steps': 1882, 'loss/train': 1.7281873226165771} -09/20/2021 21:00:42 - INFO - __main__ - Step 30121: {'lr': 0.00019973940779501428, 'samples': 963872, 'steps': 1882, 'loss/train': 1.4988093376159668} -09/20/2021 21:00:42 - INFO - __main__ - Step 30122: {'lr': 0.00019973940779501428, 'samples': 963904, 'steps': 1882, 'loss/train': 3.297814130783081} -09/20/2021 21:00:43 - INFO - __main__ - Step 30123: {'lr': 0.00019973940779501428, 'samples': 963936, 'steps': 1882, 'loss/train': 2.1349539756774902} -09/20/2021 21:00:44 - INFO - __main__ - Step 30124: {'lr': 0.00019973940779501428, 'samples': 963968, 'steps': 1882, 'loss/train': 1.8666801452636719} -09/20/2021 21:00:45 - INFO - __main__ - Step 30125: {'lr': 0.00019973940779501428, 'samples': 964000, 'steps': 1882, 'loss/train': 2.1724348068237305} -09/20/2021 21:00:45 - INFO - __main__ - Step 30126: {'lr': 0.00019973940779501428, 'samples': 964032, 'steps': 1882, 'loss/train': 1.8218532800674438} -09/20/2021 21:00:46 - INFO - __main__ - Step 30127: {'lr': 0.00019973940779501428, 'samples': 964064, 'steps': 1882, 'loss/train': 4.222012996673584} -09/20/2021 21:00:47 - INFO - __main__ - Step 30128: {'lr': 0.00019973940779501428, 'samples': 964096, 'steps': 1882, 'loss/train': 2.3855857849121094} -09/20/2021 21:00:48 - INFO - __main__ - Step 30129: {'lr': 0.00019973894738190863, 'samples': 964128, 'steps': 1883, 'loss/train': 2.6361069679260254} -09/20/2021 21:00:48 - INFO - __main__ - Step 30130: {'lr': 0.00019973894738190863, 'samples': 964160, 'steps': 1883, 'loss/train': 3.298344373703003} -09/20/2021 21:00:49 - INFO - __main__ - Step 30131: {'lr': 0.00019973894738190863, 'samples': 964192, 'steps': 1883, 'loss/train': 3.0961222648620605} -09/20/2021 21:00:50 - INFO - __main__ - Step 30132: {'lr': 0.00019973894738190863, 'samples': 964224, 'steps': 1883, 'loss/train': 2.6389212608337402} -09/20/2021 21:00:51 - INFO - __main__ - Step 30133: {'lr': 0.00019973894738190863, 'samples': 964256, 'steps': 1883, 'loss/train': 2.4509384632110596} -09/20/2021 21:00:51 - INFO - __main__ - Step 30134: {'lr': 0.00019973894738190863, 'samples': 964288, 'steps': 1883, 'loss/train': 3.015997886657715} -09/20/2021 21:00:52 - INFO - __main__ - Step 30135: {'lr': 0.00019973894738190863, 'samples': 964320, 'steps': 1883, 'loss/train': 2.554297685623169} -09/20/2021 21:00:53 - INFO - __main__ - Step 30136: {'lr': 0.00019973894738190863, 'samples': 964352, 'steps': 1883, 'loss/train': 2.4984495639801025} -09/20/2021 21:00:54 - INFO - __main__ - Step 30137: {'lr': 0.00019973894738190863, 'samples': 964384, 'steps': 1883, 'loss/train': 1.7709765434265137} -09/20/2021 21:00:55 - INFO - __main__ - Step 30138: {'lr': 0.00019973894738190863, 'samples': 964416, 'steps': 1883, 'loss/train': 2.8449087142944336} -09/20/2021 21:00:56 - INFO - __main__ - Step 30139: {'lr': 0.00019973894738190863, 'samples': 964448, 'steps': 1883, 'loss/train': 2.445186138153076} -09/20/2021 21:00:57 - INFO - __main__ - Step 30140: {'lr': 0.00019973894738190863, 'samples': 964480, 'steps': 1883, 'loss/train': 2.3723881244659424} -09/20/2021 21:00:57 - INFO - __main__ - Step 30141: {'lr': 0.00019973894738190863, 'samples': 964512, 'steps': 1883, 'loss/train': 2.4635496139526367} -09/20/2021 21:00:58 - INFO - __main__ - Step 30142: {'lr': 0.00019973894738190863, 'samples': 964544, 'steps': 1883, 'loss/train': 3.171642780303955} -09/20/2021 21:00:59 - INFO - __main__ - Step 30143: {'lr': 0.00019973894738190863, 'samples': 964576, 'steps': 1883, 'loss/train': 3.238860607147217} -09/20/2021 21:01:00 - INFO - __main__ - Step 30144: {'lr': 0.00019973894738190863, 'samples': 964608, 'steps': 1883, 'loss/train': 2.6840322017669678} -09/20/2021 21:01:01 - INFO - __main__ - Step 30145: {'lr': 0.0001997384865629656, 'samples': 964640, 'steps': 1884, 'loss/train': 2.0868449211120605} -09/20/2021 21:01:01 - INFO - __main__ - Step 30146: {'lr': 0.0001997384865629656, 'samples': 964672, 'steps': 1884, 'loss/train': 2.280076742172241} -09/20/2021 21:01:02 - INFO - __main__ - Step 30147: {'lr': 0.0001997384865629656, 'samples': 964704, 'steps': 1884, 'loss/train': 2.8336172103881836} -09/20/2021 21:01:03 - INFO - __main__ - Step 30148: {'lr': 0.0001997384865629656, 'samples': 964736, 'steps': 1884, 'loss/train': 2.6451122760772705} -09/20/2021 21:01:04 - INFO - __main__ - Step 30149: {'lr': 0.0001997384865629656, 'samples': 964768, 'steps': 1884, 'loss/train': 2.345970869064331} -09/20/2021 21:01:04 - INFO - __main__ - Step 30150: {'lr': 0.0001997384865629656, 'samples': 964800, 'steps': 1884, 'loss/train': 2.0917022228240967} -09/20/2021 21:01:05 - INFO - __main__ - Step 30151: {'lr': 0.0001997384865629656, 'samples': 964832, 'steps': 1884, 'loss/train': 2.5389020442962646} -09/20/2021 21:01:06 - INFO - __main__ - Step 30152: {'lr': 0.0001997384865629656, 'samples': 964864, 'steps': 1884, 'loss/train': 4.034683704376221} -09/20/2021 21:01:07 - INFO - __main__ - Step 30153: {'lr': 0.0001997384865629656, 'samples': 964896, 'steps': 1884, 'loss/train': 2.7787673473358154} -09/20/2021 21:01:07 - INFO - __main__ - Step 30154: {'lr': 0.0001997384865629656, 'samples': 964928, 'steps': 1884, 'loss/train': 2.5389111042022705} -09/20/2021 21:01:08 - INFO - __main__ - Step 30155: {'lr': 0.0001997384865629656, 'samples': 964960, 'steps': 1884, 'loss/train': 2.760854482650757} -09/20/2021 21:01:09 - INFO - __main__ - Step 30156: {'lr': 0.0001997384865629656, 'samples': 964992, 'steps': 1884, 'loss/train': 2.380943536758423} -09/20/2021 21:01:10 - INFO - __main__ - Step 30157: {'lr': 0.0001997384865629656, 'samples': 965024, 'steps': 1884, 'loss/train': 2.68630313873291} -09/20/2021 21:01:10 - INFO - __main__ - Step 30158: {'lr': 0.0001997384865629656, 'samples': 965056, 'steps': 1884, 'loss/train': 2.663944959640503} -09/20/2021 21:01:11 - INFO - __main__ - Step 30159: {'lr': 0.0001997384865629656, 'samples': 965088, 'steps': 1884, 'loss/train': 2.5571703910827637} -09/20/2021 21:01:12 - INFO - __main__ - Step 30160: {'lr': 0.0001997384865629656, 'samples': 965120, 'steps': 1884, 'loss/train': 2.1908605098724365} -09/20/2021 21:01:13 - INFO - __main__ - Step 30161: {'lr': 0.00019973802533818706, 'samples': 965152, 'steps': 1885, 'loss/train': 2.938832998275757} -09/20/2021 21:01:13 - INFO - __main__ - Step 30162: {'lr': 0.00019973802533818706, 'samples': 965184, 'steps': 1885, 'loss/train': 2.123464584350586} -09/20/2021 21:01:14 - INFO - __main__ - Step 30163: {'lr': 0.00019973802533818706, 'samples': 965216, 'steps': 1885, 'loss/train': 2.1617555618286133} -09/20/2021 21:01:15 - INFO - __main__ - Step 30164: {'lr': 0.00019973802533818706, 'samples': 965248, 'steps': 1885, 'loss/train': 2.575578451156616} -09/20/2021 21:01:16 - INFO - __main__ - Step 30165: {'lr': 0.00019973802533818706, 'samples': 965280, 'steps': 1885, 'loss/train': 3.3216824531555176} -09/20/2021 21:01:16 - INFO - __main__ - Step 30166: {'lr': 0.00019973802533818706, 'samples': 965312, 'steps': 1885, 'loss/train': 3.9678726196289062} -09/20/2021 21:01:17 - INFO - __main__ - Step 30167: {'lr': 0.00019973802533818706, 'samples': 965344, 'steps': 1885, 'loss/train': 4.272182464599609} -09/20/2021 21:01:18 - INFO - __main__ - Step 30168: {'lr': 0.00019973802533818706, 'samples': 965376, 'steps': 1885, 'loss/train': 1.2544962167739868} -09/20/2021 21:01:19 - INFO - __main__ - Step 30169: {'lr': 0.00019973802533818706, 'samples': 965408, 'steps': 1885, 'loss/train': 1.2865524291992188} -09/20/2021 21:01:20 - INFO - __main__ - Step 30170: {'lr': 0.00019973802533818706, 'samples': 965440, 'steps': 1885, 'loss/train': 2.312854528427124} -09/20/2021 21:01:21 - INFO - __main__ - Step 30171: {'lr': 0.00019973802533818706, 'samples': 965472, 'steps': 1885, 'loss/train': 3.054591655731201} -09/20/2021 21:01:22 - INFO - __main__ - Step 30172: {'lr': 0.00019973802533818706, 'samples': 965504, 'steps': 1885, 'loss/train': 2.0958681106567383} -09/20/2021 21:01:22 - INFO - __main__ - Step 30173: {'lr': 0.00019973802533818706, 'samples': 965536, 'steps': 1885, 'loss/train': 2.426330804824829} -09/20/2021 21:01:23 - INFO - __main__ - Step 30174: {'lr': 0.00019973802533818706, 'samples': 965568, 'steps': 1885, 'loss/train': 2.463160991668701} -09/20/2021 21:01:24 - INFO - __main__ - Step 30175: {'lr': 0.00019973802533818706, 'samples': 965600, 'steps': 1885, 'loss/train': 1.8907452821731567} -09/20/2021 21:01:25 - INFO - __main__ - Step 30176: {'lr': 0.00019973802533818706, 'samples': 965632, 'steps': 1885, 'loss/train': 2.0524327754974365} -09/20/2021 21:01:25 - INFO - __main__ - Step 30177: {'lr': 0.00019973756370757486, 'samples': 965664, 'steps': 1886, 'loss/train': 2.727170944213867} -09/20/2021 21:01:26 - INFO - __main__ - Step 30178: {'lr': 0.00019973756370757486, 'samples': 965696, 'steps': 1886, 'loss/train': 2.1371257305145264} -09/20/2021 21:01:27 - INFO - __main__ - Step 30179: {'lr': 0.00019973756370757486, 'samples': 965728, 'steps': 1886, 'loss/train': 2.9331281185150146} -09/20/2021 21:01:28 - INFO - __main__ - Step 30180: {'lr': 0.00019973756370757486, 'samples': 965760, 'steps': 1886, 'loss/train': 3.0522446632385254} -09/20/2021 21:01:28 - INFO - __main__ - Step 30181: {'lr': 0.00019973756370757486, 'samples': 965792, 'steps': 1886, 'loss/train': 2.1053390502929688} -09/20/2021 21:01:29 - INFO - __main__ - Step 30182: {'lr': 0.00019973756370757486, 'samples': 965824, 'steps': 1886, 'loss/train': 2.459050178527832} -09/20/2021 21:01:30 - INFO - __main__ - Step 30183: {'lr': 0.00019973756370757486, 'samples': 965856, 'steps': 1886, 'loss/train': 2.375675678253174} -09/20/2021 21:01:31 - INFO - __main__ - Step 30184: {'lr': 0.00019973756370757486, 'samples': 965888, 'steps': 1886, 'loss/train': 2.4194369316101074} -09/20/2021 21:01:31 - INFO - __main__ - Step 30185: {'lr': 0.00019973756370757486, 'samples': 965920, 'steps': 1886, 'loss/train': 2.263158082962036} -09/20/2021 21:01:32 - INFO - __main__ - Step 30186: {'lr': 0.00019973756370757486, 'samples': 965952, 'steps': 1886, 'loss/train': 2.2263338565826416} -09/20/2021 21:01:33 - INFO - __main__ - Step 30187: {'lr': 0.00019973756370757486, 'samples': 965984, 'steps': 1886, 'loss/train': 1.8491512537002563} -09/20/2021 21:01:34 - INFO - __main__ - Step 30188: {'lr': 0.00019973756370757486, 'samples': 966016, 'steps': 1886, 'loss/train': 1.7441326379776} -09/20/2021 21:01:34 - INFO - __main__ - Step 30189: {'lr': 0.00019973756370757486, 'samples': 966048, 'steps': 1886, 'loss/train': 2.4688992500305176} -09/20/2021 21:01:35 - INFO - __main__ - Step 30190: {'lr': 0.00019973756370757486, 'samples': 966080, 'steps': 1886, 'loss/train': 1.2889530658721924} -09/20/2021 21:01:36 - INFO - __main__ - Step 30191: {'lr': 0.00019973756370757486, 'samples': 966112, 'steps': 1886, 'loss/train': 1.6988626718521118} -09/20/2021 21:01:37 - INFO - __main__ - Step 30192: {'lr': 0.00019973756370757486, 'samples': 966144, 'steps': 1886, 'loss/train': 1.2743659019470215} -09/20/2021 21:01:38 - INFO - __main__ - Step 30193: {'lr': 0.00019973710167113092, 'samples': 966176, 'steps': 1887, 'loss/train': 2.4482669830322266} -09/20/2021 21:01:38 - INFO - __main__ - Step 30194: {'lr': 0.00019973710167113092, 'samples': 966208, 'steps': 1887, 'loss/train': 1.9192876815795898} -09/20/2021 21:01:39 - INFO - __main__ - Step 30195: {'lr': 0.00019973710167113092, 'samples': 966240, 'steps': 1887, 'loss/train': 1.625113606452942} -09/20/2021 21:01:40 - INFO - __main__ - Step 30196: {'lr': 0.00019973710167113092, 'samples': 966272, 'steps': 1887, 'loss/train': 2.8233838081359863} -09/20/2021 21:01:41 - INFO - __main__ - Step 30197: {'lr': 0.00019973710167113092, 'samples': 966304, 'steps': 1887, 'loss/train': 2.427076578140259} -09/20/2021 21:01:41 - INFO - __main__ - Step 30198: {'lr': 0.00019973710167113092, 'samples': 966336, 'steps': 1887, 'loss/train': 1.5089242458343506} -09/20/2021 21:01:42 - INFO - __main__ - Step 30199: {'lr': 0.00019973710167113092, 'samples': 966368, 'steps': 1887, 'loss/train': 2.4598822593688965} -09/20/2021 21:01:43 - INFO - __main__ - Step 30200: {'lr': 0.00019973710167113092, 'samples': 966400, 'steps': 1887, 'loss/train': 1.9965300559997559} -09/20/2021 21:01:44 - INFO - __main__ - Step 30201: {'lr': 0.00019973710167113092, 'samples': 966432, 'steps': 1887, 'loss/train': 2.174894332885742} -09/20/2021 21:01:45 - INFO - __main__ - Step 30202: {'lr': 0.00019973710167113092, 'samples': 966464, 'steps': 1887, 'loss/train': 2.618293285369873} -09/20/2021 21:01:46 - INFO - __main__ - Step 30203: {'lr': 0.00019973710167113092, 'samples': 966496, 'steps': 1887, 'loss/train': 1.899133563041687} -09/20/2021 21:01:46 - INFO - __main__ - Step 30204: {'lr': 0.00019973710167113092, 'samples': 966528, 'steps': 1887, 'loss/train': 2.3244993686676025} -09/20/2021 21:01:47 - INFO - __main__ - Step 30205: {'lr': 0.00019973710167113092, 'samples': 966560, 'steps': 1887, 'loss/train': 2.038140058517456} -09/20/2021 21:01:48 - INFO - __main__ - Step 30206: {'lr': 0.00019973710167113092, 'samples': 966592, 'steps': 1887, 'loss/train': 1.9220612049102783} -09/20/2021 21:01:49 - INFO - __main__ - Step 30207: {'lr': 0.00019973710167113092, 'samples': 966624, 'steps': 1887, 'loss/train': 2.721193552017212} -09/20/2021 21:01:49 - INFO - __main__ - Step 30208: {'lr': 0.00019973710167113092, 'samples': 966656, 'steps': 1887, 'loss/train': 2.0774612426757812} -09/20/2021 21:01:50 - INFO - __main__ - Step 30209: {'lr': 0.0001997366392288571, 'samples': 966688, 'steps': 1888, 'loss/train': 2.8311049938201904} -09/20/2021 21:01:51 - INFO - __main__ - Step 30210: {'lr': 0.0001997366392288571, 'samples': 966720, 'steps': 1888, 'loss/train': 1.1771740913391113} -09/20/2021 21:01:52 - INFO - __main__ - Step 30211: {'lr': 0.0001997366392288571, 'samples': 966752, 'steps': 1888, 'loss/train': 3.1123430728912354} -09/20/2021 21:01:52 - INFO - __main__ - Step 30212: {'lr': 0.0001997366392288571, 'samples': 966784, 'steps': 1888, 'loss/train': 3.1593713760375977} -09/20/2021 21:01:53 - INFO - __main__ - Step 30213: {'lr': 0.0001997366392288571, 'samples': 966816, 'steps': 1888, 'loss/train': 2.173417806625366} -09/20/2021 21:01:54 - INFO - __main__ - Step 30214: {'lr': 0.0001997366392288571, 'samples': 966848, 'steps': 1888, 'loss/train': 1.759141206741333} -09/20/2021 21:01:55 - INFO - __main__ - Step 30215: {'lr': 0.0001997366392288571, 'samples': 966880, 'steps': 1888, 'loss/train': 3.057960271835327} -09/20/2021 21:01:55 - INFO - __main__ - Step 30216: {'lr': 0.0001997366392288571, 'samples': 966912, 'steps': 1888, 'loss/train': 2.8618969917297363} -09/20/2021 21:01:56 - INFO - __main__ - Step 30217: {'lr': 0.0001997366392288571, 'samples': 966944, 'steps': 1888, 'loss/train': 1.1091011762619019} -09/20/2021 21:01:57 - INFO - __main__ - Step 30218: {'lr': 0.0001997366392288571, 'samples': 966976, 'steps': 1888, 'loss/train': 3.3773491382598877} -09/20/2021 21:01:58 - INFO - __main__ - Step 30219: {'lr': 0.0001997366392288571, 'samples': 967008, 'steps': 1888, 'loss/train': 2.024721622467041} -09/20/2021 21:01:58 - INFO - __main__ - Step 30220: {'lr': 0.0001997366392288571, 'samples': 967040, 'steps': 1888, 'loss/train': 1.073393702507019} -09/20/2021 21:01:59 - INFO - __main__ - Step 30221: {'lr': 0.0001997366392288571, 'samples': 967072, 'steps': 1888, 'loss/train': 2.6722848415374756} -09/20/2021 21:02:00 - INFO - __main__ - Step 30222: {'lr': 0.0001997366392288571, 'samples': 967104, 'steps': 1888, 'loss/train': 1.702574610710144} -09/20/2021 21:02:01 - INFO - __main__ - Step 30223: {'lr': 0.0001997366392288571, 'samples': 967136, 'steps': 1888, 'loss/train': 0.823093593120575} -09/20/2021 21:02:01 - INFO - __main__ - Step 30224: {'lr': 0.0001997366392288571, 'samples': 967168, 'steps': 1888, 'loss/train': 1.8553386926651} -09/20/2021 21:02:02 - INFO - __main__ - Step 30225: {'lr': 0.0001997361763807553, 'samples': 967200, 'steps': 1889, 'loss/train': 2.4653213024139404} -09/20/2021 21:02:03 - INFO - __main__ - Step 30226: {'lr': 0.0001997361763807553, 'samples': 967232, 'steps': 1889, 'loss/train': 2.888474225997925} -09/20/2021 21:02:04 - INFO - __main__ - Step 30227: {'lr': 0.0001997361763807553, 'samples': 967264, 'steps': 1889, 'loss/train': 2.1202986240386963} -09/20/2021 21:02:05 - INFO - __main__ - Step 30228: {'lr': 0.0001997361763807553, 'samples': 967296, 'steps': 1889, 'loss/train': 3.0753417015075684} -09/20/2021 21:02:05 - INFO - __main__ - Step 30229: {'lr': 0.0001997361763807553, 'samples': 967328, 'steps': 1889, 'loss/train': 2.8262922763824463} -09/20/2021 21:02:06 - INFO - __main__ - Step 30230: {'lr': 0.0001997361763807553, 'samples': 967360, 'steps': 1889, 'loss/train': 1.6720197200775146} -09/20/2021 21:02:07 - INFO - __main__ - Step 30231: {'lr': 0.0001997361763807553, 'samples': 967392, 'steps': 1889, 'loss/train': 2.688164234161377} -09/20/2021 21:02:08 - INFO - __main__ - Step 30232: {'lr': 0.0001997361763807553, 'samples': 967424, 'steps': 1889, 'loss/train': 1.7728692293167114} -09/20/2021 21:02:09 - INFO - __main__ - Step 30233: {'lr': 0.0001997361763807553, 'samples': 967456, 'steps': 1889, 'loss/train': 2.5315587520599365} -09/20/2021 21:02:10 - INFO - __main__ - Step 30234: {'lr': 0.0001997361763807553, 'samples': 967488, 'steps': 1889, 'loss/train': 1.8200188875198364} -09/20/2021 21:02:11 - INFO - __main__ - Step 30235: {'lr': 0.0001997361763807553, 'samples': 967520, 'steps': 1889, 'loss/train': 2.172333002090454} -09/20/2021 21:02:12 - INFO - __main__ - Step 30236: {'lr': 0.0001997361763807553, 'samples': 967552, 'steps': 1889, 'loss/train': 2.030797004699707} -09/20/2021 21:02:12 - INFO - __main__ - Step 30237: {'lr': 0.0001997361763807553, 'samples': 967584, 'steps': 1889, 'loss/train': 2.115450143814087} -09/20/2021 21:02:13 - INFO - __main__ - Step 30238: {'lr': 0.0001997361763807553, 'samples': 967616, 'steps': 1889, 'loss/train': 1.5788145065307617} -09/20/2021 21:02:14 - INFO - __main__ - Step 30239: {'lr': 0.0001997361763807553, 'samples': 967648, 'steps': 1889, 'loss/train': 1.7989205121994019} -09/20/2021 21:02:15 - INFO - __main__ - Step 30240: {'lr': 0.0001997361763807553, 'samples': 967680, 'steps': 1889, 'loss/train': 2.9015793800354004} -09/20/2021 21:02:15 - INFO - __main__ - Step 30241: {'lr': 0.00019973571312682735, 'samples': 967712, 'steps': 1890, 'loss/train': 1.2262017726898193} -09/20/2021 21:02:16 - INFO - __main__ - Step 30242: {'lr': 0.00019973571312682735, 'samples': 967744, 'steps': 1890, 'loss/train': 2.1811792850494385} -09/20/2021 21:02:17 - INFO - __main__ - Step 30243: {'lr': 0.00019973571312682735, 'samples': 967776, 'steps': 1890, 'loss/train': 2.2304415702819824} -09/20/2021 21:02:18 - INFO - __main__ - Step 30244: {'lr': 0.00019973571312682735, 'samples': 967808, 'steps': 1890, 'loss/train': 2.4001352787017822} -09/20/2021 21:02:18 - INFO - __main__ - Step 30245: {'lr': 0.00019973571312682735, 'samples': 967840, 'steps': 1890, 'loss/train': 2.7536540031433105} -09/20/2021 21:02:19 - INFO - __main__ - Step 30246: {'lr': 0.00019973571312682735, 'samples': 967872, 'steps': 1890, 'loss/train': 2.503023862838745} -09/20/2021 21:02:20 - INFO - __main__ - Step 30247: {'lr': 0.00019973571312682735, 'samples': 967904, 'steps': 1890, 'loss/train': 2.8532981872558594} -09/20/2021 21:02:21 - INFO - __main__ - Step 30248: {'lr': 0.00019973571312682735, 'samples': 967936, 'steps': 1890, 'loss/train': 2.594489336013794} -09/20/2021 21:02:21 - INFO - __main__ - Step 30249: {'lr': 0.00019973571312682735, 'samples': 967968, 'steps': 1890, 'loss/train': 1.3521872758865356} -09/20/2021 21:02:22 - INFO - __main__ - Step 30250: {'lr': 0.00019973571312682735, 'samples': 968000, 'steps': 1890, 'loss/train': 2.4915425777435303} -09/20/2021 21:02:23 - INFO - __main__ - Step 30251: {'lr': 0.00019973571312682735, 'samples': 968032, 'steps': 1890, 'loss/train': 2.6007251739501953} -09/20/2021 21:02:24 - INFO - __main__ - Step 30252: {'lr': 0.00019973571312682735, 'samples': 968064, 'steps': 1890, 'loss/train': 2.850996255874634} -09/20/2021 21:02:24 - INFO - __main__ - Step 30253: {'lr': 0.00019973571312682735, 'samples': 968096, 'steps': 1890, 'loss/train': 2.848054885864258} -09/20/2021 21:02:25 - INFO - __main__ - Step 30254: {'lr': 0.00019973571312682735, 'samples': 968128, 'steps': 1890, 'loss/train': 2.9607045650482178} -09/20/2021 21:02:26 - INFO - __main__ - Step 30255: {'lr': 0.00019973571312682735, 'samples': 968160, 'steps': 1890, 'loss/train': 3.281853675842285} -09/20/2021 21:02:27 - INFO - __main__ - Step 30256: {'lr': 0.00019973571312682735, 'samples': 968192, 'steps': 1890, 'loss/train': 4.673695087432861} -09/20/2021 21:02:28 - INFO - __main__ - Step 30257: {'lr': 0.00019973524946707518, 'samples': 968224, 'steps': 1891, 'loss/train': 0.9092211127281189} -09/20/2021 21:02:28 - INFO - __main__ - Step 30258: {'lr': 0.00019973524946707518, 'samples': 968256, 'steps': 1891, 'loss/train': 0.9680839776992798} -09/20/2021 21:02:29 - INFO - __main__ - Step 30259: {'lr': 0.00019973524946707518, 'samples': 968288, 'steps': 1891, 'loss/train': 1.0076593160629272} -09/20/2021 21:02:30 - INFO - __main__ - Step 30260: {'lr': 0.00019973524946707518, 'samples': 968320, 'steps': 1891, 'loss/train': 0.7918854355812073} -09/20/2021 21:02:31 - INFO - __main__ - Step 30261: {'lr': 0.00019973524946707518, 'samples': 968352, 'steps': 1891, 'loss/train': 0.8866670727729797} -09/20/2021 21:02:31 - INFO - __main__ - Step 30262: {'lr': 0.00019973524946707518, 'samples': 968384, 'steps': 1891, 'loss/train': 1.0284714698791504} -09/20/2021 21:02:32 - INFO - __main__ - Step 30263: {'lr': 0.00019973524946707518, 'samples': 968416, 'steps': 1891, 'loss/train': 0.9436078071594238} -09/20/2021 21:02:33 - INFO - __main__ - Step 30264: {'lr': 0.00019973524946707518, 'samples': 968448, 'steps': 1891, 'loss/train': 1.2470216751098633} -09/20/2021 21:02:34 - INFO - __main__ - Step 30265: {'lr': 0.00019973524946707518, 'samples': 968480, 'steps': 1891, 'loss/train': 3.29172682762146} -09/20/2021 21:02:34 - INFO - __main__ - Step 30266: {'lr': 0.00019973524946707518, 'samples': 968512, 'steps': 1891, 'loss/train': 2.204242706298828} -09/20/2021 21:02:35 - INFO - __main__ - Step 30267: {'lr': 0.00019973524946707518, 'samples': 968544, 'steps': 1891, 'loss/train': 1.8331187963485718} -09/20/2021 21:02:36 - INFO - __main__ - Step 30268: {'lr': 0.00019973524946707518, 'samples': 968576, 'steps': 1891, 'loss/train': 2.9583609104156494} -09/20/2021 21:02:37 - INFO - __main__ - Step 30269: {'lr': 0.00019973524946707518, 'samples': 968608, 'steps': 1891, 'loss/train': 1.2762444019317627} -09/20/2021 21:02:37 - INFO - __main__ - Step 30270: {'lr': 0.00019973524946707518, 'samples': 968640, 'steps': 1891, 'loss/train': 2.143827199935913} -09/20/2021 21:02:39 - INFO - __main__ - Step 30271: {'lr': 0.00019973524946707518, 'samples': 968672, 'steps': 1891, 'loss/train': 2.367549180984497} -09/20/2021 21:02:39 - INFO - __main__ - Step 30272: {'lr': 0.00019973524946707518, 'samples': 968704, 'steps': 1891, 'loss/train': 2.984598398208618} -09/20/2021 21:02:40 - INFO - __main__ - Step 30273: {'lr': 0.00019973478540150067, 'samples': 968736, 'steps': 1892, 'loss/train': 1.8122079372406006} -09/20/2021 21:02:41 - INFO - __main__ - Step 30274: {'lr': 0.00019973478540150067, 'samples': 968768, 'steps': 1892, 'loss/train': 2.338082790374756} -09/20/2021 21:02:42 - INFO - __main__ - Step 30275: {'lr': 0.00019973478540150067, 'samples': 968800, 'steps': 1892, 'loss/train': 2.2871172428131104} -09/20/2021 21:02:43 - INFO - __main__ - Step 30276: {'lr': 0.00019973478540150067, 'samples': 968832, 'steps': 1892, 'loss/train': 2.6578922271728516} -09/20/2021 21:02:43 - INFO - __main__ - Step 30277: {'lr': 0.00019973478540150067, 'samples': 968864, 'steps': 1892, 'loss/train': 1.1427686214447021} -09/20/2021 21:02:44 - INFO - __main__ - Step 30278: {'lr': 0.00019973478540150067, 'samples': 968896, 'steps': 1892, 'loss/train': 0.5190321803092957} -09/20/2021 21:02:45 - INFO - __main__ - Step 30279: {'lr': 0.00019973478540150067, 'samples': 968928, 'steps': 1892, 'loss/train': 0.4666096866130829} -09/20/2021 21:02:46 - INFO - __main__ - Step 30280: {'lr': 0.00019973478540150067, 'samples': 968960, 'steps': 1892, 'loss/train': 3.8200185298919678} -09/20/2021 21:02:46 - INFO - __main__ - Step 30281: {'lr': 0.00019973478540150067, 'samples': 968992, 'steps': 1892, 'loss/train': 2.0509703159332275} -09/20/2021 21:02:47 - INFO - __main__ - Step 30282: {'lr': 0.00019973478540150067, 'samples': 969024, 'steps': 1892, 'loss/train': 3.337333917617798} -09/20/2021 21:02:48 - INFO - __main__ - Step 30283: {'lr': 0.00019973478540150067, 'samples': 969056, 'steps': 1892, 'loss/train': 2.6904661655426025} -09/20/2021 21:02:49 - INFO - __main__ - Step 30284: {'lr': 0.00019973478540150067, 'samples': 969088, 'steps': 1892, 'loss/train': 3.2366526126861572} -09/20/2021 21:02:49 - INFO - __main__ - Step 30285: {'lr': 0.00019973478540150067, 'samples': 969120, 'steps': 1892, 'loss/train': 2.1468892097473145} -09/20/2021 21:02:50 - INFO - __main__ - Step 30286: {'lr': 0.00019973478540150067, 'samples': 969152, 'steps': 1892, 'loss/train': 2.842763662338257} -09/20/2021 21:02:51 - INFO - __main__ - Step 30287: {'lr': 0.00019973478540150067, 'samples': 969184, 'steps': 1892, 'loss/train': 1.229030728340149} -09/20/2021 21:02:52 - INFO - __main__ - Step 30288: {'lr': 0.00019973478540150067, 'samples': 969216, 'steps': 1892, 'loss/train': 1.6780130863189697} -09/20/2021 21:02:52 - INFO - __main__ - Step 30289: {'lr': 0.0001997343209301057, 'samples': 969248, 'steps': 1893, 'loss/train': 2.699840784072876} -09/20/2021 21:02:53 - INFO - __main__ - Step 30290: {'lr': 0.0001997343209301057, 'samples': 969280, 'steps': 1893, 'loss/train': 2.5833191871643066} -09/20/2021 21:02:54 - INFO - __main__ - Step 30291: {'lr': 0.0001997343209301057, 'samples': 969312, 'steps': 1893, 'loss/train': 3.138362407684326} -09/20/2021 21:02:55 - INFO - __main__ - Step 30292: {'lr': 0.0001997343209301057, 'samples': 969344, 'steps': 1893, 'loss/train': 2.8191721439361572} -09/20/2021 21:02:55 - INFO - __main__ - Step 30293: {'lr': 0.0001997343209301057, 'samples': 969376, 'steps': 1893, 'loss/train': 2.662785053253174} -09/20/2021 21:02:56 - INFO - __main__ - Step 30294: {'lr': 0.0001997343209301057, 'samples': 969408, 'steps': 1893, 'loss/train': 2.4956579208374023} -09/20/2021 21:02:57 - INFO - __main__ - Step 30295: {'lr': 0.0001997343209301057, 'samples': 969440, 'steps': 1893, 'loss/train': 2.969320297241211} -09/20/2021 21:02:58 - INFO - __main__ - Step 30296: {'lr': 0.0001997343209301057, 'samples': 969472, 'steps': 1893, 'loss/train': 2.1658225059509277} -09/20/2021 21:02:58 - INFO - __main__ - Step 30297: {'lr': 0.0001997343209301057, 'samples': 969504, 'steps': 1893, 'loss/train': 2.923224925994873} -09/20/2021 21:02:59 - INFO - __main__ - Step 30298: {'lr': 0.0001997343209301057, 'samples': 969536, 'steps': 1893, 'loss/train': 2.143320322036743} -09/20/2021 21:03:00 - INFO - __main__ - Step 30299: {'lr': 0.0001997343209301057, 'samples': 969568, 'steps': 1893, 'loss/train': 2.2428858280181885} -09/20/2021 21:03:01 - INFO - __main__ - Step 30300: {'lr': 0.0001997343209301057, 'samples': 969600, 'steps': 1893, 'loss/train': 2.745142698287964} -09/20/2021 21:03:01 - INFO - __main__ - Step 30301: {'lr': 0.0001997343209301057, 'samples': 969632, 'steps': 1893, 'loss/train': 3.14213228225708} -09/20/2021 21:03:02 - INFO - __main__ - Step 30302: {'lr': 0.0001997343209301057, 'samples': 969664, 'steps': 1893, 'loss/train': 2.703864574432373} -09/20/2021 21:03:04 - INFO - __main__ - Step 30303: {'lr': 0.0001997343209301057, 'samples': 969696, 'steps': 1893, 'loss/train': 2.250403642654419} -09/20/2021 21:03:05 - INFO - __main__ - Step 30304: {'lr': 0.0001997343209301057, 'samples': 969728, 'steps': 1893, 'loss/train': 2.3337981700897217} -09/20/2021 21:03:06 - INFO - __main__ - Step 30305: {'lr': 0.00019973385605289218, 'samples': 969760, 'steps': 1894, 'loss/train': 2.0303101539611816} -09/20/2021 21:03:06 - INFO - __main__ - Step 30306: {'lr': 0.00019973385605289218, 'samples': 969792, 'steps': 1894, 'loss/train': 3.160438060760498} -09/20/2021 21:03:07 - INFO - __main__ - Step 30307: {'lr': 0.00019973385605289218, 'samples': 969824, 'steps': 1894, 'loss/train': 3.354301929473877} -09/20/2021 21:03:08 - INFO - __main__ - Step 30308: {'lr': 0.00019973385605289218, 'samples': 969856, 'steps': 1894, 'loss/train': 2.2373621463775635} -09/20/2021 21:03:09 - INFO - __main__ - Step 30309: {'lr': 0.00019973385605289218, 'samples': 969888, 'steps': 1894, 'loss/train': 2.5045201778411865} -09/20/2021 21:03:09 - INFO - __main__ - Step 30310: {'lr': 0.00019973385605289218, 'samples': 969920, 'steps': 1894, 'loss/train': 2.853851556777954} -09/20/2021 21:03:10 - INFO - __main__ - Step 30311: {'lr': 0.00019973385605289218, 'samples': 969952, 'steps': 1894, 'loss/train': 2.121812343597412} -09/20/2021 21:03:11 - INFO - __main__ - Step 30312: {'lr': 0.00019973385605289218, 'samples': 969984, 'steps': 1894, 'loss/train': 4.13682746887207} -09/20/2021 21:03:12 - INFO - __main__ - Step 30313: {'lr': 0.00019973385605289218, 'samples': 970016, 'steps': 1894, 'loss/train': 2.3383772373199463} -09/20/2021 21:03:12 - INFO - __main__ - Step 30314: {'lr': 0.00019973385605289218, 'samples': 970048, 'steps': 1894, 'loss/train': 3.0633060932159424} -09/20/2021 21:03:13 - INFO - __main__ - Step 30315: {'lr': 0.00019973385605289218, 'samples': 970080, 'steps': 1894, 'loss/train': 2.3002288341522217} -09/20/2021 21:03:14 - INFO - __main__ - Step 30316: {'lr': 0.00019973385605289218, 'samples': 970112, 'steps': 1894, 'loss/train': 3.653775453567505} -09/20/2021 21:03:15 - INFO - __main__ - Step 30317: {'lr': 0.00019973385605289218, 'samples': 970144, 'steps': 1894, 'loss/train': 2.753178119659424} -09/20/2021 21:03:15 - INFO - __main__ - Step 30318: {'lr': 0.00019973385605289218, 'samples': 970176, 'steps': 1894, 'loss/train': 2.532426595687866} -09/20/2021 21:03:16 - INFO - __main__ - Step 30319: {'lr': 0.00019973385605289218, 'samples': 970208, 'steps': 1894, 'loss/train': 1.5663114786148071} -09/20/2021 21:03:17 - INFO - __main__ - Step 30320: {'lr': 0.00019973385605289218, 'samples': 970240, 'steps': 1894, 'loss/train': 2.3210268020629883} -09/20/2021 21:03:18 - INFO - __main__ - Step 30321: {'lr': 0.00019973339076986198, 'samples': 970272, 'steps': 1895, 'loss/train': 4.161489486694336} -09/20/2021 21:03:18 - INFO - __main__ - Step 30322: {'lr': 0.00019973339076986198, 'samples': 970304, 'steps': 1895, 'loss/train': 2.5834591388702393} -09/20/2021 21:03:19 - INFO - __main__ - Step 30323: {'lr': 0.00019973339076986198, 'samples': 970336, 'steps': 1895, 'loss/train': 2.2471115589141846} -09/20/2021 21:03:20 - INFO - __main__ - Step 30324: {'lr': 0.00019973339076986198, 'samples': 970368, 'steps': 1895, 'loss/train': 1.838489055633545} -09/20/2021 21:03:21 - INFO - __main__ - Step 30325: {'lr': 0.00019973339076986198, 'samples': 970400, 'steps': 1895, 'loss/train': 2.0146026611328125} -09/20/2021 21:03:21 - INFO - __main__ - Step 30326: {'lr': 0.00019973339076986198, 'samples': 970432, 'steps': 1895, 'loss/train': 1.6948647499084473} -09/20/2021 21:03:22 - INFO - __main__ - Step 30327: {'lr': 0.00019973339076986198, 'samples': 970464, 'steps': 1895, 'loss/train': 1.9803053140640259} -09/20/2021 21:03:23 - INFO - __main__ - Step 30328: {'lr': 0.00019973339076986198, 'samples': 970496, 'steps': 1895, 'loss/train': 2.1245334148406982} -09/20/2021 21:03:24 - INFO - __main__ - Step 30329: {'lr': 0.00019973339076986198, 'samples': 970528, 'steps': 1895, 'loss/train': 1.5424212217330933} -09/20/2021 21:03:24 - INFO - __main__ - Step 30330: {'lr': 0.00019973339076986198, 'samples': 970560, 'steps': 1895, 'loss/train': 1.872498869895935} -09/20/2021 21:03:25 - INFO - __main__ - Step 30331: {'lr': 0.00019973339076986198, 'samples': 970592, 'steps': 1895, 'loss/train': 2.415774345397949} -09/20/2021 21:03:26 - INFO - __main__ - Step 30332: {'lr': 0.00019973339076986198, 'samples': 970624, 'steps': 1895, 'loss/train': 2.0253522396087646} -09/20/2021 21:03:27 - INFO - __main__ - Step 30333: {'lr': 0.00019973339076986198, 'samples': 970656, 'steps': 1895, 'loss/train': 3.0518503189086914} -09/20/2021 21:03:28 - INFO - __main__ - Step 30334: {'lr': 0.00019973339076986198, 'samples': 970688, 'steps': 1895, 'loss/train': 2.20918345451355} -09/20/2021 21:03:29 - INFO - __main__ - Step 30335: {'lr': 0.00019973339076986198, 'samples': 970720, 'steps': 1895, 'loss/train': 2.497969627380371} -09/20/2021 21:03:29 - INFO - __main__ - Step 30336: {'lr': 0.00019973339076986198, 'samples': 970752, 'steps': 1895, 'loss/train': 1.1027553081512451} -09/20/2021 21:03:30 - INFO - __main__ - Step 30337: {'lr': 0.00019973292508101702, 'samples': 970784, 'steps': 1896, 'loss/train': 1.9970779418945312} -09/20/2021 21:03:31 - INFO - __main__ - Step 30338: {'lr': 0.00019973292508101702, 'samples': 970816, 'steps': 1896, 'loss/train': 1.8371063470840454} -09/20/2021 21:03:32 - INFO - __main__ - Step 30339: {'lr': 0.00019973292508101702, 'samples': 970848, 'steps': 1896, 'loss/train': 2.8106515407562256} -09/20/2021 21:03:33 - INFO - __main__ - Step 30340: {'lr': 0.00019973292508101702, 'samples': 970880, 'steps': 1896, 'loss/train': 1.3271909952163696} -09/20/2021 21:03:33 - INFO - __main__ - Step 30341: {'lr': 0.00019973292508101702, 'samples': 970912, 'steps': 1896, 'loss/train': 2.447511672973633} -09/20/2021 21:03:34 - INFO - __main__ - Step 30342: {'lr': 0.00019973292508101702, 'samples': 970944, 'steps': 1896, 'loss/train': 2.850400447845459} -09/20/2021 21:03:35 - INFO - __main__ - Step 30343: {'lr': 0.00019973292508101702, 'samples': 970976, 'steps': 1896, 'loss/train': 2.760774850845337} -09/20/2021 21:03:36 - INFO - __main__ - Step 30344: {'lr': 0.00019973292508101702, 'samples': 971008, 'steps': 1896, 'loss/train': 2.212790012359619} -09/20/2021 21:03:36 - INFO - __main__ - Step 30345: {'lr': 0.00019973292508101702, 'samples': 971040, 'steps': 1896, 'loss/train': 2.8521921634674072} -09/20/2021 21:03:37 - INFO - __main__ - Step 30346: {'lr': 0.00019973292508101702, 'samples': 971072, 'steps': 1896, 'loss/train': 1.8776662349700928} -09/20/2021 21:03:38 - INFO - __main__ - Step 30347: {'lr': 0.00019973292508101702, 'samples': 971104, 'steps': 1896, 'loss/train': 2.5295262336730957} -09/20/2021 21:03:39 - INFO - __main__ - Step 30348: {'lr': 0.00019973292508101702, 'samples': 971136, 'steps': 1896, 'loss/train': 3.5714776515960693} -09/20/2021 21:03:39 - INFO - __main__ - Step 30349: {'lr': 0.00019973292508101702, 'samples': 971168, 'steps': 1896, 'loss/train': 2.514418363571167} -09/20/2021 21:03:40 - INFO - __main__ - Step 30350: {'lr': 0.00019973292508101702, 'samples': 971200, 'steps': 1896, 'loss/train': 2.1661341190338135} -09/20/2021 21:03:41 - INFO - __main__ - Step 30351: {'lr': 0.00019973292508101702, 'samples': 971232, 'steps': 1896, 'loss/train': 2.8116462230682373} -09/20/2021 21:03:42 - INFO - __main__ - Step 30352: {'lr': 0.00019973292508101702, 'samples': 971264, 'steps': 1896, 'loss/train': 2.6700491905212402} -09/20/2021 21:03:42 - INFO - __main__ - Step 30353: {'lr': 0.00019973245898635914, 'samples': 971296, 'steps': 1897, 'loss/train': 2.8775105476379395} -09/20/2021 21:03:43 - INFO - __main__ - Step 30354: {'lr': 0.00019973245898635914, 'samples': 971328, 'steps': 1897, 'loss/train': 0.9787517786026001} -09/20/2021 21:03:44 - INFO - __main__ - Step 30355: {'lr': 0.00019973245898635914, 'samples': 971360, 'steps': 1897, 'loss/train': 3.07971453666687} -09/20/2021 21:03:45 - INFO - __main__ - Step 30356: {'lr': 0.00019973245898635914, 'samples': 971392, 'steps': 1897, 'loss/train': 2.457609176635742} -09/20/2021 21:03:45 - INFO - __main__ - Step 30357: {'lr': 0.00019973245898635914, 'samples': 971424, 'steps': 1897, 'loss/train': 2.9107556343078613} -09/20/2021 21:03:46 - INFO - __main__ - Step 30358: {'lr': 0.00019973245898635914, 'samples': 971456, 'steps': 1897, 'loss/train': 2.79445481300354} -09/20/2021 21:03:47 - INFO - __main__ - Step 30359: {'lr': 0.00019973245898635914, 'samples': 971488, 'steps': 1897, 'loss/train': 2.3512046337127686} -09/20/2021 21:03:48 - INFO - __main__ - Step 30360: {'lr': 0.00019973245898635914, 'samples': 971520, 'steps': 1897, 'loss/train': 0.39038047194480896} -09/20/2021 21:03:48 - INFO - __main__ - Step 30361: {'lr': 0.00019973245898635914, 'samples': 971552, 'steps': 1897, 'loss/train': 2.3978986740112305} -09/20/2021 21:03:49 - INFO - __main__ - Step 30362: {'lr': 0.00019973245898635914, 'samples': 971584, 'steps': 1897, 'loss/train': 2.0770699977874756} -09/20/2021 21:03:50 - INFO - __main__ - Step 30363: {'lr': 0.00019973245898635914, 'samples': 971616, 'steps': 1897, 'loss/train': 3.627440929412842} -09/20/2021 21:03:51 - INFO - __main__ - Step 30364: {'lr': 0.00019973245898635914, 'samples': 971648, 'steps': 1897, 'loss/train': 2.6788084506988525} -09/20/2021 21:03:52 - INFO - __main__ - Step 30365: {'lr': 0.00019973245898635914, 'samples': 971680, 'steps': 1897, 'loss/train': 2.6123695373535156} -09/20/2021 21:03:53 - INFO - __main__ - Step 30366: {'lr': 0.00019973245898635914, 'samples': 971712, 'steps': 1897, 'loss/train': 2.970592975616455} -09/20/2021 21:03:53 - INFO - __main__ - Step 30367: {'lr': 0.00019973245898635914, 'samples': 971744, 'steps': 1897, 'loss/train': 2.3343093395233154} -09/20/2021 21:03:54 - INFO - __main__ - Step 30368: {'lr': 0.00019973245898635914, 'samples': 971776, 'steps': 1897, 'loss/train': 2.457000970840454} -09/20/2021 21:03:55 - INFO - __main__ - Step 30369: {'lr': 0.0001997319924858903, 'samples': 971808, 'steps': 1898, 'loss/train': 1.3732898235321045} -09/20/2021 21:03:56 - INFO - __main__ - Step 30370: {'lr': 0.0001997319924858903, 'samples': 971840, 'steps': 1898, 'loss/train': 2.916293144226074} -09/20/2021 21:03:57 - INFO - __main__ - Step 30371: {'lr': 0.0001997319924858903, 'samples': 971872, 'steps': 1898, 'loss/train': 1.9992647171020508} -09/20/2021 21:03:57 - INFO - __main__ - Step 30372: {'lr': 0.0001997319924858903, 'samples': 971904, 'steps': 1898, 'loss/train': 2.3585007190704346} -09/20/2021 21:03:58 - INFO - __main__ - Step 30373: {'lr': 0.0001997319924858903, 'samples': 971936, 'steps': 1898, 'loss/train': 2.0950210094451904} -09/20/2021 21:03:59 - INFO - __main__ - Step 30374: {'lr': 0.0001997319924858903, 'samples': 971968, 'steps': 1898, 'loss/train': 1.9974390268325806} -09/20/2021 21:04:00 - INFO - __main__ - Step 30375: {'lr': 0.0001997319924858903, 'samples': 972000, 'steps': 1898, 'loss/train': 2.9360623359680176} -09/20/2021 21:04:00 - INFO - __main__ - Step 30376: {'lr': 0.0001997319924858903, 'samples': 972032, 'steps': 1898, 'loss/train': 3.0199971199035645} -09/20/2021 21:04:01 - INFO - __main__ - Step 30377: {'lr': 0.0001997319924858903, 'samples': 972064, 'steps': 1898, 'loss/train': 3.121898889541626} -09/20/2021 21:04:02 - INFO - __main__ - Step 30378: {'lr': 0.0001997319924858903, 'samples': 972096, 'steps': 1898, 'loss/train': 2.9033472537994385} -09/20/2021 21:04:03 - INFO - __main__ - Step 30379: {'lr': 0.0001997319924858903, 'samples': 972128, 'steps': 1898, 'loss/train': 0.5891798734664917} -09/20/2021 21:04:03 - INFO - __main__ - Step 30380: {'lr': 0.0001997319924858903, 'samples': 972160, 'steps': 1898, 'loss/train': 3.4406497478485107} -09/20/2021 21:04:04 - INFO - __main__ - Step 30381: {'lr': 0.0001997319924858903, 'samples': 972192, 'steps': 1898, 'loss/train': 1.5385653972625732} -09/20/2021 21:04:05 - INFO - __main__ - Step 30382: {'lr': 0.0001997319924858903, 'samples': 972224, 'steps': 1898, 'loss/train': 3.0207269191741943} -09/20/2021 21:04:06 - INFO - __main__ - Step 30383: {'lr': 0.0001997319924858903, 'samples': 972256, 'steps': 1898, 'loss/train': 2.7656784057617188} -09/20/2021 21:04:06 - INFO - __main__ - Step 30384: {'lr': 0.0001997319924858903, 'samples': 972288, 'steps': 1898, 'loss/train': 4.035382270812988} -09/20/2021 21:04:07 - INFO - __main__ - Step 30385: {'lr': 0.00019973152557961233, 'samples': 972320, 'steps': 1899, 'loss/train': 3.7753264904022217} -09/20/2021 21:04:08 - INFO - __main__ - Step 30386: {'lr': 0.00019973152557961233, 'samples': 972352, 'steps': 1899, 'loss/train': 1.6790804862976074} -09/20/2021 21:04:09 - INFO - __main__ - Step 30387: {'lr': 0.00019973152557961233, 'samples': 972384, 'steps': 1899, 'loss/train': 2.311271905899048} -09/20/2021 21:04:09 - INFO - __main__ - Step 30388: {'lr': 0.00019973152557961233, 'samples': 972416, 'steps': 1899, 'loss/train': 2.176525831222534} -09/20/2021 21:04:10 - INFO - __main__ - Step 30389: {'lr': 0.00019973152557961233, 'samples': 972448, 'steps': 1899, 'loss/train': 2.0140247344970703} -09/20/2021 21:04:11 - INFO - __main__ - Step 30390: {'lr': 0.00019973152557961233, 'samples': 972480, 'steps': 1899, 'loss/train': 1.9293040037155151} -09/20/2021 21:04:12 - INFO - __main__ - Step 30391: {'lr': 0.00019973152557961233, 'samples': 972512, 'steps': 1899, 'loss/train': 2.584827423095703} -09/20/2021 21:04:12 - INFO - __main__ - Step 30392: {'lr': 0.00019973152557961233, 'samples': 972544, 'steps': 1899, 'loss/train': 1.6860216856002808} -09/20/2021 21:04:13 - INFO - __main__ - Step 30393: {'lr': 0.00019973152557961233, 'samples': 972576, 'steps': 1899, 'loss/train': 2.5608415603637695} -09/20/2021 21:04:14 - INFO - __main__ - Step 30394: {'lr': 0.00019973152557961233, 'samples': 972608, 'steps': 1899, 'loss/train': 2.4774296283721924} -09/20/2021 21:04:15 - INFO - __main__ - Step 30395: {'lr': 0.00019973152557961233, 'samples': 972640, 'steps': 1899, 'loss/train': 1.526573896408081} -09/20/2021 21:04:16 - INFO - __main__ - Step 30396: {'lr': 0.00019973152557961233, 'samples': 972672, 'steps': 1899, 'loss/train': 2.9487600326538086} -09/20/2021 21:04:17 - INFO - __main__ - Step 30397: {'lr': 0.00019973152557961233, 'samples': 972704, 'steps': 1899, 'loss/train': 2.295898199081421} -09/20/2021 21:04:17 - INFO - __main__ - Step 30398: {'lr': 0.00019973152557961233, 'samples': 972736, 'steps': 1899, 'loss/train': 2.69460129737854} -09/20/2021 21:04:18 - INFO - __main__ - Step 30399: {'lr': 0.00019973152557961233, 'samples': 972768, 'steps': 1899, 'loss/train': 2.9018025398254395} -09/20/2021 21:04:19 - INFO - __main__ - Step 30400: {'lr': 0.00019973152557961233, 'samples': 972800, 'steps': 1899, 'loss/train': 1.5399130582809448} -09/20/2021 21:04:20 - INFO - __main__ - Step 30401: {'lr': 0.0001997310582675272, 'samples': 972832, 'steps': 1900, 'loss/train': 2.124889612197876} -09/20/2021 21:04:21 - INFO - __main__ - Step 30402: {'lr': 0.0001997310582675272, 'samples': 972864, 'steps': 1900, 'loss/train': 2.347992420196533} -09/20/2021 21:04:21 - INFO - __main__ - Step 30403: {'lr': 0.0001997310582675272, 'samples': 972896, 'steps': 1900, 'loss/train': 2.6569457054138184} -09/20/2021 21:04:22 - INFO - __main__ - Step 30404: {'lr': 0.0001997310582675272, 'samples': 972928, 'steps': 1900, 'loss/train': 2.6692423820495605} -09/20/2021 21:04:23 - INFO - __main__ - Step 30405: {'lr': 0.0001997310582675272, 'samples': 972960, 'steps': 1900, 'loss/train': 2.1586661338806152} -09/20/2021 21:04:24 - INFO - __main__ - Step 30406: {'lr': 0.0001997310582675272, 'samples': 972992, 'steps': 1900, 'loss/train': 2.792881727218628} -09/20/2021 21:04:24 - INFO - __main__ - Step 30407: {'lr': 0.0001997310582675272, 'samples': 973024, 'steps': 1900, 'loss/train': 2.6350231170654297} -09/20/2021 21:04:25 - INFO - __main__ - Step 30408: {'lr': 0.0001997310582675272, 'samples': 973056, 'steps': 1900, 'loss/train': 2.2184455394744873} -09/20/2021 21:04:26 - INFO - __main__ - Step 30409: {'lr': 0.0001997310582675272, 'samples': 973088, 'steps': 1900, 'loss/train': 2.879707098007202} -09/20/2021 21:04:27 - INFO - __main__ - Step 30410: {'lr': 0.0001997310582675272, 'samples': 973120, 'steps': 1900, 'loss/train': 2.732938289642334} -09/20/2021 21:04:27 - INFO - __main__ - Step 30411: {'lr': 0.0001997310582675272, 'samples': 973152, 'steps': 1900, 'loss/train': 2.9646201133728027} -09/20/2021 21:04:28 - INFO - __main__ - Step 30412: {'lr': 0.0001997310582675272, 'samples': 973184, 'steps': 1900, 'loss/train': 2.801448106765747} -09/20/2021 21:04:29 - INFO - __main__ - Step 30413: {'lr': 0.0001997310582675272, 'samples': 973216, 'steps': 1900, 'loss/train': 0.9137740135192871} -09/20/2021 21:04:30 - INFO - __main__ - Step 30414: {'lr': 0.0001997310582675272, 'samples': 973248, 'steps': 1900, 'loss/train': 2.7400758266448975} -09/20/2021 21:04:30 - INFO - __main__ - Step 30415: {'lr': 0.0001997310582675272, 'samples': 973280, 'steps': 1900, 'loss/train': 2.4536843299865723} -09/20/2021 21:04:31 - INFO - __main__ - Step 30416: {'lr': 0.0001997310582675272, 'samples': 973312, 'steps': 1900, 'loss/train': 2.661153554916382} -09/20/2021 21:04:32 - INFO - __main__ - Step 30417: {'lr': 0.00019973059054963677, 'samples': 973344, 'steps': 1901, 'loss/train': 2.482365608215332} -09/20/2021 21:04:33 - INFO - __main__ - Step 30418: {'lr': 0.00019973059054963677, 'samples': 973376, 'steps': 1901, 'loss/train': 2.7128853797912598} -09/20/2021 21:04:33 - INFO - __main__ - Step 30419: {'lr': 0.00019973059054963677, 'samples': 973408, 'steps': 1901, 'loss/train': 2.7706503868103027} -09/20/2021 21:04:34 - INFO - __main__ - Step 30420: {'lr': 0.00019973059054963677, 'samples': 973440, 'steps': 1901, 'loss/train': 1.7831562757492065} -09/20/2021 21:04:35 - INFO - __main__ - Step 30421: {'lr': 0.00019973059054963677, 'samples': 973472, 'steps': 1901, 'loss/train': 3.846937417984009} -09/20/2021 21:04:36 - INFO - __main__ - Step 30422: {'lr': 0.00019973059054963677, 'samples': 973504, 'steps': 1901, 'loss/train': 2.757018804550171} -09/20/2021 21:04:36 - INFO - __main__ - Step 30423: {'lr': 0.00019973059054963677, 'samples': 973536, 'steps': 1901, 'loss/train': 2.5292885303497314} -09/20/2021 21:04:37 - INFO - __main__ - Step 30424: {'lr': 0.00019973059054963677, 'samples': 973568, 'steps': 1901, 'loss/train': 2.331223726272583} -09/20/2021 21:04:39 - INFO - __main__ - Step 30425: {'lr': 0.00019973059054963677, 'samples': 973600, 'steps': 1901, 'loss/train': 2.1503827571868896} -09/20/2021 21:04:39 - INFO - __main__ - Step 30426: {'lr': 0.00019973059054963677, 'samples': 973632, 'steps': 1901, 'loss/train': 2.5333666801452637} -09/20/2021 21:04:40 - INFO - __main__ - Step 30427: {'lr': 0.00019973059054963677, 'samples': 973664, 'steps': 1901, 'loss/train': 3.269594669342041} -09/20/2021 21:04:41 - INFO - __main__ - Step 30428: {'lr': 0.00019973059054963677, 'samples': 973696, 'steps': 1901, 'loss/train': 2.538606882095337} -09/20/2021 21:04:42 - INFO - __main__ - Step 30429: {'lr': 0.00019973059054963677, 'samples': 973728, 'steps': 1901, 'loss/train': 2.985245704650879} -09/20/2021 21:04:42 - INFO - __main__ - Step 30430: {'lr': 0.00019973059054963677, 'samples': 973760, 'steps': 1901, 'loss/train': 2.268946647644043} -09/20/2021 21:04:43 - INFO - __main__ - Step 30431: {'lr': 0.00019973059054963677, 'samples': 973792, 'steps': 1901, 'loss/train': 2.0894649028778076} -09/20/2021 21:04:44 - INFO - __main__ - Step 30432: {'lr': 0.00019973059054963677, 'samples': 973824, 'steps': 1901, 'loss/train': 1.8686484098434448} -09/20/2021 21:04:45 - INFO - __main__ - Step 30433: {'lr': 0.00019973012242594296, 'samples': 973856, 'steps': 1902, 'loss/train': 1.006397008895874} -09/20/2021 21:04:46 - INFO - __main__ - Step 30434: {'lr': 0.00019973012242594296, 'samples': 973888, 'steps': 1902, 'loss/train': 2.6716184616088867} -09/20/2021 21:04:46 - INFO - __main__ - Step 30435: {'lr': 0.00019973012242594296, 'samples': 973920, 'steps': 1902, 'loss/train': 2.3426175117492676} -09/20/2021 21:04:47 - INFO - __main__ - Step 30436: {'lr': 0.00019973012242594296, 'samples': 973952, 'steps': 1902, 'loss/train': 2.234663724899292} -09/20/2021 21:04:48 - INFO - __main__ - Step 30437: {'lr': 0.00019973012242594296, 'samples': 973984, 'steps': 1902, 'loss/train': 2.058109998703003} -09/20/2021 21:04:49 - INFO - __main__ - Step 30438: {'lr': 0.00019973012242594296, 'samples': 974016, 'steps': 1902, 'loss/train': 2.9860522747039795} -09/20/2021 21:04:49 - INFO - __main__ - Step 30439: {'lr': 0.00019973012242594296, 'samples': 974048, 'steps': 1902, 'loss/train': 0.8207422494888306} -09/20/2021 21:04:50 - INFO - __main__ - Step 30440: {'lr': 0.00019973012242594296, 'samples': 974080, 'steps': 1902, 'loss/train': 2.5994927883148193} -09/20/2021 21:04:51 - INFO - __main__ - Step 30441: {'lr': 0.00019973012242594296, 'samples': 974112, 'steps': 1902, 'loss/train': 2.592712640762329} -09/20/2021 21:04:52 - INFO - __main__ - Step 30442: {'lr': 0.00019973012242594296, 'samples': 974144, 'steps': 1902, 'loss/train': 1.4880081415176392} -09/20/2021 21:04:52 - INFO - __main__ - Step 30443: {'lr': 0.00019973012242594296, 'samples': 974176, 'steps': 1902, 'loss/train': 1.0916659832000732} -09/20/2021 21:04:53 - INFO - __main__ - Step 30444: {'lr': 0.00019973012242594296, 'samples': 974208, 'steps': 1902, 'loss/train': 2.1369316577911377} -09/20/2021 21:04:54 - INFO - __main__ - Step 30445: {'lr': 0.00019973012242594296, 'samples': 974240, 'steps': 1902, 'loss/train': 3.1966166496276855} -09/20/2021 21:04:55 - INFO - __main__ - Step 30446: {'lr': 0.00019973012242594296, 'samples': 974272, 'steps': 1902, 'loss/train': 2.189314603805542} -09/20/2021 21:04:55 - INFO - __main__ - Step 30447: {'lr': 0.00019973012242594296, 'samples': 974304, 'steps': 1902, 'loss/train': 2.9544293880462646} -09/20/2021 21:04:56 - INFO - __main__ - Step 30448: {'lr': 0.00019973012242594296, 'samples': 974336, 'steps': 1902, 'loss/train': 2.6632513999938965} -09/20/2021 21:04:57 - INFO - __main__ - Step 30449: {'lr': 0.00019972965389644767, 'samples': 974368, 'steps': 1903, 'loss/train': 2.494858741760254} -09/20/2021 21:04:58 - INFO - __main__ - Step 30450: {'lr': 0.00019972965389644767, 'samples': 974400, 'steps': 1903, 'loss/train': 2.0655226707458496} -09/20/2021 21:04:58 - INFO - __main__ - Step 30451: {'lr': 0.00019972965389644767, 'samples': 974432, 'steps': 1903, 'loss/train': 0.7151556015014648} -09/20/2021 21:04:59 - INFO - __main__ - Step 30452: {'lr': 0.00019972965389644767, 'samples': 974464, 'steps': 1903, 'loss/train': 1.8530521392822266} -09/20/2021 21:05:00 - INFO - __main__ - Step 30453: {'lr': 0.00019972965389644767, 'samples': 974496, 'steps': 1903, 'loss/train': 1.5506477355957031} -09/20/2021 21:05:01 - INFO - __main__ - Step 30454: {'lr': 0.00019972965389644767, 'samples': 974528, 'steps': 1903, 'loss/train': 1.2804123163223267} -09/20/2021 21:05:01 - INFO - __main__ - Step 30455: {'lr': 0.00019972965389644767, 'samples': 974560, 'steps': 1903, 'loss/train': 3.4674651622772217} -09/20/2021 21:05:03 - INFO - __main__ - Step 30456: {'lr': 0.00019972965389644767, 'samples': 974592, 'steps': 1903, 'loss/train': 2.0434391498565674} -09/20/2021 21:05:04 - INFO - __main__ - Step 30457: {'lr': 0.00019972965389644767, 'samples': 974624, 'steps': 1903, 'loss/train': 2.489441156387329} -09/20/2021 21:05:04 - INFO - __main__ - Step 30458: {'lr': 0.00019972965389644767, 'samples': 974656, 'steps': 1903, 'loss/train': 2.798340082168579} -09/20/2021 21:05:05 - INFO - __main__ - Step 30459: {'lr': 0.00019972965389644767, 'samples': 974688, 'steps': 1903, 'loss/train': 2.0207903385162354} -09/20/2021 21:05:06 - INFO - __main__ - Step 30460: {'lr': 0.00019972965389644767, 'samples': 974720, 'steps': 1903, 'loss/train': 0.5732291340827942} -09/20/2021 21:05:07 - INFO - __main__ - Step 30461: {'lr': 0.00019972965389644767, 'samples': 974752, 'steps': 1903, 'loss/train': 2.1370887756347656} -09/20/2021 21:05:08 - INFO - __main__ - Step 30462: {'lr': 0.00019972965389644767, 'samples': 974784, 'steps': 1903, 'loss/train': 1.7043524980545044} -09/20/2021 21:05:08 - INFO - __main__ - Step 30463: {'lr': 0.00019972965389644767, 'samples': 974816, 'steps': 1903, 'loss/train': 1.8052648305892944} -09/20/2021 21:05:09 - INFO - __main__ - Step 30464: {'lr': 0.00019972965389644767, 'samples': 974848, 'steps': 1903, 'loss/train': 1.4710993766784668} -09/20/2021 21:05:10 - INFO - __main__ - Step 30465: {'lr': 0.0001997291849611528, 'samples': 974880, 'steps': 1904, 'loss/train': 2.45904278755188} -09/20/2021 21:05:11 - INFO - __main__ - Step 30466: {'lr': 0.0001997291849611528, 'samples': 974912, 'steps': 1904, 'loss/train': 2.59045147895813} -09/20/2021 21:05:11 - INFO - __main__ - Step 30467: {'lr': 0.0001997291849611528, 'samples': 974944, 'steps': 1904, 'loss/train': 3.091728925704956} -09/20/2021 21:05:12 - INFO - __main__ - Step 30468: {'lr': 0.0001997291849611528, 'samples': 974976, 'steps': 1904, 'loss/train': 2.7421185970306396} -09/20/2021 21:05:13 - INFO - __main__ - Step 30469: {'lr': 0.0001997291849611528, 'samples': 975008, 'steps': 1904, 'loss/train': 2.1711621284484863} -09/20/2021 21:05:14 - INFO - __main__ - Step 30470: {'lr': 0.0001997291849611528, 'samples': 975040, 'steps': 1904, 'loss/train': 2.0230307579040527} -09/20/2021 21:05:14 - INFO - __main__ - Step 30471: {'lr': 0.0001997291849611528, 'samples': 975072, 'steps': 1904, 'loss/train': 2.607351541519165} -09/20/2021 21:05:15 - INFO - __main__ - Step 30472: {'lr': 0.0001997291849611528, 'samples': 975104, 'steps': 1904, 'loss/train': 1.2650620937347412} -09/20/2021 21:05:16 - INFO - __main__ - Step 30473: {'lr': 0.0001997291849611528, 'samples': 975136, 'steps': 1904, 'loss/train': 2.4233005046844482} -09/20/2021 21:05:17 - INFO - __main__ - Step 30474: {'lr': 0.0001997291849611528, 'samples': 975168, 'steps': 1904, 'loss/train': 4.1138081550598145} -09/20/2021 21:05:17 - INFO - __main__ - Step 30475: {'lr': 0.0001997291849611528, 'samples': 975200, 'steps': 1904, 'loss/train': 1.7395912408828735} -09/20/2021 21:05:18 - INFO - __main__ - Step 30476: {'lr': 0.0001997291849611528, 'samples': 975232, 'steps': 1904, 'loss/train': 2.8807003498077393} -09/20/2021 21:05:19 - INFO - __main__ - Step 30477: {'lr': 0.0001997291849611528, 'samples': 975264, 'steps': 1904, 'loss/train': 2.465806245803833} -09/20/2021 21:05:20 - INFO - __main__ - Step 30478: {'lr': 0.0001997291849611528, 'samples': 975296, 'steps': 1904, 'loss/train': 2.4274649620056152} -09/20/2021 21:05:20 - INFO - __main__ - Step 30479: {'lr': 0.0001997291849611528, 'samples': 975328, 'steps': 1904, 'loss/train': 2.6419217586517334} -09/20/2021 21:05:21 - INFO - __main__ - Step 30480: {'lr': 0.0001997291849611528, 'samples': 975360, 'steps': 1904, 'loss/train': 2.7969727516174316} -09/20/2021 21:05:22 - INFO - __main__ - Step 30481: {'lr': 0.0001997287156200603, 'samples': 975392, 'steps': 1905, 'loss/train': 2.6923317909240723} -09/20/2021 21:05:23 - INFO - __main__ - Step 30482: {'lr': 0.0001997287156200603, 'samples': 975424, 'steps': 1905, 'loss/train': 2.88262677192688} -09/20/2021 21:05:24 - INFO - __main__ - Step 30483: {'lr': 0.0001997287156200603, 'samples': 975456, 'steps': 1905, 'loss/train': 2.820394992828369} -09/20/2021 21:05:24 - INFO - __main__ - Step 30484: {'lr': 0.0001997287156200603, 'samples': 975488, 'steps': 1905, 'loss/train': 2.970531702041626} -09/20/2021 21:05:25 - INFO - __main__ - Step 30485: {'lr': 0.0001997287156200603, 'samples': 975520, 'steps': 1905, 'loss/train': 3.020789623260498} -09/20/2021 21:05:26 - INFO - __main__ - Step 30486: {'lr': 0.0001997287156200603, 'samples': 975552, 'steps': 1905, 'loss/train': 2.9782490730285645} -09/20/2021 21:05:27 - INFO - __main__ - Step 30487: {'lr': 0.0001997287156200603, 'samples': 975584, 'steps': 1905, 'loss/train': 2.927457332611084} -09/20/2021 21:05:27 - INFO - __main__ - Step 30488: {'lr': 0.0001997287156200603, 'samples': 975616, 'steps': 1905, 'loss/train': 1.2513489723205566} -09/20/2021 21:05:28 - INFO - __main__ - Step 30489: {'lr': 0.0001997287156200603, 'samples': 975648, 'steps': 1905, 'loss/train': 2.8726580142974854} -09/20/2021 21:05:29 - INFO - __main__ - Step 30490: {'lr': 0.0001997287156200603, 'samples': 975680, 'steps': 1905, 'loss/train': 3.1503190994262695} -09/20/2021 21:05:30 - INFO - __main__ - Step 30491: {'lr': 0.0001997287156200603, 'samples': 975712, 'steps': 1905, 'loss/train': 2.2251524925231934} -09/20/2021 21:05:31 - INFO - __main__ - Step 30492: {'lr': 0.0001997287156200603, 'samples': 975744, 'steps': 1905, 'loss/train': 2.9254136085510254} -09/20/2021 21:05:32 - INFO - __main__ - Step 30493: {'lr': 0.0001997287156200603, 'samples': 975776, 'steps': 1905, 'loss/train': 2.2628772258758545} -09/20/2021 21:05:32 - INFO - __main__ - Step 30494: {'lr': 0.0001997287156200603, 'samples': 975808, 'steps': 1905, 'loss/train': 2.167233467102051} -09/20/2021 21:05:33 - INFO - __main__ - Step 30495: {'lr': 0.0001997287156200603, 'samples': 975840, 'steps': 1905, 'loss/train': 1.6670496463775635} -09/20/2021 21:05:34 - INFO - __main__ - Step 30496: {'lr': 0.0001997287156200603, 'samples': 975872, 'steps': 1905, 'loss/train': 2.5546555519104004} -09/20/2021 21:05:35 - INFO - __main__ - Step 30497: {'lr': 0.000199728245873172, 'samples': 975904, 'steps': 1906, 'loss/train': 2.89929461479187} -09/20/2021 21:05:35 - INFO - __main__ - Step 30498: {'lr': 0.000199728245873172, 'samples': 975936, 'steps': 1906, 'loss/train': 2.9089155197143555} -09/20/2021 21:05:36 - INFO - __main__ - Step 30499: {'lr': 0.000199728245873172, 'samples': 975968, 'steps': 1906, 'loss/train': 2.511427164077759} -09/20/2021 21:05:37 - INFO - __main__ - Step 30500: {'lr': 0.000199728245873172, 'samples': 976000, 'steps': 1906, 'loss/train': 2.927199125289917} -09/20/2021 21:05:38 - INFO - __main__ - Step 30501: {'lr': 0.000199728245873172, 'samples': 976032, 'steps': 1906, 'loss/train': 2.697620391845703} -09/20/2021 21:05:38 - INFO - __main__ - Step 30502: {'lr': 0.000199728245873172, 'samples': 976064, 'steps': 1906, 'loss/train': 2.359983205795288} -09/20/2021 21:05:39 - INFO - __main__ - Step 30503: {'lr': 0.000199728245873172, 'samples': 976096, 'steps': 1906, 'loss/train': 2.4714348316192627} -09/20/2021 21:05:40 - INFO - __main__ - Step 30504: {'lr': 0.000199728245873172, 'samples': 976128, 'steps': 1906, 'loss/train': 2.8907554149627686} -09/20/2021 21:05:41 - INFO - __main__ - Step 30505: {'lr': 0.000199728245873172, 'samples': 976160, 'steps': 1906, 'loss/train': 2.2730391025543213} -09/20/2021 21:05:41 - INFO - __main__ - Step 30506: {'lr': 0.000199728245873172, 'samples': 976192, 'steps': 1906, 'loss/train': 1.7086626291275024} -09/20/2021 21:05:42 - INFO - __main__ - Step 30507: {'lr': 0.000199728245873172, 'samples': 976224, 'steps': 1906, 'loss/train': 1.238287329673767} -09/20/2021 21:05:43 - INFO - __main__ - Step 30508: {'lr': 0.000199728245873172, 'samples': 976256, 'steps': 1906, 'loss/train': 2.8480312824249268} -09/20/2021 21:05:44 - INFO - __main__ - Step 30509: {'lr': 0.000199728245873172, 'samples': 976288, 'steps': 1906, 'loss/train': 2.319976806640625} -09/20/2021 21:05:44 - INFO - __main__ - Step 30510: {'lr': 0.000199728245873172, 'samples': 976320, 'steps': 1906, 'loss/train': 2.3125054836273193} -09/20/2021 21:05:45 - INFO - __main__ - Step 30511: {'lr': 0.000199728245873172, 'samples': 976352, 'steps': 1906, 'loss/train': 2.600982427597046} -09/20/2021 21:05:46 - INFO - __main__ - Step 30512: {'lr': 0.000199728245873172, 'samples': 976384, 'steps': 1906, 'loss/train': 2.4782800674438477} -09/20/2021 21:05:47 - INFO - __main__ - Step 30513: {'lr': 0.00019972777572048987, 'samples': 976416, 'steps': 1907, 'loss/train': 3.1498587131500244} -09/20/2021 21:05:48 - INFO - __main__ - Step 30514: {'lr': 0.00019972777572048987, 'samples': 976448, 'steps': 1907, 'loss/train': 0.9830114841461182} -09/20/2021 21:05:48 - INFO - __main__ - Step 30515: {'lr': 0.00019972777572048987, 'samples': 976480, 'steps': 1907, 'loss/train': 3.0826520919799805} -09/20/2021 21:05:49 - INFO - __main__ - Step 30516: {'lr': 0.00019972777572048987, 'samples': 976512, 'steps': 1907, 'loss/train': 2.1761722564697266} -09/20/2021 21:05:50 - INFO - __main__ - Step 30517: {'lr': 0.00019972777572048987, 'samples': 976544, 'steps': 1907, 'loss/train': 1.7190818786621094} -09/20/2021 21:05:51 - INFO - __main__ - Step 30518: {'lr': 0.00019972777572048987, 'samples': 976576, 'steps': 1907, 'loss/train': 2.566108226776123} -09/20/2021 21:05:51 - INFO - __main__ - Step 30519: {'lr': 0.00019972777572048987, 'samples': 976608, 'steps': 1907, 'loss/train': 2.3758556842803955} -09/20/2021 21:05:53 - INFO - __main__ - Step 30520: {'lr': 0.00019972777572048987, 'samples': 976640, 'steps': 1907, 'loss/train': 2.3264706134796143} -09/20/2021 21:05:53 - INFO - __main__ - Step 30521: {'lr': 0.00019972777572048987, 'samples': 976672, 'steps': 1907, 'loss/train': 2.0135412216186523} -09/20/2021 21:05:54 - INFO - __main__ - Step 30522: {'lr': 0.00019972777572048987, 'samples': 976704, 'steps': 1907, 'loss/train': 2.762901782989502} -09/20/2021 21:05:55 - INFO - __main__ - Step 30523: {'lr': 0.00019972777572048987, 'samples': 976736, 'steps': 1907, 'loss/train': 2.4924440383911133} -09/20/2021 21:05:56 - INFO - __main__ - Step 30524: {'lr': 0.00019972777572048987, 'samples': 976768, 'steps': 1907, 'loss/train': 3.6881775856018066} -09/20/2021 21:05:56 - INFO - __main__ - Step 30525: {'lr': 0.00019972777572048987, 'samples': 976800, 'steps': 1907, 'loss/train': 2.2999744415283203} -09/20/2021 21:05:57 - INFO - __main__ - Step 30526: {'lr': 0.00019972777572048987, 'samples': 976832, 'steps': 1907, 'loss/train': 0.3276318609714508} -09/20/2021 21:05:58 - INFO - __main__ - Step 30527: {'lr': 0.00019972777572048987, 'samples': 976864, 'steps': 1907, 'loss/train': 0.2734604775905609} -09/20/2021 21:05:59 - INFO - __main__ - Step 30528: {'lr': 0.00019972777572048987, 'samples': 976896, 'steps': 1907, 'loss/train': 0.4273170530796051} -09/20/2021 21:06:00 - INFO - __main__ - Step 30529: {'lr': 0.0001997273051620158, 'samples': 976928, 'steps': 1908, 'loss/train': 0.37551748752593994} -09/20/2021 21:06:00 - INFO - __main__ - Step 30530: {'lr': 0.0001997273051620158, 'samples': 976960, 'steps': 1908, 'loss/train': 2.979241371154785} -09/20/2021 21:06:01 - INFO - __main__ - Step 30531: {'lr': 0.0001997273051620158, 'samples': 976992, 'steps': 1908, 'loss/train': 1.5451014041900635} -09/20/2021 21:06:02 - INFO - __main__ - Step 30532: {'lr': 0.0001997273051620158, 'samples': 977024, 'steps': 1908, 'loss/train': 2.3368706703186035} -09/20/2021 21:06:03 - INFO - __main__ - Step 30533: {'lr': 0.0001997273051620158, 'samples': 977056, 'steps': 1908, 'loss/train': 2.6628057956695557} -09/20/2021 21:06:03 - INFO - __main__ - Step 30534: {'lr': 0.0001997273051620158, 'samples': 977088, 'steps': 1908, 'loss/train': 0.3247653841972351} -09/20/2021 21:06:04 - INFO - __main__ - Step 30535: {'lr': 0.0001997273051620158, 'samples': 977120, 'steps': 1908, 'loss/train': 0.34525591135025024} -09/20/2021 21:06:05 - INFO - __main__ - Step 30536: {'lr': 0.0001997273051620158, 'samples': 977152, 'steps': 1908, 'loss/train': 1.6372262239456177} -09/20/2021 21:06:06 - INFO - __main__ - Step 30537: {'lr': 0.0001997273051620158, 'samples': 977184, 'steps': 1908, 'loss/train': 1.2610892057418823} -09/20/2021 21:06:06 - INFO - __main__ - Step 30538: {'lr': 0.0001997273051620158, 'samples': 977216, 'steps': 1908, 'loss/train': 1.3493036031723022} -09/20/2021 21:06:07 - INFO - __main__ - Step 30539: {'lr': 0.0001997273051620158, 'samples': 977248, 'steps': 1908, 'loss/train': 1.1850337982177734} -09/20/2021 21:06:08 - INFO - __main__ - Step 30540: {'lr': 0.0001997273051620158, 'samples': 977280, 'steps': 1908, 'loss/train': 1.6956392526626587} -09/20/2021 21:06:09 - INFO - __main__ - Step 30541: {'lr': 0.0001997273051620158, 'samples': 977312, 'steps': 1908, 'loss/train': 2.4742016792297363} -09/20/2021 21:06:09 - INFO - __main__ - Step 30542: {'lr': 0.0001997273051620158, 'samples': 977344, 'steps': 1908, 'loss/train': 2.894045829772949} -09/20/2021 21:06:10 - INFO - __main__ - Step 30543: {'lr': 0.0001997273051620158, 'samples': 977376, 'steps': 1908, 'loss/train': 2.7550837993621826} -09/20/2021 21:06:11 - INFO - __main__ - Step 30544: {'lr': 0.0001997273051620158, 'samples': 977408, 'steps': 1908, 'loss/train': 2.0479447841644287} -09/20/2021 21:06:12 - INFO - __main__ - Step 30545: {'lr': 0.0001997268341977517, 'samples': 977440, 'steps': 1909, 'loss/train': 2.6751961708068848} -09/20/2021 21:06:12 - INFO - __main__ - Step 30546: {'lr': 0.0001997268341977517, 'samples': 977472, 'steps': 1909, 'loss/train': 2.616032838821411} -09/20/2021 21:06:13 - INFO - __main__ - Step 30547: {'lr': 0.0001997268341977517, 'samples': 977504, 'steps': 1909, 'loss/train': 2.8937389850616455} -09/20/2021 21:06:14 - INFO - __main__ - Step 30548: {'lr': 0.0001997268341977517, 'samples': 977536, 'steps': 1909, 'loss/train': 2.2113749980926514} -09/20/2021 21:06:15 - INFO - __main__ - Step 30549: {'lr': 0.0001997268341977517, 'samples': 977568, 'steps': 1909, 'loss/train': 1.8147857189178467} -09/20/2021 21:06:15 - INFO - __main__ - Step 30550: {'lr': 0.0001997268341977517, 'samples': 977600, 'steps': 1909, 'loss/train': 2.4441158771514893} -09/20/2021 21:06:17 - INFO - __main__ - Step 30551: {'lr': 0.0001997268341977517, 'samples': 977632, 'steps': 1909, 'loss/train': 3.039492607116699} -09/20/2021 21:06:18 - INFO - __main__ - Step 30552: {'lr': 0.0001997268341977517, 'samples': 977664, 'steps': 1909, 'loss/train': 2.6829049587249756} -09/20/2021 21:06:19 - INFO - __main__ - Step 30553: {'lr': 0.0001997268341977517, 'samples': 977696, 'steps': 1909, 'loss/train': 1.809602975845337} -09/20/2021 21:06:20 - INFO - __main__ - Step 30554: {'lr': 0.0001997268341977517, 'samples': 977728, 'steps': 1909, 'loss/train': 2.044682741165161} -09/20/2021 21:06:20 - INFO - __main__ - Step 30555: {'lr': 0.0001997268341977517, 'samples': 977760, 'steps': 1909, 'loss/train': 2.904075860977173} -09/20/2021 21:06:21 - INFO - __main__ - Step 30556: {'lr': 0.0001997268341977517, 'samples': 977792, 'steps': 1909, 'loss/train': 3.905454158782959} -09/20/2021 21:06:22 - INFO - __main__ - Step 30557: {'lr': 0.0001997268341977517, 'samples': 977824, 'steps': 1909, 'loss/train': 2.299805164337158} -09/20/2021 21:06:23 - INFO - __main__ - Step 30558: {'lr': 0.0001997268341977517, 'samples': 977856, 'steps': 1909, 'loss/train': 1.8525720834732056} -09/20/2021 21:06:23 - INFO - __main__ - Step 30559: {'lr': 0.0001997268341977517, 'samples': 977888, 'steps': 1909, 'loss/train': 4.926590919494629} -09/20/2021 21:06:24 - INFO - __main__ - Step 30560: {'lr': 0.0001997268341977517, 'samples': 977920, 'steps': 1909, 'loss/train': 3.6159257888793945} -09/20/2021 21:06:25 - INFO - __main__ - Step 30561: {'lr': 0.00019972636282769953, 'samples': 977952, 'steps': 1910, 'loss/train': 2.9480769634246826} -09/20/2021 21:06:26 - INFO - __main__ - Step 30562: {'lr': 0.00019972636282769953, 'samples': 977984, 'steps': 1910, 'loss/train': 3.169459342956543} -09/20/2021 21:06:26 - INFO - __main__ - Step 30563: {'lr': 0.00019972636282769953, 'samples': 978016, 'steps': 1910, 'loss/train': 2.1226274967193604} -09/20/2021 21:06:27 - INFO - __main__ - Step 30564: {'lr': 0.00019972636282769953, 'samples': 978048, 'steps': 1910, 'loss/train': 1.3028205633163452} -09/20/2021 21:06:28 - INFO - __main__ - Step 30565: {'lr': 0.00019972636282769953, 'samples': 978080, 'steps': 1910, 'loss/train': 2.7314436435699463} -09/20/2021 21:06:29 - INFO - __main__ - Step 30566: {'lr': 0.00019972636282769953, 'samples': 978112, 'steps': 1910, 'loss/train': 1.0829336643218994} -09/20/2021 21:06:29 - INFO - __main__ - Step 30567: {'lr': 0.00019972636282769953, 'samples': 978144, 'steps': 1910, 'loss/train': 2.7114479541778564} -09/20/2021 21:06:30 - INFO - __main__ - Step 30568: {'lr': 0.00019972636282769953, 'samples': 978176, 'steps': 1910, 'loss/train': 2.540555477142334} -09/20/2021 21:06:31 - INFO - __main__ - Step 30569: {'lr': 0.00019972636282769953, 'samples': 978208, 'steps': 1910, 'loss/train': 1.8384236097335815} -09/20/2021 21:06:32 - INFO - __main__ - Step 30570: {'lr': 0.00019972636282769953, 'samples': 978240, 'steps': 1910, 'loss/train': 2.312666654586792} -09/20/2021 21:06:32 - INFO - __main__ - Step 30571: {'lr': 0.00019972636282769953, 'samples': 978272, 'steps': 1910, 'loss/train': 2.7513861656188965} -09/20/2021 21:06:33 - INFO - __main__ - Step 30572: {'lr': 0.00019972636282769953, 'samples': 978304, 'steps': 1910, 'loss/train': 2.903323173522949} -09/20/2021 21:06:34 - INFO - __main__ - Step 30573: {'lr': 0.00019972636282769953, 'samples': 978336, 'steps': 1910, 'loss/train': 2.687145471572876} -09/20/2021 21:06:35 - INFO - __main__ - Step 30574: {'lr': 0.00019972636282769953, 'samples': 978368, 'steps': 1910, 'loss/train': 2.760054588317871} -09/20/2021 21:06:35 - INFO - __main__ - Step 30575: {'lr': 0.00019972636282769953, 'samples': 978400, 'steps': 1910, 'loss/train': 2.719317674636841} -09/20/2021 21:06:36 - INFO - __main__ - Step 30576: {'lr': 0.00019972636282769953, 'samples': 978432, 'steps': 1910, 'loss/train': 2.6622214317321777} -09/20/2021 21:06:37 - INFO - __main__ - Step 30577: {'lr': 0.00019972589105186114, 'samples': 978464, 'steps': 1911, 'loss/train': 2.4461021423339844} -09/20/2021 21:06:38 - INFO - __main__ - Step 30578: {'lr': 0.00019972589105186114, 'samples': 978496, 'steps': 1911, 'loss/train': 2.6019093990325928} -09/20/2021 21:06:39 - INFO - __main__ - Step 30579: {'lr': 0.00019972589105186114, 'samples': 978528, 'steps': 1911, 'loss/train': 2.3782544136047363} -09/20/2021 21:06:39 - INFO - __main__ - Step 30580: {'lr': 0.00019972589105186114, 'samples': 978560, 'steps': 1911, 'loss/train': 2.5191543102264404} -09/20/2021 21:06:40 - INFO - __main__ - Step 30581: {'lr': 0.00019972589105186114, 'samples': 978592, 'steps': 1911, 'loss/train': 2.6216650009155273} -09/20/2021 21:06:41 - INFO - __main__ - Step 30582: {'lr': 0.00019972589105186114, 'samples': 978624, 'steps': 1911, 'loss/train': 2.472616672515869} -09/20/2021 21:06:42 - INFO - __main__ - Step 30583: {'lr': 0.00019972589105186114, 'samples': 978656, 'steps': 1911, 'loss/train': 2.52032470703125} -09/20/2021 21:06:42 - INFO - __main__ - Step 30584: {'lr': 0.00019972589105186114, 'samples': 978688, 'steps': 1911, 'loss/train': 2.4330508708953857} -09/20/2021 21:06:43 - INFO - __main__ - Step 30585: {'lr': 0.00019972589105186114, 'samples': 978720, 'steps': 1911, 'loss/train': 0.9573628306388855} -09/20/2021 21:06:44 - INFO - __main__ - Step 30586: {'lr': 0.00019972589105186114, 'samples': 978752, 'steps': 1911, 'loss/train': 2.525815725326538} -09/20/2021 21:06:45 - INFO - __main__ - Step 30587: {'lr': 0.00019972589105186114, 'samples': 978784, 'steps': 1911, 'loss/train': 2.5801479816436768} -09/20/2021 21:06:45 - INFO - __main__ - Step 30588: {'lr': 0.00019972589105186114, 'samples': 978816, 'steps': 1911, 'loss/train': 2.561284065246582} -09/20/2021 21:06:46 - INFO - __main__ - Step 30589: {'lr': 0.00019972589105186114, 'samples': 978848, 'steps': 1911, 'loss/train': 2.5580861568450928} -09/20/2021 21:06:47 - INFO - __main__ - Step 30590: {'lr': 0.00019972589105186114, 'samples': 978880, 'steps': 1911, 'loss/train': 2.7952322959899902} -09/20/2021 21:06:48 - INFO - __main__ - Step 30591: {'lr': 0.00019972589105186114, 'samples': 978912, 'steps': 1911, 'loss/train': 2.788618326187134} -09/20/2021 21:06:48 - INFO - __main__ - Step 30592: {'lr': 0.00019972589105186114, 'samples': 978944, 'steps': 1911, 'loss/train': 2.7898929119110107} -09/20/2021 21:06:49 - INFO - __main__ - Step 30593: {'lr': 0.00019972541887023853, 'samples': 978976, 'steps': 1912, 'loss/train': 2.7551956176757812} -09/20/2021 21:06:51 - INFO - __main__ - Step 30594: {'lr': 0.00019972541887023853, 'samples': 979008, 'steps': 1912, 'loss/train': 3.029179573059082} -09/20/2021 21:06:51 - INFO - __main__ - Step 30595: {'lr': 0.00019972541887023853, 'samples': 979040, 'steps': 1912, 'loss/train': 2.4024932384490967} -09/20/2021 21:06:52 - INFO - __main__ - Step 30596: {'lr': 0.00019972541887023853, 'samples': 979072, 'steps': 1912, 'loss/train': 2.4519612789154053} -09/20/2021 21:06:53 - INFO - __main__ - Step 30597: {'lr': 0.00019972541887023853, 'samples': 979104, 'steps': 1912, 'loss/train': 2.987271785736084} -09/20/2021 21:06:54 - INFO - __main__ - Step 30598: {'lr': 0.00019972541887023853, 'samples': 979136, 'steps': 1912, 'loss/train': 2.6608035564422607} -09/20/2021 21:06:54 - INFO - __main__ - Step 30599: {'lr': 0.00019972541887023853, 'samples': 979168, 'steps': 1912, 'loss/train': 2.103464126586914} -09/20/2021 21:06:55 - INFO - __main__ - Step 30600: {'lr': 0.00019972541887023853, 'samples': 979200, 'steps': 1912, 'loss/train': 1.7764652967453003} -09/20/2021 21:06:56 - INFO - __main__ - Step 30601: {'lr': 0.00019972541887023853, 'samples': 979232, 'steps': 1912, 'loss/train': 2.3819854259490967} -09/20/2021 21:06:57 - INFO - __main__ - Step 30602: {'lr': 0.00019972541887023853, 'samples': 979264, 'steps': 1912, 'loss/train': 2.3114230632781982} -09/20/2021 21:06:57 - INFO - __main__ - Step 30603: {'lr': 0.00019972541887023853, 'samples': 979296, 'steps': 1912, 'loss/train': 3.0593996047973633} -09/20/2021 21:06:58 - INFO - __main__ - Step 30604: {'lr': 0.00019972541887023853, 'samples': 979328, 'steps': 1912, 'loss/train': 2.376328229904175} -09/20/2021 21:06:59 - INFO - __main__ - Step 30605: {'lr': 0.00019972541887023853, 'samples': 979360, 'steps': 1912, 'loss/train': 3.173480987548828} -09/20/2021 21:07:00 - INFO - __main__ - Step 30606: {'lr': 0.00019972541887023853, 'samples': 979392, 'steps': 1912, 'loss/train': 2.08501935005188} -09/20/2021 21:07:00 - INFO - __main__ - Step 30607: {'lr': 0.00019972541887023853, 'samples': 979424, 'steps': 1912, 'loss/train': 2.49301815032959} -09/20/2021 21:07:01 - INFO - __main__ - Step 30608: {'lr': 0.00019972541887023853, 'samples': 979456, 'steps': 1912, 'loss/train': 2.5182037353515625} -09/20/2021 21:07:02 - INFO - __main__ - Step 30609: {'lr': 0.00019972494628283353, 'samples': 979488, 'steps': 1913, 'loss/train': 2.3122055530548096} -09/20/2021 21:07:03 - INFO - __main__ - Step 30610: {'lr': 0.00019972494628283353, 'samples': 979520, 'steps': 1913, 'loss/train': 2.4344005584716797} -09/20/2021 21:07:04 - INFO - __main__ - Step 30611: {'lr': 0.00019972494628283353, 'samples': 979552, 'steps': 1913, 'loss/train': 2.8525967597961426} -09/20/2021 21:07:04 - INFO - __main__ - Step 30612: {'lr': 0.00019972494628283353, 'samples': 979584, 'steps': 1913, 'loss/train': 2.28922700881958} -09/20/2021 21:07:05 - INFO - __main__ - Step 30613: {'lr': 0.00019972494628283353, 'samples': 979616, 'steps': 1913, 'loss/train': 3.719119071960449} -09/20/2021 21:07:06 - INFO - __main__ - Step 30614: {'lr': 0.00019972494628283353, 'samples': 979648, 'steps': 1913, 'loss/train': 2.2137691974639893} -09/20/2021 21:07:07 - INFO - __main__ - Step 30615: {'lr': 0.00019972494628283353, 'samples': 979680, 'steps': 1913, 'loss/train': 3.24617862701416} -09/20/2021 21:07:07 - INFO - __main__ - Step 30616: {'lr': 0.00019972494628283353, 'samples': 979712, 'steps': 1913, 'loss/train': 2.6561365127563477} -09/20/2021 21:07:08 - INFO - __main__ - Step 30617: {'lr': 0.00019972494628283353, 'samples': 979744, 'steps': 1913, 'loss/train': 1.7369060516357422} -09/20/2021 21:07:09 - INFO - __main__ - Step 30618: {'lr': 0.00019972494628283353, 'samples': 979776, 'steps': 1913, 'loss/train': 3.34138822555542} -09/20/2021 21:07:10 - INFO - __main__ - Step 30619: {'lr': 0.00019972494628283353, 'samples': 979808, 'steps': 1913, 'loss/train': 3.1408321857452393} -09/20/2021 21:07:10 - INFO - __main__ - Step 30620: {'lr': 0.00019972494628283353, 'samples': 979840, 'steps': 1913, 'loss/train': 2.623581886291504} -09/20/2021 21:07:11 - INFO - __main__ - Step 30621: {'lr': 0.00019972494628283353, 'samples': 979872, 'steps': 1913, 'loss/train': 1.924306035041809} -09/20/2021 21:07:12 - INFO - __main__ - Step 30622: {'lr': 0.00019972494628283353, 'samples': 979904, 'steps': 1913, 'loss/train': 2.8926870822906494} -09/20/2021 21:07:13 - INFO - __main__ - Step 30623: {'lr': 0.00019972494628283353, 'samples': 979936, 'steps': 1913, 'loss/train': 3.227815628051758} -09/20/2021 21:07:13 - INFO - __main__ - Step 30624: {'lr': 0.00019972494628283353, 'samples': 979968, 'steps': 1913, 'loss/train': 2.9747862815856934} -09/20/2021 21:07:15 - INFO - __main__ - Step 30625: {'lr': 0.00019972447328964817, 'samples': 980000, 'steps': 1914, 'loss/train': 1.9299029111862183} -09/20/2021 21:07:16 - INFO - __main__ - Step 30626: {'lr': 0.00019972447328964817, 'samples': 980032, 'steps': 1914, 'loss/train': 2.9248411655426025} -09/20/2021 21:07:17 - INFO - __main__ - Step 30627: {'lr': 0.00019972447328964817, 'samples': 980064, 'steps': 1914, 'loss/train': 2.2083606719970703} -09/20/2021 21:07:17 - INFO - __main__ - Step 30628: {'lr': 0.00019972447328964817, 'samples': 980096, 'steps': 1914, 'loss/train': 3.3076794147491455} -09/20/2021 21:07:18 - INFO - __main__ - Step 30629: {'lr': 0.00019972447328964817, 'samples': 980128, 'steps': 1914, 'loss/train': 3.1409599781036377} -09/20/2021 21:07:19 - INFO - __main__ - Step 30630: {'lr': 0.00019972447328964817, 'samples': 980160, 'steps': 1914, 'loss/train': 2.5190045833587646} -09/20/2021 21:07:20 - INFO - __main__ - Step 30631: {'lr': 0.00019972447328964817, 'samples': 980192, 'steps': 1914, 'loss/train': 0.571560263633728} -09/20/2021 21:07:20 - INFO - __main__ - Step 30632: {'lr': 0.00019972447328964817, 'samples': 980224, 'steps': 1914, 'loss/train': 2.00687575340271} -09/20/2021 21:07:21 - INFO - __main__ - Step 30633: {'lr': 0.00019972447328964817, 'samples': 980256, 'steps': 1914, 'loss/train': 1.8928159475326538} -09/20/2021 21:07:22 - INFO - __main__ - Step 30634: {'lr': 0.00019972447328964817, 'samples': 980288, 'steps': 1914, 'loss/train': 2.5830800533294678} -09/20/2021 21:07:23 - INFO - __main__ - Step 30635: {'lr': 0.00019972447328964817, 'samples': 980320, 'steps': 1914, 'loss/train': 1.9472179412841797} -09/20/2021 21:07:23 - INFO - __main__ - Step 30636: {'lr': 0.00019972447328964817, 'samples': 980352, 'steps': 1914, 'loss/train': 2.4751524925231934} -09/20/2021 21:07:24 - INFO - __main__ - Step 30637: {'lr': 0.00019972447328964817, 'samples': 980384, 'steps': 1914, 'loss/train': 2.568826675415039} -09/20/2021 21:07:25 - INFO - __main__ - Step 30638: {'lr': 0.00019972447328964817, 'samples': 980416, 'steps': 1914, 'loss/train': 2.671957492828369} -09/20/2021 21:07:26 - INFO - __main__ - Step 30639: {'lr': 0.00019972447328964817, 'samples': 980448, 'steps': 1914, 'loss/train': 1.9791409969329834} -09/20/2021 21:07:26 - INFO - __main__ - Step 30640: {'lr': 0.00019972447328964817, 'samples': 980480, 'steps': 1914, 'loss/train': 1.4814114570617676} -09/20/2021 21:07:27 - INFO - __main__ - Step 30641: {'lr': 0.00019972399989068426, 'samples': 980512, 'steps': 1915, 'loss/train': 1.8684666156768799} -09/20/2021 21:07:28 - INFO - __main__ - Step 30642: {'lr': 0.00019972399989068426, 'samples': 980544, 'steps': 1915, 'loss/train': 2.7146248817443848} -09/20/2021 21:07:29 - INFO - __main__ - Step 30643: {'lr': 0.00019972399989068426, 'samples': 980576, 'steps': 1915, 'loss/train': 3.2246670722961426} -09/20/2021 21:07:30 - INFO - __main__ - Step 30644: {'lr': 0.00019972399989068426, 'samples': 980608, 'steps': 1915, 'loss/train': 2.711202621459961} -09/20/2021 21:07:30 - INFO - __main__ - Step 30645: {'lr': 0.00019972399989068426, 'samples': 980640, 'steps': 1915, 'loss/train': 2.418303966522217} -09/20/2021 21:07:31 - INFO - __main__ - Step 30646: {'lr': 0.00019972399989068426, 'samples': 980672, 'steps': 1915, 'loss/train': 2.113262414932251} -09/20/2021 21:07:32 - INFO - __main__ - Step 30647: {'lr': 0.00019972399989068426, 'samples': 980704, 'steps': 1915, 'loss/train': 1.506125569343567} -09/20/2021 21:07:33 - INFO - __main__ - Step 30648: {'lr': 0.00019972399989068426, 'samples': 980736, 'steps': 1915, 'loss/train': 1.7261961698532104} -09/20/2021 21:07:33 - INFO - __main__ - Step 30649: {'lr': 0.00019972399989068426, 'samples': 980768, 'steps': 1915, 'loss/train': 2.4121651649475098} -09/20/2021 21:07:34 - INFO - __main__ - Step 30650: {'lr': 0.00019972399989068426, 'samples': 980800, 'steps': 1915, 'loss/train': 1.8365579843521118} -09/20/2021 21:07:35 - INFO - __main__ - Step 30651: {'lr': 0.00019972399989068426, 'samples': 980832, 'steps': 1915, 'loss/train': 3.17677903175354} -09/20/2021 21:07:36 - INFO - __main__ - Step 30652: {'lr': 0.00019972399989068426, 'samples': 980864, 'steps': 1915, 'loss/train': 1.696293592453003} -09/20/2021 21:07:36 - INFO - __main__ - Step 30653: {'lr': 0.00019972399989068426, 'samples': 980896, 'steps': 1915, 'loss/train': 2.275012493133545} -09/20/2021 21:07:37 - INFO - __main__ - Step 30654: {'lr': 0.00019972399989068426, 'samples': 980928, 'steps': 1915, 'loss/train': 2.961193561553955} -09/20/2021 21:07:38 - INFO - __main__ - Step 30655: {'lr': 0.00019972399989068426, 'samples': 980960, 'steps': 1915, 'loss/train': 2.66420578956604} -09/20/2021 21:07:39 - INFO - __main__ - Step 30656: {'lr': 0.00019972399989068426, 'samples': 980992, 'steps': 1915, 'loss/train': 1.557385802268982} -09/20/2021 21:07:40 - INFO - __main__ - Step 30657: {'lr': 0.0001997235260859438, 'samples': 981024, 'steps': 1916, 'loss/train': 2.797767162322998} -09/20/2021 21:07:41 - INFO - __main__ - Step 30658: {'lr': 0.0001997235260859438, 'samples': 981056, 'steps': 1916, 'loss/train': 2.0997824668884277} -09/20/2021 21:07:41 - INFO - __main__ - Step 30659: {'lr': 0.0001997235260859438, 'samples': 981088, 'steps': 1916, 'loss/train': 2.688217878341675} -09/20/2021 21:07:42 - INFO - __main__ - Step 30660: {'lr': 0.0001997235260859438, 'samples': 981120, 'steps': 1916, 'loss/train': 2.9088478088378906} -09/20/2021 21:07:43 - INFO - __main__ - Step 30661: {'lr': 0.0001997235260859438, 'samples': 981152, 'steps': 1916, 'loss/train': 2.808450222015381} -09/20/2021 21:07:44 - INFO - __main__ - Step 30662: {'lr': 0.0001997235260859438, 'samples': 981184, 'steps': 1916, 'loss/train': 3.0501677989959717} -09/20/2021 21:07:44 - INFO - __main__ - Step 30663: {'lr': 0.0001997235260859438, 'samples': 981216, 'steps': 1916, 'loss/train': 2.5582151412963867} -09/20/2021 21:07:45 - INFO - __main__ - Step 30664: {'lr': 0.0001997235260859438, 'samples': 981248, 'steps': 1916, 'loss/train': 2.2739083766937256} -09/20/2021 21:07:46 - INFO - __main__ - Step 30665: {'lr': 0.0001997235260859438, 'samples': 981280, 'steps': 1916, 'loss/train': 2.051427125930786} -09/20/2021 21:07:47 - INFO - __main__ - Step 30666: {'lr': 0.0001997235260859438, 'samples': 981312, 'steps': 1916, 'loss/train': 1.696182131767273} -09/20/2021 21:07:47 - INFO - __main__ - Step 30667: {'lr': 0.0001997235260859438, 'samples': 981344, 'steps': 1916, 'loss/train': 2.2714385986328125} -09/20/2021 21:07:48 - INFO - __main__ - Step 30668: {'lr': 0.0001997235260859438, 'samples': 981376, 'steps': 1916, 'loss/train': 2.2279272079467773} -09/20/2021 21:07:49 - INFO - __main__ - Step 30669: {'lr': 0.0001997235260859438, 'samples': 981408, 'steps': 1916, 'loss/train': 3.744192123413086} -09/20/2021 21:07:50 - INFO - __main__ - Step 30670: {'lr': 0.0001997235260859438, 'samples': 981440, 'steps': 1916, 'loss/train': 2.646437406539917} -09/20/2021 21:07:50 - INFO - __main__ - Step 30671: {'lr': 0.0001997235260859438, 'samples': 981472, 'steps': 1916, 'loss/train': 3.975001096725464} -09/20/2021 21:07:51 - INFO - __main__ - Step 30672: {'lr': 0.0001997235260859438, 'samples': 981504, 'steps': 1916, 'loss/train': 2.680098295211792} -09/20/2021 21:07:52 - INFO - __main__ - Step 30673: {'lr': 0.00019972305187542872, 'samples': 981536, 'steps': 1917, 'loss/train': 2.5659379959106445} -09/20/2021 21:07:53 - INFO - __main__ - Step 30674: {'lr': 0.00019972305187542872, 'samples': 981568, 'steps': 1917, 'loss/train': 2.875892162322998} -09/20/2021 21:07:54 - INFO - __main__ - Step 30675: {'lr': 0.00019972305187542872, 'samples': 981600, 'steps': 1917, 'loss/train': 1.1182154417037964} -09/20/2021 21:07:54 - INFO - __main__ - Step 30676: {'lr': 0.00019972305187542872, 'samples': 981632, 'steps': 1917, 'loss/train': 2.4762959480285645} -09/20/2021 21:07:55 - INFO - __main__ - Step 30677: {'lr': 0.00019972305187542872, 'samples': 981664, 'steps': 1917, 'loss/train': 2.3717167377471924} -09/20/2021 21:07:56 - INFO - __main__ - Step 30678: {'lr': 0.00019972305187542872, 'samples': 981696, 'steps': 1917, 'loss/train': 2.4431350231170654} -09/20/2021 21:07:57 - INFO - __main__ - Step 30679: {'lr': 0.00019972305187542872, 'samples': 981728, 'steps': 1917, 'loss/train': 1.9528498649597168} -09/20/2021 21:07:57 - INFO - __main__ - Step 30680: {'lr': 0.00019972305187542872, 'samples': 981760, 'steps': 1917, 'loss/train': 2.580700159072876} -09/20/2021 21:07:58 - INFO - __main__ - Step 30681: {'lr': 0.00019972305187542872, 'samples': 981792, 'steps': 1917, 'loss/train': 2.70424485206604} -09/20/2021 21:07:59 - INFO - __main__ - Step 30682: {'lr': 0.00019972305187542872, 'samples': 981824, 'steps': 1917, 'loss/train': 2.2994089126586914} -09/20/2021 21:08:00 - INFO - __main__ - Step 30683: {'lr': 0.00019972305187542872, 'samples': 981856, 'steps': 1917, 'loss/train': 3.1115312576293945} -09/20/2021 21:08:00 - INFO - __main__ - Step 30684: {'lr': 0.00019972305187542872, 'samples': 981888, 'steps': 1917, 'loss/train': 2.5282490253448486} -09/20/2021 21:08:01 - INFO - __main__ - Step 30685: {'lr': 0.00019972305187542872, 'samples': 981920, 'steps': 1917, 'loss/train': 2.940814971923828} -09/20/2021 21:08:02 - INFO - __main__ - Step 30686: {'lr': 0.00019972305187542872, 'samples': 981952, 'steps': 1917, 'loss/train': 3.0228705406188965} -09/20/2021 21:08:03 - INFO - __main__ - Step 30687: {'lr': 0.00019972305187542872, 'samples': 981984, 'steps': 1917, 'loss/train': 3.819261312484741} -09/20/2021 21:08:04 - INFO - __main__ - Step 30688: {'lr': 0.00019972305187542872, 'samples': 982016, 'steps': 1917, 'loss/train': 3.292924165725708} -09/20/2021 21:08:05 - INFO - __main__ - Step 30689: {'lr': 0.0001997225772591409, 'samples': 982048, 'steps': 1918, 'loss/train': 2.635058641433716} -09/20/2021 21:08:06 - INFO - __main__ - Step 30690: {'lr': 0.0001997225772591409, 'samples': 982080, 'steps': 1918, 'loss/train': 2.3041481971740723} -09/20/2021 21:08:07 - INFO - __main__ - Step 30691: {'lr': 0.0001997225772591409, 'samples': 982112, 'steps': 1918, 'loss/train': 2.776193141937256} -09/20/2021 21:08:07 - INFO - __main__ - Step 30692: {'lr': 0.0001997225772591409, 'samples': 982144, 'steps': 1918, 'loss/train': 2.165811061859131} -09/20/2021 21:08:08 - INFO - __main__ - Step 30693: {'lr': 0.0001997225772591409, 'samples': 982176, 'steps': 1918, 'loss/train': 0.5135034322738647} -09/20/2021 21:08:09 - INFO - __main__ - Step 30694: {'lr': 0.0001997225772591409, 'samples': 982208, 'steps': 1918, 'loss/train': 3.0222084522247314} -09/20/2021 21:08:10 - INFO - __main__ - Step 30695: {'lr': 0.0001997225772591409, 'samples': 982240, 'steps': 1918, 'loss/train': 2.198411464691162} -09/20/2021 21:08:10 - INFO - __main__ - Step 30696: {'lr': 0.0001997225772591409, 'samples': 982272, 'steps': 1918, 'loss/train': 3.3387279510498047} -09/20/2021 21:08:11 - INFO - __main__ - Step 30697: {'lr': 0.0001997225772591409, 'samples': 982304, 'steps': 1918, 'loss/train': 2.0667619705200195} -09/20/2021 21:08:12 - INFO - __main__ - Step 30698: {'lr': 0.0001997225772591409, 'samples': 982336, 'steps': 1918, 'loss/train': 2.479694366455078} -09/20/2021 21:08:13 - INFO - __main__ - Step 30699: {'lr': 0.0001997225772591409, 'samples': 982368, 'steps': 1918, 'loss/train': 1.3146491050720215} -09/20/2021 21:08:13 - INFO - __main__ - Step 30700: {'lr': 0.0001997225772591409, 'samples': 982400, 'steps': 1918, 'loss/train': 2.198990821838379} -09/20/2021 21:08:14 - INFO - __main__ - Step 30701: {'lr': 0.0001997225772591409, 'samples': 982432, 'steps': 1918, 'loss/train': 3.4402148723602295} -09/20/2021 21:08:15 - INFO - __main__ - Step 30702: {'lr': 0.0001997225772591409, 'samples': 982464, 'steps': 1918, 'loss/train': 2.402599573135376} -09/20/2021 21:08:16 - INFO - __main__ - Step 30703: {'lr': 0.0001997225772591409, 'samples': 982496, 'steps': 1918, 'loss/train': 2.5227653980255127} -09/20/2021 21:08:16 - INFO - __main__ - Step 30704: {'lr': 0.0001997225772591409, 'samples': 982528, 'steps': 1918, 'loss/train': 2.0774593353271484} -09/20/2021 21:08:17 - INFO - __main__ - Step 30705: {'lr': 0.00019972210223708232, 'samples': 982560, 'steps': 1919, 'loss/train': 3.021064281463623} -09/20/2021 21:08:18 - INFO - __main__ - Step 30706: {'lr': 0.00019972210223708232, 'samples': 982592, 'steps': 1919, 'loss/train': 0.9126273989677429} -09/20/2021 21:08:19 - INFO - __main__ - Step 30707: {'lr': 0.00019972210223708232, 'samples': 982624, 'steps': 1919, 'loss/train': 1.6319533586502075} -09/20/2021 21:08:19 - INFO - __main__ - Step 30708: {'lr': 0.00019972210223708232, 'samples': 982656, 'steps': 1919, 'loss/train': 2.508439302444458} -09/20/2021 21:08:20 - INFO - __main__ - Step 30709: {'lr': 0.00019972210223708232, 'samples': 982688, 'steps': 1919, 'loss/train': 2.678326368331909} -09/20/2021 21:08:21 - INFO - __main__ - Step 30710: {'lr': 0.00019972210223708232, 'samples': 982720, 'steps': 1919, 'loss/train': 2.2439630031585693} -09/20/2021 21:08:22 - INFO - __main__ - Step 30711: {'lr': 0.00019972210223708232, 'samples': 982752, 'steps': 1919, 'loss/train': 3.441258192062378} -09/20/2021 21:08:22 - INFO - __main__ - Step 30712: {'lr': 0.00019972210223708232, 'samples': 982784, 'steps': 1919, 'loss/train': 4.295429229736328} -09/20/2021 21:08:23 - INFO - __main__ - Step 30713: {'lr': 0.00019972210223708232, 'samples': 982816, 'steps': 1919, 'loss/train': 3.911468982696533} -09/20/2021 21:08:24 - INFO - __main__ - Step 30714: {'lr': 0.00019972210223708232, 'samples': 982848, 'steps': 1919, 'loss/train': 3.9579591751098633} -09/20/2021 21:08:25 - INFO - __main__ - Step 30715: {'lr': 0.00019972210223708232, 'samples': 982880, 'steps': 1919, 'loss/train': 2.4818832874298096} -09/20/2021 21:08:25 - INFO - __main__ - Step 30716: {'lr': 0.00019972210223708232, 'samples': 982912, 'steps': 1919, 'loss/train': 1.7893598079681396} -09/20/2021 21:08:26 - INFO - __main__ - Step 30717: {'lr': 0.00019972210223708232, 'samples': 982944, 'steps': 1919, 'loss/train': 2.5896823406219482} -09/20/2021 21:08:27 - INFO - __main__ - Step 30718: {'lr': 0.00019972210223708232, 'samples': 982976, 'steps': 1919, 'loss/train': 2.7497060298919678} -09/20/2021 21:08:28 - INFO - __main__ - Step 30719: {'lr': 0.00019972210223708232, 'samples': 983008, 'steps': 1919, 'loss/train': 2.6706125736236572} -09/20/2021 21:08:28 - INFO - __main__ - Step 30720: {'lr': 0.00019972210223708232, 'samples': 983040, 'steps': 1919, 'loss/train': 2.756181240081787} -09/20/2021 21:08:29 - INFO - __main__ - Step 30721: {'lr': 0.00019972162680925487, 'samples': 983072, 'steps': 1920, 'loss/train': 2.5938265323638916} -09/20/2021 21:08:31 - INFO - __main__ - Step 30722: {'lr': 0.00019972162680925487, 'samples': 983104, 'steps': 1920, 'loss/train': 2.4215281009674072} -09/20/2021 21:08:31 - INFO - __main__ - Step 30723: {'lr': 0.00019972162680925487, 'samples': 983136, 'steps': 1920, 'loss/train': 2.4491961002349854} -09/20/2021 21:08:32 - INFO - __main__ - Step 30724: {'lr': 0.00019972162680925487, 'samples': 983168, 'steps': 1920, 'loss/train': 1.9623208045959473} -09/20/2021 21:08:33 - INFO - __main__ - Step 30725: {'lr': 0.00019972162680925487, 'samples': 983200, 'steps': 1920, 'loss/train': 2.1454553604125977} -09/20/2021 21:08:34 - INFO - __main__ - Step 30726: {'lr': 0.00019972162680925487, 'samples': 983232, 'steps': 1920, 'loss/train': 2.9683854579925537} -09/20/2021 21:08:34 - INFO - __main__ - Step 30727: {'lr': 0.00019972162680925487, 'samples': 983264, 'steps': 1920, 'loss/train': 3.3752942085266113} -09/20/2021 21:08:35 - INFO - __main__ - Step 30728: {'lr': 0.00019972162680925487, 'samples': 983296, 'steps': 1920, 'loss/train': 2.586493730545044} -09/20/2021 21:08:36 - INFO - __main__ - Step 30729: {'lr': 0.00019972162680925487, 'samples': 983328, 'steps': 1920, 'loss/train': 0.7070488333702087} -09/20/2021 21:08:37 - INFO - __main__ - Step 30730: {'lr': 0.00019972162680925487, 'samples': 983360, 'steps': 1920, 'loss/train': 2.3238284587860107} -09/20/2021 21:08:37 - INFO - __main__ - Step 30731: {'lr': 0.00019972162680925487, 'samples': 983392, 'steps': 1920, 'loss/train': 2.830781936645508} -09/20/2021 21:08:38 - INFO - __main__ - Step 30732: {'lr': 0.00019972162680925487, 'samples': 983424, 'steps': 1920, 'loss/train': 3.437776565551758} -09/20/2021 21:08:39 - INFO - __main__ - Step 30733: {'lr': 0.00019972162680925487, 'samples': 983456, 'steps': 1920, 'loss/train': 2.2801361083984375} -09/20/2021 21:08:40 - INFO - __main__ - Step 30734: {'lr': 0.00019972162680925487, 'samples': 983488, 'steps': 1920, 'loss/train': 2.770052909851074} -09/20/2021 21:08:40 - INFO - __main__ - Step 30735: {'lr': 0.00019972162680925487, 'samples': 983520, 'steps': 1920, 'loss/train': 2.349008560180664} -09/20/2021 21:08:41 - INFO - __main__ - Step 30736: {'lr': 0.00019972162680925487, 'samples': 983552, 'steps': 1920, 'loss/train': 2.806934356689453} -09/20/2021 21:08:42 - INFO - __main__ - Step 30737: {'lr': 0.00019972115097566053, 'samples': 983584, 'steps': 1921, 'loss/train': 2.9581379890441895} -09/20/2021 21:08:43 - INFO - __main__ - Step 30738: {'lr': 0.00019972115097566053, 'samples': 983616, 'steps': 1921, 'loss/train': 2.588324546813965} -09/20/2021 21:08:44 - INFO - __main__ - Step 30739: {'lr': 0.00019972115097566053, 'samples': 983648, 'steps': 1921, 'loss/train': 2.3554160594940186} -09/20/2021 21:08:44 - INFO - __main__ - Step 30740: {'lr': 0.00019972115097566053, 'samples': 983680, 'steps': 1921, 'loss/train': 2.712367534637451} -09/20/2021 21:08:45 - INFO - __main__ - Step 30741: {'lr': 0.00019972115097566053, 'samples': 983712, 'steps': 1921, 'loss/train': 2.091085195541382} -09/20/2021 21:08:46 - INFO - __main__ - Step 30742: {'lr': 0.00019972115097566053, 'samples': 983744, 'steps': 1921, 'loss/train': 1.5570038557052612} -09/20/2021 21:08:47 - INFO - __main__ - Step 30743: {'lr': 0.00019972115097566053, 'samples': 983776, 'steps': 1921, 'loss/train': 2.380934000015259} -09/20/2021 21:08:47 - INFO - __main__ - Step 30744: {'lr': 0.00019972115097566053, 'samples': 983808, 'steps': 1921, 'loss/train': 2.6885485649108887} -09/20/2021 21:08:48 - INFO - __main__ - Step 30745: {'lr': 0.00019972115097566053, 'samples': 983840, 'steps': 1921, 'loss/train': 2.1751348972320557} -09/20/2021 21:08:49 - INFO - __main__ - Step 30746: {'lr': 0.00019972115097566053, 'samples': 983872, 'steps': 1921, 'loss/train': 1.7736098766326904} -09/20/2021 21:08:50 - INFO - __main__ - Step 30747: {'lr': 0.00019972115097566053, 'samples': 983904, 'steps': 1921, 'loss/train': 1.5843970775604248} -09/20/2021 21:08:50 - INFO - __main__ - Step 30748: {'lr': 0.00019972115097566053, 'samples': 983936, 'steps': 1921, 'loss/train': 1.4523091316223145} -09/20/2021 21:08:51 - INFO - __main__ - Step 30749: {'lr': 0.00019972115097566053, 'samples': 983968, 'steps': 1921, 'loss/train': 1.7197964191436768} -09/20/2021 21:08:52 - INFO - __main__ - Step 30750: {'lr': 0.00019972115097566053, 'samples': 984000, 'steps': 1921, 'loss/train': 2.4589200019836426} -09/20/2021 21:08:53 - INFO - __main__ - Step 30751: {'lr': 0.00019972115097566053, 'samples': 984032, 'steps': 1921, 'loss/train': 2.961395502090454} -09/20/2021 21:08:54 - INFO - __main__ - Step 30752: {'lr': 0.00019972115097566053, 'samples': 984064, 'steps': 1921, 'loss/train': 2.3165829181671143} -09/20/2021 21:08:55 - INFO - __main__ - Step 30753: {'lr': 0.0001997206747363012, 'samples': 984096, 'steps': 1922, 'loss/train': 0.8055421113967896} -09/20/2021 21:08:55 - INFO - __main__ - Step 30754: {'lr': 0.0001997206747363012, 'samples': 984128, 'steps': 1922, 'loss/train': 3.4060873985290527} -09/20/2021 21:08:56 - INFO - __main__ - Step 30755: {'lr': 0.0001997206747363012, 'samples': 984160, 'steps': 1922, 'loss/train': 2.555755138397217} -09/20/2021 21:08:57 - INFO - __main__ - Step 30756: {'lr': 0.0001997206747363012, 'samples': 984192, 'steps': 1922, 'loss/train': 2.745227813720703} -09/20/2021 21:08:58 - INFO - __main__ - Step 30757: {'lr': 0.0001997206747363012, 'samples': 984224, 'steps': 1922, 'loss/train': 2.6179747581481934} -09/20/2021 21:08:58 - INFO - __main__ - Step 30758: {'lr': 0.0001997206747363012, 'samples': 984256, 'steps': 1922, 'loss/train': 2.1155993938446045} -09/20/2021 21:08:59 - INFO - __main__ - Step 30759: {'lr': 0.0001997206747363012, 'samples': 984288, 'steps': 1922, 'loss/train': 1.6834909915924072} -09/20/2021 21:09:00 - INFO - __main__ - Step 30760: {'lr': 0.0001997206747363012, 'samples': 984320, 'steps': 1922, 'loss/train': 2.1240994930267334} -09/20/2021 21:09:01 - INFO - __main__ - Step 30761: {'lr': 0.0001997206747363012, 'samples': 984352, 'steps': 1922, 'loss/train': 2.509599447250366} -09/20/2021 21:09:01 - INFO - __main__ - Step 30762: {'lr': 0.0001997206747363012, 'samples': 984384, 'steps': 1922, 'loss/train': 1.7639391422271729} -09/20/2021 21:09:02 - INFO - __main__ - Step 30763: {'lr': 0.0001997206747363012, 'samples': 984416, 'steps': 1922, 'loss/train': 2.7939298152923584} -09/20/2021 21:09:03 - INFO - __main__ - Step 30764: {'lr': 0.0001997206747363012, 'samples': 984448, 'steps': 1922, 'loss/train': 2.324686288833618} -09/20/2021 21:09:04 - INFO - __main__ - Step 30765: {'lr': 0.0001997206747363012, 'samples': 984480, 'steps': 1922, 'loss/train': 2.2334671020507812} -09/20/2021 21:09:04 - INFO - __main__ - Step 30766: {'lr': 0.0001997206747363012, 'samples': 984512, 'steps': 1922, 'loss/train': 2.0691237449645996} -09/20/2021 21:09:05 - INFO - __main__ - Step 30767: {'lr': 0.0001997206747363012, 'samples': 984544, 'steps': 1922, 'loss/train': 3.440131664276123} -09/20/2021 21:09:06 - INFO - __main__ - Step 30768: {'lr': 0.0001997206747363012, 'samples': 984576, 'steps': 1922, 'loss/train': 2.3086793422698975} -09/20/2021 21:09:07 - INFO - __main__ - Step 30769: {'lr': 0.00019972019809117884, 'samples': 984608, 'steps': 1923, 'loss/train': 3.1540584564208984} -09/20/2021 21:09:08 - INFO - __main__ - Step 30770: {'lr': 0.00019972019809117884, 'samples': 984640, 'steps': 1923, 'loss/train': 2.2634999752044678} -09/20/2021 21:09:08 - INFO - __main__ - Step 30771: {'lr': 0.00019972019809117884, 'samples': 984672, 'steps': 1923, 'loss/train': 2.819556951522827} -09/20/2021 21:09:09 - INFO - __main__ - Step 30772: {'lr': 0.00019972019809117884, 'samples': 984704, 'steps': 1923, 'loss/train': 2.5952553749084473} -09/20/2021 21:09:10 - INFO - __main__ - Step 30773: {'lr': 0.00019972019809117884, 'samples': 984736, 'steps': 1923, 'loss/train': 2.580183267593384} -09/20/2021 21:09:11 - INFO - __main__ - Step 30774: {'lr': 0.00019972019809117884, 'samples': 984768, 'steps': 1923, 'loss/train': 2.123103618621826} -09/20/2021 21:09:11 - INFO - __main__ - Step 30775: {'lr': 0.00019972019809117884, 'samples': 984800, 'steps': 1923, 'loss/train': 2.6489193439483643} -09/20/2021 21:09:12 - INFO - __main__ - Step 30776: {'lr': 0.00019972019809117884, 'samples': 984832, 'steps': 1923, 'loss/train': 3.129589557647705} -09/20/2021 21:09:13 - INFO - __main__ - Step 30777: {'lr': 0.00019972019809117884, 'samples': 984864, 'steps': 1923, 'loss/train': 2.2091288566589355} -09/20/2021 21:09:14 - INFO - __main__ - Step 30778: {'lr': 0.00019972019809117884, 'samples': 984896, 'steps': 1923, 'loss/train': 2.2136640548706055} -09/20/2021 21:09:14 - INFO - __main__ - Step 30779: {'lr': 0.00019972019809117884, 'samples': 984928, 'steps': 1923, 'loss/train': 2.3577077388763428} -09/20/2021 21:09:15 - INFO - __main__ - Step 30780: {'lr': 0.00019972019809117884, 'samples': 984960, 'steps': 1923, 'loss/train': 2.0694429874420166} -09/20/2021 21:09:16 - INFO - __main__ - Step 30781: {'lr': 0.00019972019809117884, 'samples': 984992, 'steps': 1923, 'loss/train': 1.965226411819458} -09/20/2021 21:09:17 - INFO - __main__ - Step 30782: {'lr': 0.00019972019809117884, 'samples': 985024, 'steps': 1923, 'loss/train': 2.6885077953338623} -09/20/2021 21:09:18 - INFO - __main__ - Step 30783: {'lr': 0.00019972019809117884, 'samples': 985056, 'steps': 1923, 'loss/train': 2.335407018661499} -09/20/2021 21:09:19 - INFO - __main__ - Step 30784: {'lr': 0.00019972019809117884, 'samples': 985088, 'steps': 1923, 'loss/train': 1.2160875797271729} -09/20/2021 21:09:19 - INFO - __main__ - Step 30785: {'lr': 0.00019971972104029537, 'samples': 985120, 'steps': 1924, 'loss/train': 2.4282429218292236} -09/20/2021 21:09:20 - INFO - __main__ - Step 30786: {'lr': 0.00019971972104029537, 'samples': 985152, 'steps': 1924, 'loss/train': 2.238656520843506} -09/20/2021 21:09:21 - INFO - __main__ - Step 30787: {'lr': 0.00019971972104029537, 'samples': 985184, 'steps': 1924, 'loss/train': 1.5664608478546143} -09/20/2021 21:09:22 - INFO - __main__ - Step 30788: {'lr': 0.00019971972104029537, 'samples': 985216, 'steps': 1924, 'loss/train': 2.1679744720458984} -09/20/2021 21:09:22 - INFO - __main__ - Step 30789: {'lr': 0.00019971972104029537, 'samples': 985248, 'steps': 1924, 'loss/train': 2.9043385982513428} -09/20/2021 21:09:23 - INFO - __main__ - Step 30790: {'lr': 0.00019971972104029537, 'samples': 985280, 'steps': 1924, 'loss/train': 1.1394530534744263} -09/20/2021 21:09:24 - INFO - __main__ - Step 30791: {'lr': 0.00019971972104029537, 'samples': 985312, 'steps': 1924, 'loss/train': 2.1153512001037598} -09/20/2021 21:09:25 - INFO - __main__ - Step 30792: {'lr': 0.00019971972104029537, 'samples': 985344, 'steps': 1924, 'loss/train': 2.196587562561035} -09/20/2021 21:09:25 - INFO - __main__ - Step 30793: {'lr': 0.00019971972104029537, 'samples': 985376, 'steps': 1924, 'loss/train': 4.210282802581787} -09/20/2021 21:09:26 - INFO - __main__ - Step 30794: {'lr': 0.00019971972104029537, 'samples': 985408, 'steps': 1924, 'loss/train': 3.231879949569702} -09/20/2021 21:09:27 - INFO - __main__ - Step 30795: {'lr': 0.00019971972104029537, 'samples': 985440, 'steps': 1924, 'loss/train': 2.665309190750122} -09/20/2021 21:09:28 - INFO - __main__ - Step 30796: {'lr': 0.00019971972104029537, 'samples': 985472, 'steps': 1924, 'loss/train': 2.3785159587860107} -09/20/2021 21:09:28 - INFO - __main__ - Step 30797: {'lr': 0.00019971972104029537, 'samples': 985504, 'steps': 1924, 'loss/train': 2.021390199661255} -09/20/2021 21:09:29 - INFO - __main__ - Step 30798: {'lr': 0.00019971972104029537, 'samples': 985536, 'steps': 1924, 'loss/train': 3.138002872467041} -09/20/2021 21:09:30 - INFO - __main__ - Step 30799: {'lr': 0.00019971972104029537, 'samples': 985568, 'steps': 1924, 'loss/train': 2.3177480697631836} -09/20/2021 21:09:31 - INFO - __main__ - Step 30800: {'lr': 0.00019971972104029537, 'samples': 985600, 'steps': 1924, 'loss/train': 3.0515074729919434} -09/20/2021 21:09:32 - INFO - __main__ - Step 30801: {'lr': 0.00019971924358365274, 'samples': 985632, 'steps': 1925, 'loss/train': 2.758287191390991} -09/20/2021 21:09:32 - INFO - __main__ - Step 30802: {'lr': 0.00019971924358365274, 'samples': 985664, 'steps': 1925, 'loss/train': 2.2516391277313232} -09/20/2021 21:09:33 - INFO - __main__ - Step 30803: {'lr': 0.00019971924358365274, 'samples': 985696, 'steps': 1925, 'loss/train': 2.6506197452545166} -09/20/2021 21:09:34 - INFO - __main__ - Step 30804: {'lr': 0.00019971924358365274, 'samples': 985728, 'steps': 1925, 'loss/train': 2.3357460498809814} -09/20/2021 21:09:35 - INFO - __main__ - Step 30805: {'lr': 0.00019971924358365274, 'samples': 985760, 'steps': 1925, 'loss/train': 2.7904467582702637} -09/20/2021 21:09:35 - INFO - __main__ - Step 30806: {'lr': 0.00019971924358365274, 'samples': 985792, 'steps': 1925, 'loss/train': 1.9339431524276733} -09/20/2021 21:09:36 - INFO - __main__ - Step 30807: {'lr': 0.00019971924358365274, 'samples': 985824, 'steps': 1925, 'loss/train': 2.520420789718628} -09/20/2021 21:09:37 - INFO - __main__ - Step 30808: {'lr': 0.00019971924358365274, 'samples': 985856, 'steps': 1925, 'loss/train': 2.2773988246917725} -09/20/2021 21:09:38 - INFO - __main__ - Step 30809: {'lr': 0.00019971924358365274, 'samples': 985888, 'steps': 1925, 'loss/train': 1.9503251314163208} -09/20/2021 21:09:38 - INFO - __main__ - Step 30810: {'lr': 0.00019971924358365274, 'samples': 985920, 'steps': 1925, 'loss/train': 2.901238203048706} -09/20/2021 21:09:39 - INFO - __main__ - Step 30811: {'lr': 0.00019971924358365274, 'samples': 985952, 'steps': 1925, 'loss/train': 2.895353317260742} -09/20/2021 21:09:40 - INFO - __main__ - Step 30812: {'lr': 0.00019971924358365274, 'samples': 985984, 'steps': 1925, 'loss/train': 2.6176769733428955} -09/20/2021 21:09:41 - INFO - __main__ - Step 30813: {'lr': 0.00019971924358365274, 'samples': 986016, 'steps': 1925, 'loss/train': 2.626103162765503} -09/20/2021 21:09:42 - INFO - __main__ - Step 30814: {'lr': 0.00019971924358365274, 'samples': 986048, 'steps': 1925, 'loss/train': 1.7378461360931396} -09/20/2021 21:09:43 - INFO - __main__ - Step 30815: {'lr': 0.00019971924358365274, 'samples': 986080, 'steps': 1925, 'loss/train': 2.233924627304077} -09/20/2021 21:09:43 - INFO - __main__ - Step 30816: {'lr': 0.00019971924358365274, 'samples': 986112, 'steps': 1925, 'loss/train': 2.957695245742798} -09/20/2021 21:09:44 - INFO - __main__ - Step 30817: {'lr': 0.0001997187657212529, 'samples': 986144, 'steps': 1926, 'loss/train': 2.4425995349884033} -09/20/2021 21:09:45 - INFO - __main__ - Step 30818: {'lr': 0.0001997187657212529, 'samples': 986176, 'steps': 1926, 'loss/train': 3.022420644760132} -09/20/2021 21:09:46 - INFO - __main__ - Step 30819: {'lr': 0.0001997187657212529, 'samples': 986208, 'steps': 1926, 'loss/train': 2.1409413814544678} -09/20/2021 21:09:47 - INFO - __main__ - Step 30820: {'lr': 0.0001997187657212529, 'samples': 986240, 'steps': 1926, 'loss/train': 2.6427950859069824} -09/20/2021 21:09:47 - INFO - __main__ - Step 30821: {'lr': 0.0001997187657212529, 'samples': 986272, 'steps': 1926, 'loss/train': 2.8535306453704834} -09/20/2021 21:09:48 - INFO - __main__ - Step 30822: {'lr': 0.0001997187657212529, 'samples': 986304, 'steps': 1926, 'loss/train': 3.746152400970459} -09/20/2021 21:09:49 - INFO - __main__ - Step 30823: {'lr': 0.0001997187657212529, 'samples': 986336, 'steps': 1926, 'loss/train': 2.3005847930908203} -09/20/2021 21:09:50 - INFO - __main__ - Step 30824: {'lr': 0.0001997187657212529, 'samples': 986368, 'steps': 1926, 'loss/train': 2.233025550842285} -09/20/2021 21:09:50 - INFO - __main__ - Step 30825: {'lr': 0.0001997187657212529, 'samples': 986400, 'steps': 1926, 'loss/train': 1.9551109075546265} -09/20/2021 21:09:51 - INFO - __main__ - Step 30826: {'lr': 0.0001997187657212529, 'samples': 986432, 'steps': 1926, 'loss/train': 2.045102119445801} -09/20/2021 21:09:52 - INFO - __main__ - Step 30827: {'lr': 0.0001997187657212529, 'samples': 986464, 'steps': 1926, 'loss/train': 0.6285618543624878} -09/20/2021 21:09:53 - INFO - __main__ - Step 30828: {'lr': 0.0001997187657212529, 'samples': 986496, 'steps': 1926, 'loss/train': 1.1730934381484985} -09/20/2021 21:09:53 - INFO - __main__ - Step 30829: {'lr': 0.0001997187657212529, 'samples': 986528, 'steps': 1926, 'loss/train': 1.9015295505523682} -09/20/2021 21:09:54 - INFO - __main__ - Step 30830: {'lr': 0.0001997187657212529, 'samples': 986560, 'steps': 1926, 'loss/train': 1.465632677078247} -09/20/2021 21:09:55 - INFO - __main__ - Step 30831: {'lr': 0.0001997187657212529, 'samples': 986592, 'steps': 1926, 'loss/train': 2.490143299102783} -09/20/2021 21:09:56 - INFO - __main__ - Step 30832: {'lr': 0.0001997187657212529, 'samples': 986624, 'steps': 1926, 'loss/train': 2.181293487548828} -09/20/2021 21:09:56 - INFO - __main__ - Step 30833: {'lr': 0.00019971828745309782, 'samples': 986656, 'steps': 1927, 'loss/train': 2.732335090637207} -09/20/2021 21:09:57 - INFO - __main__ - Step 30834: {'lr': 0.00019971828745309782, 'samples': 986688, 'steps': 1927, 'loss/train': 3.7189371585845947} -09/20/2021 21:09:58 - INFO - __main__ - Step 30835: {'lr': 0.00019971828745309782, 'samples': 986720, 'steps': 1927, 'loss/train': 1.9456053972244263} -09/20/2021 21:09:59 - INFO - __main__ - Step 30836: {'lr': 0.00019971828745309782, 'samples': 986752, 'steps': 1927, 'loss/train': 2.6713433265686035} -09/20/2021 21:09:59 - INFO - __main__ - Step 30837: {'lr': 0.00019971828745309782, 'samples': 986784, 'steps': 1927, 'loss/train': 2.7496814727783203} -09/20/2021 21:10:00 - INFO - __main__ - Step 30838: {'lr': 0.00019971828745309782, 'samples': 986816, 'steps': 1927, 'loss/train': 1.9751936197280884} -09/20/2021 21:10:01 - INFO - __main__ - Step 30839: {'lr': 0.00019971828745309782, 'samples': 986848, 'steps': 1927, 'loss/train': 2.7472176551818848} -09/20/2021 21:10:02 - INFO - __main__ - Step 30840: {'lr': 0.00019971828745309782, 'samples': 986880, 'steps': 1927, 'loss/train': 2.304396629333496} -09/20/2021 21:10:02 - INFO - __main__ - Step 30841: {'lr': 0.00019971828745309782, 'samples': 986912, 'steps': 1927, 'loss/train': 2.880342721939087} -09/20/2021 21:10:03 - INFO - __main__ - Step 30842: {'lr': 0.00019971828745309782, 'samples': 986944, 'steps': 1927, 'loss/train': 0.7473819851875305} -09/20/2021 21:10:04 - INFO - __main__ - Step 30843: {'lr': 0.00019971828745309782, 'samples': 986976, 'steps': 1927, 'loss/train': 0.8198965191841125} -09/20/2021 21:10:05 - INFO - __main__ - Step 30844: {'lr': 0.00019971828745309782, 'samples': 987008, 'steps': 1927, 'loss/train': 1.5751909017562866} -09/20/2021 21:10:07 - INFO - __main__ - Step 30845: {'lr': 0.00019971828745309782, 'samples': 987040, 'steps': 1927, 'loss/train': 2.7175450325012207} -09/20/2021 21:10:07 - INFO - __main__ - Step 30846: {'lr': 0.00019971828745309782, 'samples': 987072, 'steps': 1927, 'loss/train': 2.0668325424194336} -09/20/2021 21:10:08 - INFO - __main__ - Step 30847: {'lr': 0.00019971828745309782, 'samples': 987104, 'steps': 1927, 'loss/train': 2.2172935009002686} -09/20/2021 21:10:09 - INFO - __main__ - Step 30848: {'lr': 0.00019971828745309782, 'samples': 987136, 'steps': 1927, 'loss/train': 1.758872389793396} -09/20/2021 21:10:10 - INFO - __main__ - Step 30849: {'lr': 0.00019971780877918937, 'samples': 987168, 'steps': 1928, 'loss/train': 1.619006633758545} -09/20/2021 21:10:10 - INFO - __main__ - Step 30850: {'lr': 0.00019971780877918937, 'samples': 987200, 'steps': 1928, 'loss/train': 1.4048060178756714} -09/20/2021 21:10:11 - INFO - __main__ - Step 30851: {'lr': 0.00019971780877918937, 'samples': 987232, 'steps': 1928, 'loss/train': 1.6584103107452393} -09/20/2021 21:10:12 - INFO - __main__ - Step 30852: {'lr': 0.00019971780877918937, 'samples': 987264, 'steps': 1928, 'loss/train': 1.86482834815979} -09/20/2021 21:10:13 - INFO - __main__ - Step 30853: {'lr': 0.00019971780877918937, 'samples': 987296, 'steps': 1928, 'loss/train': 1.5620547533035278} -09/20/2021 21:10:13 - INFO - __main__ - Step 30854: {'lr': 0.00019971780877918937, 'samples': 987328, 'steps': 1928, 'loss/train': 3.1619389057159424} -09/20/2021 21:10:14 - INFO - __main__ - Step 30855: {'lr': 0.00019971780877918937, 'samples': 987360, 'steps': 1928, 'loss/train': 3.0589163303375244} -09/20/2021 21:10:15 - INFO - __main__ - Step 30856: {'lr': 0.00019971780877918937, 'samples': 987392, 'steps': 1928, 'loss/train': 1.0344226360321045} -09/20/2021 21:10:16 - INFO - __main__ - Step 30857: {'lr': 0.00019971780877918937, 'samples': 987424, 'steps': 1928, 'loss/train': 2.2354090213775635} -09/20/2021 21:10:16 - INFO - __main__ - Step 30858: {'lr': 0.00019971780877918937, 'samples': 987456, 'steps': 1928, 'loss/train': 3.200565814971924} -09/20/2021 21:10:17 - INFO - __main__ - Step 30859: {'lr': 0.00019971780877918937, 'samples': 987488, 'steps': 1928, 'loss/train': 2.483241558074951} -09/20/2021 21:10:18 - INFO - __main__ - Step 30860: {'lr': 0.00019971780877918937, 'samples': 987520, 'steps': 1928, 'loss/train': 2.001452684402466} -09/20/2021 21:10:19 - INFO - __main__ - Step 30861: {'lr': 0.00019971780877918937, 'samples': 987552, 'steps': 1928, 'loss/train': 2.846938371658325} -09/20/2021 21:10:19 - INFO - __main__ - Step 30862: {'lr': 0.00019971780877918937, 'samples': 987584, 'steps': 1928, 'loss/train': 1.6066030263900757} -09/20/2021 21:10:20 - INFO - __main__ - Step 30863: {'lr': 0.00019971780877918937, 'samples': 987616, 'steps': 1928, 'loss/train': 2.9387598037719727} -09/20/2021 21:10:21 - INFO - __main__ - Step 30864: {'lr': 0.00019971780877918937, 'samples': 987648, 'steps': 1928, 'loss/train': 2.6830430030822754} -09/20/2021 21:10:22 - INFO - __main__ - Step 30865: {'lr': 0.00019971732969952959, 'samples': 987680, 'steps': 1929, 'loss/train': 2.5132052898406982} -09/20/2021 21:10:23 - INFO - __main__ - Step 30866: {'lr': 0.00019971732969952959, 'samples': 987712, 'steps': 1929, 'loss/train': 2.1244168281555176} -09/20/2021 21:10:23 - INFO - __main__ - Step 30867: {'lr': 0.00019971732969952959, 'samples': 987744, 'steps': 1929, 'loss/train': 3.8990418910980225} -09/20/2021 21:10:24 - INFO - __main__ - Step 30868: {'lr': 0.00019971732969952959, 'samples': 987776, 'steps': 1929, 'loss/train': 0.947260320186615} -09/20/2021 21:10:25 - INFO - __main__ - Step 30869: {'lr': 0.00019971732969952959, 'samples': 987808, 'steps': 1929, 'loss/train': 1.0523607730865479} -09/20/2021 21:10:26 - INFO - __main__ - Step 30870: {'lr': 0.00019971732969952959, 'samples': 987840, 'steps': 1929, 'loss/train': 0.9594197273254395} -09/20/2021 21:10:26 - INFO - __main__ - Step 30871: {'lr': 0.00019971732969952959, 'samples': 987872, 'steps': 1929, 'loss/train': 0.8540502190589905} -09/20/2021 21:10:27 - INFO - __main__ - Step 30872: {'lr': 0.00019971732969952959, 'samples': 987904, 'steps': 1929, 'loss/train': 0.7528305649757385} -09/20/2021 21:10:28 - INFO - __main__ - Step 30873: {'lr': 0.00019971732969952959, 'samples': 987936, 'steps': 1929, 'loss/train': 0.9596297144889832} -09/20/2021 21:10:29 - INFO - __main__ - Step 30874: {'lr': 0.00019971732969952959, 'samples': 987968, 'steps': 1929, 'loss/train': 1.055027961730957} -09/20/2021 21:10:29 - INFO - __main__ - Step 30875: {'lr': 0.00019971732969952959, 'samples': 988000, 'steps': 1929, 'loss/train': 1.1312988996505737} -09/20/2021 21:10:30 - INFO - __main__ - Step 30876: {'lr': 0.00019971732969952959, 'samples': 988032, 'steps': 1929, 'loss/train': 0.5344702005386353} -09/20/2021 21:10:31 - INFO - __main__ - Step 30877: {'lr': 0.00019971732969952959, 'samples': 988064, 'steps': 1929, 'loss/train': 3.1220524311065674} -09/20/2021 21:10:32 - INFO - __main__ - Step 30878: {'lr': 0.00019971732969952959, 'samples': 988096, 'steps': 1929, 'loss/train': 2.811399221420288} -09/20/2021 21:10:32 - INFO - __main__ - Step 30879: {'lr': 0.00019971732969952959, 'samples': 988128, 'steps': 1929, 'loss/train': 2.559474468231201} -09/20/2021 21:10:33 - INFO - __main__ - Step 30880: {'lr': 0.00019971732969952959, 'samples': 988160, 'steps': 1929, 'loss/train': 3.035649061203003} -09/20/2021 21:10:34 - INFO - __main__ - Step 30881: {'lr': 0.00019971685021412034, 'samples': 988192, 'steps': 1930, 'loss/train': 2.058840036392212} -09/20/2021 21:10:35 - INFO - __main__ - Step 30882: {'lr': 0.00019971685021412034, 'samples': 988224, 'steps': 1930, 'loss/train': 1.7004547119140625} -09/20/2021 21:10:36 - INFO - __main__ - Step 30883: {'lr': 0.00019971685021412034, 'samples': 988256, 'steps': 1930, 'loss/train': 2.1908698081970215} -09/20/2021 21:10:37 - INFO - __main__ - Step 30884: {'lr': 0.00019971685021412034, 'samples': 988288, 'steps': 1930, 'loss/train': 3.1160428524017334} -09/20/2021 21:10:38 - INFO - __main__ - Step 30885: {'lr': 0.00019971685021412034, 'samples': 988320, 'steps': 1930, 'loss/train': 2.5386741161346436} -09/20/2021 21:10:38 - INFO - __main__ - Step 30886: {'lr': 0.00019971685021412034, 'samples': 988352, 'steps': 1930, 'loss/train': 1.7540555000305176} -09/20/2021 21:10:39 - INFO - __main__ - Step 30887: {'lr': 0.00019971685021412034, 'samples': 988384, 'steps': 1930, 'loss/train': 2.2366905212402344} -09/20/2021 21:10:40 - INFO - __main__ - Step 30888: {'lr': 0.00019971685021412034, 'samples': 988416, 'steps': 1930, 'loss/train': 2.798131227493286} -09/20/2021 21:10:41 - INFO - __main__ - Step 30889: {'lr': 0.00019971685021412034, 'samples': 988448, 'steps': 1930, 'loss/train': 2.2053382396698} -09/20/2021 21:10:41 - INFO - __main__ - Step 30890: {'lr': 0.00019971685021412034, 'samples': 988480, 'steps': 1930, 'loss/train': 3.108405828475952} -09/20/2021 21:10:42 - INFO - __main__ - Step 30891: {'lr': 0.00019971685021412034, 'samples': 988512, 'steps': 1930, 'loss/train': 0.5507237315177917} -09/20/2021 21:10:43 - INFO - __main__ - Step 30892: {'lr': 0.00019971685021412034, 'samples': 988544, 'steps': 1930, 'loss/train': 2.1902239322662354} -09/20/2021 21:10:44 - INFO - __main__ - Step 30893: {'lr': 0.00019971685021412034, 'samples': 988576, 'steps': 1930, 'loss/train': 1.8080785274505615} -09/20/2021 21:10:44 - INFO - __main__ - Step 30894: {'lr': 0.00019971685021412034, 'samples': 988608, 'steps': 1930, 'loss/train': 2.8117496967315674} -09/20/2021 21:10:45 - INFO - __main__ - Step 30895: {'lr': 0.00019971685021412034, 'samples': 988640, 'steps': 1930, 'loss/train': 2.79048490524292} -09/20/2021 21:10:46 - INFO - __main__ - Step 30896: {'lr': 0.00019971685021412034, 'samples': 988672, 'steps': 1930, 'loss/train': 2.1464345455169678} -09/20/2021 21:10:47 - INFO - __main__ - Step 30897: {'lr': 0.00019971637032296363, 'samples': 988704, 'steps': 1931, 'loss/train': 3.662886381149292} -09/20/2021 21:10:48 - INFO - __main__ - Step 30898: {'lr': 0.00019971637032296363, 'samples': 988736, 'steps': 1931, 'loss/train': 2.7698633670806885} -09/20/2021 21:10:48 - INFO - __main__ - Step 30899: {'lr': 0.00019971637032296363, 'samples': 988768, 'steps': 1931, 'loss/train': 2.5805413722991943} -09/20/2021 21:10:49 - INFO - __main__ - Step 30900: {'lr': 0.00019971637032296363, 'samples': 988800, 'steps': 1931, 'loss/train': 2.6210784912109375} -09/20/2021 21:10:50 - INFO - __main__ - Step 30901: {'lr': 0.00019971637032296363, 'samples': 988832, 'steps': 1931, 'loss/train': 2.3759570121765137} -09/20/2021 21:10:51 - INFO - __main__ - Step 30902: {'lr': 0.00019971637032296363, 'samples': 988864, 'steps': 1931, 'loss/train': 1.8451673984527588} -09/20/2021 21:10:51 - INFO - __main__ - Step 30903: {'lr': 0.00019971637032296363, 'samples': 988896, 'steps': 1931, 'loss/train': 2.303609848022461} -09/20/2021 21:10:52 - INFO - __main__ - Step 30904: {'lr': 0.00019971637032296363, 'samples': 988928, 'steps': 1931, 'loss/train': 2.0399742126464844} -09/20/2021 21:10:53 - INFO - __main__ - Step 30905: {'lr': 0.00019971637032296363, 'samples': 988960, 'steps': 1931, 'loss/train': 1.7073532342910767} -09/20/2021 21:10:54 - INFO - __main__ - Step 30906: {'lr': 0.00019971637032296363, 'samples': 988992, 'steps': 1931, 'loss/train': 3.1930840015411377} -09/20/2021 21:10:54 - INFO - __main__ - Step 30907: {'lr': 0.00019971637032296363, 'samples': 989024, 'steps': 1931, 'loss/train': 3.088244915008545} -09/20/2021 21:10:55 - INFO - __main__ - Step 30908: {'lr': 0.00019971637032296363, 'samples': 989056, 'steps': 1931, 'loss/train': 1.2507915496826172} -09/20/2021 21:10:56 - INFO - __main__ - Step 30909: {'lr': 0.00019971637032296363, 'samples': 989088, 'steps': 1931, 'loss/train': 1.5084952116012573} -09/20/2021 21:10:57 - INFO - __main__ - Step 30910: {'lr': 0.00019971637032296363, 'samples': 989120, 'steps': 1931, 'loss/train': 2.4293859004974365} -09/20/2021 21:10:57 - INFO - __main__ - Step 30911: {'lr': 0.00019971637032296363, 'samples': 989152, 'steps': 1931, 'loss/train': 2.788285493850708} -09/20/2021 21:10:58 - INFO - __main__ - Step 30912: {'lr': 0.00019971637032296363, 'samples': 989184, 'steps': 1931, 'loss/train': 3.2940876483917236} -09/20/2021 21:10:59 - INFO - __main__ - Step 30913: {'lr': 0.0001997158900260614, 'samples': 989216, 'steps': 1932, 'loss/train': 3.093031406402588} -09/20/2021 21:11:00 - INFO - __main__ - Step 30914: {'lr': 0.0001997158900260614, 'samples': 989248, 'steps': 1932, 'loss/train': 3.3499817848205566} -09/20/2021 21:11:00 - INFO - __main__ - Step 30915: {'lr': 0.0001997158900260614, 'samples': 989280, 'steps': 1932, 'loss/train': 3.3117237091064453} -09/20/2021 21:11:01 - INFO - __main__ - Step 30916: {'lr': 0.0001997158900260614, 'samples': 989312, 'steps': 1932, 'loss/train': 3.5793521404266357} -09/20/2021 21:11:02 - INFO - __main__ - Step 30917: {'lr': 0.0001997158900260614, 'samples': 989344, 'steps': 1932, 'loss/train': 1.4522905349731445} -09/20/2021 21:11:03 - INFO - __main__ - Step 30918: {'lr': 0.0001997158900260614, 'samples': 989376, 'steps': 1932, 'loss/train': 2.3659963607788086} -09/20/2021 21:11:04 - INFO - __main__ - Step 30919: {'lr': 0.0001997158900260614, 'samples': 989408, 'steps': 1932, 'loss/train': 3.286623954772949} -09/20/2021 21:11:05 - INFO - __main__ - Step 30920: {'lr': 0.0001997158900260614, 'samples': 989440, 'steps': 1932, 'loss/train': 2.204097270965576} -09/20/2021 21:11:05 - INFO - __main__ - Step 30921: {'lr': 0.0001997158900260614, 'samples': 989472, 'steps': 1932, 'loss/train': 2.0894112586975098} -09/20/2021 21:11:06 - INFO - __main__ - Step 30922: {'lr': 0.0001997158900260614, 'samples': 989504, 'steps': 1932, 'loss/train': 0.6664326786994934} -09/20/2021 21:11:07 - INFO - __main__ - Step 30923: {'lr': 0.0001997158900260614, 'samples': 989536, 'steps': 1932, 'loss/train': 2.9888927936553955} -09/20/2021 21:11:08 - INFO - __main__ - Step 30924: {'lr': 0.0001997158900260614, 'samples': 989568, 'steps': 1932, 'loss/train': 1.699535846710205} -09/20/2021 21:11:08 - INFO - __main__ - Step 30925: {'lr': 0.0001997158900260614, 'samples': 989600, 'steps': 1932, 'loss/train': 2.198824644088745} -09/20/2021 21:11:09 - INFO - __main__ - Step 30926: {'lr': 0.0001997158900260614, 'samples': 989632, 'steps': 1932, 'loss/train': 2.4605579376220703} -09/20/2021 21:11:10 - INFO - __main__ - Step 30927: {'lr': 0.0001997158900260614, 'samples': 989664, 'steps': 1932, 'loss/train': 2.094581365585327} -09/20/2021 21:11:11 - INFO - __main__ - Step 30928: {'lr': 0.0001997158900260614, 'samples': 989696, 'steps': 1932, 'loss/train': 3.543668508529663} -09/20/2021 21:11:12 - INFO - __main__ - Step 30929: {'lr': 0.00019971540932341562, 'samples': 989728, 'steps': 1933, 'loss/train': 3.2374179363250732} -09/20/2021 21:11:12 - INFO - __main__ - Step 30930: {'lr': 0.00019971540932341562, 'samples': 989760, 'steps': 1933, 'loss/train': 3.7487645149230957} -09/20/2021 21:11:13 - INFO - __main__ - Step 30931: {'lr': 0.00019971540932341562, 'samples': 989792, 'steps': 1933, 'loss/train': 3.7252326011657715} -09/20/2021 21:11:14 - INFO - __main__ - Step 30932: {'lr': 0.00019971540932341562, 'samples': 989824, 'steps': 1933, 'loss/train': 2.7953200340270996} -09/20/2021 21:11:15 - INFO - __main__ - Step 30933: {'lr': 0.00019971540932341562, 'samples': 989856, 'steps': 1933, 'loss/train': 3.218106746673584} -09/20/2021 21:11:15 - INFO - __main__ - Step 30934: {'lr': 0.00019971540932341562, 'samples': 989888, 'steps': 1933, 'loss/train': 2.170212745666504} -09/20/2021 21:11:16 - INFO - __main__ - Step 30935: {'lr': 0.00019971540932341562, 'samples': 989920, 'steps': 1933, 'loss/train': 2.297475576400757} -09/20/2021 21:11:17 - INFO - __main__ - Step 30936: {'lr': 0.00019971540932341562, 'samples': 989952, 'steps': 1933, 'loss/train': 0.7576940059661865} -09/20/2021 21:11:18 - INFO - __main__ - Step 30937: {'lr': 0.00019971540932341562, 'samples': 989984, 'steps': 1933, 'loss/train': 2.4648611545562744} -09/20/2021 21:11:18 - INFO - __main__ - Step 30938: {'lr': 0.00019971540932341562, 'samples': 990016, 'steps': 1933, 'loss/train': 2.9321272373199463} -09/20/2021 21:11:19 - INFO - __main__ - Step 30939: {'lr': 0.00019971540932341562, 'samples': 990048, 'steps': 1933, 'loss/train': 2.0202531814575195} -09/20/2021 21:11:20 - INFO - __main__ - Step 30940: {'lr': 0.00019971540932341562, 'samples': 990080, 'steps': 1933, 'loss/train': 2.8893961906433105} -09/20/2021 21:11:21 - INFO - __main__ - Step 30941: {'lr': 0.00019971540932341562, 'samples': 990112, 'steps': 1933, 'loss/train': 2.425586700439453} -09/20/2021 21:11:21 - INFO - __main__ - Step 30942: {'lr': 0.00019971540932341562, 'samples': 990144, 'steps': 1933, 'loss/train': 2.0477380752563477} -09/20/2021 21:11:22 - INFO - __main__ - Step 30943: {'lr': 0.00019971540932341562, 'samples': 990176, 'steps': 1933, 'loss/train': 2.355957508087158} -09/20/2021 21:11:23 - INFO - __main__ - Step 30944: {'lr': 0.00019971540932341562, 'samples': 990208, 'steps': 1933, 'loss/train': 0.5893957614898682} -09/20/2021 21:11:24 - INFO - __main__ - Step 30945: {'lr': 0.00019971492821502817, 'samples': 990240, 'steps': 1934, 'loss/train': 2.0483057498931885} -09/20/2021 21:11:24 - INFO - __main__ - Step 30946: {'lr': 0.00019971492821502817, 'samples': 990272, 'steps': 1934, 'loss/train': 1.2587120532989502} -09/20/2021 21:11:25 - INFO - __main__ - Step 30947: {'lr': 0.00019971492821502817, 'samples': 990304, 'steps': 1934, 'loss/train': 1.959261417388916} -09/20/2021 21:11:26 - INFO - __main__ - Step 30948: {'lr': 0.00019971492821502817, 'samples': 990336, 'steps': 1934, 'loss/train': 1.8851580619812012} -09/20/2021 21:11:28 - INFO - __main__ - Step 30949: {'lr': 0.00019971492821502817, 'samples': 990368, 'steps': 1934, 'loss/train': 2.8697359561920166} -09/20/2021 21:11:29 - INFO - __main__ - Step 30950: {'lr': 0.00019971492821502817, 'samples': 990400, 'steps': 1934, 'loss/train': 3.9920945167541504} -09/20/2021 21:11:29 - INFO - __main__ - Step 30951: {'lr': 0.00019971492821502817, 'samples': 990432, 'steps': 1934, 'loss/train': 4.442068576812744} -09/20/2021 21:11:30 - INFO - __main__ - Step 30952: {'lr': 0.00019971492821502817, 'samples': 990464, 'steps': 1934, 'loss/train': 3.938140630722046} -09/20/2021 21:11:31 - INFO - __main__ - Step 30953: {'lr': 0.00019971492821502817, 'samples': 990496, 'steps': 1934, 'loss/train': 1.9667755365371704} -09/20/2021 21:11:32 - INFO - __main__ - Step 30954: {'lr': 0.00019971492821502817, 'samples': 990528, 'steps': 1934, 'loss/train': 0.3326389789581299} -09/20/2021 21:11:32 - INFO - __main__ - Step 30955: {'lr': 0.00019971492821502817, 'samples': 990560, 'steps': 1934, 'loss/train': 0.30386561155319214} -09/20/2021 21:11:33 - INFO - __main__ - Step 30956: {'lr': 0.00019971492821502817, 'samples': 990592, 'steps': 1934, 'loss/train': 0.2648647427558899} -09/20/2021 21:11:34 - INFO - __main__ - Step 30957: {'lr': 0.00019971492821502817, 'samples': 990624, 'steps': 1934, 'loss/train': 0.30388879776000977} -09/20/2021 21:11:35 - INFO - __main__ - Step 30958: {'lr': 0.00019971492821502817, 'samples': 990656, 'steps': 1934, 'loss/train': 1.9316385984420776} -09/20/2021 21:11:35 - INFO - __main__ - Step 30959: {'lr': 0.00019971492821502817, 'samples': 990688, 'steps': 1934, 'loss/train': 1.5679377317428589} -09/20/2021 21:11:36 - INFO - __main__ - Step 30960: {'lr': 0.00019971492821502817, 'samples': 990720, 'steps': 1934, 'loss/train': 2.8143229484558105} -09/20/2021 21:11:37 - INFO - __main__ - Step 30961: {'lr': 0.0001997144467009011, 'samples': 990752, 'steps': 1935, 'loss/train': 2.969228506088257} -09/20/2021 21:11:38 - INFO - __main__ - Step 30962: {'lr': 0.0001997144467009011, 'samples': 990784, 'steps': 1935, 'loss/train': 2.237611770629883} -09/20/2021 21:11:39 - INFO - __main__ - Step 30963: {'lr': 0.0001997144467009011, 'samples': 990816, 'steps': 1935, 'loss/train': 2.7320632934570312} -09/20/2021 21:11:39 - INFO - __main__ - Step 30964: {'lr': 0.0001997144467009011, 'samples': 990848, 'steps': 1935, 'loss/train': 2.584057331085205} -09/20/2021 21:11:40 - INFO - __main__ - Step 30965: {'lr': 0.0001997144467009011, 'samples': 990880, 'steps': 1935, 'loss/train': 2.7251718044281006} -09/20/2021 21:11:41 - INFO - __main__ - Step 30966: {'lr': 0.0001997144467009011, 'samples': 990912, 'steps': 1935, 'loss/train': 3.245007276535034} -09/20/2021 21:11:42 - INFO - __main__ - Step 30967: {'lr': 0.0001997144467009011, 'samples': 990944, 'steps': 1935, 'loss/train': 2.5910420417785645} -09/20/2021 21:11:42 - INFO - __main__ - Step 30968: {'lr': 0.0001997144467009011, 'samples': 990976, 'steps': 1935, 'loss/train': 2.548175573348999} -09/20/2021 21:11:43 - INFO - __main__ - Step 30969: {'lr': 0.0001997144467009011, 'samples': 991008, 'steps': 1935, 'loss/train': 2.0164647102355957} -09/20/2021 21:11:44 - INFO - __main__ - Step 30970: {'lr': 0.0001997144467009011, 'samples': 991040, 'steps': 1935, 'loss/train': 2.0755629539489746} -09/20/2021 21:11:45 - INFO - __main__ - Step 30971: {'lr': 0.0001997144467009011, 'samples': 991072, 'steps': 1935, 'loss/train': 2.879615306854248} -09/20/2021 21:11:45 - INFO - __main__ - Step 30972: {'lr': 0.0001997144467009011, 'samples': 991104, 'steps': 1935, 'loss/train': 2.604095935821533} -09/20/2021 21:11:46 - INFO - __main__ - Step 30973: {'lr': 0.0001997144467009011, 'samples': 991136, 'steps': 1935, 'loss/train': 2.9600133895874023} -09/20/2021 21:11:47 - INFO - __main__ - Step 30974: {'lr': 0.0001997144467009011, 'samples': 991168, 'steps': 1935, 'loss/train': 2.8135340213775635} -09/20/2021 21:11:48 - INFO - __main__ - Step 30975: {'lr': 0.0001997144467009011, 'samples': 991200, 'steps': 1935, 'loss/train': 2.5159709453582764} -09/20/2021 21:11:48 - INFO - __main__ - Step 30976: {'lr': 0.0001997144467009011, 'samples': 991232, 'steps': 1935, 'loss/train': 2.9601845741271973} -09/20/2021 21:11:49 - INFO - __main__ - Step 30977: {'lr': 0.00019971396478103636, 'samples': 991264, 'steps': 1936, 'loss/train': 2.3001134395599365} -09/20/2021 21:11:50 - INFO - __main__ - Step 30978: {'lr': 0.00019971396478103636, 'samples': 991296, 'steps': 1936, 'loss/train': 2.9266326427459717} -09/20/2021 21:11:51 - INFO - __main__ - Step 30979: {'lr': 0.00019971396478103636, 'samples': 991328, 'steps': 1936, 'loss/train': 2.871821403503418} -09/20/2021 21:11:52 - INFO - __main__ - Step 30980: {'lr': 0.00019971396478103636, 'samples': 991360, 'steps': 1936, 'loss/train': 2.3419511318206787} -09/20/2021 21:11:53 - INFO - __main__ - Step 30981: {'lr': 0.00019971396478103636, 'samples': 991392, 'steps': 1936, 'loss/train': 2.2714455127716064} -09/20/2021 21:11:54 - INFO - __main__ - Step 30982: {'lr': 0.00019971396478103636, 'samples': 991424, 'steps': 1936, 'loss/train': 3.513154983520508} -09/20/2021 21:11:54 - INFO - __main__ - Step 30983: {'lr': 0.00019971396478103636, 'samples': 991456, 'steps': 1936, 'loss/train': 2.285860538482666} -09/20/2021 21:11:55 - INFO - __main__ - Step 30984: {'lr': 0.00019971396478103636, 'samples': 991488, 'steps': 1936, 'loss/train': 2.4697153568267822} -09/20/2021 21:11:56 - INFO - __main__ - Step 30985: {'lr': 0.00019971396478103636, 'samples': 991520, 'steps': 1936, 'loss/train': 2.7677159309387207} -09/20/2021 21:11:57 - INFO - __main__ - Step 30986: {'lr': 0.00019971396478103636, 'samples': 991552, 'steps': 1936, 'loss/train': 2.4280471801757812} -09/20/2021 21:11:57 - INFO - __main__ - Step 30987: {'lr': 0.00019971396478103636, 'samples': 991584, 'steps': 1936, 'loss/train': 3.1796839237213135} -09/20/2021 21:11:58 - INFO - __main__ - Step 30988: {'lr': 0.00019971396478103636, 'samples': 991616, 'steps': 1936, 'loss/train': 2.5578250885009766} -09/20/2021 21:11:59 - INFO - __main__ - Step 30989: {'lr': 0.00019971396478103636, 'samples': 991648, 'steps': 1936, 'loss/train': 3.2776615619659424} -09/20/2021 21:12:00 - INFO - __main__ - Step 30990: {'lr': 0.00019971396478103636, 'samples': 991680, 'steps': 1936, 'loss/train': 3.1254615783691406} -09/20/2021 21:12:00 - INFO - __main__ - Step 30991: {'lr': 0.00019971396478103636, 'samples': 991712, 'steps': 1936, 'loss/train': 2.3312478065490723} -09/20/2021 21:12:01 - INFO - __main__ - Step 30992: {'lr': 0.00019971396478103636, 'samples': 991744, 'steps': 1936, 'loss/train': 3.134772539138794} -09/20/2021 21:12:02 - INFO - __main__ - Step 30993: {'lr': 0.0001997134824554358, 'samples': 991776, 'steps': 1937, 'loss/train': 3.02497935295105} -09/20/2021 21:12:03 - INFO - __main__ - Step 30994: {'lr': 0.0001997134824554358, 'samples': 991808, 'steps': 1937, 'loss/train': 2.2158772945404053} -09/20/2021 21:12:03 - INFO - __main__ - Step 30995: {'lr': 0.0001997134824554358, 'samples': 991840, 'steps': 1937, 'loss/train': 3.0463016033172607} -09/20/2021 21:12:04 - INFO - __main__ - Step 30996: {'lr': 0.0001997134824554358, 'samples': 991872, 'steps': 1937, 'loss/train': 2.675612449645996} -09/20/2021 21:12:05 - INFO - __main__ - Step 30997: {'lr': 0.0001997134824554358, 'samples': 991904, 'steps': 1937, 'loss/train': 1.548485517501831} -09/20/2021 21:12:06 - INFO - __main__ - Step 30998: {'lr': 0.0001997134824554358, 'samples': 991936, 'steps': 1937, 'loss/train': 4.160103797912598} -09/20/2021 21:12:06 - INFO - __main__ - Step 30999: {'lr': 0.0001997134824554358, 'samples': 991968, 'steps': 1937, 'loss/train': 3.1810855865478516} -09/20/2021 21:12:07 - INFO - __main__ - Step 31000: {'lr': 0.0001997134824554358, 'samples': 992000, 'steps': 1937, 'loss/train': 1.8667277097702026} -09/20/2021 21:12:08 - INFO - __main__ - Step 31001: {'lr': 0.0001997134824554358, 'samples': 992032, 'steps': 1937, 'loss/train': 2.602792739868164} -09/20/2021 21:12:09 - INFO - __main__ - Step 31002: {'lr': 0.0001997134824554358, 'samples': 992064, 'steps': 1937, 'loss/train': 3.0463078022003174} -09/20/2021 21:12:09 - INFO - __main__ - Step 31003: {'lr': 0.0001997134824554358, 'samples': 992096, 'steps': 1937, 'loss/train': 3.1729440689086914} -09/20/2021 21:12:10 - INFO - __main__ - Step 31004: {'lr': 0.0001997134824554358, 'samples': 992128, 'steps': 1937, 'loss/train': 2.320730209350586} -09/20/2021 21:12:11 - INFO - __main__ - Step 31005: {'lr': 0.0001997134824554358, 'samples': 992160, 'steps': 1937, 'loss/train': 2.1485369205474854} -09/20/2021 21:12:12 - INFO - __main__ - Step 31006: {'lr': 0.0001997134824554358, 'samples': 992192, 'steps': 1937, 'loss/train': 2.8360884189605713} -09/20/2021 21:12:12 - INFO - __main__ - Step 31007: {'lr': 0.0001997134824554358, 'samples': 992224, 'steps': 1937, 'loss/train': 1.5655170679092407} -09/20/2021 21:12:13 - INFO - __main__ - Step 31008: {'lr': 0.0001997134824554358, 'samples': 992256, 'steps': 1937, 'loss/train': 2.2781713008880615} -09/20/2021 21:12:14 - INFO - __main__ - Step 31009: {'lr': 0.00019971299972410155, 'samples': 992288, 'steps': 1938, 'loss/train': 1.3680059909820557} -09/20/2021 21:12:16 - INFO - __main__ - Step 31010: {'lr': 0.00019971299972410155, 'samples': 992320, 'steps': 1938, 'loss/train': 2.0249407291412354} -09/20/2021 21:12:16 - INFO - __main__ - Step 31011: {'lr': 0.00019971299972410155, 'samples': 992352, 'steps': 1938, 'loss/train': 2.2648682594299316} -09/20/2021 21:12:17 - INFO - __main__ - Step 31012: {'lr': 0.00019971299972410155, 'samples': 992384, 'steps': 1938, 'loss/train': 2.5766730308532715} -09/20/2021 21:12:18 - INFO - __main__ - Step 31013: {'lr': 0.00019971299972410155, 'samples': 992416, 'steps': 1938, 'loss/train': 2.3699376583099365} -09/20/2021 21:12:19 - INFO - __main__ - Step 31014: {'lr': 0.00019971299972410155, 'samples': 992448, 'steps': 1938, 'loss/train': 1.6242715120315552} -09/20/2021 21:12:19 - INFO - __main__ - Step 31015: {'lr': 0.00019971299972410155, 'samples': 992480, 'steps': 1938, 'loss/train': 2.220902919769287} -09/20/2021 21:12:20 - INFO - __main__ - Step 31016: {'lr': 0.00019971299972410155, 'samples': 992512, 'steps': 1938, 'loss/train': 2.0473766326904297} -09/20/2021 21:12:21 - INFO - __main__ - Step 31017: {'lr': 0.00019971299972410155, 'samples': 992544, 'steps': 1938, 'loss/train': 2.7235262393951416} -09/20/2021 21:12:22 - INFO - __main__ - Step 31018: {'lr': 0.00019971299972410155, 'samples': 992576, 'steps': 1938, 'loss/train': 2.6364269256591797} -09/20/2021 21:12:22 - INFO - __main__ - Step 31019: {'lr': 0.00019971299972410155, 'samples': 992608, 'steps': 1938, 'loss/train': 2.6953952312469482} -09/20/2021 21:12:23 - INFO - __main__ - Step 31020: {'lr': 0.00019971299972410155, 'samples': 992640, 'steps': 1938, 'loss/train': 3.3899788856506348} -09/20/2021 21:12:24 - INFO - __main__ - Step 31021: {'lr': 0.00019971299972410155, 'samples': 992672, 'steps': 1938, 'loss/train': 2.3673489093780518} -09/20/2021 21:12:25 - INFO - __main__ - Step 31022: {'lr': 0.00019971299972410155, 'samples': 992704, 'steps': 1938, 'loss/train': 2.0113718509674072} -09/20/2021 21:12:25 - INFO - __main__ - Step 31023: {'lr': 0.00019971299972410155, 'samples': 992736, 'steps': 1938, 'loss/train': 0.8425117135047913} -09/20/2021 21:12:26 - INFO - __main__ - Step 31024: {'lr': 0.00019971299972410155, 'samples': 992768, 'steps': 1938, 'loss/train': 3.048915386199951} -09/20/2021 21:12:27 - INFO - __main__ - Step 31025: {'lr': 0.00019971251658703547, 'samples': 992800, 'steps': 1939, 'loss/train': 3.2735369205474854} -09/20/2021 21:12:28 - INFO - __main__ - Step 31026: {'lr': 0.00019971251658703547, 'samples': 992832, 'steps': 1939, 'loss/train': 0.8182510137557983} -09/20/2021 21:12:28 - INFO - __main__ - Step 31027: {'lr': 0.00019971251658703547, 'samples': 992864, 'steps': 1939, 'loss/train': 0.3249647617340088} -09/20/2021 21:12:29 - INFO - __main__ - Step 31028: {'lr': 0.00019971251658703547, 'samples': 992896, 'steps': 1939, 'loss/train': 0.40768253803253174} -09/20/2021 21:12:30 - INFO - __main__ - Step 31029: {'lr': 0.00019971251658703547, 'samples': 992928, 'steps': 1939, 'loss/train': 0.2339787483215332} -09/20/2021 21:12:31 - INFO - __main__ - Step 31030: {'lr': 0.00019971251658703547, 'samples': 992960, 'steps': 1939, 'loss/train': 0.5608299970626831} -09/20/2021 21:12:31 - INFO - __main__ - Step 31031: {'lr': 0.00019971251658703547, 'samples': 992992, 'steps': 1939, 'loss/train': 2.373699426651001} -09/20/2021 21:12:32 - INFO - __main__ - Step 31032: {'lr': 0.00019971251658703547, 'samples': 993024, 'steps': 1939, 'loss/train': 2.3589742183685303} -09/20/2021 21:12:33 - INFO - __main__ - Step 31033: {'lr': 0.00019971251658703547, 'samples': 993056, 'steps': 1939, 'loss/train': 0.5536507964134216} -09/20/2021 21:12:34 - INFO - __main__ - Step 31034: {'lr': 0.00019971251658703547, 'samples': 993088, 'steps': 1939, 'loss/train': 3.115201234817505} -09/20/2021 21:12:34 - INFO - __main__ - Step 31035: {'lr': 0.00019971251658703547, 'samples': 993120, 'steps': 1939, 'loss/train': 2.7908952236175537} -09/20/2021 21:12:35 - INFO - __main__ - Step 31036: {'lr': 0.00019971251658703547, 'samples': 993152, 'steps': 1939, 'loss/train': 1.8466054201126099} -09/20/2021 21:12:36 - INFO - __main__ - Step 31037: {'lr': 0.00019971251658703547, 'samples': 993184, 'steps': 1939, 'loss/train': 1.9384479522705078} -09/20/2021 21:12:37 - INFO - __main__ - Step 31038: {'lr': 0.00019971251658703547, 'samples': 993216, 'steps': 1939, 'loss/train': 1.7058827877044678} -09/20/2021 21:12:37 - INFO - __main__ - Step 31039: {'lr': 0.00019971251658703547, 'samples': 993248, 'steps': 1939, 'loss/train': 1.5668559074401855} -09/20/2021 21:12:38 - INFO - __main__ - Step 31040: {'lr': 0.00019971251658703547, 'samples': 993280, 'steps': 1939, 'loss/train': 1.8014719486236572} -09/20/2021 21:12:40 - INFO - __main__ - Step 31041: {'lr': 0.00019971203304423952, 'samples': 993312, 'steps': 1940, 'loss/train': 2.3537909984588623} -09/20/2021 21:12:40 - INFO - __main__ - Step 31042: {'lr': 0.00019971203304423952, 'samples': 993344, 'steps': 1940, 'loss/train': 2.7926299571990967} -09/20/2021 21:12:41 - INFO - __main__ - Step 31043: {'lr': 0.00019971203304423952, 'samples': 993376, 'steps': 1940, 'loss/train': 2.7381656169891357} -09/20/2021 21:12:42 - INFO - __main__ - Step 31044: {'lr': 0.00019971203304423952, 'samples': 993408, 'steps': 1940, 'loss/train': 2.627230405807495} -09/20/2021 21:12:43 - INFO - __main__ - Step 31045: {'lr': 0.00019971203304423952, 'samples': 993440, 'steps': 1940, 'loss/train': 1.4098104238510132} -09/20/2021 21:12:43 - INFO - __main__ - Step 31046: {'lr': 0.00019971203304423952, 'samples': 993472, 'steps': 1940, 'loss/train': 2.4891562461853027} -09/20/2021 21:12:44 - INFO - __main__ - Step 31047: {'lr': 0.00019971203304423952, 'samples': 993504, 'steps': 1940, 'loss/train': 2.420203447341919} -09/20/2021 21:12:45 - INFO - __main__ - Step 31048: {'lr': 0.00019971203304423952, 'samples': 993536, 'steps': 1940, 'loss/train': 1.953550934791565} -09/20/2021 21:12:46 - INFO - __main__ - Step 31049: {'lr': 0.00019971203304423952, 'samples': 993568, 'steps': 1940, 'loss/train': 2.6094346046447754} -09/20/2021 21:12:46 - INFO - __main__ - Step 31050: {'lr': 0.00019971203304423952, 'samples': 993600, 'steps': 1940, 'loss/train': 2.9907984733581543} -09/20/2021 21:12:47 - INFO - __main__ - Step 31051: {'lr': 0.00019971203304423952, 'samples': 993632, 'steps': 1940, 'loss/train': 2.5327186584472656} -09/20/2021 21:12:48 - INFO - __main__ - Step 31052: {'lr': 0.00019971203304423952, 'samples': 993664, 'steps': 1940, 'loss/train': 1.7711822986602783} -09/20/2021 21:12:49 - INFO - __main__ - Step 31053: {'lr': 0.00019971203304423952, 'samples': 993696, 'steps': 1940, 'loss/train': 2.990996837615967} -09/20/2021 21:12:49 - INFO - __main__ - Step 31054: {'lr': 0.00019971203304423952, 'samples': 993728, 'steps': 1940, 'loss/train': 2.241251230239868} -09/20/2021 21:12:50 - INFO - __main__ - Step 31055: {'lr': 0.00019971203304423952, 'samples': 993760, 'steps': 1940, 'loss/train': 2.491398811340332} -09/20/2021 21:12:51 - INFO - __main__ - Step 31056: {'lr': 0.00019971203304423952, 'samples': 993792, 'steps': 1940, 'loss/train': 2.588251829147339} -09/20/2021 21:12:52 - INFO - __main__ - Step 31057: {'lr': 0.0001997115490957157, 'samples': 993824, 'steps': 1941, 'loss/train': 2.514486074447632} -09/20/2021 21:12:53 - INFO - __main__ - Step 31058: {'lr': 0.0001997115490957157, 'samples': 993856, 'steps': 1941, 'loss/train': 1.674021601676941} -09/20/2021 21:12:53 - INFO - __main__ - Step 31059: {'lr': 0.0001997115490957157, 'samples': 993888, 'steps': 1941, 'loss/train': 2.1803910732269287} -09/20/2021 21:12:54 - INFO - __main__ - Step 31060: {'lr': 0.0001997115490957157, 'samples': 993920, 'steps': 1941, 'loss/train': 2.3241653442382812} -09/20/2021 21:12:55 - INFO - __main__ - Step 31061: {'lr': 0.0001997115490957157, 'samples': 993952, 'steps': 1941, 'loss/train': 2.683908462524414} -09/20/2021 21:12:56 - INFO - __main__ - Step 31062: {'lr': 0.0001997115490957157, 'samples': 993984, 'steps': 1941, 'loss/train': 1.2516709566116333} -09/20/2021 21:12:56 - INFO - __main__ - Step 31063: {'lr': 0.0001997115490957157, 'samples': 994016, 'steps': 1941, 'loss/train': 2.2096128463745117} -09/20/2021 21:12:57 - INFO - __main__ - Step 31064: {'lr': 0.0001997115490957157, 'samples': 994048, 'steps': 1941, 'loss/train': 3.225700855255127} -09/20/2021 21:12:58 - INFO - __main__ - Step 31065: {'lr': 0.0001997115490957157, 'samples': 994080, 'steps': 1941, 'loss/train': 2.472932815551758} -09/20/2021 21:12:59 - INFO - __main__ - Step 31066: {'lr': 0.0001997115490957157, 'samples': 994112, 'steps': 1941, 'loss/train': 2.21529483795166} -09/20/2021 21:12:59 - INFO - __main__ - Step 31067: {'lr': 0.0001997115490957157, 'samples': 994144, 'steps': 1941, 'loss/train': 2.451467275619507} -09/20/2021 21:13:00 - INFO - __main__ - Step 31068: {'lr': 0.0001997115490957157, 'samples': 994176, 'steps': 1941, 'loss/train': 2.048361301422119} -09/20/2021 21:13:01 - INFO - __main__ - Step 31069: {'lr': 0.0001997115490957157, 'samples': 994208, 'steps': 1941, 'loss/train': 1.9455337524414062} -09/20/2021 21:13:02 - INFO - __main__ - Step 31070: {'lr': 0.0001997115490957157, 'samples': 994240, 'steps': 1941, 'loss/train': 2.0577661991119385} -09/20/2021 21:13:03 - INFO - __main__ - Step 31071: {'lr': 0.0001997115490957157, 'samples': 994272, 'steps': 1941, 'loss/train': 2.21043062210083} -09/20/2021 21:13:04 - INFO - __main__ - Step 31072: {'lr': 0.0001997115490957157, 'samples': 994304, 'steps': 1941, 'loss/train': 2.6106419563293457} -09/20/2021 21:13:05 - INFO - __main__ - Step 31073: {'lr': 0.00019971106474146603, 'samples': 994336, 'steps': 1942, 'loss/train': 2.737011432647705} -09/20/2021 21:13:05 - INFO - __main__ - Step 31074: {'lr': 0.00019971106474146603, 'samples': 994368, 'steps': 1942, 'loss/train': 1.4737013578414917} -09/20/2021 21:13:06 - INFO - __main__ - Step 31075: {'lr': 0.00019971106474146603, 'samples': 994400, 'steps': 1942, 'loss/train': 2.3178038597106934} -09/20/2021 21:13:07 - INFO - __main__ - Step 31076: {'lr': 0.00019971106474146603, 'samples': 994432, 'steps': 1942, 'loss/train': 2.6224541664123535} -09/20/2021 21:13:08 - INFO - __main__ - Step 31077: {'lr': 0.00019971106474146603, 'samples': 994464, 'steps': 1942, 'loss/train': 2.9801363945007324} -09/20/2021 21:13:08 - INFO - __main__ - Step 31078: {'lr': 0.00019971106474146603, 'samples': 994496, 'steps': 1942, 'loss/train': 2.689513683319092} -09/20/2021 21:13:09 - INFO - __main__ - Step 31079: {'lr': 0.00019971106474146603, 'samples': 994528, 'steps': 1942, 'loss/train': 2.974066972732544} -09/20/2021 21:13:10 - INFO - __main__ - Step 31080: {'lr': 0.00019971106474146603, 'samples': 994560, 'steps': 1942, 'loss/train': 1.7042135000228882} -09/20/2021 21:13:11 - INFO - __main__ - Step 31081: {'lr': 0.00019971106474146603, 'samples': 994592, 'steps': 1942, 'loss/train': 2.6028785705566406} -09/20/2021 21:13:11 - INFO - __main__ - Step 31082: {'lr': 0.00019971106474146603, 'samples': 994624, 'steps': 1942, 'loss/train': 3.0996549129486084} -09/20/2021 21:13:12 - INFO - __main__ - Step 31083: {'lr': 0.00019971106474146603, 'samples': 994656, 'steps': 1942, 'loss/train': 2.224539279937744} -09/20/2021 21:13:13 - INFO - __main__ - Step 31084: {'lr': 0.00019971106474146603, 'samples': 994688, 'steps': 1942, 'loss/train': 3.0497353076934814} -09/20/2021 21:13:14 - INFO - __main__ - Step 31085: {'lr': 0.00019971106474146603, 'samples': 994720, 'steps': 1942, 'loss/train': 2.932102918624878} -09/20/2021 21:13:14 - INFO - __main__ - Step 31086: {'lr': 0.00019971106474146603, 'samples': 994752, 'steps': 1942, 'loss/train': 3.1337265968322754} -09/20/2021 21:13:15 - INFO - __main__ - Step 31087: {'lr': 0.00019971106474146603, 'samples': 994784, 'steps': 1942, 'loss/train': 1.8328012228012085} -09/20/2021 21:13:16 - INFO - __main__ - Step 31088: {'lr': 0.00019971106474146603, 'samples': 994816, 'steps': 1942, 'loss/train': 2.361567258834839} -09/20/2021 21:13:17 - INFO - __main__ - Step 31089: {'lr': 0.00019971057998149235, 'samples': 994848, 'steps': 1943, 'loss/train': 2.182497501373291} -09/20/2021 21:13:17 - INFO - __main__ - Step 31090: {'lr': 0.00019971057998149235, 'samples': 994880, 'steps': 1943, 'loss/train': 2.4574708938598633} -09/20/2021 21:13:18 - INFO - __main__ - Step 31091: {'lr': 0.00019971057998149235, 'samples': 994912, 'steps': 1943, 'loss/train': 2.6985270977020264} -09/20/2021 21:13:19 - INFO - __main__ - Step 31092: {'lr': 0.00019971057998149235, 'samples': 994944, 'steps': 1943, 'loss/train': 3.2045295238494873} -09/20/2021 21:13:20 - INFO - __main__ - Step 31093: {'lr': 0.00019971057998149235, 'samples': 994976, 'steps': 1943, 'loss/train': 2.5067172050476074} -09/20/2021 21:13:20 - INFO - __main__ - Step 31094: {'lr': 0.00019971057998149235, 'samples': 995008, 'steps': 1943, 'loss/train': 3.488136053085327} -09/20/2021 21:13:21 - INFO - __main__ - Step 31095: {'lr': 0.00019971057998149235, 'samples': 995040, 'steps': 1943, 'loss/train': 2.567697286605835} -09/20/2021 21:13:22 - INFO - __main__ - Step 31096: {'lr': 0.00019971057998149235, 'samples': 995072, 'steps': 1943, 'loss/train': 2.4145610332489014} -09/20/2021 21:13:23 - INFO - __main__ - Step 31097: {'lr': 0.00019971057998149235, 'samples': 995104, 'steps': 1943, 'loss/train': 2.3718042373657227} -09/20/2021 21:13:23 - INFO - __main__ - Step 31098: {'lr': 0.00019971057998149235, 'samples': 995136, 'steps': 1943, 'loss/train': 2.7654483318328857} -09/20/2021 21:13:24 - INFO - __main__ - Step 31099: {'lr': 0.00019971057998149235, 'samples': 995168, 'steps': 1943, 'loss/train': 1.8646588325500488} -09/20/2021 21:13:25 - INFO - __main__ - Step 31100: {'lr': 0.00019971057998149235, 'samples': 995200, 'steps': 1943, 'loss/train': 1.9947271347045898} -09/20/2021 21:13:26 - INFO - __main__ - Step 31101: {'lr': 0.00019971057998149235, 'samples': 995232, 'steps': 1943, 'loss/train': 2.67555570602417} -09/20/2021 21:13:27 - INFO - __main__ - Step 31102: {'lr': 0.00019971057998149235, 'samples': 995264, 'steps': 1943, 'loss/train': 2.174506425857544} -09/20/2021 21:13:28 - INFO - __main__ - Step 31103: {'lr': 0.00019971057998149235, 'samples': 995296, 'steps': 1943, 'loss/train': 3.3837344646453857} -09/20/2021 21:13:29 - INFO - __main__ - Step 31104: {'lr': 0.00019971057998149235, 'samples': 995328, 'steps': 1943, 'loss/train': 2.552363872528076} -09/20/2021 21:13:29 - INFO - __main__ - Step 31105: {'lr': 0.00019971009481579673, 'samples': 995360, 'steps': 1944, 'loss/train': 2.8794147968292236} -09/20/2021 21:13:30 - INFO - __main__ - Step 31106: {'lr': 0.00019971009481579673, 'samples': 995392, 'steps': 1944, 'loss/train': 2.5512619018554688} -09/20/2021 21:13:31 - INFO - __main__ - Step 31107: {'lr': 0.00019971009481579673, 'samples': 995424, 'steps': 1944, 'loss/train': 2.3061323165893555} -09/20/2021 21:13:32 - INFO - __main__ - Step 31108: {'lr': 0.00019971009481579673, 'samples': 995456, 'steps': 1944, 'loss/train': 2.8037261962890625} -09/20/2021 21:13:32 - INFO - __main__ - Step 31109: {'lr': 0.00019971009481579673, 'samples': 995488, 'steps': 1944, 'loss/train': 2.298370361328125} -09/20/2021 21:13:33 - INFO - __main__ - Step 31110: {'lr': 0.00019971009481579673, 'samples': 995520, 'steps': 1944, 'loss/train': 1.8083088397979736} -09/20/2021 21:13:34 - INFO - __main__ - Step 31111: {'lr': 0.00019971009481579673, 'samples': 995552, 'steps': 1944, 'loss/train': 1.3587794303894043} -09/20/2021 21:13:35 - INFO - __main__ - Step 31112: {'lr': 0.00019971009481579673, 'samples': 995584, 'steps': 1944, 'loss/train': 0.41277825832366943} -09/20/2021 21:13:35 - INFO - __main__ - Step 31113: {'lr': 0.00019971009481579673, 'samples': 995616, 'steps': 1944, 'loss/train': 0.7543125152587891} -09/20/2021 21:13:36 - INFO - __main__ - Step 31114: {'lr': 0.00019971009481579673, 'samples': 995648, 'steps': 1944, 'loss/train': 0.26888182759284973} -09/20/2021 21:13:37 - INFO - __main__ - Step 31115: {'lr': 0.00019971009481579673, 'samples': 995680, 'steps': 1944, 'loss/train': 0.34989187121391296} -09/20/2021 21:13:38 - INFO - __main__ - Step 31116: {'lr': 0.00019971009481579673, 'samples': 995712, 'steps': 1944, 'loss/train': 3.1438944339752197} -09/20/2021 21:13:38 - INFO - __main__ - Step 31117: {'lr': 0.00019971009481579673, 'samples': 995744, 'steps': 1944, 'loss/train': 1.8312976360321045} -09/20/2021 21:13:39 - INFO - __main__ - Step 31118: {'lr': 0.00019971009481579673, 'samples': 995776, 'steps': 1944, 'loss/train': 1.9408546686172485} -09/20/2021 21:13:40 - INFO - __main__ - Step 31119: {'lr': 0.00019971009481579673, 'samples': 995808, 'steps': 1944, 'loss/train': 2.142826795578003} -09/20/2021 21:13:41 - INFO - __main__ - Step 31120: {'lr': 0.00019971009481579673, 'samples': 995840, 'steps': 1944, 'loss/train': 1.706496238708496} -09/20/2021 21:13:42 - INFO - __main__ - Step 31121: {'lr': 0.00019970960924438116, 'samples': 995872, 'steps': 1945, 'loss/train': 2.7179739475250244} -09/20/2021 21:13:42 - INFO - __main__ - Step 31122: {'lr': 0.00019970960924438116, 'samples': 995904, 'steps': 1945, 'loss/train': 2.877786636352539} -09/20/2021 21:13:43 - INFO - __main__ - Step 31123: {'lr': 0.00019970960924438116, 'samples': 995936, 'steps': 1945, 'loss/train': 3.0700697898864746} -09/20/2021 21:13:44 - INFO - __main__ - Step 31124: {'lr': 0.00019970960924438116, 'samples': 995968, 'steps': 1945, 'loss/train': 2.7097225189208984} -09/20/2021 21:13:45 - INFO - __main__ - Step 31125: {'lr': 0.00019970960924438116, 'samples': 996000, 'steps': 1945, 'loss/train': 2.6699936389923096} -09/20/2021 21:13:45 - INFO - __main__ - Step 31126: {'lr': 0.00019970960924438116, 'samples': 996032, 'steps': 1945, 'loss/train': 2.159541606903076} -09/20/2021 21:13:46 - INFO - __main__ - Step 31127: {'lr': 0.00019970960924438116, 'samples': 996064, 'steps': 1945, 'loss/train': 2.626997709274292} -09/20/2021 21:13:47 - INFO - __main__ - Step 31128: {'lr': 0.00019970960924438116, 'samples': 996096, 'steps': 1945, 'loss/train': 2.7546494007110596} -09/20/2021 21:13:48 - INFO - __main__ - Step 31129: {'lr': 0.00019970960924438116, 'samples': 996128, 'steps': 1945, 'loss/train': 2.3451058864593506} -09/20/2021 21:13:48 - INFO - __main__ - Step 31130: {'lr': 0.00019970960924438116, 'samples': 996160, 'steps': 1945, 'loss/train': 2.288825273513794} -09/20/2021 21:13:49 - INFO - __main__ - Step 31131: {'lr': 0.00019970960924438116, 'samples': 996192, 'steps': 1945, 'loss/train': 3.250594139099121} -09/20/2021 21:13:50 - INFO - __main__ - Step 31132: {'lr': 0.00019970960924438116, 'samples': 996224, 'steps': 1945, 'loss/train': 2.7413649559020996} -09/20/2021 21:13:51 - INFO - __main__ - Step 31133: {'lr': 0.00019970960924438116, 'samples': 996256, 'steps': 1945, 'loss/train': 2.4360194206237793} -09/20/2021 21:13:52 - INFO - __main__ - Step 31134: {'lr': 0.00019970960924438116, 'samples': 996288, 'steps': 1945, 'loss/train': 2.412348985671997} -09/20/2021 21:13:53 - INFO - __main__ - Step 31135: {'lr': 0.00019970960924438116, 'samples': 996320, 'steps': 1945, 'loss/train': 2.995877742767334} -09/20/2021 21:13:53 - INFO - __main__ - Step 31136: {'lr': 0.00019970960924438116, 'samples': 996352, 'steps': 1945, 'loss/train': 2.0223021507263184} -09/20/2021 21:13:54 - INFO - __main__ - Step 31137: {'lr': 0.00019970912326724755, 'samples': 996384, 'steps': 1946, 'loss/train': 1.4819632768630981} -09/20/2021 21:13:55 - INFO - __main__ - Step 31138: {'lr': 0.00019970912326724755, 'samples': 996416, 'steps': 1946, 'loss/train': 2.131706714630127} -09/20/2021 21:13:56 - INFO - __main__ - Step 31139: {'lr': 0.00019970912326724755, 'samples': 996448, 'steps': 1946, 'loss/train': 2.2028486728668213} -09/20/2021 21:13:56 - INFO - __main__ - Step 31140: {'lr': 0.00019970912326724755, 'samples': 996480, 'steps': 1946, 'loss/train': 2.7519569396972656} -09/20/2021 21:13:57 - INFO - __main__ - Step 31141: {'lr': 0.00019970912326724755, 'samples': 996512, 'steps': 1946, 'loss/train': 2.992426872253418} -09/20/2021 21:13:58 - INFO - __main__ - Step 31142: {'lr': 0.00019970912326724755, 'samples': 996544, 'steps': 1946, 'loss/train': 2.8652658462524414} -09/20/2021 21:13:59 - INFO - __main__ - Step 31143: {'lr': 0.00019970912326724755, 'samples': 996576, 'steps': 1946, 'loss/train': 2.6615076065063477} -09/20/2021 21:13:59 - INFO - __main__ - Step 31144: {'lr': 0.00019970912326724755, 'samples': 996608, 'steps': 1946, 'loss/train': 2.7384774684906006} -09/20/2021 21:14:00 - INFO - __main__ - Step 31145: {'lr': 0.00019970912326724755, 'samples': 996640, 'steps': 1946, 'loss/train': 2.2180886268615723} -09/20/2021 21:14:01 - INFO - __main__ - Step 31146: {'lr': 0.00019970912326724755, 'samples': 996672, 'steps': 1946, 'loss/train': 2.366927146911621} -09/20/2021 21:14:02 - INFO - __main__ - Step 31147: {'lr': 0.00019970912326724755, 'samples': 996704, 'steps': 1946, 'loss/train': 1.9665911197662354} -09/20/2021 21:14:02 - INFO - __main__ - Step 31148: {'lr': 0.00019970912326724755, 'samples': 996736, 'steps': 1946, 'loss/train': 2.2108278274536133} -09/20/2021 21:14:03 - INFO - __main__ - Step 31149: {'lr': 0.00019970912326724755, 'samples': 996768, 'steps': 1946, 'loss/train': 2.794813871383667} -09/20/2021 21:14:04 - INFO - __main__ - Step 31150: {'lr': 0.00019970912326724755, 'samples': 996800, 'steps': 1946, 'loss/train': 2.8025379180908203} -09/20/2021 21:14:05 - INFO - __main__ - Step 31151: {'lr': 0.00019970912326724755, 'samples': 996832, 'steps': 1946, 'loss/train': 1.982417106628418} -09/20/2021 21:14:05 - INFO - __main__ - Step 31152: {'lr': 0.00019970912326724755, 'samples': 996864, 'steps': 1946, 'loss/train': 2.2778289318084717} -09/20/2021 21:14:06 - INFO - __main__ - Step 31153: {'lr': 0.0001997086368843979, 'samples': 996896, 'steps': 1947, 'loss/train': 2.1412341594696045} -09/20/2021 21:14:07 - INFO - __main__ - Step 31154: {'lr': 0.0001997086368843979, 'samples': 996928, 'steps': 1947, 'loss/train': 2.4223854541778564} -09/20/2021 21:14:08 - INFO - __main__ - Step 31155: {'lr': 0.0001997086368843979, 'samples': 996960, 'steps': 1947, 'loss/train': 3.065831184387207} -09/20/2021 21:14:09 - INFO - __main__ - Step 31156: {'lr': 0.0001997086368843979, 'samples': 996992, 'steps': 1947, 'loss/train': 1.7340967655181885} -09/20/2021 21:14:09 - INFO - __main__ - Step 31157: {'lr': 0.0001997086368843979, 'samples': 997024, 'steps': 1947, 'loss/train': 2.8446176052093506} -09/20/2021 21:14:10 - INFO - __main__ - Step 31158: {'lr': 0.0001997086368843979, 'samples': 997056, 'steps': 1947, 'loss/train': 2.855670213699341} -09/20/2021 21:14:11 - INFO - __main__ - Step 31159: {'lr': 0.0001997086368843979, 'samples': 997088, 'steps': 1947, 'loss/train': 2.8521170616149902} -09/20/2021 21:14:12 - INFO - __main__ - Step 31160: {'lr': 0.0001997086368843979, 'samples': 997120, 'steps': 1947, 'loss/train': 3.8932955265045166} -09/20/2021 21:14:12 - INFO - __main__ - Step 31161: {'lr': 0.0001997086368843979, 'samples': 997152, 'steps': 1947, 'loss/train': 2.320970296859741} -09/20/2021 21:14:13 - INFO - __main__ - Step 31162: {'lr': 0.0001997086368843979, 'samples': 997184, 'steps': 1947, 'loss/train': 2.0296571254730225} -09/20/2021 21:14:14 - INFO - __main__ - Step 31163: {'lr': 0.0001997086368843979, 'samples': 997216, 'steps': 1947, 'loss/train': 2.9343013763427734} -09/20/2021 21:14:15 - INFO - __main__ - Step 31164: {'lr': 0.0001997086368843979, 'samples': 997248, 'steps': 1947, 'loss/train': 2.7115767002105713} -09/20/2021 21:14:16 - INFO - __main__ - Step 31165: {'lr': 0.0001997086368843979, 'samples': 997280, 'steps': 1947, 'loss/train': 2.9072558879852295} -09/20/2021 21:14:17 - INFO - __main__ - Step 31166: {'lr': 0.0001997086368843979, 'samples': 997312, 'steps': 1947, 'loss/train': 2.789760112762451} -09/20/2021 21:14:17 - INFO - __main__ - Step 31167: {'lr': 0.0001997086368843979, 'samples': 997344, 'steps': 1947, 'loss/train': 3.1071155071258545} -09/20/2021 21:14:18 - INFO - __main__ - Step 31168: {'lr': 0.0001997086368843979, 'samples': 997376, 'steps': 1947, 'loss/train': 1.893705129623413} -09/20/2021 21:14:19 - INFO - __main__ - Step 31169: {'lr': 0.00019970815009583422, 'samples': 997408, 'steps': 1948, 'loss/train': 1.4739978313446045} -09/20/2021 21:14:20 - INFO - __main__ - Step 31170: {'lr': 0.00019970815009583422, 'samples': 997440, 'steps': 1948, 'loss/train': 2.1464481353759766} -09/20/2021 21:14:20 - INFO - __main__ - Step 31171: {'lr': 0.00019970815009583422, 'samples': 997472, 'steps': 1948, 'loss/train': 2.340228796005249} -09/20/2021 21:14:21 - INFO - __main__ - Step 31172: {'lr': 0.00019970815009583422, 'samples': 997504, 'steps': 1948, 'loss/train': 1.6651136875152588} -09/20/2021 21:14:22 - INFO - __main__ - Step 31173: {'lr': 0.00019970815009583422, 'samples': 997536, 'steps': 1948, 'loss/train': 2.6514830589294434} -09/20/2021 21:14:23 - INFO - __main__ - Step 31174: {'lr': 0.00019970815009583422, 'samples': 997568, 'steps': 1948, 'loss/train': 2.5070548057556152} -09/20/2021 21:14:23 - INFO - __main__ - Step 31175: {'lr': 0.00019970815009583422, 'samples': 997600, 'steps': 1948, 'loss/train': 2.0402345657348633} -09/20/2021 21:14:24 - INFO - __main__ - Step 31176: {'lr': 0.00019970815009583422, 'samples': 997632, 'steps': 1948, 'loss/train': 2.254049062728882} -09/20/2021 21:14:25 - INFO - __main__ - Step 31177: {'lr': 0.00019970815009583422, 'samples': 997664, 'steps': 1948, 'loss/train': 1.6134310960769653} -09/20/2021 21:14:26 - INFO - __main__ - Step 31178: {'lr': 0.00019970815009583422, 'samples': 997696, 'steps': 1948, 'loss/train': 2.704929828643799} -09/20/2021 21:14:26 - INFO - __main__ - Step 31179: {'lr': 0.00019970815009583422, 'samples': 997728, 'steps': 1948, 'loss/train': 1.6494698524475098} -09/20/2021 21:14:27 - INFO - __main__ - Step 31180: {'lr': 0.00019970815009583422, 'samples': 997760, 'steps': 1948, 'loss/train': 2.090625286102295} -09/20/2021 21:14:28 - INFO - __main__ - Step 31181: {'lr': 0.00019970815009583422, 'samples': 997792, 'steps': 1948, 'loss/train': 1.8451666831970215} -09/20/2021 21:14:29 - INFO - __main__ - Step 31182: {'lr': 0.00019970815009583422, 'samples': 997824, 'steps': 1948, 'loss/train': 2.5371172428131104} -09/20/2021 21:14:29 - INFO - __main__ - Step 31183: {'lr': 0.00019970815009583422, 'samples': 997856, 'steps': 1948, 'loss/train': 3.044128179550171} -09/20/2021 21:14:30 - INFO - __main__ - Step 31184: {'lr': 0.00019970815009583422, 'samples': 997888, 'steps': 1948, 'loss/train': 1.9017598628997803} -09/20/2021 21:14:31 - INFO - __main__ - Step 31185: {'lr': 0.0001997076629015584, 'samples': 997920, 'steps': 1949, 'loss/train': 1.9498929977416992} -09/20/2021 21:14:32 - INFO - __main__ - Step 31186: {'lr': 0.0001997076629015584, 'samples': 997952, 'steps': 1949, 'loss/train': 2.807802200317383} -09/20/2021 21:14:33 - INFO - __main__ - Step 31187: {'lr': 0.0001997076629015584, 'samples': 997984, 'steps': 1949, 'loss/train': 2.518671989440918} -09/20/2021 21:14:33 - INFO - __main__ - Step 31188: {'lr': 0.0001997076629015584, 'samples': 998016, 'steps': 1949, 'loss/train': 2.9117543697357178} -09/20/2021 21:14:34 - INFO - __main__ - Step 31189: {'lr': 0.0001997076629015584, 'samples': 998048, 'steps': 1949, 'loss/train': 2.96219801902771} -09/20/2021 21:14:35 - INFO - __main__ - Step 31190: {'lr': 0.0001997076629015584, 'samples': 998080, 'steps': 1949, 'loss/train': 2.3717434406280518} -09/20/2021 21:14:36 - INFO - __main__ - Step 31191: {'lr': 0.0001997076629015584, 'samples': 998112, 'steps': 1949, 'loss/train': 2.4343936443328857} -09/20/2021 21:14:36 - INFO - __main__ - Step 31192: {'lr': 0.0001997076629015584, 'samples': 998144, 'steps': 1949, 'loss/train': 2.7755820751190186} -09/20/2021 21:14:37 - INFO - __main__ - Step 31193: {'lr': 0.0001997076629015584, 'samples': 998176, 'steps': 1949, 'loss/train': 2.073605537414551} -09/20/2021 21:14:38 - INFO - __main__ - Step 31194: {'lr': 0.0001997076629015584, 'samples': 998208, 'steps': 1949, 'loss/train': 2.487705945968628} -09/20/2021 21:14:39 - INFO - __main__ - Step 31195: {'lr': 0.0001997076629015584, 'samples': 998240, 'steps': 1949, 'loss/train': 2.9927563667297363} -09/20/2021 21:14:40 - INFO - __main__ - Step 31196: {'lr': 0.0001997076629015584, 'samples': 998272, 'steps': 1949, 'loss/train': 2.969310760498047} -09/20/2021 21:14:41 - INFO - __main__ - Step 31197: {'lr': 0.0001997076629015584, 'samples': 998304, 'steps': 1949, 'loss/train': 2.307603120803833} -09/20/2021 21:14:41 - INFO - __main__ - Step 31198: {'lr': 0.0001997076629015584, 'samples': 998336, 'steps': 1949, 'loss/train': 2.2703657150268555} -09/20/2021 21:14:42 - INFO - __main__ - Step 31199: {'lr': 0.0001997076629015584, 'samples': 998368, 'steps': 1949, 'loss/train': 1.8397800922393799} -09/20/2021 21:14:43 - INFO - __main__ - Step 31200: {'lr': 0.0001997076629015584, 'samples': 998400, 'steps': 1949, 'loss/train': 2.607898473739624} -09/20/2021 21:14:44 - INFO - __main__ - Step 31201: {'lr': 0.00019970717530157255, 'samples': 998432, 'steps': 1950, 'loss/train': 2.1185688972473145} -09/20/2021 21:14:45 - INFO - __main__ - Step 31202: {'lr': 0.00019970717530157255, 'samples': 998464, 'steps': 1950, 'loss/train': 3.101513624191284} -09/20/2021 21:14:45 - INFO - __main__ - Step 31203: {'lr': 0.00019970717530157255, 'samples': 998496, 'steps': 1950, 'loss/train': 2.6256699562072754} -09/20/2021 21:14:46 - INFO - __main__ - Step 31204: {'lr': 0.00019970717530157255, 'samples': 998528, 'steps': 1950, 'loss/train': 2.929361343383789} -09/20/2021 21:14:47 - INFO - __main__ - Step 31205: {'lr': 0.00019970717530157255, 'samples': 998560, 'steps': 1950, 'loss/train': 2.622199058532715} -09/20/2021 21:14:48 - INFO - __main__ - Step 31206: {'lr': 0.00019970717530157255, 'samples': 998592, 'steps': 1950, 'loss/train': 3.1942033767700195} -09/20/2021 21:14:48 - INFO - __main__ - Step 31207: {'lr': 0.00019970717530157255, 'samples': 998624, 'steps': 1950, 'loss/train': 1.9271372556686401} -09/20/2021 21:14:49 - INFO - __main__ - Step 31208: {'lr': 0.00019970717530157255, 'samples': 998656, 'steps': 1950, 'loss/train': 2.1531338691711426} -09/20/2021 21:14:50 - INFO - __main__ - Step 31209: {'lr': 0.00019970717530157255, 'samples': 998688, 'steps': 1950, 'loss/train': 2.37119460105896} -09/20/2021 21:14:51 - INFO - __main__ - Step 31210: {'lr': 0.00019970717530157255, 'samples': 998720, 'steps': 1950, 'loss/train': 2.5116515159606934} -09/20/2021 21:14:51 - INFO - __main__ - Step 31211: {'lr': 0.00019970717530157255, 'samples': 998752, 'steps': 1950, 'loss/train': 1.6456942558288574} -09/20/2021 21:14:52 - INFO - __main__ - Step 31212: {'lr': 0.00019970717530157255, 'samples': 998784, 'steps': 1950, 'loss/train': 0.2327975630760193} -09/20/2021 21:14:53 - INFO - __main__ - Step 31213: {'lr': 0.00019970717530157255, 'samples': 998816, 'steps': 1950, 'loss/train': 2.6312692165374756} -09/20/2021 21:14:54 - INFO - __main__ - Step 31214: {'lr': 0.00019970717530157255, 'samples': 998848, 'steps': 1950, 'loss/train': 2.6708528995513916} -09/20/2021 21:14:54 - INFO - __main__ - Step 31215: {'lr': 0.00019970717530157255, 'samples': 998880, 'steps': 1950, 'loss/train': 3.3722410202026367} -09/20/2021 21:14:55 - INFO - __main__ - Step 31216: {'lr': 0.00019970717530157255, 'samples': 998912, 'steps': 1950, 'loss/train': 1.5506600141525269} -09/20/2021 21:14:56 - INFO - __main__ - Step 31217: {'lr': 0.00019970668729587856, 'samples': 998944, 'steps': 1951, 'loss/train': 2.823479175567627} -09/20/2021 21:14:57 - INFO - __main__ - Step 31218: {'lr': 0.00019970668729587856, 'samples': 998976, 'steps': 1951, 'loss/train': 4.558077335357666} -09/20/2021 21:14:57 - INFO - __main__ - Step 31219: {'lr': 0.00019970668729587856, 'samples': 999008, 'steps': 1951, 'loss/train': 1.792926549911499} -09/20/2021 21:14:58 - INFO - __main__ - Step 31220: {'lr': 0.00019970668729587856, 'samples': 999040, 'steps': 1951, 'loss/train': 2.707188367843628} -09/20/2021 21:14:59 - INFO - __main__ - Step 31221: {'lr': 0.00019970668729587856, 'samples': 999072, 'steps': 1951, 'loss/train': 3.1763534545898438} -09/20/2021 21:15:00 - INFO - __main__ - Step 31222: {'lr': 0.00019970668729587856, 'samples': 999104, 'steps': 1951, 'loss/train': 2.955866575241089} -09/20/2021 21:15:00 - INFO - __main__ - Step 31223: {'lr': 0.00019970668729587856, 'samples': 999136, 'steps': 1951, 'loss/train': 1.7516977787017822} -09/20/2021 21:15:01 - INFO - __main__ - Step 31224: {'lr': 0.00019970668729587856, 'samples': 999168, 'steps': 1951, 'loss/train': 2.862140417098999} -09/20/2021 21:15:02 - INFO - __main__ - Step 31225: {'lr': 0.00019970668729587856, 'samples': 999200, 'steps': 1951, 'loss/train': 2.5031604766845703} -09/20/2021 21:15:03 - INFO - __main__ - Step 31226: {'lr': 0.00019970668729587856, 'samples': 999232, 'steps': 1951, 'loss/train': 3.361168384552002} -09/20/2021 21:15:04 - INFO - __main__ - Step 31227: {'lr': 0.00019970668729587856, 'samples': 999264, 'steps': 1951, 'loss/train': 1.1787714958190918} -09/20/2021 21:15:05 - INFO - __main__ - Step 31228: {'lr': 0.00019970668729587856, 'samples': 999296, 'steps': 1951, 'loss/train': 1.7399872541427612} -09/20/2021 21:15:06 - INFO - __main__ - Step 31229: {'lr': 0.00019970668729587856, 'samples': 999328, 'steps': 1951, 'loss/train': 1.5354913473129272} -09/20/2021 21:15:06 - INFO - __main__ - Step 31230: {'lr': 0.00019970668729587856, 'samples': 999360, 'steps': 1951, 'loss/train': 1.751617193222046} -09/20/2021 21:15:07 - INFO - __main__ - Step 31231: {'lr': 0.00019970668729587856, 'samples': 999392, 'steps': 1951, 'loss/train': 2.560598134994507} -09/20/2021 21:15:08 - INFO - __main__ - Step 31232: {'lr': 0.00019970668729587856, 'samples': 999424, 'steps': 1951, 'loss/train': 2.8800816535949707} -09/20/2021 21:15:09 - INFO - __main__ - Step 31233: {'lr': 0.00019970619888447845, 'samples': 999456, 'steps': 1952, 'loss/train': 2.8320350646972656} -09/20/2021 21:15:10 - INFO - __main__ - Step 31234: {'lr': 0.00019970619888447845, 'samples': 999488, 'steps': 1952, 'loss/train': 1.6787787675857544} -09/20/2021 21:15:10 - INFO - __main__ - Step 31235: {'lr': 0.00019970619888447845, 'samples': 999520, 'steps': 1952, 'loss/train': 0.19387100636959076} -09/20/2021 21:15:11 - INFO - __main__ - Step 31236: {'lr': 0.00019970619888447845, 'samples': 999552, 'steps': 1952, 'loss/train': 0.4387930631637573} -09/20/2021 21:15:12 - INFO - __main__ - Step 31237: {'lr': 0.00019970619888447845, 'samples': 999584, 'steps': 1952, 'loss/train': 0.14265406131744385} -09/20/2021 21:15:13 - INFO - __main__ - Step 31238: {'lr': 0.00019970619888447845, 'samples': 999616, 'steps': 1952, 'loss/train': 0.29219600558280945} -09/20/2021 21:15:13 - INFO - __main__ - Step 31239: {'lr': 0.00019970619888447845, 'samples': 999648, 'steps': 1952, 'loss/train': 4.585582256317139} -09/20/2021 21:15:14 - INFO - __main__ - Step 31240: {'lr': 0.00019970619888447845, 'samples': 999680, 'steps': 1952, 'loss/train': 3.98854660987854} -09/20/2021 21:15:15 - INFO - __main__ - Step 31241: {'lr': 0.00019970619888447845, 'samples': 999712, 'steps': 1952, 'loss/train': 1.8419334888458252} -09/20/2021 21:15:16 - INFO - __main__ - Step 31242: {'lr': 0.00019970619888447845, 'samples': 999744, 'steps': 1952, 'loss/train': 2.854976177215576} -09/20/2021 21:15:16 - INFO - __main__ - Step 31243: {'lr': 0.00019970619888447845, 'samples': 999776, 'steps': 1952, 'loss/train': 2.66701602935791} -09/20/2021 21:15:17 - INFO - __main__ - Step 31244: {'lr': 0.00019970619888447845, 'samples': 999808, 'steps': 1952, 'loss/train': 2.600020408630371} -09/20/2021 21:15:18 - INFO - __main__ - Step 31245: {'lr': 0.00019970619888447845, 'samples': 999840, 'steps': 1952, 'loss/train': 2.3134851455688477} -09/20/2021 21:15:19 - INFO - __main__ - Step 31246: {'lr': 0.00019970619888447845, 'samples': 999872, 'steps': 1952, 'loss/train': 2.2179758548736572} -09/20/2021 21:15:19 - INFO - __main__ - Step 31247: {'lr': 0.00019970619888447845, 'samples': 999904, 'steps': 1952, 'loss/train': 2.362971305847168} -09/20/2021 21:15:20 - INFO - __main__ - Step 31248: {'lr': 0.00019970619888447845, 'samples': 999936, 'steps': 1952, 'loss/train': 2.270284652709961} -09/20/2021 21:15:21 - INFO - __main__ - Step 31249: {'lr': 0.00019970571006737423, 'samples': 999968, 'steps': 1953, 'loss/train': 2.5869362354278564} -09/20/2021 21:15:22 - INFO - __main__ - Step 31250: {'lr': 0.00019970571006737423, 'samples': 1000000, 'steps': 1953, 'loss/train': 2.4628078937530518} -09/20/2021 21:15:22 - INFO - __main__ - Step 31251: {'lr': 0.00019970571006737423, 'samples': 1000032, 'steps': 1953, 'loss/train': 3.0147178173065186} -09/20/2021 21:15:23 - INFO - __main__ - Step 31252: {'lr': 0.00019970571006737423, 'samples': 1000064, 'steps': 1953, 'loss/train': 1.0164514780044556} -09/20/2021 21:15:24 - INFO - __main__ - Step 31253: {'lr': 0.00019970571006737423, 'samples': 1000096, 'steps': 1953, 'loss/train': 2.4545607566833496} -09/20/2021 21:15:25 - INFO - __main__ - Step 31254: {'lr': 0.00019970571006737423, 'samples': 1000128, 'steps': 1953, 'loss/train': 2.386981248855591} -09/20/2021 21:15:25 - INFO - __main__ - Step 31255: {'lr': 0.00019970571006737423, 'samples': 1000160, 'steps': 1953, 'loss/train': 2.185678482055664} -09/20/2021 21:15:27 - INFO - __main__ - Step 31256: {'lr': 0.00019970571006737423, 'samples': 1000192, 'steps': 1953, 'loss/train': 3.237755298614502} -09/20/2021 21:15:28 - INFO - __main__ - Step 31257: {'lr': 0.00019970571006737423, 'samples': 1000224, 'steps': 1953, 'loss/train': 3.0680344104766846} -09/20/2021 21:15:29 - INFO - __main__ - Step 31258: {'lr': 0.00019970571006737423, 'samples': 1000256, 'steps': 1953, 'loss/train': 1.8428009748458862} -09/20/2021 21:15:30 - INFO - __main__ - Step 31259: {'lr': 0.00019970571006737423, 'samples': 1000288, 'steps': 1953, 'loss/train': 2.4585697650909424} -09/20/2021 21:15:30 - INFO - __main__ - Step 31260: {'lr': 0.00019970571006737423, 'samples': 1000320, 'steps': 1953, 'loss/train': 2.634870767593384} -09/20/2021 21:15:31 - INFO - __main__ - Step 31261: {'lr': 0.00019970571006737423, 'samples': 1000352, 'steps': 1953, 'loss/train': 1.8336580991744995} -09/20/2021 21:15:32 - INFO - __main__ - Step 31262: {'lr': 0.00019970571006737423, 'samples': 1000384, 'steps': 1953, 'loss/train': 2.6519246101379395} -09/20/2021 21:15:33 - INFO - __main__ - Step 31263: {'lr': 0.00019970571006737423, 'samples': 1000416, 'steps': 1953, 'loss/train': 2.4950673580169678} -09/20/2021 21:15:33 - INFO - __main__ - Step 31264: {'lr': 0.00019970571006737423, 'samples': 1000448, 'steps': 1953, 'loss/train': 1.6028807163238525} -09/20/2021 21:15:34 - INFO - __main__ - Step 31265: {'lr': 0.0001997052208445678, 'samples': 1000480, 'steps': 1954, 'loss/train': 1.7023118734359741} -09/20/2021 21:15:35 - INFO - __main__ - Step 31266: {'lr': 0.0001997052208445678, 'samples': 1000512, 'steps': 1954, 'loss/train': 1.7774133682250977} -09/20/2021 21:15:36 - INFO - __main__ - Step 31267: {'lr': 0.0001997052208445678, 'samples': 1000544, 'steps': 1954, 'loss/train': 1.7852321863174438} -09/20/2021 21:15:36 - INFO - __main__ - Step 31268: {'lr': 0.0001997052208445678, 'samples': 1000576, 'steps': 1954, 'loss/train': 2.0078952312469482} -09/20/2021 21:15:37 - INFO - __main__ - Step 31269: {'lr': 0.0001997052208445678, 'samples': 1000608, 'steps': 1954, 'loss/train': 2.3893489837646484} -09/20/2021 21:15:38 - INFO - __main__ - Step 31270: {'lr': 0.0001997052208445678, 'samples': 1000640, 'steps': 1954, 'loss/train': 0.4889482855796814} -09/20/2021 21:15:39 - INFO - __main__ - Step 31271: {'lr': 0.0001997052208445678, 'samples': 1000672, 'steps': 1954, 'loss/train': 0.8118903040885925} -09/20/2021 21:15:39 - INFO - __main__ - Step 31272: {'lr': 0.0001997052208445678, 'samples': 1000704, 'steps': 1954, 'loss/train': 3.3098530769348145} -09/20/2021 21:15:40 - INFO - __main__ - Step 31273: {'lr': 0.0001997052208445678, 'samples': 1000736, 'steps': 1954, 'loss/train': 3.5463931560516357} -09/20/2021 21:15:41 - INFO - __main__ - Step 31274: {'lr': 0.0001997052208445678, 'samples': 1000768, 'steps': 1954, 'loss/train': 2.388784885406494} -09/20/2021 21:15:42 - INFO - __main__ - Step 31275: {'lr': 0.0001997052208445678, 'samples': 1000800, 'steps': 1954, 'loss/train': 2.183551788330078} -09/20/2021 21:15:42 - INFO - __main__ - Step 31276: {'lr': 0.0001997052208445678, 'samples': 1000832, 'steps': 1954, 'loss/train': 1.5842117071151733} -09/20/2021 21:15:43 - INFO - __main__ - Step 31277: {'lr': 0.0001997052208445678, 'samples': 1000864, 'steps': 1954, 'loss/train': 2.1308107376098633} -09/20/2021 21:15:44 - INFO - __main__ - Step 31278: {'lr': 0.0001997052208445678, 'samples': 1000896, 'steps': 1954, 'loss/train': 2.057006359100342} -09/20/2021 21:15:45 - INFO - __main__ - Step 31279: {'lr': 0.0001997052208445678, 'samples': 1000928, 'steps': 1954, 'loss/train': 2.0995161533355713} -09/20/2021 21:15:45 - INFO - __main__ - Step 31280: {'lr': 0.0001997052208445678, 'samples': 1000960, 'steps': 1954, 'loss/train': 1.9011539220809937} -09/20/2021 21:15:46 - INFO - __main__ - Step 31281: {'lr': 0.0001997047312160613, 'samples': 1000992, 'steps': 1955, 'loss/train': 2.6920509338378906} -09/20/2021 21:15:47 - INFO - __main__ - Step 31282: {'lr': 0.0001997047312160613, 'samples': 1001024, 'steps': 1955, 'loss/train': 1.6118460893630981} -09/20/2021 21:15:48 - INFO - __main__ - Step 31283: {'lr': 0.0001997047312160613, 'samples': 1001056, 'steps': 1955, 'loss/train': 0.3607073128223419} -09/20/2021 21:15:49 - INFO - __main__ - Step 31284: {'lr': 0.0001997047312160613, 'samples': 1001088, 'steps': 1955, 'loss/train': 0.15163284540176392} -09/20/2021 21:15:49 - INFO - __main__ - Step 31285: {'lr': 0.0001997047312160613, 'samples': 1001120, 'steps': 1955, 'loss/train': 0.6929726004600525} -09/20/2021 21:15:51 - INFO - __main__ - Step 31286: {'lr': 0.0001997047312160613, 'samples': 1001152, 'steps': 1955, 'loss/train': 2.685718536376953} -09/20/2021 21:15:52 - INFO - __main__ - Step 31287: {'lr': 0.0001997047312160613, 'samples': 1001184, 'steps': 1955, 'loss/train': 2.5921218395233154} -09/20/2021 21:15:53 - INFO - __main__ - Step 31288: {'lr': 0.0001997047312160613, 'samples': 1001216, 'steps': 1955, 'loss/train': 2.2961044311523438} -09/20/2021 21:15:53 - INFO - __main__ - Step 31289: {'lr': 0.0001997047312160613, 'samples': 1001248, 'steps': 1955, 'loss/train': 1.8693169355392456} -09/20/2021 21:15:54 - INFO - __main__ - Step 31290: {'lr': 0.0001997047312160613, 'samples': 1001280, 'steps': 1955, 'loss/train': 1.8582161664962769} -09/20/2021 21:15:55 - INFO - __main__ - Step 31291: {'lr': 0.0001997047312160613, 'samples': 1001312, 'steps': 1955, 'loss/train': 2.0398621559143066} -09/20/2021 21:15:56 - INFO - __main__ - Step 31292: {'lr': 0.0001997047312160613, 'samples': 1001344, 'steps': 1955, 'loss/train': 0.5163722038269043} -09/20/2021 21:15:56 - INFO - __main__ - Step 31293: {'lr': 0.0001997047312160613, 'samples': 1001376, 'steps': 1955, 'loss/train': 2.565096378326416} -09/20/2021 21:15:57 - INFO - __main__ - Step 31294: {'lr': 0.0001997047312160613, 'samples': 1001408, 'steps': 1955, 'loss/train': 0.8910395503044128} -09/20/2021 21:15:58 - INFO - __main__ - Step 31295: {'lr': 0.0001997047312160613, 'samples': 1001440, 'steps': 1955, 'loss/train': 0.2524399757385254} -09/20/2021 21:15:59 - INFO - __main__ - Step 31296: {'lr': 0.0001997047312160613, 'samples': 1001472, 'steps': 1955, 'loss/train': 0.30546683073043823} -09/20/2021 21:15:59 - INFO - __main__ - Step 31297: {'lr': 0.00019970424118185656, 'samples': 1001504, 'steps': 1956, 'loss/train': 0.5562770962715149} -09/20/2021 21:16:00 - INFO - __main__ - Step 31298: {'lr': 0.00019970424118185656, 'samples': 1001536, 'steps': 1956, 'loss/train': 0.2862328886985779} -09/20/2021 21:16:01 - INFO - __main__ - Step 31299: {'lr': 0.00019970424118185656, 'samples': 1001568, 'steps': 1956, 'loss/train': 0.42073947191238403} -09/20/2021 21:16:02 - INFO - __main__ - Step 31300: {'lr': 0.00019970424118185656, 'samples': 1001600, 'steps': 1956, 'loss/train': 0.7916825413703918} -09/20/2021 21:16:02 - INFO - __main__ - Step 31301: {'lr': 0.00019970424118185656, 'samples': 1001632, 'steps': 1956, 'loss/train': 2.9559738636016846} -09/20/2021 21:16:03 - INFO - __main__ - Step 31302: {'lr': 0.00019970424118185656, 'samples': 1001664, 'steps': 1956, 'loss/train': 0.9459148645401001} -09/20/2021 21:16:04 - INFO - __main__ - Step 31303: {'lr': 0.00019970424118185656, 'samples': 1001696, 'steps': 1956, 'loss/train': 2.3991050720214844} -09/20/2021 21:16:05 - INFO - __main__ - Step 31304: {'lr': 0.00019970424118185656, 'samples': 1001728, 'steps': 1956, 'loss/train': 1.5555120706558228} -09/20/2021 21:16:05 - INFO - __main__ - Step 31305: {'lr': 0.00019970424118185656, 'samples': 1001760, 'steps': 1956, 'loss/train': 2.6068806648254395} -09/20/2021 21:16:06 - INFO - __main__ - Step 31306: {'lr': 0.00019970424118185656, 'samples': 1001792, 'steps': 1956, 'loss/train': 2.8258984088897705} -09/20/2021 21:16:07 - INFO - __main__ - Step 31307: {'lr': 0.00019970424118185656, 'samples': 1001824, 'steps': 1956, 'loss/train': 2.344552516937256} -09/20/2021 21:16:08 - INFO - __main__ - Step 31308: {'lr': 0.00019970424118185656, 'samples': 1001856, 'steps': 1956, 'loss/train': 1.1028629541397095} -09/20/2021 21:16:08 - INFO - __main__ - Step 31309: {'lr': 0.00019970424118185656, 'samples': 1001888, 'steps': 1956, 'loss/train': 1.5092713832855225} -09/20/2021 21:16:09 - INFO - __main__ - Step 31310: {'lr': 0.00019970424118185656, 'samples': 1001920, 'steps': 1956, 'loss/train': 2.3353700637817383} -09/20/2021 21:16:10 - INFO - __main__ - Step 31311: {'lr': 0.00019970424118185656, 'samples': 1001952, 'steps': 1956, 'loss/train': 2.2634241580963135} -09/20/2021 21:16:11 - INFO - __main__ - Step 31312: {'lr': 0.00019970424118185656, 'samples': 1001984, 'steps': 1956, 'loss/train': 2.591867446899414} -09/20/2021 21:16:12 - INFO - __main__ - Step 31313: {'lr': 0.00019970375074195568, 'samples': 1002016, 'steps': 1957, 'loss/train': 2.0190110206604004} -09/20/2021 21:16:12 - INFO - __main__ - Step 31314: {'lr': 0.00019970375074195568, 'samples': 1002048, 'steps': 1957, 'loss/train': 2.9226796627044678} -09/20/2021 21:16:13 - INFO - __main__ - Step 31315: {'lr': 0.00019970375074195568, 'samples': 1002080, 'steps': 1957, 'loss/train': 2.5095510482788086} -09/20/2021 21:16:14 - INFO - __main__ - Step 31316: {'lr': 0.00019970375074195568, 'samples': 1002112, 'steps': 1957, 'loss/train': 2.022017478942871} -09/20/2021 21:16:15 - INFO - __main__ - Step 31317: {'lr': 0.00019970375074195568, 'samples': 1002144, 'steps': 1957, 'loss/train': 2.477739095687866} -09/20/2021 21:16:16 - INFO - __main__ - Step 31318: {'lr': 0.00019970375074195568, 'samples': 1002176, 'steps': 1957, 'loss/train': 1.8431401252746582} -09/20/2021 21:16:17 - INFO - __main__ - Step 31319: {'lr': 0.00019970375074195568, 'samples': 1002208, 'steps': 1957, 'loss/train': 2.5500993728637695} -09/20/2021 21:16:17 - INFO - __main__ - Step 31320: {'lr': 0.00019970375074195568, 'samples': 1002240, 'steps': 1957, 'loss/train': 0.6545674204826355} -09/20/2021 21:16:18 - INFO - __main__ - Step 31321: {'lr': 0.00019970375074195568, 'samples': 1002272, 'steps': 1957, 'loss/train': 2.6876699924468994} -09/20/2021 21:16:19 - INFO - __main__ - Step 31322: {'lr': 0.00019970375074195568, 'samples': 1002304, 'steps': 1957, 'loss/train': 2.7163119316101074} -09/20/2021 21:16:20 - INFO - __main__ - Step 31323: {'lr': 0.00019970375074195568, 'samples': 1002336, 'steps': 1957, 'loss/train': 2.515279769897461} -09/20/2021 21:16:20 - INFO - __main__ - Step 31324: {'lr': 0.00019970375074195568, 'samples': 1002368, 'steps': 1957, 'loss/train': 2.1427009105682373} -09/20/2021 21:16:21 - INFO - __main__ - Step 31325: {'lr': 0.00019970375074195568, 'samples': 1002400, 'steps': 1957, 'loss/train': 2.737818956375122} -09/20/2021 21:16:22 - INFO - __main__ - Step 31326: {'lr': 0.00019970375074195568, 'samples': 1002432, 'steps': 1957, 'loss/train': 2.0249459743499756} -09/20/2021 21:16:23 - INFO - __main__ - Step 31327: {'lr': 0.00019970375074195568, 'samples': 1002464, 'steps': 1957, 'loss/train': 3.2533576488494873} -09/20/2021 21:16:23 - INFO - __main__ - Step 31328: {'lr': 0.00019970375074195568, 'samples': 1002496, 'steps': 1957, 'loss/train': 2.2918787002563477} -09/20/2021 21:16:24 - INFO - __main__ - Step 31329: {'lr': 0.00019970325989636064, 'samples': 1002528, 'steps': 1958, 'loss/train': 3.2732577323913574} -09/20/2021 21:16:25 - INFO - __main__ - Step 31330: {'lr': 0.00019970325989636064, 'samples': 1002560, 'steps': 1958, 'loss/train': 2.9873435497283936} -09/20/2021 21:16:26 - INFO - __main__ - Step 31331: {'lr': 0.00019970325989636064, 'samples': 1002592, 'steps': 1958, 'loss/train': 2.400165319442749} -09/20/2021 21:16:27 - INFO - __main__ - Step 31332: {'lr': 0.00019970325989636064, 'samples': 1002624, 'steps': 1958, 'loss/train': 2.249777317047119} -09/20/2021 21:16:27 - INFO - __main__ - Step 31333: {'lr': 0.00019970325989636064, 'samples': 1002656, 'steps': 1958, 'loss/train': 2.7076680660247803} -09/20/2021 21:16:28 - INFO - __main__ - Step 31334: {'lr': 0.00019970325989636064, 'samples': 1002688, 'steps': 1958, 'loss/train': 2.653169631958008} -09/20/2021 21:16:29 - INFO - __main__ - Step 31335: {'lr': 0.00019970325989636064, 'samples': 1002720, 'steps': 1958, 'loss/train': 1.5968385934829712} -09/20/2021 21:16:30 - INFO - __main__ - Step 31336: {'lr': 0.00019970325989636064, 'samples': 1002752, 'steps': 1958, 'loss/train': 3.1437573432922363} -09/20/2021 21:16:30 - INFO - __main__ - Step 31337: {'lr': 0.00019970325989636064, 'samples': 1002784, 'steps': 1958, 'loss/train': 2.354930877685547} -09/20/2021 21:16:31 - INFO - __main__ - Step 31338: {'lr': 0.00019970325989636064, 'samples': 1002816, 'steps': 1958, 'loss/train': 2.179910659790039} -09/20/2021 21:16:32 - INFO - __main__ - Step 31339: {'lr': 0.00019970325989636064, 'samples': 1002848, 'steps': 1958, 'loss/train': 1.8537622690200806} -09/20/2021 21:16:33 - INFO - __main__ - Step 31340: {'lr': 0.00019970325989636064, 'samples': 1002880, 'steps': 1958, 'loss/train': 2.4271602630615234} -09/20/2021 21:16:33 - INFO - __main__ - Step 31341: {'lr': 0.00019970325989636064, 'samples': 1002912, 'steps': 1958, 'loss/train': 1.4248366355895996} -09/20/2021 21:16:34 - INFO - __main__ - Step 31342: {'lr': 0.00019970325989636064, 'samples': 1002944, 'steps': 1958, 'loss/train': 2.9990627765655518} -09/20/2021 21:16:35 - INFO - __main__ - Step 31343: {'lr': 0.00019970325989636064, 'samples': 1002976, 'steps': 1958, 'loss/train': 2.4900662899017334} -09/20/2021 21:16:36 - INFO - __main__ - Step 31344: {'lr': 0.00019970325989636064, 'samples': 1003008, 'steps': 1958, 'loss/train': 1.8810343742370605} -09/20/2021 21:16:36 - INFO - __main__ - Step 31345: {'lr': 0.0001997027686450734, 'samples': 1003040, 'steps': 1959, 'loss/train': 2.9351253509521484} -09/20/2021 21:16:37 - INFO - __main__ - Step 31346: {'lr': 0.0001997027686450734, 'samples': 1003072, 'steps': 1959, 'loss/train': 2.0459794998168945} -09/20/2021 21:16:38 - INFO - __main__ - Step 31347: {'lr': 0.0001997027686450734, 'samples': 1003104, 'steps': 1959, 'loss/train': 2.522268056869507} -09/20/2021 21:16:39 - INFO - __main__ - Step 31348: {'lr': 0.0001997027686450734, 'samples': 1003136, 'steps': 1959, 'loss/train': 2.3348209857940674} -09/20/2021 21:16:40 - INFO - __main__ - Step 31349: {'lr': 0.0001997027686450734, 'samples': 1003168, 'steps': 1959, 'loss/train': 3.237623929977417} -09/20/2021 21:16:41 - INFO - __main__ - Step 31350: {'lr': 0.0001997027686450734, 'samples': 1003200, 'steps': 1959, 'loss/train': 3.1109912395477295} -09/20/2021 21:16:41 - INFO - __main__ - Step 31351: {'lr': 0.0001997027686450734, 'samples': 1003232, 'steps': 1959, 'loss/train': 1.7729038000106812} -09/20/2021 21:16:42 - INFO - __main__ - Step 31352: {'lr': 0.0001997027686450734, 'samples': 1003264, 'steps': 1959, 'loss/train': 2.6080758571624756} -09/20/2021 21:16:43 - INFO - __main__ - Step 31353: {'lr': 0.0001997027686450734, 'samples': 1003296, 'steps': 1959, 'loss/train': 2.2754580974578857} -09/20/2021 21:16:44 - INFO - __main__ - Step 31354: {'lr': 0.0001997027686450734, 'samples': 1003328, 'steps': 1959, 'loss/train': 1.9730958938598633} -09/20/2021 21:16:44 - INFO - __main__ - Step 31355: {'lr': 0.0001997027686450734, 'samples': 1003360, 'steps': 1959, 'loss/train': 2.6708507537841797} -09/20/2021 21:16:45 - INFO - __main__ - Step 31356: {'lr': 0.0001997027686450734, 'samples': 1003392, 'steps': 1959, 'loss/train': 2.466944694519043} -09/20/2021 21:16:46 - INFO - __main__ - Step 31357: {'lr': 0.0001997027686450734, 'samples': 1003424, 'steps': 1959, 'loss/train': 2.5636868476867676} -09/20/2021 21:16:47 - INFO - __main__ - Step 31358: {'lr': 0.0001997027686450734, 'samples': 1003456, 'steps': 1959, 'loss/train': 2.7394840717315674} -09/20/2021 21:16:47 - INFO - __main__ - Step 31359: {'lr': 0.0001997027686450734, 'samples': 1003488, 'steps': 1959, 'loss/train': 2.8999428749084473} -09/20/2021 21:16:48 - INFO - __main__ - Step 31360: {'lr': 0.0001997027686450734, 'samples': 1003520, 'steps': 1959, 'loss/train': 2.3794095516204834} -09/20/2021 21:16:49 - INFO - __main__ - Step 31361: {'lr': 0.00019970227698809599, 'samples': 1003552, 'steps': 1960, 'loss/train': 3.1277947425842285} -09/20/2021 21:16:50 - INFO - __main__ - Step 31362: {'lr': 0.00019970227698809599, 'samples': 1003584, 'steps': 1960, 'loss/train': 2.4653561115264893} -09/20/2021 21:16:51 - INFO - __main__ - Step 31363: {'lr': 0.00019970227698809599, 'samples': 1003616, 'steps': 1960, 'loss/train': 2.5516910552978516} -09/20/2021 21:16:51 - INFO - __main__ - Step 31364: {'lr': 0.00019970227698809599, 'samples': 1003648, 'steps': 1960, 'loss/train': 1.8267767429351807} -09/20/2021 21:16:52 - INFO - __main__ - Step 31365: {'lr': 0.00019970227698809599, 'samples': 1003680, 'steps': 1960, 'loss/train': 1.874168872833252} -09/20/2021 21:16:53 - INFO - __main__ - Step 31366: {'lr': 0.00019970227698809599, 'samples': 1003712, 'steps': 1960, 'loss/train': 2.354419469833374} -09/20/2021 21:16:54 - INFO - __main__ - Step 31367: {'lr': 0.00019970227698809599, 'samples': 1003744, 'steps': 1960, 'loss/train': 2.999283790588379} -09/20/2021 21:16:54 - INFO - __main__ - Step 31368: {'lr': 0.00019970227698809599, 'samples': 1003776, 'steps': 1960, 'loss/train': 1.6576941013336182} -09/20/2021 21:16:55 - INFO - __main__ - Step 31369: {'lr': 0.00019970227698809599, 'samples': 1003808, 'steps': 1960, 'loss/train': 2.1661784648895264} -09/20/2021 21:16:56 - INFO - __main__ - Step 31370: {'lr': 0.00019970227698809599, 'samples': 1003840, 'steps': 1960, 'loss/train': 3.880197048187256} -09/20/2021 21:16:57 - INFO - __main__ - Step 31371: {'lr': 0.00019970227698809599, 'samples': 1003872, 'steps': 1960, 'loss/train': 2.48012375831604} -09/20/2021 21:16:57 - INFO - __main__ - Step 31372: {'lr': 0.00019970227698809599, 'samples': 1003904, 'steps': 1960, 'loss/train': 1.9770710468292236} -09/20/2021 21:16:58 - INFO - __main__ - Step 31373: {'lr': 0.00019970227698809599, 'samples': 1003936, 'steps': 1960, 'loss/train': 2.1453018188476562} -09/20/2021 21:16:59 - INFO - __main__ - Step 31374: {'lr': 0.00019970227698809599, 'samples': 1003968, 'steps': 1960, 'loss/train': 0.6276137232780457} -09/20/2021 21:17:00 - INFO - __main__ - Step 31375: {'lr': 0.00019970227698809599, 'samples': 1004000, 'steps': 1960, 'loss/train': 0.12264282256364822} -09/20/2021 21:17:00 - INFO - __main__ - Step 31376: {'lr': 0.00019970227698809599, 'samples': 1004032, 'steps': 1960, 'loss/train': 2.753133773803711} -09/20/2021 21:17:01 - INFO - __main__ - Step 31377: {'lr': 0.0001997017849254304, 'samples': 1004064, 'steps': 1961, 'loss/train': 2.6261978149414062} -09/20/2021 21:17:02 - INFO - __main__ - Step 31378: {'lr': 0.0001997017849254304, 'samples': 1004096, 'steps': 1961, 'loss/train': 2.087305784225464} -09/20/2021 21:17:03 - INFO - __main__ - Step 31379: {'lr': 0.0001997017849254304, 'samples': 1004128, 'steps': 1961, 'loss/train': 2.1965510845184326} -09/20/2021 21:17:04 - INFO - __main__ - Step 31380: {'lr': 0.0001997017849254304, 'samples': 1004160, 'steps': 1961, 'loss/train': 2.5565009117126465} -09/20/2021 21:17:05 - INFO - __main__ - Step 31381: {'lr': 0.0001997017849254304, 'samples': 1004192, 'steps': 1961, 'loss/train': 2.8027188777923584} -09/20/2021 21:17:05 - INFO - __main__ - Step 31382: {'lr': 0.0001997017849254304, 'samples': 1004224, 'steps': 1961, 'loss/train': 1.8274478912353516} -09/20/2021 21:17:06 - INFO - __main__ - Step 31383: {'lr': 0.0001997017849254304, 'samples': 1004256, 'steps': 1961, 'loss/train': 2.4043238162994385} -09/20/2021 21:17:07 - INFO - __main__ - Step 31384: {'lr': 0.0001997017849254304, 'samples': 1004288, 'steps': 1961, 'loss/train': 2.5332984924316406} -09/20/2021 21:17:08 - INFO - __main__ - Step 31385: {'lr': 0.0001997017849254304, 'samples': 1004320, 'steps': 1961, 'loss/train': 2.283015012741089} -09/20/2021 21:17:08 - INFO - __main__ - Step 31386: {'lr': 0.0001997017849254304, 'samples': 1004352, 'steps': 1961, 'loss/train': 3.899846076965332} -09/20/2021 21:17:09 - INFO - __main__ - Step 31387: {'lr': 0.0001997017849254304, 'samples': 1004384, 'steps': 1961, 'loss/train': 2.074470043182373} -09/20/2021 21:17:10 - INFO - __main__ - Step 31388: {'lr': 0.0001997017849254304, 'samples': 1004416, 'steps': 1961, 'loss/train': 1.9648420810699463} -09/20/2021 21:17:11 - INFO - __main__ - Step 31389: {'lr': 0.0001997017849254304, 'samples': 1004448, 'steps': 1961, 'loss/train': 2.4306254386901855} -09/20/2021 21:17:11 - INFO - __main__ - Step 31390: {'lr': 0.0001997017849254304, 'samples': 1004480, 'steps': 1961, 'loss/train': 2.8793485164642334} -09/20/2021 21:17:12 - INFO - __main__ - Step 31391: {'lr': 0.0001997017849254304, 'samples': 1004512, 'steps': 1961, 'loss/train': 2.8945655822753906} -09/20/2021 21:17:13 - INFO - __main__ - Step 31392: {'lr': 0.0001997017849254304, 'samples': 1004544, 'steps': 1961, 'loss/train': 2.6958136558532715} -09/20/2021 21:17:14 - INFO - __main__ - Step 31393: {'lr': 0.00019970129245707862, 'samples': 1004576, 'steps': 1962, 'loss/train': 2.555543899536133} -09/20/2021 21:17:15 - INFO - __main__ - Step 31394: {'lr': 0.00019970129245707862, 'samples': 1004608, 'steps': 1962, 'loss/train': 2.6540989875793457} -09/20/2021 21:17:15 - INFO - __main__ - Step 31395: {'lr': 0.00019970129245707862, 'samples': 1004640, 'steps': 1962, 'loss/train': 1.1397790908813477} -09/20/2021 21:17:16 - INFO - __main__ - Step 31396: {'lr': 0.00019970129245707862, 'samples': 1004672, 'steps': 1962, 'loss/train': 2.122502326965332} -09/20/2021 21:17:17 - INFO - __main__ - Step 31397: {'lr': 0.00019970129245707862, 'samples': 1004704, 'steps': 1962, 'loss/train': 2.5746009349823} -09/20/2021 21:17:18 - INFO - __main__ - Step 31398: {'lr': 0.00019970129245707862, 'samples': 1004736, 'steps': 1962, 'loss/train': 2.38687801361084} -09/20/2021 21:17:18 - INFO - __main__ - Step 31399: {'lr': 0.00019970129245707862, 'samples': 1004768, 'steps': 1962, 'loss/train': 2.053398370742798} -09/20/2021 21:17:19 - INFO - __main__ - Step 31400: {'lr': 0.00019970129245707862, 'samples': 1004800, 'steps': 1962, 'loss/train': 2.7103769779205322} -09/20/2021 21:17:20 - INFO - __main__ - Step 31401: {'lr': 0.00019970129245707862, 'samples': 1004832, 'steps': 1962, 'loss/train': 1.23894464969635} -09/20/2021 21:17:21 - INFO - __main__ - Step 31402: {'lr': 0.00019970129245707862, 'samples': 1004864, 'steps': 1962, 'loss/train': 2.1681277751922607} -09/20/2021 21:17:21 - INFO - __main__ - Step 31403: {'lr': 0.00019970129245707862, 'samples': 1004896, 'steps': 1962, 'loss/train': 1.7792057991027832} -09/20/2021 21:17:22 - INFO - __main__ - Step 31404: {'lr': 0.00019970129245707862, 'samples': 1004928, 'steps': 1962, 'loss/train': 2.1059153079986572} -09/20/2021 21:17:23 - INFO - __main__ - Step 31405: {'lr': 0.00019970129245707862, 'samples': 1004960, 'steps': 1962, 'loss/train': 1.9281586408615112} -09/20/2021 21:17:24 - INFO - __main__ - Step 31406: {'lr': 0.00019970129245707862, 'samples': 1004992, 'steps': 1962, 'loss/train': 2.085845708847046} -09/20/2021 21:17:24 - INFO - __main__ - Step 31407: {'lr': 0.00019970129245707862, 'samples': 1005024, 'steps': 1962, 'loss/train': 2.3591957092285156} -09/20/2021 21:17:25 - INFO - __main__ - Step 31408: {'lr': 0.00019970129245707862, 'samples': 1005056, 'steps': 1962, 'loss/train': 2.4221808910369873} -09/20/2021 21:17:26 - INFO - __main__ - Step 31409: {'lr': 0.00019970079958304268, 'samples': 1005088, 'steps': 1963, 'loss/train': 3.1152713298797607} -09/20/2021 21:17:27 - INFO - __main__ - Step 31410: {'lr': 0.00019970079958304268, 'samples': 1005120, 'steps': 1963, 'loss/train': 2.763237476348877} -09/20/2021 21:17:28 - INFO - __main__ - Step 31411: {'lr': 0.00019970079958304268, 'samples': 1005152, 'steps': 1963, 'loss/train': 3.3001248836517334} -09/20/2021 21:17:29 - INFO - __main__ - Step 31412: {'lr': 0.00019970079958304268, 'samples': 1005184, 'steps': 1963, 'loss/train': 2.048330307006836} -09/20/2021 21:17:30 - INFO - __main__ - Step 31413: {'lr': 0.00019970079958304268, 'samples': 1005216, 'steps': 1963, 'loss/train': 2.257906198501587} -09/20/2021 21:17:30 - INFO - __main__ - Step 31414: {'lr': 0.00019970079958304268, 'samples': 1005248, 'steps': 1963, 'loss/train': 2.58274507522583} -09/20/2021 21:17:31 - INFO - __main__ - Step 31415: {'lr': 0.00019970079958304268, 'samples': 1005280, 'steps': 1963, 'loss/train': 2.2249255180358887} -09/20/2021 21:17:32 - INFO - __main__ - Step 31416: {'lr': 0.00019970079958304268, 'samples': 1005312, 'steps': 1963, 'loss/train': 0.39199402928352356} -09/20/2021 21:17:33 - INFO - __main__ - Step 31417: {'lr': 0.00019970079958304268, 'samples': 1005344, 'steps': 1963, 'loss/train': 0.35372477769851685} -09/20/2021 21:17:33 - INFO - __main__ - Step 31418: {'lr': 0.00019970079958304268, 'samples': 1005376, 'steps': 1963, 'loss/train': 0.2085035890340805} -09/20/2021 21:17:34 - INFO - __main__ - Step 31419: {'lr': 0.00019970079958304268, 'samples': 1005408, 'steps': 1963, 'loss/train': 0.3303864896297455} -09/20/2021 21:17:35 - INFO - __main__ - Step 31420: {'lr': 0.00019970079958304268, 'samples': 1005440, 'steps': 1963, 'loss/train': 1.6295607089996338} -09/20/2021 21:17:36 - INFO - __main__ - Step 31421: {'lr': 0.00019970079958304268, 'samples': 1005472, 'steps': 1963, 'loss/train': 1.034366488456726} -09/20/2021 21:17:36 - INFO - __main__ - Step 31422: {'lr': 0.00019970079958304268, 'samples': 1005504, 'steps': 1963, 'loss/train': 2.4093923568725586} -09/20/2021 21:17:37 - INFO - __main__ - Step 31423: {'lr': 0.00019970079958304268, 'samples': 1005536, 'steps': 1963, 'loss/train': 2.2328710556030273} -09/20/2021 21:17:38 - INFO - __main__ - Step 31424: {'lr': 0.00019970079958304268, 'samples': 1005568, 'steps': 1963, 'loss/train': 2.4186463356018066} -09/20/2021 21:17:39 - INFO - __main__ - Step 31425: {'lr': 0.00019970030630332458, 'samples': 1005600, 'steps': 1964, 'loss/train': 1.482248067855835} -09/20/2021 21:17:40 - INFO - __main__ - Step 31426: {'lr': 0.00019970030630332458, 'samples': 1005632, 'steps': 1964, 'loss/train': 2.535982847213745} -09/20/2021 21:17:40 - INFO - __main__ - Step 31427: {'lr': 0.00019970030630332458, 'samples': 1005664, 'steps': 1964, 'loss/train': 3.0774078369140625} -09/20/2021 21:17:41 - INFO - __main__ - Step 31428: {'lr': 0.00019970030630332458, 'samples': 1005696, 'steps': 1964, 'loss/train': 2.150451421737671} -09/20/2021 21:17:42 - INFO - __main__ - Step 31429: {'lr': 0.00019970030630332458, 'samples': 1005728, 'steps': 1964, 'loss/train': 3.0080482959747314} -09/20/2021 21:17:43 - INFO - __main__ - Step 31430: {'lr': 0.00019970030630332458, 'samples': 1005760, 'steps': 1964, 'loss/train': 1.890092134475708} -09/20/2021 21:17:43 - INFO - __main__ - Step 31431: {'lr': 0.00019970030630332458, 'samples': 1005792, 'steps': 1964, 'loss/train': 0.6262738704681396} -09/20/2021 21:17:44 - INFO - __main__ - Step 31432: {'lr': 0.00019970030630332458, 'samples': 1005824, 'steps': 1964, 'loss/train': 3.303277015686035} -09/20/2021 21:17:45 - INFO - __main__ - Step 31433: {'lr': 0.00019970030630332458, 'samples': 1005856, 'steps': 1964, 'loss/train': 1.5692411661148071} -09/20/2021 21:17:46 - INFO - __main__ - Step 31434: {'lr': 0.00019970030630332458, 'samples': 1005888, 'steps': 1964, 'loss/train': 3.2957968711853027} -09/20/2021 21:17:46 - INFO - __main__ - Step 31435: {'lr': 0.00019970030630332458, 'samples': 1005920, 'steps': 1964, 'loss/train': 2.469269275665283} -09/20/2021 21:17:47 - INFO - __main__ - Step 31436: {'lr': 0.00019970030630332458, 'samples': 1005952, 'steps': 1964, 'loss/train': 2.1550047397613525} -09/20/2021 21:17:48 - INFO - __main__ - Step 31437: {'lr': 0.00019970030630332458, 'samples': 1005984, 'steps': 1964, 'loss/train': 2.0550193786621094} -09/20/2021 21:17:49 - INFO - __main__ - Step 31438: {'lr': 0.00019970030630332458, 'samples': 1006016, 'steps': 1964, 'loss/train': 3.4723870754241943} -09/20/2021 21:17:49 - INFO - __main__ - Step 31439: {'lr': 0.00019970030630332458, 'samples': 1006048, 'steps': 1964, 'loss/train': 2.584688186645508} -09/20/2021 21:17:50 - INFO - __main__ - Step 31440: {'lr': 0.00019970030630332458, 'samples': 1006080, 'steps': 1964, 'loss/train': 1.666847825050354} -09/20/2021 21:17:52 - INFO - __main__ - Step 31441: {'lr': 0.00019969981261792633, 'samples': 1006112, 'steps': 1965, 'loss/train': 2.429719924926758} -09/20/2021 21:17:52 - INFO - __main__ - Step 31442: {'lr': 0.00019969981261792633, 'samples': 1006144, 'steps': 1965, 'loss/train': 1.75575590133667} -09/20/2021 21:17:53 - INFO - __main__ - Step 31443: {'lr': 0.00019969981261792633, 'samples': 1006176, 'steps': 1965, 'loss/train': 3.023560047149658} -09/20/2021 21:17:54 - INFO - __main__ - Step 31444: {'lr': 0.00019969981261792633, 'samples': 1006208, 'steps': 1965, 'loss/train': 2.1461398601531982} -09/20/2021 21:17:55 - INFO - __main__ - Step 31445: {'lr': 0.00019969981261792633, 'samples': 1006240, 'steps': 1965, 'loss/train': 2.5270817279815674} -09/20/2021 21:17:55 - INFO - __main__ - Step 31446: {'lr': 0.00019969981261792633, 'samples': 1006272, 'steps': 1965, 'loss/train': 2.195194721221924} -09/20/2021 21:17:56 - INFO - __main__ - Step 31447: {'lr': 0.00019969981261792633, 'samples': 1006304, 'steps': 1965, 'loss/train': 2.7292773723602295} -09/20/2021 21:17:57 - INFO - __main__ - Step 31448: {'lr': 0.00019969981261792633, 'samples': 1006336, 'steps': 1965, 'loss/train': 2.8216030597686768} -09/20/2021 21:17:58 - INFO - __main__ - Step 31449: {'lr': 0.00019969981261792633, 'samples': 1006368, 'steps': 1965, 'loss/train': 0.3314567506313324} -09/20/2021 21:17:58 - INFO - __main__ - Step 31450: {'lr': 0.00019969981261792633, 'samples': 1006400, 'steps': 1965, 'loss/train': 1.780024528503418} -09/20/2021 21:17:59 - INFO - __main__ - Step 31451: {'lr': 0.00019969981261792633, 'samples': 1006432, 'steps': 1965, 'loss/train': 3.124253511428833} -09/20/2021 21:18:00 - INFO - __main__ - Step 31452: {'lr': 0.00019969981261792633, 'samples': 1006464, 'steps': 1965, 'loss/train': 2.5746023654937744} -09/20/2021 21:18:01 - INFO - __main__ - Step 31453: {'lr': 0.00019969981261792633, 'samples': 1006496, 'steps': 1965, 'loss/train': 2.8148748874664307} -09/20/2021 21:18:01 - INFO - __main__ - Step 31454: {'lr': 0.00019969981261792633, 'samples': 1006528, 'steps': 1965, 'loss/train': 1.4005709886550903} -09/20/2021 21:18:02 - INFO - __main__ - Step 31455: {'lr': 0.00019969981261792633, 'samples': 1006560, 'steps': 1965, 'loss/train': 2.372227191925049} -09/20/2021 21:18:03 - INFO - __main__ - Step 31456: {'lr': 0.00019969981261792633, 'samples': 1006592, 'steps': 1965, 'loss/train': 1.0921974182128906} -09/20/2021 21:18:04 - INFO - __main__ - Step 31457: {'lr': 0.0001996993185268499, 'samples': 1006624, 'steps': 1966, 'loss/train': 2.1074154376983643} -09/20/2021 21:18:04 - INFO - __main__ - Step 31458: {'lr': 0.0001996993185268499, 'samples': 1006656, 'steps': 1966, 'loss/train': 1.2442610263824463} -09/20/2021 21:18:05 - INFO - __main__ - Step 31459: {'lr': 0.0001996993185268499, 'samples': 1006688, 'steps': 1966, 'loss/train': 2.282442331314087} -09/20/2021 21:18:06 - INFO - __main__ - Step 31460: {'lr': 0.0001996993185268499, 'samples': 1006720, 'steps': 1966, 'loss/train': 2.5550386905670166} -09/20/2021 21:18:07 - INFO - __main__ - Step 31461: {'lr': 0.0001996993185268499, 'samples': 1006752, 'steps': 1966, 'loss/train': 2.3236427307128906} -09/20/2021 21:18:07 - INFO - __main__ - Step 31462: {'lr': 0.0001996993185268499, 'samples': 1006784, 'steps': 1966, 'loss/train': 1.5383397340774536} -09/20/2021 21:18:08 - INFO - __main__ - Step 31463: {'lr': 0.0001996993185268499, 'samples': 1006816, 'steps': 1966, 'loss/train': 1.8246594667434692} -09/20/2021 21:18:09 - INFO - __main__ - Step 31464: {'lr': 0.0001996993185268499, 'samples': 1006848, 'steps': 1966, 'loss/train': 1.691819667816162} -09/20/2021 21:18:10 - INFO - __main__ - Step 31465: {'lr': 0.0001996993185268499, 'samples': 1006880, 'steps': 1966, 'loss/train': 1.663489818572998} -09/20/2021 21:18:10 - INFO - __main__ - Step 31466: {'lr': 0.0001996993185268499, 'samples': 1006912, 'steps': 1966, 'loss/train': 2.229522228240967} -09/20/2021 21:18:11 - INFO - __main__ - Step 31467: {'lr': 0.0001996993185268499, 'samples': 1006944, 'steps': 1966, 'loss/train': 3.496915340423584} -09/20/2021 21:18:12 - INFO - __main__ - Step 31468: {'lr': 0.0001996993185268499, 'samples': 1006976, 'steps': 1966, 'loss/train': 3.3908567428588867} -09/20/2021 21:18:13 - INFO - __main__ - Step 31469: {'lr': 0.0001996993185268499, 'samples': 1007008, 'steps': 1966, 'loss/train': 2.2628564834594727} -09/20/2021 21:18:13 - INFO - __main__ - Step 31470: {'lr': 0.0001996993185268499, 'samples': 1007040, 'steps': 1966, 'loss/train': 2.8594820499420166} -09/20/2021 21:18:15 - INFO - __main__ - Step 31471: {'lr': 0.0001996993185268499, 'samples': 1007072, 'steps': 1966, 'loss/train': 2.622898578643799} -09/20/2021 21:18:15 - INFO - __main__ - Step 31472: {'lr': 0.0001996993185268499, 'samples': 1007104, 'steps': 1966, 'loss/train': 1.8278465270996094} -09/20/2021 21:18:16 - INFO - __main__ - Step 31473: {'lr': 0.00019969882403009733, 'samples': 1007136, 'steps': 1967, 'loss/train': 2.1015822887420654} -09/20/2021 21:18:17 - INFO - __main__ - Step 31474: {'lr': 0.00019969882403009733, 'samples': 1007168, 'steps': 1967, 'loss/train': 2.743281841278076} -09/20/2021 21:18:18 - INFO - __main__ - Step 31475: {'lr': 0.00019969882403009733, 'samples': 1007200, 'steps': 1967, 'loss/train': 2.1160027980804443} -09/20/2021 21:18:19 - INFO - __main__ - Step 31476: {'lr': 0.00019969882403009733, 'samples': 1007232, 'steps': 1967, 'loss/train': 2.568774461746216} -09/20/2021 21:18:19 - INFO - __main__ - Step 31477: {'lr': 0.00019969882403009733, 'samples': 1007264, 'steps': 1967, 'loss/train': 2.3714582920074463} -09/20/2021 21:18:20 - INFO - __main__ - Step 31478: {'lr': 0.00019969882403009733, 'samples': 1007296, 'steps': 1967, 'loss/train': 2.373828172683716} -09/20/2021 21:18:21 - INFO - __main__ - Step 31479: {'lr': 0.00019969882403009733, 'samples': 1007328, 'steps': 1967, 'loss/train': 2.518251419067383} -09/20/2021 21:18:22 - INFO - __main__ - Step 31480: {'lr': 0.00019969882403009733, 'samples': 1007360, 'steps': 1967, 'loss/train': 0.5534259676933289} -09/20/2021 21:18:22 - INFO - __main__ - Step 31481: {'lr': 0.00019969882403009733, 'samples': 1007392, 'steps': 1967, 'loss/train': 2.4943606853485107} -09/20/2021 21:18:23 - INFO - __main__ - Step 31482: {'lr': 0.00019969882403009733, 'samples': 1007424, 'steps': 1967, 'loss/train': 2.3965442180633545} -09/20/2021 21:18:24 - INFO - __main__ - Step 31483: {'lr': 0.00019969882403009733, 'samples': 1007456, 'steps': 1967, 'loss/train': 2.2200565338134766} -09/20/2021 21:18:25 - INFO - __main__ - Step 31484: {'lr': 0.00019969882403009733, 'samples': 1007488, 'steps': 1967, 'loss/train': 1.8932459354400635} -09/20/2021 21:18:25 - INFO - __main__ - Step 31485: {'lr': 0.00019969882403009733, 'samples': 1007520, 'steps': 1967, 'loss/train': 2.7202627658843994} -09/20/2021 21:18:26 - INFO - __main__ - Step 31486: {'lr': 0.00019969882403009733, 'samples': 1007552, 'steps': 1967, 'loss/train': 3.052297830581665} -09/20/2021 21:18:27 - INFO - __main__ - Step 31487: {'lr': 0.00019969882403009733, 'samples': 1007584, 'steps': 1967, 'loss/train': 1.9101762771606445} -09/20/2021 21:18:28 - INFO - __main__ - Step 31488: {'lr': 0.00019969882403009733, 'samples': 1007616, 'steps': 1967, 'loss/train': 2.3004398345947266} -09/20/2021 21:18:28 - INFO - __main__ - Step 31489: {'lr': 0.00019969832912767064, 'samples': 1007648, 'steps': 1968, 'loss/train': 2.102060079574585} -09/20/2021 21:18:29 - INFO - __main__ - Step 31490: {'lr': 0.00019969832912767064, 'samples': 1007680, 'steps': 1968, 'loss/train': 2.7175824642181396} -09/20/2021 21:18:30 - INFO - __main__ - Step 31491: {'lr': 0.00019969832912767064, 'samples': 1007712, 'steps': 1968, 'loss/train': 3.797280788421631} -09/20/2021 21:18:31 - INFO - __main__ - Step 31492: {'lr': 0.00019969832912767064, 'samples': 1007744, 'steps': 1968, 'loss/train': 2.5249569416046143} -09/20/2021 21:18:31 - INFO - __main__ - Step 31493: {'lr': 0.00019969832912767064, 'samples': 1007776, 'steps': 1968, 'loss/train': 2.500831365585327} -09/20/2021 21:18:32 - INFO - __main__ - Step 31494: {'lr': 0.00019969832912767064, 'samples': 1007808, 'steps': 1968, 'loss/train': 2.163818120956421} -09/20/2021 21:18:33 - INFO - __main__ - Step 31495: {'lr': 0.00019969832912767064, 'samples': 1007840, 'steps': 1968, 'loss/train': 2.449254274368286} -09/20/2021 21:18:34 - INFO - __main__ - Step 31496: {'lr': 0.00019969832912767064, 'samples': 1007872, 'steps': 1968, 'loss/train': 2.5977635383605957} -09/20/2021 21:18:34 - INFO - __main__ - Step 31497: {'lr': 0.00019969832912767064, 'samples': 1007904, 'steps': 1968, 'loss/train': 2.743821382522583} -09/20/2021 21:18:35 - INFO - __main__ - Step 31498: {'lr': 0.00019969832912767064, 'samples': 1007936, 'steps': 1968, 'loss/train': 1.9313017129898071} -09/20/2021 21:18:36 - INFO - __main__ - Step 31499: {'lr': 0.00019969832912767064, 'samples': 1007968, 'steps': 1968, 'loss/train': 4.529175281524658} -09/20/2021 21:18:37 - INFO - __main__ - Step 31500: {'lr': 0.00019969832912767064, 'samples': 1008000, 'steps': 1968, 'loss/train': 2.427727460861206} -09/20/2021 21:18:37 - INFO - __main__ - Step 31501: {'lr': 0.00019969832912767064, 'samples': 1008032, 'steps': 1968, 'loss/train': 2.357736110687256} -09/20/2021 21:18:39 - INFO - __main__ - Step 31502: {'lr': 0.00019969832912767064, 'samples': 1008064, 'steps': 1968, 'loss/train': 2.345344066619873} -09/20/2021 21:18:40 - INFO - __main__ - Step 31503: {'lr': 0.00019969832912767064, 'samples': 1008096, 'steps': 1968, 'loss/train': 1.6825525760650635} -09/20/2021 21:18:40 - INFO - __main__ - Step 31504: {'lr': 0.00019969832912767064, 'samples': 1008128, 'steps': 1968, 'loss/train': 2.6878809928894043} -09/20/2021 21:18:41 - INFO - __main__ - Step 31505: {'lr': 0.00019969783381957188, 'samples': 1008160, 'steps': 1969, 'loss/train': 3.334886312484741} -09/20/2021 21:18:42 - INFO - __main__ - Step 31506: {'lr': 0.00019969783381957188, 'samples': 1008192, 'steps': 1969, 'loss/train': 2.3041460514068604} -09/20/2021 21:18:43 - INFO - __main__ - Step 31507: {'lr': 0.00019969783381957188, 'samples': 1008224, 'steps': 1969, 'loss/train': 1.9865621328353882} -09/20/2021 21:18:43 - INFO - __main__ - Step 31508: {'lr': 0.00019969783381957188, 'samples': 1008256, 'steps': 1969, 'loss/train': 3.110321521759033} -09/20/2021 21:18:44 - INFO - __main__ - Step 31509: {'lr': 0.00019969783381957188, 'samples': 1008288, 'steps': 1969, 'loss/train': 4.414320468902588} -09/20/2021 21:18:45 - INFO - __main__ - Step 31510: {'lr': 0.00019969783381957188, 'samples': 1008320, 'steps': 1969, 'loss/train': 2.662099599838257} -09/20/2021 21:18:46 - INFO - __main__ - Step 31511: {'lr': 0.00019969783381957188, 'samples': 1008352, 'steps': 1969, 'loss/train': 2.4853768348693848} -09/20/2021 21:18:46 - INFO - __main__ - Step 31512: {'lr': 0.00019969783381957188, 'samples': 1008384, 'steps': 1969, 'loss/train': 2.772956609725952} -09/20/2021 21:18:47 - INFO - __main__ - Step 31513: {'lr': 0.00019969783381957188, 'samples': 1008416, 'steps': 1969, 'loss/train': 2.064999580383301} -09/20/2021 21:18:48 - INFO - __main__ - Step 31514: {'lr': 0.00019969783381957188, 'samples': 1008448, 'steps': 1969, 'loss/train': 2.248108386993408} -09/20/2021 21:18:49 - INFO - __main__ - Step 31515: {'lr': 0.00019969783381957188, 'samples': 1008480, 'steps': 1969, 'loss/train': 1.9852893352508545} -09/20/2021 21:18:49 - INFO - __main__ - Step 31516: {'lr': 0.00019969783381957188, 'samples': 1008512, 'steps': 1969, 'loss/train': 2.222686290740967} -09/20/2021 21:18:50 - INFO - __main__ - Step 31517: {'lr': 0.00019969783381957188, 'samples': 1008544, 'steps': 1969, 'loss/train': 2.369804859161377} -09/20/2021 21:18:51 - INFO - __main__ - Step 31518: {'lr': 0.00019969783381957188, 'samples': 1008576, 'steps': 1969, 'loss/train': 2.074418783187866} -09/20/2021 21:18:52 - INFO - __main__ - Step 31519: {'lr': 0.00019969783381957188, 'samples': 1008608, 'steps': 1969, 'loss/train': 3.2425644397735596} -09/20/2021 21:18:52 - INFO - __main__ - Step 31520: {'lr': 0.00019969783381957188, 'samples': 1008640, 'steps': 1969, 'loss/train': 3.3435587882995605} -09/20/2021 21:18:53 - INFO - __main__ - Step 31521: {'lr': 0.00019969733810580297, 'samples': 1008672, 'steps': 1970, 'loss/train': 2.2868294715881348} -09/20/2021 21:18:54 - INFO - __main__ - Step 31522: {'lr': 0.00019969733810580297, 'samples': 1008704, 'steps': 1970, 'loss/train': 2.818814516067505} -09/20/2021 21:18:55 - INFO - __main__ - Step 31523: {'lr': 0.00019969733810580297, 'samples': 1008736, 'steps': 1970, 'loss/train': 2.428999900817871} -09/20/2021 21:18:56 - INFO - __main__ - Step 31524: {'lr': 0.00019969733810580297, 'samples': 1008768, 'steps': 1970, 'loss/train': 2.1291635036468506} -09/20/2021 21:18:56 - INFO - __main__ - Step 31525: {'lr': 0.00019969733810580297, 'samples': 1008800, 'steps': 1970, 'loss/train': 3.25811767578125} -09/20/2021 21:18:57 - INFO - __main__ - Step 31526: {'lr': 0.00019969733810580297, 'samples': 1008832, 'steps': 1970, 'loss/train': 1.7981703281402588} -09/20/2021 21:18:58 - INFO - __main__ - Step 31527: {'lr': 0.00019969733810580297, 'samples': 1008864, 'steps': 1970, 'loss/train': 1.408454179763794} -09/20/2021 21:18:59 - INFO - __main__ - Step 31528: {'lr': 0.00019969733810580297, 'samples': 1008896, 'steps': 1970, 'loss/train': 1.27688729763031} -09/20/2021 21:18:59 - INFO - __main__ - Step 31529: {'lr': 0.00019969733810580297, 'samples': 1008928, 'steps': 1970, 'loss/train': 1.3045586347579956} -09/20/2021 21:19:00 - INFO - __main__ - Step 31530: {'lr': 0.00019969733810580297, 'samples': 1008960, 'steps': 1970, 'loss/train': 2.4262423515319824} -09/20/2021 21:19:01 - INFO - __main__ - Step 31531: {'lr': 0.00019969733810580297, 'samples': 1008992, 'steps': 1970, 'loss/train': 3.1360549926757812} -09/20/2021 21:19:02 - INFO - __main__ - Step 31532: {'lr': 0.00019969733810580297, 'samples': 1009024, 'steps': 1970, 'loss/train': 3.55167555809021} -09/20/2021 21:19:02 - INFO - __main__ - Step 31533: {'lr': 0.00019969733810580297, 'samples': 1009056, 'steps': 1970, 'loss/train': 1.4576743841171265} -09/20/2021 21:19:04 - INFO - __main__ - Step 31534: {'lr': 0.00019969733810580297, 'samples': 1009088, 'steps': 1970, 'loss/train': 4.16673469543457} -09/20/2021 21:19:04 - INFO - __main__ - Step 31535: {'lr': 0.00019969733810580297, 'samples': 1009120, 'steps': 1970, 'loss/train': 2.3962481021881104} -09/20/2021 21:19:05 - INFO - __main__ - Step 31536: {'lr': 0.00019969733810580297, 'samples': 1009152, 'steps': 1970, 'loss/train': 2.4895920753479004} -09/20/2021 21:19:06 - INFO - __main__ - Step 31537: {'lr': 0.000199696841986366, 'samples': 1009184, 'steps': 1971, 'loss/train': 2.284595012664795} -09/20/2021 21:19:07 - INFO - __main__ - Step 31538: {'lr': 0.000199696841986366, 'samples': 1009216, 'steps': 1971, 'loss/train': 2.1470327377319336} -09/20/2021 21:19:08 - INFO - __main__ - Step 31539: {'lr': 0.000199696841986366, 'samples': 1009248, 'steps': 1971, 'loss/train': 2.52140212059021} -09/20/2021 21:19:08 - INFO - __main__ - Step 31540: {'lr': 0.000199696841986366, 'samples': 1009280, 'steps': 1971, 'loss/train': 2.455796957015991} -09/20/2021 21:19:09 - INFO - __main__ - Step 31541: {'lr': 0.000199696841986366, 'samples': 1009312, 'steps': 1971, 'loss/train': 1.5714592933654785} -09/20/2021 21:19:10 - INFO - __main__ - Step 31542: {'lr': 0.000199696841986366, 'samples': 1009344, 'steps': 1971, 'loss/train': 0.4036664366722107} -09/20/2021 21:19:11 - INFO - __main__ - Step 31543: {'lr': 0.000199696841986366, 'samples': 1009376, 'steps': 1971, 'loss/train': 0.33702751994132996} -09/20/2021 21:19:11 - INFO - __main__ - Step 31544: {'lr': 0.000199696841986366, 'samples': 1009408, 'steps': 1971, 'loss/train': 0.26284220814704895} -09/20/2021 21:19:12 - INFO - __main__ - Step 31545: {'lr': 0.000199696841986366, 'samples': 1009440, 'steps': 1971, 'loss/train': 2.041282892227173} -09/20/2021 21:19:13 - INFO - __main__ - Step 31546: {'lr': 0.000199696841986366, 'samples': 1009472, 'steps': 1971, 'loss/train': 2.5235912799835205} -09/20/2021 21:19:14 - INFO - __main__ - Step 31547: {'lr': 0.000199696841986366, 'samples': 1009504, 'steps': 1971, 'loss/train': 2.35304594039917} -09/20/2021 21:19:14 - INFO - __main__ - Step 31548: {'lr': 0.000199696841986366, 'samples': 1009536, 'steps': 1971, 'loss/train': 1.3021265268325806} -09/20/2021 21:19:15 - INFO - __main__ - Step 31549: {'lr': 0.000199696841986366, 'samples': 1009568, 'steps': 1971, 'loss/train': 0.7903569340705872} -09/20/2021 21:19:16 - INFO - __main__ - Step 31550: {'lr': 0.000199696841986366, 'samples': 1009600, 'steps': 1971, 'loss/train': 2.9908506870269775} -09/20/2021 21:19:17 - INFO - __main__ - Step 31551: {'lr': 0.000199696841986366, 'samples': 1009632, 'steps': 1971, 'loss/train': 2.916807174682617} -09/20/2021 21:19:17 - INFO - __main__ - Step 31552: {'lr': 0.000199696841986366, 'samples': 1009664, 'steps': 1971, 'loss/train': 2.513607978820801} -09/20/2021 21:19:18 - INFO - __main__ - Step 31553: {'lr': 0.00019969634546126294, 'samples': 1009696, 'steps': 1972, 'loss/train': 1.9669336080551147} -09/20/2021 21:19:19 - INFO - __main__ - Step 31554: {'lr': 0.00019969634546126294, 'samples': 1009728, 'steps': 1972, 'loss/train': 3.207871198654175} -09/20/2021 21:19:20 - INFO - __main__ - Step 31555: {'lr': 0.00019969634546126294, 'samples': 1009760, 'steps': 1972, 'loss/train': 2.5119359493255615} -09/20/2021 21:19:20 - INFO - __main__ - Step 31556: {'lr': 0.00019969634546126294, 'samples': 1009792, 'steps': 1972, 'loss/train': 2.0319972038269043} -09/20/2021 21:19:21 - INFO - __main__ - Step 31557: {'lr': 0.00019969634546126294, 'samples': 1009824, 'steps': 1972, 'loss/train': 1.5223039388656616} -09/20/2021 21:19:22 - INFO - __main__ - Step 31558: {'lr': 0.00019969634546126294, 'samples': 1009856, 'steps': 1972, 'loss/train': 1.2544915676116943} -09/20/2021 21:19:23 - INFO - __main__ - Step 31559: {'lr': 0.00019969634546126294, 'samples': 1009888, 'steps': 1972, 'loss/train': 2.554765462875366} -09/20/2021 21:19:23 - INFO - __main__ - Step 31560: {'lr': 0.00019969634546126294, 'samples': 1009920, 'steps': 1972, 'loss/train': 1.4694324731826782} -09/20/2021 21:19:24 - INFO - __main__ - Step 31561: {'lr': 0.00019969634546126294, 'samples': 1009952, 'steps': 1972, 'loss/train': 3.136111259460449} -09/20/2021 21:19:25 - INFO - __main__ - Step 31562: {'lr': 0.00019969634546126294, 'samples': 1009984, 'steps': 1972, 'loss/train': 2.1167848110198975} -09/20/2021 21:19:26 - INFO - __main__ - Step 31563: {'lr': 0.00019969634546126294, 'samples': 1010016, 'steps': 1972, 'loss/train': 3.5711004734039307} -09/20/2021 21:19:26 - INFO - __main__ - Step 31564: {'lr': 0.00019969634546126294, 'samples': 1010048, 'steps': 1972, 'loss/train': 2.275268316268921} -09/20/2021 21:19:28 - INFO - __main__ - Step 31565: {'lr': 0.00019969634546126294, 'samples': 1010080, 'steps': 1972, 'loss/train': 3.323650360107422} -09/20/2021 21:19:29 - INFO - __main__ - Step 31566: {'lr': 0.00019969634546126294, 'samples': 1010112, 'steps': 1972, 'loss/train': 3.7508020401000977} -09/20/2021 21:19:30 - INFO - __main__ - Step 31567: {'lr': 0.00019969634546126294, 'samples': 1010144, 'steps': 1972, 'loss/train': 3.306365489959717} -09/20/2021 21:19:30 - INFO - __main__ - Step 31568: {'lr': 0.00019969634546126294, 'samples': 1010176, 'steps': 1972, 'loss/train': 3.445007085800171} -09/20/2021 21:19:31 - INFO - __main__ - Step 31569: {'lr': 0.00019969584853049587, 'samples': 1010208, 'steps': 1973, 'loss/train': 2.238809585571289} -09/20/2021 21:19:32 - INFO - __main__ - Step 31570: {'lr': 0.00019969584853049587, 'samples': 1010240, 'steps': 1973, 'loss/train': 3.0246357917785645} -09/20/2021 21:19:33 - INFO - __main__ - Step 31571: {'lr': 0.00019969584853049587, 'samples': 1010272, 'steps': 1973, 'loss/train': 3.028306722640991} -09/20/2021 21:19:33 - INFO - __main__ - Step 31572: {'lr': 0.00019969584853049587, 'samples': 1010304, 'steps': 1973, 'loss/train': 2.601518154144287} -09/20/2021 21:19:34 - INFO - __main__ - Step 31573: {'lr': 0.00019969584853049587, 'samples': 1010336, 'steps': 1973, 'loss/train': 3.1875603199005127} -09/20/2021 21:19:35 - INFO - __main__ - Step 31574: {'lr': 0.00019969584853049587, 'samples': 1010368, 'steps': 1973, 'loss/train': 3.302687644958496} -09/20/2021 21:19:36 - INFO - __main__ - Step 31575: {'lr': 0.00019969584853049587, 'samples': 1010400, 'steps': 1973, 'loss/train': 3.545482635498047} -09/20/2021 21:19:37 - INFO - __main__ - Step 31576: {'lr': 0.00019969584853049587, 'samples': 1010432, 'steps': 1973, 'loss/train': 2.3375422954559326} -09/20/2021 21:19:37 - INFO - __main__ - Step 31577: {'lr': 0.00019969584853049587, 'samples': 1010464, 'steps': 1973, 'loss/train': 2.688082456588745} -09/20/2021 21:19:38 - INFO - __main__ - Step 31578: {'lr': 0.00019969584853049587, 'samples': 1010496, 'steps': 1973, 'loss/train': 1.9154294729232788} -09/20/2021 21:19:39 - INFO - __main__ - Step 31579: {'lr': 0.00019969584853049587, 'samples': 1010528, 'steps': 1973, 'loss/train': 2.0327305793762207} -09/20/2021 21:19:40 - INFO - __main__ - Step 31580: {'lr': 0.00019969584853049587, 'samples': 1010560, 'steps': 1973, 'loss/train': 2.129906415939331} -09/20/2021 21:19:40 - INFO - __main__ - Step 31581: {'lr': 0.00019969584853049587, 'samples': 1010592, 'steps': 1973, 'loss/train': 3.2861523628234863} -09/20/2021 21:19:41 - INFO - __main__ - Step 31582: {'lr': 0.00019969584853049587, 'samples': 1010624, 'steps': 1973, 'loss/train': 2.3191897869110107} -09/20/2021 21:19:42 - INFO - __main__ - Step 31583: {'lr': 0.00019969584853049587, 'samples': 1010656, 'steps': 1973, 'loss/train': 3.4759902954101562} -09/20/2021 21:19:43 - INFO - __main__ - Step 31584: {'lr': 0.00019969584853049587, 'samples': 1010688, 'steps': 1973, 'loss/train': 2.992917537689209} -09/20/2021 21:19:43 - INFO - __main__ - Step 31585: {'lr': 0.00019969535119406678, 'samples': 1010720, 'steps': 1974, 'loss/train': 3.6238110065460205} -09/20/2021 21:19:44 - INFO - __main__ - Step 31586: {'lr': 0.00019969535119406678, 'samples': 1010752, 'steps': 1974, 'loss/train': 2.753249406814575} -09/20/2021 21:19:45 - INFO - __main__ - Step 31587: {'lr': 0.00019969535119406678, 'samples': 1010784, 'steps': 1974, 'loss/train': 2.568247079849243} -09/20/2021 21:19:46 - INFO - __main__ - Step 31588: {'lr': 0.00019969535119406678, 'samples': 1010816, 'steps': 1974, 'loss/train': 3.148252248764038} -09/20/2021 21:19:46 - INFO - __main__ - Step 31589: {'lr': 0.00019969535119406678, 'samples': 1010848, 'steps': 1974, 'loss/train': 2.555046796798706} -09/20/2021 21:19:47 - INFO - __main__ - Step 31590: {'lr': 0.00019969535119406678, 'samples': 1010880, 'steps': 1974, 'loss/train': 2.696157217025757} -09/20/2021 21:19:48 - INFO - __main__ - Step 31591: {'lr': 0.00019969535119406678, 'samples': 1010912, 'steps': 1974, 'loss/train': 2.7870635986328125} -09/20/2021 21:19:49 - INFO - __main__ - Step 31592: {'lr': 0.00019969535119406678, 'samples': 1010944, 'steps': 1974, 'loss/train': 1.6108673810958862} -09/20/2021 21:19:49 - INFO - __main__ - Step 31593: {'lr': 0.00019969535119406678, 'samples': 1010976, 'steps': 1974, 'loss/train': 2.0462002754211426} -09/20/2021 21:19:50 - INFO - __main__ - Step 31594: {'lr': 0.00019969535119406678, 'samples': 1011008, 'steps': 1974, 'loss/train': 3.2775611877441406} -09/20/2021 21:19:51 - INFO - __main__ - Step 31595: {'lr': 0.00019969535119406678, 'samples': 1011040, 'steps': 1974, 'loss/train': 2.350794792175293} -09/20/2021 21:19:52 - INFO - __main__ - Step 31596: {'lr': 0.00019969535119406678, 'samples': 1011072, 'steps': 1974, 'loss/train': 2.7515320777893066} -09/20/2021 21:19:52 - INFO - __main__ - Step 31597: {'lr': 0.00019969535119406678, 'samples': 1011104, 'steps': 1974, 'loss/train': 2.341749429702759} -09/20/2021 21:19:53 - INFO - __main__ - Step 31598: {'lr': 0.00019969535119406678, 'samples': 1011136, 'steps': 1974, 'loss/train': 1.7376514673233032} -09/20/2021 21:19:54 - INFO - __main__ - Step 31599: {'lr': 0.00019969535119406678, 'samples': 1011168, 'steps': 1974, 'loss/train': 5.941253185272217} -09/20/2021 21:19:55 - INFO - __main__ - Step 31600: {'lr': 0.00019969535119406678, 'samples': 1011200, 'steps': 1974, 'loss/train': 2.6558456420898438} -09/20/2021 21:19:57 - INFO - __main__ - Step 31601: {'lr': 0.00019969485345197767, 'samples': 1011232, 'steps': 1975, 'loss/train': 2.24770450592041} -09/20/2021 21:19:57 - INFO - __main__ - Step 31602: {'lr': 0.00019969485345197767, 'samples': 1011264, 'steps': 1975, 'loss/train': 2.5377438068389893} -09/20/2021 21:19:58 - INFO - __main__ - Step 31603: {'lr': 0.00019969485345197767, 'samples': 1011296, 'steps': 1975, 'loss/train': 2.0183920860290527} -09/20/2021 21:19:59 - INFO - __main__ - Step 31604: {'lr': 0.00019969485345197767, 'samples': 1011328, 'steps': 1975, 'loss/train': 1.746075987815857} -09/20/2021 21:20:00 - INFO - __main__ - Step 31605: {'lr': 0.00019969485345197767, 'samples': 1011360, 'steps': 1975, 'loss/train': 2.783731698989868} -09/20/2021 21:20:00 - INFO - __main__ - Step 31606: {'lr': 0.00019969485345197767, 'samples': 1011392, 'steps': 1975, 'loss/train': 0.5795975923538208} -09/20/2021 21:20:01 - INFO - __main__ - Step 31607: {'lr': 0.00019969485345197767, 'samples': 1011424, 'steps': 1975, 'loss/train': 2.3855056762695312} -09/20/2021 21:20:02 - INFO - __main__ - Step 31608: {'lr': 0.00019969485345197767, 'samples': 1011456, 'steps': 1975, 'loss/train': 6.19925594329834} -09/20/2021 21:20:03 - INFO - __main__ - Step 31609: {'lr': 0.00019969485345197767, 'samples': 1011488, 'steps': 1975, 'loss/train': 6.307461261749268} -09/20/2021 21:20:03 - INFO - __main__ - Step 31610: {'lr': 0.00019969485345197767, 'samples': 1011520, 'steps': 1975, 'loss/train': 3.304513931274414} -09/20/2021 21:20:04 - INFO - __main__ - Step 31611: {'lr': 0.00019969485345197767, 'samples': 1011552, 'steps': 1975, 'loss/train': 0.8712846636772156} -09/20/2021 21:20:05 - INFO - __main__ - Step 31612: {'lr': 0.00019969485345197767, 'samples': 1011584, 'steps': 1975, 'loss/train': 2.1852478981018066} -09/20/2021 21:20:06 - INFO - __main__ - Step 31613: {'lr': 0.00019969485345197767, 'samples': 1011616, 'steps': 1975, 'loss/train': 2.7822327613830566} -09/20/2021 21:20:06 - INFO - __main__ - Step 31614: {'lr': 0.00019969485345197767, 'samples': 1011648, 'steps': 1975, 'loss/train': 1.6052470207214355} -09/20/2021 21:20:07 - INFO - __main__ - Step 31615: {'lr': 0.00019969485345197767, 'samples': 1011680, 'steps': 1975, 'loss/train': 2.3066537380218506} -09/20/2021 21:20:08 - INFO - __main__ - Step 31616: {'lr': 0.00019969485345197767, 'samples': 1011712, 'steps': 1975, 'loss/train': 2.3963401317596436} -09/20/2021 21:20:09 - INFO - __main__ - Step 31617: {'lr': 0.0001996943553042306, 'samples': 1011744, 'steps': 1976, 'loss/train': 0.6912631392478943} -09/20/2021 21:20:10 - INFO - __main__ - Step 31618: {'lr': 0.0001996943553042306, 'samples': 1011776, 'steps': 1976, 'loss/train': 0.5011476874351501} -09/20/2021 21:20:10 - INFO - __main__ - Step 31619: {'lr': 0.0001996943553042306, 'samples': 1011808, 'steps': 1976, 'loss/train': 0.6180089116096497} -09/20/2021 21:20:11 - INFO - __main__ - Step 31620: {'lr': 0.0001996943553042306, 'samples': 1011840, 'steps': 1976, 'loss/train': 0.1461876481771469} -09/20/2021 21:20:12 - INFO - __main__ - Step 31621: {'lr': 0.0001996943553042306, 'samples': 1011872, 'steps': 1976, 'loss/train': 2.125922679901123} -09/20/2021 21:20:13 - INFO - __main__ - Step 31622: {'lr': 0.0001996943553042306, 'samples': 1011904, 'steps': 1976, 'loss/train': 2.384709358215332} -09/20/2021 21:20:13 - INFO - __main__ - Step 31623: {'lr': 0.0001996943553042306, 'samples': 1011936, 'steps': 1976, 'loss/train': 2.3555490970611572} -09/20/2021 21:20:14 - INFO - __main__ - Step 31624: {'lr': 0.0001996943553042306, 'samples': 1011968, 'steps': 1976, 'loss/train': 2.812096357345581} -09/20/2021 21:20:15 - INFO - __main__ - Step 31625: {'lr': 0.0001996943553042306, 'samples': 1012000, 'steps': 1976, 'loss/train': 3.2181031703948975} -09/20/2021 21:20:16 - INFO - __main__ - Step 31626: {'lr': 0.0001996943553042306, 'samples': 1012032, 'steps': 1976, 'loss/train': 2.7601170539855957} -09/20/2021 21:20:16 - INFO - __main__ - Step 31627: {'lr': 0.0001996943553042306, 'samples': 1012064, 'steps': 1976, 'loss/train': 0.7998552918434143} -09/20/2021 21:20:17 - INFO - __main__ - Step 31628: {'lr': 0.0001996943553042306, 'samples': 1012096, 'steps': 1976, 'loss/train': 2.740370988845825} -09/20/2021 21:20:18 - INFO - __main__ - Step 31629: {'lr': 0.0001996943553042306, 'samples': 1012128, 'steps': 1976, 'loss/train': 2.8379411697387695} -09/20/2021 21:20:19 - INFO - __main__ - Step 31630: {'lr': 0.0001996943553042306, 'samples': 1012160, 'steps': 1976, 'loss/train': 2.237959146499634} -09/20/2021 21:20:19 - INFO - __main__ - Step 31631: {'lr': 0.0001996943553042306, 'samples': 1012192, 'steps': 1976, 'loss/train': 1.4116778373718262} -09/20/2021 21:20:20 - INFO - __main__ - Step 31632: {'lr': 0.0001996943553042306, 'samples': 1012224, 'steps': 1976, 'loss/train': 2.4777748584747314} -09/20/2021 21:20:22 - INFO - __main__ - Step 31633: {'lr': 0.00019969385675082756, 'samples': 1012256, 'steps': 1977, 'loss/train': 2.1965010166168213} -09/20/2021 21:20:22 - INFO - __main__ - Step 31634: {'lr': 0.00019969385675082756, 'samples': 1012288, 'steps': 1977, 'loss/train': 2.3927090167999268} -09/20/2021 21:20:23 - INFO - __main__ - Step 31635: {'lr': 0.00019969385675082756, 'samples': 1012320, 'steps': 1977, 'loss/train': 1.999665379524231} -09/20/2021 21:20:24 - INFO - __main__ - Step 31636: {'lr': 0.00019969385675082756, 'samples': 1012352, 'steps': 1977, 'loss/train': 2.2622718811035156} -09/20/2021 21:20:25 - INFO - __main__ - Step 31637: {'lr': 0.00019969385675082756, 'samples': 1012384, 'steps': 1977, 'loss/train': 3.091695547103882} -09/20/2021 21:20:25 - INFO - __main__ - Step 31638: {'lr': 0.00019969385675082756, 'samples': 1012416, 'steps': 1977, 'loss/train': 2.1343109607696533} -09/20/2021 21:20:26 - INFO - __main__ - Step 31639: {'lr': 0.00019969385675082756, 'samples': 1012448, 'steps': 1977, 'loss/train': 2.706446886062622} -09/20/2021 21:20:27 - INFO - __main__ - Step 31640: {'lr': 0.00019969385675082756, 'samples': 1012480, 'steps': 1977, 'loss/train': 2.228151798248291} -09/20/2021 21:20:28 - INFO - __main__ - Step 31641: {'lr': 0.00019969385675082756, 'samples': 1012512, 'steps': 1977, 'loss/train': 1.454088807106018} -09/20/2021 21:20:28 - INFO - __main__ - Step 31642: {'lr': 0.00019969385675082756, 'samples': 1012544, 'steps': 1977, 'loss/train': 2.328097105026245} -09/20/2021 21:20:29 - INFO - __main__ - Step 31643: {'lr': 0.00019969385675082756, 'samples': 1012576, 'steps': 1977, 'loss/train': 1.5599898099899292} -09/20/2021 21:20:30 - INFO - __main__ - Step 31644: {'lr': 0.00019969385675082756, 'samples': 1012608, 'steps': 1977, 'loss/train': 2.6908388137817383} -09/20/2021 21:20:31 - INFO - __main__ - Step 31645: {'lr': 0.00019969385675082756, 'samples': 1012640, 'steps': 1977, 'loss/train': 2.128124237060547} -09/20/2021 21:20:31 - INFO - __main__ - Step 31646: {'lr': 0.00019969385675082756, 'samples': 1012672, 'steps': 1977, 'loss/train': 2.1814467906951904} -09/20/2021 21:20:32 - INFO - __main__ - Step 31647: {'lr': 0.00019969385675082756, 'samples': 1012704, 'steps': 1977, 'loss/train': 2.773422956466675} -09/20/2021 21:20:33 - INFO - __main__ - Step 31648: {'lr': 0.00019969385675082756, 'samples': 1012736, 'steps': 1977, 'loss/train': 3.014699935913086} -09/20/2021 21:20:34 - INFO - __main__ - Step 31649: {'lr': 0.00019969335779177066, 'samples': 1012768, 'steps': 1978, 'loss/train': 2.2584919929504395} -09/20/2021 21:20:34 - INFO - __main__ - Step 31650: {'lr': 0.00019969335779177066, 'samples': 1012800, 'steps': 1978, 'loss/train': 2.342311143875122} -09/20/2021 21:20:35 - INFO - __main__ - Step 31651: {'lr': 0.00019969335779177066, 'samples': 1012832, 'steps': 1978, 'loss/train': 2.8845345973968506} -09/20/2021 21:20:36 - INFO - __main__ - Step 31652: {'lr': 0.00019969335779177066, 'samples': 1012864, 'steps': 1978, 'loss/train': 3.0915305614471436} -09/20/2021 21:20:37 - INFO - __main__ - Step 31653: {'lr': 0.00019969335779177066, 'samples': 1012896, 'steps': 1978, 'loss/train': 2.199401617050171} -09/20/2021 21:20:37 - INFO - __main__ - Step 31654: {'lr': 0.00019969335779177066, 'samples': 1012928, 'steps': 1978, 'loss/train': 2.3729937076568604} -09/20/2021 21:20:38 - INFO - __main__ - Step 31655: {'lr': 0.00019969335779177066, 'samples': 1012960, 'steps': 1978, 'loss/train': 2.931593179702759} -09/20/2021 21:20:39 - INFO - __main__ - Step 31656: {'lr': 0.00019969335779177066, 'samples': 1012992, 'steps': 1978, 'loss/train': 1.9734939336776733} -09/20/2021 21:20:40 - INFO - __main__ - Step 31657: {'lr': 0.00019969335779177066, 'samples': 1013024, 'steps': 1978, 'loss/train': 2.487544536590576} -09/20/2021 21:20:40 - INFO - __main__ - Step 31658: {'lr': 0.00019969335779177066, 'samples': 1013056, 'steps': 1978, 'loss/train': 2.306305170059204} -09/20/2021 21:20:41 - INFO - __main__ - Step 31659: {'lr': 0.00019969335779177066, 'samples': 1013088, 'steps': 1978, 'loss/train': 3.3744802474975586} -09/20/2021 21:20:42 - INFO - __main__ - Step 31660: {'lr': 0.00019969335779177066, 'samples': 1013120, 'steps': 1978, 'loss/train': 0.8682552576065063} -09/20/2021 21:20:43 - INFO - __main__ - Step 31661: {'lr': 0.00019969335779177066, 'samples': 1013152, 'steps': 1978, 'loss/train': 3.412879467010498} -09/20/2021 21:20:43 - INFO - __main__ - Step 31662: {'lr': 0.00019969335779177066, 'samples': 1013184, 'steps': 1978, 'loss/train': 3.7223269939422607} -09/20/2021 21:20:44 - INFO - __main__ - Step 31663: {'lr': 0.00019969335779177066, 'samples': 1013216, 'steps': 1978, 'loss/train': 1.1852571964263916} -09/20/2021 21:20:45 - INFO - __main__ - Step 31664: {'lr': 0.00019969335779177066, 'samples': 1013248, 'steps': 1978, 'loss/train': 2.5739641189575195} -09/20/2021 21:20:46 - INFO - __main__ - Step 31665: {'lr': 0.0001996928584270618, 'samples': 1013280, 'steps': 1979, 'loss/train': 1.7456978559494019} -09/20/2021 21:20:47 - INFO - __main__ - Step 31666: {'lr': 0.0001996928584270618, 'samples': 1013312, 'steps': 1979, 'loss/train': 1.5938708782196045} -09/20/2021 21:20:48 - INFO - __main__ - Step 31667: {'lr': 0.0001996928584270618, 'samples': 1013344, 'steps': 1979, 'loss/train': 2.4399609565734863} -09/20/2021 21:20:49 - INFO - __main__ - Step 31668: {'lr': 0.0001996928584270618, 'samples': 1013376, 'steps': 1979, 'loss/train': 2.572484016418457} -09/20/2021 21:20:49 - INFO - __main__ - Step 31669: {'lr': 0.0001996928584270618, 'samples': 1013408, 'steps': 1979, 'loss/train': 2.5187363624572754} -09/20/2021 21:20:50 - INFO - __main__ - Step 31670: {'lr': 0.0001996928584270618, 'samples': 1013440, 'steps': 1979, 'loss/train': 2.7257609367370605} -09/20/2021 21:20:51 - INFO - __main__ - Step 31671: {'lr': 0.0001996928584270618, 'samples': 1013472, 'steps': 1979, 'loss/train': 2.3723669052124023} -09/20/2021 21:20:52 - INFO - __main__ - Step 31672: {'lr': 0.0001996928584270618, 'samples': 1013504, 'steps': 1979, 'loss/train': 1.682011604309082} -09/20/2021 21:20:52 - INFO - __main__ - Step 31673: {'lr': 0.0001996928584270618, 'samples': 1013536, 'steps': 1979, 'loss/train': 1.8755687475204468} -09/20/2021 21:20:53 - INFO - __main__ - Step 31674: {'lr': 0.0001996928584270618, 'samples': 1013568, 'steps': 1979, 'loss/train': 2.2728919982910156} -09/20/2021 21:20:54 - INFO - __main__ - Step 31675: {'lr': 0.0001996928584270618, 'samples': 1013600, 'steps': 1979, 'loss/train': 2.702639579772949} -09/20/2021 21:20:55 - INFO - __main__ - Step 31676: {'lr': 0.0001996928584270618, 'samples': 1013632, 'steps': 1979, 'loss/train': 2.785231113433838} -09/20/2021 21:20:55 - INFO - __main__ - Step 31677: {'lr': 0.0001996928584270618, 'samples': 1013664, 'steps': 1979, 'loss/train': 2.174689769744873} -09/20/2021 21:20:56 - INFO - __main__ - Step 31678: {'lr': 0.0001996928584270618, 'samples': 1013696, 'steps': 1979, 'loss/train': 2.3220906257629395} -09/20/2021 21:20:57 - INFO - __main__ - Step 31679: {'lr': 0.0001996928584270618, 'samples': 1013728, 'steps': 1979, 'loss/train': 2.581559181213379} -09/20/2021 21:20:58 - INFO - __main__ - Step 31680: {'lr': 0.0001996928584270618, 'samples': 1013760, 'steps': 1979, 'loss/train': 1.7513823509216309} -09/20/2021 21:20:58 - INFO - __main__ - Step 31681: {'lr': 0.00019969235865670317, 'samples': 1013792, 'steps': 1980, 'loss/train': 1.8238979578018188} -09/20/2021 21:20:59 - INFO - __main__ - Step 31682: {'lr': 0.00019969235865670317, 'samples': 1013824, 'steps': 1980, 'loss/train': 2.9068851470947266} -09/20/2021 21:21:00 - INFO - __main__ - Step 31683: {'lr': 0.00019969235865670317, 'samples': 1013856, 'steps': 1980, 'loss/train': 2.7591938972473145} -09/20/2021 21:21:01 - INFO - __main__ - Step 31684: {'lr': 0.00019969235865670317, 'samples': 1013888, 'steps': 1980, 'loss/train': 2.4362432956695557} -09/20/2021 21:21:01 - INFO - __main__ - Step 31685: {'lr': 0.00019969235865670317, 'samples': 1013920, 'steps': 1980, 'loss/train': 1.9320958852767944} -09/20/2021 21:21:02 - INFO - __main__ - Step 31686: {'lr': 0.00019969235865670317, 'samples': 1013952, 'steps': 1980, 'loss/train': 2.9090707302093506} -09/20/2021 21:21:03 - INFO - __main__ - Step 31687: {'lr': 0.00019969235865670317, 'samples': 1013984, 'steps': 1980, 'loss/train': 2.7665581703186035} -09/20/2021 21:21:04 - INFO - __main__ - Step 31688: {'lr': 0.00019969235865670317, 'samples': 1014016, 'steps': 1980, 'loss/train': 3.261864423751831} -09/20/2021 21:21:04 - INFO - __main__ - Step 31689: {'lr': 0.00019969235865670317, 'samples': 1014048, 'steps': 1980, 'loss/train': 2.020711898803711} -09/20/2021 21:21:05 - INFO - __main__ - Step 31690: {'lr': 0.00019969235865670317, 'samples': 1014080, 'steps': 1980, 'loss/train': 2.2444372177124023} -09/20/2021 21:21:06 - INFO - __main__ - Step 31691: {'lr': 0.00019969235865670317, 'samples': 1014112, 'steps': 1980, 'loss/train': 2.6843085289001465} -09/20/2021 21:21:07 - INFO - __main__ - Step 31692: {'lr': 0.00019969235865670317, 'samples': 1014144, 'steps': 1980, 'loss/train': 2.9994616508483887} -09/20/2021 21:21:07 - INFO - __main__ - Step 31693: {'lr': 0.00019969235865670317, 'samples': 1014176, 'steps': 1980, 'loss/train': 3.2685043811798096} -09/20/2021 21:21:08 - INFO - __main__ - Step 31694: {'lr': 0.00019969235865670317, 'samples': 1014208, 'steps': 1980, 'loss/train': 3.4007625579833984} -09/20/2021 21:21:09 - INFO - __main__ - Step 31695: {'lr': 0.00019969235865670317, 'samples': 1014240, 'steps': 1980, 'loss/train': 2.637808322906494} -09/20/2021 21:21:10 - INFO - __main__ - Step 31696: {'lr': 0.00019969235865670317, 'samples': 1014272, 'steps': 1980, 'loss/train': 0.513602077960968} -09/20/2021 21:21:11 - INFO - __main__ - Step 31697: {'lr': 0.00019969185848069666, 'samples': 1014304, 'steps': 1981, 'loss/train': 3.1654679775238037} -09/20/2021 21:21:12 - INFO - __main__ - Step 31698: {'lr': 0.00019969185848069666, 'samples': 1014336, 'steps': 1981, 'loss/train': 2.115128755569458} -09/20/2021 21:21:13 - INFO - __main__ - Step 31699: {'lr': 0.00019969185848069666, 'samples': 1014368, 'steps': 1981, 'loss/train': 1.5338584184646606} -09/20/2021 21:21:13 - INFO - __main__ - Step 31700: {'lr': 0.00019969185848069666, 'samples': 1014400, 'steps': 1981, 'loss/train': 2.618661642074585} -09/20/2021 21:21:14 - INFO - __main__ - Step 31701: {'lr': 0.00019969185848069666, 'samples': 1014432, 'steps': 1981, 'loss/train': 2.300365686416626} -09/20/2021 21:21:15 - INFO - __main__ - Step 31702: {'lr': 0.00019969185848069666, 'samples': 1014464, 'steps': 1981, 'loss/train': 2.8505144119262695} -09/20/2021 21:21:16 - INFO - __main__ - Step 31703: {'lr': 0.00019969185848069666, 'samples': 1014496, 'steps': 1981, 'loss/train': 2.0015106201171875} -09/20/2021 21:21:16 - INFO - __main__ - Step 31704: {'lr': 0.00019969185848069666, 'samples': 1014528, 'steps': 1981, 'loss/train': 2.563981771469116} -09/20/2021 21:21:17 - INFO - __main__ - Step 31705: {'lr': 0.00019969185848069666, 'samples': 1014560, 'steps': 1981, 'loss/train': 2.3873445987701416} -09/20/2021 21:21:18 - INFO - __main__ - Step 31706: {'lr': 0.00019969185848069666, 'samples': 1014592, 'steps': 1981, 'loss/train': 2.2107925415039062} -09/20/2021 21:21:19 - INFO - __main__ - Step 31707: {'lr': 0.00019969185848069666, 'samples': 1014624, 'steps': 1981, 'loss/train': 1.9376165866851807} -09/20/2021 21:21:19 - INFO - __main__ - Step 31708: {'lr': 0.00019969185848069666, 'samples': 1014656, 'steps': 1981, 'loss/train': 2.429649829864502} -09/20/2021 21:21:20 - INFO - __main__ - Step 31709: {'lr': 0.00019969185848069666, 'samples': 1014688, 'steps': 1981, 'loss/train': 2.3057241439819336} -09/20/2021 21:21:21 - INFO - __main__ - Step 31710: {'lr': 0.00019969185848069666, 'samples': 1014720, 'steps': 1981, 'loss/train': 2.947327136993408} -09/20/2021 21:21:22 - INFO - __main__ - Step 31711: {'lr': 0.00019969185848069666, 'samples': 1014752, 'steps': 1981, 'loss/train': 1.3622592687606812} -09/20/2021 21:21:22 - INFO - __main__ - Step 31712: {'lr': 0.00019969185848069666, 'samples': 1014784, 'steps': 1981, 'loss/train': 2.9051551818847656} -09/20/2021 21:21:23 - INFO - __main__ - Step 31713: {'lr': 0.00019969135789904438, 'samples': 1014816, 'steps': 1982, 'loss/train': 1.4485081434249878} -09/20/2021 21:21:24 - INFO - __main__ - Step 31714: {'lr': 0.00019969135789904438, 'samples': 1014848, 'steps': 1982, 'loss/train': 2.6847074031829834} -09/20/2021 21:21:25 - INFO - __main__ - Step 31715: {'lr': 0.00019969135789904438, 'samples': 1014880, 'steps': 1982, 'loss/train': 2.327920913696289} -09/20/2021 21:21:25 - INFO - __main__ - Step 31716: {'lr': 0.00019969135789904438, 'samples': 1014912, 'steps': 1982, 'loss/train': 1.7825212478637695} -09/20/2021 21:21:26 - INFO - __main__ - Step 31717: {'lr': 0.00019969135789904438, 'samples': 1014944, 'steps': 1982, 'loss/train': 2.4997143745422363} -09/20/2021 21:21:27 - INFO - __main__ - Step 31718: {'lr': 0.00019969135789904438, 'samples': 1014976, 'steps': 1982, 'loss/train': 3.5386695861816406} -09/20/2021 21:21:28 - INFO - __main__ - Step 31719: {'lr': 0.00019969135789904438, 'samples': 1015008, 'steps': 1982, 'loss/train': 1.9813189506530762} -09/20/2021 21:21:28 - INFO - __main__ - Step 31720: {'lr': 0.00019969135789904438, 'samples': 1015040, 'steps': 1982, 'loss/train': 2.757201910018921} -09/20/2021 21:21:29 - INFO - __main__ - Step 31721: {'lr': 0.00019969135789904438, 'samples': 1015072, 'steps': 1982, 'loss/train': 2.115539073944092} -09/20/2021 21:21:30 - INFO - __main__ - Step 31722: {'lr': 0.00019969135789904438, 'samples': 1015104, 'steps': 1982, 'loss/train': 2.8885912895202637} -09/20/2021 21:21:31 - INFO - __main__ - Step 31723: {'lr': 0.00019969135789904438, 'samples': 1015136, 'steps': 1982, 'loss/train': 2.115065574645996} -09/20/2021 21:21:31 - INFO - __main__ - Step 31724: {'lr': 0.00019969135789904438, 'samples': 1015168, 'steps': 1982, 'loss/train': 2.2619035243988037} -09/20/2021 21:21:32 - INFO - __main__ - Step 31725: {'lr': 0.00019969135789904438, 'samples': 1015200, 'steps': 1982, 'loss/train': 2.138077974319458} -09/20/2021 21:21:33 - INFO - __main__ - Step 31726: {'lr': 0.00019969135789904438, 'samples': 1015232, 'steps': 1982, 'loss/train': 0.7034094333648682} -09/20/2021 21:21:35 - INFO - __main__ - Step 31727: {'lr': 0.00019969135789904438, 'samples': 1015264, 'steps': 1982, 'loss/train': 1.227293610572815} -09/20/2021 21:21:35 - INFO - __main__ - Step 31728: {'lr': 0.00019969135789904438, 'samples': 1015296, 'steps': 1982, 'loss/train': 2.9878361225128174} -09/20/2021 21:21:36 - INFO - __main__ - Step 31729: {'lr': 0.00019969085691174835, 'samples': 1015328, 'steps': 1983, 'loss/train': 2.3831145763397217} -09/20/2021 21:21:37 - INFO - __main__ - Step 31730: {'lr': 0.00019969085691174835, 'samples': 1015360, 'steps': 1983, 'loss/train': 3.118781089782715} -09/20/2021 21:21:38 - INFO - __main__ - Step 31731: {'lr': 0.00019969085691174835, 'samples': 1015392, 'steps': 1983, 'loss/train': 2.7180235385894775} -09/20/2021 21:21:38 - INFO - __main__ - Step 31732: {'lr': 0.00019969085691174835, 'samples': 1015424, 'steps': 1983, 'loss/train': 1.920500636100769} -09/20/2021 21:21:39 - INFO - __main__ - Step 31733: {'lr': 0.00019969085691174835, 'samples': 1015456, 'steps': 1983, 'loss/train': 3.3683784008026123} -09/20/2021 21:21:40 - INFO - __main__ - Step 31734: {'lr': 0.00019969085691174835, 'samples': 1015488, 'steps': 1983, 'loss/train': 2.4802744388580322} -09/20/2021 21:21:41 - INFO - __main__ - Step 31735: {'lr': 0.00019969085691174835, 'samples': 1015520, 'steps': 1983, 'loss/train': 2.698331594467163} -09/20/2021 21:21:41 - INFO - __main__ - Step 31736: {'lr': 0.00019969085691174835, 'samples': 1015552, 'steps': 1983, 'loss/train': 2.718811273574829} -09/20/2021 21:21:42 - INFO - __main__ - Step 31737: {'lr': 0.00019969085691174835, 'samples': 1015584, 'steps': 1983, 'loss/train': 3.1117546558380127} -09/20/2021 21:21:43 - INFO - __main__ - Step 31738: {'lr': 0.00019969085691174835, 'samples': 1015616, 'steps': 1983, 'loss/train': 2.37608003616333} -09/20/2021 21:21:44 - INFO - __main__ - Step 31739: {'lr': 0.00019969085691174835, 'samples': 1015648, 'steps': 1983, 'loss/train': 2.7923450469970703} -09/20/2021 21:21:44 - INFO - __main__ - Step 31740: {'lr': 0.00019969085691174835, 'samples': 1015680, 'steps': 1983, 'loss/train': 1.3970478773117065} -09/20/2021 21:21:45 - INFO - __main__ - Step 31741: {'lr': 0.00019969085691174835, 'samples': 1015712, 'steps': 1983, 'loss/train': 3.0878496170043945} -09/20/2021 21:21:46 - INFO - __main__ - Step 31742: {'lr': 0.00019969085691174835, 'samples': 1015744, 'steps': 1983, 'loss/train': 2.3781704902648926} -09/20/2021 21:21:47 - INFO - __main__ - Step 31743: {'lr': 0.00019969085691174835, 'samples': 1015776, 'steps': 1983, 'loss/train': 1.881105899810791} -09/20/2021 21:21:47 - INFO - __main__ - Step 31744: {'lr': 0.00019969085691174835, 'samples': 1015808, 'steps': 1983, 'loss/train': 3.1273303031921387} -09/20/2021 21:21:48 - INFO - __main__ - Step 31745: {'lr': 0.00019969035551881063, 'samples': 1015840, 'steps': 1984, 'loss/train': 1.6393033266067505} -09/20/2021 21:21:49 - INFO - __main__ - Step 31746: {'lr': 0.00019969035551881063, 'samples': 1015872, 'steps': 1984, 'loss/train': 2.4051311016082764} -09/20/2021 21:21:50 - INFO - __main__ - Step 31747: {'lr': 0.00019969035551881063, 'samples': 1015904, 'steps': 1984, 'loss/train': 2.6094179153442383} -09/20/2021 21:21:51 - INFO - __main__ - Step 31748: {'lr': 0.00019969035551881063, 'samples': 1015936, 'steps': 1984, 'loss/train': 2.037956953048706} -09/20/2021 21:21:51 - INFO - __main__ - Step 31749: {'lr': 0.00019969035551881063, 'samples': 1015968, 'steps': 1984, 'loss/train': 3.4996752738952637} -09/20/2021 21:21:52 - INFO - __main__ - Step 31750: {'lr': 0.00019969035551881063, 'samples': 1016000, 'steps': 1984, 'loss/train': 1.8838279247283936} -09/20/2021 21:21:53 - INFO - __main__ - Step 31751: {'lr': 0.00019969035551881063, 'samples': 1016032, 'steps': 1984, 'loss/train': 3.2090091705322266} -09/20/2021 21:21:54 - INFO - __main__ - Step 31752: {'lr': 0.00019969035551881063, 'samples': 1016064, 'steps': 1984, 'loss/train': 2.4547109603881836} -09/20/2021 21:21:54 - INFO - __main__ - Step 31753: {'lr': 0.00019969035551881063, 'samples': 1016096, 'steps': 1984, 'loss/train': 1.7377992868423462} -09/20/2021 21:21:55 - INFO - __main__ - Step 31754: {'lr': 0.00019969035551881063, 'samples': 1016128, 'steps': 1984, 'loss/train': 0.700038731098175} -09/20/2021 21:21:56 - INFO - __main__ - Step 31755: {'lr': 0.00019969035551881063, 'samples': 1016160, 'steps': 1984, 'loss/train': 0.3587694466114044} -09/20/2021 21:21:57 - INFO - __main__ - Step 31756: {'lr': 0.00019969035551881063, 'samples': 1016192, 'steps': 1984, 'loss/train': 0.28615128993988037} -09/20/2021 21:21:57 - INFO - __main__ - Step 31757: {'lr': 0.00019969035551881063, 'samples': 1016224, 'steps': 1984, 'loss/train': 0.2133956104516983} -09/20/2021 21:21:58 - INFO - __main__ - Step 31758: {'lr': 0.00019969035551881063, 'samples': 1016256, 'steps': 1984, 'loss/train': 0.6140875220298767} -09/20/2021 21:21:59 - INFO - __main__ - Step 31759: {'lr': 0.00019969035551881063, 'samples': 1016288, 'steps': 1984, 'loss/train': 0.3877410590648651} -09/20/2021 21:22:00 - INFO - __main__ - Step 31760: {'lr': 0.00019969035551881063, 'samples': 1016320, 'steps': 1984, 'loss/train': 0.5423722267150879} -09/20/2021 21:22:01 - INFO - __main__ - Step 31761: {'lr': 0.0001996898537202332, 'samples': 1016352, 'steps': 1985, 'loss/train': 2.7567968368530273} -09/20/2021 21:22:02 - INFO - __main__ - Step 31762: {'lr': 0.0001996898537202332, 'samples': 1016384, 'steps': 1985, 'loss/train': 1.94638192653656} -09/20/2021 21:22:03 - INFO - __main__ - Step 31763: {'lr': 0.0001996898537202332, 'samples': 1016416, 'steps': 1985, 'loss/train': 2.8504855632781982} -09/20/2021 21:22:03 - INFO - __main__ - Step 31764: {'lr': 0.0001996898537202332, 'samples': 1016448, 'steps': 1985, 'loss/train': 2.5354623794555664} -09/20/2021 21:22:04 - INFO - __main__ - Step 31765: {'lr': 0.0001996898537202332, 'samples': 1016480, 'steps': 1985, 'loss/train': 2.2078664302825928} -09/20/2021 21:22:05 - INFO - __main__ - Step 31766: {'lr': 0.0001996898537202332, 'samples': 1016512, 'steps': 1985, 'loss/train': 2.6800358295440674} -09/20/2021 21:22:06 - INFO - __main__ - Step 31767: {'lr': 0.0001996898537202332, 'samples': 1016544, 'steps': 1985, 'loss/train': 2.5669844150543213} -09/20/2021 21:22:06 - INFO - __main__ - Step 31768: {'lr': 0.0001996898537202332, 'samples': 1016576, 'steps': 1985, 'loss/train': 1.100372552871704} -09/20/2021 21:22:07 - INFO - __main__ - Step 31769: {'lr': 0.0001996898537202332, 'samples': 1016608, 'steps': 1985, 'loss/train': 1.9798609018325806} -09/20/2021 21:22:08 - INFO - __main__ - Step 31770: {'lr': 0.0001996898537202332, 'samples': 1016640, 'steps': 1985, 'loss/train': 2.5384230613708496} -09/20/2021 21:22:09 - INFO - __main__ - Step 31771: {'lr': 0.0001996898537202332, 'samples': 1016672, 'steps': 1985, 'loss/train': 1.5799144506454468} -09/20/2021 21:22:09 - INFO - __main__ - Step 31772: {'lr': 0.0001996898537202332, 'samples': 1016704, 'steps': 1985, 'loss/train': 2.801340103149414} -09/20/2021 21:22:10 - INFO - __main__ - Step 31773: {'lr': 0.0001996898537202332, 'samples': 1016736, 'steps': 1985, 'loss/train': 3.1122140884399414} -09/20/2021 21:22:11 - INFO - __main__ - Step 31774: {'lr': 0.0001996898537202332, 'samples': 1016768, 'steps': 1985, 'loss/train': 2.292790174484253} -09/20/2021 21:22:12 - INFO - __main__ - Step 31775: {'lr': 0.0001996898537202332, 'samples': 1016800, 'steps': 1985, 'loss/train': 1.5825623273849487} -09/20/2021 21:22:12 - INFO - __main__ - Step 31776: {'lr': 0.0001996898537202332, 'samples': 1016832, 'steps': 1985, 'loss/train': 1.858298420906067} -09/20/2021 21:22:13 - INFO - __main__ - Step 31777: {'lr': 0.00019968935151601816, 'samples': 1016864, 'steps': 1986, 'loss/train': 0.7393524646759033} -09/20/2021 21:22:14 - INFO - __main__ - Step 31778: {'lr': 0.00019968935151601816, 'samples': 1016896, 'steps': 1986, 'loss/train': 2.43245530128479} -09/20/2021 21:22:15 - INFO - __main__ - Step 31779: {'lr': 0.00019968935151601816, 'samples': 1016928, 'steps': 1986, 'loss/train': 1.766991376876831} -09/20/2021 21:22:15 - INFO - __main__ - Step 31780: {'lr': 0.00019968935151601816, 'samples': 1016960, 'steps': 1986, 'loss/train': 2.331021547317505} -09/20/2021 21:22:16 - INFO - __main__ - Step 31781: {'lr': 0.00019968935151601816, 'samples': 1016992, 'steps': 1986, 'loss/train': 0.7376748323440552} -09/20/2021 21:22:17 - INFO - __main__ - Step 31782: {'lr': 0.00019968935151601816, 'samples': 1017024, 'steps': 1986, 'loss/train': 3.047003984451294} -09/20/2021 21:22:18 - INFO - __main__ - Step 31783: {'lr': 0.00019968935151601816, 'samples': 1017056, 'steps': 1986, 'loss/train': 1.4346709251403809} -09/20/2021 21:22:18 - INFO - __main__ - Step 31784: {'lr': 0.00019968935151601816, 'samples': 1017088, 'steps': 1986, 'loss/train': 1.9296261072158813} -09/20/2021 21:22:19 - INFO - __main__ - Step 31785: {'lr': 0.00019968935151601816, 'samples': 1017120, 'steps': 1986, 'loss/train': 2.3116183280944824} -09/20/2021 21:22:20 - INFO - __main__ - Step 31786: {'lr': 0.00019968935151601816, 'samples': 1017152, 'steps': 1986, 'loss/train': 1.9126020669937134} -09/20/2021 21:22:21 - INFO - __main__ - Step 31787: {'lr': 0.00019968935151601816, 'samples': 1017184, 'steps': 1986, 'loss/train': 2.597842216491699} -09/20/2021 21:22:21 - INFO - __main__ - Step 31788: {'lr': 0.00019968935151601816, 'samples': 1017216, 'steps': 1986, 'loss/train': 2.491567373275757} -09/20/2021 21:22:22 - INFO - __main__ - Step 31789: {'lr': 0.00019968935151601816, 'samples': 1017248, 'steps': 1986, 'loss/train': 1.6077228784561157} -09/20/2021 21:22:23 - INFO - __main__ - Step 31790: {'lr': 0.00019968935151601816, 'samples': 1017280, 'steps': 1986, 'loss/train': 3.234008550643921} -09/20/2021 21:22:24 - INFO - __main__ - Step 31791: {'lr': 0.00019968935151601816, 'samples': 1017312, 'steps': 1986, 'loss/train': 2.6027464866638184} -09/20/2021 21:22:24 - INFO - __main__ - Step 31792: {'lr': 0.00019968935151601816, 'samples': 1017344, 'steps': 1986, 'loss/train': 2.668931245803833} -09/20/2021 21:22:26 - INFO - __main__ - Step 31793: {'lr': 0.00019968884890616756, 'samples': 1017376, 'steps': 1987, 'loss/train': 1.8961459398269653} -09/20/2021 21:22:27 - INFO - __main__ - Step 31794: {'lr': 0.00019968884890616756, 'samples': 1017408, 'steps': 1987, 'loss/train': 2.01355242729187} -09/20/2021 21:22:28 - INFO - __main__ - Step 31795: {'lr': 0.00019968884890616756, 'samples': 1017440, 'steps': 1987, 'loss/train': 1.8202104568481445} -09/20/2021 21:22:28 - INFO - __main__ - Step 31796: {'lr': 0.00019968884890616756, 'samples': 1017472, 'steps': 1987, 'loss/train': 0.9259600639343262} -09/20/2021 21:22:29 - INFO - __main__ - Step 31797: {'lr': 0.00019968884890616756, 'samples': 1017504, 'steps': 1987, 'loss/train': 1.5030301809310913} -09/20/2021 21:22:30 - INFO - __main__ - Step 31798: {'lr': 0.00019968884890616756, 'samples': 1017536, 'steps': 1987, 'loss/train': 1.9689273834228516} -09/20/2021 21:22:31 - INFO - __main__ - Step 31799: {'lr': 0.00019968884890616756, 'samples': 1017568, 'steps': 1987, 'loss/train': 2.3282628059387207} -09/20/2021 21:22:31 - INFO - __main__ - Step 31800: {'lr': 0.00019968884890616756, 'samples': 1017600, 'steps': 1987, 'loss/train': 1.6162834167480469} -09/20/2021 21:22:32 - INFO - __main__ - Step 31801: {'lr': 0.00019968884890616756, 'samples': 1017632, 'steps': 1987, 'loss/train': 2.206261157989502} -09/20/2021 21:22:33 - INFO - __main__ - Step 31802: {'lr': 0.00019968884890616756, 'samples': 1017664, 'steps': 1987, 'loss/train': 2.3650476932525635} -09/20/2021 21:22:34 - INFO - __main__ - Step 31803: {'lr': 0.00019968884890616756, 'samples': 1017696, 'steps': 1987, 'loss/train': 2.3112785816192627} -09/20/2021 21:22:34 - INFO - __main__ - Step 31804: {'lr': 0.00019968884890616756, 'samples': 1017728, 'steps': 1987, 'loss/train': 1.402329444885254} -09/20/2021 21:22:35 - INFO - __main__ - Step 31805: {'lr': 0.00019968884890616756, 'samples': 1017760, 'steps': 1987, 'loss/train': 1.894623875617981} -09/20/2021 21:22:36 - INFO - __main__ - Step 31806: {'lr': 0.00019968884890616756, 'samples': 1017792, 'steps': 1987, 'loss/train': 2.497831344604492} -09/20/2021 21:22:37 - INFO - __main__ - Step 31807: {'lr': 0.00019968884890616756, 'samples': 1017824, 'steps': 1987, 'loss/train': 2.5339760780334473} -09/20/2021 21:22:37 - INFO - __main__ - Step 31808: {'lr': 0.00019968884890616756, 'samples': 1017856, 'steps': 1987, 'loss/train': 2.826439619064331} -09/20/2021 21:22:38 - INFO - __main__ - Step 31809: {'lr': 0.0001996883458906834, 'samples': 1017888, 'steps': 1988, 'loss/train': 2.542151689529419} -09/20/2021 21:22:39 - INFO - __main__ - Step 31810: {'lr': 0.0001996883458906834, 'samples': 1017920, 'steps': 1988, 'loss/train': 2.8358747959136963} -09/20/2021 21:22:40 - INFO - __main__ - Step 31811: {'lr': 0.0001996883458906834, 'samples': 1017952, 'steps': 1988, 'loss/train': 2.92305326461792} -09/20/2021 21:22:41 - INFO - __main__ - Step 31812: {'lr': 0.0001996883458906834, 'samples': 1017984, 'steps': 1988, 'loss/train': 2.16375994682312} -09/20/2021 21:22:41 - INFO - __main__ - Step 31813: {'lr': 0.0001996883458906834, 'samples': 1018016, 'steps': 1988, 'loss/train': 2.351783275604248} -09/20/2021 21:22:42 - INFO - __main__ - Step 31814: {'lr': 0.0001996883458906834, 'samples': 1018048, 'steps': 1988, 'loss/train': 2.3644320964813232} -09/20/2021 21:22:43 - INFO - __main__ - Step 31815: {'lr': 0.0001996883458906834, 'samples': 1018080, 'steps': 1988, 'loss/train': 2.28328275680542} -09/20/2021 21:22:44 - INFO - __main__ - Step 31816: {'lr': 0.0001996883458906834, 'samples': 1018112, 'steps': 1988, 'loss/train': 2.6302623748779297} -09/20/2021 21:22:44 - INFO - __main__ - Step 31817: {'lr': 0.0001996883458906834, 'samples': 1018144, 'steps': 1988, 'loss/train': 2.0055367946624756} -09/20/2021 21:22:45 - INFO - __main__ - Step 31818: {'lr': 0.0001996883458906834, 'samples': 1018176, 'steps': 1988, 'loss/train': 2.8297908306121826} -09/20/2021 21:22:46 - INFO - __main__ - Step 31819: {'lr': 0.0001996883458906834, 'samples': 1018208, 'steps': 1988, 'loss/train': 0.734310507774353} -09/20/2021 21:22:47 - INFO - __main__ - Step 31820: {'lr': 0.0001996883458906834, 'samples': 1018240, 'steps': 1988, 'loss/train': 0.6860285997390747} -09/20/2021 21:22:47 - INFO - __main__ - Step 31821: {'lr': 0.0001996883458906834, 'samples': 1018272, 'steps': 1988, 'loss/train': 0.945479154586792} -09/20/2021 21:22:48 - INFO - __main__ - Step 31822: {'lr': 0.0001996883458906834, 'samples': 1018304, 'steps': 1988, 'loss/train': 0.6500191688537598} -09/20/2021 21:22:49 - INFO - __main__ - Step 31823: {'lr': 0.0001996883458906834, 'samples': 1018336, 'steps': 1988, 'loss/train': 0.6545978784561157} -09/20/2021 21:22:50 - INFO - __main__ - Step 31824: {'lr': 0.0001996883458906834, 'samples': 1018368, 'steps': 1988, 'loss/train': 0.7817119359970093} -09/20/2021 21:22:50 - INFO - __main__ - Step 31825: {'lr': 0.00019968784246956776, 'samples': 1018400, 'steps': 1989, 'loss/train': 0.7648100852966309} -09/20/2021 21:22:51 - INFO - __main__ - Step 31826: {'lr': 0.00019968784246956776, 'samples': 1018432, 'steps': 1989, 'loss/train': 0.8650322556495667} -09/20/2021 21:22:52 - INFO - __main__ - Step 31827: {'lr': 0.00019968784246956776, 'samples': 1018464, 'steps': 1989, 'loss/train': 2.7649593353271484} -09/20/2021 21:22:53 - INFO - __main__ - Step 31828: {'lr': 0.00019968784246956776, 'samples': 1018496, 'steps': 1989, 'loss/train': 2.8642005920410156} -09/20/2021 21:22:54 - INFO - __main__ - Step 31829: {'lr': 0.00019968784246956776, 'samples': 1018528, 'steps': 1989, 'loss/train': 2.4093759059906006} -09/20/2021 21:22:55 - INFO - __main__ - Step 31830: {'lr': 0.00019968784246956776, 'samples': 1018560, 'steps': 1989, 'loss/train': 2.0303003787994385} -09/20/2021 21:22:56 - INFO - __main__ - Step 31831: {'lr': 0.00019968784246956776, 'samples': 1018592, 'steps': 1989, 'loss/train': 2.3382222652435303} -09/20/2021 21:22:56 - INFO - __main__ - Step 31832: {'lr': 0.00019968784246956776, 'samples': 1018624, 'steps': 1989, 'loss/train': 2.6970269680023193} -09/20/2021 21:22:57 - INFO - __main__ - Step 31833: {'lr': 0.00019968784246956776, 'samples': 1018656, 'steps': 1989, 'loss/train': 2.414170503616333} -09/20/2021 21:22:58 - INFO - __main__ - Step 31834: {'lr': 0.00019968784246956776, 'samples': 1018688, 'steps': 1989, 'loss/train': 3.486137866973877} -09/20/2021 21:22:59 - INFO - __main__ - Step 31835: {'lr': 0.00019968784246956776, 'samples': 1018720, 'steps': 1989, 'loss/train': 3.049872636795044} -09/20/2021 21:22:59 - INFO - __main__ - Step 31836: {'lr': 0.00019968784246956776, 'samples': 1018752, 'steps': 1989, 'loss/train': 1.9777582883834839} -09/20/2021 21:23:00 - INFO - __main__ - Step 31837: {'lr': 0.00019968784246956776, 'samples': 1018784, 'steps': 1989, 'loss/train': 2.458420515060425} -09/20/2021 21:23:01 - INFO - __main__ - Step 31838: {'lr': 0.00019968784246956776, 'samples': 1018816, 'steps': 1989, 'loss/train': 2.1649694442749023} -09/20/2021 21:23:02 - INFO - __main__ - Step 31839: {'lr': 0.00019968784246956776, 'samples': 1018848, 'steps': 1989, 'loss/train': 3.2000386714935303} -09/20/2021 21:23:02 - INFO - __main__ - Step 31840: {'lr': 0.00019968784246956776, 'samples': 1018880, 'steps': 1989, 'loss/train': 2.8525490760803223} -09/20/2021 21:23:03 - INFO - __main__ - Step 31841: {'lr': 0.00019968733864282265, 'samples': 1018912, 'steps': 1990, 'loss/train': 3.2340173721313477} -09/20/2021 21:23:04 - INFO - __main__ - Step 31842: {'lr': 0.00019968733864282265, 'samples': 1018944, 'steps': 1990, 'loss/train': 1.6855568885803223} -09/20/2021 21:23:05 - INFO - __main__ - Step 31843: {'lr': 0.00019968733864282265, 'samples': 1018976, 'steps': 1990, 'loss/train': 1.896530032157898} -09/20/2021 21:23:05 - INFO - __main__ - Step 31844: {'lr': 0.00019968733864282265, 'samples': 1019008, 'steps': 1990, 'loss/train': 1.977720856666565} -09/20/2021 21:23:06 - INFO - __main__ - Step 31845: {'lr': 0.00019968733864282265, 'samples': 1019040, 'steps': 1990, 'loss/train': 2.539421796798706} -09/20/2021 21:23:07 - INFO - __main__ - Step 31846: {'lr': 0.00019968733864282265, 'samples': 1019072, 'steps': 1990, 'loss/train': 2.4922354221343994} -09/20/2021 21:23:08 - INFO - __main__ - Step 31847: {'lr': 0.00019968733864282265, 'samples': 1019104, 'steps': 1990, 'loss/train': 2.401019811630249} -09/20/2021 21:23:08 - INFO - __main__ - Step 31848: {'lr': 0.00019968733864282265, 'samples': 1019136, 'steps': 1990, 'loss/train': 2.529158353805542} -09/20/2021 21:23:09 - INFO - __main__ - Step 31849: {'lr': 0.00019968733864282265, 'samples': 1019168, 'steps': 1990, 'loss/train': 2.130467653274536} -09/20/2021 21:23:10 - INFO - __main__ - Step 31850: {'lr': 0.00019968733864282265, 'samples': 1019200, 'steps': 1990, 'loss/train': 2.0761425495147705} -09/20/2021 21:23:11 - INFO - __main__ - Step 31851: {'lr': 0.00019968733864282265, 'samples': 1019232, 'steps': 1990, 'loss/train': 2.133376359939575} -09/20/2021 21:23:11 - INFO - __main__ - Step 31852: {'lr': 0.00019968733864282265, 'samples': 1019264, 'steps': 1990, 'loss/train': 3.251528024673462} -09/20/2021 21:23:12 - INFO - __main__ - Step 31853: {'lr': 0.00019968733864282265, 'samples': 1019296, 'steps': 1990, 'loss/train': 2.824965238571167} -09/20/2021 21:23:13 - INFO - __main__ - Step 31854: {'lr': 0.00019968733864282265, 'samples': 1019328, 'steps': 1990, 'loss/train': 1.9280468225479126} -09/20/2021 21:23:14 - INFO - __main__ - Step 31855: {'lr': 0.00019968733864282265, 'samples': 1019360, 'steps': 1990, 'loss/train': 1.8177051544189453} -09/20/2021 21:23:14 - INFO - __main__ - Step 31856: {'lr': 0.00019968733864282265, 'samples': 1019392, 'steps': 1990, 'loss/train': 2.264615535736084} -09/20/2021 21:23:15 - INFO - __main__ - Step 31857: {'lr': 0.00019968683441045016, 'samples': 1019424, 'steps': 1991, 'loss/train': 1.8662620782852173} -09/20/2021 21:23:16 - INFO - __main__ - Step 31858: {'lr': 0.00019968683441045016, 'samples': 1019456, 'steps': 1991, 'loss/train': 2.3266499042510986} -09/20/2021 21:23:17 - INFO - __main__ - Step 31859: {'lr': 0.00019968683441045016, 'samples': 1019488, 'steps': 1991, 'loss/train': 2.6715292930603027} -09/20/2021 21:23:18 - INFO - __main__ - Step 31860: {'lr': 0.00019968683441045016, 'samples': 1019520, 'steps': 1991, 'loss/train': 2.187516450881958} -09/20/2021 21:23:19 - INFO - __main__ - Step 31861: {'lr': 0.00019968683441045016, 'samples': 1019552, 'steps': 1991, 'loss/train': 2.264963150024414} -09/20/2021 21:23:20 - INFO - __main__ - Step 31862: {'lr': 0.00019968683441045016, 'samples': 1019584, 'steps': 1991, 'loss/train': 2.1846330165863037} -09/20/2021 21:23:20 - INFO - __main__ - Step 31863: {'lr': 0.00019968683441045016, 'samples': 1019616, 'steps': 1991, 'loss/train': 2.174170732498169} -09/20/2021 21:23:21 - INFO - __main__ - Step 31864: {'lr': 0.00019968683441045016, 'samples': 1019648, 'steps': 1991, 'loss/train': 2.7824630737304688} -09/20/2021 21:23:22 - INFO - __main__ - Step 31865: {'lr': 0.00019968683441045016, 'samples': 1019680, 'steps': 1991, 'loss/train': 2.1566123962402344} -09/20/2021 21:23:23 - INFO - __main__ - Step 31866: {'lr': 0.00019968683441045016, 'samples': 1019712, 'steps': 1991, 'loss/train': 3.4390053749084473} -09/20/2021 21:23:23 - INFO - __main__ - Step 31867: {'lr': 0.00019968683441045016, 'samples': 1019744, 'steps': 1991, 'loss/train': 2.9683620929718018} -09/20/2021 21:23:24 - INFO - __main__ - Step 31868: {'lr': 0.00019968683441045016, 'samples': 1019776, 'steps': 1991, 'loss/train': 1.1131484508514404} -09/20/2021 21:23:25 - INFO - __main__ - Step 31869: {'lr': 0.00019968683441045016, 'samples': 1019808, 'steps': 1991, 'loss/train': 1.5756480693817139} -09/20/2021 21:23:26 - INFO - __main__ - Step 31870: {'lr': 0.00019968683441045016, 'samples': 1019840, 'steps': 1991, 'loss/train': 3.2677602767944336} -09/20/2021 21:23:26 - INFO - __main__ - Step 31871: {'lr': 0.00019968683441045016, 'samples': 1019872, 'steps': 1991, 'loss/train': 2.8026621341705322} -09/20/2021 21:23:27 - INFO - __main__ - Step 31872: {'lr': 0.00019968683441045016, 'samples': 1019904, 'steps': 1991, 'loss/train': 2.265925645828247} -09/20/2021 21:23:28 - INFO - __main__ - Step 31873: {'lr': 0.00019968632977245235, 'samples': 1019936, 'steps': 1992, 'loss/train': 2.3316245079040527} -09/20/2021 21:23:29 - INFO - __main__ - Step 31874: {'lr': 0.00019968632977245235, 'samples': 1019968, 'steps': 1992, 'loss/train': 0.4005260765552521} -09/20/2021 21:23:30 - INFO - __main__ - Step 31875: {'lr': 0.00019968632977245235, 'samples': 1020000, 'steps': 1992, 'loss/train': 2.2181286811828613} -09/20/2021 21:23:30 - INFO - __main__ - Step 31876: {'lr': 0.00019968632977245235, 'samples': 1020032, 'steps': 1992, 'loss/train': 3.128488779067993} -09/20/2021 21:23:31 - INFO - __main__ - Step 31877: {'lr': 0.00019968632977245235, 'samples': 1020064, 'steps': 1992, 'loss/train': 3.1621570587158203} -09/20/2021 21:23:32 - INFO - __main__ - Step 31878: {'lr': 0.00019968632977245235, 'samples': 1020096, 'steps': 1992, 'loss/train': 2.1152424812316895} -09/20/2021 21:23:33 - INFO - __main__ - Step 31879: {'lr': 0.00019968632977245235, 'samples': 1020128, 'steps': 1992, 'loss/train': 2.09743070602417} -09/20/2021 21:23:33 - INFO - __main__ - Step 31880: {'lr': 0.00019968632977245235, 'samples': 1020160, 'steps': 1992, 'loss/train': 2.4334638118743896} -09/20/2021 21:23:34 - INFO - __main__ - Step 31881: {'lr': 0.00019968632977245235, 'samples': 1020192, 'steps': 1992, 'loss/train': 3.306548833847046} -09/20/2021 21:23:35 - INFO - __main__ - Step 31882: {'lr': 0.00019968632977245235, 'samples': 1020224, 'steps': 1992, 'loss/train': 1.986928939819336} -09/20/2021 21:23:36 - INFO - __main__ - Step 31883: {'lr': 0.00019968632977245235, 'samples': 1020256, 'steps': 1992, 'loss/train': 1.8592195510864258} -09/20/2021 21:23:36 - INFO - __main__ - Step 31884: {'lr': 0.00019968632977245235, 'samples': 1020288, 'steps': 1992, 'loss/train': 1.1463643312454224} -09/20/2021 21:23:37 - INFO - __main__ - Step 31885: {'lr': 0.00019968632977245235, 'samples': 1020320, 'steps': 1992, 'loss/train': 1.041892647743225} -09/20/2021 21:23:38 - INFO - __main__ - Step 31886: {'lr': 0.00019968632977245235, 'samples': 1020352, 'steps': 1992, 'loss/train': 2.9964940547943115} -09/20/2021 21:23:39 - INFO - __main__ - Step 31887: {'lr': 0.00019968632977245235, 'samples': 1020384, 'steps': 1992, 'loss/train': 2.0881407260894775} -09/20/2021 21:23:39 - INFO - __main__ - Step 31888: {'lr': 0.00019968632977245235, 'samples': 1020416, 'steps': 1992, 'loss/train': 2.372579336166382} -09/20/2021 21:23:40 - INFO - __main__ - Step 31889: {'lr': 0.00019968582472883122, 'samples': 1020448, 'steps': 1993, 'loss/train': 1.8675661087036133} -09/20/2021 21:23:41 - INFO - __main__ - Step 31890: {'lr': 0.00019968582472883122, 'samples': 1020480, 'steps': 1993, 'loss/train': 2.8523993492126465} -09/20/2021 21:23:42 - INFO - __main__ - Step 31891: {'lr': 0.00019968582472883122, 'samples': 1020512, 'steps': 1993, 'loss/train': 1.8371213674545288} -09/20/2021 21:23:43 - INFO - __main__ - Step 31892: {'lr': 0.00019968582472883122, 'samples': 1020544, 'steps': 1993, 'loss/train': 2.3882498741149902} -09/20/2021 21:23:44 - INFO - __main__ - Step 31893: {'lr': 0.00019968582472883122, 'samples': 1020576, 'steps': 1993, 'loss/train': 2.0327560901641846} -09/20/2021 21:23:44 - INFO - __main__ - Step 31894: {'lr': 0.00019968582472883122, 'samples': 1020608, 'steps': 1993, 'loss/train': 2.4527628421783447} -09/20/2021 21:23:45 - INFO - __main__ - Step 31895: {'lr': 0.00019968582472883122, 'samples': 1020640, 'steps': 1993, 'loss/train': 2.9148707389831543} -09/20/2021 21:23:46 - INFO - __main__ - Step 31896: {'lr': 0.00019968582472883122, 'samples': 1020672, 'steps': 1993, 'loss/train': 1.8457932472229004} -09/20/2021 21:23:47 - INFO - __main__ - Step 31897: {'lr': 0.00019968582472883122, 'samples': 1020704, 'steps': 1993, 'loss/train': 2.0696091651916504} -09/20/2021 21:23:47 - INFO - __main__ - Step 31898: {'lr': 0.00019968582472883122, 'samples': 1020736, 'steps': 1993, 'loss/train': 2.1543831825256348} -09/20/2021 21:23:48 - INFO - __main__ - Step 31899: {'lr': 0.00019968582472883122, 'samples': 1020768, 'steps': 1993, 'loss/train': 1.8304357528686523} -09/20/2021 21:23:49 - INFO - __main__ - Step 31900: {'lr': 0.00019968582472883122, 'samples': 1020800, 'steps': 1993, 'loss/train': 2.6160266399383545} -09/20/2021 21:23:50 - INFO - __main__ - Step 31901: {'lr': 0.00019968582472883122, 'samples': 1020832, 'steps': 1993, 'loss/train': 2.5477287769317627} -09/20/2021 21:23:50 - INFO - __main__ - Step 31902: {'lr': 0.00019968582472883122, 'samples': 1020864, 'steps': 1993, 'loss/train': 2.44476318359375} -09/20/2021 21:23:51 - INFO - __main__ - Step 31903: {'lr': 0.00019968582472883122, 'samples': 1020896, 'steps': 1993, 'loss/train': 1.8307905197143555} -09/20/2021 21:23:52 - INFO - __main__ - Step 31904: {'lr': 0.00019968582472883122, 'samples': 1020928, 'steps': 1993, 'loss/train': 1.5065217018127441} -09/20/2021 21:23:53 - INFO - __main__ - Step 31905: {'lr': 0.00019968531927958886, 'samples': 1020960, 'steps': 1994, 'loss/train': 2.0295472145080566} -09/20/2021 21:23:54 - INFO - __main__ - Step 31906: {'lr': 0.00019968531927958886, 'samples': 1020992, 'steps': 1994, 'loss/train': 2.52260422706604} -09/20/2021 21:23:54 - INFO - __main__ - Step 31907: {'lr': 0.00019968531927958886, 'samples': 1021024, 'steps': 1994, 'loss/train': 2.4975345134735107} -09/20/2021 21:23:55 - INFO - __main__ - Step 31908: {'lr': 0.00019968531927958886, 'samples': 1021056, 'steps': 1994, 'loss/train': 1.8242902755737305} -09/20/2021 21:23:56 - INFO - __main__ - Step 31909: {'lr': 0.00019968531927958886, 'samples': 1021088, 'steps': 1994, 'loss/train': 2.576887369155884} -09/20/2021 21:23:57 - INFO - __main__ - Step 31910: {'lr': 0.00019968531927958886, 'samples': 1021120, 'steps': 1994, 'loss/train': 2.4593098163604736} -09/20/2021 21:23:57 - INFO - __main__ - Step 31911: {'lr': 0.00019968531927958886, 'samples': 1021152, 'steps': 1994, 'loss/train': 2.418304204940796} -09/20/2021 21:23:58 - INFO - __main__ - Step 31912: {'lr': 0.00019968531927958886, 'samples': 1021184, 'steps': 1994, 'loss/train': 1.3245714902877808} -09/20/2021 21:23:59 - INFO - __main__ - Step 31913: {'lr': 0.00019968531927958886, 'samples': 1021216, 'steps': 1994, 'loss/train': 2.3157577514648438} -09/20/2021 21:24:00 - INFO - __main__ - Step 31914: {'lr': 0.00019968531927958886, 'samples': 1021248, 'steps': 1994, 'loss/train': 2.6685945987701416} -09/20/2021 21:24:00 - INFO - __main__ - Step 31915: {'lr': 0.00019968531927958886, 'samples': 1021280, 'steps': 1994, 'loss/train': 1.8105477094650269} -09/20/2021 21:24:01 - INFO - __main__ - Step 31916: {'lr': 0.00019968531927958886, 'samples': 1021312, 'steps': 1994, 'loss/train': 3.089843511581421} -09/20/2021 21:24:02 - INFO - __main__ - Step 31917: {'lr': 0.00019968531927958886, 'samples': 1021344, 'steps': 1994, 'loss/train': 1.719667673110962} -09/20/2021 21:24:03 - INFO - __main__ - Step 31918: {'lr': 0.00019968531927958886, 'samples': 1021376, 'steps': 1994, 'loss/train': 2.2576565742492676} -09/20/2021 21:24:03 - INFO - __main__ - Step 31919: {'lr': 0.00019968531927958886, 'samples': 1021408, 'steps': 1994, 'loss/train': 2.314689874649048} -09/20/2021 21:24:04 - INFO - __main__ - Step 31920: {'lr': 0.00019968531927958886, 'samples': 1021440, 'steps': 1994, 'loss/train': 2.53985595703125} -09/20/2021 21:24:05 - INFO - __main__ - Step 31921: {'lr': 0.00019968481342472734, 'samples': 1021472, 'steps': 1995, 'loss/train': 2.6717782020568848} -09/20/2021 21:24:06 - INFO - __main__ - Step 31922: {'lr': 0.00019968481342472734, 'samples': 1021504, 'steps': 1995, 'loss/train': 3.5841729640960693} -09/20/2021 21:24:07 - INFO - __main__ - Step 31923: {'lr': 0.00019968481342472734, 'samples': 1021536, 'steps': 1995, 'loss/train': 2.042736768722534} -09/20/2021 21:24:08 - INFO - __main__ - Step 31924: {'lr': 0.00019968481342472734, 'samples': 1021568, 'steps': 1995, 'loss/train': 0.7705115675926208} -09/20/2021 21:24:09 - INFO - __main__ - Step 31925: {'lr': 0.00019968481342472734, 'samples': 1021600, 'steps': 1995, 'loss/train': 1.8230072259902954} -09/20/2021 21:24:09 - INFO - __main__ - Step 31926: {'lr': 0.00019968481342472734, 'samples': 1021632, 'steps': 1995, 'loss/train': 1.1188483238220215} -09/20/2021 21:24:10 - INFO - __main__ - Step 31927: {'lr': 0.00019968481342472734, 'samples': 1021664, 'steps': 1995, 'loss/train': 2.138606309890747} -09/20/2021 21:24:11 - INFO - __main__ - Step 31928: {'lr': 0.00019968481342472734, 'samples': 1021696, 'steps': 1995, 'loss/train': 1.3931689262390137} -09/20/2021 21:24:12 - INFO - __main__ - Step 31929: {'lr': 0.00019968481342472734, 'samples': 1021728, 'steps': 1995, 'loss/train': 2.748802900314331} -09/20/2021 21:24:12 - INFO - __main__ - Step 31930: {'lr': 0.00019968481342472734, 'samples': 1021760, 'steps': 1995, 'loss/train': 1.6378960609436035} -09/20/2021 21:24:13 - INFO - __main__ - Step 31931: {'lr': 0.00019968481342472734, 'samples': 1021792, 'steps': 1995, 'loss/train': 0.291849821805954} -09/20/2021 21:24:14 - INFO - __main__ - Step 31932: {'lr': 0.00019968481342472734, 'samples': 1021824, 'steps': 1995, 'loss/train': 0.3451633155345917} -09/20/2021 21:24:15 - INFO - __main__ - Step 31933: {'lr': 0.00019968481342472734, 'samples': 1021856, 'steps': 1995, 'loss/train': 1.8413387537002563} -09/20/2021 21:24:15 - INFO - __main__ - Step 31934: {'lr': 0.00019968481342472734, 'samples': 1021888, 'steps': 1995, 'loss/train': 2.9824743270874023} -09/20/2021 21:24:16 - INFO - __main__ - Step 31935: {'lr': 0.00019968481342472734, 'samples': 1021920, 'steps': 1995, 'loss/train': 2.6404826641082764} -09/20/2021 21:24:17 - INFO - __main__ - Step 31936: {'lr': 0.00019968481342472734, 'samples': 1021952, 'steps': 1995, 'loss/train': 1.31926429271698} -09/20/2021 21:24:18 - INFO - __main__ - Step 31937: {'lr': 0.00019968430716424867, 'samples': 1021984, 'steps': 1996, 'loss/train': 2.7794435024261475} -09/20/2021 21:24:18 - INFO - __main__ - Step 31938: {'lr': 0.00019968430716424867, 'samples': 1022016, 'steps': 1996, 'loss/train': 2.3482422828674316} -09/20/2021 21:24:19 - INFO - __main__ - Step 31939: {'lr': 0.00019968430716424867, 'samples': 1022048, 'steps': 1996, 'loss/train': 1.9132241010665894} -09/20/2021 21:24:20 - INFO - __main__ - Step 31940: {'lr': 0.00019968430716424867, 'samples': 1022080, 'steps': 1996, 'loss/train': 1.2888394594192505} -09/20/2021 21:24:21 - INFO - __main__ - Step 31941: {'lr': 0.00019968430716424867, 'samples': 1022112, 'steps': 1996, 'loss/train': 3.220658302307129} -09/20/2021 21:24:21 - INFO - __main__ - Step 31942: {'lr': 0.00019968430716424867, 'samples': 1022144, 'steps': 1996, 'loss/train': 3.23075795173645} -09/20/2021 21:24:22 - INFO - __main__ - Step 31943: {'lr': 0.00019968430716424867, 'samples': 1022176, 'steps': 1996, 'loss/train': 2.1953797340393066} -09/20/2021 21:24:23 - INFO - __main__ - Step 31944: {'lr': 0.00019968430716424867, 'samples': 1022208, 'steps': 1996, 'loss/train': 2.022664785385132} -09/20/2021 21:24:24 - INFO - __main__ - Step 31945: {'lr': 0.00019968430716424867, 'samples': 1022240, 'steps': 1996, 'loss/train': 1.9430017471313477} -09/20/2021 21:24:24 - INFO - __main__ - Step 31946: {'lr': 0.00019968430716424867, 'samples': 1022272, 'steps': 1996, 'loss/train': 2.3942294120788574} -09/20/2021 21:24:25 - INFO - __main__ - Step 31947: {'lr': 0.00019968430716424867, 'samples': 1022304, 'steps': 1996, 'loss/train': 1.8605990409851074} -09/20/2021 21:24:26 - INFO - __main__ - Step 31948: {'lr': 0.00019968430716424867, 'samples': 1022336, 'steps': 1996, 'loss/train': 1.490105390548706} -09/20/2021 21:24:27 - INFO - __main__ - Step 31949: {'lr': 0.00019968430716424867, 'samples': 1022368, 'steps': 1996, 'loss/train': 2.231403112411499} -09/20/2021 21:24:27 - INFO - __main__ - Step 31950: {'lr': 0.00019968430716424867, 'samples': 1022400, 'steps': 1996, 'loss/train': 2.267435073852539} -09/20/2021 21:24:28 - INFO - __main__ - Step 31951: {'lr': 0.00019968430716424867, 'samples': 1022432, 'steps': 1996, 'loss/train': 2.521448850631714} -09/20/2021 21:24:29 - INFO - __main__ - Step 31952: {'lr': 0.00019968430716424867, 'samples': 1022464, 'steps': 1996, 'loss/train': 2.3618521690368652} -09/20/2021 21:24:31 - INFO - __main__ - Step 31953: {'lr': 0.000199683800498155, 'samples': 1022496, 'steps': 1997, 'loss/train': 2.288733959197998} -09/20/2021 21:24:32 - INFO - __main__ - Step 31954: {'lr': 0.000199683800498155, 'samples': 1022528, 'steps': 1997, 'loss/train': 1.508660078048706} -09/20/2021 21:24:32 - INFO - __main__ - Step 31955: {'lr': 0.000199683800498155, 'samples': 1022560, 'steps': 1997, 'loss/train': 2.532001495361328} -09/20/2021 21:24:33 - INFO - __main__ - Step 31956: {'lr': 0.000199683800498155, 'samples': 1022592, 'steps': 1997, 'loss/train': 2.5599632263183594} -09/20/2021 21:24:34 - INFO - __main__ - Step 31957: {'lr': 0.000199683800498155, 'samples': 1022624, 'steps': 1997, 'loss/train': 3.030907392501831} -09/20/2021 21:24:35 - INFO - __main__ - Step 31958: {'lr': 0.000199683800498155, 'samples': 1022656, 'steps': 1997, 'loss/train': 2.472052812576294} -09/20/2021 21:24:35 - INFO - __main__ - Step 31959: {'lr': 0.000199683800498155, 'samples': 1022688, 'steps': 1997, 'loss/train': 2.323338270187378} -09/20/2021 21:24:36 - INFO - __main__ - Step 31960: {'lr': 0.000199683800498155, 'samples': 1022720, 'steps': 1997, 'loss/train': 2.4455678462982178} -09/20/2021 21:24:37 - INFO - __main__ - Step 31961: {'lr': 0.000199683800498155, 'samples': 1022752, 'steps': 1997, 'loss/train': 2.100322723388672} -09/20/2021 21:24:38 - INFO - __main__ - Step 31962: {'lr': 0.000199683800498155, 'samples': 1022784, 'steps': 1997, 'loss/train': 2.3761954307556152} -09/20/2021 21:24:38 - INFO - __main__ - Step 31963: {'lr': 0.000199683800498155, 'samples': 1022816, 'steps': 1997, 'loss/train': 1.932769536972046} -09/20/2021 21:24:39 - INFO - __main__ - Step 31964: {'lr': 0.000199683800498155, 'samples': 1022848, 'steps': 1997, 'loss/train': 2.2048606872558594} -09/20/2021 21:24:40 - INFO - __main__ - Step 31965: {'lr': 0.000199683800498155, 'samples': 1022880, 'steps': 1997, 'loss/train': 1.633216381072998} -09/20/2021 21:24:41 - INFO - __main__ - Step 31966: {'lr': 0.000199683800498155, 'samples': 1022912, 'steps': 1997, 'loss/train': 2.6234664916992188} -09/20/2021 21:24:41 - INFO - __main__ - Step 31967: {'lr': 0.000199683800498155, 'samples': 1022944, 'steps': 1997, 'loss/train': 2.207026481628418} -09/20/2021 21:24:42 - INFO - __main__ - Step 31968: {'lr': 0.000199683800498155, 'samples': 1022976, 'steps': 1997, 'loss/train': 3.326026201248169} -09/20/2021 21:24:43 - INFO - __main__ - Step 31969: {'lr': 0.00019968329342644827, 'samples': 1023008, 'steps': 1998, 'loss/train': 2.8176066875457764} -09/20/2021 21:24:44 - INFO - __main__ - Step 31970: {'lr': 0.00019968329342644827, 'samples': 1023040, 'steps': 1998, 'loss/train': 2.453582286834717} -09/20/2021 21:24:45 - INFO - __main__ - Step 31971: {'lr': 0.00019968329342644827, 'samples': 1023072, 'steps': 1998, 'loss/train': 2.807032823562622} -09/20/2021 21:24:45 - INFO - __main__ - Step 31972: {'lr': 0.00019968329342644827, 'samples': 1023104, 'steps': 1998, 'loss/train': 0.8570297956466675} -09/20/2021 21:24:46 - INFO - __main__ - Step 31973: {'lr': 0.00019968329342644827, 'samples': 1023136, 'steps': 1998, 'loss/train': 1.6869080066680908} -09/20/2021 21:24:47 - INFO - __main__ - Step 31974: {'lr': 0.00019968329342644827, 'samples': 1023168, 'steps': 1998, 'loss/train': 2.400397539138794} -09/20/2021 21:24:48 - INFO - __main__ - Step 31975: {'lr': 0.00019968329342644827, 'samples': 1023200, 'steps': 1998, 'loss/train': 1.9712947607040405} -09/20/2021 21:24:48 - INFO - __main__ - Step 31976: {'lr': 0.00019968329342644827, 'samples': 1023232, 'steps': 1998, 'loss/train': 2.9621684551239014} -09/20/2021 21:24:49 - INFO - __main__ - Step 31977: {'lr': 0.00019968329342644827, 'samples': 1023264, 'steps': 1998, 'loss/train': 2.2514474391937256} -09/20/2021 21:24:50 - INFO - __main__ - Step 31978: {'lr': 0.00019968329342644827, 'samples': 1023296, 'steps': 1998, 'loss/train': 2.592522621154785} -09/20/2021 21:24:51 - INFO - __main__ - Step 31979: {'lr': 0.00019968329342644827, 'samples': 1023328, 'steps': 1998, 'loss/train': 2.316323757171631} -09/20/2021 21:24:51 - INFO - __main__ - Step 31980: {'lr': 0.00019968329342644827, 'samples': 1023360, 'steps': 1998, 'loss/train': 1.5878931283950806} -09/20/2021 21:24:52 - INFO - __main__ - Step 31981: {'lr': 0.00019968329342644827, 'samples': 1023392, 'steps': 1998, 'loss/train': 2.3907017707824707} -09/20/2021 21:24:53 - INFO - __main__ - Step 31982: {'lr': 0.00019968329342644827, 'samples': 1023424, 'steps': 1998, 'loss/train': 2.7183189392089844} -09/20/2021 21:24:54 - INFO - __main__ - Step 31983: {'lr': 0.00019968329342644827, 'samples': 1023456, 'steps': 1998, 'loss/train': 2.659987211227417} -09/20/2021 21:24:55 - INFO - __main__ - Step 31984: {'lr': 0.00019968329342644827, 'samples': 1023488, 'steps': 1998, 'loss/train': 1.9251337051391602} -09/20/2021 21:24:56 - INFO - __main__ - Step 31985: {'lr': 0.00019968278594913064, 'samples': 1023520, 'steps': 1999, 'loss/train': 1.9995713233947754} -09/20/2021 21:24:56 - INFO - __main__ - Step 31986: {'lr': 0.00019968278594913064, 'samples': 1023552, 'steps': 1999, 'loss/train': 2.045050621032715} -09/20/2021 21:24:57 - INFO - __main__ - Step 31987: {'lr': 0.00019968278594913064, 'samples': 1023584, 'steps': 1999, 'loss/train': 3.0416221618652344} -09/20/2021 21:24:58 - INFO - __main__ - Step 31988: {'lr': 0.00019968278594913064, 'samples': 1023616, 'steps': 1999, 'loss/train': 2.695803165435791} -09/20/2021 21:24:59 - INFO - __main__ - Step 31989: {'lr': 0.00019968278594913064, 'samples': 1023648, 'steps': 1999, 'loss/train': 1.6500810384750366} -09/20/2021 21:24:59 - INFO - __main__ - Step 31990: {'lr': 0.00019968278594913064, 'samples': 1023680, 'steps': 1999, 'loss/train': 3.2191073894500732} -09/20/2021 21:25:00 - INFO - __main__ - Step 31991: {'lr': 0.00019968278594913064, 'samples': 1023712, 'steps': 1999, 'loss/train': 2.3574323654174805} -09/20/2021 21:25:01 - INFO - __main__ - Step 31992: {'lr': 0.00019968278594913064, 'samples': 1023744, 'steps': 1999, 'loss/train': 2.878628730773926} -09/20/2021 21:25:02 - INFO - __main__ - Step 31993: {'lr': 0.00019968278594913064, 'samples': 1023776, 'steps': 1999, 'loss/train': 3.1029393672943115} -09/20/2021 21:25:02 - INFO - __main__ - Step 31994: {'lr': 0.00019968278594913064, 'samples': 1023808, 'steps': 1999, 'loss/train': 2.3322670459747314} -09/20/2021 21:25:03 - INFO - __main__ - Step 31995: {'lr': 0.00019968278594913064, 'samples': 1023840, 'steps': 1999, 'loss/train': 1.7448430061340332} -09/20/2021 21:25:04 - INFO - __main__ - Step 31996: {'lr': 0.00019968278594913064, 'samples': 1023872, 'steps': 1999, 'loss/train': 3.3366386890411377} -09/20/2021 21:25:05 - INFO - __main__ - Step 31997: {'lr': 0.00019968278594913064, 'samples': 1023904, 'steps': 1999, 'loss/train': 1.470949411392212} -09/20/2021 21:25:05 - INFO - __main__ - Step 31998: {'lr': 0.00019968278594913064, 'samples': 1023936, 'steps': 1999, 'loss/train': 3.1893539428710938} -09/20/2021 21:25:06 - INFO - __main__ - Step 31999: {'lr': 0.00019968278594913064, 'samples': 1023968, 'steps': 1999, 'loss/train': 1.3921610116958618} -09/20/2021 21:25:07 - INFO - __main__ - Step 32000: {'lr': 0.00019968278594913064, 'samples': 1024000, 'steps': 1999, 'loss/train': 2.8526206016540527} -09/20/2021 21:25:08 - INFO - __main__ - Step 32001: {'lr': 0.0001996822780662041, 'samples': 1024032, 'steps': 2000, 'loss/train': 2.5070018768310547} -09/20/2021 21:25:09 - INFO - __main__ - Step 32002: {'lr': 0.0001996822780662041, 'samples': 1024064, 'steps': 2000, 'loss/train': 2.555682897567749} -09/20/2021 21:25:09 - INFO - __main__ - Step 32003: {'lr': 0.0001996822780662041, 'samples': 1024096, 'steps': 2000, 'loss/train': 2.512885570526123} -09/20/2021 21:25:10 - INFO - __main__ - Step 32004: {'lr': 0.0001996822780662041, 'samples': 1024128, 'steps': 2000, 'loss/train': 2.5725514888763428} -09/20/2021 21:25:11 - INFO - __main__ - Step 32005: {'lr': 0.0001996822780662041, 'samples': 1024160, 'steps': 2000, 'loss/train': 2.5257151126861572} -09/20/2021 21:25:12 - INFO - __main__ - Step 32006: {'lr': 0.0001996822780662041, 'samples': 1024192, 'steps': 2000, 'loss/train': 1.2294354438781738} -09/20/2021 21:25:12 - INFO - __main__ - Step 32007: {'lr': 0.0001996822780662041, 'samples': 1024224, 'steps': 2000, 'loss/train': 2.129312753677368} -09/20/2021 21:25:13 - INFO - __main__ - Step 32008: {'lr': 0.0001996822780662041, 'samples': 1024256, 'steps': 2000, 'loss/train': 2.2959234714508057} -09/20/2021 21:25:14 - INFO - __main__ - Step 32009: {'lr': 0.0001996822780662041, 'samples': 1024288, 'steps': 2000, 'loss/train': 2.0286030769348145} -09/20/2021 21:25:15 - INFO - __main__ - Step 32010: {'lr': 0.0001996822780662041, 'samples': 1024320, 'steps': 2000, 'loss/train': 2.527067184448242} -09/20/2021 21:25:15 - INFO - __main__ - Step 32011: {'lr': 0.0001996822780662041, 'samples': 1024352, 'steps': 2000, 'loss/train': 2.98978590965271} -09/20/2021 21:25:16 - INFO - __main__ - Step 32012: {'lr': 0.0001996822780662041, 'samples': 1024384, 'steps': 2000, 'loss/train': 2.651651620864868} -09/20/2021 21:25:17 - INFO - __main__ - Step 32013: {'lr': 0.0001996822780662041, 'samples': 1024416, 'steps': 2000, 'loss/train': 2.1192212104797363} -09/20/2021 21:25:18 - INFO - __main__ - Step 32014: {'lr': 0.0001996822780662041, 'samples': 1024448, 'steps': 2000, 'loss/train': 2.774845838546753} -09/20/2021 21:25:19 - INFO - __main__ - Step 32015: {'lr': 0.0001996822780662041, 'samples': 1024480, 'steps': 2000, 'loss/train': 2.6300835609436035} -09/20/2021 21:25:20 - INFO - __main__ - Step 32016: {'lr': 0.0001996822780662041, 'samples': 1024512, 'steps': 2000, 'loss/train': 2.487159013748169} -09/20/2021 21:25:21 - INFO - __main__ - Step 32017: {'lr': 0.0001996817697776708, 'samples': 1024544, 'steps': 2001, 'loss/train': 2.411259412765503} -09/20/2021 21:25:21 - INFO - __main__ - Step 32018: {'lr': 0.0001996817697776708, 'samples': 1024576, 'steps': 2001, 'loss/train': 2.0445032119750977} -09/20/2021 21:25:22 - INFO - __main__ - Step 32019: {'lr': 0.0001996817697776708, 'samples': 1024608, 'steps': 2001, 'loss/train': 2.413201093673706} -09/20/2021 21:25:23 - INFO - __main__ - Step 32020: {'lr': 0.0001996817697776708, 'samples': 1024640, 'steps': 2001, 'loss/train': 2.5105345249176025} -09/20/2021 21:25:24 - INFO - __main__ - Step 32021: {'lr': 0.0001996817697776708, 'samples': 1024672, 'steps': 2001, 'loss/train': 2.083268880844116} -09/20/2021 21:25:24 - INFO - __main__ - Step 32022: {'lr': 0.0001996817697776708, 'samples': 1024704, 'steps': 2001, 'loss/train': 2.7629473209381104} -09/20/2021 21:25:25 - INFO - __main__ - Step 32023: {'lr': 0.0001996817697776708, 'samples': 1024736, 'steps': 2001, 'loss/train': 2.050116777420044} -09/20/2021 21:25:26 - INFO - __main__ - Step 32024: {'lr': 0.0001996817697776708, 'samples': 1024768, 'steps': 2001, 'loss/train': 3.578778028488159} -09/20/2021 21:25:27 - INFO - __main__ - Step 32025: {'lr': 0.0001996817697776708, 'samples': 1024800, 'steps': 2001, 'loss/train': 1.4487929344177246} -09/20/2021 21:25:27 - INFO - __main__ - Step 32026: {'lr': 0.0001996817697776708, 'samples': 1024832, 'steps': 2001, 'loss/train': 2.306349277496338} -09/20/2021 21:25:28 - INFO - __main__ - Step 32027: {'lr': 0.0001996817697776708, 'samples': 1024864, 'steps': 2001, 'loss/train': 2.175347089767456} -09/20/2021 21:25:29 - INFO - __main__ - Step 32028: {'lr': 0.0001996817697776708, 'samples': 1024896, 'steps': 2001, 'loss/train': 2.4572906494140625} -09/20/2021 21:25:30 - INFO - __main__ - Step 32029: {'lr': 0.0001996817697776708, 'samples': 1024928, 'steps': 2001, 'loss/train': 2.0253849029541016} -09/20/2021 21:25:30 - INFO - __main__ - Step 32030: {'lr': 0.0001996817697776708, 'samples': 1024960, 'steps': 2001, 'loss/train': 2.610828161239624} -09/20/2021 21:25:31 - INFO - __main__ - Step 32031: {'lr': 0.0001996817697776708, 'samples': 1024992, 'steps': 2001, 'loss/train': 2.34938645362854} -09/20/2021 21:25:32 - INFO - __main__ - Step 32032: {'lr': 0.0001996817697776708, 'samples': 1025024, 'steps': 2001, 'loss/train': 3.365947961807251} -09/20/2021 21:25:33 - INFO - __main__ - Step 32033: {'lr': 0.00019968126108353275, 'samples': 1025056, 'steps': 2002, 'loss/train': 3.4324047565460205} -09/20/2021 21:25:33 - INFO - __main__ - Step 32034: {'lr': 0.00019968126108353275, 'samples': 1025088, 'steps': 2002, 'loss/train': 2.6162524223327637} -09/20/2021 21:25:34 - INFO - __main__ - Step 32035: {'lr': 0.00019968126108353275, 'samples': 1025120, 'steps': 2002, 'loss/train': 2.5768489837646484} -09/20/2021 21:25:35 - INFO - __main__ - Step 32036: {'lr': 0.00019968126108353275, 'samples': 1025152, 'steps': 2002, 'loss/train': 1.9969671964645386} -09/20/2021 21:25:36 - INFO - __main__ - Step 32037: {'lr': 0.00019968126108353275, 'samples': 1025184, 'steps': 2002, 'loss/train': 1.4051799774169922} -09/20/2021 21:25:36 - INFO - __main__ - Step 32038: {'lr': 0.00019968126108353275, 'samples': 1025216, 'steps': 2002, 'loss/train': 5.68183708190918} -09/20/2021 21:25:37 - INFO - __main__ - Step 32039: {'lr': 0.00019968126108353275, 'samples': 1025248, 'steps': 2002, 'loss/train': 2.7817046642303467} -09/20/2021 21:25:38 - INFO - __main__ - Step 32040: {'lr': 0.00019968126108353275, 'samples': 1025280, 'steps': 2002, 'loss/train': 1.6680561304092407} -09/20/2021 21:25:39 - INFO - __main__ - Step 32041: {'lr': 0.00019968126108353275, 'samples': 1025312, 'steps': 2002, 'loss/train': 2.766955614089966} -09/20/2021 21:25:39 - INFO - __main__ - Step 32042: {'lr': 0.00019968126108353275, 'samples': 1025344, 'steps': 2002, 'loss/train': 2.6186134815216064} -09/20/2021 21:25:40 - INFO - __main__ - Step 32043: {'lr': 0.00019968126108353275, 'samples': 1025376, 'steps': 2002, 'loss/train': 2.2539236545562744} -09/20/2021 21:25:41 - INFO - __main__ - Step 32044: {'lr': 0.00019968126108353275, 'samples': 1025408, 'steps': 2002, 'loss/train': 2.3668370246887207} -09/20/2021 21:25:42 - INFO - __main__ - Step 32045: {'lr': 0.00019968126108353275, 'samples': 1025440, 'steps': 2002, 'loss/train': 2.477618932723999} -09/20/2021 21:25:43 - INFO - __main__ - Step 32046: {'lr': 0.00019968126108353275, 'samples': 1025472, 'steps': 2002, 'loss/train': 2.666232109069824} -09/20/2021 21:25:44 - INFO - __main__ - Step 32047: {'lr': 0.00019968126108353275, 'samples': 1025504, 'steps': 2002, 'loss/train': 2.150773525238037} -09/20/2021 21:25:45 - INFO - __main__ - Step 32048: {'lr': 0.00019968126108353275, 'samples': 1025536, 'steps': 2002, 'loss/train': 3.02945876121521} -09/20/2021 21:25:45 - INFO - __main__ - Step 32049: {'lr': 0.00019968075198379203, 'samples': 1025568, 'steps': 2003, 'loss/train': 2.389700412750244} -09/20/2021 21:25:46 - INFO - __main__ - Step 32050: {'lr': 0.00019968075198379203, 'samples': 1025600, 'steps': 2003, 'loss/train': 2.0289101600646973} -09/20/2021 21:25:47 - INFO - __main__ - Step 32051: {'lr': 0.00019968075198379203, 'samples': 1025632, 'steps': 2003, 'loss/train': 1.7963911294937134} -09/20/2021 21:25:48 - INFO - __main__ - Step 32052: {'lr': 0.00019968075198379203, 'samples': 1025664, 'steps': 2003, 'loss/train': 2.9130969047546387} -09/20/2021 21:25:48 - INFO - __main__ - Step 32053: {'lr': 0.00019968075198379203, 'samples': 1025696, 'steps': 2003, 'loss/train': 2.7572171688079834} -09/20/2021 21:25:49 - INFO - __main__ - Step 32054: {'lr': 0.00019968075198379203, 'samples': 1025728, 'steps': 2003, 'loss/train': 2.2853827476501465} -09/20/2021 21:25:50 - INFO - __main__ - Step 32055: {'lr': 0.00019968075198379203, 'samples': 1025760, 'steps': 2003, 'loss/train': 3.453484535217285} -09/20/2021 21:25:51 - INFO - __main__ - Step 32056: {'lr': 0.00019968075198379203, 'samples': 1025792, 'steps': 2003, 'loss/train': 1.9269979000091553} -09/20/2021 21:25:51 - INFO - __main__ - Step 32057: {'lr': 0.00019968075198379203, 'samples': 1025824, 'steps': 2003, 'loss/train': 1.6571764945983887} -09/20/2021 21:25:52 - INFO - __main__ - Step 32058: {'lr': 0.00019968075198379203, 'samples': 1025856, 'steps': 2003, 'loss/train': 2.770153760910034} -09/20/2021 21:25:53 - INFO - __main__ - Step 32059: {'lr': 0.00019968075198379203, 'samples': 1025888, 'steps': 2003, 'loss/train': 2.5882678031921387} -09/20/2021 21:25:54 - INFO - __main__ - Step 32060: {'lr': 0.00019968075198379203, 'samples': 1025920, 'steps': 2003, 'loss/train': 2.4086084365844727} -09/20/2021 21:25:54 - INFO - __main__ - Step 32061: {'lr': 0.00019968075198379203, 'samples': 1025952, 'steps': 2003, 'loss/train': 2.541404962539673} -09/20/2021 21:25:55 - INFO - __main__ - Step 32062: {'lr': 0.00019968075198379203, 'samples': 1025984, 'steps': 2003, 'loss/train': 2.58298659324646} -09/20/2021 21:25:56 - INFO - __main__ - Step 32063: {'lr': 0.00019968075198379203, 'samples': 1026016, 'steps': 2003, 'loss/train': 2.098649024963379} -09/20/2021 21:25:57 - INFO - __main__ - Step 32064: {'lr': 0.00019968075198379203, 'samples': 1026048, 'steps': 2003, 'loss/train': 1.961809515953064} -09/20/2021 21:25:58 - INFO - __main__ - Step 32065: {'lr': 0.00019968024247845074, 'samples': 1026080, 'steps': 2004, 'loss/train': 1.9293314218521118} -09/20/2021 21:25:58 - INFO - __main__ - Step 32066: {'lr': 0.00019968024247845074, 'samples': 1026112, 'steps': 2004, 'loss/train': 1.921858787536621} -09/20/2021 21:25:59 - INFO - __main__ - Step 32067: {'lr': 0.00019968024247845074, 'samples': 1026144, 'steps': 2004, 'loss/train': 1.9151523113250732} -09/20/2021 21:26:00 - INFO - __main__ - Step 32068: {'lr': 0.00019968024247845074, 'samples': 1026176, 'steps': 2004, 'loss/train': 2.0473663806915283} -09/20/2021 21:26:01 - INFO - __main__ - Step 32069: {'lr': 0.00019968024247845074, 'samples': 1026208, 'steps': 2004, 'loss/train': 1.9019362926483154} -09/20/2021 21:26:01 - INFO - __main__ - Step 32070: {'lr': 0.00019968024247845074, 'samples': 1026240, 'steps': 2004, 'loss/train': 1.9665590524673462} -09/20/2021 21:26:02 - INFO - __main__ - Step 32071: {'lr': 0.00019968024247845074, 'samples': 1026272, 'steps': 2004, 'loss/train': 2.2821569442749023} -09/20/2021 21:26:03 - INFO - __main__ - Step 32072: {'lr': 0.00019968024247845074, 'samples': 1026304, 'steps': 2004, 'loss/train': 1.874672532081604} -09/20/2021 21:26:04 - INFO - __main__ - Step 32073: {'lr': 0.00019968024247845074, 'samples': 1026336, 'steps': 2004, 'loss/train': 2.2742161750793457} -09/20/2021 21:26:04 - INFO - __main__ - Step 32074: {'lr': 0.00019968024247845074, 'samples': 1026368, 'steps': 2004, 'loss/train': 2.068974733352661} -09/20/2021 21:26:05 - INFO - __main__ - Step 32075: {'lr': 0.00019968024247845074, 'samples': 1026400, 'steps': 2004, 'loss/train': 2.519343137741089} -09/20/2021 21:26:06 - INFO - __main__ - Step 32076: {'lr': 0.00019968024247845074, 'samples': 1026432, 'steps': 2004, 'loss/train': 3.054630756378174} -09/20/2021 21:26:07 - INFO - __main__ - Step 32077: {'lr': 0.00019968024247845074, 'samples': 1026464, 'steps': 2004, 'loss/train': 2.3707094192504883} -09/20/2021 21:26:07 - INFO - __main__ - Step 32078: {'lr': 0.00019968024247845074, 'samples': 1026496, 'steps': 2004, 'loss/train': 1.584708571434021} -09/20/2021 21:26:09 - INFO - __main__ - Step 32079: {'lr': 0.00019968024247845074, 'samples': 1026528, 'steps': 2004, 'loss/train': 3.025055408477783} -09/20/2021 21:26:09 - INFO - __main__ - Step 32080: {'lr': 0.00019968024247845074, 'samples': 1026560, 'steps': 2004, 'loss/train': 2.556483268737793} -09/20/2021 21:26:10 - INFO - __main__ - Step 32081: {'lr': 0.0001996797325675109, 'samples': 1026592, 'steps': 2005, 'loss/train': 2.3674895763397217} -09/20/2021 21:26:11 - INFO - __main__ - Step 32082: {'lr': 0.0001996797325675109, 'samples': 1026624, 'steps': 2005, 'loss/train': 2.244364023208618} -09/20/2021 21:26:12 - INFO - __main__ - Step 32083: {'lr': 0.0001996797325675109, 'samples': 1026656, 'steps': 2005, 'loss/train': 1.8728866577148438} -09/20/2021 21:26:13 - INFO - __main__ - Step 32084: {'lr': 0.0001996797325675109, 'samples': 1026688, 'steps': 2005, 'loss/train': 2.476931095123291} -09/20/2021 21:26:13 - INFO - __main__ - Step 32085: {'lr': 0.0001996797325675109, 'samples': 1026720, 'steps': 2005, 'loss/train': 2.426013946533203} -09/20/2021 21:26:14 - INFO - __main__ - Step 32086: {'lr': 0.0001996797325675109, 'samples': 1026752, 'steps': 2005, 'loss/train': 1.3502546548843384} -09/20/2021 21:26:15 - INFO - __main__ - Step 32087: {'lr': 0.0001996797325675109, 'samples': 1026784, 'steps': 2005, 'loss/train': 0.6681230068206787} -09/20/2021 21:26:16 - INFO - __main__ - Step 32088: {'lr': 0.0001996797325675109, 'samples': 1026816, 'steps': 2005, 'loss/train': 0.27641183137893677} -09/20/2021 21:26:16 - INFO - __main__ - Step 32089: {'lr': 0.0001996797325675109, 'samples': 1026848, 'steps': 2005, 'loss/train': 0.4175061583518982} -09/20/2021 21:26:17 - INFO - __main__ - Step 32090: {'lr': 0.0001996797325675109, 'samples': 1026880, 'steps': 2005, 'loss/train': 0.5918661952018738} -09/20/2021 21:26:18 - INFO - __main__ - Step 32091: {'lr': 0.0001996797325675109, 'samples': 1026912, 'steps': 2005, 'loss/train': 0.38207167387008667} -09/20/2021 21:26:19 - INFO - __main__ - Step 32092: {'lr': 0.0001996797325675109, 'samples': 1026944, 'steps': 2005, 'loss/train': 1.622701644897461} -09/20/2021 21:26:19 - INFO - __main__ - Step 32093: {'lr': 0.0001996797325675109, 'samples': 1026976, 'steps': 2005, 'loss/train': 2.4079818725585938} -09/20/2021 21:26:20 - INFO - __main__ - Step 32094: {'lr': 0.0001996797325675109, 'samples': 1027008, 'steps': 2005, 'loss/train': 2.3075146675109863} -09/20/2021 21:26:21 - INFO - __main__ - Step 32095: {'lr': 0.0001996797325675109, 'samples': 1027040, 'steps': 2005, 'loss/train': 2.30859375} -09/20/2021 21:26:22 - INFO - __main__ - Step 32096: {'lr': 0.0001996797325675109, 'samples': 1027072, 'steps': 2005, 'loss/train': 3.381040573120117} -09/20/2021 21:26:23 - INFO - __main__ - Step 32097: {'lr': 0.00019967922225097465, 'samples': 1027104, 'steps': 2006, 'loss/train': 0.7793011665344238} -09/20/2021 21:26:23 - INFO - __main__ - Step 32098: {'lr': 0.00019967922225097465, 'samples': 1027136, 'steps': 2006, 'loss/train': 2.4654862880706787} -09/20/2021 21:26:24 - INFO - __main__ - Step 32099: {'lr': 0.00019967922225097465, 'samples': 1027168, 'steps': 2006, 'loss/train': 2.1355514526367188} -09/20/2021 21:26:25 - INFO - __main__ - Step 32100: {'lr': 0.00019967922225097465, 'samples': 1027200, 'steps': 2006, 'loss/train': 1.6315274238586426} -09/20/2021 21:26:26 - INFO - __main__ - Step 32101: {'lr': 0.00019967922225097465, 'samples': 1027232, 'steps': 2006, 'loss/train': 2.8742403984069824} -09/20/2021 21:26:26 - INFO - __main__ - Step 32102: {'lr': 0.00019967922225097465, 'samples': 1027264, 'steps': 2006, 'loss/train': 2.9260740280151367} -09/20/2021 21:26:27 - INFO - __main__ - Step 32103: {'lr': 0.00019967922225097465, 'samples': 1027296, 'steps': 2006, 'loss/train': 3.1847047805786133} -09/20/2021 21:26:28 - INFO - __main__ - Step 32104: {'lr': 0.00019967922225097465, 'samples': 1027328, 'steps': 2006, 'loss/train': 0.22242607176303864} -09/20/2021 21:26:29 - INFO - __main__ - Step 32105: {'lr': 0.00019967922225097465, 'samples': 1027360, 'steps': 2006, 'loss/train': 2.8226301670074463} -09/20/2021 21:26:29 - INFO - __main__ - Step 32106: {'lr': 0.00019967922225097465, 'samples': 1027392, 'steps': 2006, 'loss/train': 2.9924561977386475} -09/20/2021 21:26:30 - INFO - __main__ - Step 32107: {'lr': 0.00019967922225097465, 'samples': 1027424, 'steps': 2006, 'loss/train': 2.350264072418213} -09/20/2021 21:26:31 - INFO - __main__ - Step 32108: {'lr': 0.00019967922225097465, 'samples': 1027456, 'steps': 2006, 'loss/train': 1.857020378112793} -09/20/2021 21:26:32 - INFO - __main__ - Step 32109: {'lr': 0.00019967922225097465, 'samples': 1027488, 'steps': 2006, 'loss/train': 2.710538864135742} -09/20/2021 21:26:33 - INFO - __main__ - Step 32110: {'lr': 0.00019967922225097465, 'samples': 1027520, 'steps': 2006, 'loss/train': 2.0879406929016113} -09/20/2021 21:26:34 - INFO - __main__ - Step 32111: {'lr': 0.00019967922225097465, 'samples': 1027552, 'steps': 2006, 'loss/train': 1.6370309591293335} -09/20/2021 21:26:34 - INFO - __main__ - Step 32112: {'lr': 0.00019967922225097465, 'samples': 1027584, 'steps': 2006, 'loss/train': 2.6087489128112793} -09/20/2021 21:26:35 - INFO - __main__ - Step 32113: {'lr': 0.00019967871152884402, 'samples': 1027616, 'steps': 2007, 'loss/train': 2.0980842113494873} -09/20/2021 21:26:36 - INFO - __main__ - Step 32114: {'lr': 0.00019967871152884402, 'samples': 1027648, 'steps': 2007, 'loss/train': 2.0336596965789795} -09/20/2021 21:26:37 - INFO - __main__ - Step 32115: {'lr': 0.00019967871152884402, 'samples': 1027680, 'steps': 2007, 'loss/train': 1.510774850845337} -09/20/2021 21:26:37 - INFO - __main__ - Step 32116: {'lr': 0.00019967871152884402, 'samples': 1027712, 'steps': 2007, 'loss/train': 2.825547933578491} -09/20/2021 21:26:38 - INFO - __main__ - Step 32117: {'lr': 0.00019967871152884402, 'samples': 1027744, 'steps': 2007, 'loss/train': 1.2074798345565796} -09/20/2021 21:26:39 - INFO - __main__ - Step 32118: {'lr': 0.00019967871152884402, 'samples': 1027776, 'steps': 2007, 'loss/train': 2.440176010131836} -09/20/2021 21:26:40 - INFO - __main__ - Step 32119: {'lr': 0.00019967871152884402, 'samples': 1027808, 'steps': 2007, 'loss/train': 1.9942244291305542} -09/20/2021 21:26:40 - INFO - __main__ - Step 32120: {'lr': 0.00019967871152884402, 'samples': 1027840, 'steps': 2007, 'loss/train': 3.2476069927215576} -09/20/2021 21:26:41 - INFO - __main__ - Step 32121: {'lr': 0.00019967871152884402, 'samples': 1027872, 'steps': 2007, 'loss/train': 3.249816656112671} -09/20/2021 21:26:42 - INFO - __main__ - Step 32122: {'lr': 0.00019967871152884402, 'samples': 1027904, 'steps': 2007, 'loss/train': 2.7599217891693115} -09/20/2021 21:26:43 - INFO - __main__ - Step 32123: {'lr': 0.00019967871152884402, 'samples': 1027936, 'steps': 2007, 'loss/train': 2.101815938949585} -09/20/2021 21:26:43 - INFO - __main__ - Step 32124: {'lr': 0.00019967871152884402, 'samples': 1027968, 'steps': 2007, 'loss/train': 2.6451103687286377} -09/20/2021 21:26:44 - INFO - __main__ - Step 32125: {'lr': 0.00019967871152884402, 'samples': 1028000, 'steps': 2007, 'loss/train': 2.2225728034973145} -09/20/2021 21:26:45 - INFO - __main__ - Step 32126: {'lr': 0.00019967871152884402, 'samples': 1028032, 'steps': 2007, 'loss/train': 2.960463285446167} -09/20/2021 21:26:46 - INFO - __main__ - Step 32127: {'lr': 0.00019967871152884402, 'samples': 1028064, 'steps': 2007, 'loss/train': 1.856887936592102} -09/20/2021 21:26:46 - INFO - __main__ - Step 32128: {'lr': 0.00019967871152884402, 'samples': 1028096, 'steps': 2007, 'loss/train': 2.295976400375366} -09/20/2021 21:26:47 - INFO - __main__ - Step 32129: {'lr': 0.00019967820040112108, 'samples': 1028128, 'steps': 2008, 'loss/train': 1.3565537929534912} -09/20/2021 21:26:48 - INFO - __main__ - Step 32130: {'lr': 0.00019967820040112108, 'samples': 1028160, 'steps': 2008, 'loss/train': 2.143752336502075} -09/20/2021 21:26:49 - INFO - __main__ - Step 32131: {'lr': 0.00019967820040112108, 'samples': 1028192, 'steps': 2008, 'loss/train': 2.37697696685791} -09/20/2021 21:26:50 - INFO - __main__ - Step 32132: {'lr': 0.00019967820040112108, 'samples': 1028224, 'steps': 2008, 'loss/train': 3.0242536067962646} -09/20/2021 21:26:50 - INFO - __main__ - Step 32133: {'lr': 0.00019967820040112108, 'samples': 1028256, 'steps': 2008, 'loss/train': 3.195200204849243} -09/20/2021 21:26:51 - INFO - __main__ - Step 32134: {'lr': 0.00019967820040112108, 'samples': 1028288, 'steps': 2008, 'loss/train': 1.5628808736801147} -09/20/2021 21:26:52 - INFO - __main__ - Step 32135: {'lr': 0.00019967820040112108, 'samples': 1028320, 'steps': 2008, 'loss/train': 2.7733147144317627} -09/20/2021 21:26:53 - INFO - __main__ - Step 32136: {'lr': 0.00019967820040112108, 'samples': 1028352, 'steps': 2008, 'loss/train': 1.8697545528411865} -09/20/2021 21:26:53 - INFO - __main__ - Step 32137: {'lr': 0.00019967820040112108, 'samples': 1028384, 'steps': 2008, 'loss/train': 1.6047272682189941} -09/20/2021 21:26:54 - INFO - __main__ - Step 32138: {'lr': 0.00019967820040112108, 'samples': 1028416, 'steps': 2008, 'loss/train': 1.781981110572815} -09/20/2021 21:26:55 - INFO - __main__ - Step 32139: {'lr': 0.00019967820040112108, 'samples': 1028448, 'steps': 2008, 'loss/train': 0.3279414176940918} -09/20/2021 21:26:56 - INFO - __main__ - Step 32140: {'lr': 0.00019967820040112108, 'samples': 1028480, 'steps': 2008, 'loss/train': 0.20117023587226868} -09/20/2021 21:26:57 - INFO - __main__ - Step 32141: {'lr': 0.00019967820040112108, 'samples': 1028512, 'steps': 2008, 'loss/train': 2.2616467475891113} -09/20/2021 21:26:58 - INFO - __main__ - Step 32142: {'lr': 0.00019967820040112108, 'samples': 1028544, 'steps': 2008, 'loss/train': 2.5468647480010986} -09/20/2021 21:26:59 - INFO - __main__ - Step 32143: {'lr': 0.00019967820040112108, 'samples': 1028576, 'steps': 2008, 'loss/train': 2.8035738468170166} -09/20/2021 21:26:59 - INFO - __main__ - Step 32144: {'lr': 0.00019967820040112108, 'samples': 1028608, 'steps': 2008, 'loss/train': 2.1079182624816895} -09/20/2021 21:27:00 - INFO - __main__ - Step 32145: {'lr': 0.00019967768886780795, 'samples': 1028640, 'steps': 2009, 'loss/train': 2.839426040649414} -09/20/2021 21:27:01 - INFO - __main__ - Step 32146: {'lr': 0.00019967768886780795, 'samples': 1028672, 'steps': 2009, 'loss/train': 3.5576937198638916} -09/20/2021 21:27:02 - INFO - __main__ - Step 32147: {'lr': 0.00019967768886780795, 'samples': 1028704, 'steps': 2009, 'loss/train': 2.0610289573669434} -09/20/2021 21:27:03 - INFO - __main__ - Step 32148: {'lr': 0.00019967768886780795, 'samples': 1028736, 'steps': 2009, 'loss/train': 2.1278789043426514} -09/20/2021 21:27:03 - INFO - __main__ - Step 32149: {'lr': 0.00019967768886780795, 'samples': 1028768, 'steps': 2009, 'loss/train': 2.789055347442627} -09/20/2021 21:27:04 - INFO - __main__ - Step 32150: {'lr': 0.00019967768886780795, 'samples': 1028800, 'steps': 2009, 'loss/train': 2.102504014968872} -09/20/2021 21:27:05 - INFO - __main__ - Step 32151: {'lr': 0.00019967768886780795, 'samples': 1028832, 'steps': 2009, 'loss/train': 1.0068050622940063} -09/20/2021 21:27:06 - INFO - __main__ - Step 32152: {'lr': 0.00019967768886780795, 'samples': 1028864, 'steps': 2009, 'loss/train': 0.7085348963737488} -09/20/2021 21:27:06 - INFO - __main__ - Step 32153: {'lr': 0.00019967768886780795, 'samples': 1028896, 'steps': 2009, 'loss/train': 3.066877603530884} -09/20/2021 21:27:07 - INFO - __main__ - Step 32154: {'lr': 0.00019967768886780795, 'samples': 1028928, 'steps': 2009, 'loss/train': 2.7512943744659424} -09/20/2021 21:27:08 - INFO - __main__ - Step 32155: {'lr': 0.00019967768886780795, 'samples': 1028960, 'steps': 2009, 'loss/train': 1.7649505138397217} -09/20/2021 21:27:09 - INFO - __main__ - Step 32156: {'lr': 0.00019967768886780795, 'samples': 1028992, 'steps': 2009, 'loss/train': 2.0454657077789307} -09/20/2021 21:27:09 - INFO - __main__ - Step 32157: {'lr': 0.00019967768886780795, 'samples': 1029024, 'steps': 2009, 'loss/train': 2.8685288429260254} -09/20/2021 21:27:10 - INFO - __main__ - Step 32158: {'lr': 0.00019967768886780795, 'samples': 1029056, 'steps': 2009, 'loss/train': 1.3080750703811646} -09/20/2021 21:27:11 - INFO - __main__ - Step 32159: {'lr': 0.00019967768886780795, 'samples': 1029088, 'steps': 2009, 'loss/train': 0.7886254787445068} -09/20/2021 21:27:12 - INFO - __main__ - Step 32160: {'lr': 0.00019967768886780795, 'samples': 1029120, 'steps': 2009, 'loss/train': 0.8010510802268982} -09/20/2021 21:27:13 - INFO - __main__ - Step 32161: {'lr': 0.00019967717692890669, 'samples': 1029152, 'steps': 2010, 'loss/train': 0.6991740465164185} -09/20/2021 21:27:13 - INFO - __main__ - Step 32162: {'lr': 0.00019967717692890669, 'samples': 1029184, 'steps': 2010, 'loss/train': 0.6094192266464233} -09/20/2021 21:27:14 - INFO - __main__ - Step 32163: {'lr': 0.00019967717692890669, 'samples': 1029216, 'steps': 2010, 'loss/train': 0.7560029029846191} -09/20/2021 21:27:15 - INFO - __main__ - Step 32164: {'lr': 0.00019967717692890669, 'samples': 1029248, 'steps': 2010, 'loss/train': 0.7562756538391113} -09/20/2021 21:27:16 - INFO - __main__ - Step 32165: {'lr': 0.00019967717692890669, 'samples': 1029280, 'steps': 2010, 'loss/train': 0.7251304984092712} -09/20/2021 21:27:16 - INFO - __main__ - Step 32166: {'lr': 0.00019967717692890669, 'samples': 1029312, 'steps': 2010, 'loss/train': 1.0891826152801514} -09/20/2021 21:27:17 - INFO - __main__ - Step 32167: {'lr': 0.00019967717692890669, 'samples': 1029344, 'steps': 2010, 'loss/train': 1.5022873878479004} -09/20/2021 21:27:18 - INFO - __main__ - Step 32168: {'lr': 0.00019967717692890669, 'samples': 1029376, 'steps': 2010, 'loss/train': 2.167572498321533} -09/20/2021 21:27:19 - INFO - __main__ - Step 32169: {'lr': 0.00019967717692890669, 'samples': 1029408, 'steps': 2010, 'loss/train': 2.6418750286102295} -09/20/2021 21:27:19 - INFO - __main__ - Step 32170: {'lr': 0.00019967717692890669, 'samples': 1029440, 'steps': 2010, 'loss/train': 2.3592140674591064} -09/20/2021 21:27:20 - INFO - __main__ - Step 32171: {'lr': 0.00019967717692890669, 'samples': 1029472, 'steps': 2010, 'loss/train': 2.4559853076934814} -09/20/2021 21:27:21 - INFO - __main__ - Step 32172: {'lr': 0.00019967717692890669, 'samples': 1029504, 'steps': 2010, 'loss/train': 1.8633763790130615} -09/20/2021 21:27:22 - INFO - __main__ - Step 32173: {'lr': 0.00019967717692890669, 'samples': 1029536, 'steps': 2010, 'loss/train': 3.513429641723633} -09/20/2021 21:27:22 - INFO - __main__ - Step 32174: {'lr': 0.00019967717692890669, 'samples': 1029568, 'steps': 2010, 'loss/train': 2.753993511199951} -09/20/2021 21:27:23 - INFO - __main__ - Step 32175: {'lr': 0.00019967717692890669, 'samples': 1029600, 'steps': 2010, 'loss/train': 1.8105021715164185} -09/20/2021 21:27:24 - INFO - __main__ - Step 32176: {'lr': 0.00019967717692890669, 'samples': 1029632, 'steps': 2010, 'loss/train': 2.3162193298339844} -09/20/2021 21:27:26 - INFO - __main__ - Step 32177: {'lr': 0.00019967666458441937, 'samples': 1029664, 'steps': 2011, 'loss/train': 2.0759599208831787} -09/20/2021 21:27:26 - INFO - __main__ - Step 32178: {'lr': 0.00019967666458441937, 'samples': 1029696, 'steps': 2011, 'loss/train': 3.0740251541137695} -09/20/2021 21:27:27 - INFO - __main__ - Step 32179: {'lr': 0.00019967666458441937, 'samples': 1029728, 'steps': 2011, 'loss/train': 2.6411163806915283} -09/20/2021 21:27:28 - INFO - __main__ - Step 32180: {'lr': 0.00019967666458441937, 'samples': 1029760, 'steps': 2011, 'loss/train': 2.910975933074951} -09/20/2021 21:27:29 - INFO - __main__ - Step 32181: {'lr': 0.00019967666458441937, 'samples': 1029792, 'steps': 2011, 'loss/train': 2.125433921813965} -09/20/2021 21:27:29 - INFO - __main__ - Step 32182: {'lr': 0.00019967666458441937, 'samples': 1029824, 'steps': 2011, 'loss/train': 2.6946918964385986} -09/20/2021 21:27:30 - INFO - __main__ - Step 32183: {'lr': 0.00019967666458441937, 'samples': 1029856, 'steps': 2011, 'loss/train': 2.7827138900756836} -09/20/2021 21:27:31 - INFO - __main__ - Step 32184: {'lr': 0.00019967666458441937, 'samples': 1029888, 'steps': 2011, 'loss/train': 2.073281764984131} -09/20/2021 21:27:32 - INFO - __main__ - Step 32185: {'lr': 0.00019967666458441937, 'samples': 1029920, 'steps': 2011, 'loss/train': 2.3114120960235596} -09/20/2021 21:27:32 - INFO - __main__ - Step 32186: {'lr': 0.00019967666458441937, 'samples': 1029952, 'steps': 2011, 'loss/train': 1.1619778871536255} -09/20/2021 21:27:33 - INFO - __main__ - Step 32187: {'lr': 0.00019967666458441937, 'samples': 1029984, 'steps': 2011, 'loss/train': 0.9918015003204346} -09/20/2021 21:27:34 - INFO - __main__ - Step 32188: {'lr': 0.00019967666458441937, 'samples': 1030016, 'steps': 2011, 'loss/train': 0.18810150027275085} -09/20/2021 21:27:35 - INFO - __main__ - Step 32189: {'lr': 0.00019967666458441937, 'samples': 1030048, 'steps': 2011, 'loss/train': 0.32146844267845154} -09/20/2021 21:27:35 - INFO - __main__ - Step 32190: {'lr': 0.00019967666458441937, 'samples': 1030080, 'steps': 2011, 'loss/train': 0.0881408229470253} -09/20/2021 21:27:36 - INFO - __main__ - Step 32191: {'lr': 0.00019967666458441937, 'samples': 1030112, 'steps': 2011, 'loss/train': 0.40262681245803833} -09/20/2021 21:27:37 - INFO - __main__ - Step 32192: {'lr': 0.00019967666458441937, 'samples': 1030144, 'steps': 2011, 'loss/train': 0.2897018790245056} -09/20/2021 21:27:38 - INFO - __main__ - Step 32193: {'lr': 0.0001996761518343481, 'samples': 1030176, 'steps': 2012, 'loss/train': 2.3611714839935303} -09/20/2021 21:27:38 - INFO - __main__ - Step 32194: {'lr': 0.0001996761518343481, 'samples': 1030208, 'steps': 2012, 'loss/train': 1.267534613609314} -09/20/2021 21:27:39 - INFO - __main__ - Step 32195: {'lr': 0.0001996761518343481, 'samples': 1030240, 'steps': 2012, 'loss/train': 2.292010545730591} -09/20/2021 21:27:40 - INFO - __main__ - Step 32196: {'lr': 0.0001996761518343481, 'samples': 1030272, 'steps': 2012, 'loss/train': 2.1206116676330566} -09/20/2021 21:27:41 - INFO - __main__ - Step 32197: {'lr': 0.0001996761518343481, 'samples': 1030304, 'steps': 2012, 'loss/train': 2.6215391159057617} -09/20/2021 21:27:41 - INFO - __main__ - Step 32198: {'lr': 0.0001996761518343481, 'samples': 1030336, 'steps': 2012, 'loss/train': 3.27632737159729} -09/20/2021 21:27:42 - INFO - __main__ - Step 32199: {'lr': 0.0001996761518343481, 'samples': 1030368, 'steps': 2012, 'loss/train': 2.490589141845703} -09/20/2021 21:27:43 - INFO - __main__ - Step 32200: {'lr': 0.0001996761518343481, 'samples': 1030400, 'steps': 2012, 'loss/train': 2.9654746055603027} -09/20/2021 21:27:44 - INFO - __main__ - Step 32201: {'lr': 0.0001996761518343481, 'samples': 1030432, 'steps': 2012, 'loss/train': 3.353757858276367} -09/20/2021 21:27:44 - INFO - __main__ - Step 32202: {'lr': 0.0001996761518343481, 'samples': 1030464, 'steps': 2012, 'loss/train': 2.1838018894195557} -09/20/2021 21:27:45 - INFO - __main__ - Step 32203: {'lr': 0.0001996761518343481, 'samples': 1030496, 'steps': 2012, 'loss/train': 1.8426356315612793} -09/20/2021 21:27:46 - INFO - __main__ - Step 32204: {'lr': 0.0001996761518343481, 'samples': 1030528, 'steps': 2012, 'loss/train': 1.6997065544128418} -09/20/2021 21:27:47 - INFO - __main__ - Step 32205: {'lr': 0.0001996761518343481, 'samples': 1030560, 'steps': 2012, 'loss/train': 2.615635871887207} -09/20/2021 21:27:47 - INFO - __main__ - Step 32206: {'lr': 0.0001996761518343481, 'samples': 1030592, 'steps': 2012, 'loss/train': 1.7811853885650635} -09/20/2021 21:27:49 - INFO - __main__ - Step 32207: {'lr': 0.0001996761518343481, 'samples': 1030624, 'steps': 2012, 'loss/train': 2.237943410873413} -09/20/2021 21:27:49 - INFO - __main__ - Step 32208: {'lr': 0.0001996761518343481, 'samples': 1030656, 'steps': 2012, 'loss/train': 2.177250385284424} -09/20/2021 21:27:50 - INFO - __main__ - Step 32209: {'lr': 0.00019967563867869493, 'samples': 1030688, 'steps': 2013, 'loss/train': 3.5511701107025146} -09/20/2021 21:27:51 - INFO - __main__ - Step 32210: {'lr': 0.00019967563867869493, 'samples': 1030720, 'steps': 2013, 'loss/train': 2.0738131999969482} -09/20/2021 21:27:52 - INFO - __main__ - Step 32211: {'lr': 0.00019967563867869493, 'samples': 1030752, 'steps': 2013, 'loss/train': 2.8582613468170166} -09/20/2021 21:27:53 - INFO - __main__ - Step 32212: {'lr': 0.00019967563867869493, 'samples': 1030784, 'steps': 2013, 'loss/train': 2.653211832046509} -09/20/2021 21:27:53 - INFO - __main__ - Step 32213: {'lr': 0.00019967563867869493, 'samples': 1030816, 'steps': 2013, 'loss/train': 1.6479721069335938} -09/20/2021 21:27:54 - INFO - __main__ - Step 32214: {'lr': 0.00019967563867869493, 'samples': 1030848, 'steps': 2013, 'loss/train': 2.9057745933532715} -09/20/2021 21:27:55 - INFO - __main__ - Step 32215: {'lr': 0.00019967563867869493, 'samples': 1030880, 'steps': 2013, 'loss/train': 0.6297109127044678} -09/20/2021 21:27:56 - INFO - __main__ - Step 32216: {'lr': 0.00019967563867869493, 'samples': 1030912, 'steps': 2013, 'loss/train': 1.8645621538162231} -09/20/2021 21:27:56 - INFO - __main__ - Step 32217: {'lr': 0.00019967563867869493, 'samples': 1030944, 'steps': 2013, 'loss/train': 2.7142672538757324} -09/20/2021 21:27:57 - INFO - __main__ - Step 32218: {'lr': 0.00019967563867869493, 'samples': 1030976, 'steps': 2013, 'loss/train': 2.2164933681488037} -09/20/2021 21:27:58 - INFO - __main__ - Step 32219: {'lr': 0.00019967563867869493, 'samples': 1031008, 'steps': 2013, 'loss/train': 2.1171531677246094} -09/20/2021 21:27:59 - INFO - __main__ - Step 32220: {'lr': 0.00019967563867869493, 'samples': 1031040, 'steps': 2013, 'loss/train': 1.6737666130065918} -09/20/2021 21:27:59 - INFO - __main__ - Step 32221: {'lr': 0.00019967563867869493, 'samples': 1031072, 'steps': 2013, 'loss/train': 1.651606798171997} -09/20/2021 21:28:00 - INFO - __main__ - Step 32222: {'lr': 0.00019967563867869493, 'samples': 1031104, 'steps': 2013, 'loss/train': 3.528777837753296} -09/20/2021 21:28:01 - INFO - __main__ - Step 32223: {'lr': 0.00019967563867869493, 'samples': 1031136, 'steps': 2013, 'loss/train': 2.5941858291625977} -09/20/2021 21:28:02 - INFO - __main__ - Step 32224: {'lr': 0.00019967563867869493, 'samples': 1031168, 'steps': 2013, 'loss/train': 2.3495428562164307} -09/20/2021 21:28:02 - INFO - __main__ - Step 32225: {'lr': 0.000199675125117462, 'samples': 1031200, 'steps': 2014, 'loss/train': 2.011314868927002} -09/20/2021 21:28:03 - INFO - __main__ - Step 32226: {'lr': 0.000199675125117462, 'samples': 1031232, 'steps': 2014, 'loss/train': 2.0937678813934326} -09/20/2021 21:28:04 - INFO - __main__ - Step 32227: {'lr': 0.000199675125117462, 'samples': 1031264, 'steps': 2014, 'loss/train': 2.3815178871154785} -09/20/2021 21:28:05 - INFO - __main__ - Step 32228: {'lr': 0.000199675125117462, 'samples': 1031296, 'steps': 2014, 'loss/train': 2.272968292236328} -09/20/2021 21:28:05 - INFO - __main__ - Step 32229: {'lr': 0.000199675125117462, 'samples': 1031328, 'steps': 2014, 'loss/train': 2.76777720451355} -09/20/2021 21:28:06 - INFO - __main__ - Step 32230: {'lr': 0.000199675125117462, 'samples': 1031360, 'steps': 2014, 'loss/train': 1.8571182489395142} -09/20/2021 21:28:07 - INFO - __main__ - Step 32231: {'lr': 0.000199675125117462, 'samples': 1031392, 'steps': 2014, 'loss/train': 0.5782666802406311} -09/20/2021 21:28:08 - INFO - __main__ - Step 32232: {'lr': 0.000199675125117462, 'samples': 1031424, 'steps': 2014, 'loss/train': 2.3845837116241455} -09/20/2021 21:28:08 - INFO - __main__ - Step 32233: {'lr': 0.000199675125117462, 'samples': 1031456, 'steps': 2014, 'loss/train': 1.8276902437210083} -09/20/2021 21:28:09 - INFO - __main__ - Step 32234: {'lr': 0.000199675125117462, 'samples': 1031488, 'steps': 2014, 'loss/train': 1.5063812732696533} -09/20/2021 21:28:10 - INFO - __main__ - Step 32235: {'lr': 0.000199675125117462, 'samples': 1031520, 'steps': 2014, 'loss/train': 2.524498224258423} -09/20/2021 21:28:11 - INFO - __main__ - Step 32236: {'lr': 0.000199675125117462, 'samples': 1031552, 'steps': 2014, 'loss/train': 1.945809245109558} -09/20/2021 21:28:11 - INFO - __main__ - Step 32237: {'lr': 0.000199675125117462, 'samples': 1031584, 'steps': 2014, 'loss/train': 2.312893867492676} -09/20/2021 21:28:13 - INFO - __main__ - Step 32238: {'lr': 0.000199675125117462, 'samples': 1031616, 'steps': 2014, 'loss/train': 2.3669564723968506} -09/20/2021 21:28:13 - INFO - __main__ - Step 32239: {'lr': 0.000199675125117462, 'samples': 1031648, 'steps': 2014, 'loss/train': 2.501889705657959} -09/20/2021 21:28:14 - INFO - __main__ - Step 32240: {'lr': 0.000199675125117462, 'samples': 1031680, 'steps': 2014, 'loss/train': 1.9962676763534546} -09/20/2021 21:28:15 - INFO - __main__ - Step 32241: {'lr': 0.00019967461115065138, 'samples': 1031712, 'steps': 2015, 'loss/train': 2.4790868759155273} -09/20/2021 21:28:16 - INFO - __main__ - Step 32242: {'lr': 0.00019967461115065138, 'samples': 1031744, 'steps': 2015, 'loss/train': 2.3046979904174805} -09/20/2021 21:28:17 - INFO - __main__ - Step 32243: {'lr': 0.00019967461115065138, 'samples': 1031776, 'steps': 2015, 'loss/train': 2.411222457885742} -09/20/2021 21:28:17 - INFO - __main__ - Step 32244: {'lr': 0.00019967461115065138, 'samples': 1031808, 'steps': 2015, 'loss/train': 2.2990384101867676} -09/20/2021 21:28:18 - INFO - __main__ - Step 32245: {'lr': 0.00019967461115065138, 'samples': 1031840, 'steps': 2015, 'loss/train': 2.147083282470703} -09/20/2021 21:28:19 - INFO - __main__ - Step 32246: {'lr': 0.00019967461115065138, 'samples': 1031872, 'steps': 2015, 'loss/train': 2.827824592590332} -09/20/2021 21:28:20 - INFO - __main__ - Step 32247: {'lr': 0.00019967461115065138, 'samples': 1031904, 'steps': 2015, 'loss/train': 2.3371541500091553} -09/20/2021 21:28:20 - INFO - __main__ - Step 32248: {'lr': 0.00019967461115065138, 'samples': 1031936, 'steps': 2015, 'loss/train': 2.4849178791046143} -09/20/2021 21:28:21 - INFO - __main__ - Step 32249: {'lr': 0.00019967461115065138, 'samples': 1031968, 'steps': 2015, 'loss/train': 2.1751511096954346} -09/20/2021 21:28:22 - INFO - __main__ - Step 32250: {'lr': 0.00019967461115065138, 'samples': 1032000, 'steps': 2015, 'loss/train': 3.8389060497283936} -09/20/2021 21:28:23 - INFO - __main__ - Step 32251: {'lr': 0.00019967461115065138, 'samples': 1032032, 'steps': 2015, 'loss/train': 3.1322684288024902} -09/20/2021 21:28:23 - INFO - __main__ - Step 32252: {'lr': 0.00019967461115065138, 'samples': 1032064, 'steps': 2015, 'loss/train': 2.173475980758667} -09/20/2021 21:28:24 - INFO - __main__ - Step 32253: {'lr': 0.00019967461115065138, 'samples': 1032096, 'steps': 2015, 'loss/train': 2.607110023498535} -09/20/2021 21:28:25 - INFO - __main__ - Step 32254: {'lr': 0.00019967461115065138, 'samples': 1032128, 'steps': 2015, 'loss/train': 1.827104926109314} -09/20/2021 21:28:26 - INFO - __main__ - Step 32255: {'lr': 0.00019967461115065138, 'samples': 1032160, 'steps': 2015, 'loss/train': 3.802640199661255} -09/20/2021 21:28:26 - INFO - __main__ - Step 32256: {'lr': 0.00019967461115065138, 'samples': 1032192, 'steps': 2015, 'loss/train': 2.5445120334625244} -09/20/2021 21:28:27 - INFO - __main__ - Step 32257: {'lr': 0.00019967409677826514, 'samples': 1032224, 'steps': 2016, 'loss/train': 1.9698892831802368} -09/20/2021 21:28:28 - INFO - __main__ - Step 32258: {'lr': 0.00019967409677826514, 'samples': 1032256, 'steps': 2016, 'loss/train': 1.8513472080230713} -09/20/2021 21:28:29 - INFO - __main__ - Step 32259: {'lr': 0.00019967409677826514, 'samples': 1032288, 'steps': 2016, 'loss/train': 2.279860734939575} -09/20/2021 21:28:29 - INFO - __main__ - Step 32260: {'lr': 0.00019967409677826514, 'samples': 1032320, 'steps': 2016, 'loss/train': 2.4698727130889893} -09/20/2021 21:28:30 - INFO - __main__ - Step 32261: {'lr': 0.00019967409677826514, 'samples': 1032352, 'steps': 2016, 'loss/train': 2.394880533218384} -09/20/2021 21:28:31 - INFO - __main__ - Step 32262: {'lr': 0.00019967409677826514, 'samples': 1032384, 'steps': 2016, 'loss/train': 2.7535245418548584} -09/20/2021 21:28:32 - INFO - __main__ - Step 32263: {'lr': 0.00019967409677826514, 'samples': 1032416, 'steps': 2016, 'loss/train': 2.7828428745269775} -09/20/2021 21:28:32 - INFO - __main__ - Step 32264: {'lr': 0.00019967409677826514, 'samples': 1032448, 'steps': 2016, 'loss/train': 1.623104214668274} -09/20/2021 21:28:33 - INFO - __main__ - Step 32265: {'lr': 0.00019967409677826514, 'samples': 1032480, 'steps': 2016, 'loss/train': 3.0925393104553223} -09/20/2021 21:28:34 - INFO - __main__ - Step 32266: {'lr': 0.00019967409677826514, 'samples': 1032512, 'steps': 2016, 'loss/train': 2.461948871612549} -09/20/2021 21:28:35 - INFO - __main__ - Step 32267: {'lr': 0.00019967409677826514, 'samples': 1032544, 'steps': 2016, 'loss/train': 2.9080159664154053} -09/20/2021 21:28:37 - INFO - __main__ - Step 32268: {'lr': 0.00019967409677826514, 'samples': 1032576, 'steps': 2016, 'loss/train': 2.969142436981201} -09/20/2021 21:28:37 - INFO - __main__ - Step 32269: {'lr': 0.00019967409677826514, 'samples': 1032608, 'steps': 2016, 'loss/train': 1.8523768186569214} -09/20/2021 21:28:38 - INFO - __main__ - Step 32270: {'lr': 0.00019967409677826514, 'samples': 1032640, 'steps': 2016, 'loss/train': 2.3218908309936523} -09/20/2021 21:28:39 - INFO - __main__ - Step 32271: {'lr': 0.00019967409677826514, 'samples': 1032672, 'steps': 2016, 'loss/train': 2.803933620452881} -09/20/2021 21:28:40 - INFO - __main__ - Step 32272: {'lr': 0.00019967409677826514, 'samples': 1032704, 'steps': 2016, 'loss/train': 2.4652204513549805} -09/20/2021 21:28:40 - INFO - __main__ - Step 32273: {'lr': 0.00019967358200030538, 'samples': 1032736, 'steps': 2017, 'loss/train': 1.5302464962005615} -09/20/2021 21:28:41 - INFO - __main__ - Step 32274: {'lr': 0.00019967358200030538, 'samples': 1032768, 'steps': 2017, 'loss/train': 1.6698462963104248} -09/20/2021 21:28:42 - INFO - __main__ - Step 32275: {'lr': 0.00019967358200030538, 'samples': 1032800, 'steps': 2017, 'loss/train': 2.574968099594116} -09/20/2021 21:28:43 - INFO - __main__ - Step 32276: {'lr': 0.00019967358200030538, 'samples': 1032832, 'steps': 2017, 'loss/train': 2.4288477897644043} -09/20/2021 21:28:43 - INFO - __main__ - Step 32277: {'lr': 0.00019967358200030538, 'samples': 1032864, 'steps': 2017, 'loss/train': 1.9784111976623535} -09/20/2021 21:28:44 - INFO - __main__ - Step 32278: {'lr': 0.00019967358200030538, 'samples': 1032896, 'steps': 2017, 'loss/train': 1.960350751876831} -09/20/2021 21:28:45 - INFO - __main__ - Step 32279: {'lr': 0.00019967358200030538, 'samples': 1032928, 'steps': 2017, 'loss/train': 2.720715284347534} -09/20/2021 21:28:46 - INFO - __main__ - Step 32280: {'lr': 0.00019967358200030538, 'samples': 1032960, 'steps': 2017, 'loss/train': 2.3163158893585205} -09/20/2021 21:28:46 - INFO - __main__ - Step 32281: {'lr': 0.00019967358200030538, 'samples': 1032992, 'steps': 2017, 'loss/train': 1.5612314939498901} -09/20/2021 21:28:47 - INFO - __main__ - Step 32282: {'lr': 0.00019967358200030538, 'samples': 1033024, 'steps': 2017, 'loss/train': 2.397606134414673} -09/20/2021 21:28:48 - INFO - __main__ - Step 32283: {'lr': 0.00019967358200030538, 'samples': 1033056, 'steps': 2017, 'loss/train': 1.2704230546951294} -09/20/2021 21:28:49 - INFO - __main__ - Step 32284: {'lr': 0.00019967358200030538, 'samples': 1033088, 'steps': 2017, 'loss/train': 2.4145240783691406} -09/20/2021 21:28:49 - INFO - __main__ - Step 32285: {'lr': 0.00019967358200030538, 'samples': 1033120, 'steps': 2017, 'loss/train': 1.8798739910125732} -09/20/2021 21:28:50 - INFO - __main__ - Step 32286: {'lr': 0.00019967358200030538, 'samples': 1033152, 'steps': 2017, 'loss/train': 1.953783631324768} -09/20/2021 21:28:51 - INFO - __main__ - Step 32287: {'lr': 0.00019967358200030538, 'samples': 1033184, 'steps': 2017, 'loss/train': 1.5097757577896118} -09/20/2021 21:28:52 - INFO - __main__ - Step 32288: {'lr': 0.00019967358200030538, 'samples': 1033216, 'steps': 2017, 'loss/train': 2.460613965988159} -09/20/2021 21:28:53 - INFO - __main__ - Step 32289: {'lr': 0.0001996730668167742, 'samples': 1033248, 'steps': 2018, 'loss/train': 1.7884368896484375} -09/20/2021 21:28:53 - INFO - __main__ - Step 32290: {'lr': 0.0001996730668167742, 'samples': 1033280, 'steps': 2018, 'loss/train': 2.5821614265441895} -09/20/2021 21:28:54 - INFO - __main__ - Step 32291: {'lr': 0.0001996730668167742, 'samples': 1033312, 'steps': 2018, 'loss/train': 2.3445019721984863} -09/20/2021 21:28:55 - INFO - __main__ - Step 32292: {'lr': 0.0001996730668167742, 'samples': 1033344, 'steps': 2018, 'loss/train': 2.1689419746398926} -09/20/2021 21:28:56 - INFO - __main__ - Step 32293: {'lr': 0.0001996730668167742, 'samples': 1033376, 'steps': 2018, 'loss/train': 0.4456466734409332} -09/20/2021 21:28:56 - INFO - __main__ - Step 32294: {'lr': 0.0001996730668167742, 'samples': 1033408, 'steps': 2018, 'loss/train': 2.3778529167175293} -09/20/2021 21:28:57 - INFO - __main__ - Step 32295: {'lr': 0.0001996730668167742, 'samples': 1033440, 'steps': 2018, 'loss/train': 2.193096876144409} -09/20/2021 21:28:58 - INFO - __main__ - Step 32296: {'lr': 0.0001996730668167742, 'samples': 1033472, 'steps': 2018, 'loss/train': 2.553983688354492} -09/20/2021 21:28:59 - INFO - __main__ - Step 32297: {'lr': 0.0001996730668167742, 'samples': 1033504, 'steps': 2018, 'loss/train': 2.595808982849121} -09/20/2021 21:28:59 - INFO - __main__ - Step 32298: {'lr': 0.0001996730668167742, 'samples': 1033536, 'steps': 2018, 'loss/train': 2.2733635902404785} -09/20/2021 21:29:01 - INFO - __main__ - Step 32299: {'lr': 0.0001996730668167742, 'samples': 1033568, 'steps': 2018, 'loss/train': 2.344778299331665} -09/20/2021 21:29:01 - INFO - __main__ - Step 32300: {'lr': 0.0001996730668167742, 'samples': 1033600, 'steps': 2018, 'loss/train': 2.816236734390259} -09/20/2021 21:29:02 - INFO - __main__ - Step 32301: {'lr': 0.0001996730668167742, 'samples': 1033632, 'steps': 2018, 'loss/train': 1.924600601196289} -09/20/2021 21:29:03 - INFO - __main__ - Step 32302: {'lr': 0.0001996730668167742, 'samples': 1033664, 'steps': 2018, 'loss/train': 1.0360589027404785} -09/20/2021 21:29:04 - INFO - __main__ - Step 32303: {'lr': 0.0001996730668167742, 'samples': 1033696, 'steps': 2018, 'loss/train': 2.602820634841919} -09/20/2021 21:29:04 - INFO - __main__ - Step 32304: {'lr': 0.0001996730668167742, 'samples': 1033728, 'steps': 2018, 'loss/train': 2.4891674518585205} -09/20/2021 21:29:05 - INFO - __main__ - Step 32305: {'lr': 0.00019967255122767372, 'samples': 1033760, 'steps': 2019, 'loss/train': 2.4653000831604004} -09/20/2021 21:29:06 - INFO - __main__ - Step 32306: {'lr': 0.00019967255122767372, 'samples': 1033792, 'steps': 2019, 'loss/train': 3.60394287109375} -09/20/2021 21:29:07 - INFO - __main__ - Step 32307: {'lr': 0.00019967255122767372, 'samples': 1033824, 'steps': 2019, 'loss/train': 2.273055076599121} -09/20/2021 21:29:07 - INFO - __main__ - Step 32308: {'lr': 0.00019967255122767372, 'samples': 1033856, 'steps': 2019, 'loss/train': 1.5682458877563477} -09/20/2021 21:29:08 - INFO - __main__ - Step 32309: {'lr': 0.00019967255122767372, 'samples': 1033888, 'steps': 2019, 'loss/train': 1.9427052736282349} -09/20/2021 21:29:09 - INFO - __main__ - Step 32310: {'lr': 0.00019967255122767372, 'samples': 1033920, 'steps': 2019, 'loss/train': 3.9834465980529785} -09/20/2021 21:29:10 - INFO - __main__ - Step 32311: {'lr': 0.00019967255122767372, 'samples': 1033952, 'steps': 2019, 'loss/train': 1.551281213760376} -09/20/2021 21:29:10 - INFO - __main__ - Step 32312: {'lr': 0.00019967255122767372, 'samples': 1033984, 'steps': 2019, 'loss/train': 2.2244598865509033} -09/20/2021 21:29:11 - INFO - __main__ - Step 32313: {'lr': 0.00019967255122767372, 'samples': 1034016, 'steps': 2019, 'loss/train': 1.8707712888717651} -09/20/2021 21:29:12 - INFO - __main__ - Step 32314: {'lr': 0.00019967255122767372, 'samples': 1034048, 'steps': 2019, 'loss/train': 2.3279337882995605} -09/20/2021 21:29:13 - INFO - __main__ - Step 32315: {'lr': 0.00019967255122767372, 'samples': 1034080, 'steps': 2019, 'loss/train': 3.180351734161377} -09/20/2021 21:29:13 - INFO - __main__ - Step 32316: {'lr': 0.00019967255122767372, 'samples': 1034112, 'steps': 2019, 'loss/train': 2.3727550506591797} -09/20/2021 21:29:14 - INFO - __main__ - Step 32317: {'lr': 0.00019967255122767372, 'samples': 1034144, 'steps': 2019, 'loss/train': 3.519507646560669} -09/20/2021 21:29:15 - INFO - __main__ - Step 32318: {'lr': 0.00019967255122767372, 'samples': 1034176, 'steps': 2019, 'loss/train': 1.6738585233688354} -09/20/2021 21:29:16 - INFO - __main__ - Step 32319: {'lr': 0.00019967255122767372, 'samples': 1034208, 'steps': 2019, 'loss/train': 2.050140619277954} -09/20/2021 21:29:16 - INFO - __main__ - Step 32320: {'lr': 0.00019967255122767372, 'samples': 1034240, 'steps': 2019, 'loss/train': 2.1225736141204834} -09/20/2021 21:29:17 - INFO - __main__ - Step 32321: {'lr': 0.00019967203523300602, 'samples': 1034272, 'steps': 2020, 'loss/train': 1.7541834115982056} -09/20/2021 21:29:18 - INFO - __main__ - Step 32322: {'lr': 0.00019967203523300602, 'samples': 1034304, 'steps': 2020, 'loss/train': 3.2200980186462402} -09/20/2021 21:29:19 - INFO - __main__ - Step 32323: {'lr': 0.00019967203523300602, 'samples': 1034336, 'steps': 2020, 'loss/train': 3.33595609664917} -09/20/2021 21:29:20 - INFO - __main__ - Step 32324: {'lr': 0.00019967203523300602, 'samples': 1034368, 'steps': 2020, 'loss/train': 2.2846713066101074} -09/20/2021 21:29:20 - INFO - __main__ - Step 32325: {'lr': 0.00019967203523300602, 'samples': 1034400, 'steps': 2020, 'loss/train': 2.4154469966888428} -09/20/2021 21:29:21 - INFO - __main__ - Step 32326: {'lr': 0.00019967203523300602, 'samples': 1034432, 'steps': 2020, 'loss/train': 1.9529169797897339} -09/20/2021 21:29:22 - INFO - __main__ - Step 32327: {'lr': 0.00019967203523300602, 'samples': 1034464, 'steps': 2020, 'loss/train': 2.012338399887085} -09/20/2021 21:29:23 - INFO - __main__ - Step 32328: {'lr': 0.00019967203523300602, 'samples': 1034496, 'steps': 2020, 'loss/train': 2.322026014328003} -09/20/2021 21:29:23 - INFO - __main__ - Step 32329: {'lr': 0.00019967203523300602, 'samples': 1034528, 'steps': 2020, 'loss/train': 2.4619412422180176} -09/20/2021 21:29:25 - INFO - __main__ - Step 32330: {'lr': 0.00019967203523300602, 'samples': 1034560, 'steps': 2020, 'loss/train': 1.9284868240356445} -09/20/2021 21:29:26 - INFO - __main__ - Step 32331: {'lr': 0.00019967203523300602, 'samples': 1034592, 'steps': 2020, 'loss/train': 1.5580509901046753} -09/20/2021 21:29:26 - INFO - __main__ - Step 32332: {'lr': 0.00019967203523300602, 'samples': 1034624, 'steps': 2020, 'loss/train': 3.14687180519104} -09/20/2021 21:29:27 - INFO - __main__ - Step 32333: {'lr': 0.00019967203523300602, 'samples': 1034656, 'steps': 2020, 'loss/train': 3.4756956100463867} -09/20/2021 21:29:28 - INFO - __main__ - Step 32334: {'lr': 0.00019967203523300602, 'samples': 1034688, 'steps': 2020, 'loss/train': 3.761540174484253} -09/20/2021 21:29:29 - INFO - __main__ - Step 32335: {'lr': 0.00019967203523300602, 'samples': 1034720, 'steps': 2020, 'loss/train': 0.6977663040161133} -09/20/2021 21:29:29 - INFO - __main__ - Step 32336: {'lr': 0.00019967203523300602, 'samples': 1034752, 'steps': 2020, 'loss/train': 2.133190393447876} -09/20/2021 21:29:30 - INFO - __main__ - Step 32337: {'lr': 0.00019967151883277316, 'samples': 1034784, 'steps': 2021, 'loss/train': 2.1181142330169678} -09/20/2021 21:29:31 - INFO - __main__ - Step 32338: {'lr': 0.00019967151883277316, 'samples': 1034816, 'steps': 2021, 'loss/train': 2.1561293601989746} -09/20/2021 21:29:32 - INFO - __main__ - Step 32339: {'lr': 0.00019967151883277316, 'samples': 1034848, 'steps': 2021, 'loss/train': 1.8400713205337524} -09/20/2021 21:29:32 - INFO - __main__ - Step 32340: {'lr': 0.00019967151883277316, 'samples': 1034880, 'steps': 2021, 'loss/train': 2.515979051589966} -09/20/2021 21:29:33 - INFO - __main__ - Step 32341: {'lr': 0.00019967151883277316, 'samples': 1034912, 'steps': 2021, 'loss/train': 2.1364943981170654} -09/20/2021 21:29:34 - INFO - __main__ - Step 32342: {'lr': 0.00019967151883277316, 'samples': 1034944, 'steps': 2021, 'loss/train': 3.2887513637542725} -09/20/2021 21:29:35 - INFO - __main__ - Step 32343: {'lr': 0.00019967151883277316, 'samples': 1034976, 'steps': 2021, 'loss/train': 2.001250982284546} -09/20/2021 21:29:35 - INFO - __main__ - Step 32344: {'lr': 0.00019967151883277316, 'samples': 1035008, 'steps': 2021, 'loss/train': 2.2369866371154785} -09/20/2021 21:29:36 - INFO - __main__ - Step 32345: {'lr': 0.00019967151883277316, 'samples': 1035040, 'steps': 2021, 'loss/train': 2.611660957336426} -09/20/2021 21:29:37 - INFO - __main__ - Step 32346: {'lr': 0.00019967151883277316, 'samples': 1035072, 'steps': 2021, 'loss/train': 2.577584981918335} -09/20/2021 21:29:38 - INFO - __main__ - Step 32347: {'lr': 0.00019967151883277316, 'samples': 1035104, 'steps': 2021, 'loss/train': 2.295119285583496} -09/20/2021 21:29:38 - INFO - __main__ - Step 32348: {'lr': 0.00019967151883277316, 'samples': 1035136, 'steps': 2021, 'loss/train': 2.0945188999176025} -09/20/2021 21:29:39 - INFO - __main__ - Step 32349: {'lr': 0.00019967151883277316, 'samples': 1035168, 'steps': 2021, 'loss/train': 2.136693000793457} -09/20/2021 21:29:40 - INFO - __main__ - Step 32350: {'lr': 0.00019967151883277316, 'samples': 1035200, 'steps': 2021, 'loss/train': 2.1427433490753174} -09/20/2021 21:29:41 - INFO - __main__ - Step 32351: {'lr': 0.00019967151883277316, 'samples': 1035232, 'steps': 2021, 'loss/train': 2.1384241580963135} -09/20/2021 21:29:41 - INFO - __main__ - Step 32352: {'lr': 0.00019967151883277316, 'samples': 1035264, 'steps': 2021, 'loss/train': 2.668581247329712} -09/20/2021 21:29:42 - INFO - __main__ - Step 32353: {'lr': 0.0001996710020269773, 'samples': 1035296, 'steps': 2022, 'loss/train': 1.2177029848098755} -09/20/2021 21:29:43 - INFO - __main__ - Step 32354: {'lr': 0.0001996710020269773, 'samples': 1035328, 'steps': 2022, 'loss/train': 1.1090091466903687} -09/20/2021 21:29:44 - INFO - __main__ - Step 32355: {'lr': 0.0001996710020269773, 'samples': 1035360, 'steps': 2022, 'loss/train': 3.1364245414733887} -09/20/2021 21:29:45 - INFO - __main__ - Step 32356: {'lr': 0.0001996710020269773, 'samples': 1035392, 'steps': 2022, 'loss/train': 2.893195867538452} -09/20/2021 21:29:45 - INFO - __main__ - Step 32357: {'lr': 0.0001996710020269773, 'samples': 1035424, 'steps': 2022, 'loss/train': 1.9426552057266235} -09/20/2021 21:29:46 - INFO - __main__ - Step 32358: {'lr': 0.0001996710020269773, 'samples': 1035456, 'steps': 2022, 'loss/train': 2.480224370956421} -09/20/2021 21:29:47 - INFO - __main__ - Step 32359: {'lr': 0.0001996710020269773, 'samples': 1035488, 'steps': 2022, 'loss/train': 2.2698352336883545} -09/20/2021 21:29:48 - INFO - __main__ - Step 32360: {'lr': 0.0001996710020269773, 'samples': 1035520, 'steps': 2022, 'loss/train': 3.1553537845611572} -09/20/2021 21:29:49 - INFO - __main__ - Step 32361: {'lr': 0.0001996710020269773, 'samples': 1035552, 'steps': 2022, 'loss/train': 3.325996160507202} -09/20/2021 21:29:50 - INFO - __main__ - Step 32362: {'lr': 0.0001996710020269773, 'samples': 1035584, 'steps': 2022, 'loss/train': 2.3228847980499268} -09/20/2021 21:29:50 - INFO - __main__ - Step 32363: {'lr': 0.0001996710020269773, 'samples': 1035616, 'steps': 2022, 'loss/train': 1.433347463607788} -09/20/2021 21:29:51 - INFO - __main__ - Step 32364: {'lr': 0.0001996710020269773, 'samples': 1035648, 'steps': 2022, 'loss/train': 2.5251340866088867} -09/20/2021 21:29:52 - INFO - __main__ - Step 32365: {'lr': 0.0001996710020269773, 'samples': 1035680, 'steps': 2022, 'loss/train': 1.970037817955017} -09/20/2021 21:29:53 - INFO - __main__ - Step 32366: {'lr': 0.0001996710020269773, 'samples': 1035712, 'steps': 2022, 'loss/train': 2.3459222316741943} -09/20/2021 21:29:53 - INFO - __main__ - Step 32367: {'lr': 0.0001996710020269773, 'samples': 1035744, 'steps': 2022, 'loss/train': 2.623786449432373} -09/20/2021 21:29:54 - INFO - __main__ - Step 32368: {'lr': 0.0001996710020269773, 'samples': 1035776, 'steps': 2022, 'loss/train': 2.4477007389068604} -09/20/2021 21:29:55 - INFO - __main__ - Step 32369: {'lr': 0.00019967048481562053, 'samples': 1035808, 'steps': 2023, 'loss/train': 1.9064972400665283} -09/20/2021 21:29:56 - INFO - __main__ - Step 32370: {'lr': 0.00019967048481562053, 'samples': 1035840, 'steps': 2023, 'loss/train': 2.6920549869537354} -09/20/2021 21:29:56 - INFO - __main__ - Step 32371: {'lr': 0.00019967048481562053, 'samples': 1035872, 'steps': 2023, 'loss/train': 1.9343122243881226} -09/20/2021 21:29:57 - INFO - __main__ - Step 32372: {'lr': 0.00019967048481562053, 'samples': 1035904, 'steps': 2023, 'loss/train': 2.2355096340179443} -09/20/2021 21:29:58 - INFO - __main__ - Step 32373: {'lr': 0.00019967048481562053, 'samples': 1035936, 'steps': 2023, 'loss/train': 1.954418420791626} -09/20/2021 21:29:59 - INFO - __main__ - Step 32374: {'lr': 0.00019967048481562053, 'samples': 1035968, 'steps': 2023, 'loss/train': 2.063774585723877} -09/20/2021 21:29:59 - INFO - __main__ - Step 32375: {'lr': 0.00019967048481562053, 'samples': 1036000, 'steps': 2023, 'loss/train': 3.128479242324829} -09/20/2021 21:30:00 - INFO - __main__ - Step 32376: {'lr': 0.00019967048481562053, 'samples': 1036032, 'steps': 2023, 'loss/train': 2.2914865016937256} -09/20/2021 21:30:01 - INFO - __main__ - Step 32377: {'lr': 0.00019967048481562053, 'samples': 1036064, 'steps': 2023, 'loss/train': 0.8115164041519165} -09/20/2021 21:30:02 - INFO - __main__ - Step 32378: {'lr': 0.00019967048481562053, 'samples': 1036096, 'steps': 2023, 'loss/train': 2.3417046070098877} -09/20/2021 21:30:02 - INFO - __main__ - Step 32379: {'lr': 0.00019967048481562053, 'samples': 1036128, 'steps': 2023, 'loss/train': 3.054689645767212} -09/20/2021 21:30:03 - INFO - __main__ - Step 32380: {'lr': 0.00019967048481562053, 'samples': 1036160, 'steps': 2023, 'loss/train': 2.478579521179199} -09/20/2021 21:30:04 - INFO - __main__ - Step 32381: {'lr': 0.00019967048481562053, 'samples': 1036192, 'steps': 2023, 'loss/train': 2.3439993858337402} -09/20/2021 21:30:05 - INFO - __main__ - Step 32382: {'lr': 0.00019967048481562053, 'samples': 1036224, 'steps': 2023, 'loss/train': 3.0753703117370605} -09/20/2021 21:30:05 - INFO - __main__ - Step 32383: {'lr': 0.00019967048481562053, 'samples': 1036256, 'steps': 2023, 'loss/train': 2.581789016723633} -09/20/2021 21:30:06 - INFO - __main__ - Step 32384: {'lr': 0.00019967048481562053, 'samples': 1036288, 'steps': 2023, 'loss/train': 1.8905699253082275} -09/20/2021 21:30:07 - INFO - __main__ - Step 32385: {'lr': 0.00019966996719870492, 'samples': 1036320, 'steps': 2024, 'loss/train': 2.2821457386016846} -09/20/2021 21:30:08 - INFO - __main__ - Step 32386: {'lr': 0.00019966996719870492, 'samples': 1036352, 'steps': 2024, 'loss/train': 2.2456514835357666} -09/20/2021 21:30:09 - INFO - __main__ - Step 32387: {'lr': 0.00019966996719870492, 'samples': 1036384, 'steps': 2024, 'loss/train': 2.2419273853302} -09/20/2021 21:30:09 - INFO - __main__ - Step 32388: {'lr': 0.00019966996719870492, 'samples': 1036416, 'steps': 2024, 'loss/train': 2.610031843185425} -09/20/2021 21:30:10 - INFO - __main__ - Step 32389: {'lr': 0.00019966996719870492, 'samples': 1036448, 'steps': 2024, 'loss/train': 2.3814034461975098} -09/20/2021 21:30:11 - INFO - __main__ - Step 32390: {'lr': 0.00019966996719870492, 'samples': 1036480, 'steps': 2024, 'loss/train': 2.3723552227020264} -09/20/2021 21:30:12 - INFO - __main__ - Step 32391: {'lr': 0.00019966996719870492, 'samples': 1036512, 'steps': 2024, 'loss/train': 3.0031087398529053} -09/20/2021 21:30:13 - INFO - __main__ - Step 32392: {'lr': 0.00019966996719870492, 'samples': 1036544, 'steps': 2024, 'loss/train': 0.5519096851348877} -09/20/2021 21:30:14 - INFO - __main__ - Step 32393: {'lr': 0.00019966996719870492, 'samples': 1036576, 'steps': 2024, 'loss/train': 1.6957718133926392} -09/20/2021 21:30:14 - INFO - __main__ - Step 32394: {'lr': 0.00019966996719870492, 'samples': 1036608, 'steps': 2024, 'loss/train': 2.335322856903076} -09/20/2021 21:30:15 - INFO - __main__ - Step 32395: {'lr': 0.00019966996719870492, 'samples': 1036640, 'steps': 2024, 'loss/train': 4.203338146209717} -09/20/2021 21:30:16 - INFO - __main__ - Step 32396: {'lr': 0.00019966996719870492, 'samples': 1036672, 'steps': 2024, 'loss/train': 2.312666416168213} -09/20/2021 21:30:17 - INFO - __main__ - Step 32397: {'lr': 0.00019966996719870492, 'samples': 1036704, 'steps': 2024, 'loss/train': 2.3500123023986816} -09/20/2021 21:30:17 - INFO - __main__ - Step 32398: {'lr': 0.00019966996719870492, 'samples': 1036736, 'steps': 2024, 'loss/train': 2.2282230854034424} -09/20/2021 21:30:18 - INFO - __main__ - Step 32399: {'lr': 0.00019966996719870492, 'samples': 1036768, 'steps': 2024, 'loss/train': 0.7289875745773315} -09/20/2021 21:30:19 - INFO - __main__ - Step 32400: {'lr': 0.00019966996719870492, 'samples': 1036800, 'steps': 2024, 'loss/train': 2.1827733516693115} -09/20/2021 21:30:20 - INFO - __main__ - Step 32401: {'lr': 0.00019966944917623261, 'samples': 1036832, 'steps': 2025, 'loss/train': 1.583731770515442} -09/20/2021 21:30:20 - INFO - __main__ - Step 32402: {'lr': 0.00019966944917623261, 'samples': 1036864, 'steps': 2025, 'loss/train': 1.694345474243164} -09/20/2021 21:30:21 - INFO - __main__ - Step 32403: {'lr': 0.00019966944917623261, 'samples': 1036896, 'steps': 2025, 'loss/train': 1.6177464723587036} -09/20/2021 21:30:22 - INFO - __main__ - Step 32404: {'lr': 0.00019966944917623261, 'samples': 1036928, 'steps': 2025, 'loss/train': 2.246283769607544} -09/20/2021 21:30:23 - INFO - __main__ - Step 32405: {'lr': 0.00019966944917623261, 'samples': 1036960, 'steps': 2025, 'loss/train': 1.9046529531478882} -09/20/2021 21:30:23 - INFO - __main__ - Step 32406: {'lr': 0.00019966944917623261, 'samples': 1036992, 'steps': 2025, 'loss/train': 2.3307363986968994} -09/20/2021 21:30:24 - INFO - __main__ - Step 32407: {'lr': 0.00019966944917623261, 'samples': 1037024, 'steps': 2025, 'loss/train': 1.714089035987854} -09/20/2021 21:30:25 - INFO - __main__ - Step 32408: {'lr': 0.00019966944917623261, 'samples': 1037056, 'steps': 2025, 'loss/train': 2.4957854747772217} -09/20/2021 21:30:26 - INFO - __main__ - Step 32409: {'lr': 0.00019966944917623261, 'samples': 1037088, 'steps': 2025, 'loss/train': 2.4176042079925537} -09/20/2021 21:30:26 - INFO - __main__ - Step 32410: {'lr': 0.00019966944917623261, 'samples': 1037120, 'steps': 2025, 'loss/train': 2.8739545345306396} -09/20/2021 21:30:27 - INFO - __main__ - Step 32411: {'lr': 0.00019966944917623261, 'samples': 1037152, 'steps': 2025, 'loss/train': 0.821539580821991} -09/20/2021 21:30:28 - INFO - __main__ - Step 32412: {'lr': 0.00019966944917623261, 'samples': 1037184, 'steps': 2025, 'loss/train': 2.6824967861175537} -09/20/2021 21:30:29 - INFO - __main__ - Step 32413: {'lr': 0.00019966944917623261, 'samples': 1037216, 'steps': 2025, 'loss/train': 2.074000835418701} -09/20/2021 21:30:29 - INFO - __main__ - Step 32414: {'lr': 0.00019966944917623261, 'samples': 1037248, 'steps': 2025, 'loss/train': 3.6760334968566895} -09/20/2021 21:30:30 - INFO - __main__ - Step 32415: {'lr': 0.00019966944917623261, 'samples': 1037280, 'steps': 2025, 'loss/train': 3.0482048988342285} -09/20/2021 21:30:31 - INFO - __main__ - Step 32416: {'lr': 0.00019966944917623261, 'samples': 1037312, 'steps': 2025, 'loss/train': 2.1234023571014404} -09/20/2021 21:30:32 - INFO - __main__ - Step 32417: {'lr': 0.0001996689307482057, 'samples': 1037344, 'steps': 2026, 'loss/train': 2.5567479133605957} -09/20/2021 21:30:33 - INFO - __main__ - Step 32418: {'lr': 0.0001996689307482057, 'samples': 1037376, 'steps': 2026, 'loss/train': 2.3462607860565186} -09/20/2021 21:30:33 - INFO - __main__ - Step 32419: {'lr': 0.0001996689307482057, 'samples': 1037408, 'steps': 2026, 'loss/train': 2.274052858352661} -09/20/2021 21:30:34 - INFO - __main__ - Step 32420: {'lr': 0.0001996689307482057, 'samples': 1037440, 'steps': 2026, 'loss/train': 2.141730546951294} -09/20/2021 21:30:35 - INFO - __main__ - Step 32421: {'lr': 0.0001996689307482057, 'samples': 1037472, 'steps': 2026, 'loss/train': 1.996260166168213} -09/20/2021 21:30:36 - INFO - __main__ - Step 32422: {'lr': 0.0001996689307482057, 'samples': 1037504, 'steps': 2026, 'loss/train': 2.880800247192383} -09/20/2021 21:30:37 - INFO - __main__ - Step 32423: {'lr': 0.0001996689307482057, 'samples': 1037536, 'steps': 2026, 'loss/train': 3.377479076385498} -09/20/2021 21:30:38 - INFO - __main__ - Step 32424: {'lr': 0.0001996689307482057, 'samples': 1037568, 'steps': 2026, 'loss/train': 2.46480655670166} -09/20/2021 21:30:38 - INFO - __main__ - Step 32425: {'lr': 0.0001996689307482057, 'samples': 1037600, 'steps': 2026, 'loss/train': 1.6141859292984009} -09/20/2021 21:30:39 - INFO - __main__ - Step 32426: {'lr': 0.0001996689307482057, 'samples': 1037632, 'steps': 2026, 'loss/train': 1.7924602031707764} -09/20/2021 21:30:40 - INFO - __main__ - Step 32427: {'lr': 0.0001996689307482057, 'samples': 1037664, 'steps': 2026, 'loss/train': 1.7969919443130493} -09/20/2021 21:30:41 - INFO - __main__ - Step 32428: {'lr': 0.0001996689307482057, 'samples': 1037696, 'steps': 2026, 'loss/train': 2.098097801208496} -09/20/2021 21:30:41 - INFO - __main__ - Step 32429: {'lr': 0.0001996689307482057, 'samples': 1037728, 'steps': 2026, 'loss/train': 1.6899162530899048} -09/20/2021 21:30:42 - INFO - __main__ - Step 32430: {'lr': 0.0001996689307482057, 'samples': 1037760, 'steps': 2026, 'loss/train': 1.7548052072525024} -09/20/2021 21:30:43 - INFO - __main__ - Step 32431: {'lr': 0.0001996689307482057, 'samples': 1037792, 'steps': 2026, 'loss/train': 2.4580941200256348} -09/20/2021 21:30:44 - INFO - __main__ - Step 32432: {'lr': 0.0001996689307482057, 'samples': 1037824, 'steps': 2026, 'loss/train': 2.5133090019226074} -09/20/2021 21:30:44 - INFO - __main__ - Step 32433: {'lr': 0.00019966841191462628, 'samples': 1037856, 'steps': 2027, 'loss/train': 2.3519113063812256} -09/20/2021 21:30:45 - INFO - __main__ - Step 32434: {'lr': 0.00019966841191462628, 'samples': 1037888, 'steps': 2027, 'loss/train': 2.8912031650543213} -09/20/2021 21:30:46 - INFO - __main__ - Step 32435: {'lr': 0.00019966841191462628, 'samples': 1037920, 'steps': 2027, 'loss/train': 2.5904085636138916} -09/20/2021 21:30:47 - INFO - __main__ - Step 32436: {'lr': 0.00019966841191462628, 'samples': 1037952, 'steps': 2027, 'loss/train': 0.8379065990447998} -09/20/2021 21:30:47 - INFO - __main__ - Step 32437: {'lr': 0.00019966841191462628, 'samples': 1037984, 'steps': 2027, 'loss/train': 1.496843695640564} -09/20/2021 21:30:48 - INFO - __main__ - Step 32438: {'lr': 0.00019966841191462628, 'samples': 1038016, 'steps': 2027, 'loss/train': 1.9971897602081299} -09/20/2021 21:30:49 - INFO - __main__ - Step 32439: {'lr': 0.00019966841191462628, 'samples': 1038048, 'steps': 2027, 'loss/train': 2.3973605632781982} -09/20/2021 21:30:50 - INFO - __main__ - Step 32440: {'lr': 0.00019966841191462628, 'samples': 1038080, 'steps': 2027, 'loss/train': 2.393550395965576} -09/20/2021 21:30:51 - INFO - __main__ - Step 32441: {'lr': 0.00019966841191462628, 'samples': 1038112, 'steps': 2027, 'loss/train': 2.9845011234283447} -09/20/2021 21:30:51 - INFO - __main__ - Step 32442: {'lr': 0.00019966841191462628, 'samples': 1038144, 'steps': 2027, 'loss/train': 2.8490350246429443} -09/20/2021 21:30:52 - INFO - __main__ - Step 32443: {'lr': 0.00019966841191462628, 'samples': 1038176, 'steps': 2027, 'loss/train': 2.652060031890869} -09/20/2021 21:30:53 - INFO - __main__ - Step 32444: {'lr': 0.00019966841191462628, 'samples': 1038208, 'steps': 2027, 'loss/train': 0.7434204816818237} -09/20/2021 21:30:54 - INFO - __main__ - Step 32445: {'lr': 0.00019966841191462628, 'samples': 1038240, 'steps': 2027, 'loss/train': 3.0339081287384033} -09/20/2021 21:30:54 - INFO - __main__ - Step 32446: {'lr': 0.00019966841191462628, 'samples': 1038272, 'steps': 2027, 'loss/train': 2.4389896392822266} -09/20/2021 21:30:55 - INFO - __main__ - Step 32447: {'lr': 0.00019966841191462628, 'samples': 1038304, 'steps': 2027, 'loss/train': 2.256805658340454} -09/20/2021 21:30:56 - INFO - __main__ - Step 32448: {'lr': 0.00019966841191462628, 'samples': 1038336, 'steps': 2027, 'loss/train': 2.522867441177368} -09/20/2021 21:30:57 - INFO - __main__ - Step 32449: {'lr': 0.0001996678926754965, 'samples': 1038368, 'steps': 2028, 'loss/train': 2.3438632488250732} -09/20/2021 21:30:57 - INFO - __main__ - Step 32450: {'lr': 0.0001996678926754965, 'samples': 1038400, 'steps': 2028, 'loss/train': 2.2581090927124023} -09/20/2021 21:30:58 - INFO - __main__ - Step 32451: {'lr': 0.0001996678926754965, 'samples': 1038432, 'steps': 2028, 'loss/train': 2.693382978439331} -09/20/2021 21:30:59 - INFO - __main__ - Step 32452: {'lr': 0.0001996678926754965, 'samples': 1038464, 'steps': 2028, 'loss/train': 2.1633081436157227} -09/20/2021 21:31:00 - INFO - __main__ - Step 32453: {'lr': 0.0001996678926754965, 'samples': 1038496, 'steps': 2028, 'loss/train': 1.5800234079360962} -09/20/2021 21:31:01 - INFO - __main__ - Step 32454: {'lr': 0.0001996678926754965, 'samples': 1038528, 'steps': 2028, 'loss/train': 2.005739688873291} -09/20/2021 21:31:02 - INFO - __main__ - Step 32455: {'lr': 0.0001996678926754965, 'samples': 1038560, 'steps': 2028, 'loss/train': 1.5326533317565918} -09/20/2021 21:31:02 - INFO - __main__ - Step 32456: {'lr': 0.0001996678926754965, 'samples': 1038592, 'steps': 2028, 'loss/train': 2.5881147384643555} -09/20/2021 21:31:03 - INFO - __main__ - Step 32457: {'lr': 0.0001996678926754965, 'samples': 1038624, 'steps': 2028, 'loss/train': 2.2539498805999756} -09/20/2021 21:31:04 - INFO - __main__ - Step 32458: {'lr': 0.0001996678926754965, 'samples': 1038656, 'steps': 2028, 'loss/train': 2.741689920425415} -09/20/2021 21:31:05 - INFO - __main__ - Step 32459: {'lr': 0.0001996678926754965, 'samples': 1038688, 'steps': 2028, 'loss/train': 2.4307491779327393} -09/20/2021 21:31:05 - INFO - __main__ - Step 32460: {'lr': 0.0001996678926754965, 'samples': 1038720, 'steps': 2028, 'loss/train': 2.2434990406036377} -09/20/2021 21:31:06 - INFO - __main__ - Step 32461: {'lr': 0.0001996678926754965, 'samples': 1038752, 'steps': 2028, 'loss/train': 2.8560070991516113} -09/20/2021 21:31:07 - INFO - __main__ - Step 32462: {'lr': 0.0001996678926754965, 'samples': 1038784, 'steps': 2028, 'loss/train': 0.7589371800422668} -09/20/2021 21:31:08 - INFO - __main__ - Step 32463: {'lr': 0.0001996678926754965, 'samples': 1038816, 'steps': 2028, 'loss/train': 2.5985214710235596} -09/20/2021 21:31:08 - INFO - __main__ - Step 32464: {'lr': 0.0001996678926754965, 'samples': 1038848, 'steps': 2028, 'loss/train': 2.22369384765625} -09/20/2021 21:31:09 - INFO - __main__ - Step 32465: {'lr': 0.00019966737303081847, 'samples': 1038880, 'steps': 2029, 'loss/train': 2.0216941833496094} -09/20/2021 21:31:10 - INFO - __main__ - Step 32466: {'lr': 0.00019966737303081847, 'samples': 1038912, 'steps': 2029, 'loss/train': 1.656340479850769} -09/20/2021 21:31:11 - INFO - __main__ - Step 32467: {'lr': 0.00019966737303081847, 'samples': 1038944, 'steps': 2029, 'loss/train': 2.4843289852142334} -09/20/2021 21:31:12 - INFO - __main__ - Step 32468: {'lr': 0.00019966737303081847, 'samples': 1038976, 'steps': 2029, 'loss/train': 3.112420082092285} -09/20/2021 21:31:12 - INFO - __main__ - Step 32469: {'lr': 0.00019966737303081847, 'samples': 1039008, 'steps': 2029, 'loss/train': 1.1513278484344482} -09/20/2021 21:31:13 - INFO - __main__ - Step 32470: {'lr': 0.00019966737303081847, 'samples': 1039040, 'steps': 2029, 'loss/train': 1.7783713340759277} -09/20/2021 21:31:14 - INFO - __main__ - Step 32471: {'lr': 0.00019966737303081847, 'samples': 1039072, 'steps': 2029, 'loss/train': 2.174381732940674} -09/20/2021 21:31:15 - INFO - __main__ - Step 32472: {'lr': 0.00019966737303081847, 'samples': 1039104, 'steps': 2029, 'loss/train': 1.7041610479354858} -09/20/2021 21:31:15 - INFO - __main__ - Step 32473: {'lr': 0.00019966737303081847, 'samples': 1039136, 'steps': 2029, 'loss/train': 2.4946537017822266} -09/20/2021 21:31:16 - INFO - __main__ - Step 32474: {'lr': 0.00019966737303081847, 'samples': 1039168, 'steps': 2029, 'loss/train': 2.459834337234497} -09/20/2021 21:31:17 - INFO - __main__ - Step 32475: {'lr': 0.00019966737303081847, 'samples': 1039200, 'steps': 2029, 'loss/train': 2.2268614768981934} -09/20/2021 21:31:18 - INFO - __main__ - Step 32476: {'lr': 0.00019966737303081847, 'samples': 1039232, 'steps': 2029, 'loss/train': 2.7348594665527344} -09/20/2021 21:31:18 - INFO - __main__ - Step 32477: {'lr': 0.00019966737303081847, 'samples': 1039264, 'steps': 2029, 'loss/train': 2.0686564445495605} -09/20/2021 21:31:19 - INFO - __main__ - Step 32478: {'lr': 0.00019966737303081847, 'samples': 1039296, 'steps': 2029, 'loss/train': 2.1925246715545654} -09/20/2021 21:31:20 - INFO - __main__ - Step 32479: {'lr': 0.00019966737303081847, 'samples': 1039328, 'steps': 2029, 'loss/train': 1.467162847518921} -09/20/2021 21:31:21 - INFO - __main__ - Step 32480: {'lr': 0.00019966737303081847, 'samples': 1039360, 'steps': 2029, 'loss/train': 0.880229115486145} -09/20/2021 21:31:21 - INFO - __main__ - Step 32481: {'lr': 0.00019966685298059423, 'samples': 1039392, 'steps': 2030, 'loss/train': 2.1700923442840576} -09/20/2021 21:31:22 - INFO - __main__ - Step 32482: {'lr': 0.00019966685298059423, 'samples': 1039424, 'steps': 2030, 'loss/train': 2.141040802001953} -09/20/2021 21:31:23 - INFO - __main__ - Step 32483: {'lr': 0.00019966685298059423, 'samples': 1039456, 'steps': 2030, 'loss/train': 3.087104082107544} -09/20/2021 21:31:25 - INFO - __main__ - Step 32484: {'lr': 0.00019966685298059423, 'samples': 1039488, 'steps': 2030, 'loss/train': 2.4247899055480957} -09/20/2021 21:31:25 - INFO - __main__ - Step 32485: {'lr': 0.00019966685298059423, 'samples': 1039520, 'steps': 2030, 'loss/train': 1.9798779487609863} -09/20/2021 21:31:26 - INFO - __main__ - Step 32486: {'lr': 0.00019966685298059423, 'samples': 1039552, 'steps': 2030, 'loss/train': 1.9689043760299683} -09/20/2021 21:31:27 - INFO - __main__ - Step 32487: {'lr': 0.00019966685298059423, 'samples': 1039584, 'steps': 2030, 'loss/train': 2.2986512184143066} -09/20/2021 21:31:28 - INFO - __main__ - Step 32488: {'lr': 0.00019966685298059423, 'samples': 1039616, 'steps': 2030, 'loss/train': 1.889029622077942} -09/20/2021 21:31:28 - INFO - __main__ - Step 32489: {'lr': 0.00019966685298059423, 'samples': 1039648, 'steps': 2030, 'loss/train': 2.98639178276062} -09/20/2021 21:31:29 - INFO - __main__ - Step 32490: {'lr': 0.00019966685298059423, 'samples': 1039680, 'steps': 2030, 'loss/train': 2.2446420192718506} -09/20/2021 21:31:30 - INFO - __main__ - Step 32491: {'lr': 0.00019966685298059423, 'samples': 1039712, 'steps': 2030, 'loss/train': 1.9247137308120728} -09/20/2021 21:31:31 - INFO - __main__ - Step 32492: {'lr': 0.00019966685298059423, 'samples': 1039744, 'steps': 2030, 'loss/train': 2.5435314178466797} -09/20/2021 21:31:31 - INFO - __main__ - Step 32493: {'lr': 0.00019966685298059423, 'samples': 1039776, 'steps': 2030, 'loss/train': 2.3579955101013184} -09/20/2021 21:31:32 - INFO - __main__ - Step 32494: {'lr': 0.00019966685298059423, 'samples': 1039808, 'steps': 2030, 'loss/train': 2.978102922439575} -09/20/2021 21:31:33 - INFO - __main__ - Step 32495: {'lr': 0.00019966685298059423, 'samples': 1039840, 'steps': 2030, 'loss/train': 2.2001192569732666} -09/20/2021 21:31:34 - INFO - __main__ - Step 32496: {'lr': 0.00019966685298059423, 'samples': 1039872, 'steps': 2030, 'loss/train': 2.444903612136841} -09/20/2021 21:31:34 - INFO - __main__ - Step 32497: {'lr': 0.00019966633252482602, 'samples': 1039904, 'steps': 2031, 'loss/train': 2.287644624710083} -09/20/2021 21:31:35 - INFO - __main__ - Step 32498: {'lr': 0.00019966633252482602, 'samples': 1039936, 'steps': 2031, 'loss/train': 2.0768697261810303} -09/20/2021 21:31:36 - INFO - __main__ - Step 32499: {'lr': 0.00019966633252482602, 'samples': 1039968, 'steps': 2031, 'loss/train': 2.798694133758545} -09/20/2021 21:31:37 - INFO - __main__ - Step 32500: {'lr': 0.00019966633252482602, 'samples': 1040000, 'steps': 2031, 'loss/train': 2.539886951446533} -09/20/2021 21:31:37 - INFO - __main__ - Step 32501: {'lr': 0.00019966633252482602, 'samples': 1040032, 'steps': 2031, 'loss/train': 1.422989010810852} -09/20/2021 21:31:38 - INFO - __main__ - Step 32502: {'lr': 0.00019966633252482602, 'samples': 1040064, 'steps': 2031, 'loss/train': 2.700456380844116} -09/20/2021 21:31:39 - INFO - __main__ - Step 32503: {'lr': 0.00019966633252482602, 'samples': 1040096, 'steps': 2031, 'loss/train': 4.408829212188721} -09/20/2021 21:31:40 - INFO - __main__ - Step 32504: {'lr': 0.00019966633252482602, 'samples': 1040128, 'steps': 2031, 'loss/train': 2.571106433868408} -09/20/2021 21:31:40 - INFO - __main__ - Step 32505: {'lr': 0.00019966633252482602, 'samples': 1040160, 'steps': 2031, 'loss/train': 0.37653031945228577} -09/20/2021 21:31:41 - INFO - __main__ - Step 32506: {'lr': 0.00019966633252482602, 'samples': 1040192, 'steps': 2031, 'loss/train': 0.35790714621543884} -09/20/2021 21:31:42 - INFO - __main__ - Step 32507: {'lr': 0.00019966633252482602, 'samples': 1040224, 'steps': 2031, 'loss/train': 0.3024829626083374} -09/20/2021 21:31:43 - INFO - __main__ - Step 32508: {'lr': 0.00019966633252482602, 'samples': 1040256, 'steps': 2031, 'loss/train': 2.769859790802002} -09/20/2021 21:31:43 - INFO - __main__ - Step 32509: {'lr': 0.00019966633252482602, 'samples': 1040288, 'steps': 2031, 'loss/train': 3.033914804458618} -09/20/2021 21:31:44 - INFO - __main__ - Step 32510: {'lr': 0.00019966633252482602, 'samples': 1040320, 'steps': 2031, 'loss/train': 2.299668312072754} -09/20/2021 21:31:45 - INFO - __main__ - Step 32511: {'lr': 0.00019966633252482602, 'samples': 1040352, 'steps': 2031, 'loss/train': 2.5955021381378174} -09/20/2021 21:31:46 - INFO - __main__ - Step 32512: {'lr': 0.00019966633252482602, 'samples': 1040384, 'steps': 2031, 'loss/train': 2.505572557449341} -09/20/2021 21:31:47 - INFO - __main__ - Step 32513: {'lr': 0.00019966581166351582, 'samples': 1040416, 'steps': 2032, 'loss/train': 3.1790759563446045} -09/20/2021 21:31:47 - INFO - __main__ - Step 32514: {'lr': 0.00019966581166351582, 'samples': 1040448, 'steps': 2032, 'loss/train': 0.5399327874183655} -09/20/2021 21:31:48 - INFO - __main__ - Step 32515: {'lr': 0.00019966581166351582, 'samples': 1040480, 'steps': 2032, 'loss/train': 0.2742493450641632} -09/20/2021 21:31:49 - INFO - __main__ - Step 32516: {'lr': 0.00019966581166351582, 'samples': 1040512, 'steps': 2032, 'loss/train': 0.3979310095310211} -09/20/2021 21:31:50 - INFO - __main__ - Step 32517: {'lr': 0.00019966581166351582, 'samples': 1040544, 'steps': 2032, 'loss/train': 0.22243192791938782} -09/20/2021 21:31:51 - INFO - __main__ - Step 32518: {'lr': 0.00019966581166351582, 'samples': 1040576, 'steps': 2032, 'loss/train': 0.42213425040245056} -09/20/2021 21:31:52 - INFO - __main__ - Step 32519: {'lr': 0.00019966581166351582, 'samples': 1040608, 'steps': 2032, 'loss/train': 1.0995075702667236} -09/20/2021 21:31:52 - INFO - __main__ - Step 32520: {'lr': 0.00019966581166351582, 'samples': 1040640, 'steps': 2032, 'loss/train': 1.6053465604782104} -09/20/2021 21:31:53 - INFO - __main__ - Step 32521: {'lr': 0.00019966581166351582, 'samples': 1040672, 'steps': 2032, 'loss/train': 4.227639198303223} -09/20/2021 21:31:54 - INFO - __main__ - Step 32522: {'lr': 0.00019966581166351582, 'samples': 1040704, 'steps': 2032, 'loss/train': 2.138082265853882} -09/20/2021 21:31:55 - INFO - __main__ - Step 32523: {'lr': 0.00019966581166351582, 'samples': 1040736, 'steps': 2032, 'loss/train': 2.994032382965088} -09/20/2021 21:31:56 - INFO - __main__ - Step 32524: {'lr': 0.00019966581166351582, 'samples': 1040768, 'steps': 2032, 'loss/train': 2.179990291595459} -09/20/2021 21:31:56 - INFO - __main__ - Step 32525: {'lr': 0.00019966581166351582, 'samples': 1040800, 'steps': 2032, 'loss/train': 3.2342422008514404} -09/20/2021 21:31:57 - INFO - __main__ - Step 32526: {'lr': 0.00019966581166351582, 'samples': 1040832, 'steps': 2032, 'loss/train': 3.465459108352661} -09/20/2021 21:31:58 - INFO - __main__ - Step 32527: {'lr': 0.00019966581166351582, 'samples': 1040864, 'steps': 2032, 'loss/train': 2.694666862487793} -09/20/2021 21:31:59 - INFO - __main__ - Step 32528: {'lr': 0.00019966581166351582, 'samples': 1040896, 'steps': 2032, 'loss/train': 2.0177135467529297} -09/20/2021 21:31:59 - INFO - __main__ - Step 32529: {'lr': 0.00019966529039666585, 'samples': 1040928, 'steps': 2033, 'loss/train': 2.3784542083740234} -09/20/2021 21:32:00 - INFO - __main__ - Step 32530: {'lr': 0.00019966529039666585, 'samples': 1040960, 'steps': 2033, 'loss/train': 3.1010794639587402} -09/20/2021 21:32:01 - INFO - __main__ - Step 32531: {'lr': 0.00019966529039666585, 'samples': 1040992, 'steps': 2033, 'loss/train': 2.1644845008850098} -09/20/2021 21:32:02 - INFO - __main__ - Step 32532: {'lr': 0.00019966529039666585, 'samples': 1041024, 'steps': 2033, 'loss/train': 1.7696466445922852} -09/20/2021 21:32:02 - INFO - __main__ - Step 32533: {'lr': 0.00019966529039666585, 'samples': 1041056, 'steps': 2033, 'loss/train': 2.289214849472046} -09/20/2021 21:32:03 - INFO - __main__ - Step 32534: {'lr': 0.00019966529039666585, 'samples': 1041088, 'steps': 2033, 'loss/train': 1.6904821395874023} -09/20/2021 21:32:04 - INFO - __main__ - Step 32535: {'lr': 0.00019966529039666585, 'samples': 1041120, 'steps': 2033, 'loss/train': 1.6978729963302612} -09/20/2021 21:32:05 - INFO - __main__ - Step 32536: {'lr': 0.00019966529039666585, 'samples': 1041152, 'steps': 2033, 'loss/train': 2.4365105628967285} -09/20/2021 21:32:05 - INFO - __main__ - Step 32537: {'lr': 0.00019966529039666585, 'samples': 1041184, 'steps': 2033, 'loss/train': 3.0675768852233887} -09/20/2021 21:32:06 - INFO - __main__ - Step 32538: {'lr': 0.00019966529039666585, 'samples': 1041216, 'steps': 2033, 'loss/train': 1.4605779647827148} -09/20/2021 21:32:07 - INFO - __main__ - Step 32539: {'lr': 0.00019966529039666585, 'samples': 1041248, 'steps': 2033, 'loss/train': 2.0529472827911377} -09/20/2021 21:32:08 - INFO - __main__ - Step 32540: {'lr': 0.00019966529039666585, 'samples': 1041280, 'steps': 2033, 'loss/train': 2.498216152191162} -09/20/2021 21:32:08 - INFO - __main__ - Step 32541: {'lr': 0.00019966529039666585, 'samples': 1041312, 'steps': 2033, 'loss/train': 1.8815556764602661} -09/20/2021 21:32:09 - INFO - __main__ - Step 32542: {'lr': 0.00019966529039666585, 'samples': 1041344, 'steps': 2033, 'loss/train': 1.2932302951812744} -09/20/2021 21:32:10 - INFO - __main__ - Step 32543: {'lr': 0.00019966529039666585, 'samples': 1041376, 'steps': 2033, 'loss/train': 1.6254701614379883} -09/20/2021 21:32:11 - INFO - __main__ - Step 32544: {'lr': 0.00019966529039666585, 'samples': 1041408, 'steps': 2033, 'loss/train': 0.5243287086486816} -09/20/2021 21:32:12 - INFO - __main__ - Step 32545: {'lr': 0.00019966476872427822, 'samples': 1041440, 'steps': 2034, 'loss/train': 1.2983423471450806} -09/20/2021 21:32:12 - INFO - __main__ - Step 32546: {'lr': 0.00019966476872427822, 'samples': 1041472, 'steps': 2034, 'loss/train': 1.9367188215255737} -09/20/2021 21:32:13 - INFO - __main__ - Step 32547: {'lr': 0.00019966476872427822, 'samples': 1041504, 'steps': 2034, 'loss/train': 2.017819881439209} -09/20/2021 21:32:14 - INFO - __main__ - Step 32548: {'lr': 0.00019966476872427822, 'samples': 1041536, 'steps': 2034, 'loss/train': 2.7421438694000244} -09/20/2021 21:32:15 - INFO - __main__ - Step 32549: {'lr': 0.00019966476872427822, 'samples': 1041568, 'steps': 2034, 'loss/train': 1.8677771091461182} -09/20/2021 21:32:16 - INFO - __main__ - Step 32550: {'lr': 0.00019966476872427822, 'samples': 1041600, 'steps': 2034, 'loss/train': 2.644139289855957} -09/20/2021 21:32:17 - INFO - __main__ - Step 32551: {'lr': 0.00019966476872427822, 'samples': 1041632, 'steps': 2034, 'loss/train': 3.1817739009857178} -09/20/2021 21:32:17 - INFO - __main__ - Step 32552: {'lr': 0.00019966476872427822, 'samples': 1041664, 'steps': 2034, 'loss/train': 1.992048978805542} -09/20/2021 21:32:18 - INFO - __main__ - Step 32553: {'lr': 0.00019966476872427822, 'samples': 1041696, 'steps': 2034, 'loss/train': 2.636895179748535} -09/20/2021 21:32:19 - INFO - __main__ - Step 32554: {'lr': 0.00019966476872427822, 'samples': 1041728, 'steps': 2034, 'loss/train': 2.639357089996338} -09/20/2021 21:32:20 - INFO - __main__ - Step 32555: {'lr': 0.00019966476872427822, 'samples': 1041760, 'steps': 2034, 'loss/train': 2.4495058059692383} -09/20/2021 21:32:20 - INFO - __main__ - Step 32556: {'lr': 0.00019966476872427822, 'samples': 1041792, 'steps': 2034, 'loss/train': 1.8490631580352783} -09/20/2021 21:32:21 - INFO - __main__ - Step 32557: {'lr': 0.00019966476872427822, 'samples': 1041824, 'steps': 2034, 'loss/train': 2.2786705493927} -09/20/2021 21:32:22 - INFO - __main__ - Step 32558: {'lr': 0.00019966476872427822, 'samples': 1041856, 'steps': 2034, 'loss/train': 2.337693214416504} -09/20/2021 21:32:23 - INFO - __main__ - Step 32559: {'lr': 0.00019966476872427822, 'samples': 1041888, 'steps': 2034, 'loss/train': 1.8894219398498535} -09/20/2021 21:32:23 - INFO - __main__ - Step 32560: {'lr': 0.00019966476872427822, 'samples': 1041920, 'steps': 2034, 'loss/train': 2.0882389545440674} -09/20/2021 21:32:24 - INFO - __main__ - Step 32561: {'lr': 0.000199664246646355, 'samples': 1041952, 'steps': 2035, 'loss/train': 2.5223824977874756} -09/20/2021 21:32:25 - INFO - __main__ - Step 32562: {'lr': 0.000199664246646355, 'samples': 1041984, 'steps': 2035, 'loss/train': 1.3262948989868164} -09/20/2021 21:32:26 - INFO - __main__ - Step 32563: {'lr': 0.000199664246646355, 'samples': 1042016, 'steps': 2035, 'loss/train': 3.042325973510742} -09/20/2021 21:32:26 - INFO - __main__ - Step 32564: {'lr': 0.000199664246646355, 'samples': 1042048, 'steps': 2035, 'loss/train': 2.539252758026123} -09/20/2021 21:32:27 - INFO - __main__ - Step 32565: {'lr': 0.000199664246646355, 'samples': 1042080, 'steps': 2035, 'loss/train': 2.0742015838623047} -09/20/2021 21:32:28 - INFO - __main__ - Step 32566: {'lr': 0.000199664246646355, 'samples': 1042112, 'steps': 2035, 'loss/train': 2.6330482959747314} -09/20/2021 21:32:29 - INFO - __main__ - Step 32567: {'lr': 0.000199664246646355, 'samples': 1042144, 'steps': 2035, 'loss/train': 1.109978199005127} -09/20/2021 21:32:29 - INFO - __main__ - Step 32568: {'lr': 0.000199664246646355, 'samples': 1042176, 'steps': 2035, 'loss/train': 1.9972537755966187} -09/20/2021 21:32:30 - INFO - __main__ - Step 32569: {'lr': 0.000199664246646355, 'samples': 1042208, 'steps': 2035, 'loss/train': 2.3915114402770996} -09/20/2021 21:32:31 - INFO - __main__ - Step 32570: {'lr': 0.000199664246646355, 'samples': 1042240, 'steps': 2035, 'loss/train': 2.056887626647949} -09/20/2021 21:32:32 - INFO - __main__ - Step 32571: {'lr': 0.000199664246646355, 'samples': 1042272, 'steps': 2035, 'loss/train': 1.870740294456482} -09/20/2021 21:32:32 - INFO - __main__ - Step 32572: {'lr': 0.000199664246646355, 'samples': 1042304, 'steps': 2035, 'loss/train': 2.4321448802948} -09/20/2021 21:32:33 - INFO - __main__ - Step 32573: {'lr': 0.000199664246646355, 'samples': 1042336, 'steps': 2035, 'loss/train': 2.7875020503997803} -09/20/2021 21:32:34 - INFO - __main__ - Step 32574: {'lr': 0.000199664246646355, 'samples': 1042368, 'steps': 2035, 'loss/train': 1.3915835618972778} -09/20/2021 21:32:35 - INFO - __main__ - Step 32575: {'lr': 0.000199664246646355, 'samples': 1042400, 'steps': 2035, 'loss/train': 2.23232364654541} -09/20/2021 21:32:35 - INFO - __main__ - Step 32576: {'lr': 0.000199664246646355, 'samples': 1042432, 'steps': 2035, 'loss/train': 2.1093647480010986} -09/20/2021 21:32:36 - INFO - __main__ - Step 32577: {'lr': 0.0001996637241628984, 'samples': 1042464, 'steps': 2036, 'loss/train': 2.2527577877044678} -09/20/2021 21:32:37 - INFO - __main__ - Step 32578: {'lr': 0.0001996637241628984, 'samples': 1042496, 'steps': 2036, 'loss/train': 1.4569765329360962} -09/20/2021 21:32:38 - INFO - __main__ - Step 32579: {'lr': 0.0001996637241628984, 'samples': 1042528, 'steps': 2036, 'loss/train': 2.7170536518096924} -09/20/2021 21:32:40 - INFO - __main__ - Step 32580: {'lr': 0.0001996637241628984, 'samples': 1042560, 'steps': 2036, 'loss/train': 3.0335395336151123} -09/20/2021 21:32:40 - INFO - __main__ - Step 32581: {'lr': 0.0001996637241628984, 'samples': 1042592, 'steps': 2036, 'loss/train': 2.2877604961395264} -09/20/2021 21:32:41 - INFO - __main__ - Step 32582: {'lr': 0.0001996637241628984, 'samples': 1042624, 'steps': 2036, 'loss/train': 2.1740472316741943} -09/20/2021 21:32:42 - INFO - __main__ - Step 32583: {'lr': 0.0001996637241628984, 'samples': 1042656, 'steps': 2036, 'loss/train': 2.365950107574463} -09/20/2021 21:32:43 - INFO - __main__ - Step 32584: {'lr': 0.0001996637241628984, 'samples': 1042688, 'steps': 2036, 'loss/train': 2.3191404342651367} -09/20/2021 21:32:43 - INFO - __main__ - Step 32585: {'lr': 0.0001996637241628984, 'samples': 1042720, 'steps': 2036, 'loss/train': 0.28454792499542236} -09/20/2021 21:32:44 - INFO - __main__ - Step 32586: {'lr': 0.0001996637241628984, 'samples': 1042752, 'steps': 2036, 'loss/train': 0.44397374987602234} -09/20/2021 21:32:45 - INFO - __main__ - Step 32587: {'lr': 0.0001996637241628984, 'samples': 1042784, 'steps': 2036, 'loss/train': 0.26955708861351013} -09/20/2021 21:32:46 - INFO - __main__ - Step 32588: {'lr': 0.0001996637241628984, 'samples': 1042816, 'steps': 2036, 'loss/train': 2.719620943069458} -09/20/2021 21:32:46 - INFO - __main__ - Step 32589: {'lr': 0.0001996637241628984, 'samples': 1042848, 'steps': 2036, 'loss/train': 1.3750324249267578} -09/20/2021 21:32:47 - INFO - __main__ - Step 32590: {'lr': 0.0001996637241628984, 'samples': 1042880, 'steps': 2036, 'loss/train': 2.3093249797821045} -09/20/2021 21:32:48 - INFO - __main__ - Step 32591: {'lr': 0.0001996637241628984, 'samples': 1042912, 'steps': 2036, 'loss/train': 2.868422746658325} -09/20/2021 21:32:49 - INFO - __main__ - Step 32592: {'lr': 0.0001996637241628984, 'samples': 1042944, 'steps': 2036, 'loss/train': 2.9833357334136963} -09/20/2021 21:32:50 - INFO - __main__ - Step 32593: {'lr': 0.00019966320127391045, 'samples': 1042976, 'steps': 2037, 'loss/train': 2.5595836639404297} -09/20/2021 21:32:50 - INFO - __main__ - Step 32594: {'lr': 0.00019966320127391045, 'samples': 1043008, 'steps': 2037, 'loss/train': 2.111285448074341} -09/20/2021 21:32:51 - INFO - __main__ - Step 32595: {'lr': 0.00019966320127391045, 'samples': 1043040, 'steps': 2037, 'loss/train': 2.7848968505859375} -09/20/2021 21:32:52 - INFO - __main__ - Step 32596: {'lr': 0.00019966320127391045, 'samples': 1043072, 'steps': 2037, 'loss/train': 2.8977057933807373} -09/20/2021 21:32:53 - INFO - __main__ - Step 32597: {'lr': 0.00019966320127391045, 'samples': 1043104, 'steps': 2037, 'loss/train': 3.1541974544525146} -09/20/2021 21:32:53 - INFO - __main__ - Step 32598: {'lr': 0.00019966320127391045, 'samples': 1043136, 'steps': 2037, 'loss/train': 2.0568323135375977} -09/20/2021 21:32:54 - INFO - __main__ - Step 32599: {'lr': 0.00019966320127391045, 'samples': 1043168, 'steps': 2037, 'loss/train': 2.5768048763275146} -09/20/2021 21:32:55 - INFO - __main__ - Step 32600: {'lr': 0.00019966320127391045, 'samples': 1043200, 'steps': 2037, 'loss/train': 2.704700469970703} -09/20/2021 21:32:56 - INFO - __main__ - Step 32601: {'lr': 0.00019966320127391045, 'samples': 1043232, 'steps': 2037, 'loss/train': 2.072108745574951} -09/20/2021 21:32:56 - INFO - __main__ - Step 32602: {'lr': 0.00019966320127391045, 'samples': 1043264, 'steps': 2037, 'loss/train': 2.6255972385406494} -09/20/2021 21:32:57 - INFO - __main__ - Step 32603: {'lr': 0.00019966320127391045, 'samples': 1043296, 'steps': 2037, 'loss/train': 2.1245665550231934} -09/20/2021 21:32:58 - INFO - __main__ - Step 32604: {'lr': 0.00019966320127391045, 'samples': 1043328, 'steps': 2037, 'loss/train': 2.8822779655456543} -09/20/2021 21:32:59 - INFO - __main__ - Step 32605: {'lr': 0.00019966320127391045, 'samples': 1043360, 'steps': 2037, 'loss/train': 2.214048385620117} -09/20/2021 21:32:59 - INFO - __main__ - Step 32606: {'lr': 0.00019966320127391045, 'samples': 1043392, 'steps': 2037, 'loss/train': 1.644019365310669} -09/20/2021 21:33:00 - INFO - __main__ - Step 32607: {'lr': 0.00019966320127391045, 'samples': 1043424, 'steps': 2037, 'loss/train': 2.874356269836426} -09/20/2021 21:33:01 - INFO - __main__ - Step 32608: {'lr': 0.00019966320127391045, 'samples': 1043456, 'steps': 2037, 'loss/train': 2.723879098892212} -09/20/2021 21:33:02 - INFO - __main__ - Step 32609: {'lr': 0.0001996626779793933, 'samples': 1043488, 'steps': 2038, 'loss/train': 2.3923161029815674} -09/20/2021 21:33:02 - INFO - __main__ - Step 32610: {'lr': 0.0001996626779793933, 'samples': 1043520, 'steps': 2038, 'loss/train': 2.5410683155059814} -09/20/2021 21:33:04 - INFO - __main__ - Step 32611: {'lr': 0.0001996626779793933, 'samples': 1043552, 'steps': 2038, 'loss/train': 1.8691129684448242} -09/20/2021 21:33:05 - INFO - __main__ - Step 32612: {'lr': 0.0001996626779793933, 'samples': 1043584, 'steps': 2038, 'loss/train': 1.7273571491241455} -09/20/2021 21:33:05 - INFO - __main__ - Step 32613: {'lr': 0.0001996626779793933, 'samples': 1043616, 'steps': 2038, 'loss/train': 2.3775792121887207} -09/20/2021 21:33:06 - INFO - __main__ - Step 32614: {'lr': 0.0001996626779793933, 'samples': 1043648, 'steps': 2038, 'loss/train': 1.2154158353805542} -09/20/2021 21:33:07 - INFO - __main__ - Step 32615: {'lr': 0.0001996626779793933, 'samples': 1043680, 'steps': 2038, 'loss/train': 2.303837537765503} -09/20/2021 21:33:08 - INFO - __main__ - Step 32616: {'lr': 0.0001996626779793933, 'samples': 1043712, 'steps': 2038, 'loss/train': 0.5526332855224609} -09/20/2021 21:33:08 - INFO - __main__ - Step 32617: {'lr': 0.0001996626779793933, 'samples': 1043744, 'steps': 2038, 'loss/train': 0.8380908370018005} -09/20/2021 21:33:09 - INFO - __main__ - Step 32618: {'lr': 0.0001996626779793933, 'samples': 1043776, 'steps': 2038, 'loss/train': 1.6869032382965088} -09/20/2021 21:33:10 - INFO - __main__ - Step 32619: {'lr': 0.0001996626779793933, 'samples': 1043808, 'steps': 2038, 'loss/train': 2.2148077487945557} -09/20/2021 21:33:11 - INFO - __main__ - Step 32620: {'lr': 0.0001996626779793933, 'samples': 1043840, 'steps': 2038, 'loss/train': 2.5440168380737305} -09/20/2021 21:33:11 - INFO - __main__ - Step 32621: {'lr': 0.0001996626779793933, 'samples': 1043872, 'steps': 2038, 'loss/train': 2.3814728260040283} -09/20/2021 21:33:12 - INFO - __main__ - Step 32622: {'lr': 0.0001996626779793933, 'samples': 1043904, 'steps': 2038, 'loss/train': 3.3255298137664795} -09/20/2021 21:33:13 - INFO - __main__ - Step 32623: {'lr': 0.0001996626779793933, 'samples': 1043936, 'steps': 2038, 'loss/train': 2.7990188598632812} -09/20/2021 21:33:14 - INFO - __main__ - Step 32624: {'lr': 0.0001996626779793933, 'samples': 1043968, 'steps': 2038, 'loss/train': 2.211758852005005} -09/20/2021 21:33:14 - INFO - __main__ - Step 32625: {'lr': 0.00019966215427934914, 'samples': 1044000, 'steps': 2039, 'loss/train': 2.7087671756744385} -09/20/2021 21:33:15 - INFO - __main__ - Step 32626: {'lr': 0.00019966215427934914, 'samples': 1044032, 'steps': 2039, 'loss/train': 2.15565824508667} -09/20/2021 21:33:16 - INFO - __main__ - Step 32627: {'lr': 0.00019966215427934914, 'samples': 1044064, 'steps': 2039, 'loss/train': 2.256304979324341} -09/20/2021 21:33:17 - INFO - __main__ - Step 32628: {'lr': 0.00019966215427934914, 'samples': 1044096, 'steps': 2039, 'loss/train': 3.1904685497283936} -09/20/2021 21:33:17 - INFO - __main__ - Step 32629: {'lr': 0.00019966215427934914, 'samples': 1044128, 'steps': 2039, 'loss/train': 2.955214023590088} -09/20/2021 21:33:18 - INFO - __main__ - Step 32630: {'lr': 0.00019966215427934914, 'samples': 1044160, 'steps': 2039, 'loss/train': 2.044595956802368} -09/20/2021 21:33:19 - INFO - __main__ - Step 32631: {'lr': 0.00019966215427934914, 'samples': 1044192, 'steps': 2039, 'loss/train': 2.1444432735443115} -09/20/2021 21:33:20 - INFO - __main__ - Step 32632: {'lr': 0.00019966215427934914, 'samples': 1044224, 'steps': 2039, 'loss/train': 3.229004383087158} -09/20/2021 21:33:20 - INFO - __main__ - Step 32633: {'lr': 0.00019966215427934914, 'samples': 1044256, 'steps': 2039, 'loss/train': 1.5177078247070312} -09/20/2021 21:33:21 - INFO - __main__ - Step 32634: {'lr': 0.00019966215427934914, 'samples': 1044288, 'steps': 2039, 'loss/train': 1.4446048736572266} -09/20/2021 21:33:22 - INFO - __main__ - Step 32635: {'lr': 0.00019966215427934914, 'samples': 1044320, 'steps': 2039, 'loss/train': 1.526166319847107} -09/20/2021 21:33:23 - INFO - __main__ - Step 32636: {'lr': 0.00019966215427934914, 'samples': 1044352, 'steps': 2039, 'loss/train': 1.3936853408813477} -09/20/2021 21:33:23 - INFO - __main__ - Step 32637: {'lr': 0.00019966215427934914, 'samples': 1044384, 'steps': 2039, 'loss/train': 2.919045925140381} -09/20/2021 21:33:24 - INFO - __main__ - Step 32638: {'lr': 0.00019966215427934914, 'samples': 1044416, 'steps': 2039, 'loss/train': 2.838405132293701} -09/20/2021 21:33:25 - INFO - __main__ - Step 32639: {'lr': 0.00019966215427934914, 'samples': 1044448, 'steps': 2039, 'loss/train': 1.8733749389648438} -09/20/2021 21:33:26 - INFO - __main__ - Step 32640: {'lr': 0.00019966215427934914, 'samples': 1044480, 'steps': 2039, 'loss/train': 2.5906684398651123} -09/20/2021 21:33:27 - INFO - __main__ - Step 32641: {'lr': 0.00019966163017378006, 'samples': 1044512, 'steps': 2040, 'loss/train': 1.6687380075454712} -09/20/2021 21:33:28 - INFO - __main__ - Step 32642: {'lr': 0.00019966163017378006, 'samples': 1044544, 'steps': 2040, 'loss/train': 1.1802458763122559} -09/20/2021 21:33:29 - INFO - __main__ - Step 32643: {'lr': 0.00019966163017378006, 'samples': 1044576, 'steps': 2040, 'loss/train': 2.8347408771514893} -09/20/2021 21:33:29 - INFO - __main__ - Step 32644: {'lr': 0.00019966163017378006, 'samples': 1044608, 'steps': 2040, 'loss/train': 1.7746577262878418} -09/20/2021 21:33:30 - INFO - __main__ - Step 32645: {'lr': 0.00019966163017378006, 'samples': 1044640, 'steps': 2040, 'loss/train': 2.6159963607788086} -09/20/2021 21:33:31 - INFO - __main__ - Step 32646: {'lr': 0.00019966163017378006, 'samples': 1044672, 'steps': 2040, 'loss/train': 2.8423361778259277} -09/20/2021 21:33:32 - INFO - __main__ - Step 32647: {'lr': 0.00019966163017378006, 'samples': 1044704, 'steps': 2040, 'loss/train': 1.997196912765503} -09/20/2021 21:33:32 - INFO - __main__ - Step 32648: {'lr': 0.00019966163017378006, 'samples': 1044736, 'steps': 2040, 'loss/train': 2.547022581100464} -09/20/2021 21:33:33 - INFO - __main__ - Step 32649: {'lr': 0.00019966163017378006, 'samples': 1044768, 'steps': 2040, 'loss/train': 2.120776891708374} -09/20/2021 21:33:34 - INFO - __main__ - Step 32650: {'lr': 0.00019966163017378006, 'samples': 1044800, 'steps': 2040, 'loss/train': 0.8098393082618713} -09/20/2021 21:33:35 - INFO - __main__ - Step 32651: {'lr': 0.00019966163017378006, 'samples': 1044832, 'steps': 2040, 'loss/train': 0.200203076004982} -09/20/2021 21:33:35 - INFO - __main__ - Step 32652: {'lr': 0.00019966163017378006, 'samples': 1044864, 'steps': 2040, 'loss/train': 0.1420024335384369} -09/20/2021 21:33:36 - INFO - __main__ - Step 32653: {'lr': 0.00019966163017378006, 'samples': 1044896, 'steps': 2040, 'loss/train': 2.418588638305664} -09/20/2021 21:33:37 - INFO - __main__ - Step 32654: {'lr': 0.00019966163017378006, 'samples': 1044928, 'steps': 2040, 'loss/train': 2.4547669887542725} -09/20/2021 21:33:38 - INFO - __main__ - Step 32655: {'lr': 0.00019966163017378006, 'samples': 1044960, 'steps': 2040, 'loss/train': 2.1008005142211914} -09/20/2021 21:33:38 - INFO - __main__ - Step 32656: {'lr': 0.00019966163017378006, 'samples': 1044992, 'steps': 2040, 'loss/train': 1.84257972240448} -09/20/2021 21:33:39 - INFO - __main__ - Step 32657: {'lr': 0.00019966110566268816, 'samples': 1045024, 'steps': 2041, 'loss/train': 2.1563730239868164} -09/20/2021 21:33:40 - INFO - __main__ - Step 32658: {'lr': 0.00019966110566268816, 'samples': 1045056, 'steps': 2041, 'loss/train': 3.06589937210083} -09/20/2021 21:33:41 - INFO - __main__ - Step 32659: {'lr': 0.00019966110566268816, 'samples': 1045088, 'steps': 2041, 'loss/train': 2.9173471927642822} -09/20/2021 21:33:42 - INFO - __main__ - Step 32660: {'lr': 0.00019966110566268816, 'samples': 1045120, 'steps': 2041, 'loss/train': 2.6304004192352295} -09/20/2021 21:33:42 - INFO - __main__ - Step 32661: {'lr': 0.00019966110566268816, 'samples': 1045152, 'steps': 2041, 'loss/train': 2.488929271697998} -09/20/2021 21:33:43 - INFO - __main__ - Step 32662: {'lr': 0.00019966110566268816, 'samples': 1045184, 'steps': 2041, 'loss/train': 1.6415081024169922} -09/20/2021 21:33:44 - INFO - __main__ - Step 32663: {'lr': 0.00019966110566268816, 'samples': 1045216, 'steps': 2041, 'loss/train': 2.007702589035034} -09/20/2021 21:33:45 - INFO - __main__ - Step 32664: {'lr': 0.00019966110566268816, 'samples': 1045248, 'steps': 2041, 'loss/train': 2.1519148349761963} -09/20/2021 21:33:45 - INFO - __main__ - Step 32665: {'lr': 0.00019966110566268816, 'samples': 1045280, 'steps': 2041, 'loss/train': 2.138951301574707} -09/20/2021 21:33:46 - INFO - __main__ - Step 32666: {'lr': 0.00019966110566268816, 'samples': 1045312, 'steps': 2041, 'loss/train': 2.149357795715332} -09/20/2021 21:33:47 - INFO - __main__ - Step 32667: {'lr': 0.00019966110566268816, 'samples': 1045344, 'steps': 2041, 'loss/train': 2.0098423957824707} -09/20/2021 21:33:48 - INFO - __main__ - Step 32668: {'lr': 0.00019966110566268816, 'samples': 1045376, 'steps': 2041, 'loss/train': 2.10962176322937} -09/20/2021 21:33:48 - INFO - __main__ - Step 32669: {'lr': 0.00019966110566268816, 'samples': 1045408, 'steps': 2041, 'loss/train': 1.5779248476028442} -09/20/2021 21:33:49 - INFO - __main__ - Step 32670: {'lr': 0.00019966110566268816, 'samples': 1045440, 'steps': 2041, 'loss/train': 2.644857883453369} -09/20/2021 21:33:50 - INFO - __main__ - Step 32671: {'lr': 0.00019966110566268816, 'samples': 1045472, 'steps': 2041, 'loss/train': 2.0755717754364014} -09/20/2021 21:33:51 - INFO - __main__ - Step 32672: {'lr': 0.00019966110566268816, 'samples': 1045504, 'steps': 2041, 'loss/train': 2.8490149974823} -09/20/2021 21:33:51 - INFO - __main__ - Step 32673: {'lr': 0.00019966058074607566, 'samples': 1045536, 'steps': 2042, 'loss/train': 0.45861658453941345} -09/20/2021 21:33:53 - INFO - __main__ - Step 32674: {'lr': 0.00019966058074607566, 'samples': 1045568, 'steps': 2042, 'loss/train': 2.297268867492676} -09/20/2021 21:33:54 - INFO - __main__ - Step 32675: {'lr': 0.00019966058074607566, 'samples': 1045600, 'steps': 2042, 'loss/train': 3.4263179302215576} -09/20/2021 21:33:54 - INFO - __main__ - Step 32676: {'lr': 0.00019966058074607566, 'samples': 1045632, 'steps': 2042, 'loss/train': 2.1203465461730957} -09/20/2021 21:33:55 - INFO - __main__ - Step 32677: {'lr': 0.00019966058074607566, 'samples': 1045664, 'steps': 2042, 'loss/train': 2.5088157653808594} -09/20/2021 21:33:56 - INFO - __main__ - Step 32678: {'lr': 0.00019966058074607566, 'samples': 1045696, 'steps': 2042, 'loss/train': 2.2261171340942383} -09/20/2021 21:33:57 - INFO - __main__ - Step 32679: {'lr': 0.00019966058074607566, 'samples': 1045728, 'steps': 2042, 'loss/train': 1.8452503681182861} -09/20/2021 21:33:57 - INFO - __main__ - Step 32680: {'lr': 0.00019966058074607566, 'samples': 1045760, 'steps': 2042, 'loss/train': 1.0510413646697998} -09/20/2021 21:33:58 - INFO - __main__ - Step 32681: {'lr': 0.00019966058074607566, 'samples': 1045792, 'steps': 2042, 'loss/train': 0.8101347088813782} -09/20/2021 21:33:59 - INFO - __main__ - Step 32682: {'lr': 0.00019966058074607566, 'samples': 1045824, 'steps': 2042, 'loss/train': 1.4301904439926147} -09/20/2021 21:34:00 - INFO - __main__ - Step 32683: {'lr': 0.00019966058074607566, 'samples': 1045856, 'steps': 2042, 'loss/train': 2.160043239593506} -09/20/2021 21:34:00 - INFO - __main__ - Step 32684: {'lr': 0.00019966058074607566, 'samples': 1045888, 'steps': 2042, 'loss/train': 2.2574398517608643} -09/20/2021 21:34:01 - INFO - __main__ - Step 32685: {'lr': 0.00019966058074607566, 'samples': 1045920, 'steps': 2042, 'loss/train': 2.067841053009033} -09/20/2021 21:34:02 - INFO - __main__ - Step 32686: {'lr': 0.00019966058074607566, 'samples': 1045952, 'steps': 2042, 'loss/train': 2.5590567588806152} -09/20/2021 21:34:03 - INFO - __main__ - Step 32687: {'lr': 0.00019966058074607566, 'samples': 1045984, 'steps': 2042, 'loss/train': 0.7493231296539307} -09/20/2021 21:34:03 - INFO - __main__ - Step 32688: {'lr': 0.00019966058074607566, 'samples': 1046016, 'steps': 2042, 'loss/train': 3.2094228267669678} -09/20/2021 21:34:04 - INFO - __main__ - Step 32689: {'lr': 0.0001996600554239446, 'samples': 1046048, 'steps': 2043, 'loss/train': 2.3298633098602295} -09/20/2021 21:34:05 - INFO - __main__ - Step 32690: {'lr': 0.0001996600554239446, 'samples': 1046080, 'steps': 2043, 'loss/train': 2.6316604614257812} -09/20/2021 21:34:06 - INFO - __main__ - Step 32691: {'lr': 0.0001996600554239446, 'samples': 1046112, 'steps': 2043, 'loss/train': 3.2672338485717773} -09/20/2021 21:34:06 - INFO - __main__ - Step 32692: {'lr': 0.0001996600554239446, 'samples': 1046144, 'steps': 2043, 'loss/train': 0.43917831778526306} -09/20/2021 21:34:07 - INFO - __main__ - Step 32693: {'lr': 0.0001996600554239446, 'samples': 1046176, 'steps': 2043, 'loss/train': 2.761843204498291} -09/20/2021 21:34:08 - INFO - __main__ - Step 32694: {'lr': 0.0001996600554239446, 'samples': 1046208, 'steps': 2043, 'loss/train': 3.1817262172698975} -09/20/2021 21:34:09 - INFO - __main__ - Step 32695: {'lr': 0.0001996600554239446, 'samples': 1046240, 'steps': 2043, 'loss/train': 3.375166893005371} -09/20/2021 21:34:09 - INFO - __main__ - Step 32696: {'lr': 0.0001996600554239446, 'samples': 1046272, 'steps': 2043, 'loss/train': 2.692704439163208} -09/20/2021 21:34:10 - INFO - __main__ - Step 32697: {'lr': 0.0001996600554239446, 'samples': 1046304, 'steps': 2043, 'loss/train': 2.426002264022827} -09/20/2021 21:34:11 - INFO - __main__ - Step 32698: {'lr': 0.0001996600554239446, 'samples': 1046336, 'steps': 2043, 'loss/train': 1.5791220664978027} -09/20/2021 21:34:12 - INFO - __main__ - Step 32699: {'lr': 0.0001996600554239446, 'samples': 1046368, 'steps': 2043, 'loss/train': 1.430106520652771} -09/20/2021 21:34:12 - INFO - __main__ - Step 32700: {'lr': 0.0001996600554239446, 'samples': 1046400, 'steps': 2043, 'loss/train': 1.7624322175979614} -09/20/2021 21:34:13 - INFO - __main__ - Step 32701: {'lr': 0.0001996600554239446, 'samples': 1046432, 'steps': 2043, 'loss/train': 2.766115665435791} -09/20/2021 21:34:14 - INFO - __main__ - Step 32702: {'lr': 0.0001996600554239446, 'samples': 1046464, 'steps': 2043, 'loss/train': 2.573235273361206} -09/20/2021 21:34:15 - INFO - __main__ - Step 32703: {'lr': 0.0001996600554239446, 'samples': 1046496, 'steps': 2043, 'loss/train': 2.5014662742614746} -09/20/2021 21:34:16 - INFO - __main__ - Step 32704: {'lr': 0.0001996600554239446, 'samples': 1046528, 'steps': 2043, 'loss/train': 2.4665610790252686} -09/20/2021 21:34:17 - INFO - __main__ - Step 32705: {'lr': 0.00019965952969629717, 'samples': 1046560, 'steps': 2044, 'loss/train': 2.261352777481079} -09/20/2021 21:34:18 - INFO - __main__ - Step 32706: {'lr': 0.00019965952969629717, 'samples': 1046592, 'steps': 2044, 'loss/train': 0.9359139800071716} -09/20/2021 21:34:18 - INFO - __main__ - Step 32707: {'lr': 0.00019965952969629717, 'samples': 1046624, 'steps': 2044, 'loss/train': 3.1278553009033203} -09/20/2021 21:34:19 - INFO - __main__ - Step 32708: {'lr': 0.00019965952969629717, 'samples': 1046656, 'steps': 2044, 'loss/train': 2.4833180904388428} -09/20/2021 21:34:20 - INFO - __main__ - Step 32709: {'lr': 0.00019965952969629717, 'samples': 1046688, 'steps': 2044, 'loss/train': 1.7310385704040527} -09/20/2021 21:34:21 - INFO - __main__ - Step 32710: {'lr': 0.00019965952969629717, 'samples': 1046720, 'steps': 2044, 'loss/train': 2.1572091579437256} -09/20/2021 21:34:21 - INFO - __main__ - Step 32711: {'lr': 0.00019965952969629717, 'samples': 1046752, 'steps': 2044, 'loss/train': 3.1833267211914062} -09/20/2021 21:34:22 - INFO - __main__ - Step 32712: {'lr': 0.00019965952969629717, 'samples': 1046784, 'steps': 2044, 'loss/train': 0.3350335359573364} -09/20/2021 21:34:23 - INFO - __main__ - Step 32713: {'lr': 0.00019965952969629717, 'samples': 1046816, 'steps': 2044, 'loss/train': 2.933912515640259} -09/20/2021 21:34:24 - INFO - __main__ - Step 32714: {'lr': 0.00019965952969629717, 'samples': 1046848, 'steps': 2044, 'loss/train': 2.7775156497955322} -09/20/2021 21:34:24 - INFO - __main__ - Step 32715: {'lr': 0.00019965952969629717, 'samples': 1046880, 'steps': 2044, 'loss/train': 2.132655382156372} -09/20/2021 21:34:25 - INFO - __main__ - Step 32716: {'lr': 0.00019965952969629717, 'samples': 1046912, 'steps': 2044, 'loss/train': 1.2225075960159302} -09/20/2021 21:34:26 - INFO - __main__ - Step 32717: {'lr': 0.00019965952969629717, 'samples': 1046944, 'steps': 2044, 'loss/train': 2.173227310180664} -09/20/2021 21:34:27 - INFO - __main__ - Step 32718: {'lr': 0.00019965952969629717, 'samples': 1046976, 'steps': 2044, 'loss/train': 2.385607957839966} -09/20/2021 21:34:27 - INFO - __main__ - Step 32719: {'lr': 0.00019965952969629717, 'samples': 1047008, 'steps': 2044, 'loss/train': 2.2271409034729004} -09/20/2021 21:34:28 - INFO - __main__ - Step 32720: {'lr': 0.00019965952969629717, 'samples': 1047040, 'steps': 2044, 'loss/train': 2.310774564743042} -09/20/2021 21:34:29 - INFO - __main__ - Step 32721: {'lr': 0.00019965900356313553, 'samples': 1047072, 'steps': 2045, 'loss/train': 1.061257243156433} -09/20/2021 21:34:30 - INFO - __main__ - Step 32722: {'lr': 0.00019965900356313553, 'samples': 1047104, 'steps': 2045, 'loss/train': 2.367178201675415} -09/20/2021 21:34:30 - INFO - __main__ - Step 32723: {'lr': 0.00019965900356313553, 'samples': 1047136, 'steps': 2045, 'loss/train': 3.0633413791656494} -09/20/2021 21:34:31 - INFO - __main__ - Step 32724: {'lr': 0.00019965900356313553, 'samples': 1047168, 'steps': 2045, 'loss/train': 2.7714593410491943} -09/20/2021 21:34:32 - INFO - __main__ - Step 32725: {'lr': 0.00019965900356313553, 'samples': 1047200, 'steps': 2045, 'loss/train': 1.3649041652679443} -09/20/2021 21:34:33 - INFO - __main__ - Step 32726: {'lr': 0.00019965900356313553, 'samples': 1047232, 'steps': 2045, 'loss/train': 1.3806489706039429} -09/20/2021 21:34:33 - INFO - __main__ - Step 32727: {'lr': 0.00019965900356313553, 'samples': 1047264, 'steps': 2045, 'loss/train': 2.537029266357422} -09/20/2021 21:34:34 - INFO - __main__ - Step 32728: {'lr': 0.00019965900356313553, 'samples': 1047296, 'steps': 2045, 'loss/train': 2.9128148555755615} -09/20/2021 21:34:35 - INFO - __main__ - Step 32729: {'lr': 0.00019965900356313553, 'samples': 1047328, 'steps': 2045, 'loss/train': 2.4151759147644043} -09/20/2021 21:34:36 - INFO - __main__ - Step 32730: {'lr': 0.00019965900356313553, 'samples': 1047360, 'steps': 2045, 'loss/train': 2.1468746662139893} -09/20/2021 21:34:36 - INFO - __main__ - Step 32731: {'lr': 0.00019965900356313553, 'samples': 1047392, 'steps': 2045, 'loss/train': 2.1564624309539795} -09/20/2021 21:34:37 - INFO - __main__ - Step 32732: {'lr': 0.00019965900356313553, 'samples': 1047424, 'steps': 2045, 'loss/train': 2.38714337348938} -09/20/2021 21:34:38 - INFO - __main__ - Step 32733: {'lr': 0.00019965900356313553, 'samples': 1047456, 'steps': 2045, 'loss/train': 3.033792495727539} -09/20/2021 21:34:39 - INFO - __main__ - Step 32734: {'lr': 0.00019965900356313553, 'samples': 1047488, 'steps': 2045, 'loss/train': 1.5836520195007324} -09/20/2021 21:34:40 - INFO - __main__ - Step 32735: {'lr': 0.00019965900356313553, 'samples': 1047520, 'steps': 2045, 'loss/train': 2.1603639125823975} -09/20/2021 21:34:41 - INFO - __main__ - Step 32736: {'lr': 0.00019965900356313553, 'samples': 1047552, 'steps': 2045, 'loss/train': 1.9479570388793945} -09/20/2021 21:34:42 - INFO - __main__ - Step 32737: {'lr': 0.00019965847702446175, 'samples': 1047584, 'steps': 2046, 'loss/train': 2.493222951889038} -09/20/2021 21:34:42 - INFO - __main__ - Step 32738: {'lr': 0.00019965847702446175, 'samples': 1047616, 'steps': 2046, 'loss/train': 2.6391243934631348} -09/20/2021 21:34:43 - INFO - __main__ - Step 32739: {'lr': 0.00019965847702446175, 'samples': 1047648, 'steps': 2046, 'loss/train': 2.9543697834014893} -09/20/2021 21:34:44 - INFO - __main__ - Step 32740: {'lr': 0.00019965847702446175, 'samples': 1047680, 'steps': 2046, 'loss/train': 2.288208246231079} -09/20/2021 21:34:45 - INFO - __main__ - Step 32741: {'lr': 0.00019965847702446175, 'samples': 1047712, 'steps': 2046, 'loss/train': 2.1747734546661377} -09/20/2021 21:34:45 - INFO - __main__ - Step 32742: {'lr': 0.00019965847702446175, 'samples': 1047744, 'steps': 2046, 'loss/train': 2.1099884510040283} -09/20/2021 21:34:46 - INFO - __main__ - Step 32743: {'lr': 0.00019965847702446175, 'samples': 1047776, 'steps': 2046, 'loss/train': 2.0689234733581543} -09/20/2021 21:34:47 - INFO - __main__ - Step 32744: {'lr': 0.00019965847702446175, 'samples': 1047808, 'steps': 2046, 'loss/train': 2.6255602836608887} -09/20/2021 21:34:48 - INFO - __main__ - Step 32745: {'lr': 0.00019965847702446175, 'samples': 1047840, 'steps': 2046, 'loss/train': 1.6561123132705688} -09/20/2021 21:34:48 - INFO - __main__ - Step 32746: {'lr': 0.00019965847702446175, 'samples': 1047872, 'steps': 2046, 'loss/train': 2.525963068008423} -09/20/2021 21:34:49 - INFO - __main__ - Step 32747: {'lr': 0.00019965847702446175, 'samples': 1047904, 'steps': 2046, 'loss/train': 2.6168088912963867} -09/20/2021 21:34:50 - INFO - __main__ - Step 32748: {'lr': 0.00019965847702446175, 'samples': 1047936, 'steps': 2046, 'loss/train': 1.8240251541137695} -09/20/2021 21:34:51 - INFO - __main__ - Step 32749: {'lr': 0.00019965847702446175, 'samples': 1047968, 'steps': 2046, 'loss/train': 1.896662950515747} -09/20/2021 21:34:51 - INFO - __main__ - Step 32750: {'lr': 0.00019965847702446175, 'samples': 1048000, 'steps': 2046, 'loss/train': 1.450797438621521} -09/20/2021 21:34:52 - INFO - __main__ - Step 32751: {'lr': 0.00019965847702446175, 'samples': 1048032, 'steps': 2046, 'loss/train': 1.846333384513855} -09/20/2021 21:34:53 - INFO - __main__ - Step 32752: {'lr': 0.00019965847702446175, 'samples': 1048064, 'steps': 2046, 'loss/train': 1.9536445140838623} -09/20/2021 21:34:54 - INFO - __main__ - Step 32753: {'lr': 0.00019965795008027804, 'samples': 1048096, 'steps': 2047, 'loss/train': 2.3622262477874756} -09/20/2021 21:34:55 - INFO - __main__ - Step 32754: {'lr': 0.00019965795008027804, 'samples': 1048128, 'steps': 2047, 'loss/train': 1.3078664541244507} -09/20/2021 21:34:55 - INFO - __main__ - Step 32755: {'lr': 0.00019965795008027804, 'samples': 1048160, 'steps': 2047, 'loss/train': 2.470363140106201} -09/20/2021 21:34:56 - INFO - __main__ - Step 32756: {'lr': 0.00019965795008027804, 'samples': 1048192, 'steps': 2047, 'loss/train': 1.76386559009552} -09/20/2021 21:34:57 - INFO - __main__ - Step 32757: {'lr': 0.00019965795008027804, 'samples': 1048224, 'steps': 2047, 'loss/train': 2.341087818145752} -09/20/2021 21:34:58 - INFO - __main__ - Step 32758: {'lr': 0.00019965795008027804, 'samples': 1048256, 'steps': 2047, 'loss/train': 2.2334752082824707} -09/20/2021 21:34:58 - INFO - __main__ - Step 32759: {'lr': 0.00019965795008027804, 'samples': 1048288, 'steps': 2047, 'loss/train': 2.898646593093872} -09/20/2021 21:34:59 - INFO - __main__ - Step 32760: {'lr': 0.00019965795008027804, 'samples': 1048320, 'steps': 2047, 'loss/train': 2.890653610229492} -09/20/2021 21:35:00 - INFO - __main__ - Step 32761: {'lr': 0.00019965795008027804, 'samples': 1048352, 'steps': 2047, 'loss/train': 2.957720994949341} -09/20/2021 21:35:01 - INFO - __main__ - Step 32762: {'lr': 0.00019965795008027804, 'samples': 1048384, 'steps': 2047, 'loss/train': 1.0313999652862549} -09/20/2021 21:35:01 - INFO - __main__ - Step 32763: {'lr': 0.00019965795008027804, 'samples': 1048416, 'steps': 2047, 'loss/train': 3.2306668758392334} -09/20/2021 21:35:02 - INFO - __main__ - Step 32764: {'lr': 0.00019965795008027804, 'samples': 1048448, 'steps': 2047, 'loss/train': 2.2191269397735596} -09/20/2021 21:35:03 - INFO - __main__ - Step 32765: {'lr': 0.00019965795008027804, 'samples': 1048480, 'steps': 2047, 'loss/train': 3.04695987701416} -09/20/2021 21:35:04 - INFO - __main__ - Step 32766: {'lr': 0.00019965795008027804, 'samples': 1048512, 'steps': 2047, 'loss/train': 2.348740339279175} -09/20/2021 21:35:05 - INFO - __main__ - Step 32767: {'lr': 0.00019965795008027804, 'samples': 1048544, 'steps': 2047, 'loss/train': 2.6842944622039795} -09/20/2021 21:35:06 - INFO - __main__ - Step 32768: {'lr': 0.00019965795008027804, 'samples': 1048576, 'steps': 2047, 'loss/train': 1.7734204530715942} -09/20/2021 21:35:07 - INFO - __main__ - Step 32769: {'lr': 0.00019965742273058651, 'samples': 1048608, 'steps': 2048, 'loss/train': 2.412228584289551} -09/20/2021 21:35:08 - INFO - __main__ - Step 32770: {'lr': 0.00019965742273058651, 'samples': 1048640, 'steps': 2048, 'loss/train': 2.3602182865142822} -09/20/2021 21:35:08 - INFO - __main__ - Step 32771: {'lr': 0.00019965742273058651, 'samples': 1048672, 'steps': 2048, 'loss/train': 2.1701180934906006} -09/20/2021 21:35:09 - INFO - __main__ - Step 32772: {'lr': 0.00019965742273058651, 'samples': 1048704, 'steps': 2048, 'loss/train': 0.2950463593006134} -09/20/2021 21:35:10 - INFO - __main__ - Step 32773: {'lr': 0.00019965742273058651, 'samples': 1048736, 'steps': 2048, 'loss/train': 0.5200121998786926} -09/20/2021 21:35:11 - INFO - __main__ - Step 32774: {'lr': 0.00019965742273058651, 'samples': 1048768, 'steps': 2048, 'loss/train': 0.21578548848628998} -09/20/2021 21:35:11 - INFO - __main__ - Step 32775: {'lr': 0.00019965742273058651, 'samples': 1048800, 'steps': 2048, 'loss/train': 0.25563809275627136} -09/20/2021 21:35:12 - INFO - __main__ - Step 32776: {'lr': 0.00019965742273058651, 'samples': 1048832, 'steps': 2048, 'loss/train': 0.425337553024292} -09/20/2021 21:35:13 - INFO - __main__ - Step 32777: {'lr': 0.00019965742273058651, 'samples': 1048864, 'steps': 2048, 'loss/train': 2.463674783706665} -09/20/2021 21:35:14 - INFO - __main__ - Step 32778: {'lr': 0.00019965742273058651, 'samples': 1048896, 'steps': 2048, 'loss/train': 2.258589029312134} -09/20/2021 21:35:14 - INFO - __main__ - Step 32779: {'lr': 0.00019965742273058651, 'samples': 1048928, 'steps': 2048, 'loss/train': 1.6983948945999146} -09/20/2021 21:35:15 - INFO - __main__ - Step 32780: {'lr': 0.00019965742273058651, 'samples': 1048960, 'steps': 2048, 'loss/train': 2.2601752281188965} -09/20/2021 21:35:16 - INFO - __main__ - Step 32781: {'lr': 0.00019965742273058651, 'samples': 1048992, 'steps': 2048, 'loss/train': 2.702077865600586} -09/20/2021 21:35:17 - INFO - __main__ - Step 32782: {'lr': 0.00019965742273058651, 'samples': 1049024, 'steps': 2048, 'loss/train': 1.8313779830932617} -09/20/2021 21:35:17 - INFO - __main__ - Step 32783: {'lr': 0.00019965742273058651, 'samples': 1049056, 'steps': 2048, 'loss/train': 2.2727179527282715} -09/20/2021 21:35:18 - INFO - __main__ - Step 32784: {'lr': 0.00019965742273058651, 'samples': 1049088, 'steps': 2048, 'loss/train': 1.9223456382751465} -09/20/2021 21:35:19 - INFO - __main__ - Step 32785: {'lr': 0.0001996568949753893, 'samples': 1049120, 'steps': 2049, 'loss/train': 1.5006409883499146} -09/20/2021 21:35:20 - INFO - __main__ - Step 32786: {'lr': 0.0001996568949753893, 'samples': 1049152, 'steps': 2049, 'loss/train': 2.342378854751587} -09/20/2021 21:35:21 - INFO - __main__ - Step 32787: {'lr': 0.0001996568949753893, 'samples': 1049184, 'steps': 2049, 'loss/train': 3.1532187461853027} -09/20/2021 21:35:21 - INFO - __main__ - Step 32788: {'lr': 0.0001996568949753893, 'samples': 1049216, 'steps': 2049, 'loss/train': 3.174783945083618} -09/20/2021 21:35:22 - INFO - __main__ - Step 32789: {'lr': 0.0001996568949753893, 'samples': 1049248, 'steps': 2049, 'loss/train': 3.3764257431030273} -09/20/2021 21:35:23 - INFO - __main__ - Step 32790: {'lr': 0.0001996568949753893, 'samples': 1049280, 'steps': 2049, 'loss/train': 3.008500814437866} -09/20/2021 21:35:24 - INFO - __main__ - Step 32791: {'lr': 0.0001996568949753893, 'samples': 1049312, 'steps': 2049, 'loss/train': 2.3427398204803467} -09/20/2021 21:35:24 - INFO - __main__ - Step 32792: {'lr': 0.0001996568949753893, 'samples': 1049344, 'steps': 2049, 'loss/train': 2.270742177963257} -09/20/2021 21:35:25 - INFO - __main__ - Step 32793: {'lr': 0.0001996568949753893, 'samples': 1049376, 'steps': 2049, 'loss/train': 1.9562124013900757} -09/20/2021 21:35:26 - INFO - __main__ - Step 32794: {'lr': 0.0001996568949753893, 'samples': 1049408, 'steps': 2049, 'loss/train': 0.9708612561225891} -09/20/2021 21:35:27 - INFO - __main__ - Step 32795: {'lr': 0.0001996568949753893, 'samples': 1049440, 'steps': 2049, 'loss/train': 2.3754377365112305} -09/20/2021 21:35:27 - INFO - __main__ - Step 32796: {'lr': 0.0001996568949753893, 'samples': 1049472, 'steps': 2049, 'loss/train': 0.3247954845428467} -09/20/2021 21:35:28 - INFO - __main__ - Step 32797: {'lr': 0.0001996568949753893, 'samples': 1049504, 'steps': 2049, 'loss/train': 2.4341115951538086} -09/20/2021 21:35:29 - INFO - __main__ - Step 32798: {'lr': 0.0001996568949753893, 'samples': 1049536, 'steps': 2049, 'loss/train': 1.948269248008728} -09/20/2021 21:35:30 - INFO - __main__ - Step 32799: {'lr': 0.0001996568949753893, 'samples': 1049568, 'steps': 2049, 'loss/train': 1.5587881803512573} -09/20/2021 21:35:31 - INFO - __main__ - Step 32800: {'lr': 0.0001996568949753893, 'samples': 1049600, 'steps': 2049, 'loss/train': 1.9170713424682617} -09/20/2021 21:35:32 - INFO - __main__ - Step 32801: {'lr': 0.0001996563668146886, 'samples': 1049632, 'steps': 2050, 'loss/train': 1.9759199619293213} -09/20/2021 21:35:32 - INFO - __main__ - Step 32802: {'lr': 0.0001996563668146886, 'samples': 1049664, 'steps': 2050, 'loss/train': 2.4143905639648438} -09/20/2021 21:35:33 - INFO - __main__ - Step 32803: {'lr': 0.0001996563668146886, 'samples': 1049696, 'steps': 2050, 'loss/train': 1.9912315607070923} -09/20/2021 21:35:34 - INFO - __main__ - Step 32804: {'lr': 0.0001996563668146886, 'samples': 1049728, 'steps': 2050, 'loss/train': 2.9594295024871826} -09/20/2021 21:35:35 - INFO - __main__ - Step 32805: {'lr': 0.0001996563668146886, 'samples': 1049760, 'steps': 2050, 'loss/train': 2.322720527648926} -09/20/2021 21:35:35 - INFO - __main__ - Step 32806: {'lr': 0.0001996563668146886, 'samples': 1049792, 'steps': 2050, 'loss/train': 1.2969412803649902} -09/20/2021 21:35:36 - INFO - __main__ - Step 32807: {'lr': 0.0001996563668146886, 'samples': 1049824, 'steps': 2050, 'loss/train': 2.6301772594451904} -09/20/2021 21:35:37 - INFO - __main__ - Step 32808: {'lr': 0.0001996563668146886, 'samples': 1049856, 'steps': 2050, 'loss/train': 2.3203964233398438} -09/20/2021 21:35:38 - INFO - __main__ - Step 32809: {'lr': 0.0001996563668146886, 'samples': 1049888, 'steps': 2050, 'loss/train': 2.594381093978882} -09/20/2021 21:35:38 - INFO - __main__ - Step 32810: {'lr': 0.0001996563668146886, 'samples': 1049920, 'steps': 2050, 'loss/train': 3.5187175273895264} -09/20/2021 21:35:39 - INFO - __main__ - Step 32811: {'lr': 0.0001996563668146886, 'samples': 1049952, 'steps': 2050, 'loss/train': 2.4713125228881836} -09/20/2021 21:35:40 - INFO - __main__ - Step 32812: {'lr': 0.0001996563668146886, 'samples': 1049984, 'steps': 2050, 'loss/train': 1.6007212400436401} -09/20/2021 21:35:41 - INFO - __main__ - Step 32813: {'lr': 0.0001996563668146886, 'samples': 1050016, 'steps': 2050, 'loss/train': 2.4354612827301025} -09/20/2021 21:35:41 - INFO - __main__ - Step 32814: {'lr': 0.0001996563668146886, 'samples': 1050048, 'steps': 2050, 'loss/train': 3.1279563903808594} -09/20/2021 21:35:42 - INFO - __main__ - Step 32815: {'lr': 0.0001996563668146886, 'samples': 1050080, 'steps': 2050, 'loss/train': 1.8647969961166382} -09/20/2021 21:35:43 - INFO - __main__ - Step 32816: {'lr': 0.0001996563668146886, 'samples': 1050112, 'steps': 2050, 'loss/train': 6.158069610595703} -09/20/2021 21:35:44 - INFO - __main__ - Step 32817: {'lr': 0.0001996558382484865, 'samples': 1050144, 'steps': 2051, 'loss/train': 2.554065465927124} -09/20/2021 21:35:45 - INFO - __main__ - Step 32818: {'lr': 0.0001996558382484865, 'samples': 1050176, 'steps': 2051, 'loss/train': 1.4263297319412231} -09/20/2021 21:35:45 - INFO - __main__ - Step 32819: {'lr': 0.0001996558382484865, 'samples': 1050208, 'steps': 2051, 'loss/train': 1.6202001571655273} -09/20/2021 21:35:46 - INFO - __main__ - Step 32820: {'lr': 0.0001996558382484865, 'samples': 1050240, 'steps': 2051, 'loss/train': 1.5468332767486572} -09/20/2021 21:35:47 - INFO - __main__ - Step 32821: {'lr': 0.0001996558382484865, 'samples': 1050272, 'steps': 2051, 'loss/train': 3.2821505069732666} -09/20/2021 21:35:48 - INFO - __main__ - Step 32822: {'lr': 0.0001996558382484865, 'samples': 1050304, 'steps': 2051, 'loss/train': 1.6046122312545776} -09/20/2021 21:35:48 - INFO - __main__ - Step 32823: {'lr': 0.0001996558382484865, 'samples': 1050336, 'steps': 2051, 'loss/train': 2.3663277626037598} -09/20/2021 21:35:49 - INFO - __main__ - Step 32824: {'lr': 0.0001996558382484865, 'samples': 1050368, 'steps': 2051, 'loss/train': 2.2594759464263916} -09/20/2021 21:35:50 - INFO - __main__ - Step 32825: {'lr': 0.0001996558382484865, 'samples': 1050400, 'steps': 2051, 'loss/train': 2.135754108428955} -09/20/2021 21:35:51 - INFO - __main__ - Step 32826: {'lr': 0.0001996558382484865, 'samples': 1050432, 'steps': 2051, 'loss/train': 2.0028741359710693} -09/20/2021 21:35:51 - INFO - __main__ - Step 32827: {'lr': 0.0001996558382484865, 'samples': 1050464, 'steps': 2051, 'loss/train': 2.2113142013549805} -09/20/2021 21:35:52 - INFO - __main__ - Step 32828: {'lr': 0.0001996558382484865, 'samples': 1050496, 'steps': 2051, 'loss/train': 2.4403634071350098} -09/20/2021 21:35:53 - INFO - __main__ - Step 32829: {'lr': 0.0001996558382484865, 'samples': 1050528, 'steps': 2051, 'loss/train': 2.6663191318511963} -09/20/2021 21:35:54 - INFO - __main__ - Step 32830: {'lr': 0.0001996558382484865, 'samples': 1050560, 'steps': 2051, 'loss/train': 1.2056572437286377} -09/20/2021 21:35:55 - INFO - __main__ - Step 32831: {'lr': 0.0001996558382484865, 'samples': 1050592, 'steps': 2051, 'loss/train': 2.7498772144317627} -09/20/2021 21:35:56 - INFO - __main__ - Step 32832: {'lr': 0.0001996558382484865, 'samples': 1050624, 'steps': 2051, 'loss/train': 2.778414249420166} -09/20/2021 21:35:56 - INFO - __main__ - Step 32833: {'lr': 0.0001996553092767852, 'samples': 1050656, 'steps': 2052, 'loss/train': 3.0767323970794678} -09/20/2021 21:35:57 - INFO - __main__ - Step 32834: {'lr': 0.0001996553092767852, 'samples': 1050688, 'steps': 2052, 'loss/train': 2.2870469093322754} -09/20/2021 21:35:58 - INFO - __main__ - Step 32835: {'lr': 0.0001996553092767852, 'samples': 1050720, 'steps': 2052, 'loss/train': 1.8271621465682983} -09/20/2021 21:35:59 - INFO - __main__ - Step 32836: {'lr': 0.0001996553092767852, 'samples': 1050752, 'steps': 2052, 'loss/train': 2.4626362323760986} -09/20/2021 21:35:59 - INFO - __main__ - Step 32837: {'lr': 0.0001996553092767852, 'samples': 1050784, 'steps': 2052, 'loss/train': 1.8393398523330688} -09/20/2021 21:36:00 - INFO - __main__ - Step 32838: {'lr': 0.0001996553092767852, 'samples': 1050816, 'steps': 2052, 'loss/train': 2.589630126953125} -09/20/2021 21:36:01 - INFO - __main__ - Step 32839: {'lr': 0.0001996553092767852, 'samples': 1050848, 'steps': 2052, 'loss/train': 3.106595277786255} -09/20/2021 21:36:02 - INFO - __main__ - Step 32840: {'lr': 0.0001996553092767852, 'samples': 1050880, 'steps': 2052, 'loss/train': 2.53666615486145} -09/20/2021 21:36:02 - INFO - __main__ - Step 32841: {'lr': 0.0001996553092767852, 'samples': 1050912, 'steps': 2052, 'loss/train': 2.3123669624328613} -09/20/2021 21:36:03 - INFO - __main__ - Step 32842: {'lr': 0.0001996553092767852, 'samples': 1050944, 'steps': 2052, 'loss/train': 1.8690392971038818} -09/20/2021 21:36:04 - INFO - __main__ - Step 32843: {'lr': 0.0001996553092767852, 'samples': 1050976, 'steps': 2052, 'loss/train': 2.300708055496216} -09/20/2021 21:36:05 - INFO - __main__ - Step 32844: {'lr': 0.0001996553092767852, 'samples': 1051008, 'steps': 2052, 'loss/train': 2.19435977935791} -09/20/2021 21:36:05 - INFO - __main__ - Step 32845: {'lr': 0.0001996553092767852, 'samples': 1051040, 'steps': 2052, 'loss/train': 1.8230538368225098} -09/20/2021 21:36:06 - INFO - __main__ - Step 32846: {'lr': 0.0001996553092767852, 'samples': 1051072, 'steps': 2052, 'loss/train': 2.1873879432678223} -09/20/2021 21:36:07 - INFO - __main__ - Step 32847: {'lr': 0.0001996553092767852, 'samples': 1051104, 'steps': 2052, 'loss/train': 1.5851974487304688} -09/20/2021 21:36:08 - INFO - __main__ - Step 32848: {'lr': 0.0001996553092767852, 'samples': 1051136, 'steps': 2052, 'loss/train': 2.7345263957977295} -09/20/2021 21:36:09 - INFO - __main__ - Step 32849: {'lr': 0.00019965477989958684, 'samples': 1051168, 'steps': 2053, 'loss/train': 2.661770820617676} -09/20/2021 21:36:09 - INFO - __main__ - Step 32850: {'lr': 0.00019965477989958684, 'samples': 1051200, 'steps': 2053, 'loss/train': 0.19905900955200195} -09/20/2021 21:36:10 - INFO - __main__ - Step 32851: {'lr': 0.00019965477989958684, 'samples': 1051232, 'steps': 2053, 'loss/train': 2.0543787479400635} -09/20/2021 21:36:11 - INFO - __main__ - Step 32852: {'lr': 0.00019965477989958684, 'samples': 1051264, 'steps': 2053, 'loss/train': 1.3992464542388916} -09/20/2021 21:36:12 - INFO - __main__ - Step 32853: {'lr': 0.00019965477989958684, 'samples': 1051296, 'steps': 2053, 'loss/train': 3.5549163818359375} -09/20/2021 21:36:12 - INFO - __main__ - Step 32854: {'lr': 0.00019965477989958684, 'samples': 1051328, 'steps': 2053, 'loss/train': 3.0030198097229004} -09/20/2021 21:36:13 - INFO - __main__ - Step 32855: {'lr': 0.00019965477989958684, 'samples': 1051360, 'steps': 2053, 'loss/train': 1.863205075263977} -09/20/2021 21:36:14 - INFO - __main__ - Step 32856: {'lr': 0.00019965477989958684, 'samples': 1051392, 'steps': 2053, 'loss/train': 3.128506898880005} -09/20/2021 21:36:15 - INFO - __main__ - Step 32857: {'lr': 0.00019965477989958684, 'samples': 1051424, 'steps': 2053, 'loss/train': 2.524120569229126} -09/20/2021 21:36:15 - INFO - __main__ - Step 32858: {'lr': 0.00019965477989958684, 'samples': 1051456, 'steps': 2053, 'loss/train': 0.2623366117477417} -09/20/2021 21:36:17 - INFO - __main__ - Step 32859: {'lr': 0.00019965477989958684, 'samples': 1051488, 'steps': 2053, 'loss/train': 0.24492865800857544} -09/20/2021 21:36:17 - INFO - __main__ - Step 32860: {'lr': 0.00019965477989958684, 'samples': 1051520, 'steps': 2053, 'loss/train': 2.984618663787842} -09/20/2021 21:36:18 - INFO - __main__ - Step 32861: {'lr': 0.00019965477989958684, 'samples': 1051552, 'steps': 2053, 'loss/train': 2.1481239795684814} -09/20/2021 21:36:19 - INFO - __main__ - Step 32862: {'lr': 0.00019965477989958684, 'samples': 1051584, 'steps': 2053, 'loss/train': 0.9745319485664368} -09/20/2021 21:36:20 - INFO - __main__ - Step 32863: {'lr': 0.00019965477989958684, 'samples': 1051616, 'steps': 2053, 'loss/train': 0.5968071222305298} -09/20/2021 21:36:20 - INFO - __main__ - Step 32864: {'lr': 0.00019965477989958684, 'samples': 1051648, 'steps': 2053, 'loss/train': 2.230468511581421} -09/20/2021 21:36:21 - INFO - __main__ - Step 32865: {'lr': 0.00019965425011689357, 'samples': 1051680, 'steps': 2054, 'loss/train': 2.2100162506103516} -09/20/2021 21:36:22 - INFO - __main__ - Step 32866: {'lr': 0.00019965425011689357, 'samples': 1051712, 'steps': 2054, 'loss/train': 1.4056427478790283} -09/20/2021 21:36:23 - INFO - __main__ - Step 32867: {'lr': 0.00019965425011689357, 'samples': 1051744, 'steps': 2054, 'loss/train': 2.2970187664031982} -09/20/2021 21:36:24 - INFO - __main__ - Step 32868: {'lr': 0.00019965425011689357, 'samples': 1051776, 'steps': 2054, 'loss/train': 2.4082791805267334} -09/20/2021 21:36:24 - INFO - __main__ - Step 32869: {'lr': 0.00019965425011689357, 'samples': 1051808, 'steps': 2054, 'loss/train': 1.6768909692764282} -09/20/2021 21:36:25 - INFO - __main__ - Step 32870: {'lr': 0.00019965425011689357, 'samples': 1051840, 'steps': 2054, 'loss/train': 2.017183303833008} -09/20/2021 21:36:26 - INFO - __main__ - Step 32871: {'lr': 0.00019965425011689357, 'samples': 1051872, 'steps': 2054, 'loss/train': 2.2412683963775635} -09/20/2021 21:36:27 - INFO - __main__ - Step 32872: {'lr': 0.00019965425011689357, 'samples': 1051904, 'steps': 2054, 'loss/train': 2.7032008171081543} -09/20/2021 21:36:27 - INFO - __main__ - Step 32873: {'lr': 0.00019965425011689357, 'samples': 1051936, 'steps': 2054, 'loss/train': 1.5522547960281372} -09/20/2021 21:36:28 - INFO - __main__ - Step 32874: {'lr': 0.00019965425011689357, 'samples': 1051968, 'steps': 2054, 'loss/train': 2.767653465270996} -09/20/2021 21:36:29 - INFO - __main__ - Step 32875: {'lr': 0.00019965425011689357, 'samples': 1052000, 'steps': 2054, 'loss/train': 2.012495279312134} -09/20/2021 21:36:30 - INFO - __main__ - Step 32876: {'lr': 0.00019965425011689357, 'samples': 1052032, 'steps': 2054, 'loss/train': 0.2672881782054901} -09/20/2021 21:36:30 - INFO - __main__ - Step 32877: {'lr': 0.00019965425011689357, 'samples': 1052064, 'steps': 2054, 'loss/train': 0.27656352519989014} -09/20/2021 21:36:31 - INFO - __main__ - Step 32878: {'lr': 0.00019965425011689357, 'samples': 1052096, 'steps': 2054, 'loss/train': 0.26484161615371704} -09/20/2021 21:36:32 - INFO - __main__ - Step 32879: {'lr': 0.00019965425011689357, 'samples': 1052128, 'steps': 2054, 'loss/train': 2.7615530490875244} -09/20/2021 21:36:33 - INFO - __main__ - Step 32880: {'lr': 0.00019965425011689357, 'samples': 1052160, 'steps': 2054, 'loss/train': 2.641537666320801} -09/20/2021 21:36:33 - INFO - __main__ - Step 32881: {'lr': 0.0001996537199287075, 'samples': 1052192, 'steps': 2055, 'loss/train': 2.678283214569092} -09/20/2021 21:36:34 - INFO - __main__ - Step 32882: {'lr': 0.0001996537199287075, 'samples': 1052224, 'steps': 2055, 'loss/train': 2.123832941055298} -09/20/2021 21:36:35 - INFO - __main__ - Step 32883: {'lr': 0.0001996537199287075, 'samples': 1052256, 'steps': 2055, 'loss/train': 2.581049680709839} -09/20/2021 21:36:36 - INFO - __main__ - Step 32884: {'lr': 0.0001996537199287075, 'samples': 1052288, 'steps': 2055, 'loss/train': 2.604358434677124} -09/20/2021 21:36:36 - INFO - __main__ - Step 32885: {'lr': 0.0001996537199287075, 'samples': 1052320, 'steps': 2055, 'loss/train': 2.7755563259124756} -09/20/2021 21:36:37 - INFO - __main__ - Step 32886: {'lr': 0.0001996537199287075, 'samples': 1052352, 'steps': 2055, 'loss/train': 3.0593783855438232} -09/20/2021 21:36:38 - INFO - __main__ - Step 32887: {'lr': 0.0001996537199287075, 'samples': 1052384, 'steps': 2055, 'loss/train': 1.8322138786315918} -09/20/2021 21:36:39 - INFO - __main__ - Step 32888: {'lr': 0.0001996537199287075, 'samples': 1052416, 'steps': 2055, 'loss/train': 2.2214949131011963} -09/20/2021 21:36:39 - INFO - __main__ - Step 32889: {'lr': 0.0001996537199287075, 'samples': 1052448, 'steps': 2055, 'loss/train': 1.7572290897369385} -09/20/2021 21:36:40 - INFO - __main__ - Step 32890: {'lr': 0.0001996537199287075, 'samples': 1052480, 'steps': 2055, 'loss/train': 1.8799148797988892} -09/20/2021 21:36:41 - INFO - __main__ - Step 32891: {'lr': 0.0001996537199287075, 'samples': 1052512, 'steps': 2055, 'loss/train': 2.046146869659424} -09/20/2021 21:36:42 - INFO - __main__ - Step 32892: {'lr': 0.0001996537199287075, 'samples': 1052544, 'steps': 2055, 'loss/train': 2.886535167694092} -09/20/2021 21:36:43 - INFO - __main__ - Step 32893: {'lr': 0.0001996537199287075, 'samples': 1052576, 'steps': 2055, 'loss/train': 2.2981116771698} -09/20/2021 21:36:44 - INFO - __main__ - Step 32894: {'lr': 0.0001996537199287075, 'samples': 1052608, 'steps': 2055, 'loss/train': 2.309800863265991} -09/20/2021 21:36:44 - INFO - __main__ - Step 32895: {'lr': 0.0001996537199287075, 'samples': 1052640, 'steps': 2055, 'loss/train': 2.215456008911133} -09/20/2021 21:36:45 - INFO - __main__ - Step 32896: {'lr': 0.0001996537199287075, 'samples': 1052672, 'steps': 2055, 'loss/train': 2.8435261249542236} -09/20/2021 21:36:46 - INFO - __main__ - Step 32897: {'lr': 0.00019965318933503086, 'samples': 1052704, 'steps': 2056, 'loss/train': 0.8861586451530457} -09/20/2021 21:36:47 - INFO - __main__ - Step 32898: {'lr': 0.00019965318933503086, 'samples': 1052736, 'steps': 2056, 'loss/train': 2.9060184955596924} -09/20/2021 21:36:48 - INFO - __main__ - Step 32899: {'lr': 0.00019965318933503086, 'samples': 1052768, 'steps': 2056, 'loss/train': 2.3096885681152344} -09/20/2021 21:36:48 - INFO - __main__ - Step 32900: {'lr': 0.00019965318933503086, 'samples': 1052800, 'steps': 2056, 'loss/train': 2.9445204734802246} -09/20/2021 21:36:49 - INFO - __main__ - Step 32901: {'lr': 0.00019965318933503086, 'samples': 1052832, 'steps': 2056, 'loss/train': 1.081682801246643} -09/20/2021 21:36:50 - INFO - __main__ - Step 32902: {'lr': 0.00019965318933503086, 'samples': 1052864, 'steps': 2056, 'loss/train': 1.5042657852172852} -09/20/2021 21:36:51 - INFO - __main__ - Step 32903: {'lr': 0.00019965318933503086, 'samples': 1052896, 'steps': 2056, 'loss/train': 1.8105775117874146} -09/20/2021 21:36:51 - INFO - __main__ - Step 32904: {'lr': 0.00019965318933503086, 'samples': 1052928, 'steps': 2056, 'loss/train': 2.0741019248962402} -09/20/2021 21:36:52 - INFO - __main__ - Step 32905: {'lr': 0.00019965318933503086, 'samples': 1052960, 'steps': 2056, 'loss/train': 1.4983437061309814} -09/20/2021 21:36:53 - INFO - __main__ - Step 32906: {'lr': 0.00019965318933503086, 'samples': 1052992, 'steps': 2056, 'loss/train': 1.6637535095214844} -09/20/2021 21:36:54 - INFO - __main__ - Step 32907: {'lr': 0.00019965318933503086, 'samples': 1053024, 'steps': 2056, 'loss/train': 3.111879348754883} -09/20/2021 21:36:54 - INFO - __main__ - Step 32908: {'lr': 0.00019965318933503086, 'samples': 1053056, 'steps': 2056, 'loss/train': 2.0142745971679688} -09/20/2021 21:36:55 - INFO - __main__ - Step 32909: {'lr': 0.00019965318933503086, 'samples': 1053088, 'steps': 2056, 'loss/train': 0.5450555682182312} -09/20/2021 21:36:56 - INFO - __main__ - Step 32910: {'lr': 0.00019965318933503086, 'samples': 1053120, 'steps': 2056, 'loss/train': 2.841291904449463} -09/20/2021 21:36:57 - INFO - __main__ - Step 32911: {'lr': 0.00019965318933503086, 'samples': 1053152, 'steps': 2056, 'loss/train': 2.786325216293335} -09/20/2021 21:36:57 - INFO - __main__ - Step 32912: {'lr': 0.00019965318933503086, 'samples': 1053184, 'steps': 2056, 'loss/train': 2.587519645690918} -09/20/2021 21:36:58 - INFO - __main__ - Step 32913: {'lr': 0.00019965265833586578, 'samples': 1053216, 'steps': 2057, 'loss/train': 3.5519704818725586} -09/20/2021 21:36:59 - INFO - __main__ - Step 32914: {'lr': 0.00019965265833586578, 'samples': 1053248, 'steps': 2057, 'loss/train': 2.270368814468384} -09/20/2021 21:37:00 - INFO - __main__ - Step 32915: {'lr': 0.00019965265833586578, 'samples': 1053280, 'steps': 2057, 'loss/train': 2.309554100036621} -09/20/2021 21:37:00 - INFO - __main__ - Step 32916: {'lr': 0.00019965265833586578, 'samples': 1053312, 'steps': 2057, 'loss/train': 1.6287325620651245} -09/20/2021 21:37:01 - INFO - __main__ - Step 32917: {'lr': 0.00019965265833586578, 'samples': 1053344, 'steps': 2057, 'loss/train': 2.290574073791504} -09/20/2021 21:37:02 - INFO - __main__ - Step 32918: {'lr': 0.00019965265833586578, 'samples': 1053376, 'steps': 2057, 'loss/train': 2.398420572280884} -09/20/2021 21:37:03 - INFO - __main__ - Step 32919: {'lr': 0.00019965265833586578, 'samples': 1053408, 'steps': 2057, 'loss/train': 2.6198232173919678} -09/20/2021 21:37:03 - INFO - __main__ - Step 32920: {'lr': 0.00019965265833586578, 'samples': 1053440, 'steps': 2057, 'loss/train': 3.1134066581726074} -09/20/2021 21:37:04 - INFO - __main__ - Step 32921: {'lr': 0.00019965265833586578, 'samples': 1053472, 'steps': 2057, 'loss/train': 2.180764675140381} -09/20/2021 21:37:06 - INFO - __main__ - Step 32922: {'lr': 0.00019965265833586578, 'samples': 1053504, 'steps': 2057, 'loss/train': 1.1279536485671997} -09/20/2021 21:37:07 - INFO - __main__ - Step 32923: {'lr': 0.00019965265833586578, 'samples': 1053536, 'steps': 2057, 'loss/train': 1.6756235361099243} -09/20/2021 21:37:08 - INFO - __main__ - Step 32924: {'lr': 0.00019965265833586578, 'samples': 1053568, 'steps': 2057, 'loss/train': 2.4717676639556885} -09/20/2021 21:37:08 - INFO - __main__ - Step 32925: {'lr': 0.00019965265833586578, 'samples': 1053600, 'steps': 2057, 'loss/train': 2.2866830825805664} -09/20/2021 21:37:09 - INFO - __main__ - Step 32926: {'lr': 0.00019965265833586578, 'samples': 1053632, 'steps': 2057, 'loss/train': 1.8592665195465088} -09/20/2021 21:37:10 - INFO - __main__ - Step 32927: {'lr': 0.00019965265833586578, 'samples': 1053664, 'steps': 2057, 'loss/train': 2.14217209815979} -09/20/2021 21:37:11 - INFO - __main__ - Step 32928: {'lr': 0.00019965265833586578, 'samples': 1053696, 'steps': 2057, 'loss/train': 1.75623619556427} -09/20/2021 21:37:11 - INFO - __main__ - Step 32929: {'lr': 0.00019965212693121443, 'samples': 1053728, 'steps': 2058, 'loss/train': 2.5895800590515137} -09/20/2021 21:37:12 - INFO - __main__ - Step 32930: {'lr': 0.00019965212693121443, 'samples': 1053760, 'steps': 2058, 'loss/train': 2.4095845222473145} -09/20/2021 21:37:13 - INFO - __main__ - Step 32931: {'lr': 0.00019965212693121443, 'samples': 1053792, 'steps': 2058, 'loss/train': 2.2601304054260254} -09/20/2021 21:37:14 - INFO - __main__ - Step 32932: {'lr': 0.00019965212693121443, 'samples': 1053824, 'steps': 2058, 'loss/train': 2.4843759536743164} -09/20/2021 21:37:14 - INFO - __main__ - Step 32933: {'lr': 0.00019965212693121443, 'samples': 1053856, 'steps': 2058, 'loss/train': 2.367062568664551} -09/20/2021 21:37:15 - INFO - __main__ - Step 32934: {'lr': 0.00019965212693121443, 'samples': 1053888, 'steps': 2058, 'loss/train': 2.446894884109497} -09/20/2021 21:37:16 - INFO - __main__ - Step 32935: {'lr': 0.00019965212693121443, 'samples': 1053920, 'steps': 2058, 'loss/train': 2.355945110321045} -09/20/2021 21:37:17 - INFO - __main__ - Step 32936: {'lr': 0.00019965212693121443, 'samples': 1053952, 'steps': 2058, 'loss/train': 1.1006131172180176} -09/20/2021 21:37:17 - INFO - __main__ - Step 32937: {'lr': 0.00019965212693121443, 'samples': 1053984, 'steps': 2058, 'loss/train': 1.2333300113677979} -09/20/2021 21:37:18 - INFO - __main__ - Step 32938: {'lr': 0.00019965212693121443, 'samples': 1054016, 'steps': 2058, 'loss/train': 0.15562745928764343} -09/20/2021 21:37:19 - INFO - __main__ - Step 32939: {'lr': 0.00019965212693121443, 'samples': 1054048, 'steps': 2058, 'loss/train': 0.19855403900146484} -09/20/2021 21:37:20 - INFO - __main__ - Step 32940: {'lr': 0.00019965212693121443, 'samples': 1054080, 'steps': 2058, 'loss/train': 0.34879887104034424} -09/20/2021 21:37:20 - INFO - __main__ - Step 32941: {'lr': 0.00019965212693121443, 'samples': 1054112, 'steps': 2058, 'loss/train': 2.59167218208313} -09/20/2021 21:37:21 - INFO - __main__ - Step 32942: {'lr': 0.00019965212693121443, 'samples': 1054144, 'steps': 2058, 'loss/train': 1.9401613473892212} -09/20/2021 21:37:22 - INFO - __main__ - Step 32943: {'lr': 0.00019965212693121443, 'samples': 1054176, 'steps': 2058, 'loss/train': 2.2055318355560303} -09/20/2021 21:37:23 - INFO - __main__ - Step 32944: {'lr': 0.00019965212693121443, 'samples': 1054208, 'steps': 2058, 'loss/train': 2.6999435424804688} -09/20/2021 21:37:24 - INFO - __main__ - Step 32945: {'lr': 0.00019965159512107893, 'samples': 1054240, 'steps': 2059, 'loss/train': 1.6664185523986816} -09/20/2021 21:37:24 - INFO - __main__ - Step 32946: {'lr': 0.00019965159512107893, 'samples': 1054272, 'steps': 2059, 'loss/train': 2.5462582111358643} -09/20/2021 21:37:25 - INFO - __main__ - Step 32947: {'lr': 0.00019965159512107893, 'samples': 1054304, 'steps': 2059, 'loss/train': 2.1896514892578125} -09/20/2021 21:37:26 - INFO - __main__ - Step 32948: {'lr': 0.00019965159512107893, 'samples': 1054336, 'steps': 2059, 'loss/train': 2.156162738800049} -09/20/2021 21:37:27 - INFO - __main__ - Step 32949: {'lr': 0.00019965159512107893, 'samples': 1054368, 'steps': 2059, 'loss/train': 2.5521433353424072} -09/20/2021 21:37:27 - INFO - __main__ - Step 32950: {'lr': 0.00019965159512107893, 'samples': 1054400, 'steps': 2059, 'loss/train': 2.5476722717285156} -09/20/2021 21:37:28 - INFO - __main__ - Step 32951: {'lr': 0.00019965159512107893, 'samples': 1054432, 'steps': 2059, 'loss/train': 1.8754106760025024} -09/20/2021 21:37:29 - INFO - __main__ - Step 32952: {'lr': 0.00019965159512107893, 'samples': 1054464, 'steps': 2059, 'loss/train': 3.160147190093994} -09/20/2021 21:37:30 - INFO - __main__ - Step 32953: {'lr': 0.00019965159512107893, 'samples': 1054496, 'steps': 2059, 'loss/train': 2.809857130050659} -09/20/2021 21:37:31 - INFO - __main__ - Step 32954: {'lr': 0.00019965159512107893, 'samples': 1054528, 'steps': 2059, 'loss/train': 2.7286922931671143} -09/20/2021 21:37:32 - INFO - __main__ - Step 32955: {'lr': 0.00019965159512107893, 'samples': 1054560, 'steps': 2059, 'loss/train': 2.5251729488372803} -09/20/2021 21:37:33 - INFO - __main__ - Step 32956: {'lr': 0.00019965159512107893, 'samples': 1054592, 'steps': 2059, 'loss/train': 2.903470277786255} -09/20/2021 21:37:33 - INFO - __main__ - Step 32957: {'lr': 0.00019965159512107893, 'samples': 1054624, 'steps': 2059, 'loss/train': 3.2364933490753174} -09/20/2021 21:37:34 - INFO - __main__ - Step 32958: {'lr': 0.00019965159512107893, 'samples': 1054656, 'steps': 2059, 'loss/train': 2.672870635986328} -09/20/2021 21:37:35 - INFO - __main__ - Step 32959: {'lr': 0.00019965159512107893, 'samples': 1054688, 'steps': 2059, 'loss/train': 3.464986801147461} -09/20/2021 21:37:36 - INFO - __main__ - Step 32960: {'lr': 0.00019965159512107893, 'samples': 1054720, 'steps': 2059, 'loss/train': 1.8802618980407715} -09/20/2021 21:37:37 - INFO - __main__ - Step 32961: {'lr': 0.00019965106290546148, 'samples': 1054752, 'steps': 2060, 'loss/train': 1.9812756776809692} -09/20/2021 21:37:37 - INFO - __main__ - Step 32962: {'lr': 0.00019965106290546148, 'samples': 1054784, 'steps': 2060, 'loss/train': 1.9647090435028076} -09/20/2021 21:37:38 - INFO - __main__ - Step 32963: {'lr': 0.00019965106290546148, 'samples': 1054816, 'steps': 2060, 'loss/train': 1.7781509160995483} -09/20/2021 21:37:39 - INFO - __main__ - Step 32964: {'lr': 0.00019965106290546148, 'samples': 1054848, 'steps': 2060, 'loss/train': 1.7621135711669922} -09/20/2021 21:37:40 - INFO - __main__ - Step 32965: {'lr': 0.00019965106290546148, 'samples': 1054880, 'steps': 2060, 'loss/train': 2.607185125350952} -09/20/2021 21:37:40 - INFO - __main__ - Step 32966: {'lr': 0.00019965106290546148, 'samples': 1054912, 'steps': 2060, 'loss/train': 1.8685005903244019} -09/20/2021 21:37:41 - INFO - __main__ - Step 32967: {'lr': 0.00019965106290546148, 'samples': 1054944, 'steps': 2060, 'loss/train': 2.74444842338562} -09/20/2021 21:37:42 - INFO - __main__ - Step 32968: {'lr': 0.00019965106290546148, 'samples': 1054976, 'steps': 2060, 'loss/train': 1.8569300174713135} -09/20/2021 21:37:43 - INFO - __main__ - Step 32969: {'lr': 0.00019965106290546148, 'samples': 1055008, 'steps': 2060, 'loss/train': 0.5179338455200195} -09/20/2021 21:37:43 - INFO - __main__ - Step 32970: {'lr': 0.00019965106290546148, 'samples': 1055040, 'steps': 2060, 'loss/train': 0.356370210647583} -09/20/2021 21:37:44 - INFO - __main__ - Step 32971: {'lr': 0.00019965106290546148, 'samples': 1055072, 'steps': 2060, 'loss/train': 0.30927133560180664} -09/20/2021 21:37:45 - INFO - __main__ - Step 32972: {'lr': 0.00019965106290546148, 'samples': 1055104, 'steps': 2060, 'loss/train': 2.3821516036987305} -09/20/2021 21:37:46 - INFO - __main__ - Step 32973: {'lr': 0.00019965106290546148, 'samples': 1055136, 'steps': 2060, 'loss/train': 2.4400553703308105} -09/20/2021 21:37:46 - INFO - __main__ - Step 32974: {'lr': 0.00019965106290546148, 'samples': 1055168, 'steps': 2060, 'loss/train': 3.432579517364502} -09/20/2021 21:37:47 - INFO - __main__ - Step 32975: {'lr': 0.00019965106290546148, 'samples': 1055200, 'steps': 2060, 'loss/train': 1.7829121351242065} -09/20/2021 21:37:48 - INFO - __main__ - Step 32976: {'lr': 0.00019965106290546148, 'samples': 1055232, 'steps': 2060, 'loss/train': 1.5247336626052856} -09/20/2021 21:37:49 - INFO - __main__ - Step 32977: {'lr': 0.0001996505302843643, 'samples': 1055264, 'steps': 2061, 'loss/train': 1.4196572303771973} -09/20/2021 21:37:49 - INFO - __main__ - Step 32978: {'lr': 0.0001996505302843643, 'samples': 1055296, 'steps': 2061, 'loss/train': 1.9553003311157227} -09/20/2021 21:37:50 - INFO - __main__ - Step 32979: {'lr': 0.0001996505302843643, 'samples': 1055328, 'steps': 2061, 'loss/train': 2.7499303817749023} -09/20/2021 21:37:51 - INFO - __main__ - Step 32980: {'lr': 0.0001996505302843643, 'samples': 1055360, 'steps': 2061, 'loss/train': 2.0437309741973877} -09/20/2021 21:37:52 - INFO - __main__ - Step 32981: {'lr': 0.0001996505302843643, 'samples': 1055392, 'steps': 2061, 'loss/train': 2.2394773960113525} -09/20/2021 21:37:52 - INFO - __main__ - Step 32982: {'lr': 0.0001996505302843643, 'samples': 1055424, 'steps': 2061, 'loss/train': 1.5062439441680908} -09/20/2021 21:37:54 - INFO - __main__ - Step 32983: {'lr': 0.0001996505302843643, 'samples': 1055456, 'steps': 2061, 'loss/train': 1.9419763088226318} -09/20/2021 21:37:54 - INFO - __main__ - Step 32984: {'lr': 0.0001996505302843643, 'samples': 1055488, 'steps': 2061, 'loss/train': 2.0628533363342285} -09/20/2021 21:37:55 - INFO - __main__ - Step 32985: {'lr': 0.0001996505302843643, 'samples': 1055520, 'steps': 2061, 'loss/train': 2.278367042541504} -09/20/2021 21:37:56 - INFO - __main__ - Step 32986: {'lr': 0.0001996505302843643, 'samples': 1055552, 'steps': 2061, 'loss/train': 2.0103647708892822} -09/20/2021 21:37:57 - INFO - __main__ - Step 32987: {'lr': 0.0001996505302843643, 'samples': 1055584, 'steps': 2061, 'loss/train': 2.9299213886260986} -09/20/2021 21:37:57 - INFO - __main__ - Step 32988: {'lr': 0.0001996505302843643, 'samples': 1055616, 'steps': 2061, 'loss/train': 0.5378657579421997} -09/20/2021 21:37:58 - INFO - __main__ - Step 32989: {'lr': 0.0001996505302843643, 'samples': 1055648, 'steps': 2061, 'loss/train': 1.6578073501586914} -09/20/2021 21:37:59 - INFO - __main__ - Step 32990: {'lr': 0.0001996505302843643, 'samples': 1055680, 'steps': 2061, 'loss/train': 2.624462842941284} -09/20/2021 21:38:00 - INFO - __main__ - Step 32991: {'lr': 0.0001996505302843643, 'samples': 1055712, 'steps': 2061, 'loss/train': 2.3829329013824463} -09/20/2021 21:38:00 - INFO - __main__ - Step 32992: {'lr': 0.0001996505302843643, 'samples': 1055744, 'steps': 2061, 'loss/train': 2.6265530586242676} -09/20/2021 21:38:01 - INFO - __main__ - Step 32993: {'lr': 0.00019964999725778944, 'samples': 1055776, 'steps': 2062, 'loss/train': 2.1323046684265137} -09/20/2021 21:38:02 - INFO - __main__ - Step 32994: {'lr': 0.00019964999725778944, 'samples': 1055808, 'steps': 2062, 'loss/train': 1.3083513975143433} -09/20/2021 21:38:03 - INFO - __main__ - Step 32995: {'lr': 0.00019964999725778944, 'samples': 1055840, 'steps': 2062, 'loss/train': 1.9410117864608765} -09/20/2021 21:38:04 - INFO - __main__ - Step 32996: {'lr': 0.00019964999725778944, 'samples': 1055872, 'steps': 2062, 'loss/train': 2.231743097305298} -09/20/2021 21:38:04 - INFO - __main__ - Step 32997: {'lr': 0.00019964999725778944, 'samples': 1055904, 'steps': 2062, 'loss/train': 1.9492669105529785} -09/20/2021 21:38:05 - INFO - __main__ - Step 32998: {'lr': 0.00019964999725778944, 'samples': 1055936, 'steps': 2062, 'loss/train': 1.8723739385604858} -09/20/2021 21:38:06 - INFO - __main__ - Step 32999: {'lr': 0.00019964999725778944, 'samples': 1055968, 'steps': 2062, 'loss/train': 2.110929250717163} -09/20/2021 21:38:07 - INFO - __main__ - Step 33000: {'lr': 0.00019964999725778944, 'samples': 1056000, 'steps': 2062, 'loss/train': 2.386260986328125} -09/20/2021 21:38:07 - INFO - __main__ - Step 33001: {'lr': 0.00019964999725778944, 'samples': 1056032, 'steps': 2062, 'loss/train': 2.493682861328125} -09/20/2021 21:38:08 - INFO - __main__ - Step 33002: {'lr': 0.00019964999725778944, 'samples': 1056064, 'steps': 2062, 'loss/train': 2.466548204421997} -09/20/2021 21:38:09 - INFO - __main__ - Step 33003: {'lr': 0.00019964999725778944, 'samples': 1056096, 'steps': 2062, 'loss/train': 3.234926700592041} -09/20/2021 21:38:10 - INFO - __main__ - Step 33004: {'lr': 0.00019964999725778944, 'samples': 1056128, 'steps': 2062, 'loss/train': 2.883138418197632} -09/20/2021 21:38:10 - INFO - __main__ - Step 33005: {'lr': 0.00019964999725778944, 'samples': 1056160, 'steps': 2062, 'loss/train': 3.5162222385406494} -09/20/2021 21:38:11 - INFO - __main__ - Step 33006: {'lr': 0.00019964999725778944, 'samples': 1056192, 'steps': 2062, 'loss/train': 2.5921008586883545} -09/20/2021 21:38:12 - INFO - __main__ - Step 33007: {'lr': 0.00019964999725778944, 'samples': 1056224, 'steps': 2062, 'loss/train': 2.3003134727478027} -09/20/2021 21:38:13 - INFO - __main__ - Step 33008: {'lr': 0.00019964999725778944, 'samples': 1056256, 'steps': 2062, 'loss/train': 1.7506545782089233} -09/20/2021 21:38:13 - INFO - __main__ - Step 33009: {'lr': 0.00019964946382573917, 'samples': 1056288, 'steps': 2063, 'loss/train': 2.1933984756469727} -09/20/2021 21:38:14 - INFO - __main__ - Step 33010: {'lr': 0.00019964946382573917, 'samples': 1056320, 'steps': 2063, 'loss/train': 1.8551896810531616} -09/20/2021 21:38:15 - INFO - __main__ - Step 33011: {'lr': 0.00019964946382573917, 'samples': 1056352, 'steps': 2063, 'loss/train': 2.535883903503418} -09/20/2021 21:38:16 - INFO - __main__ - Step 33012: {'lr': 0.00019964946382573917, 'samples': 1056384, 'steps': 2063, 'loss/train': 2.463280200958252} -09/20/2021 21:38:16 - INFO - __main__ - Step 33013: {'lr': 0.00019964946382573917, 'samples': 1056416, 'steps': 2063, 'loss/train': 2.3504416942596436} -09/20/2021 21:38:18 - INFO - __main__ - Step 33014: {'lr': 0.00019964946382573917, 'samples': 1056448, 'steps': 2063, 'loss/train': 2.221817970275879} -09/20/2021 21:38:19 - INFO - __main__ - Step 33015: {'lr': 0.00019964946382573917, 'samples': 1056480, 'steps': 2063, 'loss/train': 1.9850283861160278} -09/20/2021 21:38:19 - INFO - __main__ - Step 33016: {'lr': 0.00019964946382573917, 'samples': 1056512, 'steps': 2063, 'loss/train': 1.912188172340393} -09/20/2021 21:38:20 - INFO - __main__ - Step 33017: {'lr': 0.00019964946382573917, 'samples': 1056544, 'steps': 2063, 'loss/train': 2.2536261081695557} -09/20/2021 21:38:21 - INFO - __main__ - Step 33018: {'lr': 0.00019964946382573917, 'samples': 1056576, 'steps': 2063, 'loss/train': 2.5857889652252197} -09/20/2021 21:38:22 - INFO - __main__ - Step 33019: {'lr': 0.00019964946382573917, 'samples': 1056608, 'steps': 2063, 'loss/train': 2.82523775100708} -09/20/2021 21:38:22 - INFO - __main__ - Step 33020: {'lr': 0.00019964946382573917, 'samples': 1056640, 'steps': 2063, 'loss/train': 1.8386019468307495} -09/20/2021 21:38:23 - INFO - __main__ - Step 33021: {'lr': 0.00019964946382573917, 'samples': 1056672, 'steps': 2063, 'loss/train': 1.1647229194641113} -09/20/2021 21:38:24 - INFO - __main__ - Step 33022: {'lr': 0.00019964946382573917, 'samples': 1056704, 'steps': 2063, 'loss/train': 2.608853578567505} -09/20/2021 21:38:25 - INFO - __main__ - Step 33023: {'lr': 0.00019964946382573917, 'samples': 1056736, 'steps': 2063, 'loss/train': 2.1653549671173096} -09/20/2021 21:38:25 - INFO - __main__ - Step 33024: {'lr': 0.00019964946382573917, 'samples': 1056768, 'steps': 2063, 'loss/train': 2.2641713619232178} -09/20/2021 21:38:26 - INFO - __main__ - Step 33025: {'lr': 0.00019964892998821558, 'samples': 1056800, 'steps': 2064, 'loss/train': 1.9277406930923462} -09/20/2021 21:38:27 - INFO - __main__ - Step 33026: {'lr': 0.00019964892998821558, 'samples': 1056832, 'steps': 2064, 'loss/train': 2.7397546768188477} -09/20/2021 21:38:28 - INFO - __main__ - Step 33027: {'lr': 0.00019964892998821558, 'samples': 1056864, 'steps': 2064, 'loss/train': 2.9095935821533203} -09/20/2021 21:38:28 - INFO - __main__ - Step 33028: {'lr': 0.00019964892998821558, 'samples': 1056896, 'steps': 2064, 'loss/train': 2.3500022888183594} -09/20/2021 21:38:29 - INFO - __main__ - Step 33029: {'lr': 0.00019964892998821558, 'samples': 1056928, 'steps': 2064, 'loss/train': 1.4979948997497559} -09/20/2021 21:38:30 - INFO - __main__ - Step 33030: {'lr': 0.00019964892998821558, 'samples': 1056960, 'steps': 2064, 'loss/train': 1.8603301048278809} -09/20/2021 21:38:31 - INFO - __main__ - Step 33031: {'lr': 0.00019964892998821558, 'samples': 1056992, 'steps': 2064, 'loss/train': 1.733816146850586} -09/20/2021 21:38:31 - INFO - __main__ - Step 33032: {'lr': 0.00019964892998821558, 'samples': 1057024, 'steps': 2064, 'loss/train': 1.6828196048736572} -09/20/2021 21:38:32 - INFO - __main__ - Step 33033: {'lr': 0.00019964892998821558, 'samples': 1057056, 'steps': 2064, 'loss/train': 2.1326828002929688} -09/20/2021 21:38:33 - INFO - __main__ - Step 33034: {'lr': 0.00019964892998821558, 'samples': 1057088, 'steps': 2064, 'loss/train': 3.0039854049682617} -09/20/2021 21:38:34 - INFO - __main__ - Step 33035: {'lr': 0.00019964892998821558, 'samples': 1057120, 'steps': 2064, 'loss/train': 2.265930652618408} -09/20/2021 21:38:34 - INFO - __main__ - Step 33036: {'lr': 0.00019964892998821558, 'samples': 1057152, 'steps': 2064, 'loss/train': 1.0176724195480347} -09/20/2021 21:38:35 - INFO - __main__ - Step 33037: {'lr': 0.00019964892998821558, 'samples': 1057184, 'steps': 2064, 'loss/train': 3.0532751083374023} -09/20/2021 21:38:36 - INFO - __main__ - Step 33038: {'lr': 0.00019964892998821558, 'samples': 1057216, 'steps': 2064, 'loss/train': 2.5805561542510986} -09/20/2021 21:38:37 - INFO - __main__ - Step 33039: {'lr': 0.00019964892998821558, 'samples': 1057248, 'steps': 2064, 'loss/train': 2.1685550212860107} -09/20/2021 21:38:37 - INFO - __main__ - Step 33040: {'lr': 0.00019964892998821558, 'samples': 1057280, 'steps': 2064, 'loss/train': 2.434481382369995} -09/20/2021 21:38:38 - INFO - __main__ - Step 33041: {'lr': 0.0001996483957452209, 'samples': 1057312, 'steps': 2065, 'loss/train': 2.519230365753174} -09/20/2021 21:38:39 - INFO - __main__ - Step 33042: {'lr': 0.0001996483957452209, 'samples': 1057344, 'steps': 2065, 'loss/train': 0.1706538200378418} -09/20/2021 21:38:40 - INFO - __main__ - Step 33043: {'lr': 0.0001996483957452209, 'samples': 1057376, 'steps': 2065, 'loss/train': 2.6480326652526855} -09/20/2021 21:38:41 - INFO - __main__ - Step 33044: {'lr': 0.0001996483957452209, 'samples': 1057408, 'steps': 2065, 'loss/train': 2.4083659648895264} -09/20/2021 21:38:41 - INFO - __main__ - Step 33045: {'lr': 0.0001996483957452209, 'samples': 1057440, 'steps': 2065, 'loss/train': 3.4838449954986572} -09/20/2021 21:38:43 - INFO - __main__ - Step 33046: {'lr': 0.0001996483957452209, 'samples': 1057472, 'steps': 2065, 'loss/train': 2.6761257648468018} -09/20/2021 21:38:43 - INFO - __main__ - Step 33047: {'lr': 0.0001996483957452209, 'samples': 1057504, 'steps': 2065, 'loss/train': 2.288424253463745} -09/20/2021 21:38:44 - INFO - __main__ - Step 33048: {'lr': 0.0001996483957452209, 'samples': 1057536, 'steps': 2065, 'loss/train': 2.3737800121307373} -09/20/2021 21:38:45 - INFO - __main__ - Step 33049: {'lr': 0.0001996483957452209, 'samples': 1057568, 'steps': 2065, 'loss/train': 2.5253489017486572} -09/20/2021 21:38:46 - INFO - __main__ - Step 33050: {'lr': 0.0001996483957452209, 'samples': 1057600, 'steps': 2065, 'loss/train': 0.8075559139251709} -09/20/2021 21:38:46 - INFO - __main__ - Step 33051: {'lr': 0.0001996483957452209, 'samples': 1057632, 'steps': 2065, 'loss/train': 2.204552412033081} -09/20/2021 21:38:47 - INFO - __main__ - Step 33052: {'lr': 0.0001996483957452209, 'samples': 1057664, 'steps': 2065, 'loss/train': 1.2386842966079712} -09/20/2021 21:38:48 - INFO - __main__ - Step 33053: {'lr': 0.0001996483957452209, 'samples': 1057696, 'steps': 2065, 'loss/train': 1.8533127307891846} -09/20/2021 21:38:49 - INFO - __main__ - Step 33054: {'lr': 0.0001996483957452209, 'samples': 1057728, 'steps': 2065, 'loss/train': 1.7923779487609863} -09/20/2021 21:38:49 - INFO - __main__ - Step 33055: {'lr': 0.0001996483957452209, 'samples': 1057760, 'steps': 2065, 'loss/train': 2.5211191177368164} -09/20/2021 21:38:50 - INFO - __main__ - Step 33056: {'lr': 0.0001996483957452209, 'samples': 1057792, 'steps': 2065, 'loss/train': 3.116748571395874} -09/20/2021 21:38:51 - INFO - __main__ - Step 33057: {'lr': 0.00019964786109675727, 'samples': 1057824, 'steps': 2066, 'loss/train': 0.7189973592758179} -09/20/2021 21:38:52 - INFO - __main__ - Step 33058: {'lr': 0.00019964786109675727, 'samples': 1057856, 'steps': 2066, 'loss/train': 3.279945135116577} -09/20/2021 21:38:53 - INFO - __main__ - Step 33059: {'lr': 0.00019964786109675727, 'samples': 1057888, 'steps': 2066, 'loss/train': 2.7752623558044434} -09/20/2021 21:38:53 - INFO - __main__ - Step 33060: {'lr': 0.00019964786109675727, 'samples': 1057920, 'steps': 2066, 'loss/train': 2.2705063819885254} -09/20/2021 21:38:54 - INFO - __main__ - Step 33061: {'lr': 0.00019964786109675727, 'samples': 1057952, 'steps': 2066, 'loss/train': 2.3684191703796387} -09/20/2021 21:38:55 - INFO - __main__ - Step 33062: {'lr': 0.00019964786109675727, 'samples': 1057984, 'steps': 2066, 'loss/train': 2.985377788543701} -09/20/2021 21:38:56 - INFO - __main__ - Step 33063: {'lr': 0.00019964786109675727, 'samples': 1058016, 'steps': 2066, 'loss/train': 2.7959136962890625} -09/20/2021 21:38:56 - INFO - __main__ - Step 33064: {'lr': 0.00019964786109675727, 'samples': 1058048, 'steps': 2066, 'loss/train': 1.918622612953186} -09/20/2021 21:38:57 - INFO - __main__ - Step 33065: {'lr': 0.00019964786109675727, 'samples': 1058080, 'steps': 2066, 'loss/train': 2.2196028232574463} -09/20/2021 21:38:58 - INFO - __main__ - Step 33066: {'lr': 0.00019964786109675727, 'samples': 1058112, 'steps': 2066, 'loss/train': 2.0301427841186523} -09/20/2021 21:38:59 - INFO - __main__ - Step 33067: {'lr': 0.00019964786109675727, 'samples': 1058144, 'steps': 2066, 'loss/train': 2.6524362564086914} -09/20/2021 21:38:59 - INFO - __main__ - Step 33068: {'lr': 0.00019964786109675727, 'samples': 1058176, 'steps': 2066, 'loss/train': 1.5708214044570923} -09/20/2021 21:39:00 - INFO - __main__ - Step 33069: {'lr': 0.00019964786109675727, 'samples': 1058208, 'steps': 2066, 'loss/train': 2.747361421585083} -09/20/2021 21:39:01 - INFO - __main__ - Step 33070: {'lr': 0.00019964786109675727, 'samples': 1058240, 'steps': 2066, 'loss/train': 1.9280059337615967} -09/20/2021 21:39:02 - INFO - __main__ - Step 33071: {'lr': 0.00019964786109675727, 'samples': 1058272, 'steps': 2066, 'loss/train': 3.0336191654205322} -09/20/2021 21:39:02 - INFO - __main__ - Step 33072: {'lr': 0.00019964786109675727, 'samples': 1058304, 'steps': 2066, 'loss/train': 2.4119720458984375} -09/20/2021 21:39:03 - INFO - __main__ - Step 33073: {'lr': 0.0001996473260428269, 'samples': 1058336, 'steps': 2067, 'loss/train': 2.895533323287964} -09/20/2021 21:39:04 - INFO - __main__ - Step 33074: {'lr': 0.0001996473260428269, 'samples': 1058368, 'steps': 2067, 'loss/train': 1.4458026885986328} -09/20/2021 21:39:05 - INFO - __main__ - Step 33075: {'lr': 0.0001996473260428269, 'samples': 1058400, 'steps': 2067, 'loss/train': 1.5446068048477173} -09/20/2021 21:39:05 - INFO - __main__ - Step 33076: {'lr': 0.0001996473260428269, 'samples': 1058432, 'steps': 2067, 'loss/train': 2.4150009155273438} -09/20/2021 21:39:07 - INFO - __main__ - Step 33077: {'lr': 0.0001996473260428269, 'samples': 1058464, 'steps': 2067, 'loss/train': 2.491100549697876} -09/20/2021 21:39:08 - INFO - __main__ - Step 33078: {'lr': 0.0001996473260428269, 'samples': 1058496, 'steps': 2067, 'loss/train': 1.811192512512207} -09/20/2021 21:39:08 - INFO - __main__ - Step 33079: {'lr': 0.0001996473260428269, 'samples': 1058528, 'steps': 2067, 'loss/train': 2.025578498840332} -09/20/2021 21:39:09 - INFO - __main__ - Step 33080: {'lr': 0.0001996473260428269, 'samples': 1058560, 'steps': 2067, 'loss/train': 2.0084586143493652} -09/20/2021 21:39:10 - INFO - __main__ - Step 33081: {'lr': 0.0001996473260428269, 'samples': 1058592, 'steps': 2067, 'loss/train': 3.1301791667938232} -09/20/2021 21:39:11 - INFO - __main__ - Step 33082: {'lr': 0.0001996473260428269, 'samples': 1058624, 'steps': 2067, 'loss/train': 3.2651925086975098} -09/20/2021 21:39:11 - INFO - __main__ - Step 33083: {'lr': 0.0001996473260428269, 'samples': 1058656, 'steps': 2067, 'loss/train': 2.330759286880493} -09/20/2021 21:39:12 - INFO - __main__ - Step 33084: {'lr': 0.0001996473260428269, 'samples': 1058688, 'steps': 2067, 'loss/train': 2.216930389404297} -09/20/2021 21:39:13 - INFO - __main__ - Step 33085: {'lr': 0.0001996473260428269, 'samples': 1058720, 'steps': 2067, 'loss/train': 3.0752885341644287} -09/20/2021 21:39:14 - INFO - __main__ - Step 33086: {'lr': 0.0001996473260428269, 'samples': 1058752, 'steps': 2067, 'loss/train': 2.3817591667175293} -09/20/2021 21:39:14 - INFO - __main__ - Step 33087: {'lr': 0.0001996473260428269, 'samples': 1058784, 'steps': 2067, 'loss/train': 1.9342645406723022} -09/20/2021 21:39:15 - INFO - __main__ - Step 33088: {'lr': 0.0001996473260428269, 'samples': 1058816, 'steps': 2067, 'loss/train': 2.777252435684204} -09/20/2021 21:39:16 - INFO - __main__ - Step 33089: {'lr': 0.0001996467905834319, 'samples': 1058848, 'steps': 2068, 'loss/train': 2.5430524349212646} -09/20/2021 21:39:17 - INFO - __main__ - Step 33090: {'lr': 0.0001996467905834319, 'samples': 1058880, 'steps': 2068, 'loss/train': 3.3045992851257324} -09/20/2021 21:39:17 - INFO - __main__ - Step 33091: {'lr': 0.0001996467905834319, 'samples': 1058912, 'steps': 2068, 'loss/train': 2.5527467727661133} -09/20/2021 21:39:18 - INFO - __main__ - Step 33092: {'lr': 0.0001996467905834319, 'samples': 1058944, 'steps': 2068, 'loss/train': 2.0603339672088623} -09/20/2021 21:39:19 - INFO - __main__ - Step 33093: {'lr': 0.0001996467905834319, 'samples': 1058976, 'steps': 2068, 'loss/train': 3.358059883117676} -09/20/2021 21:39:20 - INFO - __main__ - Step 33094: {'lr': 0.0001996467905834319, 'samples': 1059008, 'steps': 2068, 'loss/train': 2.5410168170928955} -09/20/2021 21:39:20 - INFO - __main__ - Step 33095: {'lr': 0.0001996467905834319, 'samples': 1059040, 'steps': 2068, 'loss/train': 2.5505759716033936} -09/20/2021 21:39:21 - INFO - __main__ - Step 33096: {'lr': 0.0001996467905834319, 'samples': 1059072, 'steps': 2068, 'loss/train': 2.202340602874756} -09/20/2021 21:39:22 - INFO - __main__ - Step 33097: {'lr': 0.0001996467905834319, 'samples': 1059104, 'steps': 2068, 'loss/train': 0.704483687877655} -09/20/2021 21:39:23 - INFO - __main__ - Step 33098: {'lr': 0.0001996467905834319, 'samples': 1059136, 'steps': 2068, 'loss/train': 2.316537618637085} -09/20/2021 21:39:23 - INFO - __main__ - Step 33099: {'lr': 0.0001996467905834319, 'samples': 1059168, 'steps': 2068, 'loss/train': 2.886598587036133} -09/20/2021 21:39:24 - INFO - __main__ - Step 33100: {'lr': 0.0001996467905834319, 'samples': 1059200, 'steps': 2068, 'loss/train': 2.7830145359039307} -09/20/2021 21:39:25 - INFO - __main__ - Step 33101: {'lr': 0.0001996467905834319, 'samples': 1059232, 'steps': 2068, 'loss/train': 1.9102431535720825} -09/20/2021 21:39:26 - INFO - __main__ - Step 33102: {'lr': 0.0001996467905834319, 'samples': 1059264, 'steps': 2068, 'loss/train': 2.757866621017456} -09/20/2021 21:39:26 - INFO - __main__ - Step 33103: {'lr': 0.0001996467905834319, 'samples': 1059296, 'steps': 2068, 'loss/train': 2.282174825668335} -09/20/2021 21:39:27 - INFO - __main__ - Step 33104: {'lr': 0.0001996467905834319, 'samples': 1059328, 'steps': 2068, 'loss/train': 3.0449984073638916} -09/20/2021 21:39:28 - INFO - __main__ - Step 33105: {'lr': 0.00019964625471857457, 'samples': 1059360, 'steps': 2069, 'loss/train': 2.536234140396118} -09/20/2021 21:39:29 - INFO - __main__ - Step 33106: {'lr': 0.00019964625471857457, 'samples': 1059392, 'steps': 2069, 'loss/train': 2.010457754135132} -09/20/2021 21:39:30 - INFO - __main__ - Step 33107: {'lr': 0.00019964625471857457, 'samples': 1059424, 'steps': 2069, 'loss/train': 3.070552349090576} -09/20/2021 21:39:31 - INFO - __main__ - Step 33108: {'lr': 0.00019964625471857457, 'samples': 1059456, 'steps': 2069, 'loss/train': 0.3457314372062683} -09/20/2021 21:39:32 - INFO - __main__ - Step 33109: {'lr': 0.00019964625471857457, 'samples': 1059488, 'steps': 2069, 'loss/train': 2.3376379013061523} -09/20/2021 21:39:32 - INFO - __main__ - Step 33110: {'lr': 0.00019964625471857457, 'samples': 1059520, 'steps': 2069, 'loss/train': 2.776837110519409} -09/20/2021 21:39:33 - INFO - __main__ - Step 33111: {'lr': 0.00019964625471857457, 'samples': 1059552, 'steps': 2069, 'loss/train': 2.7872676849365234} -09/20/2021 21:39:34 - INFO - __main__ - Step 33112: {'lr': 0.00019964625471857457, 'samples': 1059584, 'steps': 2069, 'loss/train': 0.39700186252593994} -09/20/2021 21:39:35 - INFO - __main__ - Step 33113: {'lr': 0.00019964625471857457, 'samples': 1059616, 'steps': 2069, 'loss/train': 2.453676700592041} -09/20/2021 21:39:35 - INFO - __main__ - Step 33114: {'lr': 0.00019964625471857457, 'samples': 1059648, 'steps': 2069, 'loss/train': 1.7732685804367065} -09/20/2021 21:39:36 - INFO - __main__ - Step 33115: {'lr': 0.00019964625471857457, 'samples': 1059680, 'steps': 2069, 'loss/train': 3.969984769821167} -09/20/2021 21:39:37 - INFO - __main__ - Step 33116: {'lr': 0.00019964625471857457, 'samples': 1059712, 'steps': 2069, 'loss/train': 2.6619255542755127} -09/20/2021 21:39:38 - INFO - __main__ - Step 33117: {'lr': 0.00019964625471857457, 'samples': 1059744, 'steps': 2069, 'loss/train': 2.486258029937744} -09/20/2021 21:39:38 - INFO - __main__ - Step 33118: {'lr': 0.00019964625471857457, 'samples': 1059776, 'steps': 2069, 'loss/train': 2.0668280124664307} -09/20/2021 21:39:39 - INFO - __main__ - Step 33119: {'lr': 0.00019964625471857457, 'samples': 1059808, 'steps': 2069, 'loss/train': 1.9397368431091309} -09/20/2021 21:39:40 - INFO - __main__ - Step 33120: {'lr': 0.00019964625471857457, 'samples': 1059840, 'steps': 2069, 'loss/train': 2.118035316467285} -09/20/2021 21:39:41 - INFO - __main__ - Step 33121: {'lr': 0.00019964571844825697, 'samples': 1059872, 'steps': 2070, 'loss/train': 3.008929967880249} -09/20/2021 21:39:41 - INFO - __main__ - Step 33122: {'lr': 0.00019964571844825697, 'samples': 1059904, 'steps': 2070, 'loss/train': 1.618327260017395} -09/20/2021 21:39:42 - INFO - __main__ - Step 33123: {'lr': 0.00019964571844825697, 'samples': 1059936, 'steps': 2070, 'loss/train': 2.7532167434692383} -09/20/2021 21:39:43 - INFO - __main__ - Step 33124: {'lr': 0.00019964571844825697, 'samples': 1059968, 'steps': 2070, 'loss/train': 2.7407171726226807} -09/20/2021 21:39:44 - INFO - __main__ - Step 33125: {'lr': 0.00019964571844825697, 'samples': 1060000, 'steps': 2070, 'loss/train': 2.4698431491851807} -09/20/2021 21:39:44 - INFO - __main__ - Step 33126: {'lr': 0.00019964571844825697, 'samples': 1060032, 'steps': 2070, 'loss/train': 1.915247917175293} -09/20/2021 21:39:45 - INFO - __main__ - Step 33127: {'lr': 0.00019964571844825697, 'samples': 1060064, 'steps': 2070, 'loss/train': 2.4940381050109863} -09/20/2021 21:39:46 - INFO - __main__ - Step 33128: {'lr': 0.00019964571844825697, 'samples': 1060096, 'steps': 2070, 'loss/train': 2.716327428817749} -09/20/2021 21:39:47 - INFO - __main__ - Step 33129: {'lr': 0.00019964571844825697, 'samples': 1060128, 'steps': 2070, 'loss/train': 1.2501440048217773} -09/20/2021 21:39:47 - INFO - __main__ - Step 33130: {'lr': 0.00019964571844825697, 'samples': 1060160, 'steps': 2070, 'loss/train': 1.6347328424453735} -09/20/2021 21:39:48 - INFO - __main__ - Step 33131: {'lr': 0.00019964571844825697, 'samples': 1060192, 'steps': 2070, 'loss/train': 2.340503692626953} -09/20/2021 21:39:49 - INFO - __main__ - Step 33132: {'lr': 0.00019964571844825697, 'samples': 1060224, 'steps': 2070, 'loss/train': 2.6156368255615234} -09/20/2021 21:39:50 - INFO - __main__ - Step 33133: {'lr': 0.00019964571844825697, 'samples': 1060256, 'steps': 2070, 'loss/train': 2.663076162338257} -09/20/2021 21:39:50 - INFO - __main__ - Step 33134: {'lr': 0.00019964571844825697, 'samples': 1060288, 'steps': 2070, 'loss/train': 2.840081214904785} -09/20/2021 21:39:51 - INFO - __main__ - Step 33135: {'lr': 0.00019964571844825697, 'samples': 1060320, 'steps': 2070, 'loss/train': 2.8642399311065674} -09/20/2021 21:39:52 - INFO - __main__ - Step 33136: {'lr': 0.00019964571844825697, 'samples': 1060352, 'steps': 2070, 'loss/train': 2.1484577655792236} -09/20/2021 21:39:53 - INFO - __main__ - Step 33137: {'lr': 0.00019964518177248135, 'samples': 1060384, 'steps': 2071, 'loss/train': 3.048152208328247} -09/20/2021 21:39:54 - INFO - __main__ - Step 33138: {'lr': 0.00019964518177248135, 'samples': 1060416, 'steps': 2071, 'loss/train': 3.1988039016723633} -09/20/2021 21:39:55 - INFO - __main__ - Step 33139: {'lr': 0.00019964518177248135, 'samples': 1060448, 'steps': 2071, 'loss/train': 3.0049710273742676} -09/20/2021 21:39:56 - INFO - __main__ - Step 33140: {'lr': 0.00019964518177248135, 'samples': 1060480, 'steps': 2071, 'loss/train': 2.7129807472229004} -09/20/2021 21:39:56 - INFO - __main__ - Step 33141: {'lr': 0.00019964518177248135, 'samples': 1060512, 'steps': 2071, 'loss/train': 1.9017219543457031} -09/20/2021 21:39:57 - INFO - __main__ - Step 33142: {'lr': 0.00019964518177248135, 'samples': 1060544, 'steps': 2071, 'loss/train': 1.894890308380127} -09/20/2021 21:39:58 - INFO - __main__ - Step 33143: {'lr': 0.00019964518177248135, 'samples': 1060576, 'steps': 2071, 'loss/train': 1.5641717910766602} -09/20/2021 21:39:59 - INFO - __main__ - Step 33144: {'lr': 0.00019964518177248135, 'samples': 1060608, 'steps': 2071, 'loss/train': 2.2810757160186768} -09/20/2021 21:39:59 - INFO - __main__ - Step 33145: {'lr': 0.00019964518177248135, 'samples': 1060640, 'steps': 2071, 'loss/train': 1.9904019832611084} -09/20/2021 21:40:00 - INFO - __main__ - Step 33146: {'lr': 0.00019964518177248135, 'samples': 1060672, 'steps': 2071, 'loss/train': 2.859442949295044} -09/20/2021 21:40:01 - INFO - __main__ - Step 33147: {'lr': 0.00019964518177248135, 'samples': 1060704, 'steps': 2071, 'loss/train': 1.9192581176757812} -09/20/2021 21:40:02 - INFO - __main__ - Step 33148: {'lr': 0.00019964518177248135, 'samples': 1060736, 'steps': 2071, 'loss/train': 1.7766221761703491} -09/20/2021 21:40:02 - INFO - __main__ - Step 33149: {'lr': 0.00019964518177248135, 'samples': 1060768, 'steps': 2071, 'loss/train': 2.011084794998169} -09/20/2021 21:40:03 - INFO - __main__ - Step 33150: {'lr': 0.00019964518177248135, 'samples': 1060800, 'steps': 2071, 'loss/train': 2.920610189437866} -09/20/2021 21:40:04 - INFO - __main__ - Step 33151: {'lr': 0.00019964518177248135, 'samples': 1060832, 'steps': 2071, 'loss/train': 3.1218831539154053} -09/20/2021 21:40:05 - INFO - __main__ - Step 33152: {'lr': 0.00019964518177248135, 'samples': 1060864, 'steps': 2071, 'loss/train': 1.397178292274475} -09/20/2021 21:40:05 - INFO - __main__ - Step 33153: {'lr': 0.00019964464469124984, 'samples': 1060896, 'steps': 2072, 'loss/train': 2.121403932571411} -09/20/2021 21:40:06 - INFO - __main__ - Step 33154: {'lr': 0.00019964464469124984, 'samples': 1060928, 'steps': 2072, 'loss/train': 2.7108702659606934} -09/20/2021 21:40:07 - INFO - __main__ - Step 33155: {'lr': 0.00019964464469124984, 'samples': 1060960, 'steps': 2072, 'loss/train': 1.7740880250930786} -09/20/2021 21:40:08 - INFO - __main__ - Step 33156: {'lr': 0.00019964464469124984, 'samples': 1060992, 'steps': 2072, 'loss/train': 1.7598029375076294} -09/20/2021 21:40:08 - INFO - __main__ - Step 33157: {'lr': 0.00019964464469124984, 'samples': 1061024, 'steps': 2072, 'loss/train': 1.6152011156082153} -09/20/2021 21:40:09 - INFO - __main__ - Step 33158: {'lr': 0.00019964464469124984, 'samples': 1061056, 'steps': 2072, 'loss/train': 1.832335114479065} -09/20/2021 21:40:10 - INFO - __main__ - Step 33159: {'lr': 0.00019964464469124984, 'samples': 1061088, 'steps': 2072, 'loss/train': 2.3652658462524414} -09/20/2021 21:40:11 - INFO - __main__ - Step 33160: {'lr': 0.00019964464469124984, 'samples': 1061120, 'steps': 2072, 'loss/train': 1.9856082201004028} -09/20/2021 21:40:11 - INFO - __main__ - Step 33161: {'lr': 0.00019964464469124984, 'samples': 1061152, 'steps': 2072, 'loss/train': 2.4688093662261963} -09/20/2021 21:40:12 - INFO - __main__ - Step 33162: {'lr': 0.00019964464469124984, 'samples': 1061184, 'steps': 2072, 'loss/train': 2.1669602394104004} -09/20/2021 21:40:13 - INFO - __main__ - Step 33163: {'lr': 0.00019964464469124984, 'samples': 1061216, 'steps': 2072, 'loss/train': 2.28440523147583} -09/20/2021 21:40:14 - INFO - __main__ - Step 33164: {'lr': 0.00019964464469124984, 'samples': 1061248, 'steps': 2072, 'loss/train': 2.4338033199310303} -09/20/2021 21:40:14 - INFO - __main__ - Step 33165: {'lr': 0.00019964464469124984, 'samples': 1061280, 'steps': 2072, 'loss/train': 2.255635976791382} -09/20/2021 21:40:15 - INFO - __main__ - Step 33166: {'lr': 0.00019964464469124984, 'samples': 1061312, 'steps': 2072, 'loss/train': 2.831256866455078} -09/20/2021 21:40:16 - INFO - __main__ - Step 33167: {'lr': 0.00019964464469124984, 'samples': 1061344, 'steps': 2072, 'loss/train': 2.656525135040283} -09/20/2021 21:40:17 - INFO - __main__ - Step 33168: {'lr': 0.00019964464469124984, 'samples': 1061376, 'steps': 2072, 'loss/train': 2.110161542892456} -09/20/2021 21:40:18 - INFO - __main__ - Step 33169: {'lr': 0.00019964410720456468, 'samples': 1061408, 'steps': 2073, 'loss/train': 2.4303810596466064} -09/20/2021 21:40:20 - INFO - __main__ - Step 33170: {'lr': 0.00019964410720456468, 'samples': 1061440, 'steps': 2073, 'loss/train': 1.8608976602554321} -09/20/2021 21:40:21 - INFO - __main__ - Step 33171: {'lr': 0.00019964410720456468, 'samples': 1061472, 'steps': 2073, 'loss/train': 1.134559988975525} -09/20/2021 21:40:21 - INFO - __main__ - Step 33172: {'lr': 0.00019964410720456468, 'samples': 1061504, 'steps': 2073, 'loss/train': 2.814767837524414} -09/20/2021 21:40:22 - INFO - __main__ - Step 33173: {'lr': 0.00019964410720456468, 'samples': 1061536, 'steps': 2073, 'loss/train': 2.560620069503784} -09/20/2021 21:40:23 - INFO - __main__ - Step 33174: {'lr': 0.00019964410720456468, 'samples': 1061568, 'steps': 2073, 'loss/train': 0.22461256384849548} -09/20/2021 21:40:24 - INFO - __main__ - Step 33175: {'lr': 0.00019964410720456468, 'samples': 1061600, 'steps': 2073, 'loss/train': 0.22153452038764954} -09/20/2021 21:40:24 - INFO - __main__ - Step 33176: {'lr': 0.00019964410720456468, 'samples': 1061632, 'steps': 2073, 'loss/train': 0.2826552093029022} -09/20/2021 21:40:25 - INFO - __main__ - Step 33177: {'lr': 0.00019964410720456468, 'samples': 1061664, 'steps': 2073, 'loss/train': 2.199052572250366} -09/20/2021 21:40:26 - INFO - __main__ - Step 33178: {'lr': 0.00019964410720456468, 'samples': 1061696, 'steps': 2073, 'loss/train': 2.9735100269317627} -09/20/2021 21:40:27 - INFO - __main__ - Step 33179: {'lr': 0.00019964410720456468, 'samples': 1061728, 'steps': 2073, 'loss/train': 2.120180130004883} -09/20/2021 21:40:27 - INFO - __main__ - Step 33180: {'lr': 0.00019964410720456468, 'samples': 1061760, 'steps': 2073, 'loss/train': 2.2112538814544678} -09/20/2021 21:40:28 - INFO - __main__ - Step 33181: {'lr': 0.00019964410720456468, 'samples': 1061792, 'steps': 2073, 'loss/train': 1.895721435546875} -09/20/2021 21:40:29 - INFO - __main__ - Step 33182: {'lr': 0.00019964410720456468, 'samples': 1061824, 'steps': 2073, 'loss/train': 2.1111021041870117} -09/20/2021 21:40:30 - INFO - __main__ - Step 33183: {'lr': 0.00019964410720456468, 'samples': 1061856, 'steps': 2073, 'loss/train': 3.5805628299713135} -09/20/2021 21:40:30 - INFO - __main__ - Step 33184: {'lr': 0.00019964410720456468, 'samples': 1061888, 'steps': 2073, 'loss/train': 1.563637375831604} -09/20/2021 21:40:31 - INFO - __main__ - Step 33185: {'lr': 0.00019964356931242804, 'samples': 1061920, 'steps': 2074, 'loss/train': 2.0357959270477295} -09/20/2021 21:40:32 - INFO - __main__ - Step 33186: {'lr': 0.00019964356931242804, 'samples': 1061952, 'steps': 2074, 'loss/train': 1.9574445486068726} -09/20/2021 21:40:33 - INFO - __main__ - Step 33187: {'lr': 0.00019964356931242804, 'samples': 1061984, 'steps': 2074, 'loss/train': 2.1629936695098877} -09/20/2021 21:40:33 - INFO - __main__ - Step 33188: {'lr': 0.00019964356931242804, 'samples': 1062016, 'steps': 2074, 'loss/train': 3.0784261226654053} -09/20/2021 21:40:34 - INFO - __main__ - Step 33189: {'lr': 0.00019964356931242804, 'samples': 1062048, 'steps': 2074, 'loss/train': 2.638615131378174} -09/20/2021 21:40:35 - INFO - __main__ - Step 33190: {'lr': 0.00019964356931242804, 'samples': 1062080, 'steps': 2074, 'loss/train': 2.408745527267456} -09/20/2021 21:40:36 - INFO - __main__ - Step 33191: {'lr': 0.00019964356931242804, 'samples': 1062112, 'steps': 2074, 'loss/train': 2.36881947517395} -09/20/2021 21:40:36 - INFO - __main__ - Step 33192: {'lr': 0.00019964356931242804, 'samples': 1062144, 'steps': 2074, 'loss/train': 2.347177267074585} -09/20/2021 21:40:37 - INFO - __main__ - Step 33193: {'lr': 0.00019964356931242804, 'samples': 1062176, 'steps': 2074, 'loss/train': 2.3690807819366455} -09/20/2021 21:40:38 - INFO - __main__ - Step 33194: {'lr': 0.00019964356931242804, 'samples': 1062208, 'steps': 2074, 'loss/train': 2.4382991790771484} -09/20/2021 21:40:39 - INFO - __main__ - Step 33195: {'lr': 0.00019964356931242804, 'samples': 1062240, 'steps': 2074, 'loss/train': 2.4760689735412598} -09/20/2021 21:40:39 - INFO - __main__ - Step 33196: {'lr': 0.00019964356931242804, 'samples': 1062272, 'steps': 2074, 'loss/train': 2.4546375274658203} -09/20/2021 21:40:40 - INFO - __main__ - Step 33197: {'lr': 0.00019964356931242804, 'samples': 1062304, 'steps': 2074, 'loss/train': 2.250685214996338} -09/20/2021 21:40:41 - INFO - __main__ - Step 33198: {'lr': 0.00019964356931242804, 'samples': 1062336, 'steps': 2074, 'loss/train': 2.395719289779663} -09/20/2021 21:40:42 - INFO - __main__ - Step 33199: {'lr': 0.00019964356931242804, 'samples': 1062368, 'steps': 2074, 'loss/train': 2.4545540809631348} -09/20/2021 21:40:42 - INFO - __main__ - Step 33200: {'lr': 0.00019964356931242804, 'samples': 1062400, 'steps': 2074, 'loss/train': 2.416043996810913} -09/20/2021 21:40:43 - INFO - __main__ - Step 33201: {'lr': 0.0001996430310148421, 'samples': 1062432, 'steps': 2075, 'loss/train': 2.1363866329193115} -09/20/2021 21:40:44 - INFO - __main__ - Step 33202: {'lr': 0.0001996430310148421, 'samples': 1062464, 'steps': 2075, 'loss/train': 2.095013380050659} -09/20/2021 21:40:45 - INFO - __main__ - Step 33203: {'lr': 0.0001996430310148421, 'samples': 1062496, 'steps': 2075, 'loss/train': 1.8174704313278198} -09/20/2021 21:40:46 - INFO - __main__ - Step 33204: {'lr': 0.0001996430310148421, 'samples': 1062528, 'steps': 2075, 'loss/train': 1.9907097816467285} -09/20/2021 21:40:46 - INFO - __main__ - Step 33205: {'lr': 0.0001996430310148421, 'samples': 1062560, 'steps': 2075, 'loss/train': 1.4396848678588867} -09/20/2021 21:40:47 - INFO - __main__ - Step 33206: {'lr': 0.0001996430310148421, 'samples': 1062592, 'steps': 2075, 'loss/train': 1.7293376922607422} -09/20/2021 21:40:48 - INFO - __main__ - Step 33207: {'lr': 0.0001996430310148421, 'samples': 1062624, 'steps': 2075, 'loss/train': 2.383164882659912} -09/20/2021 21:40:49 - INFO - __main__ - Step 33208: {'lr': 0.0001996430310148421, 'samples': 1062656, 'steps': 2075, 'loss/train': 2.0746028423309326} -09/20/2021 21:40:50 - INFO - __main__ - Step 33209: {'lr': 0.0001996430310148421, 'samples': 1062688, 'steps': 2075, 'loss/train': 1.8753809928894043} -09/20/2021 21:40:51 - INFO - __main__ - Step 33210: {'lr': 0.0001996430310148421, 'samples': 1062720, 'steps': 2075, 'loss/train': 1.709010124206543} -09/20/2021 21:40:51 - INFO - __main__ - Step 33211: {'lr': 0.0001996430310148421, 'samples': 1062752, 'steps': 2075, 'loss/train': 4.4957122802734375} -09/20/2021 21:40:52 - INFO - __main__ - Step 33212: {'lr': 0.0001996430310148421, 'samples': 1062784, 'steps': 2075, 'loss/train': 2.22916316986084} -09/20/2021 21:40:53 - INFO - __main__ - Step 33213: {'lr': 0.0001996430310148421, 'samples': 1062816, 'steps': 2075, 'loss/train': 2.700923204421997} -09/20/2021 21:40:54 - INFO - __main__ - Step 33214: {'lr': 0.0001996430310148421, 'samples': 1062848, 'steps': 2075, 'loss/train': 2.045940399169922} -09/20/2021 21:40:54 - INFO - __main__ - Step 33215: {'lr': 0.0001996430310148421, 'samples': 1062880, 'steps': 2075, 'loss/train': 0.7788482904434204} -09/20/2021 21:40:55 - INFO - __main__ - Step 33216: {'lr': 0.0001996430310148421, 'samples': 1062912, 'steps': 2075, 'loss/train': 1.9842991828918457} -09/20/2021 21:40:56 - INFO - __main__ - Step 33217: {'lr': 0.00019964249231180906, 'samples': 1062944, 'steps': 2076, 'loss/train': 2.5299556255340576} -09/20/2021 21:40:57 - INFO - __main__ - Step 33218: {'lr': 0.00019964249231180906, 'samples': 1062976, 'steps': 2076, 'loss/train': 2.532526969909668} -09/20/2021 21:40:57 - INFO - __main__ - Step 33219: {'lr': 0.00019964249231180906, 'samples': 1063008, 'steps': 2076, 'loss/train': 2.604719638824463} -09/20/2021 21:40:58 - INFO - __main__ - Step 33220: {'lr': 0.00019964249231180906, 'samples': 1063040, 'steps': 2076, 'loss/train': 2.073173999786377} -09/20/2021 21:40:59 - INFO - __main__ - Step 33221: {'lr': 0.00019964249231180906, 'samples': 1063072, 'steps': 2076, 'loss/train': 2.760434865951538} -09/20/2021 21:41:00 - INFO - __main__ - Step 33222: {'lr': 0.00019964249231180906, 'samples': 1063104, 'steps': 2076, 'loss/train': 2.6707632541656494} -09/20/2021 21:41:00 - INFO - __main__ - Step 33223: {'lr': 0.00019964249231180906, 'samples': 1063136, 'steps': 2076, 'loss/train': 1.2688846588134766} -09/20/2021 21:41:01 - INFO - __main__ - Step 33224: {'lr': 0.00019964249231180906, 'samples': 1063168, 'steps': 2076, 'loss/train': 2.4757192134857178} -09/20/2021 21:41:02 - INFO - __main__ - Step 33225: {'lr': 0.00019964249231180906, 'samples': 1063200, 'steps': 2076, 'loss/train': 2.9124374389648438} -09/20/2021 21:41:03 - INFO - __main__ - Step 33226: {'lr': 0.00019964249231180906, 'samples': 1063232, 'steps': 2076, 'loss/train': 2.1089913845062256} -09/20/2021 21:41:03 - INFO - __main__ - Step 33227: {'lr': 0.00019964249231180906, 'samples': 1063264, 'steps': 2076, 'loss/train': 2.127141237258911} -09/20/2021 21:41:04 - INFO - __main__ - Step 33228: {'lr': 0.00019964249231180906, 'samples': 1063296, 'steps': 2076, 'loss/train': 2.8376736640930176} -09/20/2021 21:41:05 - INFO - __main__ - Step 33229: {'lr': 0.00019964249231180906, 'samples': 1063328, 'steps': 2076, 'loss/train': 1.94692063331604} -09/20/2021 21:41:06 - INFO - __main__ - Step 33230: {'lr': 0.00019964249231180906, 'samples': 1063360, 'steps': 2076, 'loss/train': 1.5520286560058594} -09/20/2021 21:41:06 - INFO - __main__ - Step 33231: {'lr': 0.00019964249231180906, 'samples': 1063392, 'steps': 2076, 'loss/train': 2.6433284282684326} -09/20/2021 21:41:07 - INFO - __main__ - Step 33232: {'lr': 0.00019964249231180906, 'samples': 1063424, 'steps': 2076, 'loss/train': 3.1311047077178955} -09/20/2021 21:41:08 - INFO - __main__ - Step 33233: {'lr': 0.00019964195320333107, 'samples': 1063456, 'steps': 2077, 'loss/train': 1.3327984809875488} -09/20/2021 21:41:09 - INFO - __main__ - Step 33234: {'lr': 0.00019964195320333107, 'samples': 1063488, 'steps': 2077, 'loss/train': 2.304307222366333} -09/20/2021 21:41:10 - INFO - __main__ - Step 33235: {'lr': 0.00019964195320333107, 'samples': 1063520, 'steps': 2077, 'loss/train': 2.1214780807495117} -09/20/2021 21:41:10 - INFO - __main__ - Step 33236: {'lr': 0.00019964195320333107, 'samples': 1063552, 'steps': 2077, 'loss/train': 2.874331474304199} -09/20/2021 21:41:11 - INFO - __main__ - Step 33237: {'lr': 0.00019964195320333107, 'samples': 1063584, 'steps': 2077, 'loss/train': 2.886807680130005} -09/20/2021 21:41:12 - INFO - __main__ - Step 33238: {'lr': 0.00019964195320333107, 'samples': 1063616, 'steps': 2077, 'loss/train': 2.189647912979126} -09/20/2021 21:41:13 - INFO - __main__ - Step 33239: {'lr': 0.00019964195320333107, 'samples': 1063648, 'steps': 2077, 'loss/train': 2.4991343021392822} -09/20/2021 21:41:13 - INFO - __main__ - Step 33240: {'lr': 0.00019964195320333107, 'samples': 1063680, 'steps': 2077, 'loss/train': 2.108311891555786} -09/20/2021 21:41:15 - INFO - __main__ - Step 33241: {'lr': 0.00019964195320333107, 'samples': 1063712, 'steps': 2077, 'loss/train': 2.1081998348236084} -09/20/2021 21:41:16 - INFO - __main__ - Step 33242: {'lr': 0.00019964195320333107, 'samples': 1063744, 'steps': 2077, 'loss/train': 2.5180273056030273} -09/20/2021 21:41:17 - INFO - __main__ - Step 33243: {'lr': 0.00019964195320333107, 'samples': 1063776, 'steps': 2077, 'loss/train': 2.6792778968811035} -09/20/2021 21:41:17 - INFO - __main__ - Step 33244: {'lr': 0.00019964195320333107, 'samples': 1063808, 'steps': 2077, 'loss/train': 1.8188765048980713} -09/20/2021 21:41:18 - INFO - __main__ - Step 33245: {'lr': 0.00019964195320333107, 'samples': 1063840, 'steps': 2077, 'loss/train': 2.667206287384033} -09/20/2021 21:41:19 - INFO - __main__ - Step 33246: {'lr': 0.00019964195320333107, 'samples': 1063872, 'steps': 2077, 'loss/train': 1.8606616258621216} -09/20/2021 21:41:20 - INFO - __main__ - Step 33247: {'lr': 0.00019964195320333107, 'samples': 1063904, 'steps': 2077, 'loss/train': 2.9599246978759766} -09/20/2021 21:41:20 - INFO - __main__ - Step 33248: {'lr': 0.00019964195320333107, 'samples': 1063936, 'steps': 2077, 'loss/train': 1.8963871002197266} -09/20/2021 21:41:21 - INFO - __main__ - Step 33249: {'lr': 0.0001996414136894104, 'samples': 1063968, 'steps': 2078, 'loss/train': 2.2369918823242188} -09/20/2021 21:41:22 - INFO - __main__ - Step 33250: {'lr': 0.0001996414136894104, 'samples': 1064000, 'steps': 2078, 'loss/train': 2.2530550956726074} -09/20/2021 21:41:23 - INFO - __main__ - Step 33251: {'lr': 0.0001996414136894104, 'samples': 1064032, 'steps': 2078, 'loss/train': 2.3010897636413574} -09/20/2021 21:41:24 - INFO - __main__ - Step 33252: {'lr': 0.0001996414136894104, 'samples': 1064064, 'steps': 2078, 'loss/train': 3.0345535278320312} -09/20/2021 21:41:24 - INFO - __main__ - Step 33253: {'lr': 0.0001996414136894104, 'samples': 1064096, 'steps': 2078, 'loss/train': 3.3837473392486572} -09/20/2021 21:41:25 - INFO - __main__ - Step 33254: {'lr': 0.0001996414136894104, 'samples': 1064128, 'steps': 2078, 'loss/train': 2.5413742065429688} -09/20/2021 21:41:26 - INFO - __main__ - Step 33255: {'lr': 0.0001996414136894104, 'samples': 1064160, 'steps': 2078, 'loss/train': 3.0801734924316406} -09/20/2021 21:41:27 - INFO - __main__ - Step 33256: {'lr': 0.0001996414136894104, 'samples': 1064192, 'steps': 2078, 'loss/train': 0.9508473873138428} -09/20/2021 21:41:27 - INFO - __main__ - Step 33257: {'lr': 0.0001996414136894104, 'samples': 1064224, 'steps': 2078, 'loss/train': 2.1177918910980225} -09/20/2021 21:41:28 - INFO - __main__ - Step 33258: {'lr': 0.0001996414136894104, 'samples': 1064256, 'steps': 2078, 'loss/train': 1.6014742851257324} -09/20/2021 21:41:29 - INFO - __main__ - Step 33259: {'lr': 0.0001996414136894104, 'samples': 1064288, 'steps': 2078, 'loss/train': 2.5989503860473633} -09/20/2021 21:41:30 - INFO - __main__ - Step 33260: {'lr': 0.0001996414136894104, 'samples': 1064320, 'steps': 2078, 'loss/train': 2.708632707595825} -09/20/2021 21:41:30 - INFO - __main__ - Step 33261: {'lr': 0.0001996414136894104, 'samples': 1064352, 'steps': 2078, 'loss/train': 2.1559414863586426} -09/20/2021 21:41:31 - INFO - __main__ - Step 33262: {'lr': 0.0001996414136894104, 'samples': 1064384, 'steps': 2078, 'loss/train': 2.0619101524353027} -09/20/2021 21:41:32 - INFO - __main__ - Step 33263: {'lr': 0.0001996414136894104, 'samples': 1064416, 'steps': 2078, 'loss/train': 2.657691240310669} -09/20/2021 21:41:33 - INFO - __main__ - Step 33264: {'lr': 0.0001996414136894104, 'samples': 1064448, 'steps': 2078, 'loss/train': 2.0388119220733643} -09/20/2021 21:41:33 - INFO - __main__ - Step 33265: {'lr': 0.0001996408737700492, 'samples': 1064480, 'steps': 2079, 'loss/train': 2.348311185836792} -09/20/2021 21:41:34 - INFO - __main__ - Step 33266: {'lr': 0.0001996408737700492, 'samples': 1064512, 'steps': 2079, 'loss/train': 2.3443753719329834} -09/20/2021 21:41:35 - INFO - __main__ - Step 33267: {'lr': 0.0001996408737700492, 'samples': 1064544, 'steps': 2079, 'loss/train': 4.488341331481934} -09/20/2021 21:41:36 - INFO - __main__ - Step 33268: {'lr': 0.0001996408737700492, 'samples': 1064576, 'steps': 2079, 'loss/train': 1.5712435245513916} -09/20/2021 21:41:36 - INFO - __main__ - Step 33269: {'lr': 0.0001996408737700492, 'samples': 1064608, 'steps': 2079, 'loss/train': 3.987454414367676} -09/20/2021 21:41:37 - INFO - __main__ - Step 33270: {'lr': 0.0001996408737700492, 'samples': 1064640, 'steps': 2079, 'loss/train': 1.7215871810913086} -09/20/2021 21:41:38 - INFO - __main__ - Step 33271: {'lr': 0.0001996408737700492, 'samples': 1064672, 'steps': 2079, 'loss/train': 2.408323287963867} -09/20/2021 21:41:39 - INFO - __main__ - Step 33272: {'lr': 0.0001996408737700492, 'samples': 1064704, 'steps': 2079, 'loss/train': 2.2506773471832275} -09/20/2021 21:41:40 - INFO - __main__ - Step 33273: {'lr': 0.0001996408737700492, 'samples': 1064736, 'steps': 2079, 'loss/train': 2.918168544769287} -09/20/2021 21:41:41 - INFO - __main__ - Step 33274: {'lr': 0.0001996408737700492, 'samples': 1064768, 'steps': 2079, 'loss/train': 0.6277217268943787} -09/20/2021 21:41:41 - INFO - __main__ - Step 33275: {'lr': 0.0001996408737700492, 'samples': 1064800, 'steps': 2079, 'loss/train': 4.1546149253845215} -09/20/2021 21:41:42 - INFO - __main__ - Step 33276: {'lr': 0.0001996408737700492, 'samples': 1064832, 'steps': 2079, 'loss/train': 4.389187812805176} -09/20/2021 21:41:43 - INFO - __main__ - Step 33277: {'lr': 0.0001996408737700492, 'samples': 1064864, 'steps': 2079, 'loss/train': 2.365058183670044} -09/20/2021 21:41:44 - INFO - __main__ - Step 33278: {'lr': 0.0001996408737700492, 'samples': 1064896, 'steps': 2079, 'loss/train': 1.8055120706558228} -09/20/2021 21:41:44 - INFO - __main__ - Step 33279: {'lr': 0.0001996408737700492, 'samples': 1064928, 'steps': 2079, 'loss/train': 1.5276864767074585} -09/20/2021 21:41:45 - INFO - __main__ - Step 33280: {'lr': 0.0001996408737700492, 'samples': 1064960, 'steps': 2079, 'loss/train': 2.037656307220459} -09/20/2021 21:41:46 - INFO - __main__ - Step 33281: {'lr': 0.00019964033344524964, 'samples': 1064992, 'steps': 2080, 'loss/train': 1.559169054031372} -09/20/2021 21:41:47 - INFO - __main__ - Step 33282: {'lr': 0.00019964033344524964, 'samples': 1065024, 'steps': 2080, 'loss/train': 2.1516358852386475} -09/20/2021 21:41:48 - INFO - __main__ - Step 33283: {'lr': 0.00019964033344524964, 'samples': 1065056, 'steps': 2080, 'loss/train': 2.7807886600494385} -09/20/2021 21:41:48 - INFO - __main__ - Step 33284: {'lr': 0.00019964033344524964, 'samples': 1065088, 'steps': 2080, 'loss/train': 3.104612112045288} -09/20/2021 21:41:49 - INFO - __main__ - Step 33285: {'lr': 0.00019964033344524964, 'samples': 1065120, 'steps': 2080, 'loss/train': 1.7402827739715576} -09/20/2021 21:41:50 - INFO - __main__ - Step 33286: {'lr': 0.00019964033344524964, 'samples': 1065152, 'steps': 2080, 'loss/train': 2.6745951175689697} -09/20/2021 21:41:51 - INFO - __main__ - Step 33287: {'lr': 0.00019964033344524964, 'samples': 1065184, 'steps': 2080, 'loss/train': 1.9127956628799438} -09/20/2021 21:41:51 - INFO - __main__ - Step 33288: {'lr': 0.00019964033344524964, 'samples': 1065216, 'steps': 2080, 'loss/train': 2.0631887912750244} -09/20/2021 21:41:52 - INFO - __main__ - Step 33289: {'lr': 0.00019964033344524964, 'samples': 1065248, 'steps': 2080, 'loss/train': 2.633974075317383} -09/20/2021 21:41:53 - INFO - __main__ - Step 33290: {'lr': 0.00019964033344524964, 'samples': 1065280, 'steps': 2080, 'loss/train': 2.1718902587890625} -09/20/2021 21:41:54 - INFO - __main__ - Step 33291: {'lr': 0.00019964033344524964, 'samples': 1065312, 'steps': 2080, 'loss/train': 1.43165123462677} -09/20/2021 21:41:54 - INFO - __main__ - Step 33292: {'lr': 0.00019964033344524964, 'samples': 1065344, 'steps': 2080, 'loss/train': 1.931917428970337} -09/20/2021 21:41:55 - INFO - __main__ - Step 33293: {'lr': 0.00019964033344524964, 'samples': 1065376, 'steps': 2080, 'loss/train': 2.7469804286956787} -09/20/2021 21:41:56 - INFO - __main__ - Step 33294: {'lr': 0.00019964033344524964, 'samples': 1065408, 'steps': 2080, 'loss/train': 2.067007541656494} -09/20/2021 21:41:57 - INFO - __main__ - Step 33295: {'lr': 0.00019964033344524964, 'samples': 1065440, 'steps': 2080, 'loss/train': 2.963596820831299} -09/20/2021 21:41:57 - INFO - __main__ - Step 33296: {'lr': 0.00019964033344524964, 'samples': 1065472, 'steps': 2080, 'loss/train': 2.0089972019195557} -09/20/2021 21:41:58 - INFO - __main__ - Step 33297: {'lr': 0.00019963979271501398, 'samples': 1065504, 'steps': 2081, 'loss/train': 2.321185827255249} -09/20/2021 21:41:59 - INFO - __main__ - Step 33298: {'lr': 0.00019963979271501398, 'samples': 1065536, 'steps': 2081, 'loss/train': 1.9814856052398682} -09/20/2021 21:42:00 - INFO - __main__ - Step 33299: {'lr': 0.00019963979271501398, 'samples': 1065568, 'steps': 2081, 'loss/train': 2.05607008934021} -09/20/2021 21:42:00 - INFO - __main__ - Step 33300: {'lr': 0.00019963979271501398, 'samples': 1065600, 'steps': 2081, 'loss/train': 2.296494245529175} -09/20/2021 21:42:01 - INFO - __main__ - Step 33301: {'lr': 0.00019963979271501398, 'samples': 1065632, 'steps': 2081, 'loss/train': 2.784388542175293} -09/20/2021 21:42:02 - INFO - __main__ - Step 33302: {'lr': 0.00019963979271501398, 'samples': 1065664, 'steps': 2081, 'loss/train': 2.6084823608398438} -09/20/2021 21:42:03 - INFO - __main__ - Step 33303: {'lr': 0.00019963979271501398, 'samples': 1065696, 'steps': 2081, 'loss/train': 2.535040855407715} -09/20/2021 21:42:04 - INFO - __main__ - Step 33304: {'lr': 0.00019963979271501398, 'samples': 1065728, 'steps': 2081, 'loss/train': 1.7342222929000854} -09/20/2021 21:42:05 - INFO - __main__ - Step 33305: {'lr': 0.00019963979271501398, 'samples': 1065760, 'steps': 2081, 'loss/train': 2.94558048248291} -09/20/2021 21:42:06 - INFO - __main__ - Step 33306: {'lr': 0.00019963979271501398, 'samples': 1065792, 'steps': 2081, 'loss/train': 1.5409334897994995} -09/20/2021 21:42:06 - INFO - __main__ - Step 33307: {'lr': 0.00019963979271501398, 'samples': 1065824, 'steps': 2081, 'loss/train': 2.517148494720459} -09/20/2021 21:42:07 - INFO - __main__ - Step 33308: {'lr': 0.00019963979271501398, 'samples': 1065856, 'steps': 2081, 'loss/train': 2.2499117851257324} -09/20/2021 21:42:08 - INFO - __main__ - Step 33309: {'lr': 0.00019963979271501398, 'samples': 1065888, 'steps': 2081, 'loss/train': 2.6095187664031982} -09/20/2021 21:42:09 - INFO - __main__ - Step 33310: {'lr': 0.00019963979271501398, 'samples': 1065920, 'steps': 2081, 'loss/train': 2.0447700023651123} -09/20/2021 21:42:09 - INFO - __main__ - Step 33311: {'lr': 0.00019963979271501398, 'samples': 1065952, 'steps': 2081, 'loss/train': 2.9743428230285645} -09/20/2021 21:42:10 - INFO - __main__ - Step 33312: {'lr': 0.00019963979271501398, 'samples': 1065984, 'steps': 2081, 'loss/train': 3.1649444103240967} -09/20/2021 21:42:11 - INFO - __main__ - Step 33313: {'lr': 0.00019963925157934437, 'samples': 1066016, 'steps': 2082, 'loss/train': 2.1043527126312256} -09/20/2021 21:42:12 - INFO - __main__ - Step 33314: {'lr': 0.00019963925157934437, 'samples': 1066048, 'steps': 2082, 'loss/train': 2.338188648223877} -09/20/2021 21:42:12 - INFO - __main__ - Step 33315: {'lr': 0.00019963925157934437, 'samples': 1066080, 'steps': 2082, 'loss/train': 2.3927175998687744} -09/20/2021 21:42:13 - INFO - __main__ - Step 33316: {'lr': 0.00019963925157934437, 'samples': 1066112, 'steps': 2082, 'loss/train': 0.5909717082977295} -09/20/2021 21:42:14 - INFO - __main__ - Step 33317: {'lr': 0.00019963925157934437, 'samples': 1066144, 'steps': 2082, 'loss/train': 2.1111316680908203} -09/20/2021 21:42:15 - INFO - __main__ - Step 33318: {'lr': 0.00019963925157934437, 'samples': 1066176, 'steps': 2082, 'loss/train': 2.785320997238159} -09/20/2021 21:42:15 - INFO - __main__ - Step 33319: {'lr': 0.00019963925157934437, 'samples': 1066208, 'steps': 2082, 'loss/train': 2.054363489151001} -09/20/2021 21:42:16 - INFO - __main__ - Step 33320: {'lr': 0.00019963925157934437, 'samples': 1066240, 'steps': 2082, 'loss/train': 2.112076997756958} -09/20/2021 21:42:17 - INFO - __main__ - Step 33321: {'lr': 0.00019963925157934437, 'samples': 1066272, 'steps': 2082, 'loss/train': 2.913444995880127} -09/20/2021 21:42:18 - INFO - __main__ - Step 33322: {'lr': 0.00019963925157934437, 'samples': 1066304, 'steps': 2082, 'loss/train': 1.9030544757843018} -09/20/2021 21:42:18 - INFO - __main__ - Step 33323: {'lr': 0.00019963925157934437, 'samples': 1066336, 'steps': 2082, 'loss/train': 2.308490037918091} -09/20/2021 21:42:19 - INFO - __main__ - Step 33324: {'lr': 0.00019963925157934437, 'samples': 1066368, 'steps': 2082, 'loss/train': 3.7683005332946777} -09/20/2021 21:42:20 - INFO - __main__ - Step 33325: {'lr': 0.00019963925157934437, 'samples': 1066400, 'steps': 2082, 'loss/train': 2.131195068359375} -09/20/2021 21:42:21 - INFO - __main__ - Step 33326: {'lr': 0.00019963925157934437, 'samples': 1066432, 'steps': 2082, 'loss/train': 2.745830774307251} -09/20/2021 21:42:21 - INFO - __main__ - Step 33327: {'lr': 0.00019963925157934437, 'samples': 1066464, 'steps': 2082, 'loss/train': 2.4807136058807373} -09/20/2021 21:42:22 - INFO - __main__ - Step 33328: {'lr': 0.00019963925157934437, 'samples': 1066496, 'steps': 2082, 'loss/train': 2.3725595474243164} -09/20/2021 21:42:23 - INFO - __main__ - Step 33329: {'lr': 0.00019963871003824305, 'samples': 1066528, 'steps': 2083, 'loss/train': 2.704008102416992} -09/20/2021 21:42:24 - INFO - __main__ - Step 33330: {'lr': 0.00019963871003824305, 'samples': 1066560, 'steps': 2083, 'loss/train': 2.742995500564575} -09/20/2021 21:42:25 - INFO - __main__ - Step 33331: {'lr': 0.00019963871003824305, 'samples': 1066592, 'steps': 2083, 'loss/train': 2.5325570106506348} -09/20/2021 21:42:25 - INFO - __main__ - Step 33332: {'lr': 0.00019963871003824305, 'samples': 1066624, 'steps': 2083, 'loss/train': 2.2475478649139404} -09/20/2021 21:42:26 - INFO - __main__ - Step 33333: {'lr': 0.00019963871003824305, 'samples': 1066656, 'steps': 2083, 'loss/train': 2.772812604904175} -09/20/2021 21:42:27 - INFO - __main__ - Step 33334: {'lr': 0.00019963871003824305, 'samples': 1066688, 'steps': 2083, 'loss/train': 2.4928276538848877} -09/20/2021 21:42:28 - INFO - __main__ - Step 33335: {'lr': 0.00019963871003824305, 'samples': 1066720, 'steps': 2083, 'loss/train': 2.544281005859375} -09/20/2021 21:42:29 - INFO - __main__ - Step 33336: {'lr': 0.00019963871003824305, 'samples': 1066752, 'steps': 2083, 'loss/train': 2.4112870693206787} -09/20/2021 21:42:30 - INFO - __main__ - Step 33337: {'lr': 0.00019963871003824305, 'samples': 1066784, 'steps': 2083, 'loss/train': 1.9230111837387085} -09/20/2021 21:42:30 - INFO - __main__ - Step 33338: {'lr': 0.00019963871003824305, 'samples': 1066816, 'steps': 2083, 'loss/train': 2.5653812885284424} -09/20/2021 21:42:31 - INFO - __main__ - Step 33339: {'lr': 0.00019963871003824305, 'samples': 1066848, 'steps': 2083, 'loss/train': 1.5144392251968384} -09/20/2021 21:42:32 - INFO - __main__ - Step 33340: {'lr': 0.00019963871003824305, 'samples': 1066880, 'steps': 2083, 'loss/train': 2.245286464691162} -09/20/2021 21:42:33 - INFO - __main__ - Step 33341: {'lr': 0.00019963871003824305, 'samples': 1066912, 'steps': 2083, 'loss/train': 2.1533918380737305} -09/20/2021 21:42:33 - INFO - __main__ - Step 33342: {'lr': 0.00019963871003824305, 'samples': 1066944, 'steps': 2083, 'loss/train': 2.4244749546051025} -09/20/2021 21:42:34 - INFO - __main__ - Step 33343: {'lr': 0.00019963871003824305, 'samples': 1066976, 'steps': 2083, 'loss/train': 2.5947318077087402} -09/20/2021 21:42:35 - INFO - __main__ - Step 33344: {'lr': 0.00019963871003824305, 'samples': 1067008, 'steps': 2083, 'loss/train': 1.9708997011184692} -09/20/2021 21:42:36 - INFO - __main__ - Step 33345: {'lr': 0.00019963816809171218, 'samples': 1067040, 'steps': 2084, 'loss/train': 2.516211986541748} -09/20/2021 21:42:37 - INFO - __main__ - Step 33346: {'lr': 0.00019963816809171218, 'samples': 1067072, 'steps': 2084, 'loss/train': 3.0733113288879395} -09/20/2021 21:42:37 - INFO - __main__ - Step 33347: {'lr': 0.00019963816809171218, 'samples': 1067104, 'steps': 2084, 'loss/train': 1.8151782751083374} -09/20/2021 21:42:38 - INFO - __main__ - Step 33348: {'lr': 0.00019963816809171218, 'samples': 1067136, 'steps': 2084, 'loss/train': 1.9742066860198975} -09/20/2021 21:42:39 - INFO - __main__ - Step 33349: {'lr': 0.00019963816809171218, 'samples': 1067168, 'steps': 2084, 'loss/train': 2.969681978225708} -09/20/2021 21:42:40 - INFO - __main__ - Step 33350: {'lr': 0.00019963816809171218, 'samples': 1067200, 'steps': 2084, 'loss/train': 2.882211685180664} -09/20/2021 21:42:40 - INFO - __main__ - Step 33351: {'lr': 0.00019963816809171218, 'samples': 1067232, 'steps': 2084, 'loss/train': 1.471947193145752} -09/20/2021 21:42:41 - INFO - __main__ - Step 33352: {'lr': 0.00019963816809171218, 'samples': 1067264, 'steps': 2084, 'loss/train': 2.8283727169036865} -09/20/2021 21:42:42 - INFO - __main__ - Step 33353: {'lr': 0.00019963816809171218, 'samples': 1067296, 'steps': 2084, 'loss/train': 3.395629405975342} -09/20/2021 21:42:43 - INFO - __main__ - Step 33354: {'lr': 0.00019963816809171218, 'samples': 1067328, 'steps': 2084, 'loss/train': 2.676321029663086} -09/20/2021 21:42:43 - INFO - __main__ - Step 33355: {'lr': 0.00019963816809171218, 'samples': 1067360, 'steps': 2084, 'loss/train': 2.2512094974517822} -09/20/2021 21:42:44 - INFO - __main__ - Step 33356: {'lr': 0.00019963816809171218, 'samples': 1067392, 'steps': 2084, 'loss/train': 1.5801500082015991} -09/20/2021 21:42:45 - INFO - __main__ - Step 33357: {'lr': 0.00019963816809171218, 'samples': 1067424, 'steps': 2084, 'loss/train': 2.7361433506011963} -09/20/2021 21:42:46 - INFO - __main__ - Step 33358: {'lr': 0.00019963816809171218, 'samples': 1067456, 'steps': 2084, 'loss/train': 1.7309426069259644} -09/20/2021 21:42:46 - INFO - __main__ - Step 33359: {'lr': 0.00019963816809171218, 'samples': 1067488, 'steps': 2084, 'loss/train': 2.9536046981811523} -09/20/2021 21:42:47 - INFO - __main__ - Step 33360: {'lr': 0.00019963816809171218, 'samples': 1067520, 'steps': 2084, 'loss/train': 2.393584728240967} -09/20/2021 21:42:48 - INFO - __main__ - Step 33361: {'lr': 0.00019963762573975402, 'samples': 1067552, 'steps': 2085, 'loss/train': 1.8930420875549316} -09/20/2021 21:42:49 - INFO - __main__ - Step 33362: {'lr': 0.00019963762573975402, 'samples': 1067584, 'steps': 2085, 'loss/train': 1.5099128484725952} -09/20/2021 21:42:49 - INFO - __main__ - Step 33363: {'lr': 0.00019963762573975402, 'samples': 1067616, 'steps': 2085, 'loss/train': 2.447908401489258} -09/20/2021 21:42:50 - INFO - __main__ - Step 33364: {'lr': 0.00019963762573975402, 'samples': 1067648, 'steps': 2085, 'loss/train': 2.8438923358917236} -09/20/2021 21:42:52 - INFO - __main__ - Step 33365: {'lr': 0.00019963762573975402, 'samples': 1067680, 'steps': 2085, 'loss/train': 2.571976900100708} -09/20/2021 21:42:53 - INFO - __main__ - Step 33366: {'lr': 0.00019963762573975402, 'samples': 1067712, 'steps': 2085, 'loss/train': 2.6989550590515137} -09/20/2021 21:42:53 - INFO - __main__ - Step 33367: {'lr': 0.00019963762573975402, 'samples': 1067744, 'steps': 2085, 'loss/train': 1.6634786128997803} -09/20/2021 21:42:54 - INFO - __main__ - Step 33368: {'lr': 0.00019963762573975402, 'samples': 1067776, 'steps': 2085, 'loss/train': 0.49233436584472656} -09/20/2021 21:42:55 - INFO - __main__ - Step 33369: {'lr': 0.00019963762573975402, 'samples': 1067808, 'steps': 2085, 'loss/train': 2.6782102584838867} -09/20/2021 21:42:56 - INFO - __main__ - Step 33370: {'lr': 0.00019963762573975402, 'samples': 1067840, 'steps': 2085, 'loss/train': 2.053982973098755} -09/20/2021 21:42:56 - INFO - __main__ - Step 33371: {'lr': 0.00019963762573975402, 'samples': 1067872, 'steps': 2085, 'loss/train': 1.862157940864563} -09/20/2021 21:42:57 - INFO - __main__ - Step 33372: {'lr': 0.00019963762573975402, 'samples': 1067904, 'steps': 2085, 'loss/train': 1.9603254795074463} -09/20/2021 21:42:58 - INFO - __main__ - Step 33373: {'lr': 0.00019963762573975402, 'samples': 1067936, 'steps': 2085, 'loss/train': 2.297600746154785} -09/20/2021 21:42:59 - INFO - __main__ - Step 33374: {'lr': 0.00019963762573975402, 'samples': 1067968, 'steps': 2085, 'loss/train': 2.73171329498291} -09/20/2021 21:42:59 - INFO - __main__ - Step 33375: {'lr': 0.00019963762573975402, 'samples': 1068000, 'steps': 2085, 'loss/train': 2.2205393314361572} -09/20/2021 21:43:00 - INFO - __main__ - Step 33376: {'lr': 0.00019963762573975402, 'samples': 1068032, 'steps': 2085, 'loss/train': 2.0306622982025146} -09/20/2021 21:43:01 - INFO - __main__ - Step 33377: {'lr': 0.00019963708298237074, 'samples': 1068064, 'steps': 2086, 'loss/train': 2.041227102279663} -09/20/2021 21:43:02 - INFO - __main__ - Step 33378: {'lr': 0.00019963708298237074, 'samples': 1068096, 'steps': 2086, 'loss/train': 2.721203327178955} -09/20/2021 21:43:03 - INFO - __main__ - Step 33379: {'lr': 0.00019963708298237074, 'samples': 1068128, 'steps': 2086, 'loss/train': 2.6275341510772705} -09/20/2021 21:43:03 - INFO - __main__ - Step 33380: {'lr': 0.00019963708298237074, 'samples': 1068160, 'steps': 2086, 'loss/train': 2.682189464569092} -09/20/2021 21:43:04 - INFO - __main__ - Step 33381: {'lr': 0.00019963708298237074, 'samples': 1068192, 'steps': 2086, 'loss/train': 2.2173938751220703} -09/20/2021 21:43:05 - INFO - __main__ - Step 33382: {'lr': 0.00019963708298237074, 'samples': 1068224, 'steps': 2086, 'loss/train': 1.6775189638137817} -09/20/2021 21:43:06 - INFO - __main__ - Step 33383: {'lr': 0.00019963708298237074, 'samples': 1068256, 'steps': 2086, 'loss/train': 2.657212257385254} -09/20/2021 21:43:06 - INFO - __main__ - Step 33384: {'lr': 0.00019963708298237074, 'samples': 1068288, 'steps': 2086, 'loss/train': 1.2043583393096924} -09/20/2021 21:43:07 - INFO - __main__ - Step 33385: {'lr': 0.00019963708298237074, 'samples': 1068320, 'steps': 2086, 'loss/train': 1.8876240253448486} -09/20/2021 21:43:08 - INFO - __main__ - Step 33386: {'lr': 0.00019963708298237074, 'samples': 1068352, 'steps': 2086, 'loss/train': 1.8960739374160767} -09/20/2021 21:43:09 - INFO - __main__ - Step 33387: {'lr': 0.00019963708298237074, 'samples': 1068384, 'steps': 2086, 'loss/train': 2.511610984802246} -09/20/2021 21:43:09 - INFO - __main__ - Step 33388: {'lr': 0.00019963708298237074, 'samples': 1068416, 'steps': 2086, 'loss/train': 2.69514799118042} -09/20/2021 21:43:10 - INFO - __main__ - Step 33389: {'lr': 0.00019963708298237074, 'samples': 1068448, 'steps': 2086, 'loss/train': 2.966568946838379} -09/20/2021 21:43:11 - INFO - __main__ - Step 33390: {'lr': 0.00019963708298237074, 'samples': 1068480, 'steps': 2086, 'loss/train': 2.8433213233947754} -09/20/2021 21:43:12 - INFO - __main__ - Step 33391: {'lr': 0.00019963708298237074, 'samples': 1068512, 'steps': 2086, 'loss/train': 2.5402557849884033} -09/20/2021 21:43:12 - INFO - __main__ - Step 33392: {'lr': 0.00019963708298237074, 'samples': 1068544, 'steps': 2086, 'loss/train': 2.605053424835205} -09/20/2021 21:43:13 - INFO - __main__ - Step 33393: {'lr': 0.00019963653981956453, 'samples': 1068576, 'steps': 2087, 'loss/train': 2.4904558658599854} -09/20/2021 21:43:14 - INFO - __main__ - Step 33394: {'lr': 0.00019963653981956453, 'samples': 1068608, 'steps': 2087, 'loss/train': 1.5890328884124756} -09/20/2021 21:43:15 - INFO - __main__ - Step 33395: {'lr': 0.00019963653981956453, 'samples': 1068640, 'steps': 2087, 'loss/train': 1.1782691478729248} -09/20/2021 21:43:15 - INFO - __main__ - Step 33396: {'lr': 0.00019963653981956453, 'samples': 1068672, 'steps': 2087, 'loss/train': 0.7917900681495667} -09/20/2021 21:43:16 - INFO - __main__ - Step 33397: {'lr': 0.00019963653981956453, 'samples': 1068704, 'steps': 2087, 'loss/train': 1.0352684259414673} -09/20/2021 21:43:17 - INFO - __main__ - Step 33398: {'lr': 0.00019963653981956453, 'samples': 1068736, 'steps': 2087, 'loss/train': 1.15253746509552} -09/20/2021 21:43:18 - INFO - __main__ - Step 33399: {'lr': 0.00019963653981956453, 'samples': 1068768, 'steps': 2087, 'loss/train': 1.1304603815078735} -09/20/2021 21:43:18 - INFO - __main__ - Step 33400: {'lr': 0.00019963653981956453, 'samples': 1068800, 'steps': 2087, 'loss/train': 0.8440987467765808} -09/20/2021 21:43:19 - INFO - __main__ - Step 33401: {'lr': 0.00019963653981956453, 'samples': 1068832, 'steps': 2087, 'loss/train': 0.7779435515403748} -09/20/2021 21:43:20 - INFO - __main__ - Step 33402: {'lr': 0.00019963653981956453, 'samples': 1068864, 'steps': 2087, 'loss/train': 0.8274372816085815} -09/20/2021 21:43:21 - INFO - __main__ - Step 33403: {'lr': 0.00019963653981956453, 'samples': 1068896, 'steps': 2087, 'loss/train': 0.9877305030822754} -09/20/2021 21:43:22 - INFO - __main__ - Step 33404: {'lr': 0.00019963653981956453, 'samples': 1068928, 'steps': 2087, 'loss/train': 2.6125473976135254} -09/20/2021 21:43:23 - INFO - __main__ - Step 33405: {'lr': 0.00019963653981956453, 'samples': 1068960, 'steps': 2087, 'loss/train': 2.8998851776123047} -09/20/2021 21:43:24 - INFO - __main__ - Step 33406: {'lr': 0.00019963653981956453, 'samples': 1068992, 'steps': 2087, 'loss/train': 2.2253921031951904} -09/20/2021 21:43:24 - INFO - __main__ - Step 33407: {'lr': 0.00019963653981956453, 'samples': 1069024, 'steps': 2087, 'loss/train': 2.192584991455078} -09/20/2021 21:43:25 - INFO - __main__ - Step 33408: {'lr': 0.00019963653981956453, 'samples': 1069056, 'steps': 2087, 'loss/train': 1.7023180723190308} -09/20/2021 21:43:26 - INFO - __main__ - Step 33409: {'lr': 0.00019963599625133767, 'samples': 1069088, 'steps': 2088, 'loss/train': 1.9365787506103516} -09/20/2021 21:43:27 - INFO - __main__ - Step 33410: {'lr': 0.00019963599625133767, 'samples': 1069120, 'steps': 2088, 'loss/train': 2.4349281787872314} -09/20/2021 21:43:27 - INFO - __main__ - Step 33411: {'lr': 0.00019963599625133767, 'samples': 1069152, 'steps': 2088, 'loss/train': 2.9168014526367188} -09/20/2021 21:43:28 - INFO - __main__ - Step 33412: {'lr': 0.00019963599625133767, 'samples': 1069184, 'steps': 2088, 'loss/train': 2.0917067527770996} -09/20/2021 21:43:29 - INFO - __main__ - Step 33413: {'lr': 0.00019963599625133767, 'samples': 1069216, 'steps': 2088, 'loss/train': 1.2218183279037476} -09/20/2021 21:43:30 - INFO - __main__ - Step 33414: {'lr': 0.00019963599625133767, 'samples': 1069248, 'steps': 2088, 'loss/train': 0.5685935020446777} -09/20/2021 21:43:30 - INFO - __main__ - Step 33415: {'lr': 0.00019963599625133767, 'samples': 1069280, 'steps': 2088, 'loss/train': 3.755021333694458} -09/20/2021 21:43:31 - INFO - __main__ - Step 33416: {'lr': 0.00019963599625133767, 'samples': 1069312, 'steps': 2088, 'loss/train': 1.4309569597244263} -09/20/2021 21:43:32 - INFO - __main__ - Step 33417: {'lr': 0.00019963599625133767, 'samples': 1069344, 'steps': 2088, 'loss/train': 1.7188093662261963} -09/20/2021 21:43:33 - INFO - __main__ - Step 33418: {'lr': 0.00019963599625133767, 'samples': 1069376, 'steps': 2088, 'loss/train': 2.406679630279541} -09/20/2021 21:43:33 - INFO - __main__ - Step 33419: {'lr': 0.00019963599625133767, 'samples': 1069408, 'steps': 2088, 'loss/train': 2.487966775894165} -09/20/2021 21:43:34 - INFO - __main__ - Step 33420: {'lr': 0.00019963599625133767, 'samples': 1069440, 'steps': 2088, 'loss/train': 2.221972703933716} -09/20/2021 21:43:35 - INFO - __main__ - Step 33421: {'lr': 0.00019963599625133767, 'samples': 1069472, 'steps': 2088, 'loss/train': 1.4025180339813232} -09/20/2021 21:43:36 - INFO - __main__ - Step 33422: {'lr': 0.00019963599625133767, 'samples': 1069504, 'steps': 2088, 'loss/train': 2.0053768157958984} -09/20/2021 21:43:36 - INFO - __main__ - Step 33423: {'lr': 0.00019963599625133767, 'samples': 1069536, 'steps': 2088, 'loss/train': 2.1210498809814453} -09/20/2021 21:43:37 - INFO - __main__ - Step 33424: {'lr': 0.00019963599625133767, 'samples': 1069568, 'steps': 2088, 'loss/train': 2.974153518676758} -09/20/2021 21:43:38 - INFO - __main__ - Step 33425: {'lr': 0.0001996354522776923, 'samples': 1069600, 'steps': 2089, 'loss/train': 2.5771517753601074} -09/20/2021 21:43:39 - INFO - __main__ - Step 33426: {'lr': 0.0001996354522776923, 'samples': 1069632, 'steps': 2089, 'loss/train': 1.8506507873535156} -09/20/2021 21:43:40 - INFO - __main__ - Step 33427: {'lr': 0.0001996354522776923, 'samples': 1069664, 'steps': 2089, 'loss/train': 2.66471791267395} -09/20/2021 21:43:40 - INFO - __main__ - Step 33428: {'lr': 0.0001996354522776923, 'samples': 1069696, 'steps': 2089, 'loss/train': 1.416107177734375} -09/20/2021 21:43:41 - INFO - __main__ - Step 33429: {'lr': 0.0001996354522776923, 'samples': 1069728, 'steps': 2089, 'loss/train': 2.0953376293182373} -09/20/2021 21:43:42 - INFO - __main__ - Step 33430: {'lr': 0.0001996354522776923, 'samples': 1069760, 'steps': 2089, 'loss/train': 2.545468807220459} -09/20/2021 21:43:43 - INFO - __main__ - Step 33431: {'lr': 0.0001996354522776923, 'samples': 1069792, 'steps': 2089, 'loss/train': 3.1556200981140137} -09/20/2021 21:43:43 - INFO - __main__ - Step 33432: {'lr': 0.0001996354522776923, 'samples': 1069824, 'steps': 2089, 'loss/train': 2.0098369121551514} -09/20/2021 21:43:44 - INFO - __main__ - Step 33433: {'lr': 0.0001996354522776923, 'samples': 1069856, 'steps': 2089, 'loss/train': 2.477916717529297} -09/20/2021 21:43:46 - INFO - __main__ - Step 33434: {'lr': 0.0001996354522776923, 'samples': 1069888, 'steps': 2089, 'loss/train': 3.6842567920684814} -09/20/2021 21:43:46 - INFO - __main__ - Step 33435: {'lr': 0.0001996354522776923, 'samples': 1069920, 'steps': 2089, 'loss/train': 1.7347708940505981} -09/20/2021 21:43:47 - INFO - __main__ - Step 33436: {'lr': 0.0001996354522776923, 'samples': 1069952, 'steps': 2089, 'loss/train': 2.0642025470733643} -09/20/2021 21:43:48 - INFO - __main__ - Step 33437: {'lr': 0.0001996354522776923, 'samples': 1069984, 'steps': 2089, 'loss/train': 1.8389251232147217} -09/20/2021 21:43:49 - INFO - __main__ - Step 33438: {'lr': 0.0001996354522776923, 'samples': 1070016, 'steps': 2089, 'loss/train': 3.5325210094451904} -09/20/2021 21:43:49 - INFO - __main__ - Step 33439: {'lr': 0.0001996354522776923, 'samples': 1070048, 'steps': 2089, 'loss/train': 2.9348385334014893} -09/20/2021 21:43:50 - INFO - __main__ - Step 33440: {'lr': 0.0001996354522776923, 'samples': 1070080, 'steps': 2089, 'loss/train': 2.8088371753692627} -09/20/2021 21:43:51 - INFO - __main__ - Step 33441: {'lr': 0.00019963490789863067, 'samples': 1070112, 'steps': 2090, 'loss/train': 1.6763836145401} -09/20/2021 21:43:52 - INFO - __main__ - Step 33442: {'lr': 0.00019963490789863067, 'samples': 1070144, 'steps': 2090, 'loss/train': 1.4599874019622803} -09/20/2021 21:43:52 - INFO - __main__ - Step 33443: {'lr': 0.00019963490789863067, 'samples': 1070176, 'steps': 2090, 'loss/train': 2.7295031547546387} -09/20/2021 21:43:53 - INFO - __main__ - Step 33444: {'lr': 0.00019963490789863067, 'samples': 1070208, 'steps': 2090, 'loss/train': 2.6207022666931152} -09/20/2021 21:43:54 - INFO - __main__ - Step 33445: {'lr': 0.00019963490789863067, 'samples': 1070240, 'steps': 2090, 'loss/train': 2.5218093395233154} -09/20/2021 21:43:55 - INFO - __main__ - Step 33446: {'lr': 0.00019963490789863067, 'samples': 1070272, 'steps': 2090, 'loss/train': 2.5509657859802246} -09/20/2021 21:43:55 - INFO - __main__ - Step 33447: {'lr': 0.00019963490789863067, 'samples': 1070304, 'steps': 2090, 'loss/train': 1.9357391595840454} -09/20/2021 21:43:56 - INFO - __main__ - Step 33448: {'lr': 0.00019963490789863067, 'samples': 1070336, 'steps': 2090, 'loss/train': 2.481879711151123} -09/20/2021 21:43:57 - INFO - __main__ - Step 33449: {'lr': 0.00019963490789863067, 'samples': 1070368, 'steps': 2090, 'loss/train': 1.69681978225708} -09/20/2021 21:43:58 - INFO - __main__ - Step 33450: {'lr': 0.00019963490789863067, 'samples': 1070400, 'steps': 2090, 'loss/train': 2.000542402267456} -09/20/2021 21:43:58 - INFO - __main__ - Step 33451: {'lr': 0.00019963490789863067, 'samples': 1070432, 'steps': 2090, 'loss/train': 2.525888681411743} -09/20/2021 21:43:59 - INFO - __main__ - Step 33452: {'lr': 0.00019963490789863067, 'samples': 1070464, 'steps': 2090, 'loss/train': 2.385969638824463} -09/20/2021 21:44:00 - INFO - __main__ - Step 33453: {'lr': 0.00019963490789863067, 'samples': 1070496, 'steps': 2090, 'loss/train': 2.473562002182007} -09/20/2021 21:44:01 - INFO - __main__ - Step 33454: {'lr': 0.00019963490789863067, 'samples': 1070528, 'steps': 2090, 'loss/train': 2.1465981006622314} -09/20/2021 21:44:01 - INFO - __main__ - Step 33455: {'lr': 0.00019963490789863067, 'samples': 1070560, 'steps': 2090, 'loss/train': 0.21363964676856995} -09/20/2021 21:44:02 - INFO - __main__ - Step 33456: {'lr': 0.00019963490789863067, 'samples': 1070592, 'steps': 2090, 'loss/train': 0.3291339576244354} -09/20/2021 21:44:03 - INFO - __main__ - Step 33457: {'lr': 0.00019963436311415498, 'samples': 1070624, 'steps': 2091, 'loss/train': 0.34136703610420227} -09/20/2021 21:44:04 - INFO - __main__ - Step 33458: {'lr': 0.00019963436311415498, 'samples': 1070656, 'steps': 2091, 'loss/train': 1.0012235641479492} -09/20/2021 21:44:05 - INFO - __main__ - Step 33459: {'lr': 0.00019963436311415498, 'samples': 1070688, 'steps': 2091, 'loss/train': 2.3818044662475586} -09/20/2021 21:44:05 - INFO - __main__ - Step 33460: {'lr': 0.00019963436311415498, 'samples': 1070720, 'steps': 2091, 'loss/train': 3.3358943462371826} -09/20/2021 21:44:06 - INFO - __main__ - Step 33461: {'lr': 0.00019963436311415498, 'samples': 1070752, 'steps': 2091, 'loss/train': 2.0003821849823} -09/20/2021 21:44:07 - INFO - __main__ - Step 33462: {'lr': 0.00019963436311415498, 'samples': 1070784, 'steps': 2091, 'loss/train': 2.278467893600464} -09/20/2021 21:44:08 - INFO - __main__ - Step 33463: {'lr': 0.00019963436311415498, 'samples': 1070816, 'steps': 2091, 'loss/train': 2.670736312866211} -09/20/2021 21:44:08 - INFO - __main__ - Step 33464: {'lr': 0.00019963436311415498, 'samples': 1070848, 'steps': 2091, 'loss/train': 2.7669336795806885} -09/20/2021 21:44:10 - INFO - __main__ - Step 33465: {'lr': 0.00019963436311415498, 'samples': 1070880, 'steps': 2091, 'loss/train': 2.1942036151885986} -09/20/2021 21:44:10 - INFO - __main__ - Step 33466: {'lr': 0.00019963436311415498, 'samples': 1070912, 'steps': 2091, 'loss/train': 2.1737773418426514} -09/20/2021 21:44:11 - INFO - __main__ - Step 33467: {'lr': 0.00019963436311415498, 'samples': 1070944, 'steps': 2091, 'loss/train': 2.4360711574554443} -09/20/2021 21:44:12 - INFO - __main__ - Step 33468: {'lr': 0.00019963436311415498, 'samples': 1070976, 'steps': 2091, 'loss/train': 3.0249760150909424} -09/20/2021 21:44:13 - INFO - __main__ - Step 33469: {'lr': 0.00019963436311415498, 'samples': 1071008, 'steps': 2091, 'loss/train': 2.331042528152466} -09/20/2021 21:44:13 - INFO - __main__ - Step 33470: {'lr': 0.00019963436311415498, 'samples': 1071040, 'steps': 2091, 'loss/train': 3.0881032943725586} -09/20/2021 21:44:14 - INFO - __main__ - Step 33471: {'lr': 0.00019963436311415498, 'samples': 1071072, 'steps': 2091, 'loss/train': 2.1176788806915283} -09/20/2021 21:44:15 - INFO - __main__ - Step 33472: {'lr': 0.00019963436311415498, 'samples': 1071104, 'steps': 2091, 'loss/train': 3.0650248527526855} -09/20/2021 21:44:16 - INFO - __main__ - Step 33473: {'lr': 0.00019963381792426746, 'samples': 1071136, 'steps': 2092, 'loss/train': 2.219815254211426} -09/20/2021 21:44:17 - INFO - __main__ - Step 33474: {'lr': 0.00019963381792426746, 'samples': 1071168, 'steps': 2092, 'loss/train': 1.6629678010940552} -09/20/2021 21:44:17 - INFO - __main__ - Step 33475: {'lr': 0.00019963381792426746, 'samples': 1071200, 'steps': 2092, 'loss/train': 1.9242101907730103} -09/20/2021 21:44:18 - INFO - __main__ - Step 33476: {'lr': 0.00019963381792426746, 'samples': 1071232, 'steps': 2092, 'loss/train': 1.7789024114608765} -09/20/2021 21:44:19 - INFO - __main__ - Step 33477: {'lr': 0.00019963381792426746, 'samples': 1071264, 'steps': 2092, 'loss/train': 2.6060872077941895} -09/20/2021 21:44:20 - INFO - __main__ - Step 33478: {'lr': 0.00019963381792426746, 'samples': 1071296, 'steps': 2092, 'loss/train': 2.8508005142211914} -09/20/2021 21:44:20 - INFO - __main__ - Step 33479: {'lr': 0.00019963381792426746, 'samples': 1071328, 'steps': 2092, 'loss/train': 2.799487590789795} -09/20/2021 21:44:21 - INFO - __main__ - Step 33480: {'lr': 0.00019963381792426746, 'samples': 1071360, 'steps': 2092, 'loss/train': 1.70408034324646} -09/20/2021 21:44:22 - INFO - __main__ - Step 33481: {'lr': 0.00019963381792426746, 'samples': 1071392, 'steps': 2092, 'loss/train': 2.1120517253875732} -09/20/2021 21:44:23 - INFO - __main__ - Step 33482: {'lr': 0.00019963381792426746, 'samples': 1071424, 'steps': 2092, 'loss/train': 2.1143815517425537} -09/20/2021 21:44:23 - INFO - __main__ - Step 33483: {'lr': 0.00019963381792426746, 'samples': 1071456, 'steps': 2092, 'loss/train': 2.1033754348754883} -09/20/2021 21:44:24 - INFO - __main__ - Step 33484: {'lr': 0.00019963381792426746, 'samples': 1071488, 'steps': 2092, 'loss/train': 2.207948923110962} -09/20/2021 21:44:25 - INFO - __main__ - Step 33485: {'lr': 0.00019963381792426746, 'samples': 1071520, 'steps': 2092, 'loss/train': 2.682223320007324} -09/20/2021 21:44:26 - INFO - __main__ - Step 33486: {'lr': 0.00019963381792426746, 'samples': 1071552, 'steps': 2092, 'loss/train': 2.360029935836792} -09/20/2021 21:44:26 - INFO - __main__ - Step 33487: {'lr': 0.00019963381792426746, 'samples': 1071584, 'steps': 2092, 'loss/train': 2.7891366481781006} -09/20/2021 21:44:27 - INFO - __main__ - Step 33488: {'lr': 0.00019963381792426746, 'samples': 1071616, 'steps': 2092, 'loss/train': 2.43389630317688} -09/20/2021 21:44:28 - INFO - __main__ - Step 33489: {'lr': 0.0001996332723289703, 'samples': 1071648, 'steps': 2093, 'loss/train': 2.063889980316162} -09/20/2021 21:44:29 - INFO - __main__ - Step 33490: {'lr': 0.0001996332723289703, 'samples': 1071680, 'steps': 2093, 'loss/train': 2.7878053188323975} -09/20/2021 21:44:29 - INFO - __main__ - Step 33491: {'lr': 0.0001996332723289703, 'samples': 1071712, 'steps': 2093, 'loss/train': 1.9422005414962769} -09/20/2021 21:44:30 - INFO - __main__ - Step 33492: {'lr': 0.0001996332723289703, 'samples': 1071744, 'steps': 2093, 'loss/train': 2.6730096340179443} -09/20/2021 21:44:31 - INFO - __main__ - Step 33493: {'lr': 0.0001996332723289703, 'samples': 1071776, 'steps': 2093, 'loss/train': 1.5108381509780884} -09/20/2021 21:44:32 - INFO - __main__ - Step 33494: {'lr': 0.0001996332723289703, 'samples': 1071808, 'steps': 2093, 'loss/train': 1.8691487312316895} -09/20/2021 21:44:32 - INFO - __main__ - Step 33495: {'lr': 0.0001996332723289703, 'samples': 1071840, 'steps': 2093, 'loss/train': 2.3559463024139404} -09/20/2021 21:44:33 - INFO - __main__ - Step 33496: {'lr': 0.0001996332723289703, 'samples': 1071872, 'steps': 2093, 'loss/train': 2.166924476623535} -09/20/2021 21:44:34 - INFO - __main__ - Step 33497: {'lr': 0.0001996332723289703, 'samples': 1071904, 'steps': 2093, 'loss/train': 2.506956100463867} -09/20/2021 21:44:36 - INFO - __main__ - Step 33498: {'lr': 0.0001996332723289703, 'samples': 1071936, 'steps': 2093, 'loss/train': 2.477727174758911} -09/20/2021 21:44:37 - INFO - __main__ - Step 33499: {'lr': 0.0001996332723289703, 'samples': 1071968, 'steps': 2093, 'loss/train': 1.8680557012557983} -09/20/2021 21:44:38 - INFO - __main__ - Step 33500: {'lr': 0.0001996332723289703, 'samples': 1072000, 'steps': 2093, 'loss/train': 2.601407766342163} -09/20/2021 21:44:38 - INFO - __main__ - Step 33501: {'lr': 0.0001996332723289703, 'samples': 1072032, 'steps': 2093, 'loss/train': 2.875781774520874} -09/20/2021 21:44:39 - INFO - __main__ - Step 33502: {'lr': 0.0001996332723289703, 'samples': 1072064, 'steps': 2093, 'loss/train': 2.148470401763916} -09/20/2021 21:44:40 - INFO - __main__ - Step 33503: {'lr': 0.0001996332723289703, 'samples': 1072096, 'steps': 2093, 'loss/train': 2.802624225616455} -09/20/2021 21:44:41 - INFO - __main__ - Step 33504: {'lr': 0.0001996332723289703, 'samples': 1072128, 'steps': 2093, 'loss/train': 2.5918309688568115} -09/20/2021 21:44:41 - INFO - __main__ - Step 33505: {'lr': 0.00019963272632826578, 'samples': 1072160, 'steps': 2094, 'loss/train': 1.3015925884246826} -09/20/2021 21:44:42 - INFO - __main__ - Step 33506: {'lr': 0.00019963272632826578, 'samples': 1072192, 'steps': 2094, 'loss/train': 2.0681636333465576} -09/20/2021 21:44:43 - INFO - __main__ - Step 33507: {'lr': 0.00019963272632826578, 'samples': 1072224, 'steps': 2094, 'loss/train': 1.735048532485962} -09/20/2021 21:44:44 - INFO - __main__ - Step 33508: {'lr': 0.00019963272632826578, 'samples': 1072256, 'steps': 2094, 'loss/train': 2.002897024154663} -09/20/2021 21:44:44 - INFO - __main__ - Step 33509: {'lr': 0.00019963272632826578, 'samples': 1072288, 'steps': 2094, 'loss/train': 2.3653643131256104} -09/20/2021 21:44:45 - INFO - __main__ - Step 33510: {'lr': 0.00019963272632826578, 'samples': 1072320, 'steps': 2094, 'loss/train': 1.8765615224838257} -09/20/2021 21:44:46 - INFO - __main__ - Step 33511: {'lr': 0.00019963272632826578, 'samples': 1072352, 'steps': 2094, 'loss/train': 1.9666050672531128} -09/20/2021 21:44:47 - INFO - __main__ - Step 33512: {'lr': 0.00019963272632826578, 'samples': 1072384, 'steps': 2094, 'loss/train': 1.8627790212631226} -09/20/2021 21:44:47 - INFO - __main__ - Step 33513: {'lr': 0.00019963272632826578, 'samples': 1072416, 'steps': 2094, 'loss/train': 2.5764565467834473} -09/20/2021 21:44:48 - INFO - __main__ - Step 33514: {'lr': 0.00019963272632826578, 'samples': 1072448, 'steps': 2094, 'loss/train': 1.9228838682174683} -09/20/2021 21:44:49 - INFO - __main__ - Step 33515: {'lr': 0.00019963272632826578, 'samples': 1072480, 'steps': 2094, 'loss/train': 2.2665181159973145} -09/20/2021 21:44:50 - INFO - __main__ - Step 33516: {'lr': 0.00019963272632826578, 'samples': 1072512, 'steps': 2094, 'loss/train': 2.7278594970703125} -09/20/2021 21:44:50 - INFO - __main__ - Step 33517: {'lr': 0.00019963272632826578, 'samples': 1072544, 'steps': 2094, 'loss/train': 2.497103452682495} -09/20/2021 21:44:51 - INFO - __main__ - Step 33518: {'lr': 0.00019963272632826578, 'samples': 1072576, 'steps': 2094, 'loss/train': 2.729844570159912} -09/20/2021 21:44:52 - INFO - __main__ - Step 33519: {'lr': 0.00019963272632826578, 'samples': 1072608, 'steps': 2094, 'loss/train': 2.1897923946380615} -09/20/2021 21:44:53 - INFO - __main__ - Step 33520: {'lr': 0.00019963272632826578, 'samples': 1072640, 'steps': 2094, 'loss/train': 2.5893735885620117} -09/20/2021 21:44:54 - INFO - __main__ - Step 33521: {'lr': 0.00019963217992215605, 'samples': 1072672, 'steps': 2095, 'loss/train': 2.6159274578094482} -09/20/2021 21:44:54 - INFO - __main__ - Step 33522: {'lr': 0.00019963217992215605, 'samples': 1072704, 'steps': 2095, 'loss/train': 2.4272592067718506} -09/20/2021 21:44:55 - INFO - __main__ - Step 33523: {'lr': 0.00019963217992215605, 'samples': 1072736, 'steps': 2095, 'loss/train': 1.599061369895935} -09/20/2021 21:44:56 - INFO - __main__ - Step 33524: {'lr': 0.00019963217992215605, 'samples': 1072768, 'steps': 2095, 'loss/train': 1.9709731340408325} -09/20/2021 21:44:57 - INFO - __main__ - Step 33525: {'lr': 0.00019963217992215605, 'samples': 1072800, 'steps': 2095, 'loss/train': 1.926536202430725} -09/20/2021 21:44:57 - INFO - __main__ - Step 33526: {'lr': 0.00019963217992215605, 'samples': 1072832, 'steps': 2095, 'loss/train': 2.846459150314331} -09/20/2021 21:44:58 - INFO - __main__ - Step 33527: {'lr': 0.00019963217992215605, 'samples': 1072864, 'steps': 2095, 'loss/train': 3.1401748657226562} -09/20/2021 21:44:59 - INFO - __main__ - Step 33528: {'lr': 0.00019963217992215605, 'samples': 1072896, 'steps': 2095, 'loss/train': 3.1235880851745605} -09/20/2021 21:45:00 - INFO - __main__ - Step 33529: {'lr': 0.00019963217992215605, 'samples': 1072928, 'steps': 2095, 'loss/train': 3.133319616317749} -09/20/2021 21:45:00 - INFO - __main__ - Step 33530: {'lr': 0.00019963217992215605, 'samples': 1072960, 'steps': 2095, 'loss/train': 3.183101177215576} -09/20/2021 21:45:01 - INFO - __main__ - Step 33531: {'lr': 0.00019963217992215605, 'samples': 1072992, 'steps': 2095, 'loss/train': 3.158604621887207} -09/20/2021 21:45:02 - INFO - __main__ - Step 33532: {'lr': 0.00019963217992215605, 'samples': 1073024, 'steps': 2095, 'loss/train': 3.1065971851348877} -09/20/2021 21:45:03 - INFO - __main__ - Step 33533: {'lr': 0.00019963217992215605, 'samples': 1073056, 'steps': 2095, 'loss/train': 3.144730567932129} -09/20/2021 21:45:03 - INFO - __main__ - Step 33534: {'lr': 0.00019963217992215605, 'samples': 1073088, 'steps': 2095, 'loss/train': 3.2101476192474365} -09/20/2021 21:45:04 - INFO - __main__ - Step 33535: {'lr': 0.00019963217992215605, 'samples': 1073120, 'steps': 2095, 'loss/train': 3.1537163257598877} -09/20/2021 21:45:05 - INFO - __main__ - Step 33536: {'lr': 0.00019963217992215605, 'samples': 1073152, 'steps': 2095, 'loss/train': 3.1458113193511963} -09/20/2021 21:45:06 - INFO - __main__ - Step 33537: {'lr': 0.0001996316331106434, 'samples': 1073184, 'steps': 2096, 'loss/train': 2.327214241027832} -09/20/2021 21:45:06 - INFO - __main__ - Step 33538: {'lr': 0.0001996316331106434, 'samples': 1073216, 'steps': 2096, 'loss/train': 2.296952247619629} -09/20/2021 21:45:07 - INFO - __main__ - Step 33539: {'lr': 0.0001996316331106434, 'samples': 1073248, 'steps': 2096, 'loss/train': 2.276921272277832} -09/20/2021 21:45:08 - INFO - __main__ - Step 33540: {'lr': 0.0001996316331106434, 'samples': 1073280, 'steps': 2096, 'loss/train': 2.2255678176879883} -09/20/2021 21:45:09 - INFO - __main__ - Step 33541: {'lr': 0.0001996316331106434, 'samples': 1073312, 'steps': 2096, 'loss/train': 2.290581464767456} -09/20/2021 21:45:10 - INFO - __main__ - Step 33542: {'lr': 0.0001996316331106434, 'samples': 1073344, 'steps': 2096, 'loss/train': 2.2134687900543213} -09/20/2021 21:45:11 - INFO - __main__ - Step 33543: {'lr': 0.0001996316331106434, 'samples': 1073376, 'steps': 2096, 'loss/train': 2.072082757949829} -09/20/2021 21:45:11 - INFO - __main__ - Step 33544: {'lr': 0.0001996316331106434, 'samples': 1073408, 'steps': 2096, 'loss/train': 1.6959846019744873} -09/20/2021 21:45:12 - INFO - __main__ - Step 33545: {'lr': 0.0001996316331106434, 'samples': 1073440, 'steps': 2096, 'loss/train': 2.306936502456665} -09/20/2021 21:45:13 - INFO - __main__ - Step 33546: {'lr': 0.0001996316331106434, 'samples': 1073472, 'steps': 2096, 'loss/train': 1.9034982919692993} -09/20/2021 21:45:14 - INFO - __main__ - Step 33547: {'lr': 0.0001996316331106434, 'samples': 1073504, 'steps': 2096, 'loss/train': 1.6921693086624146} -09/20/2021 21:45:14 - INFO - __main__ - Step 33548: {'lr': 0.0001996316331106434, 'samples': 1073536, 'steps': 2096, 'loss/train': 2.082261323928833} -09/20/2021 21:45:15 - INFO - __main__ - Step 33549: {'lr': 0.0001996316331106434, 'samples': 1073568, 'steps': 2096, 'loss/train': 2.410766124725342} -09/20/2021 21:45:16 - INFO - __main__ - Step 33550: {'lr': 0.0001996316331106434, 'samples': 1073600, 'steps': 2096, 'loss/train': 3.09295654296875} -09/20/2021 21:45:17 - INFO - __main__ - Step 33551: {'lr': 0.0001996316331106434, 'samples': 1073632, 'steps': 2096, 'loss/train': 2.7872538566589355} -09/20/2021 21:45:17 - INFO - __main__ - Step 33552: {'lr': 0.0001996316331106434, 'samples': 1073664, 'steps': 2096, 'loss/train': 2.4192309379577637} -09/20/2021 21:45:18 - INFO - __main__ - Step 33553: {'lr': 0.00019963108589372998, 'samples': 1073696, 'steps': 2097, 'loss/train': 2.5266640186309814} -09/20/2021 21:45:19 - INFO - __main__ - Step 33554: {'lr': 0.00019963108589372998, 'samples': 1073728, 'steps': 2097, 'loss/train': 2.013242721557617} -09/20/2021 21:45:20 - INFO - __main__ - Step 33555: {'lr': 0.00019963108589372998, 'samples': 1073760, 'steps': 2097, 'loss/train': 1.6979445219039917} -09/20/2021 21:45:21 - INFO - __main__ - Step 33556: {'lr': 0.00019963108589372998, 'samples': 1073792, 'steps': 2097, 'loss/train': 1.9100677967071533} -09/20/2021 21:45:21 - INFO - __main__ - Step 33557: {'lr': 0.00019963108589372998, 'samples': 1073824, 'steps': 2097, 'loss/train': 1.088929533958435} -09/20/2021 21:45:22 - INFO - __main__ - Step 33558: {'lr': 0.00019963108589372998, 'samples': 1073856, 'steps': 2097, 'loss/train': 3.0605087280273438} -09/20/2021 21:45:23 - INFO - __main__ - Step 33559: {'lr': 0.00019963108589372998, 'samples': 1073888, 'steps': 2097, 'loss/train': 2.5106875896453857} -09/20/2021 21:45:24 - INFO - __main__ - Step 33560: {'lr': 0.00019963108589372998, 'samples': 1073920, 'steps': 2097, 'loss/train': 3.1902902126312256} -09/20/2021 21:45:24 - INFO - __main__ - Step 33561: {'lr': 0.00019963108589372998, 'samples': 1073952, 'steps': 2097, 'loss/train': 2.844027280807495} -09/20/2021 21:45:25 - INFO - __main__ - Step 33562: {'lr': 0.00019963108589372998, 'samples': 1073984, 'steps': 2097, 'loss/train': 1.910648226737976} -09/20/2021 21:45:26 - INFO - __main__ - Step 33563: {'lr': 0.00019963108589372998, 'samples': 1074016, 'steps': 2097, 'loss/train': 3.0300981998443604} -09/20/2021 21:45:27 - INFO - __main__ - Step 33564: {'lr': 0.00019963108589372998, 'samples': 1074048, 'steps': 2097, 'loss/train': 2.4275383949279785} -09/20/2021 21:45:27 - INFO - __main__ - Step 33565: {'lr': 0.00019963108589372998, 'samples': 1074080, 'steps': 2097, 'loss/train': 2.296717405319214} -09/20/2021 21:45:28 - INFO - __main__ - Step 33566: {'lr': 0.00019963108589372998, 'samples': 1074112, 'steps': 2097, 'loss/train': 2.0989105701446533} -09/20/2021 21:45:29 - INFO - __main__ - Step 33567: {'lr': 0.00019963108589372998, 'samples': 1074144, 'steps': 2097, 'loss/train': 2.3978638648986816} -09/20/2021 21:45:30 - INFO - __main__ - Step 33568: {'lr': 0.00019963108589372998, 'samples': 1074176, 'steps': 2097, 'loss/train': 1.7380107641220093} -09/20/2021 21:45:31 - INFO - __main__ - Step 33569: {'lr': 0.0001996305382714181, 'samples': 1074208, 'steps': 2098, 'loss/train': 2.4788806438446045} -09/20/2021 21:45:31 - INFO - __main__ - Step 33570: {'lr': 0.0001996305382714181, 'samples': 1074240, 'steps': 2098, 'loss/train': 1.2490557432174683} -09/20/2021 21:45:33 - INFO - __main__ - Step 33571: {'lr': 0.0001996305382714181, 'samples': 1074272, 'steps': 2098, 'loss/train': 2.0324437618255615} -09/20/2021 21:45:34 - INFO - __main__ - Step 33572: {'lr': 0.0001996305382714181, 'samples': 1074304, 'steps': 2098, 'loss/train': 1.8290148973464966} -09/20/2021 21:45:35 - INFO - __main__ - Step 33573: {'lr': 0.0001996305382714181, 'samples': 1074336, 'steps': 2098, 'loss/train': 1.5012595653533936} -09/20/2021 21:45:35 - INFO - __main__ - Step 33574: {'lr': 0.0001996305382714181, 'samples': 1074368, 'steps': 2098, 'loss/train': 3.0099551677703857} -09/20/2021 21:45:36 - INFO - __main__ - Step 33575: {'lr': 0.0001996305382714181, 'samples': 1074400, 'steps': 2098, 'loss/train': 1.9858628511428833} -09/20/2021 21:45:37 - INFO - __main__ - Step 33576: {'lr': 0.0001996305382714181, 'samples': 1074432, 'steps': 2098, 'loss/train': 2.02758526802063} -09/20/2021 21:45:38 - INFO - __main__ - Step 33577: {'lr': 0.0001996305382714181, 'samples': 1074464, 'steps': 2098, 'loss/train': 1.6550506353378296} -09/20/2021 21:45:38 - INFO - __main__ - Step 33578: {'lr': 0.0001996305382714181, 'samples': 1074496, 'steps': 2098, 'loss/train': 3.054901599884033} -09/20/2021 21:45:39 - INFO - __main__ - Step 33579: {'lr': 0.0001996305382714181, 'samples': 1074528, 'steps': 2098, 'loss/train': 2.3966362476348877} -09/20/2021 21:45:40 - INFO - __main__ - Step 33580: {'lr': 0.0001996305382714181, 'samples': 1074560, 'steps': 2098, 'loss/train': 2.966503858566284} -09/20/2021 21:45:41 - INFO - __main__ - Step 33581: {'lr': 0.0001996305382714181, 'samples': 1074592, 'steps': 2098, 'loss/train': 3.0450875759124756} -09/20/2021 21:45:41 - INFO - __main__ - Step 33582: {'lr': 0.0001996305382714181, 'samples': 1074624, 'steps': 2098, 'loss/train': 2.6588945388793945} -09/20/2021 21:45:42 - INFO - __main__ - Step 33583: {'lr': 0.0001996305382714181, 'samples': 1074656, 'steps': 2098, 'loss/train': 2.8261959552764893} -09/20/2021 21:45:43 - INFO - __main__ - Step 33584: {'lr': 0.0001996305382714181, 'samples': 1074688, 'steps': 2098, 'loss/train': 2.9719624519348145} -09/20/2021 21:45:44 - INFO - __main__ - Step 33585: {'lr': 0.00019962999024370992, 'samples': 1074720, 'steps': 2099, 'loss/train': 2.556633949279785} -09/20/2021 21:45:44 - INFO - __main__ - Step 33586: {'lr': 0.00019962999024370992, 'samples': 1074752, 'steps': 2099, 'loss/train': 2.018152952194214} -09/20/2021 21:45:45 - INFO - __main__ - Step 33587: {'lr': 0.00019962999024370992, 'samples': 1074784, 'steps': 2099, 'loss/train': 1.8540027141571045} -09/20/2021 21:45:46 - INFO - __main__ - Step 33588: {'lr': 0.00019962999024370992, 'samples': 1074816, 'steps': 2099, 'loss/train': 2.469108819961548} -09/20/2021 21:45:47 - INFO - __main__ - Step 33589: {'lr': 0.00019962999024370992, 'samples': 1074848, 'steps': 2099, 'loss/train': 2.0910732746124268} -09/20/2021 21:45:47 - INFO - __main__ - Step 33590: {'lr': 0.00019962999024370992, 'samples': 1074880, 'steps': 2099, 'loss/train': 3.5215365886688232} -09/20/2021 21:45:48 - INFO - __main__ - Step 33591: {'lr': 0.00019962999024370992, 'samples': 1074912, 'steps': 2099, 'loss/train': 3.5120201110839844} -09/20/2021 21:45:49 - INFO - __main__ - Step 33592: {'lr': 0.00019962999024370992, 'samples': 1074944, 'steps': 2099, 'loss/train': 2.3251867294311523} -09/20/2021 21:45:50 - INFO - __main__ - Step 33593: {'lr': 0.00019962999024370992, 'samples': 1074976, 'steps': 2099, 'loss/train': 2.5380401611328125} -09/20/2021 21:45:50 - INFO - __main__ - Step 33594: {'lr': 0.00019962999024370992, 'samples': 1075008, 'steps': 2099, 'loss/train': 1.57414710521698} -09/20/2021 21:45:51 - INFO - __main__ - Step 33595: {'lr': 0.00019962999024370992, 'samples': 1075040, 'steps': 2099, 'loss/train': 0.8569216132164001} -09/20/2021 21:45:52 - INFO - __main__ - Step 33596: {'lr': 0.00019962999024370992, 'samples': 1075072, 'steps': 2099, 'loss/train': 3.1411285400390625} -09/20/2021 21:45:53 - INFO - __main__ - Step 33597: {'lr': 0.00019962999024370992, 'samples': 1075104, 'steps': 2099, 'loss/train': 2.4833667278289795} -09/20/2021 21:45:53 - INFO - __main__ - Step 33598: {'lr': 0.00019962999024370992, 'samples': 1075136, 'steps': 2099, 'loss/train': 2.5103893280029297} -09/20/2021 21:45:54 - INFO - __main__ - Step 33599: {'lr': 0.00019962999024370992, 'samples': 1075168, 'steps': 2099, 'loss/train': 2.277182102203369} -09/20/2021 21:45:55 - INFO - __main__ - Step 33600: {'lr': 0.00019962999024370992, 'samples': 1075200, 'steps': 2099, 'loss/train': 2.111945867538452} -09/20/2021 21:45:56 - INFO - __main__ - Step 33601: {'lr': 0.0001996294418106077, 'samples': 1075232, 'steps': 2100, 'loss/train': 2.768975019454956} -09/20/2021 21:45:57 - INFO - __main__ - Step 33602: {'lr': 0.0001996294418106077, 'samples': 1075264, 'steps': 2100, 'loss/train': 2.2735025882720947} -09/20/2021 21:45:58 - INFO - __main__ - Step 33603: {'lr': 0.0001996294418106077, 'samples': 1075296, 'steps': 2100, 'loss/train': 1.977011799812317} -09/20/2021 21:45:59 - INFO - __main__ - Step 33604: {'lr': 0.0001996294418106077, 'samples': 1075328, 'steps': 2100, 'loss/train': 2.328852415084839} -09/20/2021 21:45:59 - INFO - __main__ - Step 33605: {'lr': 0.0001996294418106077, 'samples': 1075360, 'steps': 2100, 'loss/train': 1.786572813987732} -09/20/2021 21:46:00 - INFO - __main__ - Step 33606: {'lr': 0.0001996294418106077, 'samples': 1075392, 'steps': 2100, 'loss/train': 1.5223697423934937} -09/20/2021 21:46:01 - INFO - __main__ - Step 33607: {'lr': 0.0001996294418106077, 'samples': 1075424, 'steps': 2100, 'loss/train': 2.5903232097625732} -09/20/2021 21:46:02 - INFO - __main__ - Step 33608: {'lr': 0.0001996294418106077, 'samples': 1075456, 'steps': 2100, 'loss/train': 4.633582592010498} -09/20/2021 21:46:02 - INFO - __main__ - Step 33609: {'lr': 0.0001996294418106077, 'samples': 1075488, 'steps': 2100, 'loss/train': 2.899294376373291} -09/20/2021 21:46:03 - INFO - __main__ - Step 33610: {'lr': 0.0001996294418106077, 'samples': 1075520, 'steps': 2100, 'loss/train': 2.584580659866333} -09/20/2021 21:46:04 - INFO - __main__ - Step 33611: {'lr': 0.0001996294418106077, 'samples': 1075552, 'steps': 2100, 'loss/train': 2.3844621181488037} -09/20/2021 21:46:05 - INFO - __main__ - Step 33612: {'lr': 0.0001996294418106077, 'samples': 1075584, 'steps': 2100, 'loss/train': 2.2727842330932617} -09/20/2021 21:46:05 - INFO - __main__ - Step 33613: {'lr': 0.0001996294418106077, 'samples': 1075616, 'steps': 2100, 'loss/train': 2.415778160095215} -09/20/2021 21:46:06 - INFO - __main__ - Step 33614: {'lr': 0.0001996294418106077, 'samples': 1075648, 'steps': 2100, 'loss/train': 2.521451473236084} -09/20/2021 21:46:07 - INFO - __main__ - Step 33615: {'lr': 0.0001996294418106077, 'samples': 1075680, 'steps': 2100, 'loss/train': 1.3378576040267944} -09/20/2021 21:46:08 - INFO - __main__ - Step 33616: {'lr': 0.0001996294418106077, 'samples': 1075712, 'steps': 2100, 'loss/train': 2.497791051864624} -09/20/2021 21:46:08 - INFO - __main__ - Step 33617: {'lr': 0.00019962889297211366, 'samples': 1075744, 'steps': 2101, 'loss/train': 2.2751588821411133} -09/20/2021 21:46:09 - INFO - __main__ - Step 33618: {'lr': 0.00019962889297211366, 'samples': 1075776, 'steps': 2101, 'loss/train': 1.8970146179199219} -09/20/2021 21:46:10 - INFO - __main__ - Step 33619: {'lr': 0.00019962889297211366, 'samples': 1075808, 'steps': 2101, 'loss/train': 6.210023403167725} -09/20/2021 21:46:11 - INFO - __main__ - Step 33620: {'lr': 0.00019962889297211366, 'samples': 1075840, 'steps': 2101, 'loss/train': 5.233482837677002} -09/20/2021 21:46:11 - INFO - __main__ - Step 33621: {'lr': 0.00019962889297211366, 'samples': 1075872, 'steps': 2101, 'loss/train': 2.778064012527466} -09/20/2021 21:46:12 - INFO - __main__ - Step 33622: {'lr': 0.00019962889297211366, 'samples': 1075904, 'steps': 2101, 'loss/train': 2.3690247535705566} -09/20/2021 21:46:13 - INFO - __main__ - Step 33623: {'lr': 0.00019962889297211366, 'samples': 1075936, 'steps': 2101, 'loss/train': 2.3971431255340576} -09/20/2021 21:46:14 - INFO - __main__ - Step 33624: {'lr': 0.00019962889297211366, 'samples': 1075968, 'steps': 2101, 'loss/train': 1.7584357261657715} -09/20/2021 21:46:14 - INFO - __main__ - Step 33625: {'lr': 0.00019962889297211366, 'samples': 1076000, 'steps': 2101, 'loss/train': 3.0244863033294678} -09/20/2021 21:46:15 - INFO - __main__ - Step 33626: {'lr': 0.00019962889297211366, 'samples': 1076032, 'steps': 2101, 'loss/train': 2.976297378540039} -09/20/2021 21:46:16 - INFO - __main__ - Step 33627: {'lr': 0.00019962889297211366, 'samples': 1076064, 'steps': 2101, 'loss/train': 2.2422304153442383} -09/20/2021 21:46:17 - INFO - __main__ - Step 33628: {'lr': 0.00019962889297211366, 'samples': 1076096, 'steps': 2101, 'loss/train': 1.8912595510482788} -09/20/2021 21:46:17 - INFO - __main__ - Step 33629: {'lr': 0.00019962889297211366, 'samples': 1076128, 'steps': 2101, 'loss/train': 1.7441900968551636} -09/20/2021 21:46:18 - INFO - __main__ - Step 33630: {'lr': 0.00019962889297211366, 'samples': 1076160, 'steps': 2101, 'loss/train': 0.5771347880363464} -09/20/2021 21:46:19 - INFO - __main__ - Step 33631: {'lr': 0.00019962889297211366, 'samples': 1076192, 'steps': 2101, 'loss/train': 2.4045794010162354} -09/20/2021 21:46:20 - INFO - __main__ - Step 33632: {'lr': 0.00019962889297211366, 'samples': 1076224, 'steps': 2101, 'loss/train': 2.288677453994751} -09/20/2021 21:46:21 - INFO - __main__ - Step 33633: {'lr': 0.00019962834372823008, 'samples': 1076256, 'steps': 2102, 'loss/train': 2.6532511711120605} -09/20/2021 21:46:22 - INFO - __main__ - Step 33634: {'lr': 0.00019962834372823008, 'samples': 1076288, 'steps': 2102, 'loss/train': 2.606245756149292} -09/20/2021 21:46:23 - INFO - __main__ - Step 33635: {'lr': 0.00019962834372823008, 'samples': 1076320, 'steps': 2102, 'loss/train': 3.5112855434417725} -09/20/2021 21:46:23 - INFO - __main__ - Step 33636: {'lr': 0.00019962834372823008, 'samples': 1076352, 'steps': 2102, 'loss/train': 2.5708088874816895} -09/20/2021 21:46:24 - INFO - __main__ - Step 33637: {'lr': 0.00019962834372823008, 'samples': 1076384, 'steps': 2102, 'loss/train': 2.253284215927124} -09/20/2021 21:46:25 - INFO - __main__ - Step 33638: {'lr': 0.00019962834372823008, 'samples': 1076416, 'steps': 2102, 'loss/train': 2.8013193607330322} -09/20/2021 21:46:26 - INFO - __main__ - Step 33639: {'lr': 0.00019962834372823008, 'samples': 1076448, 'steps': 2102, 'loss/train': 0.4627333879470825} -09/20/2021 21:46:26 - INFO - __main__ - Step 33640: {'lr': 0.00019962834372823008, 'samples': 1076480, 'steps': 2102, 'loss/train': 2.0149993896484375} -09/20/2021 21:46:27 - INFO - __main__ - Step 33641: {'lr': 0.00019962834372823008, 'samples': 1076512, 'steps': 2102, 'loss/train': 2.4576447010040283} -09/20/2021 21:46:28 - INFO - __main__ - Step 33642: {'lr': 0.00019962834372823008, 'samples': 1076544, 'steps': 2102, 'loss/train': 3.343449354171753} -09/20/2021 21:46:29 - INFO - __main__ - Step 33643: {'lr': 0.00019962834372823008, 'samples': 1076576, 'steps': 2102, 'loss/train': 2.143224000930786} -09/20/2021 21:46:29 - INFO - __main__ - Step 33644: {'lr': 0.00019962834372823008, 'samples': 1076608, 'steps': 2102, 'loss/train': 3.181976318359375} -09/20/2021 21:46:30 - INFO - __main__ - Step 33645: {'lr': 0.00019962834372823008, 'samples': 1076640, 'steps': 2102, 'loss/train': 2.1756982803344727} -09/20/2021 21:46:31 - INFO - __main__ - Step 33646: {'lr': 0.00019962834372823008, 'samples': 1076672, 'steps': 2102, 'loss/train': 1.7254350185394287} -09/20/2021 21:46:32 - INFO - __main__ - Step 33647: {'lr': 0.00019962834372823008, 'samples': 1076704, 'steps': 2102, 'loss/train': 3.421010971069336} -09/20/2021 21:46:32 - INFO - __main__ - Step 33648: {'lr': 0.00019962834372823008, 'samples': 1076736, 'steps': 2102, 'loss/train': 1.525659441947937} -09/20/2021 21:46:33 - INFO - __main__ - Step 33649: {'lr': 0.0001996277940789591, 'samples': 1076768, 'steps': 2103, 'loss/train': 0.5191594958305359} -09/20/2021 21:46:34 - INFO - __main__ - Step 33650: {'lr': 0.0001996277940789591, 'samples': 1076800, 'steps': 2103, 'loss/train': 1.8186873197555542} -09/20/2021 21:46:35 - INFO - __main__ - Step 33651: {'lr': 0.0001996277940789591, 'samples': 1076832, 'steps': 2103, 'loss/train': 1.6238576173782349} -09/20/2021 21:46:35 - INFO - __main__ - Step 33652: {'lr': 0.0001996277940789591, 'samples': 1076864, 'steps': 2103, 'loss/train': 2.3519930839538574} -09/20/2021 21:46:36 - INFO - __main__ - Step 33653: {'lr': 0.0001996277940789591, 'samples': 1076896, 'steps': 2103, 'loss/train': 1.9606112241744995} -09/20/2021 21:46:37 - INFO - __main__ - Step 33654: {'lr': 0.0001996277940789591, 'samples': 1076928, 'steps': 2103, 'loss/train': 1.535802960395813} -09/20/2021 21:46:38 - INFO - __main__ - Step 33655: {'lr': 0.0001996277940789591, 'samples': 1076960, 'steps': 2103, 'loss/train': 1.7695680856704712} -09/20/2021 21:46:39 - INFO - __main__ - Step 33656: {'lr': 0.0001996277940789591, 'samples': 1076992, 'steps': 2103, 'loss/train': 2.855384111404419} -09/20/2021 21:46:39 - INFO - __main__ - Step 33657: {'lr': 0.0001996277940789591, 'samples': 1077024, 'steps': 2103, 'loss/train': 2.924607038497925} -09/20/2021 21:46:40 - INFO - __main__ - Step 33658: {'lr': 0.0001996277940789591, 'samples': 1077056, 'steps': 2103, 'loss/train': 2.0119147300720215} -09/20/2021 21:46:41 - INFO - __main__ - Step 33659: {'lr': 0.0001996277940789591, 'samples': 1077088, 'steps': 2103, 'loss/train': 2.129279375076294} -09/20/2021 21:46:42 - INFO - __main__ - Step 33660: {'lr': 0.0001996277940789591, 'samples': 1077120, 'steps': 2103, 'loss/train': 2.6924397945404053} -09/20/2021 21:46:42 - INFO - __main__ - Step 33661: {'lr': 0.0001996277940789591, 'samples': 1077152, 'steps': 2103, 'loss/train': 2.5106022357940674} -09/20/2021 21:46:43 - INFO - __main__ - Step 33662: {'lr': 0.0001996277940789591, 'samples': 1077184, 'steps': 2103, 'loss/train': 2.441570520401001} -09/20/2021 21:46:44 - INFO - __main__ - Step 33663: {'lr': 0.0001996277940789591, 'samples': 1077216, 'steps': 2103, 'loss/train': 2.0842559337615967} -09/20/2021 21:46:45 - INFO - __main__ - Step 33664: {'lr': 0.0001996277940789591, 'samples': 1077248, 'steps': 2103, 'loss/train': 2.4553515911102295} -09/20/2021 21:46:46 - INFO - __main__ - Step 33665: {'lr': 0.00019962724402430303, 'samples': 1077280, 'steps': 2104, 'loss/train': 1.8706482648849487} -09/20/2021 21:46:47 - INFO - __main__ - Step 33666: {'lr': 0.00019962724402430303, 'samples': 1077312, 'steps': 2104, 'loss/train': 1.8495383262634277} -09/20/2021 21:46:48 - INFO - __main__ - Step 33667: {'lr': 0.00019962724402430303, 'samples': 1077344, 'steps': 2104, 'loss/train': 0.35860031843185425} -09/20/2021 21:46:48 - INFO - __main__ - Step 33668: {'lr': 0.00019962724402430303, 'samples': 1077376, 'steps': 2104, 'loss/train': 0.26002222299575806} -09/20/2021 21:46:49 - INFO - __main__ - Step 33669: {'lr': 0.00019962724402430303, 'samples': 1077408, 'steps': 2104, 'loss/train': 0.28379449248313904} -09/20/2021 21:46:50 - INFO - __main__ - Step 33670: {'lr': 0.00019962724402430303, 'samples': 1077440, 'steps': 2104, 'loss/train': 0.24301372468471527} -09/20/2021 21:46:51 - INFO - __main__ - Step 33671: {'lr': 0.00019962724402430303, 'samples': 1077472, 'steps': 2104, 'loss/train': 1.6480121612548828} -09/20/2021 21:46:51 - INFO - __main__ - Step 33672: {'lr': 0.00019962724402430303, 'samples': 1077504, 'steps': 2104, 'loss/train': 3.1986565589904785} -09/20/2021 21:46:52 - INFO - __main__ - Step 33673: {'lr': 0.00019962724402430303, 'samples': 1077536, 'steps': 2104, 'loss/train': 1.9713717699050903} -09/20/2021 21:46:53 - INFO - __main__ - Step 33674: {'lr': 0.00019962724402430303, 'samples': 1077568, 'steps': 2104, 'loss/train': 1.912709355354309} -09/20/2021 21:46:54 - INFO - __main__ - Step 33675: {'lr': 0.00019962724402430303, 'samples': 1077600, 'steps': 2104, 'loss/train': 2.0200488567352295} -09/20/2021 21:46:54 - INFO - __main__ - Step 33676: {'lr': 0.00019962724402430303, 'samples': 1077632, 'steps': 2104, 'loss/train': 1.7249151468276978} -09/20/2021 21:46:55 - INFO - __main__ - Step 33677: {'lr': 0.00019962724402430303, 'samples': 1077664, 'steps': 2104, 'loss/train': 2.3451666831970215} -09/20/2021 21:46:56 - INFO - __main__ - Step 33678: {'lr': 0.00019962724402430303, 'samples': 1077696, 'steps': 2104, 'loss/train': 2.154266357421875} -09/20/2021 21:46:57 - INFO - __main__ - Step 33679: {'lr': 0.00019962724402430303, 'samples': 1077728, 'steps': 2104, 'loss/train': 2.1107587814331055} -09/20/2021 21:46:57 - INFO - __main__ - Step 33680: {'lr': 0.00019962724402430303, 'samples': 1077760, 'steps': 2104, 'loss/train': 2.188877820968628} -09/20/2021 21:46:58 - INFO - __main__ - Step 33681: {'lr': 0.0001996266935642641, 'samples': 1077792, 'steps': 2105, 'loss/train': 2.455789566040039} -09/20/2021 21:46:59 - INFO - __main__ - Step 33682: {'lr': 0.0001996266935642641, 'samples': 1077824, 'steps': 2105, 'loss/train': 1.8627636432647705} -09/20/2021 21:47:00 - INFO - __main__ - Step 33683: {'lr': 0.0001996266935642641, 'samples': 1077856, 'steps': 2105, 'loss/train': 1.0887449979782104} -09/20/2021 21:47:00 - INFO - __main__ - Step 33684: {'lr': 0.0001996266935642641, 'samples': 1077888, 'steps': 2105, 'loss/train': 2.787226676940918} -09/20/2021 21:47:01 - INFO - __main__ - Step 33685: {'lr': 0.0001996266935642641, 'samples': 1077920, 'steps': 2105, 'loss/train': 2.7737913131713867} -09/20/2021 21:47:02 - INFO - __main__ - Step 33686: {'lr': 0.0001996266935642641, 'samples': 1077952, 'steps': 2105, 'loss/train': 2.302419662475586} -09/20/2021 21:47:03 - INFO - __main__ - Step 33687: {'lr': 0.0001996266935642641, 'samples': 1077984, 'steps': 2105, 'loss/train': 2.2823641300201416} -09/20/2021 21:47:03 - INFO - __main__ - Step 33688: {'lr': 0.0001996266935642641, 'samples': 1078016, 'steps': 2105, 'loss/train': 2.7569777965545654} -09/20/2021 21:47:04 - INFO - __main__ - Step 33689: {'lr': 0.0001996266935642641, 'samples': 1078048, 'steps': 2105, 'loss/train': 1.911849021911621} -09/20/2021 21:47:05 - INFO - __main__ - Step 33690: {'lr': 0.0001996266935642641, 'samples': 1078080, 'steps': 2105, 'loss/train': 2.6631505489349365} -09/20/2021 21:47:06 - INFO - __main__ - Step 33691: {'lr': 0.0001996266935642641, 'samples': 1078112, 'steps': 2105, 'loss/train': 1.3642737865447998} -09/20/2021 21:47:06 - INFO - __main__ - Step 33692: {'lr': 0.0001996266935642641, 'samples': 1078144, 'steps': 2105, 'loss/train': 2.489809513092041} -09/20/2021 21:47:08 - INFO - __main__ - Step 33693: {'lr': 0.0001996266935642641, 'samples': 1078176, 'steps': 2105, 'loss/train': 2.3820199966430664} -09/20/2021 21:47:08 - INFO - __main__ - Step 33694: {'lr': 0.0001996266935642641, 'samples': 1078208, 'steps': 2105, 'loss/train': 1.5313997268676758} -09/20/2021 21:47:09 - INFO - __main__ - Step 33695: {'lr': 0.0001996266935642641, 'samples': 1078240, 'steps': 2105, 'loss/train': 2.3766136169433594} -09/20/2021 21:47:10 - INFO - __main__ - Step 33696: {'lr': 0.0001996266935642641, 'samples': 1078272, 'steps': 2105, 'loss/train': 2.10343337059021} -09/20/2021 21:47:11 - INFO - __main__ - Step 33697: {'lr': 0.00019962614269884458, 'samples': 1078304, 'steps': 2106, 'loss/train': 1.8858345746994019} -09/20/2021 21:47:12 - INFO - __main__ - Step 33698: {'lr': 0.00019962614269884458, 'samples': 1078336, 'steps': 2106, 'loss/train': 2.4679038524627686} -09/20/2021 21:47:12 - INFO - __main__ - Step 33699: {'lr': 0.00019962614269884458, 'samples': 1078368, 'steps': 2106, 'loss/train': 1.7686618566513062} -09/20/2021 21:47:13 - INFO - __main__ - Step 33700: {'lr': 0.00019962614269884458, 'samples': 1078400, 'steps': 2106, 'loss/train': 2.834331512451172} -09/20/2021 21:47:14 - INFO - __main__ - Step 33701: {'lr': 0.00019962614269884458, 'samples': 1078432, 'steps': 2106, 'loss/train': 1.1910463571548462} -09/20/2021 21:47:15 - INFO - __main__ - Step 33702: {'lr': 0.00019962614269884458, 'samples': 1078464, 'steps': 2106, 'loss/train': 2.1310582160949707} -09/20/2021 21:47:15 - INFO - __main__ - Step 33703: {'lr': 0.00019962614269884458, 'samples': 1078496, 'steps': 2106, 'loss/train': 2.5620224475860596} -09/20/2021 21:47:16 - INFO - __main__ - Step 33704: {'lr': 0.00019962614269884458, 'samples': 1078528, 'steps': 2106, 'loss/train': 2.898580312728882} -09/20/2021 21:47:17 - INFO - __main__ - Step 33705: {'lr': 0.00019962614269884458, 'samples': 1078560, 'steps': 2106, 'loss/train': 1.9745845794677734} -09/20/2021 21:47:18 - INFO - __main__ - Step 33706: {'lr': 0.00019962614269884458, 'samples': 1078592, 'steps': 2106, 'loss/train': 2.619584083557129} -09/20/2021 21:47:18 - INFO - __main__ - Step 33707: {'lr': 0.00019962614269884458, 'samples': 1078624, 'steps': 2106, 'loss/train': 2.5975964069366455} -09/20/2021 21:47:19 - INFO - __main__ - Step 33708: {'lr': 0.00019962614269884458, 'samples': 1078656, 'steps': 2106, 'loss/train': 1.9711531400680542} -09/20/2021 21:47:20 - INFO - __main__ - Step 33709: {'lr': 0.00019962614269884458, 'samples': 1078688, 'steps': 2106, 'loss/train': 2.00663423538208} -09/20/2021 21:47:21 - INFO - __main__ - Step 33710: {'lr': 0.00019962614269884458, 'samples': 1078720, 'steps': 2106, 'loss/train': 2.7333428859710693} -09/20/2021 21:47:21 - INFO - __main__ - Step 33711: {'lr': 0.00019962614269884458, 'samples': 1078752, 'steps': 2106, 'loss/train': 2.1253039836883545} -09/20/2021 21:47:22 - INFO - __main__ - Step 33712: {'lr': 0.00019962614269884458, 'samples': 1078784, 'steps': 2106, 'loss/train': 2.865365743637085} -09/20/2021 21:47:23 - INFO - __main__ - Step 33713: {'lr': 0.00019962559142804663, 'samples': 1078816, 'steps': 2107, 'loss/train': 2.556239604949951} -09/20/2021 21:47:24 - INFO - __main__ - Step 33714: {'lr': 0.00019962559142804663, 'samples': 1078848, 'steps': 2107, 'loss/train': 3.2487313747406006} -09/20/2021 21:47:24 - INFO - __main__ - Step 33715: {'lr': 0.00019962559142804663, 'samples': 1078880, 'steps': 2107, 'loss/train': 2.07494854927063} -09/20/2021 21:47:25 - INFO - __main__ - Step 33716: {'lr': 0.00019962559142804663, 'samples': 1078912, 'steps': 2107, 'loss/train': 2.4568028450012207} -09/20/2021 21:47:26 - INFO - __main__ - Step 33717: {'lr': 0.00019962559142804663, 'samples': 1078944, 'steps': 2107, 'loss/train': 2.7519733905792236} -09/20/2021 21:47:27 - INFO - __main__ - Step 33718: {'lr': 0.00019962559142804663, 'samples': 1078976, 'steps': 2107, 'loss/train': 3.0631914138793945} -09/20/2021 21:47:27 - INFO - __main__ - Step 33719: {'lr': 0.00019962559142804663, 'samples': 1079008, 'steps': 2107, 'loss/train': 1.743910789489746} -09/20/2021 21:47:28 - INFO - __main__ - Step 33720: {'lr': 0.00019962559142804663, 'samples': 1079040, 'steps': 2107, 'loss/train': 2.337998390197754} -09/20/2021 21:47:29 - INFO - __main__ - Step 33721: {'lr': 0.00019962559142804663, 'samples': 1079072, 'steps': 2107, 'loss/train': 2.9253499507904053} -09/20/2021 21:47:30 - INFO - __main__ - Step 33722: {'lr': 0.00019962559142804663, 'samples': 1079104, 'steps': 2107, 'loss/train': 1.2200759649276733} -09/20/2021 21:47:31 - INFO - __main__ - Step 33723: {'lr': 0.00019962559142804663, 'samples': 1079136, 'steps': 2107, 'loss/train': 2.7669825553894043} -09/20/2021 21:47:31 - INFO - __main__ - Step 33724: {'lr': 0.00019962559142804663, 'samples': 1079168, 'steps': 2107, 'loss/train': 1.6273562908172607} -09/20/2021 21:47:33 - INFO - __main__ - Step 33725: {'lr': 0.00019962559142804663, 'samples': 1079200, 'steps': 2107, 'loss/train': 1.6670795679092407} -09/20/2021 21:47:33 - INFO - __main__ - Step 33726: {'lr': 0.00019962559142804663, 'samples': 1079232, 'steps': 2107, 'loss/train': 2.395094871520996} -09/20/2021 21:47:34 - INFO - __main__ - Step 33727: {'lr': 0.00019962559142804663, 'samples': 1079264, 'steps': 2107, 'loss/train': 1.9588156938552856} -09/20/2021 21:47:35 - INFO - __main__ - Step 33728: {'lr': 0.00019962559142804663, 'samples': 1079296, 'steps': 2107, 'loss/train': 2.4842069149017334} -09/20/2021 21:47:36 - INFO - __main__ - Step 33729: {'lr': 0.00019962503975187252, 'samples': 1079328, 'steps': 2108, 'loss/train': 2.0461344718933105} -09/20/2021 21:47:36 - INFO - __main__ - Step 33730: {'lr': 0.00019962503975187252, 'samples': 1079360, 'steps': 2108, 'loss/train': 2.6832199096679688} -09/20/2021 21:47:37 - INFO - __main__ - Step 33731: {'lr': 0.00019962503975187252, 'samples': 1079392, 'steps': 2108, 'loss/train': 1.1841355562210083} -09/20/2021 21:47:38 - INFO - __main__ - Step 33732: {'lr': 0.00019962503975187252, 'samples': 1079424, 'steps': 2108, 'loss/train': 1.6756688356399536} -09/20/2021 21:47:39 - INFO - __main__ - Step 33733: {'lr': 0.00019962503975187252, 'samples': 1079456, 'steps': 2108, 'loss/train': 2.401244640350342} -09/20/2021 21:47:39 - INFO - __main__ - Step 33734: {'lr': 0.00019962503975187252, 'samples': 1079488, 'steps': 2108, 'loss/train': 2.1318771839141846} -09/20/2021 21:47:40 - INFO - __main__ - Step 33735: {'lr': 0.00019962503975187252, 'samples': 1079520, 'steps': 2108, 'loss/train': 1.5104738473892212} -09/20/2021 21:47:41 - INFO - __main__ - Step 33736: {'lr': 0.00019962503975187252, 'samples': 1079552, 'steps': 2108, 'loss/train': 1.7211825847625732} -09/20/2021 21:47:42 - INFO - __main__ - Step 33737: {'lr': 0.00019962503975187252, 'samples': 1079584, 'steps': 2108, 'loss/train': 1.7712193727493286} -09/20/2021 21:47:42 - INFO - __main__ - Step 33738: {'lr': 0.00019962503975187252, 'samples': 1079616, 'steps': 2108, 'loss/train': 3.154290199279785} -09/20/2021 21:47:43 - INFO - __main__ - Step 33739: {'lr': 0.00019962503975187252, 'samples': 1079648, 'steps': 2108, 'loss/train': 2.4562551975250244} -09/20/2021 21:47:44 - INFO - __main__ - Step 33740: {'lr': 0.00019962503975187252, 'samples': 1079680, 'steps': 2108, 'loss/train': 2.536557912826538} -09/20/2021 21:47:45 - INFO - __main__ - Step 33741: {'lr': 0.00019962503975187252, 'samples': 1079712, 'steps': 2108, 'loss/train': 2.495474100112915} -09/20/2021 21:47:45 - INFO - __main__ - Step 33742: {'lr': 0.00019962503975187252, 'samples': 1079744, 'steps': 2108, 'loss/train': 2.2644107341766357} -09/20/2021 21:47:46 - INFO - __main__ - Step 33743: {'lr': 0.00019962503975187252, 'samples': 1079776, 'steps': 2108, 'loss/train': 2.272484302520752} -09/20/2021 21:47:47 - INFO - __main__ - Step 33744: {'lr': 0.00019962503975187252, 'samples': 1079808, 'steps': 2108, 'loss/train': 1.7826181650161743} -09/20/2021 21:47:48 - INFO - __main__ - Step 33745: {'lr': 0.00019962448767032453, 'samples': 1079840, 'steps': 2109, 'loss/train': 1.960963487625122} -09/20/2021 21:47:49 - INFO - __main__ - Step 33746: {'lr': 0.00019962448767032453, 'samples': 1079872, 'steps': 2109, 'loss/train': 2.3005530834198} -09/20/2021 21:47:49 - INFO - __main__ - Step 33747: {'lr': 0.00019962448767032453, 'samples': 1079904, 'steps': 2109, 'loss/train': 2.446864366531372} -09/20/2021 21:47:50 - INFO - __main__ - Step 33748: {'lr': 0.00019962448767032453, 'samples': 1079936, 'steps': 2109, 'loss/train': 2.138457775115967} -09/20/2021 21:47:51 - INFO - __main__ - Step 33749: {'lr': 0.00019962448767032453, 'samples': 1079968, 'steps': 2109, 'loss/train': 2.8969905376434326} -09/20/2021 21:47:52 - INFO - __main__ - Step 33750: {'lr': 0.00019962448767032453, 'samples': 1080000, 'steps': 2109, 'loss/train': 2.2897942066192627} -09/20/2021 21:47:52 - INFO - __main__ - Step 33751: {'lr': 0.00019962448767032453, 'samples': 1080032, 'steps': 2109, 'loss/train': 2.293006658554077} -09/20/2021 21:47:53 - INFO - __main__ - Step 33752: {'lr': 0.00019962448767032453, 'samples': 1080064, 'steps': 2109, 'loss/train': 1.0882134437561035} -09/20/2021 21:47:54 - INFO - __main__ - Step 33753: {'lr': 0.00019962448767032453, 'samples': 1080096, 'steps': 2109, 'loss/train': 2.27894926071167} -09/20/2021 21:47:55 - INFO - __main__ - Step 33754: {'lr': 0.00019962448767032453, 'samples': 1080128, 'steps': 2109, 'loss/train': 2.1433346271514893} -09/20/2021 21:47:55 - INFO - __main__ - Step 33755: {'lr': 0.00019962448767032453, 'samples': 1080160, 'steps': 2109, 'loss/train': 0.7101392149925232} -09/20/2021 21:47:56 - INFO - __main__ - Step 33756: {'lr': 0.00019962448767032453, 'samples': 1080192, 'steps': 2109, 'loss/train': 2.3446333408355713} -09/20/2021 21:47:57 - INFO - __main__ - Step 33757: {'lr': 0.00019962448767032453, 'samples': 1080224, 'steps': 2109, 'loss/train': 1.6813690662384033} -09/20/2021 21:47:58 - INFO - __main__ - Step 33758: {'lr': 0.00019962448767032453, 'samples': 1080256, 'steps': 2109, 'loss/train': 3.292658567428589} -09/20/2021 21:47:59 - INFO - __main__ - Step 33759: {'lr': 0.00019962448767032453, 'samples': 1080288, 'steps': 2109, 'loss/train': 3.257110595703125} -09/20/2021 21:48:00 - INFO - __main__ - Step 33760: {'lr': 0.00019962448767032453, 'samples': 1080320, 'steps': 2109, 'loss/train': 2.9031834602355957} -09/20/2021 21:48:00 - INFO - __main__ - Step 33761: {'lr': 0.0001996239351834049, 'samples': 1080352, 'steps': 2110, 'loss/train': 2.254969835281372} -09/20/2021 21:48:01 - INFO - __main__ - Step 33762: {'lr': 0.0001996239351834049, 'samples': 1080384, 'steps': 2110, 'loss/train': 2.833890676498413} -09/20/2021 21:48:02 - INFO - __main__ - Step 33763: {'lr': 0.0001996239351834049, 'samples': 1080416, 'steps': 2110, 'loss/train': 2.5390775203704834} -09/20/2021 21:48:03 - INFO - __main__ - Step 33764: {'lr': 0.0001996239351834049, 'samples': 1080448, 'steps': 2110, 'loss/train': 3.0568904876708984} -09/20/2021 21:48:03 - INFO - __main__ - Step 33765: {'lr': 0.0001996239351834049, 'samples': 1080480, 'steps': 2110, 'loss/train': 2.380993604660034} -09/20/2021 21:48:04 - INFO - __main__ - Step 33766: {'lr': 0.0001996239351834049, 'samples': 1080512, 'steps': 2110, 'loss/train': 1.6378213167190552} -09/20/2021 21:48:05 - INFO - __main__ - Step 33767: {'lr': 0.0001996239351834049, 'samples': 1080544, 'steps': 2110, 'loss/train': 2.108475685119629} -09/20/2021 21:48:06 - INFO - __main__ - Step 33768: {'lr': 0.0001996239351834049, 'samples': 1080576, 'steps': 2110, 'loss/train': 3.2377841472625732} -09/20/2021 21:48:06 - INFO - __main__ - Step 33769: {'lr': 0.0001996239351834049, 'samples': 1080608, 'steps': 2110, 'loss/train': 2.571892261505127} -09/20/2021 21:48:07 - INFO - __main__ - Step 33770: {'lr': 0.0001996239351834049, 'samples': 1080640, 'steps': 2110, 'loss/train': 2.044365406036377} -09/20/2021 21:48:08 - INFO - __main__ - Step 33771: {'lr': 0.0001996239351834049, 'samples': 1080672, 'steps': 2110, 'loss/train': 2.602843761444092} -09/20/2021 21:48:09 - INFO - __main__ - Step 33772: {'lr': 0.0001996239351834049, 'samples': 1080704, 'steps': 2110, 'loss/train': 0.7443593740463257} -09/20/2021 21:48:09 - INFO - __main__ - Step 33773: {'lr': 0.0001996239351834049, 'samples': 1080736, 'steps': 2110, 'loss/train': 1.2460105419158936} -09/20/2021 21:48:10 - INFO - __main__ - Step 33774: {'lr': 0.0001996239351834049, 'samples': 1080768, 'steps': 2110, 'loss/train': 2.323685646057129} -09/20/2021 21:48:11 - INFO - __main__ - Step 33775: {'lr': 0.0001996239351834049, 'samples': 1080800, 'steps': 2110, 'loss/train': 1.5058566331863403} -09/20/2021 21:48:12 - INFO - __main__ - Step 33776: {'lr': 0.0001996239351834049, 'samples': 1080832, 'steps': 2110, 'loss/train': 2.7176265716552734} -09/20/2021 21:48:13 - INFO - __main__ - Step 33777: {'lr': 0.00019962338229111585, 'samples': 1080864, 'steps': 2111, 'loss/train': 1.509251356124878} -09/20/2021 21:48:13 - INFO - __main__ - Step 33778: {'lr': 0.00019962338229111585, 'samples': 1080896, 'steps': 2111, 'loss/train': 2.59928822517395} -09/20/2021 21:48:14 - INFO - __main__ - Step 33779: {'lr': 0.00019962338229111585, 'samples': 1080928, 'steps': 2111, 'loss/train': 2.234173536300659} -09/20/2021 21:48:15 - INFO - __main__ - Step 33780: {'lr': 0.00019962338229111585, 'samples': 1080960, 'steps': 2111, 'loss/train': 2.7371914386749268} -09/20/2021 21:48:16 - INFO - __main__ - Step 33781: {'lr': 0.00019962338229111585, 'samples': 1080992, 'steps': 2111, 'loss/train': 1.033416748046875} -09/20/2021 21:48:16 - INFO - __main__ - Step 33782: {'lr': 0.00019962338229111585, 'samples': 1081024, 'steps': 2111, 'loss/train': 2.5787343978881836} -09/20/2021 21:48:17 - INFO - __main__ - Step 33783: {'lr': 0.00019962338229111585, 'samples': 1081056, 'steps': 2111, 'loss/train': 1.6989903450012207} -09/20/2021 21:48:18 - INFO - __main__ - Step 33784: {'lr': 0.00019962338229111585, 'samples': 1081088, 'steps': 2111, 'loss/train': 1.6820464134216309} -09/20/2021 21:48:19 - INFO - __main__ - Step 33785: {'lr': 0.00019962338229111585, 'samples': 1081120, 'steps': 2111, 'loss/train': 2.207725763320923} -09/20/2021 21:48:19 - INFO - __main__ - Step 33786: {'lr': 0.00019962338229111585, 'samples': 1081152, 'steps': 2111, 'loss/train': 1.6058210134506226} -09/20/2021 21:48:20 - INFO - __main__ - Step 33787: {'lr': 0.00019962338229111585, 'samples': 1081184, 'steps': 2111, 'loss/train': 2.0450797080993652} -09/20/2021 21:48:21 - INFO - __main__ - Step 33788: {'lr': 0.00019962338229111585, 'samples': 1081216, 'steps': 2111, 'loss/train': 1.649716854095459} -09/20/2021 21:48:22 - INFO - __main__ - Step 33789: {'lr': 0.00019962338229111585, 'samples': 1081248, 'steps': 2111, 'loss/train': 2.1885507106781006} -09/20/2021 21:48:23 - INFO - __main__ - Step 33790: {'lr': 0.00019962338229111585, 'samples': 1081280, 'steps': 2111, 'loss/train': 1.7722361087799072} -09/20/2021 21:48:24 - INFO - __main__ - Step 33791: {'lr': 0.00019962338229111585, 'samples': 1081312, 'steps': 2111, 'loss/train': 1.9468878507614136} -09/20/2021 21:48:24 - INFO - __main__ - Step 33792: {'lr': 0.00019962338229111585, 'samples': 1081344, 'steps': 2111, 'loss/train': 1.6249572038650513} -09/20/2021 21:48:25 - INFO - __main__ - Step 33793: {'lr': 0.00019962282899345962, 'samples': 1081376, 'steps': 2112, 'loss/train': 2.482438325881958} -09/20/2021 21:48:26 - INFO - __main__ - Step 33794: {'lr': 0.00019962282899345962, 'samples': 1081408, 'steps': 2112, 'loss/train': 2.2066762447357178} -09/20/2021 21:48:27 - INFO - __main__ - Step 33795: {'lr': 0.00019962282899345962, 'samples': 1081440, 'steps': 2112, 'loss/train': 2.1317999362945557} -09/20/2021 21:48:28 - INFO - __main__ - Step 33796: {'lr': 0.00019962282899345962, 'samples': 1081472, 'steps': 2112, 'loss/train': 2.6796834468841553} -09/20/2021 21:48:28 - INFO - __main__ - Step 33797: {'lr': 0.00019962282899345962, 'samples': 1081504, 'steps': 2112, 'loss/train': 2.256753921508789} -09/20/2021 21:48:29 - INFO - __main__ - Step 33798: {'lr': 0.00019962282899345962, 'samples': 1081536, 'steps': 2112, 'loss/train': 2.1760265827178955} -09/20/2021 21:48:30 - INFO - __main__ - Step 33799: {'lr': 0.00019962282899345962, 'samples': 1081568, 'steps': 2112, 'loss/train': 2.3146462440490723} -09/20/2021 21:48:31 - INFO - __main__ - Step 33800: {'lr': 0.00019962282899345962, 'samples': 1081600, 'steps': 2112, 'loss/train': 1.161667823791504} -09/20/2021 21:48:31 - INFO - __main__ - Step 33801: {'lr': 0.00019962282899345962, 'samples': 1081632, 'steps': 2112, 'loss/train': 1.0891674757003784} -09/20/2021 21:48:32 - INFO - __main__ - Step 33802: {'lr': 0.00019962282899345962, 'samples': 1081664, 'steps': 2112, 'loss/train': 0.6109389066696167} -09/20/2021 21:48:33 - INFO - __main__ - Step 33803: {'lr': 0.00019962282899345962, 'samples': 1081696, 'steps': 2112, 'loss/train': 2.2365853786468506} -09/20/2021 21:48:34 - INFO - __main__ - Step 33804: {'lr': 0.00019962282899345962, 'samples': 1081728, 'steps': 2112, 'loss/train': 1.972330927848816} -09/20/2021 21:48:34 - INFO - __main__ - Step 33805: {'lr': 0.00019962282899345962, 'samples': 1081760, 'steps': 2112, 'loss/train': 2.044858932495117} -09/20/2021 21:48:35 - INFO - __main__ - Step 33806: {'lr': 0.00019962282899345962, 'samples': 1081792, 'steps': 2112, 'loss/train': 1.367687702178955} -09/20/2021 21:48:36 - INFO - __main__ - Step 33807: {'lr': 0.00019962282899345962, 'samples': 1081824, 'steps': 2112, 'loss/train': 1.885136604309082} -09/20/2021 21:48:37 - INFO - __main__ - Step 33808: {'lr': 0.00019962282899345962, 'samples': 1081856, 'steps': 2112, 'loss/train': 2.0405662059783936} -09/20/2021 21:48:37 - INFO - __main__ - Step 33809: {'lr': 0.0001996222752904385, 'samples': 1081888, 'steps': 2113, 'loss/train': 1.8934071063995361} -09/20/2021 21:48:38 - INFO - __main__ - Step 33810: {'lr': 0.0001996222752904385, 'samples': 1081920, 'steps': 2113, 'loss/train': 2.47637677192688} -09/20/2021 21:48:39 - INFO - __main__ - Step 33811: {'lr': 0.0001996222752904385, 'samples': 1081952, 'steps': 2113, 'loss/train': 2.0971126556396484} -09/20/2021 21:48:40 - INFO - __main__ - Step 33812: {'lr': 0.0001996222752904385, 'samples': 1081984, 'steps': 2113, 'loss/train': 2.1601932048797607} -09/20/2021 21:48:40 - INFO - __main__ - Step 33813: {'lr': 0.0001996222752904385, 'samples': 1082016, 'steps': 2113, 'loss/train': 2.2594573497772217} -09/20/2021 21:48:41 - INFO - __main__ - Step 33814: {'lr': 0.0001996222752904385, 'samples': 1082048, 'steps': 2113, 'loss/train': 2.10703444480896} -09/20/2021 21:48:42 - INFO - __main__ - Step 33815: {'lr': 0.0001996222752904385, 'samples': 1082080, 'steps': 2113, 'loss/train': 2.6487162113189697} -09/20/2021 21:48:43 - INFO - __main__ - Step 33816: {'lr': 0.0001996222752904385, 'samples': 1082112, 'steps': 2113, 'loss/train': 2.4072649478912354} -09/20/2021 21:48:43 - INFO - __main__ - Step 33817: {'lr': 0.0001996222752904385, 'samples': 1082144, 'steps': 2113, 'loss/train': 3.2166802883148193} -09/20/2021 21:48:44 - INFO - __main__ - Step 33818: {'lr': 0.0001996222752904385, 'samples': 1082176, 'steps': 2113, 'loss/train': 1.8557493686676025} -09/20/2021 21:48:45 - INFO - __main__ - Step 33819: {'lr': 0.0001996222752904385, 'samples': 1082208, 'steps': 2113, 'loss/train': 2.769594430923462} -09/20/2021 21:48:46 - INFO - __main__ - Step 33820: {'lr': 0.0001996222752904385, 'samples': 1082240, 'steps': 2113, 'loss/train': 2.773259162902832} -09/20/2021 21:48:47 - INFO - __main__ - Step 33821: {'lr': 0.0001996222752904385, 'samples': 1082272, 'steps': 2113, 'loss/train': 1.935119867324829} -09/20/2021 21:48:48 - INFO - __main__ - Step 33822: {'lr': 0.0001996222752904385, 'samples': 1082304, 'steps': 2113, 'loss/train': 0.8622580170631409} -09/20/2021 21:48:48 - INFO - __main__ - Step 33823: {'lr': 0.0001996222752904385, 'samples': 1082336, 'steps': 2113, 'loss/train': 2.959127187728882} -09/20/2021 21:48:49 - INFO - __main__ - Step 33824: {'lr': 0.0001996222752904385, 'samples': 1082368, 'steps': 2113, 'loss/train': 1.0328869819641113} -09/20/2021 21:48:50 - INFO - __main__ - Step 33825: {'lr': 0.00019962172118205475, 'samples': 1082400, 'steps': 2114, 'loss/train': 2.5300445556640625} -09/20/2021 21:48:51 - INFO - __main__ - Step 33826: {'lr': 0.00019962172118205475, 'samples': 1082432, 'steps': 2114, 'loss/train': 0.7537832260131836} -09/20/2021 21:48:52 - INFO - __main__ - Step 33827: {'lr': 0.00019962172118205475, 'samples': 1082464, 'steps': 2114, 'loss/train': 2.574127435684204} -09/20/2021 21:48:52 - INFO - __main__ - Step 33828: {'lr': 0.00019962172118205475, 'samples': 1082496, 'steps': 2114, 'loss/train': 1.3927292823791504} -09/20/2021 21:48:53 - INFO - __main__ - Step 33829: {'lr': 0.00019962172118205475, 'samples': 1082528, 'steps': 2114, 'loss/train': 3.8148105144500732} -09/20/2021 21:48:54 - INFO - __main__ - Step 33830: {'lr': 0.00019962172118205475, 'samples': 1082560, 'steps': 2114, 'loss/train': 2.6594765186309814} -09/20/2021 21:48:55 - INFO - __main__ - Step 33831: {'lr': 0.00019962172118205475, 'samples': 1082592, 'steps': 2114, 'loss/train': 2.1132681369781494} -09/20/2021 21:48:55 - INFO - __main__ - Step 33832: {'lr': 0.00019962172118205475, 'samples': 1082624, 'steps': 2114, 'loss/train': 2.1421682834625244} -09/20/2021 21:48:56 - INFO - __main__ - Step 33833: {'lr': 0.00019962172118205475, 'samples': 1082656, 'steps': 2114, 'loss/train': 2.2676045894622803} -09/20/2021 21:48:57 - INFO - __main__ - Step 33834: {'lr': 0.00019962172118205475, 'samples': 1082688, 'steps': 2114, 'loss/train': 1.8438997268676758} -09/20/2021 21:48:58 - INFO - __main__ - Step 33835: {'lr': 0.00019962172118205475, 'samples': 1082720, 'steps': 2114, 'loss/train': 2.111276865005493} -09/20/2021 21:48:58 - INFO - __main__ - Step 33836: {'lr': 0.00019962172118205475, 'samples': 1082752, 'steps': 2114, 'loss/train': 2.4444031715393066} -09/20/2021 21:48:59 - INFO - __main__ - Step 33837: {'lr': 0.00019962172118205475, 'samples': 1082784, 'steps': 2114, 'loss/train': 2.3983817100524902} -09/20/2021 21:49:00 - INFO - __main__ - Step 33838: {'lr': 0.00019962172118205475, 'samples': 1082816, 'steps': 2114, 'loss/train': 2.5852644443511963} -09/20/2021 21:49:01 - INFO - __main__ - Step 33839: {'lr': 0.00019962172118205475, 'samples': 1082848, 'steps': 2114, 'loss/train': 2.7484536170959473} -09/20/2021 21:49:01 - INFO - __main__ - Step 33840: {'lr': 0.00019962172118205475, 'samples': 1082880, 'steps': 2114, 'loss/train': 1.8662819862365723} -09/20/2021 21:49:02 - INFO - __main__ - Step 33841: {'lr': 0.00019962116666831061, 'samples': 1082912, 'steps': 2115, 'loss/train': 2.738920211791992} -09/20/2021 21:49:03 - INFO - __main__ - Step 33842: {'lr': 0.00019962116666831061, 'samples': 1082944, 'steps': 2115, 'loss/train': 2.868198871612549} -09/20/2021 21:49:04 - INFO - __main__ - Step 33843: {'lr': 0.00019962116666831061, 'samples': 1082976, 'steps': 2115, 'loss/train': 2.5807945728302} -09/20/2021 21:49:04 - INFO - __main__ - Step 33844: {'lr': 0.00019962116666831061, 'samples': 1083008, 'steps': 2115, 'loss/train': 2.4520504474639893} -09/20/2021 21:49:05 - INFO - __main__ - Step 33845: {'lr': 0.00019962116666831061, 'samples': 1083040, 'steps': 2115, 'loss/train': 1.6620599031448364} -09/20/2021 21:49:06 - INFO - __main__ - Step 33846: {'lr': 0.00019962116666831061, 'samples': 1083072, 'steps': 2115, 'loss/train': 2.783600330352783} -09/20/2021 21:49:07 - INFO - __main__ - Step 33847: {'lr': 0.00019962116666831061, 'samples': 1083104, 'steps': 2115, 'loss/train': 1.9270389080047607} -09/20/2021 21:49:08 - INFO - __main__ - Step 33848: {'lr': 0.00019962116666831061, 'samples': 1083136, 'steps': 2115, 'loss/train': 1.8173415660858154} -09/20/2021 21:49:08 - INFO - __main__ - Step 33849: {'lr': 0.00019962116666831061, 'samples': 1083168, 'steps': 2115, 'loss/train': 2.05005145072937} -09/20/2021 21:49:09 - INFO - __main__ - Step 33850: {'lr': 0.00019962116666831061, 'samples': 1083200, 'steps': 2115, 'loss/train': 1.2433615922927856} -09/20/2021 21:49:10 - INFO - __main__ - Step 33851: {'lr': 0.00019962116666831061, 'samples': 1083232, 'steps': 2115, 'loss/train': 3.280651330947876} -09/20/2021 21:49:11 - INFO - __main__ - Step 33852: {'lr': 0.00019962116666831061, 'samples': 1083264, 'steps': 2115, 'loss/train': 2.477421998977661} -09/20/2021 21:49:12 - INFO - __main__ - Step 33853: {'lr': 0.00019962116666831061, 'samples': 1083296, 'steps': 2115, 'loss/train': 2.45432710647583} -09/20/2021 21:49:13 - INFO - __main__ - Step 33854: {'lr': 0.00019962116666831061, 'samples': 1083328, 'steps': 2115, 'loss/train': 1.9586396217346191} -09/20/2021 21:49:13 - INFO - __main__ - Step 33855: {'lr': 0.00019962116666831061, 'samples': 1083360, 'steps': 2115, 'loss/train': 1.9556580781936646} -09/20/2021 21:49:14 - INFO - __main__ - Step 33856: {'lr': 0.00019962116666831061, 'samples': 1083392, 'steps': 2115, 'loss/train': 1.0291959047317505} -09/20/2021 21:49:15 - INFO - __main__ - Step 33857: {'lr': 0.00019962061174920833, 'samples': 1083424, 'steps': 2116, 'loss/train': 2.9382643699645996} -09/20/2021 21:49:16 - INFO - __main__ - Step 33858: {'lr': 0.00019962061174920833, 'samples': 1083456, 'steps': 2116, 'loss/train': 3.1535890102386475} -09/20/2021 21:49:16 - INFO - __main__ - Step 33859: {'lr': 0.00019962061174920833, 'samples': 1083488, 'steps': 2116, 'loss/train': 2.6753361225128174} -09/20/2021 21:49:17 - INFO - __main__ - Step 33860: {'lr': 0.00019962061174920833, 'samples': 1083520, 'steps': 2116, 'loss/train': 1.431762456893921} -09/20/2021 21:49:18 - INFO - __main__ - Step 33861: {'lr': 0.00019962061174920833, 'samples': 1083552, 'steps': 2116, 'loss/train': 1.982774257659912} -09/20/2021 21:49:19 - INFO - __main__ - Step 33862: {'lr': 0.00019962061174920833, 'samples': 1083584, 'steps': 2116, 'loss/train': 2.5330326557159424} -09/20/2021 21:49:19 - INFO - __main__ - Step 33863: {'lr': 0.00019962061174920833, 'samples': 1083616, 'steps': 2116, 'loss/train': 2.916041612625122} -09/20/2021 21:49:20 - INFO - __main__ - Step 33864: {'lr': 0.00019962061174920833, 'samples': 1083648, 'steps': 2116, 'loss/train': 2.125004768371582} -09/20/2021 21:49:21 - INFO - __main__ - Step 33865: {'lr': 0.00019962061174920833, 'samples': 1083680, 'steps': 2116, 'loss/train': 1.8720003366470337} -09/20/2021 21:49:22 - INFO - __main__ - Step 33866: {'lr': 0.00019962061174920833, 'samples': 1083712, 'steps': 2116, 'loss/train': 2.927121877670288} -09/20/2021 21:49:22 - INFO - __main__ - Step 33867: {'lr': 0.00019962061174920833, 'samples': 1083744, 'steps': 2116, 'loss/train': 2.898054599761963} -09/20/2021 21:49:23 - INFO - __main__ - Step 33868: {'lr': 0.00019962061174920833, 'samples': 1083776, 'steps': 2116, 'loss/train': 2.5861189365386963} -09/20/2021 21:49:24 - INFO - __main__ - Step 33869: {'lr': 0.00019962061174920833, 'samples': 1083808, 'steps': 2116, 'loss/train': 2.409850835800171} -09/20/2021 21:49:25 - INFO - __main__ - Step 33870: {'lr': 0.00019962061174920833, 'samples': 1083840, 'steps': 2116, 'loss/train': 2.2745935916900635} -09/20/2021 21:49:25 - INFO - __main__ - Step 33871: {'lr': 0.00019962061174920833, 'samples': 1083872, 'steps': 2116, 'loss/train': 2.4818859100341797} -09/20/2021 21:49:26 - INFO - __main__ - Step 33872: {'lr': 0.00019962061174920833, 'samples': 1083904, 'steps': 2116, 'loss/train': 2.0303444862365723} -09/20/2021 21:49:27 - INFO - __main__ - Step 33873: {'lr': 0.00019962005642475012, 'samples': 1083936, 'steps': 2117, 'loss/train': 2.5875749588012695} -09/20/2021 21:49:28 - INFO - __main__ - Step 33874: {'lr': 0.00019962005642475012, 'samples': 1083968, 'steps': 2117, 'loss/train': 2.8095285892486572} -09/20/2021 21:49:29 - INFO - __main__ - Step 33875: {'lr': 0.00019962005642475012, 'samples': 1084000, 'steps': 2117, 'loss/train': 2.470197916030884} -09/20/2021 21:49:29 - INFO - __main__ - Step 33876: {'lr': 0.00019962005642475012, 'samples': 1084032, 'steps': 2117, 'loss/train': 2.208906650543213} -09/20/2021 21:49:30 - INFO - __main__ - Step 33877: {'lr': 0.00019962005642475012, 'samples': 1084064, 'steps': 2117, 'loss/train': 2.6455063819885254} -09/20/2021 21:49:31 - INFO - __main__ - Step 33878: {'lr': 0.00019962005642475012, 'samples': 1084096, 'steps': 2117, 'loss/train': 2.243929862976074} -09/20/2021 21:49:32 - INFO - __main__ - Step 33879: {'lr': 0.00019962005642475012, 'samples': 1084128, 'steps': 2117, 'loss/train': 2.049407482147217} -09/20/2021 21:49:32 - INFO - __main__ - Step 33880: {'lr': 0.00019962005642475012, 'samples': 1084160, 'steps': 2117, 'loss/train': 1.8419721126556396} -09/20/2021 21:49:33 - INFO - __main__ - Step 33881: {'lr': 0.00019962005642475012, 'samples': 1084192, 'steps': 2117, 'loss/train': 2.530043601989746} -09/20/2021 21:49:34 - INFO - __main__ - Step 33882: {'lr': 0.00019962005642475012, 'samples': 1084224, 'steps': 2117, 'loss/train': 2.9634571075439453} -09/20/2021 21:49:35 - INFO - __main__ - Step 33883: {'lr': 0.00019962005642475012, 'samples': 1084256, 'steps': 2117, 'loss/train': 1.1303008794784546} -09/20/2021 21:49:36 - INFO - __main__ - Step 33884: {'lr': 0.00019962005642475012, 'samples': 1084288, 'steps': 2117, 'loss/train': 1.7218085527420044} -09/20/2021 21:49:37 - INFO - __main__ - Step 33885: {'lr': 0.00019962005642475012, 'samples': 1084320, 'steps': 2117, 'loss/train': 1.7175343036651611} -09/20/2021 21:49:37 - INFO - __main__ - Step 33886: {'lr': 0.00019962005642475012, 'samples': 1084352, 'steps': 2117, 'loss/train': 2.1181328296661377} -09/20/2021 21:49:38 - INFO - __main__ - Step 33887: {'lr': 0.00019962005642475012, 'samples': 1084384, 'steps': 2117, 'loss/train': 2.2569432258605957} -09/20/2021 21:49:39 - INFO - __main__ - Step 33888: {'lr': 0.00019962005642475012, 'samples': 1084416, 'steps': 2117, 'loss/train': 0.8062170147895813} -09/20/2021 21:49:40 - INFO - __main__ - Step 33889: {'lr': 0.0001996195006949383, 'samples': 1084448, 'steps': 2118, 'loss/train': 2.610931873321533} -09/20/2021 21:49:41 - INFO - __main__ - Step 33890: {'lr': 0.0001996195006949383, 'samples': 1084480, 'steps': 2118, 'loss/train': 2.426089286804199} -09/20/2021 21:49:41 - INFO - __main__ - Step 33891: {'lr': 0.0001996195006949383, 'samples': 1084512, 'steps': 2118, 'loss/train': 1.364879846572876} -09/20/2021 21:49:42 - INFO - __main__ - Step 33892: {'lr': 0.0001996195006949383, 'samples': 1084544, 'steps': 2118, 'loss/train': 1.5831818580627441} -09/20/2021 21:49:43 - INFO - __main__ - Step 33893: {'lr': 0.0001996195006949383, 'samples': 1084576, 'steps': 2118, 'loss/train': 2.130417585372925} -09/20/2021 21:49:44 - INFO - __main__ - Step 33894: {'lr': 0.0001996195006949383, 'samples': 1084608, 'steps': 2118, 'loss/train': 2.4233813285827637} -09/20/2021 21:49:44 - INFO - __main__ - Step 33895: {'lr': 0.0001996195006949383, 'samples': 1084640, 'steps': 2118, 'loss/train': 0.25853225588798523} -09/20/2021 21:49:45 - INFO - __main__ - Step 33896: {'lr': 0.0001996195006949383, 'samples': 1084672, 'steps': 2118, 'loss/train': 0.30837321281433105} -09/20/2021 21:49:46 - INFO - __main__ - Step 33897: {'lr': 0.0001996195006949383, 'samples': 1084704, 'steps': 2118, 'loss/train': 2.512366533279419} -09/20/2021 21:49:47 - INFO - __main__ - Step 33898: {'lr': 0.0001996195006949383, 'samples': 1084736, 'steps': 2118, 'loss/train': 0.40276920795440674} -09/20/2021 21:49:47 - INFO - __main__ - Step 33899: {'lr': 0.0001996195006949383, 'samples': 1084768, 'steps': 2118, 'loss/train': 1.7024799585342407} -09/20/2021 21:49:48 - INFO - __main__ - Step 33900: {'lr': 0.0001996195006949383, 'samples': 1084800, 'steps': 2118, 'loss/train': 2.489549160003662} -09/20/2021 21:49:49 - INFO - __main__ - Step 33901: {'lr': 0.0001996195006949383, 'samples': 1084832, 'steps': 2118, 'loss/train': 2.2267978191375732} -09/20/2021 21:49:50 - INFO - __main__ - Step 33902: {'lr': 0.0001996195006949383, 'samples': 1084864, 'steps': 2118, 'loss/train': 1.996856451034546} -09/20/2021 21:49:50 - INFO - __main__ - Step 33903: {'lr': 0.0001996195006949383, 'samples': 1084896, 'steps': 2118, 'loss/train': 3.719843626022339} -09/20/2021 21:49:51 - INFO - __main__ - Step 33904: {'lr': 0.0001996195006949383, 'samples': 1084928, 'steps': 2118, 'loss/train': 2.0619752407073975} -09/20/2021 21:49:52 - INFO - __main__ - Step 33905: {'lr': 0.00019961894455977513, 'samples': 1084960, 'steps': 2119, 'loss/train': 1.821356177330017} -09/20/2021 21:49:53 - INFO - __main__ - Step 33906: {'lr': 0.00019961894455977513, 'samples': 1084992, 'steps': 2119, 'loss/train': 2.2155048847198486} -09/20/2021 21:49:53 - INFO - __main__ - Step 33907: {'lr': 0.00019961894455977513, 'samples': 1085024, 'steps': 2119, 'loss/train': 2.795443534851074} -09/20/2021 21:49:54 - INFO - __main__ - Step 33908: {'lr': 0.00019961894455977513, 'samples': 1085056, 'steps': 2119, 'loss/train': 2.056637763977051} -09/20/2021 21:49:55 - INFO - __main__ - Step 33909: {'lr': 0.00019961894455977513, 'samples': 1085088, 'steps': 2119, 'loss/train': 2.3465187549591064} -09/20/2021 21:49:56 - INFO - __main__ - Step 33910: {'lr': 0.00019961894455977513, 'samples': 1085120, 'steps': 2119, 'loss/train': 4.519865036010742} -09/20/2021 21:49:56 - INFO - __main__ - Step 33911: {'lr': 0.00019961894455977513, 'samples': 1085152, 'steps': 2119, 'loss/train': 4.283524036407471} -09/20/2021 21:49:57 - INFO - __main__ - Step 33912: {'lr': 0.00019961894455977513, 'samples': 1085184, 'steps': 2119, 'loss/train': 4.35101842880249} -09/20/2021 21:49:58 - INFO - __main__ - Step 33913: {'lr': 0.00019961894455977513, 'samples': 1085216, 'steps': 2119, 'loss/train': 1.4371501207351685} -09/20/2021 21:50:00 - INFO - __main__ - Step 33914: {'lr': 0.00019961894455977513, 'samples': 1085248, 'steps': 2119, 'loss/train': 2.0898633003234863} -09/20/2021 21:50:01 - INFO - __main__ - Step 33915: {'lr': 0.00019961894455977513, 'samples': 1085280, 'steps': 2119, 'loss/train': 1.8233991861343384} -09/20/2021 21:50:01 - INFO - __main__ - Step 33916: {'lr': 0.00019961894455977513, 'samples': 1085312, 'steps': 2119, 'loss/train': 1.3652682304382324} -09/20/2021 21:50:02 - INFO - __main__ - Step 33917: {'lr': 0.00019961894455977513, 'samples': 1085344, 'steps': 2119, 'loss/train': 2.254045248031616} -09/20/2021 21:50:03 - INFO - __main__ - Step 33918: {'lr': 0.00019961894455977513, 'samples': 1085376, 'steps': 2119, 'loss/train': 2.1941940784454346} -09/20/2021 21:50:04 - INFO - __main__ - Step 33919: {'lr': 0.00019961894455977513, 'samples': 1085408, 'steps': 2119, 'loss/train': 2.3784992694854736} -09/20/2021 21:50:04 - INFO - __main__ - Step 33920: {'lr': 0.00019961894455977513, 'samples': 1085440, 'steps': 2119, 'loss/train': 2.8836617469787598} -09/20/2021 21:50:05 - INFO - __main__ - Step 33921: {'lr': 0.0001996183880192629, 'samples': 1085472, 'steps': 2120, 'loss/train': 2.390866994857788} -09/20/2021 21:50:06 - INFO - __main__ - Step 33922: {'lr': 0.0001996183880192629, 'samples': 1085504, 'steps': 2120, 'loss/train': 2.4484636783599854} -09/20/2021 21:50:07 - INFO - __main__ - Step 33923: {'lr': 0.0001996183880192629, 'samples': 1085536, 'steps': 2120, 'loss/train': 2.5735743045806885} -09/20/2021 21:50:08 - INFO - __main__ - Step 33924: {'lr': 0.0001996183880192629, 'samples': 1085568, 'steps': 2120, 'loss/train': 2.0139245986938477} -09/20/2021 21:50:08 - INFO - __main__ - Step 33925: {'lr': 0.0001996183880192629, 'samples': 1085600, 'steps': 2120, 'loss/train': 2.254727363586426} -09/20/2021 21:50:09 - INFO - __main__ - Step 33926: {'lr': 0.0001996183880192629, 'samples': 1085632, 'steps': 2120, 'loss/train': 1.9707541465759277} -09/20/2021 21:50:10 - INFO - __main__ - Step 33927: {'lr': 0.0001996183880192629, 'samples': 1085664, 'steps': 2120, 'loss/train': 2.121988296508789} -09/20/2021 21:50:11 - INFO - __main__ - Step 33928: {'lr': 0.0001996183880192629, 'samples': 1085696, 'steps': 2120, 'loss/train': 2.5010406970977783} -09/20/2021 21:50:11 - INFO - __main__ - Step 33929: {'lr': 0.0001996183880192629, 'samples': 1085728, 'steps': 2120, 'loss/train': 3.736431121826172} -09/20/2021 21:50:12 - INFO - __main__ - Step 33930: {'lr': 0.0001996183880192629, 'samples': 1085760, 'steps': 2120, 'loss/train': 1.4642229080200195} -09/20/2021 21:50:13 - INFO - __main__ - Step 33931: {'lr': 0.0001996183880192629, 'samples': 1085792, 'steps': 2120, 'loss/train': 1.7292410135269165} -09/20/2021 21:50:14 - INFO - __main__ - Step 33932: {'lr': 0.0001996183880192629, 'samples': 1085824, 'steps': 2120, 'loss/train': 1.4983617067337036} -09/20/2021 21:50:14 - INFO - __main__ - Step 33933: {'lr': 0.0001996183880192629, 'samples': 1085856, 'steps': 2120, 'loss/train': 1.700443148612976} -09/20/2021 21:50:15 - INFO - __main__ - Step 33934: {'lr': 0.0001996183880192629, 'samples': 1085888, 'steps': 2120, 'loss/train': 1.6008425951004028} -09/20/2021 21:50:16 - INFO - __main__ - Step 33935: {'lr': 0.0001996183880192629, 'samples': 1085920, 'steps': 2120, 'loss/train': 2.0098695755004883} -09/20/2021 21:50:17 - INFO - __main__ - Step 33936: {'lr': 0.0001996183880192629, 'samples': 1085952, 'steps': 2120, 'loss/train': 2.589456796646118} -09/20/2021 21:50:17 - INFO - __main__ - Step 33937: {'lr': 0.0001996178310734038, 'samples': 1085984, 'steps': 2121, 'loss/train': 1.0739620923995972} -09/20/2021 21:50:18 - INFO - __main__ - Step 33938: {'lr': 0.0001996178310734038, 'samples': 1086016, 'steps': 2121, 'loss/train': 2.517329454421997} -09/20/2021 21:50:19 - INFO - __main__ - Step 33939: {'lr': 0.0001996178310734038, 'samples': 1086048, 'steps': 2121, 'loss/train': 3.335054636001587} -09/20/2021 21:50:20 - INFO - __main__ - Step 33940: {'lr': 0.0001996178310734038, 'samples': 1086080, 'steps': 2121, 'loss/train': 1.422804832458496} -09/20/2021 21:50:20 - INFO - __main__ - Step 33941: {'lr': 0.0001996178310734038, 'samples': 1086112, 'steps': 2121, 'loss/train': 2.6110575199127197} -09/20/2021 21:50:21 - INFO - __main__ - Step 33942: {'lr': 0.0001996178310734038, 'samples': 1086144, 'steps': 2121, 'loss/train': 2.1247329711914062} -09/20/2021 21:50:22 - INFO - __main__ - Step 33943: {'lr': 0.0001996178310734038, 'samples': 1086176, 'steps': 2121, 'loss/train': 2.3366293907165527} -09/20/2021 21:50:23 - INFO - __main__ - Step 33944: {'lr': 0.0001996178310734038, 'samples': 1086208, 'steps': 2121, 'loss/train': 2.6476757526397705} -09/20/2021 21:50:24 - INFO - __main__ - Step 33945: {'lr': 0.0001996178310734038, 'samples': 1086240, 'steps': 2121, 'loss/train': 2.8935422897338867} -09/20/2021 21:50:25 - INFO - __main__ - Step 33946: {'lr': 0.0001996178310734038, 'samples': 1086272, 'steps': 2121, 'loss/train': 5.892439842224121} -09/20/2021 21:50:25 - INFO - __main__ - Step 33947: {'lr': 0.0001996178310734038, 'samples': 1086304, 'steps': 2121, 'loss/train': 1.9740146398544312} -09/20/2021 21:50:26 - INFO - __main__ - Step 33948: {'lr': 0.0001996178310734038, 'samples': 1086336, 'steps': 2121, 'loss/train': 3.1002283096313477} -09/20/2021 21:50:27 - INFO - __main__ - Step 33949: {'lr': 0.0001996178310734038, 'samples': 1086368, 'steps': 2121, 'loss/train': 3.2789900302886963} -09/20/2021 21:50:28 - INFO - __main__ - Step 33950: {'lr': 0.0001996178310734038, 'samples': 1086400, 'steps': 2121, 'loss/train': 0.6184825301170349} -09/20/2021 21:50:28 - INFO - __main__ - Step 33951: {'lr': 0.0001996178310734038, 'samples': 1086432, 'steps': 2121, 'loss/train': 3.0061452388763428} -09/20/2021 21:50:29 - INFO - __main__ - Step 33952: {'lr': 0.0001996178310734038, 'samples': 1086464, 'steps': 2121, 'loss/train': 1.3621954917907715} -09/20/2021 21:50:30 - INFO - __main__ - Step 33953: {'lr': 0.00019961727372220015, 'samples': 1086496, 'steps': 2122, 'loss/train': 2.573009729385376} -09/20/2021 21:50:31 - INFO - __main__ - Step 33954: {'lr': 0.00019961727372220015, 'samples': 1086528, 'steps': 2122, 'loss/train': 1.6340383291244507} -09/20/2021 21:50:32 - INFO - __main__ - Step 33955: {'lr': 0.00019961727372220015, 'samples': 1086560, 'steps': 2122, 'loss/train': 1.4439709186553955} -09/20/2021 21:50:32 - INFO - __main__ - Step 33956: {'lr': 0.00019961727372220015, 'samples': 1086592, 'steps': 2122, 'loss/train': 0.7913739085197449} -09/20/2021 21:50:33 - INFO - __main__ - Step 33957: {'lr': 0.00019961727372220015, 'samples': 1086624, 'steps': 2122, 'loss/train': 2.23569393157959} -09/20/2021 21:50:34 - INFO - __main__ - Step 33958: {'lr': 0.00019961727372220015, 'samples': 1086656, 'steps': 2122, 'loss/train': 1.8326705694198608} -09/20/2021 21:50:35 - INFO - __main__ - Step 33959: {'lr': 0.00019961727372220015, 'samples': 1086688, 'steps': 2122, 'loss/train': 0.5406787395477295} -09/20/2021 21:50:35 - INFO - __main__ - Step 33960: {'lr': 0.00019961727372220015, 'samples': 1086720, 'steps': 2122, 'loss/train': 2.6207263469696045} -09/20/2021 21:50:36 - INFO - __main__ - Step 33961: {'lr': 0.00019961727372220015, 'samples': 1086752, 'steps': 2122, 'loss/train': 2.7148959636688232} -09/20/2021 21:50:37 - INFO - __main__ - Step 33962: {'lr': 0.00019961727372220015, 'samples': 1086784, 'steps': 2122, 'loss/train': 1.5817323923110962} -09/20/2021 21:50:38 - INFO - __main__ - Step 33963: {'lr': 0.00019961727372220015, 'samples': 1086816, 'steps': 2122, 'loss/train': 3.472804546356201} -09/20/2021 21:50:38 - INFO - __main__ - Step 33964: {'lr': 0.00019961727372220015, 'samples': 1086848, 'steps': 2122, 'loss/train': 2.339782476425171} -09/20/2021 21:50:39 - INFO - __main__ - Step 33965: {'lr': 0.00019961727372220015, 'samples': 1086880, 'steps': 2122, 'loss/train': 2.705325126647949} -09/20/2021 21:50:40 - INFO - __main__ - Step 33966: {'lr': 0.00019961727372220015, 'samples': 1086912, 'steps': 2122, 'loss/train': 2.3773176670074463} -09/20/2021 21:50:41 - INFO - __main__ - Step 33967: {'lr': 0.00019961727372220015, 'samples': 1086944, 'steps': 2122, 'loss/train': 1.867602825164795} -09/20/2021 21:50:41 - INFO - __main__ - Step 33968: {'lr': 0.00019961727372220015, 'samples': 1086976, 'steps': 2122, 'loss/train': 2.373725652694702} -09/20/2021 21:50:42 - INFO - __main__ - Step 33969: {'lr': 0.00019961671596565418, 'samples': 1087008, 'steps': 2123, 'loss/train': 2.2075071334838867} -09/20/2021 21:50:43 - INFO - __main__ - Step 33970: {'lr': 0.00019961671596565418, 'samples': 1087040, 'steps': 2123, 'loss/train': 2.7877845764160156} -09/20/2021 21:50:44 - INFO - __main__ - Step 33971: {'lr': 0.00019961671596565418, 'samples': 1087072, 'steps': 2123, 'loss/train': 2.2980446815490723} -09/20/2021 21:50:45 - INFO - __main__ - Step 33972: {'lr': 0.00019961671596565418, 'samples': 1087104, 'steps': 2123, 'loss/train': 2.4598958492279053} -09/20/2021 21:50:45 - INFO - __main__ - Step 33973: {'lr': 0.00019961671596565418, 'samples': 1087136, 'steps': 2123, 'loss/train': 2.6158392429351807} -09/20/2021 21:50:46 - INFO - __main__ - Step 33974: {'lr': 0.00019961671596565418, 'samples': 1087168, 'steps': 2123, 'loss/train': 1.8309398889541626} -09/20/2021 21:50:48 - INFO - __main__ - Step 33975: {'lr': 0.00019961671596565418, 'samples': 1087200, 'steps': 2123, 'loss/train': 1.79079008102417} -09/20/2021 21:50:49 - INFO - __main__ - Step 33976: {'lr': 0.00019961671596565418, 'samples': 1087232, 'steps': 2123, 'loss/train': 1.7379307746887207} -09/20/2021 21:50:49 - INFO - __main__ - Step 33977: {'lr': 0.00019961671596565418, 'samples': 1087264, 'steps': 2123, 'loss/train': 1.4476131200790405} -09/20/2021 21:50:50 - INFO - __main__ - Step 33978: {'lr': 0.00019961671596565418, 'samples': 1087296, 'steps': 2123, 'loss/train': 2.0408759117126465} -09/20/2021 21:50:51 - INFO - __main__ - Step 33979: {'lr': 0.00019961671596565418, 'samples': 1087328, 'steps': 2123, 'loss/train': 2.4296631813049316} -09/20/2021 21:50:52 - INFO - __main__ - Step 33980: {'lr': 0.00019961671596565418, 'samples': 1087360, 'steps': 2123, 'loss/train': 2.28429913520813} -09/20/2021 21:50:52 - INFO - __main__ - Step 33981: {'lr': 0.00019961671596565418, 'samples': 1087392, 'steps': 2123, 'loss/train': 2.170431137084961} -09/20/2021 21:50:53 - INFO - __main__ - Step 33982: {'lr': 0.00019961671596565418, 'samples': 1087424, 'steps': 2123, 'loss/train': 1.7759087085723877} -09/20/2021 21:50:54 - INFO - __main__ - Step 33983: {'lr': 0.00019961671596565418, 'samples': 1087456, 'steps': 2123, 'loss/train': 1.7309839725494385} -09/20/2021 21:50:55 - INFO - __main__ - Step 33984: {'lr': 0.00019961671596565418, 'samples': 1087488, 'steps': 2123, 'loss/train': 2.5703158378601074} -09/20/2021 21:50:56 - INFO - __main__ - Step 33985: {'lr': 0.00019961615780376816, 'samples': 1087520, 'steps': 2124, 'loss/train': 1.5117534399032593} -09/20/2021 21:50:56 - INFO - __main__ - Step 33986: {'lr': 0.00019961615780376816, 'samples': 1087552, 'steps': 2124, 'loss/train': 2.684443235397339} -09/20/2021 21:50:57 - INFO - __main__ - Step 33987: {'lr': 0.00019961615780376816, 'samples': 1087584, 'steps': 2124, 'loss/train': 2.5877585411071777} -09/20/2021 21:50:58 - INFO - __main__ - Step 33988: {'lr': 0.00019961615780376816, 'samples': 1087616, 'steps': 2124, 'loss/train': 2.506361722946167} -09/20/2021 21:50:59 - INFO - __main__ - Step 33989: {'lr': 0.00019961615780376816, 'samples': 1087648, 'steps': 2124, 'loss/train': 2.4486188888549805} -09/20/2021 21:50:59 - INFO - __main__ - Step 33990: {'lr': 0.00019961615780376816, 'samples': 1087680, 'steps': 2124, 'loss/train': 2.4715793132781982} -09/20/2021 21:51:00 - INFO - __main__ - Step 33991: {'lr': 0.00019961615780376816, 'samples': 1087712, 'steps': 2124, 'loss/train': 3.6961889266967773} -09/20/2021 21:51:01 - INFO - __main__ - Step 33992: {'lr': 0.00019961615780376816, 'samples': 1087744, 'steps': 2124, 'loss/train': 3.6724729537963867} -09/20/2021 21:51:02 - INFO - __main__ - Step 33993: {'lr': 0.00019961615780376816, 'samples': 1087776, 'steps': 2124, 'loss/train': 1.9328280687332153} -09/20/2021 21:51:02 - INFO - __main__ - Step 33994: {'lr': 0.00019961615780376816, 'samples': 1087808, 'steps': 2124, 'loss/train': 1.6486566066741943} -09/20/2021 21:51:03 - INFO - __main__ - Step 33995: {'lr': 0.00019961615780376816, 'samples': 1087840, 'steps': 2124, 'loss/train': 1.7330191135406494} -09/20/2021 21:51:04 - INFO - __main__ - Step 33996: {'lr': 0.00019961615780376816, 'samples': 1087872, 'steps': 2124, 'loss/train': 2.1615068912506104} -09/20/2021 21:51:05 - INFO - __main__ - Step 33997: {'lr': 0.00019961615780376816, 'samples': 1087904, 'steps': 2124, 'loss/train': 0.8504422903060913} -09/20/2021 21:51:05 - INFO - __main__ - Step 33998: {'lr': 0.00019961615780376816, 'samples': 1087936, 'steps': 2124, 'loss/train': 2.747063159942627} -09/20/2021 21:51:06 - INFO - __main__ - Step 33999: {'lr': 0.00019961615780376816, 'samples': 1087968, 'steps': 2124, 'loss/train': 1.9781779050827026} -09/20/2021 21:51:07 - INFO - __main__ - Step 34000: {'lr': 0.00019961615780376816, 'samples': 1088000, 'steps': 2124, 'loss/train': 2.1254825592041016} -09/20/2021 21:51:08 - INFO - __main__ - Step 34001: {'lr': 0.0001996155992365444, 'samples': 1088032, 'steps': 2125, 'loss/train': 2.8438732624053955} -09/20/2021 21:51:08 - INFO - __main__ - Step 34002: {'lr': 0.0001996155992365444, 'samples': 1088064, 'steps': 2125, 'loss/train': 2.1035759449005127} -09/20/2021 21:51:09 - INFO - __main__ - Step 34003: {'lr': 0.0001996155992365444, 'samples': 1088096, 'steps': 2125, 'loss/train': 3.3611631393432617} -09/20/2021 21:51:10 - INFO - __main__ - Step 34004: {'lr': 0.0001996155992365444, 'samples': 1088128, 'steps': 2125, 'loss/train': 1.2454888820648193} -09/20/2021 21:51:11 - INFO - __main__ - Step 34005: {'lr': 0.0001996155992365444, 'samples': 1088160, 'steps': 2125, 'loss/train': 1.652987003326416} -09/20/2021 21:51:12 - INFO - __main__ - Step 34006: {'lr': 0.0001996155992365444, 'samples': 1088192, 'steps': 2125, 'loss/train': 2.1846718788146973} -09/20/2021 21:51:13 - INFO - __main__ - Step 34007: {'lr': 0.0001996155992365444, 'samples': 1088224, 'steps': 2125, 'loss/train': 2.5555243492126465} -09/20/2021 21:51:13 - INFO - __main__ - Step 34008: {'lr': 0.0001996155992365444, 'samples': 1088256, 'steps': 2125, 'loss/train': 2.745115041732788} -09/20/2021 21:51:14 - INFO - __main__ - Step 34009: {'lr': 0.0001996155992365444, 'samples': 1088288, 'steps': 2125, 'loss/train': 4.169842720031738} -09/20/2021 21:51:15 - INFO - __main__ - Step 34010: {'lr': 0.0001996155992365444, 'samples': 1088320, 'steps': 2125, 'loss/train': 2.1807971000671387} -09/20/2021 21:51:16 - INFO - __main__ - Step 34011: {'lr': 0.0001996155992365444, 'samples': 1088352, 'steps': 2125, 'loss/train': 1.8154557943344116} -09/20/2021 21:51:16 - INFO - __main__ - Step 34012: {'lr': 0.0001996155992365444, 'samples': 1088384, 'steps': 2125, 'loss/train': 0.7445976734161377} -09/20/2021 21:51:17 - INFO - __main__ - Step 34013: {'lr': 0.0001996155992365444, 'samples': 1088416, 'steps': 2125, 'loss/train': 2.4826629161834717} -09/20/2021 21:51:18 - INFO - __main__ - Step 34014: {'lr': 0.0001996155992365444, 'samples': 1088448, 'steps': 2125, 'loss/train': 1.5270233154296875} -09/20/2021 21:51:19 - INFO - __main__ - Step 34015: {'lr': 0.0001996155992365444, 'samples': 1088480, 'steps': 2125, 'loss/train': 3.7859442234039307} -09/20/2021 21:51:19 - INFO - __main__ - Step 34016: {'lr': 0.0001996155992365444, 'samples': 1088512, 'steps': 2125, 'loss/train': 2.8259479999542236} -09/20/2021 21:51:20 - INFO - __main__ - Step 34017: {'lr': 0.00019961504026398514, 'samples': 1088544, 'steps': 2126, 'loss/train': 2.2571933269500732} -09/20/2021 21:51:21 - INFO - __main__ - Step 34018: {'lr': 0.00019961504026398514, 'samples': 1088576, 'steps': 2126, 'loss/train': 2.0837297439575195} -09/20/2021 21:51:22 - INFO - __main__ - Step 34019: {'lr': 0.00019961504026398514, 'samples': 1088608, 'steps': 2126, 'loss/train': 2.749922037124634} -09/20/2021 21:51:23 - INFO - __main__ - Step 34020: {'lr': 0.00019961504026398514, 'samples': 1088640, 'steps': 2126, 'loss/train': 3.3967506885528564} -09/20/2021 21:51:23 - INFO - __main__ - Step 34021: {'lr': 0.00019961504026398514, 'samples': 1088672, 'steps': 2126, 'loss/train': 1.5001449584960938} -09/20/2021 21:51:24 - INFO - __main__ - Step 34022: {'lr': 0.00019961504026398514, 'samples': 1088704, 'steps': 2126, 'loss/train': 2.2013888359069824} -09/20/2021 21:51:25 - INFO - __main__ - Step 34023: {'lr': 0.00019961504026398514, 'samples': 1088736, 'steps': 2126, 'loss/train': 2.201075792312622} -09/20/2021 21:51:26 - INFO - __main__ - Step 34024: {'lr': 0.00019961504026398514, 'samples': 1088768, 'steps': 2126, 'loss/train': 1.9267443418502808} -09/20/2021 21:51:26 - INFO - __main__ - Step 34025: {'lr': 0.00019961504026398514, 'samples': 1088800, 'steps': 2126, 'loss/train': 2.838118314743042} -09/20/2021 21:51:27 - INFO - __main__ - Step 34026: {'lr': 0.00019961504026398514, 'samples': 1088832, 'steps': 2126, 'loss/train': 2.499159574508667} -09/20/2021 21:51:28 - INFO - __main__ - Step 34027: {'lr': 0.00019961504026398514, 'samples': 1088864, 'steps': 2126, 'loss/train': 2.2235429286956787} -09/20/2021 21:51:29 - INFO - __main__ - Step 34028: {'lr': 0.00019961504026398514, 'samples': 1088896, 'steps': 2126, 'loss/train': 1.9003485441207886} -09/20/2021 21:51:29 - INFO - __main__ - Step 34029: {'lr': 0.00019961504026398514, 'samples': 1088928, 'steps': 2126, 'loss/train': 1.992746114730835} -09/20/2021 21:51:30 - INFO - __main__ - Step 34030: {'lr': 0.00019961504026398514, 'samples': 1088960, 'steps': 2126, 'loss/train': 2.653266668319702} -09/20/2021 21:51:31 - INFO - __main__ - Step 34031: {'lr': 0.00019961504026398514, 'samples': 1088992, 'steps': 2126, 'loss/train': 2.26991605758667} -09/20/2021 21:51:32 - INFO - __main__ - Step 34032: {'lr': 0.00019961504026398514, 'samples': 1089024, 'steps': 2126, 'loss/train': 2.0259344577789307} -09/20/2021 21:51:33 - INFO - __main__ - Step 34033: {'lr': 0.0001996144808860927, 'samples': 1089056, 'steps': 2127, 'loss/train': 2.679717779159546} -09/20/2021 21:51:33 - INFO - __main__ - Step 34034: {'lr': 0.0001996144808860927, 'samples': 1089088, 'steps': 2127, 'loss/train': 3.438791513442993} -09/20/2021 21:51:34 - INFO - __main__ - Step 34035: {'lr': 0.0001996144808860927, 'samples': 1089120, 'steps': 2127, 'loss/train': 2.998887538909912} -09/20/2021 21:51:35 - INFO - __main__ - Step 34036: {'lr': 0.0001996144808860927, 'samples': 1089152, 'steps': 2127, 'loss/train': 2.6179697513580322} -09/20/2021 21:51:36 - INFO - __main__ - Step 34037: {'lr': 0.0001996144808860927, 'samples': 1089184, 'steps': 2127, 'loss/train': 0.16252945363521576} -09/20/2021 21:51:37 - INFO - __main__ - Step 34038: {'lr': 0.0001996144808860927, 'samples': 1089216, 'steps': 2127, 'loss/train': 0.30431777238845825} -09/20/2021 21:51:38 - INFO - __main__ - Step 34039: {'lr': 0.0001996144808860927, 'samples': 1089248, 'steps': 2127, 'loss/train': 3.4177186489105225} -09/20/2021 21:51:38 - INFO - __main__ - Step 34040: {'lr': 0.0001996144808860927, 'samples': 1089280, 'steps': 2127, 'loss/train': 2.433933973312378} -09/20/2021 21:51:39 - INFO - __main__ - Step 34041: {'lr': 0.0001996144808860927, 'samples': 1089312, 'steps': 2127, 'loss/train': 1.072290062904358} -09/20/2021 21:51:40 - INFO - __main__ - Step 34042: {'lr': 0.0001996144808860927, 'samples': 1089344, 'steps': 2127, 'loss/train': 2.0422043800354004} -09/20/2021 21:51:41 - INFO - __main__ - Step 34043: {'lr': 0.0001996144808860927, 'samples': 1089376, 'steps': 2127, 'loss/train': 2.320671319961548} -09/20/2021 21:51:41 - INFO - __main__ - Step 34044: {'lr': 0.0001996144808860927, 'samples': 1089408, 'steps': 2127, 'loss/train': 2.5065009593963623} -09/20/2021 21:51:42 - INFO - __main__ - Step 34045: {'lr': 0.0001996144808860927, 'samples': 1089440, 'steps': 2127, 'loss/train': 2.2526330947875977} -09/20/2021 21:51:43 - INFO - __main__ - Step 34046: {'lr': 0.0001996144808860927, 'samples': 1089472, 'steps': 2127, 'loss/train': 2.868962049484253} -09/20/2021 21:51:44 - INFO - __main__ - Step 34047: {'lr': 0.0001996144808860927, 'samples': 1089504, 'steps': 2127, 'loss/train': 1.725586175918579} -09/20/2021 21:51:44 - INFO - __main__ - Step 34048: {'lr': 0.0001996144808860927, 'samples': 1089536, 'steps': 2127, 'loss/train': 2.00587797164917} -09/20/2021 21:51:45 - INFO - __main__ - Step 34049: {'lr': 0.0001996139211028693, 'samples': 1089568, 'steps': 2128, 'loss/train': 2.8121144771575928} -09/20/2021 21:51:46 - INFO - __main__ - Step 34050: {'lr': 0.0001996139211028693, 'samples': 1089600, 'steps': 2128, 'loss/train': 2.9273288249969482} -09/20/2021 21:51:47 - INFO - __main__ - Step 34051: {'lr': 0.0001996139211028693, 'samples': 1089632, 'steps': 2128, 'loss/train': 1.6573443412780762} -09/20/2021 21:51:47 - INFO - __main__ - Step 34052: {'lr': 0.0001996139211028693, 'samples': 1089664, 'steps': 2128, 'loss/train': 2.6891255378723145} -09/20/2021 21:51:48 - INFO - __main__ - Step 34053: {'lr': 0.0001996139211028693, 'samples': 1089696, 'steps': 2128, 'loss/train': 2.771193742752075} -09/20/2021 21:51:49 - INFO - __main__ - Step 34054: {'lr': 0.0001996139211028693, 'samples': 1089728, 'steps': 2128, 'loss/train': 1.470224142074585} -09/20/2021 21:51:50 - INFO - __main__ - Step 34055: {'lr': 0.0001996139211028693, 'samples': 1089760, 'steps': 2128, 'loss/train': 1.7849416732788086} -09/20/2021 21:51:50 - INFO - __main__ - Step 34056: {'lr': 0.0001996139211028693, 'samples': 1089792, 'steps': 2128, 'loss/train': 2.7644107341766357} -09/20/2021 21:51:51 - INFO - __main__ - Step 34057: {'lr': 0.0001996139211028693, 'samples': 1089824, 'steps': 2128, 'loss/train': 1.925299048423767} -09/20/2021 21:51:52 - INFO - __main__ - Step 34058: {'lr': 0.0001996139211028693, 'samples': 1089856, 'steps': 2128, 'loss/train': 1.9434099197387695} -09/20/2021 21:51:53 - INFO - __main__ - Step 34059: {'lr': 0.0001996139211028693, 'samples': 1089888, 'steps': 2128, 'loss/train': 1.7027993202209473} -09/20/2021 21:51:53 - INFO - __main__ - Step 34060: {'lr': 0.0001996139211028693, 'samples': 1089920, 'steps': 2128, 'loss/train': 2.9391252994537354} -09/20/2021 21:51:54 - INFO - __main__ - Step 34061: {'lr': 0.0001996139211028693, 'samples': 1089952, 'steps': 2128, 'loss/train': 1.32523512840271} -09/20/2021 21:51:55 - INFO - __main__ - Step 34062: {'lr': 0.0001996139211028693, 'samples': 1089984, 'steps': 2128, 'loss/train': 1.378967523574829} -09/20/2021 21:51:56 - INFO - __main__ - Step 34063: {'lr': 0.0001996139211028693, 'samples': 1090016, 'steps': 2128, 'loss/train': 1.9891085624694824} -09/20/2021 21:51:56 - INFO - __main__ - Step 34064: {'lr': 0.0001996139211028693, 'samples': 1090048, 'steps': 2128, 'loss/train': 2.5340077877044678} -09/20/2021 21:51:57 - INFO - __main__ - Step 34065: {'lr': 0.00019961336091431727, 'samples': 1090080, 'steps': 2129, 'loss/train': 2.5606331825256348} -09/20/2021 21:51:58 - INFO - __main__ - Step 34066: {'lr': 0.00019961336091431727, 'samples': 1090112, 'steps': 2129, 'loss/train': 0.6556230783462524} -09/20/2021 21:51:59 - INFO - __main__ - Step 34067: {'lr': 0.00019961336091431727, 'samples': 1090144, 'steps': 2129, 'loss/train': 1.3568134307861328} -09/20/2021 21:52:00 - INFO - __main__ - Step 34068: {'lr': 0.00019961336091431727, 'samples': 1090176, 'steps': 2129, 'loss/train': 0.8042850494384766} -09/20/2021 21:52:00 - INFO - __main__ - Step 34069: {'lr': 0.00019961336091431727, 'samples': 1090208, 'steps': 2129, 'loss/train': 2.3065624237060547} -09/20/2021 21:52:02 - INFO - __main__ - Step 34070: {'lr': 0.00019961336091431727, 'samples': 1090240, 'steps': 2129, 'loss/train': 0.604097306728363} -09/20/2021 21:52:03 - INFO - __main__ - Step 34071: {'lr': 0.00019961336091431727, 'samples': 1090272, 'steps': 2129, 'loss/train': 1.3813799619674683} -09/20/2021 21:52:03 - INFO - __main__ - Step 34072: {'lr': 0.00019961336091431727, 'samples': 1090304, 'steps': 2129, 'loss/train': 2.8478236198425293} -09/20/2021 21:52:04 - INFO - __main__ - Step 34073: {'lr': 0.00019961336091431727, 'samples': 1090336, 'steps': 2129, 'loss/train': 0.2939494550228119} -09/20/2021 21:52:05 - INFO - __main__ - Step 34074: {'lr': 0.00019961336091431727, 'samples': 1090368, 'steps': 2129, 'loss/train': 0.4319717288017273} -09/20/2021 21:52:06 - INFO - __main__ - Step 34075: {'lr': 0.00019961336091431727, 'samples': 1090400, 'steps': 2129, 'loss/train': 0.32113373279571533} -09/20/2021 21:52:06 - INFO - __main__ - Step 34076: {'lr': 0.00019961336091431727, 'samples': 1090432, 'steps': 2129, 'loss/train': 0.10923121869564056} -09/20/2021 21:52:07 - INFO - __main__ - Step 34077: {'lr': 0.00019961336091431727, 'samples': 1090464, 'steps': 2129, 'loss/train': 0.34640491008758545} -09/20/2021 21:52:08 - INFO - __main__ - Step 34078: {'lr': 0.00019961336091431727, 'samples': 1090496, 'steps': 2129, 'loss/train': 1.7338447570800781} -09/20/2021 21:52:09 - INFO - __main__ - Step 34079: {'lr': 0.00019961336091431727, 'samples': 1090528, 'steps': 2129, 'loss/train': 2.157099485397339} -09/20/2021 21:52:09 - INFO - __main__ - Step 34080: {'lr': 0.00019961336091431727, 'samples': 1090560, 'steps': 2129, 'loss/train': 3.3714373111724854} -09/20/2021 21:52:10 - INFO - __main__ - Step 34081: {'lr': 0.00019961280032043883, 'samples': 1090592, 'steps': 2130, 'loss/train': 1.95369291305542} -09/20/2021 21:52:11 - INFO - __main__ - Step 34082: {'lr': 0.00019961280032043883, 'samples': 1090624, 'steps': 2130, 'loss/train': 3.573500871658325} -09/20/2021 21:52:12 - INFO - __main__ - Step 34083: {'lr': 0.00019961280032043883, 'samples': 1090656, 'steps': 2130, 'loss/train': 2.6025869846343994} -09/20/2021 21:52:13 - INFO - __main__ - Step 34084: {'lr': 0.00019961280032043883, 'samples': 1090688, 'steps': 2130, 'loss/train': 3.098409414291382} -09/20/2021 21:52:13 - INFO - __main__ - Step 34085: {'lr': 0.00019961280032043883, 'samples': 1090720, 'steps': 2130, 'loss/train': 2.5720014572143555} -09/20/2021 21:52:14 - INFO - __main__ - Step 34086: {'lr': 0.00019961280032043883, 'samples': 1090752, 'steps': 2130, 'loss/train': 2.5676939487457275} -09/20/2021 21:52:15 - INFO - __main__ - Step 34087: {'lr': 0.00019961280032043883, 'samples': 1090784, 'steps': 2130, 'loss/train': 1.7080676555633545} -09/20/2021 21:52:16 - INFO - __main__ - Step 34088: {'lr': 0.00019961280032043883, 'samples': 1090816, 'steps': 2130, 'loss/train': 1.2154492139816284} -09/20/2021 21:52:16 - INFO - __main__ - Step 34089: {'lr': 0.00019961280032043883, 'samples': 1090848, 'steps': 2130, 'loss/train': 2.9562315940856934} -09/20/2021 21:52:17 - INFO - __main__ - Step 34090: {'lr': 0.00019961280032043883, 'samples': 1090880, 'steps': 2130, 'loss/train': 2.9036312103271484} -09/20/2021 21:52:18 - INFO - __main__ - Step 34091: {'lr': 0.00019961280032043883, 'samples': 1090912, 'steps': 2130, 'loss/train': 2.449162483215332} -09/20/2021 21:52:19 - INFO - __main__ - Step 34092: {'lr': 0.00019961280032043883, 'samples': 1090944, 'steps': 2130, 'loss/train': 2.7445671558380127} -09/20/2021 21:52:19 - INFO - __main__ - Step 34093: {'lr': 0.00019961280032043883, 'samples': 1090976, 'steps': 2130, 'loss/train': 2.679140329360962} -09/20/2021 21:52:20 - INFO - __main__ - Step 34094: {'lr': 0.00019961280032043883, 'samples': 1091008, 'steps': 2130, 'loss/train': 1.91517174243927} -09/20/2021 21:52:21 - INFO - __main__ - Step 34095: {'lr': 0.00019961280032043883, 'samples': 1091040, 'steps': 2130, 'loss/train': 2.352572202682495} -09/20/2021 21:52:22 - INFO - __main__ - Step 34096: {'lr': 0.00019961280032043883, 'samples': 1091072, 'steps': 2130, 'loss/train': 2.4127161502838135} -09/20/2021 21:52:22 - INFO - __main__ - Step 34097: {'lr': 0.0001996122393212363, 'samples': 1091104, 'steps': 2131, 'loss/train': 3.2120087146759033} -09/20/2021 21:52:23 - INFO - __main__ - Step 34098: {'lr': 0.0001996122393212363, 'samples': 1091136, 'steps': 2131, 'loss/train': 1.883270025253296} -09/20/2021 21:52:24 - INFO - __main__ - Step 34099: {'lr': 0.0001996122393212363, 'samples': 1091168, 'steps': 2131, 'loss/train': 1.9453871250152588} -09/20/2021 21:52:25 - INFO - __main__ - Step 34100: {'lr': 0.0001996122393212363, 'samples': 1091200, 'steps': 2131, 'loss/train': 2.145015239715576} -09/20/2021 21:52:26 - INFO - __main__ - Step 34101: {'lr': 0.0001996122393212363, 'samples': 1091232, 'steps': 2131, 'loss/train': 2.4412546157836914} -09/20/2021 21:52:27 - INFO - __main__ - Step 34102: {'lr': 0.0001996122393212363, 'samples': 1091264, 'steps': 2131, 'loss/train': 3.191600799560547} -09/20/2021 21:52:27 - INFO - __main__ - Step 34103: {'lr': 0.0001996122393212363, 'samples': 1091296, 'steps': 2131, 'loss/train': 2.0475265979766846} -09/20/2021 21:52:28 - INFO - __main__ - Step 34104: {'lr': 0.0001996122393212363, 'samples': 1091328, 'steps': 2131, 'loss/train': 2.435325860977173} -09/20/2021 21:52:29 - INFO - __main__ - Step 34105: {'lr': 0.0001996122393212363, 'samples': 1091360, 'steps': 2131, 'loss/train': 2.2154555320739746} -09/20/2021 21:52:30 - INFO - __main__ - Step 34106: {'lr': 0.0001996122393212363, 'samples': 1091392, 'steps': 2131, 'loss/train': 1.808447003364563} -09/20/2021 21:52:30 - INFO - __main__ - Step 34107: {'lr': 0.0001996122393212363, 'samples': 1091424, 'steps': 2131, 'loss/train': 1.9483925104141235} -09/20/2021 21:52:31 - INFO - __main__ - Step 34108: {'lr': 0.0001996122393212363, 'samples': 1091456, 'steps': 2131, 'loss/train': 1.970837116241455} -09/20/2021 21:52:32 - INFO - __main__ - Step 34109: {'lr': 0.0001996122393212363, 'samples': 1091488, 'steps': 2131, 'loss/train': 1.5059151649475098} -09/20/2021 21:52:33 - INFO - __main__ - Step 34110: {'lr': 0.0001996122393212363, 'samples': 1091520, 'steps': 2131, 'loss/train': 2.3233466148376465} -09/20/2021 21:52:33 - INFO - __main__ - Step 34111: {'lr': 0.0001996122393212363, 'samples': 1091552, 'steps': 2131, 'loss/train': 2.380171537399292} -09/20/2021 21:52:34 - INFO - __main__ - Step 34112: {'lr': 0.0001996122393212363, 'samples': 1091584, 'steps': 2131, 'loss/train': 2.658200979232788} -09/20/2021 21:52:35 - INFO - __main__ - Step 34113: {'lr': 0.00019961167791671195, 'samples': 1091616, 'steps': 2132, 'loss/train': 2.206383228302002} -09/20/2021 21:52:36 - INFO - __main__ - Step 34114: {'lr': 0.00019961167791671195, 'samples': 1091648, 'steps': 2132, 'loss/train': 2.4913711547851562} -09/20/2021 21:52:37 - INFO - __main__ - Step 34115: {'lr': 0.00019961167791671195, 'samples': 1091680, 'steps': 2132, 'loss/train': 2.790254592895508} -09/20/2021 21:52:37 - INFO - __main__ - Step 34116: {'lr': 0.00019961167791671195, 'samples': 1091712, 'steps': 2132, 'loss/train': 2.651947498321533} -09/20/2021 21:52:38 - INFO - __main__ - Step 34117: {'lr': 0.00019961167791671195, 'samples': 1091744, 'steps': 2132, 'loss/train': 2.6495401859283447} -09/20/2021 21:52:39 - INFO - __main__ - Step 34118: {'lr': 0.00019961167791671195, 'samples': 1091776, 'steps': 2132, 'loss/train': 2.2188560962677} -09/20/2021 21:52:40 - INFO - __main__ - Step 34119: {'lr': 0.00019961167791671195, 'samples': 1091808, 'steps': 2132, 'loss/train': 1.5848803520202637} -09/20/2021 21:52:40 - INFO - __main__ - Step 34120: {'lr': 0.00019961167791671195, 'samples': 1091840, 'steps': 2132, 'loss/train': 2.7358238697052} -09/20/2021 21:52:41 - INFO - __main__ - Step 34121: {'lr': 0.00019961167791671195, 'samples': 1091872, 'steps': 2132, 'loss/train': 2.3638644218444824} -09/20/2021 21:52:42 - INFO - __main__ - Step 34122: {'lr': 0.00019961167791671195, 'samples': 1091904, 'steps': 2132, 'loss/train': 1.6571217775344849} -09/20/2021 21:52:43 - INFO - __main__ - Step 34123: {'lr': 0.00019961167791671195, 'samples': 1091936, 'steps': 2132, 'loss/train': 1.8628703355789185} -09/20/2021 21:52:43 - INFO - __main__ - Step 34124: {'lr': 0.00019961167791671195, 'samples': 1091968, 'steps': 2132, 'loss/train': 2.6333553791046143} -09/20/2021 21:52:44 - INFO - __main__ - Step 34125: {'lr': 0.00019961167791671195, 'samples': 1092000, 'steps': 2132, 'loss/train': 2.399965524673462} -09/20/2021 21:52:45 - INFO - __main__ - Step 34126: {'lr': 0.00019961167791671195, 'samples': 1092032, 'steps': 2132, 'loss/train': 0.5213419198989868} -09/20/2021 21:52:46 - INFO - __main__ - Step 34127: {'lr': 0.00019961167791671195, 'samples': 1092064, 'steps': 2132, 'loss/train': 2.851306915283203} -09/20/2021 21:52:46 - INFO - __main__ - Step 34128: {'lr': 0.00019961167791671195, 'samples': 1092096, 'steps': 2132, 'loss/train': 2.363192081451416} -09/20/2021 21:52:47 - INFO - __main__ - Step 34129: {'lr': 0.00019961111610686808, 'samples': 1092128, 'steps': 2133, 'loss/train': 2.8221518993377686} -09/20/2021 21:52:48 - INFO - __main__ - Step 34130: {'lr': 0.00019961111610686808, 'samples': 1092160, 'steps': 2133, 'loss/train': 2.1046478748321533} -09/20/2021 21:52:49 - INFO - __main__ - Step 34131: {'lr': 0.00019961111610686808, 'samples': 1092192, 'steps': 2133, 'loss/train': 2.4239182472229004} -09/20/2021 21:52:50 - INFO - __main__ - Step 34132: {'lr': 0.00019961111610686808, 'samples': 1092224, 'steps': 2133, 'loss/train': 2.4503767490386963} -09/20/2021 21:52:51 - INFO - __main__ - Step 34133: {'lr': 0.00019961111610686808, 'samples': 1092256, 'steps': 2133, 'loss/train': 2.4839484691619873} -09/20/2021 21:52:51 - INFO - __main__ - Step 34134: {'lr': 0.00019961111610686808, 'samples': 1092288, 'steps': 2133, 'loss/train': 2.4084699153900146} -09/20/2021 21:52:52 - INFO - __main__ - Step 34135: {'lr': 0.00019961111610686808, 'samples': 1092320, 'steps': 2133, 'loss/train': 2.028277635574341} -09/20/2021 21:52:53 - INFO - __main__ - Step 34136: {'lr': 0.00019961111610686808, 'samples': 1092352, 'steps': 2133, 'loss/train': 2.224802017211914} -09/20/2021 21:52:54 - INFO - __main__ - Step 34137: {'lr': 0.00019961111610686808, 'samples': 1092384, 'steps': 2133, 'loss/train': 1.5118919610977173} -09/20/2021 21:52:54 - INFO - __main__ - Step 34138: {'lr': 0.00019961111610686808, 'samples': 1092416, 'steps': 2133, 'loss/train': 2.113529920578003} -09/20/2021 21:52:55 - INFO - __main__ - Step 34139: {'lr': 0.00019961111610686808, 'samples': 1092448, 'steps': 2133, 'loss/train': 2.3250839710235596} -09/20/2021 21:52:56 - INFO - __main__ - Step 34140: {'lr': 0.00019961111610686808, 'samples': 1092480, 'steps': 2133, 'loss/train': 2.602121591567993} -09/20/2021 21:52:57 - INFO - __main__ - Step 34141: {'lr': 0.00019961111610686808, 'samples': 1092512, 'steps': 2133, 'loss/train': 1.9328726530075073} -09/20/2021 21:52:57 - INFO - __main__ - Step 34142: {'lr': 0.00019961111610686808, 'samples': 1092544, 'steps': 2133, 'loss/train': 1.184391736984253} -09/20/2021 21:52:58 - INFO - __main__ - Step 34143: {'lr': 0.00019961111610686808, 'samples': 1092576, 'steps': 2133, 'loss/train': 2.542907476425171} -09/20/2021 21:52:59 - INFO - __main__ - Step 34144: {'lr': 0.00019961111610686808, 'samples': 1092608, 'steps': 2133, 'loss/train': 2.5225138664245605} -09/20/2021 21:53:00 - INFO - __main__ - Step 34145: {'lr': 0.00019961055389170696, 'samples': 1092640, 'steps': 2134, 'loss/train': 2.1247341632843018} -09/20/2021 21:53:01 - INFO - __main__ - Step 34146: {'lr': 0.00019961055389170696, 'samples': 1092672, 'steps': 2134, 'loss/train': 1.9772745370864868} -09/20/2021 21:53:01 - INFO - __main__ - Step 34147: {'lr': 0.00019961055389170696, 'samples': 1092704, 'steps': 2134, 'loss/train': 2.212890863418579} -09/20/2021 21:53:02 - INFO - __main__ - Step 34148: {'lr': 0.00019961055389170696, 'samples': 1092736, 'steps': 2134, 'loss/train': 3.446491241455078} -09/20/2021 21:53:03 - INFO - __main__ - Step 34149: {'lr': 0.00019961055389170696, 'samples': 1092768, 'steps': 2134, 'loss/train': 2.055875539779663} -09/20/2021 21:53:04 - INFO - __main__ - Step 34150: {'lr': 0.00019961055389170696, 'samples': 1092800, 'steps': 2134, 'loss/train': 1.92636239528656} -09/20/2021 21:53:04 - INFO - __main__ - Step 34151: {'lr': 0.00019961055389170696, 'samples': 1092832, 'steps': 2134, 'loss/train': 2.599482297897339} -09/20/2021 21:53:05 - INFO - __main__ - Step 34152: {'lr': 0.00019961055389170696, 'samples': 1092864, 'steps': 2134, 'loss/train': 1.5896178483963013} -09/20/2021 21:53:06 - INFO - __main__ - Step 34153: {'lr': 0.00019961055389170696, 'samples': 1092896, 'steps': 2134, 'loss/train': 2.4711263179779053} -09/20/2021 21:53:07 - INFO - __main__ - Step 34154: {'lr': 0.00019961055389170696, 'samples': 1092928, 'steps': 2134, 'loss/train': 2.2818117141723633} -09/20/2021 21:53:07 - INFO - __main__ - Step 34155: {'lr': 0.00019961055389170696, 'samples': 1092960, 'steps': 2134, 'loss/train': 2.250570058822632} -09/20/2021 21:53:08 - INFO - __main__ - Step 34156: {'lr': 0.00019961055389170696, 'samples': 1092992, 'steps': 2134, 'loss/train': 1.8978227376937866} -09/20/2021 21:53:09 - INFO - __main__ - Step 34157: {'lr': 0.00019961055389170696, 'samples': 1093024, 'steps': 2134, 'loss/train': 2.3679473400115967} -09/20/2021 21:53:10 - INFO - __main__ - Step 34158: {'lr': 0.00019961055389170696, 'samples': 1093056, 'steps': 2134, 'loss/train': 2.082909345626831} -09/20/2021 21:53:10 - INFO - __main__ - Step 34159: {'lr': 0.00019961055389170696, 'samples': 1093088, 'steps': 2134, 'loss/train': 0.8705942630767822} -09/20/2021 21:53:11 - INFO - __main__ - Step 34160: {'lr': 0.00019961055389170696, 'samples': 1093120, 'steps': 2134, 'loss/train': 2.693803548812866} -09/20/2021 21:53:12 - INFO - __main__ - Step 34161: {'lr': 0.0001996099912712309, 'samples': 1093152, 'steps': 2135, 'loss/train': 1.8892041444778442} -09/20/2021 21:53:13 - INFO - __main__ - Step 34162: {'lr': 0.0001996099912712309, 'samples': 1093184, 'steps': 2135, 'loss/train': 1.3465137481689453} -09/20/2021 21:53:14 - INFO - __main__ - Step 34163: {'lr': 0.0001996099912712309, 'samples': 1093216, 'steps': 2135, 'loss/train': 2.5286285877227783} -09/20/2021 21:53:15 - INFO - __main__ - Step 34164: {'lr': 0.0001996099912712309, 'samples': 1093248, 'steps': 2135, 'loss/train': 0.7124322056770325} -09/20/2021 21:53:15 - INFO - __main__ - Step 34165: {'lr': 0.0001996099912712309, 'samples': 1093280, 'steps': 2135, 'loss/train': 2.5610361099243164} -09/20/2021 21:53:16 - INFO - __main__ - Step 34166: {'lr': 0.0001996099912712309, 'samples': 1093312, 'steps': 2135, 'loss/train': 2.817223310470581} -09/20/2021 21:53:17 - INFO - __main__ - Step 34167: {'lr': 0.0001996099912712309, 'samples': 1093344, 'steps': 2135, 'loss/train': 2.355870246887207} -09/20/2021 21:53:18 - INFO - __main__ - Step 34168: {'lr': 0.0001996099912712309, 'samples': 1093376, 'steps': 2135, 'loss/train': 1.5003329515457153} -09/20/2021 21:53:18 - INFO - __main__ - Step 34169: {'lr': 0.0001996099912712309, 'samples': 1093408, 'steps': 2135, 'loss/train': 1.496509313583374} -09/20/2021 21:53:19 - INFO - __main__ - Step 34170: {'lr': 0.0001996099912712309, 'samples': 1093440, 'steps': 2135, 'loss/train': 2.459733247756958} -09/20/2021 21:53:20 - INFO - __main__ - Step 34171: {'lr': 0.0001996099912712309, 'samples': 1093472, 'steps': 2135, 'loss/train': 0.7867657542228699} -09/20/2021 21:53:21 - INFO - __main__ - Step 34172: {'lr': 0.0001996099912712309, 'samples': 1093504, 'steps': 2135, 'loss/train': 1.8872904777526855} -09/20/2021 21:53:21 - INFO - __main__ - Step 34173: {'lr': 0.0001996099912712309, 'samples': 1093536, 'steps': 2135, 'loss/train': 2.3002772331237793} -09/20/2021 21:53:22 - INFO - __main__ - Step 34174: {'lr': 0.0001996099912712309, 'samples': 1093568, 'steps': 2135, 'loss/train': 2.1022534370422363} -09/20/2021 21:53:23 - INFO - __main__ - Step 34175: {'lr': 0.0001996099912712309, 'samples': 1093600, 'steps': 2135, 'loss/train': 1.5031650066375732} -09/20/2021 21:53:24 - INFO - __main__ - Step 34176: {'lr': 0.0001996099912712309, 'samples': 1093632, 'steps': 2135, 'loss/train': 2.0050034523010254} -09/20/2021 21:53:25 - INFO - __main__ - Step 34177: {'lr': 0.00019960942824544215, 'samples': 1093664, 'steps': 2136, 'loss/train': 1.3993903398513794} -09/20/2021 21:53:25 - INFO - __main__ - Step 34178: {'lr': 0.00019960942824544215, 'samples': 1093696, 'steps': 2136, 'loss/train': 2.639629364013672} -09/20/2021 21:53:26 - INFO - __main__ - Step 34179: {'lr': 0.00019960942824544215, 'samples': 1093728, 'steps': 2136, 'loss/train': 2.321340799331665} -09/20/2021 21:53:27 - INFO - __main__ - Step 34180: {'lr': 0.00019960942824544215, 'samples': 1093760, 'steps': 2136, 'loss/train': 2.572079658508301} -09/20/2021 21:53:28 - INFO - __main__ - Step 34181: {'lr': 0.00019960942824544215, 'samples': 1093792, 'steps': 2136, 'loss/train': 2.7381985187530518} -09/20/2021 21:53:28 - INFO - __main__ - Step 34182: {'lr': 0.00019960942824544215, 'samples': 1093824, 'steps': 2136, 'loss/train': 3.0944676399230957} -09/20/2021 21:53:29 - INFO - __main__ - Step 34183: {'lr': 0.00019960942824544215, 'samples': 1093856, 'steps': 2136, 'loss/train': 2.5101606845855713} -09/20/2021 21:53:30 - INFO - __main__ - Step 34184: {'lr': 0.00019960942824544215, 'samples': 1093888, 'steps': 2136, 'loss/train': 1.625289797782898} -09/20/2021 21:53:31 - INFO - __main__ - Step 34185: {'lr': 0.00019960942824544215, 'samples': 1093920, 'steps': 2136, 'loss/train': 2.2239794731140137} -09/20/2021 21:53:31 - INFO - __main__ - Step 34186: {'lr': 0.00019960942824544215, 'samples': 1093952, 'steps': 2136, 'loss/train': 1.5599596500396729} -09/20/2021 21:53:32 - INFO - __main__ - Step 34187: {'lr': 0.00019960942824544215, 'samples': 1093984, 'steps': 2136, 'loss/train': 1.8234223127365112} -09/20/2021 21:53:33 - INFO - __main__ - Step 34188: {'lr': 0.00019960942824544215, 'samples': 1094016, 'steps': 2136, 'loss/train': 2.4416494369506836} -09/20/2021 21:53:34 - INFO - __main__ - Step 34189: {'lr': 0.00019960942824544215, 'samples': 1094048, 'steps': 2136, 'loss/train': 2.8431594371795654} -09/20/2021 21:53:34 - INFO - __main__ - Step 34190: {'lr': 0.00019960942824544215, 'samples': 1094080, 'steps': 2136, 'loss/train': 2.136845827102661} -09/20/2021 21:53:35 - INFO - __main__ - Step 34191: {'lr': 0.00019960942824544215, 'samples': 1094112, 'steps': 2136, 'loss/train': 2.626932382583618} -09/20/2021 21:53:36 - INFO - __main__ - Step 34192: {'lr': 0.00019960942824544215, 'samples': 1094144, 'steps': 2136, 'loss/train': 1.1346371173858643} -09/20/2021 21:53:37 - INFO - __main__ - Step 34193: {'lr': 0.000199608864814343, 'samples': 1094176, 'steps': 2137, 'loss/train': 1.6806583404541016} -09/20/2021 21:53:38 - INFO - __main__ - Step 34194: {'lr': 0.000199608864814343, 'samples': 1094208, 'steps': 2137, 'loss/train': 2.736769437789917} -09/20/2021 21:53:39 - INFO - __main__ - Step 34195: {'lr': 0.000199608864814343, 'samples': 1094240, 'steps': 2137, 'loss/train': 1.4124178886413574} -09/20/2021 21:53:40 - INFO - __main__ - Step 34196: {'lr': 0.000199608864814343, 'samples': 1094272, 'steps': 2137, 'loss/train': 2.220165252685547} -09/20/2021 21:53:40 - INFO - __main__ - Step 34197: {'lr': 0.000199608864814343, 'samples': 1094304, 'steps': 2137, 'loss/train': 2.678795576095581} -09/20/2021 21:53:41 - INFO - __main__ - Step 34198: {'lr': 0.000199608864814343, 'samples': 1094336, 'steps': 2137, 'loss/train': 3.0029873847961426} -09/20/2021 21:53:42 - INFO - __main__ - Step 34199: {'lr': 0.000199608864814343, 'samples': 1094368, 'steps': 2137, 'loss/train': 3.0353550910949707} -09/20/2021 21:53:43 - INFO - __main__ - Step 34200: {'lr': 0.000199608864814343, 'samples': 1094400, 'steps': 2137, 'loss/train': 2.4688215255737305} -09/20/2021 21:53:43 - INFO - __main__ - Step 34201: {'lr': 0.000199608864814343, 'samples': 1094432, 'steps': 2137, 'loss/train': 0.6971829533576965} -09/20/2021 21:53:44 - INFO - __main__ - Step 34202: {'lr': 0.000199608864814343, 'samples': 1094464, 'steps': 2137, 'loss/train': 2.4226322174072266} -09/20/2021 21:53:45 - INFO - __main__ - Step 34203: {'lr': 0.000199608864814343, 'samples': 1094496, 'steps': 2137, 'loss/train': 2.4357681274414062} -09/20/2021 21:53:46 - INFO - __main__ - Step 34204: {'lr': 0.000199608864814343, 'samples': 1094528, 'steps': 2137, 'loss/train': 1.997068166732788} -09/20/2021 21:53:46 - INFO - __main__ - Step 34205: {'lr': 0.000199608864814343, 'samples': 1094560, 'steps': 2137, 'loss/train': 0.9433686137199402} -09/20/2021 21:53:47 - INFO - __main__ - Step 34206: {'lr': 0.000199608864814343, 'samples': 1094592, 'steps': 2137, 'loss/train': 2.2353062629699707} -09/20/2021 21:53:48 - INFO - __main__ - Step 34207: {'lr': 0.000199608864814343, 'samples': 1094624, 'steps': 2137, 'loss/train': 1.8798370361328125} -09/20/2021 21:53:49 - INFO - __main__ - Step 34208: {'lr': 0.000199608864814343, 'samples': 1094656, 'steps': 2137, 'loss/train': 2.224008083343506} -09/20/2021 21:53:49 - INFO - __main__ - Step 34209: {'lr': 0.00019960830097793584, 'samples': 1094688, 'steps': 2138, 'loss/train': 2.511451482772827} -09/20/2021 21:53:50 - INFO - __main__ - Step 34210: {'lr': 0.00019960830097793584, 'samples': 1094720, 'steps': 2138, 'loss/train': 2.1167259216308594} -09/20/2021 21:53:51 - INFO - __main__ - Step 34211: {'lr': 0.00019960830097793584, 'samples': 1094752, 'steps': 2138, 'loss/train': 2.493882656097412} -09/20/2021 21:53:52 - INFO - __main__ - Step 34212: {'lr': 0.00019960830097793584, 'samples': 1094784, 'steps': 2138, 'loss/train': 2.2161200046539307} -09/20/2021 21:53:52 - INFO - __main__ - Step 34213: {'lr': 0.00019960830097793584, 'samples': 1094816, 'steps': 2138, 'loss/train': 2.933929204940796} -09/20/2021 21:53:53 - INFO - __main__ - Step 34214: {'lr': 0.00019960830097793584, 'samples': 1094848, 'steps': 2138, 'loss/train': 1.7128041982650757} -09/20/2021 21:53:54 - INFO - __main__ - Step 34215: {'lr': 0.00019960830097793584, 'samples': 1094880, 'steps': 2138, 'loss/train': 2.190185070037842} -09/20/2021 21:53:55 - INFO - __main__ - Step 34216: {'lr': 0.00019960830097793584, 'samples': 1094912, 'steps': 2138, 'loss/train': 2.6047282218933105} -09/20/2021 21:53:55 - INFO - __main__ - Step 34217: {'lr': 0.00019960830097793584, 'samples': 1094944, 'steps': 2138, 'loss/train': 2.814666509628296} -09/20/2021 21:53:56 - INFO - __main__ - Step 34218: {'lr': 0.00019960830097793584, 'samples': 1094976, 'steps': 2138, 'loss/train': 2.409357786178589} -09/20/2021 21:53:57 - INFO - __main__ - Step 34219: {'lr': 0.00019960830097793584, 'samples': 1095008, 'steps': 2138, 'loss/train': 3.597733974456787} -09/20/2021 21:53:58 - INFO - __main__ - Step 34220: {'lr': 0.00019960830097793584, 'samples': 1095040, 'steps': 2138, 'loss/train': 2.4175522327423096} -09/20/2021 21:53:58 - INFO - __main__ - Step 34221: {'lr': 0.00019960830097793584, 'samples': 1095072, 'steps': 2138, 'loss/train': 2.4022278785705566} -09/20/2021 21:53:59 - INFO - __main__ - Step 34222: {'lr': 0.00019960830097793584, 'samples': 1095104, 'steps': 2138, 'loss/train': 2.1965956687927246} -09/20/2021 21:54:00 - INFO - __main__ - Step 34223: {'lr': 0.00019960830097793584, 'samples': 1095136, 'steps': 2138, 'loss/train': 2.48464035987854} -09/20/2021 21:54:02 - INFO - __main__ - Step 34224: {'lr': 0.00019960830097793584, 'samples': 1095168, 'steps': 2138, 'loss/train': 2.686427116394043} -09/20/2021 21:54:03 - INFO - __main__ - Step 34225: {'lr': 0.00019960773673622284, 'samples': 1095200, 'steps': 2139, 'loss/train': 2.3345296382904053} -09/20/2021 21:54:03 - INFO - __main__ - Step 34226: {'lr': 0.00019960773673622284, 'samples': 1095232, 'steps': 2139, 'loss/train': 2.25765061378479} -09/20/2021 21:54:04 - INFO - __main__ - Step 34227: {'lr': 0.00019960773673622284, 'samples': 1095264, 'steps': 2139, 'loss/train': 2.041804075241089} -09/20/2021 21:54:05 - INFO - __main__ - Step 34228: {'lr': 0.00019960773673622284, 'samples': 1095296, 'steps': 2139, 'loss/train': 3.6559946537017822} -09/20/2021 21:54:06 - INFO - __main__ - Step 34229: {'lr': 0.00019960773673622284, 'samples': 1095328, 'steps': 2139, 'loss/train': 2.651869058609009} -09/20/2021 21:54:06 - INFO - __main__ - Step 34230: {'lr': 0.00019960773673622284, 'samples': 1095360, 'steps': 2139, 'loss/train': 2.7252981662750244} -09/20/2021 21:54:07 - INFO - __main__ - Step 34231: {'lr': 0.00019960773673622284, 'samples': 1095392, 'steps': 2139, 'loss/train': 2.559964895248413} -09/20/2021 21:54:08 - INFO - __main__ - Step 34232: {'lr': 0.00019960773673622284, 'samples': 1095424, 'steps': 2139, 'loss/train': 2.3256776332855225} -09/20/2021 21:54:09 - INFO - __main__ - Step 34233: {'lr': 0.00019960773673622284, 'samples': 1095456, 'steps': 2139, 'loss/train': 2.617098093032837} -09/20/2021 21:54:09 - INFO - __main__ - Step 34234: {'lr': 0.00019960773673622284, 'samples': 1095488, 'steps': 2139, 'loss/train': 2.4093151092529297} -09/20/2021 21:54:10 - INFO - __main__ - Step 34235: {'lr': 0.00019960773673622284, 'samples': 1095520, 'steps': 2139, 'loss/train': 2.181367874145508} -09/20/2021 21:54:11 - INFO - __main__ - Step 34236: {'lr': 0.00019960773673622284, 'samples': 1095552, 'steps': 2139, 'loss/train': 2.073470115661621} -09/20/2021 21:54:12 - INFO - __main__ - Step 34237: {'lr': 0.00019960773673622284, 'samples': 1095584, 'steps': 2139, 'loss/train': 2.214639902114868} -09/20/2021 21:54:12 - INFO - __main__ - Step 34238: {'lr': 0.00019960773673622284, 'samples': 1095616, 'steps': 2139, 'loss/train': 2.077491521835327} -09/20/2021 21:54:13 - INFO - __main__ - Step 34239: {'lr': 0.00019960773673622284, 'samples': 1095648, 'steps': 2139, 'loss/train': 2.8209924697875977} -09/20/2021 21:54:14 - INFO - __main__ - Step 34240: {'lr': 0.00019960773673622284, 'samples': 1095680, 'steps': 2139, 'loss/train': 2.3686602115631104} -09/20/2021 21:54:15 - INFO - __main__ - Step 34241: {'lr': 0.00019960717208920633, 'samples': 1095712, 'steps': 2140, 'loss/train': 2.597057580947876} -09/20/2021 21:54:16 - INFO - __main__ - Step 34242: {'lr': 0.00019960717208920633, 'samples': 1095744, 'steps': 2140, 'loss/train': 1.961283564567566} -09/20/2021 21:54:16 - INFO - __main__ - Step 34243: {'lr': 0.00019960717208920633, 'samples': 1095776, 'steps': 2140, 'loss/train': 2.275177240371704} -09/20/2021 21:54:17 - INFO - __main__ - Step 34244: {'lr': 0.00019960717208920633, 'samples': 1095808, 'steps': 2140, 'loss/train': 1.794419288635254} -09/20/2021 21:54:18 - INFO - __main__ - Step 34245: {'lr': 0.00019960717208920633, 'samples': 1095840, 'steps': 2140, 'loss/train': 2.11637544631958} -09/20/2021 21:54:19 - INFO - __main__ - Step 34246: {'lr': 0.00019960717208920633, 'samples': 1095872, 'steps': 2140, 'loss/train': 2.091059446334839} -09/20/2021 21:54:19 - INFO - __main__ - Step 34247: {'lr': 0.00019960717208920633, 'samples': 1095904, 'steps': 2140, 'loss/train': 2.299866199493408} -09/20/2021 21:54:20 - INFO - __main__ - Step 34248: {'lr': 0.00019960717208920633, 'samples': 1095936, 'steps': 2140, 'loss/train': 2.266094207763672} -09/20/2021 21:54:21 - INFO - __main__ - Step 34249: {'lr': 0.00019960717208920633, 'samples': 1095968, 'steps': 2140, 'loss/train': 1.980805516242981} -09/20/2021 21:54:22 - INFO - __main__ - Step 34250: {'lr': 0.00019960717208920633, 'samples': 1096000, 'steps': 2140, 'loss/train': 0.1649172604084015} -09/20/2021 21:54:22 - INFO - __main__ - Step 34251: {'lr': 0.00019960717208920633, 'samples': 1096032, 'steps': 2140, 'loss/train': 0.1891452819108963} -09/20/2021 21:54:23 - INFO - __main__ - Step 34252: {'lr': 0.00019960717208920633, 'samples': 1096064, 'steps': 2140, 'loss/train': 2.5181663036346436} -09/20/2021 21:54:24 - INFO - __main__ - Step 34253: {'lr': 0.00019960717208920633, 'samples': 1096096, 'steps': 2140, 'loss/train': 1.9389539957046509} -09/20/2021 21:54:25 - INFO - __main__ - Step 34254: {'lr': 0.00019960717208920633, 'samples': 1096128, 'steps': 2140, 'loss/train': 1.9283353090286255} -09/20/2021 21:54:26 - INFO - __main__ - Step 34255: {'lr': 0.00019960717208920633, 'samples': 1096160, 'steps': 2140, 'loss/train': 3.0862913131713867} -09/20/2021 21:54:27 - INFO - __main__ - Step 34256: {'lr': 0.00019960717208920633, 'samples': 1096192, 'steps': 2140, 'loss/train': 1.4461508989334106} -09/20/2021 21:54:28 - INFO - __main__ - Step 34257: {'lr': 0.00019960660703688868, 'samples': 1096224, 'steps': 2141, 'loss/train': 1.8931496143341064} -09/20/2021 21:54:28 - INFO - __main__ - Step 34258: {'lr': 0.00019960660703688868, 'samples': 1096256, 'steps': 2141, 'loss/train': 2.749638080596924} -09/20/2021 21:54:29 - INFO - __main__ - Step 34259: {'lr': 0.00019960660703688868, 'samples': 1096288, 'steps': 2141, 'loss/train': 1.8745166063308716} -09/20/2021 21:54:30 - INFO - __main__ - Step 34260: {'lr': 0.00019960660703688868, 'samples': 1096320, 'steps': 2141, 'loss/train': 1.3718476295471191} -09/20/2021 21:54:31 - INFO - __main__ - Step 34261: {'lr': 0.00019960660703688868, 'samples': 1096352, 'steps': 2141, 'loss/train': 2.122243881225586} -09/20/2021 21:54:31 - INFO - __main__ - Step 34262: {'lr': 0.00019960660703688868, 'samples': 1096384, 'steps': 2141, 'loss/train': 2.1075706481933594} -09/20/2021 21:54:32 - INFO - __main__ - Step 34263: {'lr': 0.00019960660703688868, 'samples': 1096416, 'steps': 2141, 'loss/train': 2.408688545227051} -09/20/2021 21:54:33 - INFO - __main__ - Step 34264: {'lr': 0.00019960660703688868, 'samples': 1096448, 'steps': 2141, 'loss/train': 1.283850908279419} -09/20/2021 21:54:34 - INFO - __main__ - Step 34265: {'lr': 0.00019960660703688868, 'samples': 1096480, 'steps': 2141, 'loss/train': 2.5510997772216797} -09/20/2021 21:54:34 - INFO - __main__ - Step 34266: {'lr': 0.00019960660703688868, 'samples': 1096512, 'steps': 2141, 'loss/train': 2.5430691242218018} -09/20/2021 21:54:35 - INFO - __main__ - Step 34267: {'lr': 0.00019960660703688868, 'samples': 1096544, 'steps': 2141, 'loss/train': 2.158134698867798} -09/20/2021 21:54:36 - INFO - __main__ - Step 34268: {'lr': 0.00019960660703688868, 'samples': 1096576, 'steps': 2141, 'loss/train': 3.195964813232422} -09/20/2021 21:54:37 - INFO - __main__ - Step 34269: {'lr': 0.00019960660703688868, 'samples': 1096608, 'steps': 2141, 'loss/train': 2.4457943439483643} -09/20/2021 21:54:37 - INFO - __main__ - Step 34270: {'lr': 0.00019960660703688868, 'samples': 1096640, 'steps': 2141, 'loss/train': 1.4885706901550293} -09/20/2021 21:54:38 - INFO - __main__ - Step 34271: {'lr': 0.00019960660703688868, 'samples': 1096672, 'steps': 2141, 'loss/train': 2.4836056232452393} -09/20/2021 21:54:39 - INFO - __main__ - Step 34272: {'lr': 0.00019960660703688868, 'samples': 1096704, 'steps': 2141, 'loss/train': 1.5365185737609863} -09/20/2021 21:54:40 - INFO - __main__ - Step 34273: {'lr': 0.00019960604157927208, 'samples': 1096736, 'steps': 2142, 'loss/train': 2.218439817428589} -09/20/2021 21:54:41 - INFO - __main__ - Step 34274: {'lr': 0.00019960604157927208, 'samples': 1096768, 'steps': 2142, 'loss/train': 2.3306679725646973} -09/20/2021 21:54:41 - INFO - __main__ - Step 34275: {'lr': 0.00019960604157927208, 'samples': 1096800, 'steps': 2142, 'loss/train': 2.8659820556640625} -09/20/2021 21:54:42 - INFO - __main__ - Step 34276: {'lr': 0.00019960604157927208, 'samples': 1096832, 'steps': 2142, 'loss/train': 2.6646835803985596} -09/20/2021 21:54:43 - INFO - __main__ - Step 34277: {'lr': 0.00019960604157927208, 'samples': 1096864, 'steps': 2142, 'loss/train': 1.9462025165557861} -09/20/2021 21:54:44 - INFO - __main__ - Step 34278: {'lr': 0.00019960604157927208, 'samples': 1096896, 'steps': 2142, 'loss/train': 2.1464295387268066} -09/20/2021 21:54:44 - INFO - __main__ - Step 34279: {'lr': 0.00019960604157927208, 'samples': 1096928, 'steps': 2142, 'loss/train': 1.783980369567871} -09/20/2021 21:54:45 - INFO - __main__ - Step 34280: {'lr': 0.00019960604157927208, 'samples': 1096960, 'steps': 2142, 'loss/train': 1.9379537105560303} -09/20/2021 21:54:46 - INFO - __main__ - Step 34281: {'lr': 0.00019960604157927208, 'samples': 1096992, 'steps': 2142, 'loss/train': 1.860625147819519} -09/20/2021 21:54:47 - INFO - __main__ - Step 34282: {'lr': 0.00019960604157927208, 'samples': 1097024, 'steps': 2142, 'loss/train': 2.917495012283325} -09/20/2021 21:54:47 - INFO - __main__ - Step 34283: {'lr': 0.00019960604157927208, 'samples': 1097056, 'steps': 2142, 'loss/train': 2.6382389068603516} -09/20/2021 21:54:49 - INFO - __main__ - Step 34284: {'lr': 0.00019960604157927208, 'samples': 1097088, 'steps': 2142, 'loss/train': 1.3852527141571045} -09/20/2021 21:54:49 - INFO - __main__ - Step 34285: {'lr': 0.00019960604157927208, 'samples': 1097120, 'steps': 2142, 'loss/train': 1.9656797647476196} -09/20/2021 21:54:50 - INFO - __main__ - Step 34286: {'lr': 0.00019960604157927208, 'samples': 1097152, 'steps': 2142, 'loss/train': 2.4408695697784424} -09/20/2021 21:54:51 - INFO - __main__ - Step 34287: {'lr': 0.00019960604157927208, 'samples': 1097184, 'steps': 2142, 'loss/train': 2.8729259967803955} -09/20/2021 21:54:52 - INFO - __main__ - Step 34288: {'lr': 0.00019960604157927208, 'samples': 1097216, 'steps': 2142, 'loss/train': 3.072242021560669} -09/20/2021 21:54:52 - INFO - __main__ - Step 34289: {'lr': 0.00019960547571635888, 'samples': 1097248, 'steps': 2143, 'loss/train': 2.21712064743042} -09/20/2021 21:54:53 - INFO - __main__ - Step 34290: {'lr': 0.00019960547571635888, 'samples': 1097280, 'steps': 2143, 'loss/train': 2.15283465385437} -09/20/2021 21:54:54 - INFO - __main__ - Step 34291: {'lr': 0.00019960547571635888, 'samples': 1097312, 'steps': 2143, 'loss/train': 2.3206727504730225} -09/20/2021 21:54:55 - INFO - __main__ - Step 34292: {'lr': 0.00019960547571635888, 'samples': 1097344, 'steps': 2143, 'loss/train': 1.9139059782028198} -09/20/2021 21:54:55 - INFO - __main__ - Step 34293: {'lr': 0.00019960547571635888, 'samples': 1097376, 'steps': 2143, 'loss/train': 1.8809901475906372} -09/20/2021 21:54:56 - INFO - __main__ - Step 34294: {'lr': 0.00019960547571635888, 'samples': 1097408, 'steps': 2143, 'loss/train': 2.484445095062256} -09/20/2021 21:54:57 - INFO - __main__ - Step 34295: {'lr': 0.00019960547571635888, 'samples': 1097440, 'steps': 2143, 'loss/train': 2.1556644439697266} -09/20/2021 21:54:58 - INFO - __main__ - Step 34296: {'lr': 0.00019960547571635888, 'samples': 1097472, 'steps': 2143, 'loss/train': 2.6876676082611084} -09/20/2021 21:54:58 - INFO - __main__ - Step 34297: {'lr': 0.00019960547571635888, 'samples': 1097504, 'steps': 2143, 'loss/train': 2.5746405124664307} -09/20/2021 21:54:59 - INFO - __main__ - Step 34298: {'lr': 0.00019960547571635888, 'samples': 1097536, 'steps': 2143, 'loss/train': 2.692314624786377} -09/20/2021 21:55:00 - INFO - __main__ - Step 34299: {'lr': 0.00019960547571635888, 'samples': 1097568, 'steps': 2143, 'loss/train': 3.0799267292022705} -09/20/2021 21:55:01 - INFO - __main__ - Step 34300: {'lr': 0.00019960547571635888, 'samples': 1097600, 'steps': 2143, 'loss/train': 0.9894548058509827} -09/20/2021 21:55:01 - INFO - __main__ - Step 34301: {'lr': 0.00019960547571635888, 'samples': 1097632, 'steps': 2143, 'loss/train': 2.375188112258911} -09/20/2021 21:55:02 - INFO - __main__ - Step 34302: {'lr': 0.00019960547571635888, 'samples': 1097664, 'steps': 2143, 'loss/train': 2.9035160541534424} -09/20/2021 21:55:03 - INFO - __main__ - Step 34303: {'lr': 0.00019960547571635888, 'samples': 1097696, 'steps': 2143, 'loss/train': 1.777360200881958} -09/20/2021 21:55:04 - INFO - __main__ - Step 34304: {'lr': 0.00019960547571635888, 'samples': 1097728, 'steps': 2143, 'loss/train': 2.2866296768188477} -09/20/2021 21:55:05 - INFO - __main__ - Step 34305: {'lr': 0.00019960490944815143, 'samples': 1097760, 'steps': 2144, 'loss/train': 2.042402982711792} -09/20/2021 21:55:05 - INFO - __main__ - Step 34306: {'lr': 0.00019960490944815143, 'samples': 1097792, 'steps': 2144, 'loss/train': 1.796627163887024} -09/20/2021 21:55:06 - INFO - __main__ - Step 34307: {'lr': 0.00019960490944815143, 'samples': 1097824, 'steps': 2144, 'loss/train': 2.1287360191345215} -09/20/2021 21:55:07 - INFO - __main__ - Step 34308: {'lr': 0.00019960490944815143, 'samples': 1097856, 'steps': 2144, 'loss/train': 1.9583611488342285} -09/20/2021 21:55:08 - INFO - __main__ - Step 34309: {'lr': 0.00019960490944815143, 'samples': 1097888, 'steps': 2144, 'loss/train': 2.5787365436553955} -09/20/2021 21:55:08 - INFO - __main__ - Step 34310: {'lr': 0.00019960490944815143, 'samples': 1097920, 'steps': 2144, 'loss/train': 2.702086925506592} -09/20/2021 21:55:09 - INFO - __main__ - Step 34311: {'lr': 0.00019960490944815143, 'samples': 1097952, 'steps': 2144, 'loss/train': 2.2380404472351074} -09/20/2021 21:55:10 - INFO - __main__ - Step 34312: {'lr': 0.00019960490944815143, 'samples': 1097984, 'steps': 2144, 'loss/train': 2.4451799392700195} -09/20/2021 21:55:11 - INFO - __main__ - Step 34313: {'lr': 0.00019960490944815143, 'samples': 1098016, 'steps': 2144, 'loss/train': 2.0142946243286133} -09/20/2021 21:55:11 - INFO - __main__ - Step 34314: {'lr': 0.00019960490944815143, 'samples': 1098048, 'steps': 2144, 'loss/train': 2.0177605152130127} -09/20/2021 21:55:13 - INFO - __main__ - Step 34315: {'lr': 0.00019960490944815143, 'samples': 1098080, 'steps': 2144, 'loss/train': 1.963340163230896} -09/20/2021 21:55:13 - INFO - __main__ - Step 34316: {'lr': 0.00019960490944815143, 'samples': 1098112, 'steps': 2144, 'loss/train': 2.5983378887176514} -09/20/2021 21:55:14 - INFO - __main__ - Step 34317: {'lr': 0.00019960490944815143, 'samples': 1098144, 'steps': 2144, 'loss/train': 2.1406748294830322} -09/20/2021 21:55:15 - INFO - __main__ - Step 34318: {'lr': 0.00019960490944815143, 'samples': 1098176, 'steps': 2144, 'loss/train': 2.4838712215423584} -09/20/2021 21:55:16 - INFO - __main__ - Step 34319: {'lr': 0.00019960490944815143, 'samples': 1098208, 'steps': 2144, 'loss/train': 2.918088912963867} -09/20/2021 21:55:16 - INFO - __main__ - Step 34320: {'lr': 0.00019960490944815143, 'samples': 1098240, 'steps': 2144, 'loss/train': 1.7916821241378784} -09/20/2021 21:55:17 - INFO - __main__ - Step 34321: {'lr': 0.00019960434277465193, 'samples': 1098272, 'steps': 2145, 'loss/train': 3.0164425373077393} -09/20/2021 21:55:18 - INFO - __main__ - Step 34322: {'lr': 0.00019960434277465193, 'samples': 1098304, 'steps': 2145, 'loss/train': 2.937323808670044} -09/20/2021 21:55:19 - INFO - __main__ - Step 34323: {'lr': 0.00019960434277465193, 'samples': 1098336, 'steps': 2145, 'loss/train': 2.683309316635132} -09/20/2021 21:55:19 - INFO - __main__ - Step 34324: {'lr': 0.00019960434277465193, 'samples': 1098368, 'steps': 2145, 'loss/train': 2.578488826751709} -09/20/2021 21:55:20 - INFO - __main__ - Step 34325: {'lr': 0.00019960434277465193, 'samples': 1098400, 'steps': 2145, 'loss/train': 2.8245413303375244} -09/20/2021 21:55:21 - INFO - __main__ - Step 34326: {'lr': 0.00019960434277465193, 'samples': 1098432, 'steps': 2145, 'loss/train': 1.6701322793960571} -09/20/2021 21:55:22 - INFO - __main__ - Step 34327: {'lr': 0.00019960434277465193, 'samples': 1098464, 'steps': 2145, 'loss/train': 1.9027957916259766} -09/20/2021 21:55:22 - INFO - __main__ - Step 34328: {'lr': 0.00019960434277465193, 'samples': 1098496, 'steps': 2145, 'loss/train': 2.2633042335510254} -09/20/2021 21:55:23 - INFO - __main__ - Step 34329: {'lr': 0.00019960434277465193, 'samples': 1098528, 'steps': 2145, 'loss/train': 2.602377414703369} -09/20/2021 21:55:24 - INFO - __main__ - Step 34330: {'lr': 0.00019960434277465193, 'samples': 1098560, 'steps': 2145, 'loss/train': 2.6452505588531494} -09/20/2021 21:55:25 - INFO - __main__ - Step 34331: {'lr': 0.00019960434277465193, 'samples': 1098592, 'steps': 2145, 'loss/train': 1.8514689207077026} -09/20/2021 21:55:25 - INFO - __main__ - Step 34332: {'lr': 0.00019960434277465193, 'samples': 1098624, 'steps': 2145, 'loss/train': 2.7941701412200928} -09/20/2021 21:55:26 - INFO - __main__ - Step 34333: {'lr': 0.00019960434277465193, 'samples': 1098656, 'steps': 2145, 'loss/train': 3.020660877227783} -09/20/2021 21:55:27 - INFO - __main__ - Step 34334: {'lr': 0.00019960434277465193, 'samples': 1098688, 'steps': 2145, 'loss/train': 1.7740588188171387} -09/20/2021 21:55:28 - INFO - __main__ - Step 34335: {'lr': 0.00019960434277465193, 'samples': 1098720, 'steps': 2145, 'loss/train': 2.9612061977386475} -09/20/2021 21:55:28 - INFO - __main__ - Step 34336: {'lr': 0.00019960434277465193, 'samples': 1098752, 'steps': 2145, 'loss/train': 1.64840567111969} -09/20/2021 21:55:29 - INFO - __main__ - Step 34337: {'lr': 0.00019960377569586281, 'samples': 1098784, 'steps': 2146, 'loss/train': 1.7921491861343384} -09/20/2021 21:55:30 - INFO - __main__ - Step 34338: {'lr': 0.00019960377569586281, 'samples': 1098816, 'steps': 2146, 'loss/train': 1.9584466218948364} -09/20/2021 21:55:31 - INFO - __main__ - Step 34339: {'lr': 0.00019960377569586281, 'samples': 1098848, 'steps': 2146, 'loss/train': 1.4602619409561157} -09/20/2021 21:55:32 - INFO - __main__ - Step 34340: {'lr': 0.00019960377569586281, 'samples': 1098880, 'steps': 2146, 'loss/train': 2.394443988800049} -09/20/2021 21:55:32 - INFO - __main__ - Step 34341: {'lr': 0.00019960377569586281, 'samples': 1098912, 'steps': 2146, 'loss/train': 2.8210854530334473} -09/20/2021 21:55:33 - INFO - __main__ - Step 34342: {'lr': 0.00019960377569586281, 'samples': 1098944, 'steps': 2146, 'loss/train': 2.6871988773345947} -09/20/2021 21:55:34 - INFO - __main__ - Step 34343: {'lr': 0.00019960377569586281, 'samples': 1098976, 'steps': 2146, 'loss/train': 2.036890745162964} -09/20/2021 21:55:35 - INFO - __main__ - Step 34344: {'lr': 0.00019960377569586281, 'samples': 1099008, 'steps': 2146, 'loss/train': 2.7496485710144043} -09/20/2021 21:55:35 - INFO - __main__ - Step 34345: {'lr': 0.00019960377569586281, 'samples': 1099040, 'steps': 2146, 'loss/train': 2.077348232269287} -09/20/2021 21:55:37 - INFO - __main__ - Step 34346: {'lr': 0.00019960377569586281, 'samples': 1099072, 'steps': 2146, 'loss/train': 2.3374862670898438} -09/20/2021 21:55:37 - INFO - __main__ - Step 34347: {'lr': 0.00019960377569586281, 'samples': 1099104, 'steps': 2146, 'loss/train': 2.2642056941986084} -09/20/2021 21:55:38 - INFO - __main__ - Step 34348: {'lr': 0.00019960377569586281, 'samples': 1099136, 'steps': 2146, 'loss/train': 1.9608546495437622} -09/20/2021 21:55:39 - INFO - __main__ - Step 34349: {'lr': 0.00019960377569586281, 'samples': 1099168, 'steps': 2146, 'loss/train': 0.14577557146549225} -09/20/2021 21:55:40 - INFO - __main__ - Step 34350: {'lr': 0.00019960377569586281, 'samples': 1099200, 'steps': 2146, 'loss/train': 0.43117576837539673} -09/20/2021 21:55:40 - INFO - __main__ - Step 34351: {'lr': 0.00019960377569586281, 'samples': 1099232, 'steps': 2146, 'loss/train': 2.2718653678894043} -09/20/2021 21:55:41 - INFO - __main__ - Step 34352: {'lr': 0.00019960377569586281, 'samples': 1099264, 'steps': 2146, 'loss/train': 3.1698381900787354} -09/20/2021 21:55:42 - INFO - __main__ - Step 34353: {'lr': 0.0001996032082117863, 'samples': 1099296, 'steps': 2147, 'loss/train': 2.423076629638672} -09/20/2021 21:55:43 - INFO - __main__ - Step 34354: {'lr': 0.0001996032082117863, 'samples': 1099328, 'steps': 2147, 'loss/train': 2.18228816986084} -09/20/2021 21:55:43 - INFO - __main__ - Step 34355: {'lr': 0.0001996032082117863, 'samples': 1099360, 'steps': 2147, 'loss/train': 2.2209603786468506} -09/20/2021 21:55:44 - INFO - __main__ - Step 34356: {'lr': 0.0001996032082117863, 'samples': 1099392, 'steps': 2147, 'loss/train': 2.1778366565704346} -09/20/2021 21:55:45 - INFO - __main__ - Step 34357: {'lr': 0.0001996032082117863, 'samples': 1099424, 'steps': 2147, 'loss/train': 1.7795108556747437} -09/20/2021 21:55:46 - INFO - __main__ - Step 34358: {'lr': 0.0001996032082117863, 'samples': 1099456, 'steps': 2147, 'loss/train': 1.7881401777267456} -09/20/2021 21:55:46 - INFO - __main__ - Step 34359: {'lr': 0.0001996032082117863, 'samples': 1099488, 'steps': 2147, 'loss/train': 2.473334550857544} -09/20/2021 21:55:47 - INFO - __main__ - Step 34360: {'lr': 0.0001996032082117863, 'samples': 1099520, 'steps': 2147, 'loss/train': 2.4760682582855225} -09/20/2021 21:55:48 - INFO - __main__ - Step 34361: {'lr': 0.0001996032082117863, 'samples': 1099552, 'steps': 2147, 'loss/train': 3.0159897804260254} -09/20/2021 21:55:49 - INFO - __main__ - Step 34362: {'lr': 0.0001996032082117863, 'samples': 1099584, 'steps': 2147, 'loss/train': 1.8459516763687134} -09/20/2021 21:55:49 - INFO - __main__ - Step 34363: {'lr': 0.0001996032082117863, 'samples': 1099616, 'steps': 2147, 'loss/train': 1.6122384071350098} -09/20/2021 21:55:50 - INFO - __main__ - Step 34364: {'lr': 0.0001996032082117863, 'samples': 1099648, 'steps': 2147, 'loss/train': 2.449883460998535} -09/20/2021 21:55:51 - INFO - __main__ - Step 34365: {'lr': 0.0001996032082117863, 'samples': 1099680, 'steps': 2147, 'loss/train': 2.0659101009368896} -09/20/2021 21:55:52 - INFO - __main__ - Step 34366: {'lr': 0.0001996032082117863, 'samples': 1099712, 'steps': 2147, 'loss/train': 2.4401941299438477} -09/20/2021 21:55:52 - INFO - __main__ - Step 34367: {'lr': 0.0001996032082117863, 'samples': 1099744, 'steps': 2147, 'loss/train': 1.9375613927841187} -09/20/2021 21:55:53 - INFO - __main__ - Step 34368: {'lr': 0.0001996032082117863, 'samples': 1099776, 'steps': 2147, 'loss/train': 3.1680707931518555} -09/20/2021 21:55:54 - INFO - __main__ - Step 34369: {'lr': 0.0001996026403224247, 'samples': 1099808, 'steps': 2148, 'loss/train': 1.3423696756362915} -09/20/2021 21:55:55 - INFO - __main__ - Step 34370: {'lr': 0.0001996026403224247, 'samples': 1099840, 'steps': 2148, 'loss/train': 1.4575713872909546} -09/20/2021 21:55:56 - INFO - __main__ - Step 34371: {'lr': 0.0001996026403224247, 'samples': 1099872, 'steps': 2148, 'loss/train': 3.311439275741577} -09/20/2021 21:55:56 - INFO - __main__ - Step 34372: {'lr': 0.0001996026403224247, 'samples': 1099904, 'steps': 2148, 'loss/train': 1.7848149538040161} -09/20/2021 21:55:57 - INFO - __main__ - Step 34373: {'lr': 0.0001996026403224247, 'samples': 1099936, 'steps': 2148, 'loss/train': 1.9202910661697388} -09/20/2021 21:55:58 - INFO - __main__ - Step 34374: {'lr': 0.0001996026403224247, 'samples': 1099968, 'steps': 2148, 'loss/train': 2.1460323333740234} -09/20/2021 21:55:59 - INFO - __main__ - Step 34375: {'lr': 0.0001996026403224247, 'samples': 1100000, 'steps': 2148, 'loss/train': 2.5711841583251953} -09/20/2021 21:56:00 - INFO - __main__ - Step 34376: {'lr': 0.0001996026403224247, 'samples': 1100032, 'steps': 2148, 'loss/train': 2.5881190299987793} -09/20/2021 21:56:01 - INFO - __main__ - Step 34377: {'lr': 0.0001996026403224247, 'samples': 1100064, 'steps': 2148, 'loss/train': 2.406693458557129} -09/20/2021 21:56:01 - INFO - __main__ - Step 34378: {'lr': 0.0001996026403224247, 'samples': 1100096, 'steps': 2148, 'loss/train': 2.327854871749878} -09/20/2021 21:56:02 - INFO - __main__ - Step 34379: {'lr': 0.0001996026403224247, 'samples': 1100128, 'steps': 2148, 'loss/train': 1.412043571472168} -09/20/2021 21:56:03 - INFO - __main__ - Step 34380: {'lr': 0.0001996026403224247, 'samples': 1100160, 'steps': 2148, 'loss/train': 2.238509178161621} -09/20/2021 21:56:04 - INFO - __main__ - Step 34381: {'lr': 0.0001996026403224247, 'samples': 1100192, 'steps': 2148, 'loss/train': 1.9974583387374878} -09/20/2021 21:56:04 - INFO - __main__ - Step 34382: {'lr': 0.0001996026403224247, 'samples': 1100224, 'steps': 2148, 'loss/train': 2.49200177192688} -09/20/2021 21:56:05 - INFO - __main__ - Step 34383: {'lr': 0.0001996026403224247, 'samples': 1100256, 'steps': 2148, 'loss/train': 2.1651053428649902} -09/20/2021 21:56:06 - INFO - __main__ - Step 34384: {'lr': 0.0001996026403224247, 'samples': 1100288, 'steps': 2148, 'loss/train': 3.5566318035125732} -09/20/2021 21:56:07 - INFO - __main__ - Step 34385: {'lr': 0.00019960207202778034, 'samples': 1100320, 'steps': 2149, 'loss/train': 2.0582082271575928} -09/20/2021 21:56:07 - INFO - __main__ - Step 34386: {'lr': 0.00019960207202778034, 'samples': 1100352, 'steps': 2149, 'loss/train': 2.245626926422119} -09/20/2021 21:56:08 - INFO - __main__ - Step 34387: {'lr': 0.00019960207202778034, 'samples': 1100384, 'steps': 2149, 'loss/train': 2.097005844116211} -09/20/2021 21:56:09 - INFO - __main__ - Step 34388: {'lr': 0.00019960207202778034, 'samples': 1100416, 'steps': 2149, 'loss/train': 2.097987413406372} -09/20/2021 21:56:10 - INFO - __main__ - Step 34389: {'lr': 0.00019960207202778034, 'samples': 1100448, 'steps': 2149, 'loss/train': 1.0307422876358032} -09/20/2021 21:56:10 - INFO - __main__ - Step 34390: {'lr': 0.00019960207202778034, 'samples': 1100480, 'steps': 2149, 'loss/train': 2.4631619453430176} -09/20/2021 21:56:11 - INFO - __main__ - Step 34391: {'lr': 0.00019960207202778034, 'samples': 1100512, 'steps': 2149, 'loss/train': 2.8185975551605225} -09/20/2021 21:56:12 - INFO - __main__ - Step 34392: {'lr': 0.00019960207202778034, 'samples': 1100544, 'steps': 2149, 'loss/train': 1.9050384759902954} -09/20/2021 21:56:13 - INFO - __main__ - Step 34393: {'lr': 0.00019960207202778034, 'samples': 1100576, 'steps': 2149, 'loss/train': 1.4296454191207886} -09/20/2021 21:56:14 - INFO - __main__ - Step 34394: {'lr': 0.00019960207202778034, 'samples': 1100608, 'steps': 2149, 'loss/train': 3.218687057495117} -09/20/2021 21:56:14 - INFO - __main__ - Step 34395: {'lr': 0.00019960207202778034, 'samples': 1100640, 'steps': 2149, 'loss/train': 0.32846471667289734} -09/20/2021 21:56:15 - INFO - __main__ - Step 34396: {'lr': 0.00019960207202778034, 'samples': 1100672, 'steps': 2149, 'loss/train': 1.8177098035812378} -09/20/2021 21:56:16 - INFO - __main__ - Step 34397: {'lr': 0.00019960207202778034, 'samples': 1100704, 'steps': 2149, 'loss/train': 2.2222323417663574} -09/20/2021 21:56:17 - INFO - __main__ - Step 34398: {'lr': 0.00019960207202778034, 'samples': 1100736, 'steps': 2149, 'loss/train': 1.810217261314392} -09/20/2021 21:56:17 - INFO - __main__ - Step 34399: {'lr': 0.00019960207202778034, 'samples': 1100768, 'steps': 2149, 'loss/train': 0.23375433683395386} -09/20/2021 21:56:18 - INFO - __main__ - Step 34400: {'lr': 0.00019960207202778034, 'samples': 1100800, 'steps': 2149, 'loss/train': 2.651799201965332} -09/20/2021 21:56:19 - INFO - __main__ - Step 34401: {'lr': 0.00019960150332785554, 'samples': 1100832, 'steps': 2150, 'loss/train': 2.642502546310425} -09/20/2021 21:56:20 - INFO - __main__ - Step 34402: {'lr': 0.00019960150332785554, 'samples': 1100864, 'steps': 2150, 'loss/train': 1.0480599403381348} -09/20/2021 21:56:20 - INFO - __main__ - Step 34403: {'lr': 0.00019960150332785554, 'samples': 1100896, 'steps': 2150, 'loss/train': 2.970036268234253} -09/20/2021 21:56:21 - INFO - __main__ - Step 34404: {'lr': 0.00019960150332785554, 'samples': 1100928, 'steps': 2150, 'loss/train': 2.7681572437286377} -09/20/2021 21:56:22 - INFO - __main__ - Step 34405: {'lr': 0.00019960150332785554, 'samples': 1100960, 'steps': 2150, 'loss/train': 2.701080083847046} -09/20/2021 21:56:23 - INFO - __main__ - Step 34406: {'lr': 0.00019960150332785554, 'samples': 1100992, 'steps': 2150, 'loss/train': 1.1637260913848877} -09/20/2021 21:56:24 - INFO - __main__ - Step 34407: {'lr': 0.00019960150332785554, 'samples': 1101024, 'steps': 2150, 'loss/train': 3.052448034286499} -09/20/2021 21:56:25 - INFO - __main__ - Step 34408: {'lr': 0.00019960150332785554, 'samples': 1101056, 'steps': 2150, 'loss/train': 2.646801233291626} -09/20/2021 21:56:25 - INFO - __main__ - Step 34409: {'lr': 0.00019960150332785554, 'samples': 1101088, 'steps': 2150, 'loss/train': 0.8577570915222168} -09/20/2021 21:56:26 - INFO - __main__ - Step 34410: {'lr': 0.00019960150332785554, 'samples': 1101120, 'steps': 2150, 'loss/train': 2.0598738193511963} -09/20/2021 21:56:27 - INFO - __main__ - Step 34411: {'lr': 0.00019960150332785554, 'samples': 1101152, 'steps': 2150, 'loss/train': 2.216595411300659} -09/20/2021 21:56:28 - INFO - __main__ - Step 34412: {'lr': 0.00019960150332785554, 'samples': 1101184, 'steps': 2150, 'loss/train': 2.569880962371826} -09/20/2021 21:56:28 - INFO - __main__ - Step 34413: {'lr': 0.00019960150332785554, 'samples': 1101216, 'steps': 2150, 'loss/train': 2.26658296585083} -09/20/2021 21:56:29 - INFO - __main__ - Step 34414: {'lr': 0.00019960150332785554, 'samples': 1101248, 'steps': 2150, 'loss/train': 2.4799814224243164} -09/20/2021 21:56:30 - INFO - __main__ - Step 34415: {'lr': 0.00019960150332785554, 'samples': 1101280, 'steps': 2150, 'loss/train': 1.9491924047470093} -09/20/2021 21:56:31 - INFO - __main__ - Step 34416: {'lr': 0.00019960150332785554, 'samples': 1101312, 'steps': 2150, 'loss/train': 2.357525110244751} -09/20/2021 21:56:32 - INFO - __main__ - Step 34417: {'lr': 0.00019960093422265263, 'samples': 1101344, 'steps': 2151, 'loss/train': 2.710891008377075} -09/20/2021 21:56:32 - INFO - __main__ - Step 34418: {'lr': 0.00019960093422265263, 'samples': 1101376, 'steps': 2151, 'loss/train': 2.5890583992004395} -09/20/2021 21:56:33 - INFO - __main__ - Step 34419: {'lr': 0.00019960093422265263, 'samples': 1101408, 'steps': 2151, 'loss/train': 0.8018975853919983} -09/20/2021 21:56:34 - INFO - __main__ - Step 34420: {'lr': 0.00019960093422265263, 'samples': 1101440, 'steps': 2151, 'loss/train': 1.6603264808654785} -09/20/2021 21:56:35 - INFO - __main__ - Step 34421: {'lr': 0.00019960093422265263, 'samples': 1101472, 'steps': 2151, 'loss/train': 1.7870850563049316} -09/20/2021 21:56:35 - INFO - __main__ - Step 34422: {'lr': 0.00019960093422265263, 'samples': 1101504, 'steps': 2151, 'loss/train': 3.0095012187957764} -09/20/2021 21:56:36 - INFO - __main__ - Step 34423: {'lr': 0.00019960093422265263, 'samples': 1101536, 'steps': 2151, 'loss/train': 2.219568967819214} -09/20/2021 21:56:37 - INFO - __main__ - Step 34424: {'lr': 0.00019960093422265263, 'samples': 1101568, 'steps': 2151, 'loss/train': 1.8604035377502441} -09/20/2021 21:56:38 - INFO - __main__ - Step 34425: {'lr': 0.00019960093422265263, 'samples': 1101600, 'steps': 2151, 'loss/train': 2.2159461975097656} -09/20/2021 21:56:38 - INFO - __main__ - Step 34426: {'lr': 0.00019960093422265263, 'samples': 1101632, 'steps': 2151, 'loss/train': 2.506179094314575} -09/20/2021 21:56:39 - INFO - __main__ - Step 34427: {'lr': 0.00019960093422265263, 'samples': 1101664, 'steps': 2151, 'loss/train': 2.2604591846466064} -09/20/2021 21:56:40 - INFO - __main__ - Step 34428: {'lr': 0.00019960093422265263, 'samples': 1101696, 'steps': 2151, 'loss/train': 1.916337251663208} -09/20/2021 21:56:41 - INFO - __main__ - Step 34429: {'lr': 0.00019960093422265263, 'samples': 1101728, 'steps': 2151, 'loss/train': 2.0305275917053223} -09/20/2021 21:56:41 - INFO - __main__ - Step 34430: {'lr': 0.00019960093422265263, 'samples': 1101760, 'steps': 2151, 'loss/train': 2.2558298110961914} -09/20/2021 21:56:42 - INFO - __main__ - Step 34431: {'lr': 0.00019960093422265263, 'samples': 1101792, 'steps': 2151, 'loss/train': 1.6666185855865479} -09/20/2021 21:56:43 - INFO - __main__ - Step 34432: {'lr': 0.00019960093422265263, 'samples': 1101824, 'steps': 2151, 'loss/train': 2.3462181091308594} -09/20/2021 21:56:44 - INFO - __main__ - Step 34433: {'lr': 0.0001996003647121739, 'samples': 1101856, 'steps': 2152, 'loss/train': 2.0482006072998047} -09/20/2021 21:56:44 - INFO - __main__ - Step 34434: {'lr': 0.0001996003647121739, 'samples': 1101888, 'steps': 2152, 'loss/train': 2.4735827445983887} -09/20/2021 21:56:45 - INFO - __main__ - Step 34435: {'lr': 0.0001996003647121739, 'samples': 1101920, 'steps': 2152, 'loss/train': 2.3266208171844482} -09/20/2021 21:56:46 - INFO - __main__ - Step 34436: {'lr': 0.0001996003647121739, 'samples': 1101952, 'steps': 2152, 'loss/train': 2.4227373600006104} -09/20/2021 21:56:47 - INFO - __main__ - Step 34437: {'lr': 0.0001996003647121739, 'samples': 1101984, 'steps': 2152, 'loss/train': 2.0842998027801514} -09/20/2021 21:56:47 - INFO - __main__ - Step 34438: {'lr': 0.0001996003647121739, 'samples': 1102016, 'steps': 2152, 'loss/train': 1.8431282043457031} -09/20/2021 21:56:49 - INFO - __main__ - Step 34439: {'lr': 0.0001996003647121739, 'samples': 1102048, 'steps': 2152, 'loss/train': 1.4051119089126587} -09/20/2021 21:56:50 - INFO - __main__ - Step 34440: {'lr': 0.0001996003647121739, 'samples': 1102080, 'steps': 2152, 'loss/train': 2.66322922706604} -09/20/2021 21:56:50 - INFO - __main__ - Step 34441: {'lr': 0.0001996003647121739, 'samples': 1102112, 'steps': 2152, 'loss/train': 1.7205458879470825} -09/20/2021 21:56:51 - INFO - __main__ - Step 34442: {'lr': 0.0001996003647121739, 'samples': 1102144, 'steps': 2152, 'loss/train': 2.4452173709869385} -09/20/2021 21:56:52 - INFO - __main__ - Step 34443: {'lr': 0.0001996003647121739, 'samples': 1102176, 'steps': 2152, 'loss/train': 0.9788878560066223} -09/20/2021 21:56:53 - INFO - __main__ - Step 34444: {'lr': 0.0001996003647121739, 'samples': 1102208, 'steps': 2152, 'loss/train': 1.051849126815796} -09/20/2021 21:56:53 - INFO - __main__ - Step 34445: {'lr': 0.0001996003647121739, 'samples': 1102240, 'steps': 2152, 'loss/train': 1.028109073638916} -09/20/2021 21:56:54 - INFO - __main__ - Step 34446: {'lr': 0.0001996003647121739, 'samples': 1102272, 'steps': 2152, 'loss/train': 1.1319257020950317} -09/20/2021 21:56:55 - INFO - __main__ - Step 34447: {'lr': 0.0001996003647121739, 'samples': 1102304, 'steps': 2152, 'loss/train': 2.045269250869751} -09/20/2021 21:56:56 - INFO - __main__ - Step 34448: {'lr': 0.0001996003647121739, 'samples': 1102336, 'steps': 2152, 'loss/train': 2.623615026473999} -09/20/2021 21:56:56 - INFO - __main__ - Step 34449: {'lr': 0.00019959979479642167, 'samples': 1102368, 'steps': 2153, 'loss/train': 0.5251145362854004} -09/20/2021 21:56:57 - INFO - __main__ - Step 34450: {'lr': 0.00019959979479642167, 'samples': 1102400, 'steps': 2153, 'loss/train': 2.8091683387756348} -09/20/2021 21:56:58 - INFO - __main__ - Step 34451: {'lr': 0.00019959979479642167, 'samples': 1102432, 'steps': 2153, 'loss/train': 2.995082378387451} -09/20/2021 21:56:59 - INFO - __main__ - Step 34452: {'lr': 0.00019959979479642167, 'samples': 1102464, 'steps': 2153, 'loss/train': 1.7767101526260376} -09/20/2021 21:56:59 - INFO - __main__ - Step 34453: {'lr': 0.00019959979479642167, 'samples': 1102496, 'steps': 2153, 'loss/train': 2.0855844020843506} -09/20/2021 21:57:00 - INFO - __main__ - Step 34454: {'lr': 0.00019959979479642167, 'samples': 1102528, 'steps': 2153, 'loss/train': 2.051121473312378} -09/20/2021 21:57:01 - INFO - __main__ - Step 34455: {'lr': 0.00019959979479642167, 'samples': 1102560, 'steps': 2153, 'loss/train': 2.245637893676758} -09/20/2021 21:57:02 - INFO - __main__ - Step 34456: {'lr': 0.00019959979479642167, 'samples': 1102592, 'steps': 2153, 'loss/train': 1.7092036008834839} -09/20/2021 21:57:02 - INFO - __main__ - Step 34457: {'lr': 0.00019959979479642167, 'samples': 1102624, 'steps': 2153, 'loss/train': 1.7922255992889404} -09/20/2021 21:57:03 - INFO - __main__ - Step 34458: {'lr': 0.00019959979479642167, 'samples': 1102656, 'steps': 2153, 'loss/train': 2.4575705528259277} -09/20/2021 21:57:04 - INFO - __main__ - Step 34459: {'lr': 0.00019959979479642167, 'samples': 1102688, 'steps': 2153, 'loss/train': 1.5343846082687378} -09/20/2021 21:57:05 - INFO - __main__ - Step 34460: {'lr': 0.00019959979479642167, 'samples': 1102720, 'steps': 2153, 'loss/train': 3.0859429836273193} -09/20/2021 21:57:05 - INFO - __main__ - Step 34461: {'lr': 0.00019959979479642167, 'samples': 1102752, 'steps': 2153, 'loss/train': 1.767930507659912} -09/20/2021 21:57:06 - INFO - __main__ - Step 34462: {'lr': 0.00019959979479642167, 'samples': 1102784, 'steps': 2153, 'loss/train': 2.3656046390533447} -09/20/2021 21:57:07 - INFO - __main__ - Step 34463: {'lr': 0.00019959979479642167, 'samples': 1102816, 'steps': 2153, 'loss/train': 2.921818733215332} -09/20/2021 21:57:08 - INFO - __main__ - Step 34464: {'lr': 0.00019959979479642167, 'samples': 1102848, 'steps': 2153, 'loss/train': 2.3345518112182617} -09/20/2021 21:57:09 - INFO - __main__ - Step 34465: {'lr': 0.00019959922447539821, 'samples': 1102880, 'steps': 2154, 'loss/train': 2.359292984008789} -09/20/2021 21:57:09 - INFO - __main__ - Step 34466: {'lr': 0.00019959922447539821, 'samples': 1102912, 'steps': 2154, 'loss/train': 2.7025177478790283} -09/20/2021 21:57:10 - INFO - __main__ - Step 34467: {'lr': 0.00019959922447539821, 'samples': 1102944, 'steps': 2154, 'loss/train': 2.0457029342651367} -09/20/2021 21:57:11 - INFO - __main__ - Step 34468: {'lr': 0.00019959922447539821, 'samples': 1102976, 'steps': 2154, 'loss/train': 1.3649718761444092} -09/20/2021 21:57:12 - INFO - __main__ - Step 34469: {'lr': 0.00019959922447539821, 'samples': 1103008, 'steps': 2154, 'loss/train': 1.7901625633239746} -09/20/2021 21:57:12 - INFO - __main__ - Step 34470: {'lr': 0.00019959922447539821, 'samples': 1103040, 'steps': 2154, 'loss/train': 2.64160418510437} -09/20/2021 21:57:13 - INFO - __main__ - Step 34471: {'lr': 0.00019959922447539821, 'samples': 1103072, 'steps': 2154, 'loss/train': 2.667495012283325} -09/20/2021 21:57:14 - INFO - __main__ - Step 34472: {'lr': 0.00019959922447539821, 'samples': 1103104, 'steps': 2154, 'loss/train': 1.8388384580612183} -09/20/2021 21:57:15 - INFO - __main__ - Step 34473: {'lr': 0.00019959922447539821, 'samples': 1103136, 'steps': 2154, 'loss/train': 2.5585927963256836} -09/20/2021 21:57:16 - INFO - __main__ - Step 34474: {'lr': 0.00019959922447539821, 'samples': 1103168, 'steps': 2154, 'loss/train': 1.892884373664856} -09/20/2021 21:57:17 - INFO - __main__ - Step 34475: {'lr': 0.00019959922447539821, 'samples': 1103200, 'steps': 2154, 'loss/train': 2.425987958908081} -09/20/2021 21:57:17 - INFO - __main__ - Step 34476: {'lr': 0.00019959922447539821, 'samples': 1103232, 'steps': 2154, 'loss/train': 2.820056676864624} -09/20/2021 21:57:18 - INFO - __main__ - Step 34477: {'lr': 0.00019959922447539821, 'samples': 1103264, 'steps': 2154, 'loss/train': 2.549962282180786} -09/20/2021 21:57:19 - INFO - __main__ - Step 34478: {'lr': 0.00019959922447539821, 'samples': 1103296, 'steps': 2154, 'loss/train': 3.0264534950256348} -09/20/2021 21:57:20 - INFO - __main__ - Step 34479: {'lr': 0.00019959922447539821, 'samples': 1103328, 'steps': 2154, 'loss/train': 1.9902870655059814} -09/20/2021 21:57:20 - INFO - __main__ - Step 34480: {'lr': 0.00019959922447539821, 'samples': 1103360, 'steps': 2154, 'loss/train': 2.7277724742889404} -09/20/2021 21:57:21 - INFO - __main__ - Step 34481: {'lr': 0.00019959865374910595, 'samples': 1103392, 'steps': 2155, 'loss/train': 2.1523244380950928} -09/20/2021 21:57:22 - INFO - __main__ - Step 34482: {'lr': 0.00019959865374910595, 'samples': 1103424, 'steps': 2155, 'loss/train': 1.3717100620269775} -09/20/2021 21:57:23 - INFO - __main__ - Step 34483: {'lr': 0.00019959865374910595, 'samples': 1103456, 'steps': 2155, 'loss/train': 2.325200319290161} -09/20/2021 21:57:23 - INFO - __main__ - Step 34484: {'lr': 0.00019959865374910595, 'samples': 1103488, 'steps': 2155, 'loss/train': 2.493192434310913} -09/20/2021 21:57:24 - INFO - __main__ - Step 34485: {'lr': 0.00019959865374910595, 'samples': 1103520, 'steps': 2155, 'loss/train': 1.8115112781524658} -09/20/2021 21:57:25 - INFO - __main__ - Step 34486: {'lr': 0.00019959865374910595, 'samples': 1103552, 'steps': 2155, 'loss/train': 1.7487359046936035} -09/20/2021 21:57:26 - INFO - __main__ - Step 34487: {'lr': 0.00019959865374910595, 'samples': 1103584, 'steps': 2155, 'loss/train': 1.9156973361968994} -09/20/2021 21:57:26 - INFO - __main__ - Step 34488: {'lr': 0.00019959865374910595, 'samples': 1103616, 'steps': 2155, 'loss/train': 2.458925247192383} -09/20/2021 21:57:27 - INFO - __main__ - Step 34489: {'lr': 0.00019959865374910595, 'samples': 1103648, 'steps': 2155, 'loss/train': 2.307426929473877} -09/20/2021 21:57:28 - INFO - __main__ - Step 34490: {'lr': 0.00019959865374910595, 'samples': 1103680, 'steps': 2155, 'loss/train': 1.342435598373413} -09/20/2021 21:57:29 - INFO - __main__ - Step 34491: {'lr': 0.00019959865374910595, 'samples': 1103712, 'steps': 2155, 'loss/train': 1.5522738695144653} -09/20/2021 21:57:29 - INFO - __main__ - Step 34492: {'lr': 0.00019959865374910595, 'samples': 1103744, 'steps': 2155, 'loss/train': 1.6356743574142456} -09/20/2021 21:57:30 - INFO - __main__ - Step 34493: {'lr': 0.00019959865374910595, 'samples': 1103776, 'steps': 2155, 'loss/train': 2.4987645149230957} -09/20/2021 21:57:31 - INFO - __main__ - Step 34494: {'lr': 0.00019959865374910595, 'samples': 1103808, 'steps': 2155, 'loss/train': 0.4713410437107086} -09/20/2021 21:57:32 - INFO - __main__ - Step 34495: {'lr': 0.00019959865374910595, 'samples': 1103840, 'steps': 2155, 'loss/train': 2.2473461627960205} -09/20/2021 21:57:32 - INFO - __main__ - Step 34496: {'lr': 0.00019959865374910595, 'samples': 1103872, 'steps': 2155, 'loss/train': 0.5572569966316223} -09/20/2021 21:57:33 - INFO - __main__ - Step 34497: {'lr': 0.00019959808261754716, 'samples': 1103904, 'steps': 2156, 'loss/train': 2.612420082092285} -09/20/2021 21:57:34 - INFO - __main__ - Step 34498: {'lr': 0.00019959808261754716, 'samples': 1103936, 'steps': 2156, 'loss/train': 2.4002602100372314} -09/20/2021 21:57:35 - INFO - __main__ - Step 34499: {'lr': 0.00019959808261754716, 'samples': 1103968, 'steps': 2156, 'loss/train': 2.0853524208068848} -09/20/2021 21:57:36 - INFO - __main__ - Step 34500: {'lr': 0.00019959808261754716, 'samples': 1104000, 'steps': 2156, 'loss/train': 2.360424757003784} -09/20/2021 21:57:36 - INFO - __main__ - Step 34501: {'lr': 0.00019959808261754716, 'samples': 1104032, 'steps': 2156, 'loss/train': 2.233555316925049} -09/20/2021 21:57:37 - INFO - __main__ - Step 34502: {'lr': 0.00019959808261754716, 'samples': 1104064, 'steps': 2156, 'loss/train': 2.258639335632324} -09/20/2021 21:57:38 - INFO - __main__ - Step 34503: {'lr': 0.00019959808261754716, 'samples': 1104096, 'steps': 2156, 'loss/train': 2.1764440536499023} -09/20/2021 21:57:39 - INFO - __main__ - Step 34504: {'lr': 0.00019959808261754716, 'samples': 1104128, 'steps': 2156, 'loss/train': 2.717622995376587} -09/20/2021 21:57:40 - INFO - __main__ - Step 34505: {'lr': 0.00019959808261754716, 'samples': 1104160, 'steps': 2156, 'loss/train': 2.1353399753570557} -09/20/2021 21:57:41 - INFO - __main__ - Step 34506: {'lr': 0.00019959808261754716, 'samples': 1104192, 'steps': 2156, 'loss/train': 2.3637359142303467} -09/20/2021 21:57:41 - INFO - __main__ - Step 34507: {'lr': 0.00019959808261754716, 'samples': 1104224, 'steps': 2156, 'loss/train': 3.286557674407959} -09/20/2021 21:57:42 - INFO - __main__ - Step 34508: {'lr': 0.00019959808261754716, 'samples': 1104256, 'steps': 2156, 'loss/train': 2.0632965564727783} -09/20/2021 21:57:43 - INFO - __main__ - Step 34509: {'lr': 0.00019959808261754716, 'samples': 1104288, 'steps': 2156, 'loss/train': 2.4483728408813477} -09/20/2021 21:57:44 - INFO - __main__ - Step 34510: {'lr': 0.00019959808261754716, 'samples': 1104320, 'steps': 2156, 'loss/train': 2.670415163040161} -09/20/2021 21:57:44 - INFO - __main__ - Step 34511: {'lr': 0.00019959808261754716, 'samples': 1104352, 'steps': 2156, 'loss/train': 3.339651584625244} -09/20/2021 21:57:45 - INFO - __main__ - Step 34512: {'lr': 0.00019959808261754716, 'samples': 1104384, 'steps': 2156, 'loss/train': 1.7389899492263794} -09/20/2021 21:57:46 - INFO - __main__ - Step 34513: {'lr': 0.00019959751108072414, 'samples': 1104416, 'steps': 2157, 'loss/train': 2.3807201385498047} -09/20/2021 21:57:47 - INFO - __main__ - Step 34514: {'lr': 0.00019959751108072414, 'samples': 1104448, 'steps': 2157, 'loss/train': 3.1515743732452393} -09/20/2021 21:57:47 - INFO - __main__ - Step 34515: {'lr': 0.00019959751108072414, 'samples': 1104480, 'steps': 2157, 'loss/train': 2.587331533432007} -09/20/2021 21:57:48 - INFO - __main__ - Step 34516: {'lr': 0.00019959751108072414, 'samples': 1104512, 'steps': 2157, 'loss/train': 2.3699567317962646} -09/20/2021 21:57:49 - INFO - __main__ - Step 34517: {'lr': 0.00019959751108072414, 'samples': 1104544, 'steps': 2157, 'loss/train': 2.0551810264587402} -09/20/2021 21:57:50 - INFO - __main__ - Step 34518: {'lr': 0.00019959751108072414, 'samples': 1104576, 'steps': 2157, 'loss/train': 2.723814010620117} -09/20/2021 21:57:50 - INFO - __main__ - Step 34519: {'lr': 0.00019959751108072414, 'samples': 1104608, 'steps': 2157, 'loss/train': 2.5665369033813477} -09/20/2021 21:57:51 - INFO - __main__ - Step 34520: {'lr': 0.00019959751108072414, 'samples': 1104640, 'steps': 2157, 'loss/train': 1.9982939958572388} -09/20/2021 21:57:52 - INFO - __main__ - Step 34521: {'lr': 0.00019959751108072414, 'samples': 1104672, 'steps': 2157, 'loss/train': 1.9155550003051758} -09/20/2021 21:57:53 - INFO - __main__ - Step 34522: {'lr': 0.00019959751108072414, 'samples': 1104704, 'steps': 2157, 'loss/train': 2.688654899597168} -09/20/2021 21:57:53 - INFO - __main__ - Step 34523: {'lr': 0.00019959751108072414, 'samples': 1104736, 'steps': 2157, 'loss/train': 2.3628830909729004} -09/20/2021 21:57:54 - INFO - __main__ - Step 34524: {'lr': 0.00019959751108072414, 'samples': 1104768, 'steps': 2157, 'loss/train': 2.397152900695801} -09/20/2021 21:57:55 - INFO - __main__ - Step 34525: {'lr': 0.00019959751108072414, 'samples': 1104800, 'steps': 2157, 'loss/train': 2.812654733657837} -09/20/2021 21:57:56 - INFO - __main__ - Step 34526: {'lr': 0.00019959751108072414, 'samples': 1104832, 'steps': 2157, 'loss/train': 2.2504754066467285} -09/20/2021 21:57:56 - INFO - __main__ - Step 34527: {'lr': 0.00019959751108072414, 'samples': 1104864, 'steps': 2157, 'loss/train': 2.3800148963928223} -09/20/2021 21:57:57 - INFO - __main__ - Step 34528: {'lr': 0.00019959751108072414, 'samples': 1104896, 'steps': 2157, 'loss/train': 1.8360806703567505} -09/20/2021 21:57:58 - INFO - __main__ - Step 34529: {'lr': 0.00019959693913863924, 'samples': 1104928, 'steps': 2158, 'loss/train': 2.174333095550537} -09/20/2021 21:57:59 - INFO - __main__ - Step 34530: {'lr': 0.00019959693913863924, 'samples': 1104960, 'steps': 2158, 'loss/train': 2.568800687789917} -09/20/2021 21:58:00 - INFO - __main__ - Step 34531: {'lr': 0.00019959693913863924, 'samples': 1104992, 'steps': 2158, 'loss/train': 1.6761014461517334} -09/20/2021 21:58:00 - INFO - __main__ - Step 34532: {'lr': 0.00019959693913863924, 'samples': 1105024, 'steps': 2158, 'loss/train': 1.9991068840026855} -09/20/2021 21:58:01 - INFO - __main__ - Step 34533: {'lr': 0.00019959693913863924, 'samples': 1105056, 'steps': 2158, 'loss/train': 1.6649988889694214} -09/20/2021 21:58:02 - INFO - __main__ - Step 34534: {'lr': 0.00019959693913863924, 'samples': 1105088, 'steps': 2158, 'loss/train': 2.2729663848876953} -09/20/2021 21:58:04 - INFO - __main__ - Step 34535: {'lr': 0.00019959693913863924, 'samples': 1105120, 'steps': 2158, 'loss/train': 2.7474658489227295} -09/20/2021 21:58:04 - INFO - __main__ - Step 34536: {'lr': 0.00019959693913863924, 'samples': 1105152, 'steps': 2158, 'loss/train': 2.097243309020996} -09/20/2021 21:58:05 - INFO - __main__ - Step 34537: {'lr': 0.00019959693913863924, 'samples': 1105184, 'steps': 2158, 'loss/train': 2.395591974258423} -09/20/2021 21:58:06 - INFO - __main__ - Step 34538: {'lr': 0.00019959693913863924, 'samples': 1105216, 'steps': 2158, 'loss/train': 2.257791042327881} -09/20/2021 21:58:07 - INFO - __main__ - Step 34539: {'lr': 0.00019959693913863924, 'samples': 1105248, 'steps': 2158, 'loss/train': 2.1799099445343018} -09/20/2021 21:58:07 - INFO - __main__ - Step 34540: {'lr': 0.00019959693913863924, 'samples': 1105280, 'steps': 2158, 'loss/train': 2.1382832527160645} -09/20/2021 21:58:08 - INFO - __main__ - Step 34541: {'lr': 0.00019959693913863924, 'samples': 1105312, 'steps': 2158, 'loss/train': 2.3010833263397217} -09/20/2021 21:58:09 - INFO - __main__ - Step 34542: {'lr': 0.00019959693913863924, 'samples': 1105344, 'steps': 2158, 'loss/train': 2.816132068634033} -09/20/2021 21:58:10 - INFO - __main__ - Step 34543: {'lr': 0.00019959693913863924, 'samples': 1105376, 'steps': 2158, 'loss/train': 1.7811243534088135} -09/20/2021 21:58:10 - INFO - __main__ - Step 34544: {'lr': 0.00019959693913863924, 'samples': 1105408, 'steps': 2158, 'loss/train': 2.7607908248901367} -09/20/2021 21:58:11 - INFO - __main__ - Step 34545: {'lr': 0.00019959636679129478, 'samples': 1105440, 'steps': 2159, 'loss/train': 2.609125852584839} -09/20/2021 21:58:12 - INFO - __main__ - Step 34546: {'lr': 0.00019959636679129478, 'samples': 1105472, 'steps': 2159, 'loss/train': 2.387855291366577} -09/20/2021 21:58:13 - INFO - __main__ - Step 34547: {'lr': 0.00019959636679129478, 'samples': 1105504, 'steps': 2159, 'loss/train': 2.3699395656585693} -09/20/2021 21:58:14 - INFO - __main__ - Step 34548: {'lr': 0.00019959636679129478, 'samples': 1105536, 'steps': 2159, 'loss/train': 2.897608757019043} -09/20/2021 21:58:14 - INFO - __main__ - Step 34549: {'lr': 0.00019959636679129478, 'samples': 1105568, 'steps': 2159, 'loss/train': 1.6477444171905518} -09/20/2021 21:58:15 - INFO - __main__ - Step 34550: {'lr': 0.00019959636679129478, 'samples': 1105600, 'steps': 2159, 'loss/train': 1.9514702558517456} -09/20/2021 21:58:16 - INFO - __main__ - Step 34551: {'lr': 0.00019959636679129478, 'samples': 1105632, 'steps': 2159, 'loss/train': 2.5179636478424072} -09/20/2021 21:58:17 - INFO - __main__ - Step 34552: {'lr': 0.00019959636679129478, 'samples': 1105664, 'steps': 2159, 'loss/train': 2.1300203800201416} -09/20/2021 21:58:17 - INFO - __main__ - Step 34553: {'lr': 0.00019959636679129478, 'samples': 1105696, 'steps': 2159, 'loss/train': 2.071955919265747} -09/20/2021 21:58:18 - INFO - __main__ - Step 34554: {'lr': 0.00019959636679129478, 'samples': 1105728, 'steps': 2159, 'loss/train': 2.8217613697052} -09/20/2021 21:58:19 - INFO - __main__ - Step 34555: {'lr': 0.00019959636679129478, 'samples': 1105760, 'steps': 2159, 'loss/train': 2.0625314712524414} -09/20/2021 21:58:20 - INFO - __main__ - Step 34556: {'lr': 0.00019959636679129478, 'samples': 1105792, 'steps': 2159, 'loss/train': 3.262929677963257} -09/20/2021 21:58:20 - INFO - __main__ - Step 34557: {'lr': 0.00019959636679129478, 'samples': 1105824, 'steps': 2159, 'loss/train': 2.9096860885620117} -09/20/2021 21:58:21 - INFO - __main__ - Step 34558: {'lr': 0.00019959636679129478, 'samples': 1105856, 'steps': 2159, 'loss/train': 2.842078447341919} -09/20/2021 21:58:22 - INFO - __main__ - Step 34559: {'lr': 0.00019959636679129478, 'samples': 1105888, 'steps': 2159, 'loss/train': 2.4616589546203613} -09/20/2021 21:58:23 - INFO - __main__ - Step 34560: {'lr': 0.00019959636679129478, 'samples': 1105920, 'steps': 2159, 'loss/train': 2.498943328857422} -09/20/2021 21:58:23 - INFO - __main__ - Step 34561: {'lr': 0.0001995957940386931, 'samples': 1105952, 'steps': 2160, 'loss/train': 2.5865073204040527} -09/20/2021 21:58:24 - INFO - __main__ - Step 34562: {'lr': 0.0001995957940386931, 'samples': 1105984, 'steps': 2160, 'loss/train': 2.189537525177002} -09/20/2021 21:58:25 - INFO - __main__ - Step 34563: {'lr': 0.0001995957940386931, 'samples': 1106016, 'steps': 2160, 'loss/train': 2.472125768661499} -09/20/2021 21:58:26 - INFO - __main__ - Step 34564: {'lr': 0.0001995957940386931, 'samples': 1106048, 'steps': 2160, 'loss/train': 1.9355621337890625} -09/20/2021 21:58:26 - INFO - __main__ - Step 34565: {'lr': 0.0001995957940386931, 'samples': 1106080, 'steps': 2160, 'loss/train': 2.4775922298431396} -09/20/2021 21:58:28 - INFO - __main__ - Step 34566: {'lr': 0.0001995957940386931, 'samples': 1106112, 'steps': 2160, 'loss/train': 2.086099624633789} -09/20/2021 21:58:29 - INFO - __main__ - Step 34567: {'lr': 0.0001995957940386931, 'samples': 1106144, 'steps': 2160, 'loss/train': 2.3465771675109863} -09/20/2021 21:58:29 - INFO - __main__ - Step 34568: {'lr': 0.0001995957940386931, 'samples': 1106176, 'steps': 2160, 'loss/train': 2.705502986907959} -09/20/2021 21:58:30 - INFO - __main__ - Step 34569: {'lr': 0.0001995957940386931, 'samples': 1106208, 'steps': 2160, 'loss/train': 2.067368745803833} -09/20/2021 21:58:31 - INFO - __main__ - Step 34570: {'lr': 0.0001995957940386931, 'samples': 1106240, 'steps': 2160, 'loss/train': 0.5403143167495728} -09/20/2021 21:58:32 - INFO - __main__ - Step 34571: {'lr': 0.0001995957940386931, 'samples': 1106272, 'steps': 2160, 'loss/train': 1.5805120468139648} -09/20/2021 21:58:32 - INFO - __main__ - Step 34572: {'lr': 0.0001995957940386931, 'samples': 1106304, 'steps': 2160, 'loss/train': 2.930241823196411} -09/20/2021 21:58:33 - INFO - __main__ - Step 34573: {'lr': 0.0001995957940386931, 'samples': 1106336, 'steps': 2160, 'loss/train': 0.6085609793663025} -09/20/2021 21:58:34 - INFO - __main__ - Step 34574: {'lr': 0.0001995957940386931, 'samples': 1106368, 'steps': 2160, 'loss/train': 3.0108869075775146} -09/20/2021 21:58:35 - INFO - __main__ - Step 34575: {'lr': 0.0001995957940386931, 'samples': 1106400, 'steps': 2160, 'loss/train': 2.5488240718841553} -09/20/2021 21:58:35 - INFO - __main__ - Step 34576: {'lr': 0.0001995957940386931, 'samples': 1106432, 'steps': 2160, 'loss/train': 2.4625136852264404} -09/20/2021 21:58:36 - INFO - __main__ - Step 34577: {'lr': 0.0001995952208808365, 'samples': 1106464, 'steps': 2161, 'loss/train': 2.252650737762451} -09/20/2021 21:58:37 - INFO - __main__ - Step 34578: {'lr': 0.0001995952208808365, 'samples': 1106496, 'steps': 2161, 'loss/train': 2.1680634021759033} -09/20/2021 21:58:38 - INFO - __main__ - Step 34579: {'lr': 0.0001995952208808365, 'samples': 1106528, 'steps': 2161, 'loss/train': 1.941362977027893} -09/20/2021 21:58:38 - INFO - __main__ - Step 34580: {'lr': 0.0001995952208808365, 'samples': 1106560, 'steps': 2161, 'loss/train': 1.5596195459365845} -09/20/2021 21:58:39 - INFO - __main__ - Step 34581: {'lr': 0.0001995952208808365, 'samples': 1106592, 'steps': 2161, 'loss/train': 1.7526206970214844} -09/20/2021 21:58:40 - INFO - __main__ - Step 34582: {'lr': 0.0001995952208808365, 'samples': 1106624, 'steps': 2161, 'loss/train': 2.456557273864746} -09/20/2021 21:58:41 - INFO - __main__ - Step 34583: {'lr': 0.0001995952208808365, 'samples': 1106656, 'steps': 2161, 'loss/train': 2.5854785442352295} -09/20/2021 21:58:41 - INFO - __main__ - Step 34584: {'lr': 0.0001995952208808365, 'samples': 1106688, 'steps': 2161, 'loss/train': 3.435471296310425} -09/20/2021 21:58:42 - INFO - __main__ - Step 34585: {'lr': 0.0001995952208808365, 'samples': 1106720, 'steps': 2161, 'loss/train': 3.5356130599975586} -09/20/2021 21:58:43 - INFO - __main__ - Step 34586: {'lr': 0.0001995952208808365, 'samples': 1106752, 'steps': 2161, 'loss/train': 2.231966733932495} -09/20/2021 21:58:44 - INFO - __main__ - Step 34587: {'lr': 0.0001995952208808365, 'samples': 1106784, 'steps': 2161, 'loss/train': 1.6824547052383423} -09/20/2021 21:58:44 - INFO - __main__ - Step 34588: {'lr': 0.0001995952208808365, 'samples': 1106816, 'steps': 2161, 'loss/train': 2.224047899246216} -09/20/2021 21:58:45 - INFO - __main__ - Step 34589: {'lr': 0.0001995952208808365, 'samples': 1106848, 'steps': 2161, 'loss/train': 0.17344975471496582} -09/20/2021 21:58:46 - INFO - __main__ - Step 34590: {'lr': 0.0001995952208808365, 'samples': 1106880, 'steps': 2161, 'loss/train': 0.31595104932785034} -09/20/2021 21:58:47 - INFO - __main__ - Step 34591: {'lr': 0.0001995952208808365, 'samples': 1106912, 'steps': 2161, 'loss/train': 0.4670518934726715} -09/20/2021 21:58:47 - INFO - __main__ - Step 34592: {'lr': 0.0001995952208808365, 'samples': 1106944, 'steps': 2161, 'loss/train': 3.000349521636963} -09/20/2021 21:58:48 - INFO - __main__ - Step 34593: {'lr': 0.00019959464731772732, 'samples': 1106976, 'steps': 2162, 'loss/train': 1.820825219154358} -09/20/2021 21:58:49 - INFO - __main__ - Step 34594: {'lr': 0.00019959464731772732, 'samples': 1107008, 'steps': 2162, 'loss/train': 2.443866729736328} -09/20/2021 21:58:50 - INFO - __main__ - Step 34595: {'lr': 0.00019959464731772732, 'samples': 1107040, 'steps': 2162, 'loss/train': 1.9979584217071533} -09/20/2021 21:58:51 - INFO - __main__ - Step 34596: {'lr': 0.00019959464731772732, 'samples': 1107072, 'steps': 2162, 'loss/train': 3.1070470809936523} -09/20/2021 21:58:51 - INFO - __main__ - Step 34597: {'lr': 0.00019959464731772732, 'samples': 1107104, 'steps': 2162, 'loss/train': 2.0358643531799316} -09/20/2021 21:58:52 - INFO - __main__ - Step 34598: {'lr': 0.00019959464731772732, 'samples': 1107136, 'steps': 2162, 'loss/train': 2.009845018386841} -09/20/2021 21:58:53 - INFO - __main__ - Step 34599: {'lr': 0.00019959464731772732, 'samples': 1107168, 'steps': 2162, 'loss/train': 3.354874849319458} -09/20/2021 21:58:54 - INFO - __main__ - Step 34600: {'lr': 0.00019959464731772732, 'samples': 1107200, 'steps': 2162, 'loss/train': 2.5110323429107666} -09/20/2021 21:58:55 - INFO - __main__ - Step 34601: {'lr': 0.00019959464731772732, 'samples': 1107232, 'steps': 2162, 'loss/train': 1.971693992614746} -09/20/2021 21:58:56 - INFO - __main__ - Step 34602: {'lr': 0.00019959464731772732, 'samples': 1107264, 'steps': 2162, 'loss/train': 2.8316359519958496} -09/20/2021 21:58:56 - INFO - __main__ - Step 34603: {'lr': 0.00019959464731772732, 'samples': 1107296, 'steps': 2162, 'loss/train': 0.7128831744194031} -09/20/2021 21:58:57 - INFO - __main__ - Step 34604: {'lr': 0.00019959464731772732, 'samples': 1107328, 'steps': 2162, 'loss/train': 2.3242459297180176} -09/20/2021 21:58:58 - INFO - __main__ - Step 34605: {'lr': 0.00019959464731772732, 'samples': 1107360, 'steps': 2162, 'loss/train': 0.6004437208175659} -09/20/2021 21:58:59 - INFO - __main__ - Step 34606: {'lr': 0.00019959464731772732, 'samples': 1107392, 'steps': 2162, 'loss/train': 2.190678596496582} -09/20/2021 21:58:59 - INFO - __main__ - Step 34607: {'lr': 0.00019959464731772732, 'samples': 1107424, 'steps': 2162, 'loss/train': 1.9858968257904053} -09/20/2021 21:59:00 - INFO - __main__ - Step 34608: {'lr': 0.00019959464731772732, 'samples': 1107456, 'steps': 2162, 'loss/train': 3.521759510040283} -09/20/2021 21:59:01 - INFO - __main__ - Step 34609: {'lr': 0.00019959407334936793, 'samples': 1107488, 'steps': 2163, 'loss/train': 1.862973690032959} -09/20/2021 21:59:02 - INFO - __main__ - Step 34610: {'lr': 0.00019959407334936793, 'samples': 1107520, 'steps': 2163, 'loss/train': 2.547297477722168} -09/20/2021 21:59:03 - INFO - __main__ - Step 34611: {'lr': 0.00019959407334936793, 'samples': 1107552, 'steps': 2163, 'loss/train': 2.2075016498565674} -09/20/2021 21:59:03 - INFO - __main__ - Step 34612: {'lr': 0.00019959407334936793, 'samples': 1107584, 'steps': 2163, 'loss/train': 2.2432491779327393} -09/20/2021 21:59:04 - INFO - __main__ - Step 34613: {'lr': 0.00019959407334936793, 'samples': 1107616, 'steps': 2163, 'loss/train': 1.3796435594558716} -09/20/2021 21:59:05 - INFO - __main__ - Step 34614: {'lr': 0.00019959407334936793, 'samples': 1107648, 'steps': 2163, 'loss/train': 1.89249587059021} -09/20/2021 21:59:06 - INFO - __main__ - Step 34615: {'lr': 0.00019959407334936793, 'samples': 1107680, 'steps': 2163, 'loss/train': 2.7583534717559814} -09/20/2021 21:59:06 - INFO - __main__ - Step 34616: {'lr': 0.00019959407334936793, 'samples': 1107712, 'steps': 2163, 'loss/train': 2.9875471591949463} -09/20/2021 21:59:07 - INFO - __main__ - Step 34617: {'lr': 0.00019959407334936793, 'samples': 1107744, 'steps': 2163, 'loss/train': 2.8682429790496826} -09/20/2021 21:59:08 - INFO - __main__ - Step 34618: {'lr': 0.00019959407334936793, 'samples': 1107776, 'steps': 2163, 'loss/train': 1.9632923603057861} -09/20/2021 21:59:09 - INFO - __main__ - Step 34619: {'lr': 0.00019959407334936793, 'samples': 1107808, 'steps': 2163, 'loss/train': 1.2586110830307007} -09/20/2021 21:59:09 - INFO - __main__ - Step 34620: {'lr': 0.00019959407334936793, 'samples': 1107840, 'steps': 2163, 'loss/train': 3.1143081188201904} -09/20/2021 21:59:10 - INFO - __main__ - Step 34621: {'lr': 0.00019959407334936793, 'samples': 1107872, 'steps': 2163, 'loss/train': 2.82904052734375} -09/20/2021 21:59:11 - INFO - __main__ - Step 34622: {'lr': 0.00019959407334936793, 'samples': 1107904, 'steps': 2163, 'loss/train': 1.5566434860229492} -09/20/2021 21:59:12 - INFO - __main__ - Step 34623: {'lr': 0.00019959407334936793, 'samples': 1107936, 'steps': 2163, 'loss/train': 1.7507230043411255} -09/20/2021 21:59:12 - INFO - __main__ - Step 34624: {'lr': 0.00019959407334936793, 'samples': 1107968, 'steps': 2163, 'loss/train': 2.723233699798584} -09/20/2021 21:59:13 - INFO - __main__ - Step 34625: {'lr': 0.00019959349897576064, 'samples': 1108000, 'steps': 2164, 'loss/train': 0.8232490420341492} -09/20/2021 21:59:14 - INFO - __main__ - Step 34626: {'lr': 0.00019959349897576064, 'samples': 1108032, 'steps': 2164, 'loss/train': 2.8773255348205566} -09/20/2021 21:59:15 - INFO - __main__ - Step 34627: {'lr': 0.00019959349897576064, 'samples': 1108064, 'steps': 2164, 'loss/train': 1.9077820777893066} -09/20/2021 21:59:15 - INFO - __main__ - Step 34628: {'lr': 0.00019959349897576064, 'samples': 1108096, 'steps': 2164, 'loss/train': 2.040435791015625} -09/20/2021 21:59:16 - INFO - __main__ - Step 34629: {'lr': 0.00019959349897576064, 'samples': 1108128, 'steps': 2164, 'loss/train': 1.8347967863082886} -09/20/2021 21:59:17 - INFO - __main__ - Step 34630: {'lr': 0.00019959349897576064, 'samples': 1108160, 'steps': 2164, 'loss/train': 0.4662594795227051} -09/20/2021 21:59:18 - INFO - __main__ - Step 34631: {'lr': 0.00019959349897576064, 'samples': 1108192, 'steps': 2164, 'loss/train': 2.802762746810913} -09/20/2021 21:59:19 - INFO - __main__ - Step 34632: {'lr': 0.00019959349897576064, 'samples': 1108224, 'steps': 2164, 'loss/train': 2.6726579666137695} -09/20/2021 21:59:20 - INFO - __main__ - Step 34633: {'lr': 0.00019959349897576064, 'samples': 1108256, 'steps': 2164, 'loss/train': 2.4608442783355713} -09/20/2021 21:59:20 - INFO - __main__ - Step 34634: {'lr': 0.00019959349897576064, 'samples': 1108288, 'steps': 2164, 'loss/train': 2.512300491333008} -09/20/2021 21:59:21 - INFO - __main__ - Step 34635: {'lr': 0.00019959349897576064, 'samples': 1108320, 'steps': 2164, 'loss/train': 1.9827544689178467} -09/20/2021 21:59:22 - INFO - __main__ - Step 34636: {'lr': 0.00019959349897576064, 'samples': 1108352, 'steps': 2164, 'loss/train': 2.109334945678711} -09/20/2021 21:59:23 - INFO - __main__ - Step 34637: {'lr': 0.00019959349897576064, 'samples': 1108384, 'steps': 2164, 'loss/train': 2.575754165649414} -09/20/2021 21:59:23 - INFO - __main__ - Step 34638: {'lr': 0.00019959349897576064, 'samples': 1108416, 'steps': 2164, 'loss/train': 2.6632277965545654} -09/20/2021 21:59:24 - INFO - __main__ - Step 34639: {'lr': 0.00019959349897576064, 'samples': 1108448, 'steps': 2164, 'loss/train': 1.6634002923965454} -09/20/2021 21:59:25 - INFO - __main__ - Step 34640: {'lr': 0.00019959349897576064, 'samples': 1108480, 'steps': 2164, 'loss/train': 1.9772517681121826} -09/20/2021 21:59:26 - INFO - __main__ - Step 34641: {'lr': 0.00019959292419690781, 'samples': 1108512, 'steps': 2165, 'loss/train': 2.7411670684814453} -09/20/2021 21:59:27 - INFO - __main__ - Step 34642: {'lr': 0.00019959292419690781, 'samples': 1108544, 'steps': 2165, 'loss/train': 2.4605116844177246} -09/20/2021 21:59:27 - INFO - __main__ - Step 34643: {'lr': 0.00019959292419690781, 'samples': 1108576, 'steps': 2165, 'loss/train': 2.351248025894165} -09/20/2021 21:59:28 - INFO - __main__ - Step 34644: {'lr': 0.00019959292419690781, 'samples': 1108608, 'steps': 2165, 'loss/train': 2.692220687866211} -09/20/2021 21:59:29 - INFO - __main__ - Step 34645: {'lr': 0.00019959292419690781, 'samples': 1108640, 'steps': 2165, 'loss/train': 2.4311683177948} -09/20/2021 21:59:30 - INFO - __main__ - Step 34646: {'lr': 0.00019959292419690781, 'samples': 1108672, 'steps': 2165, 'loss/train': 2.8504364490509033} -09/20/2021 21:59:30 - INFO - __main__ - Step 34647: {'lr': 0.00019959292419690781, 'samples': 1108704, 'steps': 2165, 'loss/train': 2.7148513793945312} -09/20/2021 21:59:31 - INFO - __main__ - Step 34648: {'lr': 0.00019959292419690781, 'samples': 1108736, 'steps': 2165, 'loss/train': 3.125983238220215} -09/20/2021 21:59:32 - INFO - __main__ - Step 34649: {'lr': 0.00019959292419690781, 'samples': 1108768, 'steps': 2165, 'loss/train': 2.1901943683624268} -09/20/2021 21:59:33 - INFO - __main__ - Step 34650: {'lr': 0.00019959292419690781, 'samples': 1108800, 'steps': 2165, 'loss/train': 1.6761952638626099} -09/20/2021 21:59:33 - INFO - __main__ - Step 34651: {'lr': 0.00019959292419690781, 'samples': 1108832, 'steps': 2165, 'loss/train': 2.3613367080688477} -09/20/2021 21:59:34 - INFO - __main__ - Step 34652: {'lr': 0.00019959292419690781, 'samples': 1108864, 'steps': 2165, 'loss/train': 1.2161117792129517} -09/20/2021 21:59:35 - INFO - __main__ - Step 34653: {'lr': 0.00019959292419690781, 'samples': 1108896, 'steps': 2165, 'loss/train': 1.936313271522522} -09/20/2021 21:59:36 - INFO - __main__ - Step 34654: {'lr': 0.00019959292419690781, 'samples': 1108928, 'steps': 2165, 'loss/train': 2.3272883892059326} -09/20/2021 21:59:36 - INFO - __main__ - Step 34655: {'lr': 0.00019959292419690781, 'samples': 1108960, 'steps': 2165, 'loss/train': 2.1506872177124023} -09/20/2021 21:59:37 - INFO - __main__ - Step 34656: {'lr': 0.00019959292419690781, 'samples': 1108992, 'steps': 2165, 'loss/train': 1.75717294216156} -09/20/2021 21:59:38 - INFO - __main__ - Step 34657: {'lr': 0.00019959234901281172, 'samples': 1109024, 'steps': 2166, 'loss/train': 2.60452938079834} -09/20/2021 21:59:39 - INFO - __main__ - Step 34658: {'lr': 0.00019959234901281172, 'samples': 1109056, 'steps': 2166, 'loss/train': 2.4264981746673584} -09/20/2021 21:59:39 - INFO - __main__ - Step 34659: {'lr': 0.00019959234901281172, 'samples': 1109088, 'steps': 2166, 'loss/train': 2.0238304138183594} -09/20/2021 21:59:40 - INFO - __main__ - Step 34660: {'lr': 0.00019959234901281172, 'samples': 1109120, 'steps': 2166, 'loss/train': 2.529688835144043} -09/20/2021 21:59:41 - INFO - __main__ - Step 34661: {'lr': 0.00019959234901281172, 'samples': 1109152, 'steps': 2166, 'loss/train': 2.629798412322998} -09/20/2021 21:59:42 - INFO - __main__ - Step 34662: {'lr': 0.00019959234901281172, 'samples': 1109184, 'steps': 2166, 'loss/train': 2.8607170581817627} -09/20/2021 21:59:43 - INFO - __main__ - Step 34663: {'lr': 0.00019959234901281172, 'samples': 1109216, 'steps': 2166, 'loss/train': 2.699258804321289} -09/20/2021 21:59:44 - INFO - __main__ - Step 34664: {'lr': 0.00019959234901281172, 'samples': 1109248, 'steps': 2166, 'loss/train': 2.2135353088378906} -09/20/2021 21:59:45 - INFO - __main__ - Step 34665: {'lr': 0.00019959234901281172, 'samples': 1109280, 'steps': 2166, 'loss/train': 2.566013813018799} -09/20/2021 21:59:45 - INFO - __main__ - Step 34666: {'lr': 0.00019959234901281172, 'samples': 1109312, 'steps': 2166, 'loss/train': 2.3980777263641357} -09/20/2021 21:59:46 - INFO - __main__ - Step 34667: {'lr': 0.00019959234901281172, 'samples': 1109344, 'steps': 2166, 'loss/train': 3.201403856277466} -09/20/2021 21:59:47 - INFO - __main__ - Step 34668: {'lr': 0.00019959234901281172, 'samples': 1109376, 'steps': 2166, 'loss/train': 2.116814136505127} -09/20/2021 21:59:47 - INFO - __main__ - Step 34669: {'lr': 0.00019959234901281172, 'samples': 1109408, 'steps': 2166, 'loss/train': 1.9111700057983398} -09/20/2021 21:59:48 - INFO - __main__ - Step 34670: {'lr': 0.00019959234901281172, 'samples': 1109440, 'steps': 2166, 'loss/train': 1.5235153436660767} -09/20/2021 21:59:49 - INFO - __main__ - Step 34671: {'lr': 0.00019959234901281172, 'samples': 1109472, 'steps': 2166, 'loss/train': 2.4617409706115723} -09/20/2021 21:59:50 - INFO - __main__ - Step 34672: {'lr': 0.00019959234901281172, 'samples': 1109504, 'steps': 2166, 'loss/train': 1.8357032537460327} -09/20/2021 21:59:51 - INFO - __main__ - Step 34673: {'lr': 0.00019959177342347478, 'samples': 1109536, 'steps': 2167, 'loss/train': 2.270965814590454} -09/20/2021 21:59:51 - INFO - __main__ - Step 34674: {'lr': 0.00019959177342347478, 'samples': 1109568, 'steps': 2167, 'loss/train': 1.5149301290512085} -09/20/2021 21:59:52 - INFO - __main__ - Step 34675: {'lr': 0.00019959177342347478, 'samples': 1109600, 'steps': 2167, 'loss/train': 1.8407295942306519} -09/20/2021 21:59:53 - INFO - __main__ - Step 34676: {'lr': 0.00019959177342347478, 'samples': 1109632, 'steps': 2167, 'loss/train': 2.45564603805542} -09/20/2021 21:59:54 - INFO - __main__ - Step 34677: {'lr': 0.00019959177342347478, 'samples': 1109664, 'steps': 2167, 'loss/train': 2.4669950008392334} -09/20/2021 21:59:54 - INFO - __main__ - Step 34678: {'lr': 0.00019959177342347478, 'samples': 1109696, 'steps': 2167, 'loss/train': 2.3632333278656006} -09/20/2021 21:59:55 - INFO - __main__ - Step 34679: {'lr': 0.00019959177342347478, 'samples': 1109728, 'steps': 2167, 'loss/train': 2.1335537433624268} -09/20/2021 21:59:56 - INFO - __main__ - Step 34680: {'lr': 0.00019959177342347478, 'samples': 1109760, 'steps': 2167, 'loss/train': 2.2413582801818848} -09/20/2021 21:59:57 - INFO - __main__ - Step 34681: {'lr': 0.00019959177342347478, 'samples': 1109792, 'steps': 2167, 'loss/train': 2.0464751720428467} -09/20/2021 21:59:57 - INFO - __main__ - Step 34682: {'lr': 0.00019959177342347478, 'samples': 1109824, 'steps': 2167, 'loss/train': 2.241191864013672} -09/20/2021 21:59:58 - INFO - __main__ - Step 34683: {'lr': 0.00019959177342347478, 'samples': 1109856, 'steps': 2167, 'loss/train': 2.3384037017822266} -09/20/2021 21:59:59 - INFO - __main__ - Step 34684: {'lr': 0.00019959177342347478, 'samples': 1109888, 'steps': 2167, 'loss/train': 1.543628454208374} -09/20/2021 22:00:00 - INFO - __main__ - Step 34685: {'lr': 0.00019959177342347478, 'samples': 1109920, 'steps': 2167, 'loss/train': 2.689575672149658} -09/20/2021 22:00:00 - INFO - __main__ - Step 34686: {'lr': 0.00019959177342347478, 'samples': 1109952, 'steps': 2167, 'loss/train': 2.100757122039795} -09/20/2021 22:00:01 - INFO - __main__ - Step 34687: {'lr': 0.00019959177342347478, 'samples': 1109984, 'steps': 2167, 'loss/train': 0.5128540992736816} -09/20/2021 22:00:02 - INFO - __main__ - Step 34688: {'lr': 0.00019959177342347478, 'samples': 1110016, 'steps': 2167, 'loss/train': 2.2152161598205566} -09/20/2021 22:00:03 - INFO - __main__ - Step 34689: {'lr': 0.00019959119742889926, 'samples': 1110048, 'steps': 2168, 'loss/train': 1.959925651550293} -09/20/2021 22:00:04 - INFO - __main__ - Step 34690: {'lr': 0.00019959119742889926, 'samples': 1110080, 'steps': 2168, 'loss/train': 2.674983263015747} -09/20/2021 22:00:04 - INFO - __main__ - Step 34691: {'lr': 0.00019959119742889926, 'samples': 1110112, 'steps': 2168, 'loss/train': 2.2480483055114746} -09/20/2021 22:00:05 - INFO - __main__ - Step 34692: {'lr': 0.00019959119742889926, 'samples': 1110144, 'steps': 2168, 'loss/train': 2.6091835498809814} -09/20/2021 22:00:06 - INFO - __main__ - Step 34693: {'lr': 0.00019959119742889926, 'samples': 1110176, 'steps': 2168, 'loss/train': 2.4290084838867188} -09/20/2021 22:00:07 - INFO - __main__ - Step 34694: {'lr': 0.00019959119742889926, 'samples': 1110208, 'steps': 2168, 'loss/train': 1.3001118898391724} -09/20/2021 22:00:08 - INFO - __main__ - Step 34695: {'lr': 0.00019959119742889926, 'samples': 1110240, 'steps': 2168, 'loss/train': 2.6667590141296387} -09/20/2021 22:00:09 - INFO - __main__ - Step 34696: {'lr': 0.00019959119742889926, 'samples': 1110272, 'steps': 2168, 'loss/train': 0.7796549201011658} -09/20/2021 22:00:09 - INFO - __main__ - Step 34697: {'lr': 0.00019959119742889926, 'samples': 1110304, 'steps': 2168, 'loss/train': 1.80286705493927} -09/20/2021 22:00:10 - INFO - __main__ - Step 34698: {'lr': 0.00019959119742889926, 'samples': 1110336, 'steps': 2168, 'loss/train': 2.1468279361724854} -09/20/2021 22:00:11 - INFO - __main__ - Step 34699: {'lr': 0.00019959119742889926, 'samples': 1110368, 'steps': 2168, 'loss/train': 1.6668781042099} -09/20/2021 22:00:12 - INFO - __main__ - Step 34700: {'lr': 0.00019959119742889926, 'samples': 1110400, 'steps': 2168, 'loss/train': 2.399686336517334} -09/20/2021 22:00:12 - INFO - __main__ - Step 34701: {'lr': 0.00019959119742889926, 'samples': 1110432, 'steps': 2168, 'loss/train': 2.3884427547454834} -09/20/2021 22:00:13 - INFO - __main__ - Step 34702: {'lr': 0.00019959119742889926, 'samples': 1110464, 'steps': 2168, 'loss/train': 2.35744571685791} -09/20/2021 22:00:14 - INFO - __main__ - Step 34703: {'lr': 0.00019959119742889926, 'samples': 1110496, 'steps': 2168, 'loss/train': 1.9452250003814697} -09/20/2021 22:00:15 - INFO - __main__ - Step 34704: {'lr': 0.00019959119742889926, 'samples': 1110528, 'steps': 2168, 'loss/train': 2.391395092010498} -09/20/2021 22:00:15 - INFO - __main__ - Step 34705: {'lr': 0.00019959062102908756, 'samples': 1110560, 'steps': 2169, 'loss/train': 2.1846797466278076} -09/20/2021 22:00:16 - INFO - __main__ - Step 34706: {'lr': 0.00019959062102908756, 'samples': 1110592, 'steps': 2169, 'loss/train': 2.4799652099609375} -09/20/2021 22:00:17 - INFO - __main__ - Step 34707: {'lr': 0.00019959062102908756, 'samples': 1110624, 'steps': 2169, 'loss/train': 1.9667017459869385} -09/20/2021 22:00:18 - INFO - __main__ - Step 34708: {'lr': 0.00019959062102908756, 'samples': 1110656, 'steps': 2169, 'loss/train': 2.6053354740142822} -09/20/2021 22:00:18 - INFO - __main__ - Step 34709: {'lr': 0.00019959062102908756, 'samples': 1110688, 'steps': 2169, 'loss/train': 1.940414309501648} -09/20/2021 22:00:19 - INFO - __main__ - Step 34710: {'lr': 0.00019959062102908756, 'samples': 1110720, 'steps': 2169, 'loss/train': 1.7439932823181152} -09/20/2021 22:00:20 - INFO - __main__ - Step 34711: {'lr': 0.00019959062102908756, 'samples': 1110752, 'steps': 2169, 'loss/train': 1.7839653491973877} -09/20/2021 22:00:21 - INFO - __main__ - Step 34712: {'lr': 0.00019959062102908756, 'samples': 1110784, 'steps': 2169, 'loss/train': 2.3066370487213135} -09/20/2021 22:00:21 - INFO - __main__ - Step 34713: {'lr': 0.00019959062102908756, 'samples': 1110816, 'steps': 2169, 'loss/train': 2.005450963973999} -09/20/2021 22:00:22 - INFO - __main__ - Step 34714: {'lr': 0.00019959062102908756, 'samples': 1110848, 'steps': 2169, 'loss/train': 0.6225308775901794} -09/20/2021 22:00:23 - INFO - __main__ - Step 34715: {'lr': 0.00019959062102908756, 'samples': 1110880, 'steps': 2169, 'loss/train': 1.555080771446228} -09/20/2021 22:00:24 - INFO - __main__ - Step 34716: {'lr': 0.00019959062102908756, 'samples': 1110912, 'steps': 2169, 'loss/train': 2.327481269836426} -09/20/2021 22:00:24 - INFO - __main__ - Step 34717: {'lr': 0.00019959062102908756, 'samples': 1110944, 'steps': 2169, 'loss/train': 3.0228288173675537} -09/20/2021 22:00:25 - INFO - __main__ - Step 34718: {'lr': 0.00019959062102908756, 'samples': 1110976, 'steps': 2169, 'loss/train': 2.2958927154541016} -09/20/2021 22:00:26 - INFO - __main__ - Step 34719: {'lr': 0.00019959062102908756, 'samples': 1111008, 'steps': 2169, 'loss/train': 2.221691608428955} -09/20/2021 22:00:27 - INFO - __main__ - Step 34720: {'lr': 0.00019959062102908756, 'samples': 1111040, 'steps': 2169, 'loss/train': 2.2224621772766113} -09/20/2021 22:00:28 - INFO - __main__ - Step 34721: {'lr': 0.00019959004422404205, 'samples': 1111072, 'steps': 2170, 'loss/train': 2.2348973751068115} -09/20/2021 22:00:28 - INFO - __main__ - Step 34722: {'lr': 0.00019959004422404205, 'samples': 1111104, 'steps': 2170, 'loss/train': 1.9593919515609741} -09/20/2021 22:00:30 - INFO - __main__ - Step 34723: {'lr': 0.00019959004422404205, 'samples': 1111136, 'steps': 2170, 'loss/train': 1.6544305086135864} -09/20/2021 22:00:30 - INFO - __main__ - Step 34724: {'lr': 0.00019959004422404205, 'samples': 1111168, 'steps': 2170, 'loss/train': 2.074335813522339} -09/20/2021 22:00:31 - INFO - __main__ - Step 34725: {'lr': 0.00019959004422404205, 'samples': 1111200, 'steps': 2170, 'loss/train': 2.4106311798095703} -09/20/2021 22:00:32 - INFO - __main__ - Step 34726: {'lr': 0.00019959004422404205, 'samples': 1111232, 'steps': 2170, 'loss/train': 1.7959702014923096} -09/20/2021 22:00:33 - INFO - __main__ - Step 34727: {'lr': 0.00019959004422404205, 'samples': 1111264, 'steps': 2170, 'loss/train': 2.3713207244873047} -09/20/2021 22:00:33 - INFO - __main__ - Step 34728: {'lr': 0.00019959004422404205, 'samples': 1111296, 'steps': 2170, 'loss/train': 1.8978393077850342} -09/20/2021 22:00:34 - INFO - __main__ - Step 34729: {'lr': 0.00019959004422404205, 'samples': 1111328, 'steps': 2170, 'loss/train': 1.8283313512802124} -09/20/2021 22:00:35 - INFO - __main__ - Step 34730: {'lr': 0.00019959004422404205, 'samples': 1111360, 'steps': 2170, 'loss/train': 2.5423552989959717} -09/20/2021 22:00:36 - INFO - __main__ - Step 34731: {'lr': 0.00019959004422404205, 'samples': 1111392, 'steps': 2170, 'loss/train': 2.428273916244507} -09/20/2021 22:00:36 - INFO - __main__ - Step 34732: {'lr': 0.00019959004422404205, 'samples': 1111424, 'steps': 2170, 'loss/train': 2.2892262935638428} -09/20/2021 22:00:37 - INFO - __main__ - Step 34733: {'lr': 0.00019959004422404205, 'samples': 1111456, 'steps': 2170, 'loss/train': 2.5892536640167236} -09/20/2021 22:00:38 - INFO - __main__ - Step 34734: {'lr': 0.00019959004422404205, 'samples': 1111488, 'steps': 2170, 'loss/train': 1.869360089302063} -09/20/2021 22:00:39 - INFO - __main__ - Step 34735: {'lr': 0.00019959004422404205, 'samples': 1111520, 'steps': 2170, 'loss/train': 1.3944605588912964} -09/20/2021 22:00:39 - INFO - __main__ - Step 34736: {'lr': 0.00019959004422404205, 'samples': 1111552, 'steps': 2170, 'loss/train': 2.646000862121582} -09/20/2021 22:00:40 - INFO - __main__ - Step 34737: {'lr': 0.00019958946701376497, 'samples': 1111584, 'steps': 2171, 'loss/train': 2.08860445022583} -09/20/2021 22:00:41 - INFO - __main__ - Step 34738: {'lr': 0.00019958946701376497, 'samples': 1111616, 'steps': 2171, 'loss/train': 2.345871925354004} -09/20/2021 22:00:42 - INFO - __main__ - Step 34739: {'lr': 0.00019958946701376497, 'samples': 1111648, 'steps': 2171, 'loss/train': 2.249095916748047} -09/20/2021 22:00:42 - INFO - __main__ - Step 34740: {'lr': 0.00019958946701376497, 'samples': 1111680, 'steps': 2171, 'loss/train': 0.3987978994846344} -09/20/2021 22:00:43 - INFO - __main__ - Step 34741: {'lr': 0.00019958946701376497, 'samples': 1111712, 'steps': 2171, 'loss/train': 1.7874101400375366} -09/20/2021 22:00:44 - INFO - __main__ - Step 34742: {'lr': 0.00019958946701376497, 'samples': 1111744, 'steps': 2171, 'loss/train': 2.6357667446136475} -09/20/2021 22:00:45 - INFO - __main__ - Step 34743: {'lr': 0.00019958946701376497, 'samples': 1111776, 'steps': 2171, 'loss/train': 2.4904351234436035} -09/20/2021 22:00:45 - INFO - __main__ - Step 34744: {'lr': 0.00019958946701376497, 'samples': 1111808, 'steps': 2171, 'loss/train': 0.18862374126911163} -09/20/2021 22:00:46 - INFO - __main__ - Step 34745: {'lr': 0.00019958946701376497, 'samples': 1111840, 'steps': 2171, 'loss/train': 2.4176559448242188} -09/20/2021 22:00:47 - INFO - __main__ - Step 34746: {'lr': 0.00019958946701376497, 'samples': 1111872, 'steps': 2171, 'loss/train': 2.433863401412964} -09/20/2021 22:00:48 - INFO - __main__ - Step 34747: {'lr': 0.00019958946701376497, 'samples': 1111904, 'steps': 2171, 'loss/train': 1.7214969396591187} -09/20/2021 22:00:48 - INFO - __main__ - Step 34748: {'lr': 0.00019958946701376497, 'samples': 1111936, 'steps': 2171, 'loss/train': 2.363311767578125} -09/20/2021 22:00:49 - INFO - __main__ - Step 34749: {'lr': 0.00019958946701376497, 'samples': 1111968, 'steps': 2171, 'loss/train': 2.5841052532196045} -09/20/2021 22:00:50 - INFO - __main__ - Step 34750: {'lr': 0.00019958946701376497, 'samples': 1112000, 'steps': 2171, 'loss/train': 3.1147310733795166} -09/20/2021 22:00:51 - INFO - __main__ - Step 34751: {'lr': 0.00019958946701376497, 'samples': 1112032, 'steps': 2171, 'loss/train': 3.064711332321167} -09/20/2021 22:00:51 - INFO - __main__ - Step 34752: {'lr': 0.00019958946701376497, 'samples': 1112064, 'steps': 2171, 'loss/train': 2.3533506393432617} -09/20/2021 22:00:52 - INFO - __main__ - Step 34753: {'lr': 0.0001995888893982588, 'samples': 1112096, 'steps': 2172, 'loss/train': 2.664959192276001} -09/20/2021 22:00:54 - INFO - __main__ - Step 34754: {'lr': 0.0001995888893982588, 'samples': 1112128, 'steps': 2172, 'loss/train': 0.7450399398803711} -09/20/2021 22:00:55 - INFO - __main__ - Step 34755: {'lr': 0.0001995888893982588, 'samples': 1112160, 'steps': 2172, 'loss/train': 3.9622368812561035} -09/20/2021 22:00:55 - INFO - __main__ - Step 34756: {'lr': 0.0001995888893982588, 'samples': 1112192, 'steps': 2172, 'loss/train': 2.456578493118286} -09/20/2021 22:00:56 - INFO - __main__ - Step 34757: {'lr': 0.0001995888893982588, 'samples': 1112224, 'steps': 2172, 'loss/train': 2.603205680847168} -09/20/2021 22:00:57 - INFO - __main__ - Step 34758: {'lr': 0.0001995888893982588, 'samples': 1112256, 'steps': 2172, 'loss/train': 2.951822280883789} -09/20/2021 22:00:58 - INFO - __main__ - Step 34759: {'lr': 0.0001995888893982588, 'samples': 1112288, 'steps': 2172, 'loss/train': 0.9505271911621094} -09/20/2021 22:00:58 - INFO - __main__ - Step 34760: {'lr': 0.0001995888893982588, 'samples': 1112320, 'steps': 2172, 'loss/train': 2.1020736694335938} -09/20/2021 22:00:59 - INFO - __main__ - Step 34761: {'lr': 0.0001995888893982588, 'samples': 1112352, 'steps': 2172, 'loss/train': 0.9598583579063416} -09/20/2021 22:01:00 - INFO - __main__ - Step 34762: {'lr': 0.0001995888893982588, 'samples': 1112384, 'steps': 2172, 'loss/train': 2.563070297241211} -09/20/2021 22:01:01 - INFO - __main__ - Step 34763: {'lr': 0.0001995888893982588, 'samples': 1112416, 'steps': 2172, 'loss/train': 2.217092990875244} -09/20/2021 22:01:01 - INFO - __main__ - Step 34764: {'lr': 0.0001995888893982588, 'samples': 1112448, 'steps': 2172, 'loss/train': 1.9028295278549194} -09/20/2021 22:01:02 - INFO - __main__ - Step 34765: {'lr': 0.0001995888893982588, 'samples': 1112480, 'steps': 2172, 'loss/train': 2.858973503112793} -09/20/2021 22:01:03 - INFO - __main__ - Step 34766: {'lr': 0.0001995888893982588, 'samples': 1112512, 'steps': 2172, 'loss/train': 1.7129184007644653} -09/20/2021 22:01:04 - INFO - __main__ - Step 34767: {'lr': 0.0001995888893982588, 'samples': 1112544, 'steps': 2172, 'loss/train': 1.7102551460266113} -09/20/2021 22:01:04 - INFO - __main__ - Step 34768: {'lr': 0.0001995888893982588, 'samples': 1112576, 'steps': 2172, 'loss/train': 1.4382954835891724} -09/20/2021 22:01:05 - INFO - __main__ - Step 34769: {'lr': 0.0001995883113775258, 'samples': 1112608, 'steps': 2173, 'loss/train': 1.1537859439849854} -09/20/2021 22:01:06 - INFO - __main__ - Step 34770: {'lr': 0.0001995883113775258, 'samples': 1112640, 'steps': 2173, 'loss/train': 1.6494178771972656} -09/20/2021 22:01:07 - INFO - __main__ - Step 34771: {'lr': 0.0001995883113775258, 'samples': 1112672, 'steps': 2173, 'loss/train': 2.557748556137085} -09/20/2021 22:01:07 - INFO - __main__ - Step 34772: {'lr': 0.0001995883113775258, 'samples': 1112704, 'steps': 2173, 'loss/train': 2.7140986919403076} -09/20/2021 22:01:08 - INFO - __main__ - Step 34773: {'lr': 0.0001995883113775258, 'samples': 1112736, 'steps': 2173, 'loss/train': 2.4971182346343994} -09/20/2021 22:01:09 - INFO - __main__ - Step 34774: {'lr': 0.0001995883113775258, 'samples': 1112768, 'steps': 2173, 'loss/train': 2.5438191890716553} -09/20/2021 22:01:10 - INFO - __main__ - Step 34775: {'lr': 0.0001995883113775258, 'samples': 1112800, 'steps': 2173, 'loss/train': 2.731874704360962} -09/20/2021 22:01:10 - INFO - __main__ - Step 34776: {'lr': 0.0001995883113775258, 'samples': 1112832, 'steps': 2173, 'loss/train': 2.1565606594085693} -09/20/2021 22:01:11 - INFO - __main__ - Step 34777: {'lr': 0.0001995883113775258, 'samples': 1112864, 'steps': 2173, 'loss/train': 2.4429314136505127} -09/20/2021 22:01:12 - INFO - __main__ - Step 34778: {'lr': 0.0001995883113775258, 'samples': 1112896, 'steps': 2173, 'loss/train': 2.356658935546875} -09/20/2021 22:01:13 - INFO - __main__ - Step 34779: {'lr': 0.0001995883113775258, 'samples': 1112928, 'steps': 2173, 'loss/train': 2.330441474914551} -09/20/2021 22:01:13 - INFO - __main__ - Step 34780: {'lr': 0.0001995883113775258, 'samples': 1112960, 'steps': 2173, 'loss/train': 2.3099451065063477} -09/20/2021 22:01:14 - INFO - __main__ - Step 34781: {'lr': 0.0001995883113775258, 'samples': 1112992, 'steps': 2173, 'loss/train': 2.421708106994629} -09/20/2021 22:01:15 - INFO - __main__ - Step 34782: {'lr': 0.0001995883113775258, 'samples': 1113024, 'steps': 2173, 'loss/train': 2.2981138229370117} -09/20/2021 22:01:16 - INFO - __main__ - Step 34783: {'lr': 0.0001995883113775258, 'samples': 1113056, 'steps': 2173, 'loss/train': 2.421332359313965} -09/20/2021 22:01:16 - INFO - __main__ - Step 34784: {'lr': 0.0001995883113775258, 'samples': 1113088, 'steps': 2173, 'loss/train': 3.835679054260254} -09/20/2021 22:01:17 - INFO - __main__ - Step 34785: {'lr': 0.00019958773295156835, 'samples': 1113120, 'steps': 2174, 'loss/train': 2.502933979034424} -09/20/2021 22:01:18 - INFO - __main__ - Step 34786: {'lr': 0.00019958773295156835, 'samples': 1113152, 'steps': 2174, 'loss/train': 2.603663444519043} -09/20/2021 22:01:19 - INFO - __main__ - Step 34787: {'lr': 0.00019958773295156835, 'samples': 1113184, 'steps': 2174, 'loss/train': 2.201476812362671} -09/20/2021 22:01:20 - INFO - __main__ - Step 34788: {'lr': 0.00019958773295156835, 'samples': 1113216, 'steps': 2174, 'loss/train': 2.0169920921325684} -09/20/2021 22:01:20 - INFO - __main__ - Step 34789: {'lr': 0.00019958773295156835, 'samples': 1113248, 'steps': 2174, 'loss/train': 2.3157846927642822} -09/20/2021 22:01:21 - INFO - __main__ - Step 34790: {'lr': 0.00019958773295156835, 'samples': 1113280, 'steps': 2174, 'loss/train': 2.029230833053589} -09/20/2021 22:01:22 - INFO - __main__ - Step 34791: {'lr': 0.00019958773295156835, 'samples': 1113312, 'steps': 2174, 'loss/train': 2.3721249103546143} -09/20/2021 22:01:23 - INFO - __main__ - Step 34792: {'lr': 0.00019958773295156835, 'samples': 1113344, 'steps': 2174, 'loss/train': 2.164806365966797} -09/20/2021 22:01:24 - INFO - __main__ - Step 34793: {'lr': 0.00019958773295156835, 'samples': 1113376, 'steps': 2174, 'loss/train': 2.2785186767578125} -09/20/2021 22:01:25 - INFO - __main__ - Step 34794: {'lr': 0.00019958773295156835, 'samples': 1113408, 'steps': 2174, 'loss/train': 1.4990627765655518} -09/20/2021 22:01:25 - INFO - __main__ - Step 34795: {'lr': 0.00019958773295156835, 'samples': 1113440, 'steps': 2174, 'loss/train': 2.7921993732452393} -09/20/2021 22:01:26 - INFO - __main__ - Step 34796: {'lr': 0.00019958773295156835, 'samples': 1113472, 'steps': 2174, 'loss/train': 2.666574478149414} -09/20/2021 22:01:27 - INFO - __main__ - Step 34797: {'lr': 0.00019958773295156835, 'samples': 1113504, 'steps': 2174, 'loss/train': 3.3654143810272217} -09/20/2021 22:01:28 - INFO - __main__ - Step 34798: {'lr': 0.00019958773295156835, 'samples': 1113536, 'steps': 2174, 'loss/train': 2.5543723106384277} -09/20/2021 22:01:28 - INFO - __main__ - Step 34799: {'lr': 0.00019958773295156835, 'samples': 1113568, 'steps': 2174, 'loss/train': 2.314493179321289} -09/20/2021 22:01:29 - INFO - __main__ - Step 34800: {'lr': 0.00019958773295156835, 'samples': 1113600, 'steps': 2174, 'loss/train': 2.6129791736602783} -09/20/2021 22:01:30 - INFO - __main__ - Step 34801: {'lr': 0.00019958715412038877, 'samples': 1113632, 'steps': 2175, 'loss/train': 2.2027413845062256} -09/20/2021 22:01:31 - INFO - __main__ - Step 34802: {'lr': 0.00019958715412038877, 'samples': 1113664, 'steps': 2175, 'loss/train': 1.8584810495376587} -09/20/2021 22:01:32 - INFO - __main__ - Step 34803: {'lr': 0.00019958715412038877, 'samples': 1113696, 'steps': 2175, 'loss/train': 2.5098490715026855} -09/20/2021 22:01:32 - INFO - __main__ - Step 34804: {'lr': 0.00019958715412038877, 'samples': 1113728, 'steps': 2175, 'loss/train': 1.5073158740997314} -09/20/2021 22:01:33 - INFO - __main__ - Step 34805: {'lr': 0.00019958715412038877, 'samples': 1113760, 'steps': 2175, 'loss/train': 2.1780521869659424} -09/20/2021 22:01:34 - INFO - __main__ - Step 34806: {'lr': 0.00019958715412038877, 'samples': 1113792, 'steps': 2175, 'loss/train': 2.4924042224884033} -09/20/2021 22:01:35 - INFO - __main__ - Step 34807: {'lr': 0.00019958715412038877, 'samples': 1113824, 'steps': 2175, 'loss/train': 2.5323731899261475} -09/20/2021 22:01:35 - INFO - __main__ - Step 34808: {'lr': 0.00019958715412038877, 'samples': 1113856, 'steps': 2175, 'loss/train': 2.047353982925415} -09/20/2021 22:01:36 - INFO - __main__ - Step 34809: {'lr': 0.00019958715412038877, 'samples': 1113888, 'steps': 2175, 'loss/train': 2.4517972469329834} -09/20/2021 22:01:37 - INFO - __main__ - Step 34810: {'lr': 0.00019958715412038877, 'samples': 1113920, 'steps': 2175, 'loss/train': 3.2198522090911865} -09/20/2021 22:01:38 - INFO - __main__ - Step 34811: {'lr': 0.00019958715412038877, 'samples': 1113952, 'steps': 2175, 'loss/train': 1.885776162147522} -09/20/2021 22:01:38 - INFO - __main__ - Step 34812: {'lr': 0.00019958715412038877, 'samples': 1113984, 'steps': 2175, 'loss/train': 0.9465459585189819} -09/20/2021 22:01:39 - INFO - __main__ - Step 34813: {'lr': 0.00019958715412038877, 'samples': 1114016, 'steps': 2175, 'loss/train': 2.755336284637451} -09/20/2021 22:01:40 - INFO - __main__ - Step 34814: {'lr': 0.00019958715412038877, 'samples': 1114048, 'steps': 2175, 'loss/train': 2.3659183979034424} -09/20/2021 22:01:41 - INFO - __main__ - Step 34815: {'lr': 0.00019958715412038877, 'samples': 1114080, 'steps': 2175, 'loss/train': 1.984958291053772} -09/20/2021 22:01:41 - INFO - __main__ - Step 34816: {'lr': 0.00019958715412038877, 'samples': 1114112, 'steps': 2175, 'loss/train': 2.4116971492767334} -09/20/2021 22:01:42 - INFO - __main__ - Step 34817: {'lr': 0.00019958657488398948, 'samples': 1114144, 'steps': 2176, 'loss/train': 1.4823414087295532} -09/20/2021 22:01:43 - INFO - __main__ - Step 34818: {'lr': 0.00019958657488398948, 'samples': 1114176, 'steps': 2176, 'loss/train': 1.6175429821014404} -09/20/2021 22:01:44 - INFO - __main__ - Step 34819: {'lr': 0.00019958657488398948, 'samples': 1114208, 'steps': 2176, 'loss/train': 0.6087387204170227} -09/20/2021 22:01:44 - INFO - __main__ - Step 34820: {'lr': 0.00019958657488398948, 'samples': 1114240, 'steps': 2176, 'loss/train': 0.9358384609222412} -09/20/2021 22:01:45 - INFO - __main__ - Step 34821: {'lr': 0.00019958657488398948, 'samples': 1114272, 'steps': 2176, 'loss/train': 1.6301190853118896} -09/20/2021 22:01:47 - INFO - __main__ - Step 34822: {'lr': 0.00019958657488398948, 'samples': 1114304, 'steps': 2176, 'loss/train': 2.348893880844116} -09/20/2021 22:01:48 - INFO - __main__ - Step 34823: {'lr': 0.00019958657488398948, 'samples': 1114336, 'steps': 2176, 'loss/train': 2.357482671737671} -09/20/2021 22:01:48 - INFO - __main__ - Step 34824: {'lr': 0.00019958657488398948, 'samples': 1114368, 'steps': 2176, 'loss/train': 1.8246281147003174} -09/20/2021 22:01:49 - INFO - __main__ - Step 34825: {'lr': 0.00019958657488398948, 'samples': 1114400, 'steps': 2176, 'loss/train': 2.7532169818878174} -09/20/2021 22:01:50 - INFO - __main__ - Step 34826: {'lr': 0.00019958657488398948, 'samples': 1114432, 'steps': 2176, 'loss/train': 2.2266969680786133} -09/20/2021 22:01:51 - INFO - __main__ - Step 34827: {'lr': 0.00019958657488398948, 'samples': 1114464, 'steps': 2176, 'loss/train': 0.9139369130134583} -09/20/2021 22:01:51 - INFO - __main__ - Step 34828: {'lr': 0.00019958657488398948, 'samples': 1114496, 'steps': 2176, 'loss/train': 0.451552152633667} -09/20/2021 22:01:52 - INFO - __main__ - Step 34829: {'lr': 0.00019958657488398948, 'samples': 1114528, 'steps': 2176, 'loss/train': 0.2519698739051819} -09/20/2021 22:01:53 - INFO - __main__ - Step 34830: {'lr': 0.00019958657488398948, 'samples': 1114560, 'steps': 2176, 'loss/train': 0.48833009600639343} -09/20/2021 22:01:54 - INFO - __main__ - Step 34831: {'lr': 0.00019958657488398948, 'samples': 1114592, 'steps': 2176, 'loss/train': 0.2106897532939911} -09/20/2021 22:01:54 - INFO - __main__ - Step 34832: {'lr': 0.00019958657488398948, 'samples': 1114624, 'steps': 2176, 'loss/train': 0.5532893538475037} -09/20/2021 22:01:55 - INFO - __main__ - Step 34833: {'lr': 0.0001995859952423728, 'samples': 1114656, 'steps': 2177, 'loss/train': 0.6242294311523438} -09/20/2021 22:01:56 - INFO - __main__ - Step 34834: {'lr': 0.0001995859952423728, 'samples': 1114688, 'steps': 2177, 'loss/train': 2.150460720062256} -09/20/2021 22:01:57 - INFO - __main__ - Step 34835: {'lr': 0.0001995859952423728, 'samples': 1114720, 'steps': 2177, 'loss/train': 1.0312072038650513} -09/20/2021 22:01:57 - INFO - __main__ - Step 34836: {'lr': 0.0001995859952423728, 'samples': 1114752, 'steps': 2177, 'loss/train': 1.3512296676635742} -09/20/2021 22:01:58 - INFO - __main__ - Step 34837: {'lr': 0.0001995859952423728, 'samples': 1114784, 'steps': 2177, 'loss/train': 2.6632919311523438} -09/20/2021 22:01:59 - INFO - __main__ - Step 34838: {'lr': 0.0001995859952423728, 'samples': 1114816, 'steps': 2177, 'loss/train': 2.341834783554077} -09/20/2021 22:02:00 - INFO - __main__ - Step 34839: {'lr': 0.0001995859952423728, 'samples': 1114848, 'steps': 2177, 'loss/train': 2.5539519786834717} -09/20/2021 22:02:00 - INFO - __main__ - Step 34840: {'lr': 0.0001995859952423728, 'samples': 1114880, 'steps': 2177, 'loss/train': 1.3757389783859253} -09/20/2021 22:02:01 - INFO - __main__ - Step 34841: {'lr': 0.0001995859952423728, 'samples': 1114912, 'steps': 2177, 'loss/train': 1.743366003036499} -09/20/2021 22:02:02 - INFO - __main__ - Step 34842: {'lr': 0.0001995859952423728, 'samples': 1114944, 'steps': 2177, 'loss/train': 2.4741640090942383} -09/20/2021 22:02:03 - INFO - __main__ - Step 34843: {'lr': 0.0001995859952423728, 'samples': 1114976, 'steps': 2177, 'loss/train': 1.6334741115570068} -09/20/2021 22:02:03 - INFO - __main__ - Step 34844: {'lr': 0.0001995859952423728, 'samples': 1115008, 'steps': 2177, 'loss/train': 2.312673807144165} -09/20/2021 22:02:04 - INFO - __main__ - Step 34845: {'lr': 0.0001995859952423728, 'samples': 1115040, 'steps': 2177, 'loss/train': 2.229905605316162} -09/20/2021 22:02:05 - INFO - __main__ - Step 34846: {'lr': 0.0001995859952423728, 'samples': 1115072, 'steps': 2177, 'loss/train': 2.951892852783203} -09/20/2021 22:02:06 - INFO - __main__ - Step 34847: {'lr': 0.0001995859952423728, 'samples': 1115104, 'steps': 2177, 'loss/train': 1.3877040147781372} -09/20/2021 22:02:06 - INFO - __main__ - Step 34848: {'lr': 0.0001995859952423728, 'samples': 1115136, 'steps': 2177, 'loss/train': 4.712569713592529} -09/20/2021 22:02:07 - INFO - __main__ - Step 34849: {'lr': 0.00019958541519554107, 'samples': 1115168, 'steps': 2178, 'loss/train': 1.4388620853424072} -09/20/2021 22:02:08 - INFO - __main__ - Step 34850: {'lr': 0.00019958541519554107, 'samples': 1115200, 'steps': 2178, 'loss/train': 2.767321825027466} -09/20/2021 22:02:09 - INFO - __main__ - Step 34851: {'lr': 0.00019958541519554107, 'samples': 1115232, 'steps': 2178, 'loss/train': 1.9851467609405518} -09/20/2021 22:02:10 - INFO - __main__ - Step 34852: {'lr': 0.00019958541519554107, 'samples': 1115264, 'steps': 2178, 'loss/train': 2.2682576179504395} -09/20/2021 22:02:11 - INFO - __main__ - Step 34853: {'lr': 0.00019958541519554107, 'samples': 1115296, 'steps': 2178, 'loss/train': 2.394742965698242} -09/20/2021 22:02:12 - INFO - __main__ - Step 34854: {'lr': 0.00019958541519554107, 'samples': 1115328, 'steps': 2178, 'loss/train': 1.5278559923171997} -09/20/2021 22:02:12 - INFO - __main__ - Step 34855: {'lr': 0.00019958541519554107, 'samples': 1115360, 'steps': 2178, 'loss/train': 1.9076887369155884} -09/20/2021 22:02:13 - INFO - __main__ - Step 34856: {'lr': 0.00019958541519554107, 'samples': 1115392, 'steps': 2178, 'loss/train': 2.5574207305908203} -09/20/2021 22:02:14 - INFO - __main__ - Step 34857: {'lr': 0.00019958541519554107, 'samples': 1115424, 'steps': 2178, 'loss/train': 2.2167282104492188} -09/20/2021 22:02:15 - INFO - __main__ - Step 34858: {'lr': 0.00019958541519554107, 'samples': 1115456, 'steps': 2178, 'loss/train': 2.2626864910125732} -09/20/2021 22:02:15 - INFO - __main__ - Step 34859: {'lr': 0.00019958541519554107, 'samples': 1115488, 'steps': 2178, 'loss/train': 1.633602499961853} -09/20/2021 22:02:16 - INFO - __main__ - Step 34860: {'lr': 0.00019958541519554107, 'samples': 1115520, 'steps': 2178, 'loss/train': 3.037538766860962} -09/20/2021 22:02:17 - INFO - __main__ - Step 34861: {'lr': 0.00019958541519554107, 'samples': 1115552, 'steps': 2178, 'loss/train': 2.5920698642730713} -09/20/2021 22:02:18 - INFO - __main__ - Step 34862: {'lr': 0.00019958541519554107, 'samples': 1115584, 'steps': 2178, 'loss/train': 1.6388194561004639} -09/20/2021 22:02:18 - INFO - __main__ - Step 34863: {'lr': 0.00019958541519554107, 'samples': 1115616, 'steps': 2178, 'loss/train': 2.2522451877593994} -09/20/2021 22:02:19 - INFO - __main__ - Step 34864: {'lr': 0.00019958541519554107, 'samples': 1115648, 'steps': 2178, 'loss/train': 2.9397923946380615} -09/20/2021 22:02:20 - INFO - __main__ - Step 34865: {'lr': 0.0001995848347434967, 'samples': 1115680, 'steps': 2179, 'loss/train': 2.233536958694458} -09/20/2021 22:02:21 - INFO - __main__ - Step 34866: {'lr': 0.0001995848347434967, 'samples': 1115712, 'steps': 2179, 'loss/train': 1.6984682083129883} -09/20/2021 22:02:21 - INFO - __main__ - Step 34867: {'lr': 0.0001995848347434967, 'samples': 1115744, 'steps': 2179, 'loss/train': 2.0343480110168457} -09/20/2021 22:02:22 - INFO - __main__ - Step 34868: {'lr': 0.0001995848347434967, 'samples': 1115776, 'steps': 2179, 'loss/train': 2.2871131896972656} -09/20/2021 22:02:23 - INFO - __main__ - Step 34869: {'lr': 0.0001995848347434967, 'samples': 1115808, 'steps': 2179, 'loss/train': 0.681267261505127} -09/20/2021 22:02:24 - INFO - __main__ - Step 34870: {'lr': 0.0001995848347434967, 'samples': 1115840, 'steps': 2179, 'loss/train': 1.2482833862304688} -09/20/2021 22:02:24 - INFO - __main__ - Step 34871: {'lr': 0.0001995848347434967, 'samples': 1115872, 'steps': 2179, 'loss/train': 2.7484958171844482} -09/20/2021 22:02:25 - INFO - __main__ - Step 34872: {'lr': 0.0001995848347434967, 'samples': 1115904, 'steps': 2179, 'loss/train': 1.9608426094055176} -09/20/2021 22:02:26 - INFO - __main__ - Step 34873: {'lr': 0.0001995848347434967, 'samples': 1115936, 'steps': 2179, 'loss/train': 2.059811592102051} -09/20/2021 22:02:27 - INFO - __main__ - Step 34874: {'lr': 0.0001995848347434967, 'samples': 1115968, 'steps': 2179, 'loss/train': 3.1162803173065186} -09/20/2021 22:02:27 - INFO - __main__ - Step 34875: {'lr': 0.0001995848347434967, 'samples': 1116000, 'steps': 2179, 'loss/train': 1.7840170860290527} -09/20/2021 22:02:28 - INFO - __main__ - Step 34876: {'lr': 0.0001995848347434967, 'samples': 1116032, 'steps': 2179, 'loss/train': 1.6080281734466553} -09/20/2021 22:02:29 - INFO - __main__ - Step 34877: {'lr': 0.0001995848347434967, 'samples': 1116064, 'steps': 2179, 'loss/train': 2.7618298530578613} -09/20/2021 22:02:30 - INFO - __main__ - Step 34878: {'lr': 0.0001995848347434967, 'samples': 1116096, 'steps': 2179, 'loss/train': 2.979322671890259} -09/20/2021 22:02:30 - INFO - __main__ - Step 34879: {'lr': 0.0001995848347434967, 'samples': 1116128, 'steps': 2179, 'loss/train': 2.826322078704834} -09/20/2021 22:02:31 - INFO - __main__ - Step 34880: {'lr': 0.0001995848347434967, 'samples': 1116160, 'steps': 2179, 'loss/train': 1.8829673528671265} -09/20/2021 22:02:32 - INFO - __main__ - Step 34881: {'lr': 0.00019958425388624202, 'samples': 1116192, 'steps': 2180, 'loss/train': 2.5718698501586914} -09/20/2021 22:02:33 - INFO - __main__ - Step 34882: {'lr': 0.00019958425388624202, 'samples': 1116224, 'steps': 2180, 'loss/train': 2.2839977741241455} -09/20/2021 22:02:35 - INFO - __main__ - Step 34883: {'lr': 0.00019958425388624202, 'samples': 1116256, 'steps': 2180, 'loss/train': 3.660996198654175} -09/20/2021 22:02:35 - INFO - __main__ - Step 34884: {'lr': 0.00019958425388624202, 'samples': 1116288, 'steps': 2180, 'loss/train': 2.130929470062256} -09/20/2021 22:02:36 - INFO - __main__ - Step 34885: {'lr': 0.00019958425388624202, 'samples': 1116320, 'steps': 2180, 'loss/train': 1.6694523096084595} -09/20/2021 22:02:37 - INFO - __main__ - Step 34886: {'lr': 0.00019958425388624202, 'samples': 1116352, 'steps': 2180, 'loss/train': 2.039292573928833} -09/20/2021 22:02:38 - INFO - __main__ - Step 34887: {'lr': 0.00019958425388624202, 'samples': 1116384, 'steps': 2180, 'loss/train': 1.1314905881881714} -09/20/2021 22:02:38 - INFO - __main__ - Step 34888: {'lr': 0.00019958425388624202, 'samples': 1116416, 'steps': 2180, 'loss/train': 2.2785284519195557} -09/20/2021 22:02:39 - INFO - __main__ - Step 34889: {'lr': 0.00019958425388624202, 'samples': 1116448, 'steps': 2180, 'loss/train': 2.392378807067871} -09/20/2021 22:02:40 - INFO - __main__ - Step 34890: {'lr': 0.00019958425388624202, 'samples': 1116480, 'steps': 2180, 'loss/train': 2.850745916366577} -09/20/2021 22:02:41 - INFO - __main__ - Step 34891: {'lr': 0.00019958425388624202, 'samples': 1116512, 'steps': 2180, 'loss/train': 2.3638105392456055} -09/20/2021 22:02:41 - INFO - __main__ - Step 34892: {'lr': 0.00019958425388624202, 'samples': 1116544, 'steps': 2180, 'loss/train': 1.8387905359268188} -09/20/2021 22:02:42 - INFO - __main__ - Step 34893: {'lr': 0.00019958425388624202, 'samples': 1116576, 'steps': 2180, 'loss/train': 2.0143167972564697} -09/20/2021 22:02:43 - INFO - __main__ - Step 34894: {'lr': 0.00019958425388624202, 'samples': 1116608, 'steps': 2180, 'loss/train': 2.0781185626983643} -09/20/2021 22:02:44 - INFO - __main__ - Step 34895: {'lr': 0.00019958425388624202, 'samples': 1116640, 'steps': 2180, 'loss/train': 3.1957297325134277} -09/20/2021 22:02:44 - INFO - __main__ - Step 34896: {'lr': 0.00019958425388624202, 'samples': 1116672, 'steps': 2180, 'loss/train': 3.0928242206573486} -09/20/2021 22:02:45 - INFO - __main__ - Step 34897: {'lr': 0.00019958367262377938, 'samples': 1116704, 'steps': 2181, 'loss/train': 3.749873161315918} -09/20/2021 22:02:46 - INFO - __main__ - Step 34898: {'lr': 0.00019958367262377938, 'samples': 1116736, 'steps': 2181, 'loss/train': 3.8307957649230957} -09/20/2021 22:02:47 - INFO - __main__ - Step 34899: {'lr': 0.00019958367262377938, 'samples': 1116768, 'steps': 2181, 'loss/train': 3.0747618675231934} -09/20/2021 22:02:48 - INFO - __main__ - Step 34900: {'lr': 0.00019958367262377938, 'samples': 1116800, 'steps': 2181, 'loss/train': 2.2964415550231934} -09/20/2021 22:02:48 - INFO - __main__ - Step 34901: {'lr': 0.00019958367262377938, 'samples': 1116832, 'steps': 2181, 'loss/train': 2.641127109527588} -09/20/2021 22:02:49 - INFO - __main__ - Step 34902: {'lr': 0.00019958367262377938, 'samples': 1116864, 'steps': 2181, 'loss/train': 2.1484615802764893} -09/20/2021 22:02:50 - INFO - __main__ - Step 34903: {'lr': 0.00019958367262377938, 'samples': 1116896, 'steps': 2181, 'loss/train': 2.877659797668457} -09/20/2021 22:02:51 - INFO - __main__ - Step 34904: {'lr': 0.00019958367262377938, 'samples': 1116928, 'steps': 2181, 'loss/train': 2.220017194747925} -09/20/2021 22:02:51 - INFO - __main__ - Step 34905: {'lr': 0.00019958367262377938, 'samples': 1116960, 'steps': 2181, 'loss/train': 2.096508264541626} -09/20/2021 22:02:52 - INFO - __main__ - Step 34906: {'lr': 0.00019958367262377938, 'samples': 1116992, 'steps': 2181, 'loss/train': 2.4373245239257812} -09/20/2021 22:02:53 - INFO - __main__ - Step 34907: {'lr': 0.00019958367262377938, 'samples': 1117024, 'steps': 2181, 'loss/train': 1.7962661981582642} -09/20/2021 22:02:54 - INFO - __main__ - Step 34908: {'lr': 0.00019958367262377938, 'samples': 1117056, 'steps': 2181, 'loss/train': 2.5828428268432617} -09/20/2021 22:02:54 - INFO - __main__ - Step 34909: {'lr': 0.00019958367262377938, 'samples': 1117088, 'steps': 2181, 'loss/train': 2.524217128753662} -09/20/2021 22:02:55 - INFO - __main__ - Step 34910: {'lr': 0.00019958367262377938, 'samples': 1117120, 'steps': 2181, 'loss/train': 1.637535572052002} -09/20/2021 22:02:56 - INFO - __main__ - Step 34911: {'lr': 0.00019958367262377938, 'samples': 1117152, 'steps': 2181, 'loss/train': 2.0755228996276855} -09/20/2021 22:02:57 - INFO - __main__ - Step 34912: {'lr': 0.00019958367262377938, 'samples': 1117184, 'steps': 2181, 'loss/train': 2.885551929473877} -09/20/2021 22:02:57 - INFO - __main__ - Step 34913: {'lr': 0.00019958309095611116, 'samples': 1117216, 'steps': 2182, 'loss/train': 2.2363202571868896} -09/20/2021 22:02:59 - INFO - __main__ - Step 34914: {'lr': 0.00019958309095611116, 'samples': 1117248, 'steps': 2182, 'loss/train': 1.8890961408615112} -09/20/2021 22:03:00 - INFO - __main__ - Step 34915: {'lr': 0.00019958309095611116, 'samples': 1117280, 'steps': 2182, 'loss/train': 1.662566900253296} -09/20/2021 22:03:00 - INFO - __main__ - Step 34916: {'lr': 0.00019958309095611116, 'samples': 1117312, 'steps': 2182, 'loss/train': 2.1523256301879883} -09/20/2021 22:03:01 - INFO - __main__ - Step 34917: {'lr': 0.00019958309095611116, 'samples': 1117344, 'steps': 2182, 'loss/train': 1.9989525079727173} -09/20/2021 22:03:02 - INFO - __main__ - Step 34918: {'lr': 0.00019958309095611116, 'samples': 1117376, 'steps': 2182, 'loss/train': 1.8831311464309692} -09/20/2021 22:03:03 - INFO - __main__ - Step 34919: {'lr': 0.00019958309095611116, 'samples': 1117408, 'steps': 2182, 'loss/train': 2.057219982147217} -09/20/2021 22:03:03 - INFO - __main__ - Step 34920: {'lr': 0.00019958309095611116, 'samples': 1117440, 'steps': 2182, 'loss/train': 2.2283363342285156} -09/20/2021 22:03:04 - INFO - __main__ - Step 34921: {'lr': 0.00019958309095611116, 'samples': 1117472, 'steps': 2182, 'loss/train': 3.080659866333008} -09/20/2021 22:03:05 - INFO - __main__ - Step 34922: {'lr': 0.00019958309095611116, 'samples': 1117504, 'steps': 2182, 'loss/train': 2.7001943588256836} -09/20/2021 22:03:06 - INFO - __main__ - Step 34923: {'lr': 0.00019958309095611116, 'samples': 1117536, 'steps': 2182, 'loss/train': 1.960174560546875} -09/20/2021 22:03:06 - INFO - __main__ - Step 34924: {'lr': 0.00019958309095611116, 'samples': 1117568, 'steps': 2182, 'loss/train': 2.326364040374756} -09/20/2021 22:03:07 - INFO - __main__ - Step 34925: {'lr': 0.00019958309095611116, 'samples': 1117600, 'steps': 2182, 'loss/train': 2.0421090126037598} -09/20/2021 22:03:08 - INFO - __main__ - Step 34926: {'lr': 0.00019958309095611116, 'samples': 1117632, 'steps': 2182, 'loss/train': 2.1048460006713867} -09/20/2021 22:03:09 - INFO - __main__ - Step 34927: {'lr': 0.00019958309095611116, 'samples': 1117664, 'steps': 2182, 'loss/train': 1.798315405845642} -09/20/2021 22:03:09 - INFO - __main__ - Step 34928: {'lr': 0.00019958309095611116, 'samples': 1117696, 'steps': 2182, 'loss/train': 2.4025650024414062} -09/20/2021 22:03:10 - INFO - __main__ - Step 34929: {'lr': 0.00019958250888323976, 'samples': 1117728, 'steps': 2183, 'loss/train': 1.9778450727462769} -09/20/2021 22:03:11 - INFO - __main__ - Step 34930: {'lr': 0.00019958250888323976, 'samples': 1117760, 'steps': 2183, 'loss/train': 2.8077232837677} -09/20/2021 22:03:12 - INFO - __main__ - Step 34931: {'lr': 0.00019958250888323976, 'samples': 1117792, 'steps': 2183, 'loss/train': 3.1338696479797363} -09/20/2021 22:03:12 - INFO - __main__ - Step 34932: {'lr': 0.00019958250888323976, 'samples': 1117824, 'steps': 2183, 'loss/train': 2.1334705352783203} -09/20/2021 22:03:13 - INFO - __main__ - Step 34933: {'lr': 0.00019958250888323976, 'samples': 1117856, 'steps': 2183, 'loss/train': 2.8080570697784424} -09/20/2021 22:03:14 - INFO - __main__ - Step 34934: {'lr': 0.00019958250888323976, 'samples': 1117888, 'steps': 2183, 'loss/train': 0.36887601017951965} -09/20/2021 22:03:15 - INFO - __main__ - Step 34935: {'lr': 0.00019958250888323976, 'samples': 1117920, 'steps': 2183, 'loss/train': 0.17507600784301758} -09/20/2021 22:03:15 - INFO - __main__ - Step 34936: {'lr': 0.00019958250888323976, 'samples': 1117952, 'steps': 2183, 'loss/train': 0.2505275309085846} -09/20/2021 22:03:16 - INFO - __main__ - Step 34937: {'lr': 0.00019958250888323976, 'samples': 1117984, 'steps': 2183, 'loss/train': 1.9154839515686035} -09/20/2021 22:03:17 - INFO - __main__ - Step 34938: {'lr': 0.00019958250888323976, 'samples': 1118016, 'steps': 2183, 'loss/train': 1.7889080047607422} -09/20/2021 22:03:18 - INFO - __main__ - Step 34939: {'lr': 0.00019958250888323976, 'samples': 1118048, 'steps': 2183, 'loss/train': 2.5639309883117676} -09/20/2021 22:03:18 - INFO - __main__ - Step 34940: {'lr': 0.00019958250888323976, 'samples': 1118080, 'steps': 2183, 'loss/train': 2.0448243618011475} -09/20/2021 22:03:19 - INFO - __main__ - Step 34941: {'lr': 0.00019958250888323976, 'samples': 1118112, 'steps': 2183, 'loss/train': 2.035871982574463} -09/20/2021 22:03:20 - INFO - __main__ - Step 34942: {'lr': 0.00019958250888323976, 'samples': 1118144, 'steps': 2183, 'loss/train': 2.3442299365997314} -09/20/2021 22:03:21 - INFO - __main__ - Step 34943: {'lr': 0.00019958250888323976, 'samples': 1118176, 'steps': 2183, 'loss/train': 2.1445670127868652} -09/20/2021 22:03:23 - INFO - __main__ - Step 34944: {'lr': 0.00019958250888323976, 'samples': 1118208, 'steps': 2183, 'loss/train': 2.192948818206787} -09/20/2021 22:03:23 - INFO - __main__ - Step 34945: {'lr': 0.00019958192640516748, 'samples': 1118240, 'steps': 2184, 'loss/train': 2.1100685596466064} -09/20/2021 22:03:24 - INFO - __main__ - Step 34946: {'lr': 0.00019958192640516748, 'samples': 1118272, 'steps': 2184, 'loss/train': 2.438173532485962} -09/20/2021 22:03:25 - INFO - __main__ - Step 34947: {'lr': 0.00019958192640516748, 'samples': 1118304, 'steps': 2184, 'loss/train': 1.7236679792404175} -09/20/2021 22:03:26 - INFO - __main__ - Step 34948: {'lr': 0.00019958192640516748, 'samples': 1118336, 'steps': 2184, 'loss/train': 1.7731934785842896} -09/20/2021 22:03:26 - INFO - __main__ - Step 34949: {'lr': 0.00019958192640516748, 'samples': 1118368, 'steps': 2184, 'loss/train': 2.756211042404175} -09/20/2021 22:03:27 - INFO - __main__ - Step 34950: {'lr': 0.00019958192640516748, 'samples': 1118400, 'steps': 2184, 'loss/train': 2.114319086074829} -09/20/2021 22:03:28 - INFO - __main__ - Step 34951: {'lr': 0.00019958192640516748, 'samples': 1118432, 'steps': 2184, 'loss/train': 0.5265076160430908} -09/20/2021 22:03:29 - INFO - __main__ - Step 34952: {'lr': 0.00019958192640516748, 'samples': 1118464, 'steps': 2184, 'loss/train': 2.1489717960357666} -09/20/2021 22:03:29 - INFO - __main__ - Step 34953: {'lr': 0.00019958192640516748, 'samples': 1118496, 'steps': 2184, 'loss/train': 2.726384162902832} -09/20/2021 22:03:30 - INFO - __main__ - Step 34954: {'lr': 0.00019958192640516748, 'samples': 1118528, 'steps': 2184, 'loss/train': 2.4685301780700684} -09/20/2021 22:03:31 - INFO - __main__ - Step 34955: {'lr': 0.00019958192640516748, 'samples': 1118560, 'steps': 2184, 'loss/train': 0.4951232373714447} -09/20/2021 22:03:32 - INFO - __main__ - Step 34956: {'lr': 0.00019958192640516748, 'samples': 1118592, 'steps': 2184, 'loss/train': 2.151202440261841} -09/20/2021 22:03:32 - INFO - __main__ - Step 34957: {'lr': 0.00019958192640516748, 'samples': 1118624, 'steps': 2184, 'loss/train': 1.372084140777588} -09/20/2021 22:03:33 - INFO - __main__ - Step 34958: {'lr': 0.00019958192640516748, 'samples': 1118656, 'steps': 2184, 'loss/train': 1.362960934638977} -09/20/2021 22:03:34 - INFO - __main__ - Step 34959: {'lr': 0.00019958192640516748, 'samples': 1118688, 'steps': 2184, 'loss/train': 1.928313136100769} -09/20/2021 22:03:35 - INFO - __main__ - Step 34960: {'lr': 0.00019958192640516748, 'samples': 1118720, 'steps': 2184, 'loss/train': 2.7339742183685303} -09/20/2021 22:03:36 - INFO - __main__ - Step 34961: {'lr': 0.00019958134352189677, 'samples': 1118752, 'steps': 2185, 'loss/train': 1.6450204849243164} -09/20/2021 22:03:36 - INFO - __main__ - Step 34962: {'lr': 0.00019958134352189677, 'samples': 1118784, 'steps': 2185, 'loss/train': 2.361928701400757} -09/20/2021 22:03:37 - INFO - __main__ - Step 34963: {'lr': 0.00019958134352189677, 'samples': 1118816, 'steps': 2185, 'loss/train': 1.7684799432754517} -09/20/2021 22:03:38 - INFO - __main__ - Step 34964: {'lr': 0.00019958134352189677, 'samples': 1118848, 'steps': 2185, 'loss/train': 2.0394411087036133} -09/20/2021 22:03:39 - INFO - __main__ - Step 34965: {'lr': 0.00019958134352189677, 'samples': 1118880, 'steps': 2185, 'loss/train': 1.8213093280792236} -09/20/2021 22:03:39 - INFO - __main__ - Step 34966: {'lr': 0.00019958134352189677, 'samples': 1118912, 'steps': 2185, 'loss/train': 2.645780563354492} -09/20/2021 22:03:40 - INFO - __main__ - Step 34967: {'lr': 0.00019958134352189677, 'samples': 1118944, 'steps': 2185, 'loss/train': 2.047417402267456} -09/20/2021 22:03:41 - INFO - __main__ - Step 34968: {'lr': 0.00019958134352189677, 'samples': 1118976, 'steps': 2185, 'loss/train': 2.7348899841308594} -09/20/2021 22:03:42 - INFO - __main__ - Step 34969: {'lr': 0.00019958134352189677, 'samples': 1119008, 'steps': 2185, 'loss/train': 0.39336392283439636} -09/20/2021 22:03:42 - INFO - __main__ - Step 34970: {'lr': 0.00019958134352189677, 'samples': 1119040, 'steps': 2185, 'loss/train': 0.23454278707504272} -09/20/2021 22:03:43 - INFO - __main__ - Step 34971: {'lr': 0.00019958134352189677, 'samples': 1119072, 'steps': 2185, 'loss/train': 0.34430888295173645} -09/20/2021 22:03:44 - INFO - __main__ - Step 34972: {'lr': 0.00019958134352189677, 'samples': 1119104, 'steps': 2185, 'loss/train': 0.2632718086242676} -09/20/2021 22:03:45 - INFO - __main__ - Step 34973: {'lr': 0.00019958134352189677, 'samples': 1119136, 'steps': 2185, 'loss/train': 0.3922818899154663} -09/20/2021 22:03:45 - INFO - __main__ - Step 34974: {'lr': 0.00019958134352189677, 'samples': 1119168, 'steps': 2185, 'loss/train': 0.3837053179740906} -09/20/2021 22:03:46 - INFO - __main__ - Step 34975: {'lr': 0.00019958134352189677, 'samples': 1119200, 'steps': 2185, 'loss/train': 0.6263701319694519} -09/20/2021 22:03:47 - INFO - __main__ - Step 34976: {'lr': 0.00019958134352189677, 'samples': 1119232, 'steps': 2185, 'loss/train': 0.6359872817993164} -09/20/2021 22:03:48 - INFO - __main__ - Step 34977: {'lr': 0.00019958076023342993, 'samples': 1119264, 'steps': 2186, 'loss/train': 3.05334734916687} -09/20/2021 22:03:49 - INFO - __main__ - Step 34978: {'lr': 0.00019958076023342993, 'samples': 1119296, 'steps': 2186, 'loss/train': 0.6092352271080017} -09/20/2021 22:03:50 - INFO - __main__ - Step 34979: {'lr': 0.00019958076023342993, 'samples': 1119328, 'steps': 2186, 'loss/train': 2.4923975467681885} -09/20/2021 22:03:51 - INFO - __main__ - Step 34980: {'lr': 0.00019958076023342993, 'samples': 1119360, 'steps': 2186, 'loss/train': 2.2935428619384766} -09/20/2021 22:03:51 - INFO - __main__ - Step 34981: {'lr': 0.00019958076023342993, 'samples': 1119392, 'steps': 2186, 'loss/train': 2.0427486896514893} -09/20/2021 22:03:52 - INFO - __main__ - Step 34982: {'lr': 0.00019958076023342993, 'samples': 1119424, 'steps': 2186, 'loss/train': 1.7075631618499756} -09/20/2021 22:03:53 - INFO - __main__ - Step 34983: {'lr': 0.00019958076023342993, 'samples': 1119456, 'steps': 2186, 'loss/train': 3.034156084060669} -09/20/2021 22:03:53 - INFO - __main__ - Step 34984: {'lr': 0.00019958076023342993, 'samples': 1119488, 'steps': 2186, 'loss/train': 1.8860896825790405} -09/20/2021 22:03:54 - INFO - __main__ - Step 34985: {'lr': 0.00019958076023342993, 'samples': 1119520, 'steps': 2186, 'loss/train': 1.9845075607299805} -09/20/2021 22:03:55 - INFO - __main__ - Step 34986: {'lr': 0.00019958076023342993, 'samples': 1119552, 'steps': 2186, 'loss/train': 1.9650895595550537} -09/20/2021 22:03:56 - INFO - __main__ - Step 34987: {'lr': 0.00019958076023342993, 'samples': 1119584, 'steps': 2186, 'loss/train': 2.099271297454834} -09/20/2021 22:03:56 - INFO - __main__ - Step 34988: {'lr': 0.00019958076023342993, 'samples': 1119616, 'steps': 2186, 'loss/train': 1.8524991273880005} -09/20/2021 22:03:57 - INFO - __main__ - Step 34989: {'lr': 0.00019958076023342993, 'samples': 1119648, 'steps': 2186, 'loss/train': 1.4211846590042114} -09/20/2021 22:03:58 - INFO - __main__ - Step 34990: {'lr': 0.00019958076023342993, 'samples': 1119680, 'steps': 2186, 'loss/train': 0.39365240931510925} -09/20/2021 22:03:59 - INFO - __main__ - Step 34991: {'lr': 0.00019958076023342993, 'samples': 1119712, 'steps': 2186, 'loss/train': 2.233429431915283} -09/20/2021 22:03:59 - INFO - __main__ - Step 34992: {'lr': 0.00019958076023342993, 'samples': 1119744, 'steps': 2186, 'loss/train': 2.3992886543273926} -09/20/2021 22:04:00 - INFO - __main__ - Step 34993: {'lr': 0.00019958017653976936, 'samples': 1119776, 'steps': 2187, 'loss/train': 1.9513386487960815} -09/20/2021 22:04:01 - INFO - __main__ - Step 34994: {'lr': 0.00019958017653976936, 'samples': 1119808, 'steps': 2187, 'loss/train': 1.4724565744400024} -09/20/2021 22:04:02 - INFO - __main__ - Step 34995: {'lr': 0.00019958017653976936, 'samples': 1119840, 'steps': 2187, 'loss/train': 2.3398826122283936} -09/20/2021 22:04:03 - INFO - __main__ - Step 34996: {'lr': 0.00019958017653976936, 'samples': 1119872, 'steps': 2187, 'loss/train': 1.5207546949386597} -09/20/2021 22:04:03 - INFO - __main__ - Step 34997: {'lr': 0.00019958017653976936, 'samples': 1119904, 'steps': 2187, 'loss/train': 2.4252843856811523} -09/20/2021 22:04:04 - INFO - __main__ - Step 34998: {'lr': 0.00019958017653976936, 'samples': 1119936, 'steps': 2187, 'loss/train': 3.1848361492156982} -09/20/2021 22:04:05 - INFO - __main__ - Step 34999: {'lr': 0.00019958017653976936, 'samples': 1119968, 'steps': 2187, 'loss/train': 2.034727096557617} -09/20/2021 22:04:06 - INFO - __main__ - Step 35000: {'lr': 0.00019958017653976936, 'samples': 1120000, 'steps': 2187, 'loss/train': 2.083341121673584} -09/20/2021 22:04:06 - INFO - __main__ - Step 35001: {'lr': 0.00019958017653976936, 'samples': 1120032, 'steps': 2187, 'loss/train': 2.73588490486145} -09/20/2021 22:04:07 - INFO - __main__ - Step 35002: {'lr': 0.00019958017653976936, 'samples': 1120064, 'steps': 2187, 'loss/train': 2.2239763736724854} -09/20/2021 22:04:08 - INFO - __main__ - Step 35003: {'lr': 0.00019958017653976936, 'samples': 1120096, 'steps': 2187, 'loss/train': 2.6901438236236572} -09/20/2021 22:04:09 - INFO - __main__ - Step 35004: {'lr': 0.00019958017653976936, 'samples': 1120128, 'steps': 2187, 'loss/train': 2.4282805919647217} -09/20/2021 22:04:09 - INFO - __main__ - Step 35005: {'lr': 0.00019958017653976936, 'samples': 1120160, 'steps': 2187, 'loss/train': 0.8696702122688293} -09/20/2021 22:04:10 - INFO - __main__ - Step 35006: {'lr': 0.00019958017653976936, 'samples': 1120192, 'steps': 2187, 'loss/train': 2.591787338256836} -09/20/2021 22:04:12 - INFO - __main__ - Step 35007: {'lr': 0.00019958017653976936, 'samples': 1120224, 'steps': 2187, 'loss/train': 2.657661199569702} -09/20/2021 22:04:12 - INFO - __main__ - Step 35008: {'lr': 0.00019958017653976936, 'samples': 1120256, 'steps': 2187, 'loss/train': 1.7216850519180298} -09/20/2021 22:04:13 - INFO - __main__ - Step 35009: {'lr': 0.00019957959244091747, 'samples': 1120288, 'steps': 2188, 'loss/train': 2.649171829223633} -09/20/2021 22:04:14 - INFO - __main__ - Step 35010: {'lr': 0.00019957959244091747, 'samples': 1120320, 'steps': 2188, 'loss/train': 2.6195218563079834} -09/20/2021 22:04:15 - INFO - __main__ - Step 35011: {'lr': 0.00019957959244091747, 'samples': 1120352, 'steps': 2188, 'loss/train': 2.7344415187835693} -09/20/2021 22:04:15 - INFO - __main__ - Step 35012: {'lr': 0.00019957959244091747, 'samples': 1120384, 'steps': 2188, 'loss/train': 2.4790282249450684} -09/20/2021 22:04:16 - INFO - __main__ - Step 35013: {'lr': 0.00019957959244091747, 'samples': 1120416, 'steps': 2188, 'loss/train': 0.2490708976984024} -09/20/2021 22:04:17 - INFO - __main__ - Step 35014: {'lr': 0.00019957959244091747, 'samples': 1120448, 'steps': 2188, 'loss/train': 0.1708061397075653} -09/20/2021 22:04:18 - INFO - __main__ - Step 35015: {'lr': 0.00019957959244091747, 'samples': 1120480, 'steps': 2188, 'loss/train': 1.885945439338684} -09/20/2021 22:04:18 - INFO - __main__ - Step 35016: {'lr': 0.00019957959244091747, 'samples': 1120512, 'steps': 2188, 'loss/train': 3.133066415786743} -09/20/2021 22:04:19 - INFO - __main__ - Step 35017: {'lr': 0.00019957959244091747, 'samples': 1120544, 'steps': 2188, 'loss/train': 1.6969995498657227} -09/20/2021 22:04:20 - INFO - __main__ - Step 35018: {'lr': 0.00019957959244091747, 'samples': 1120576, 'steps': 2188, 'loss/train': 1.421505093574524} -09/20/2021 22:04:21 - INFO - __main__ - Step 35019: {'lr': 0.00019957959244091747, 'samples': 1120608, 'steps': 2188, 'loss/train': 2.427978277206421} -09/20/2021 22:04:21 - INFO - __main__ - Step 35020: {'lr': 0.00019957959244091747, 'samples': 1120640, 'steps': 2188, 'loss/train': 1.8141509294509888} -09/20/2021 22:04:22 - INFO - __main__ - Step 35021: {'lr': 0.00019957959244091747, 'samples': 1120672, 'steps': 2188, 'loss/train': 2.283189296722412} -09/20/2021 22:04:23 - INFO - __main__ - Step 35022: {'lr': 0.00019957959244091747, 'samples': 1120704, 'steps': 2188, 'loss/train': 2.1206207275390625} -09/20/2021 22:04:24 - INFO - __main__ - Step 35023: {'lr': 0.00019957959244091747, 'samples': 1120736, 'steps': 2188, 'loss/train': 1.9525593519210815} -09/20/2021 22:04:24 - INFO - __main__ - Step 35024: {'lr': 0.00019957959244091747, 'samples': 1120768, 'steps': 2188, 'loss/train': 1.33756422996521} -09/20/2021 22:04:25 - INFO - __main__ - Step 35025: {'lr': 0.00019957900793687657, 'samples': 1120800, 'steps': 2189, 'loss/train': 2.1564857959747314} -09/20/2021 22:04:26 - INFO - __main__ - Step 35026: {'lr': 0.00019957900793687657, 'samples': 1120832, 'steps': 2189, 'loss/train': 0.23248519003391266} -09/20/2021 22:04:27 - INFO - __main__ - Step 35027: {'lr': 0.00019957900793687657, 'samples': 1120864, 'steps': 2189, 'loss/train': 0.30483219027519226} -09/20/2021 22:04:28 - INFO - __main__ - Step 35028: {'lr': 0.00019957900793687657, 'samples': 1120896, 'steps': 2189, 'loss/train': 0.4132009744644165} -09/20/2021 22:04:28 - INFO - __main__ - Step 35029: {'lr': 0.00019957900793687657, 'samples': 1120928, 'steps': 2189, 'loss/train': 2.6797585487365723} -09/20/2021 22:04:29 - INFO - __main__ - Step 35030: {'lr': 0.00019957900793687657, 'samples': 1120960, 'steps': 2189, 'loss/train': 2.5169360637664795} -09/20/2021 22:04:30 - INFO - __main__ - Step 35031: {'lr': 0.00019957900793687657, 'samples': 1120992, 'steps': 2189, 'loss/train': 0.9721853137016296} -09/20/2021 22:04:31 - INFO - __main__ - Step 35032: {'lr': 0.00019957900793687657, 'samples': 1121024, 'steps': 2189, 'loss/train': 3.2928197383880615} -09/20/2021 22:04:31 - INFO - __main__ - Step 35033: {'lr': 0.00019957900793687657, 'samples': 1121056, 'steps': 2189, 'loss/train': 1.9341373443603516} -09/20/2021 22:04:32 - INFO - __main__ - Step 35034: {'lr': 0.00019957900793687657, 'samples': 1121088, 'steps': 2189, 'loss/train': 2.1617321968078613} -09/20/2021 22:04:33 - INFO - __main__ - Step 35035: {'lr': 0.00019957900793687657, 'samples': 1121120, 'steps': 2189, 'loss/train': 2.317870855331421} -09/20/2021 22:04:34 - INFO - __main__ - Step 35036: {'lr': 0.00019957900793687657, 'samples': 1121152, 'steps': 2189, 'loss/train': 2.416790246963501} -09/20/2021 22:04:34 - INFO - __main__ - Step 35037: {'lr': 0.00019957900793687657, 'samples': 1121184, 'steps': 2189, 'loss/train': 0.2222900092601776} -09/20/2021 22:04:35 - INFO - __main__ - Step 35038: {'lr': 0.00019957900793687657, 'samples': 1121216, 'steps': 2189, 'loss/train': 0.21781374514102936} -09/20/2021 22:04:36 - INFO - __main__ - Step 35039: {'lr': 0.00019957900793687657, 'samples': 1121248, 'steps': 2189, 'loss/train': 0.2351258248090744} -09/20/2021 22:04:37 - INFO - __main__ - Step 35040: {'lr': 0.00019957900793687657, 'samples': 1121280, 'steps': 2189, 'loss/train': 2.501560688018799} -09/20/2021 22:04:38 - INFO - __main__ - Step 35041: {'lr': 0.00019957842302764908, 'samples': 1121312, 'steps': 2190, 'loss/train': 0.7467392086982727} -09/20/2021 22:04:39 - INFO - __main__ - Step 35042: {'lr': 0.00019957842302764908, 'samples': 1121344, 'steps': 2190, 'loss/train': 2.556070566177368} -09/20/2021 22:04:40 - INFO - __main__ - Step 35043: {'lr': 0.00019957842302764908, 'samples': 1121376, 'steps': 2190, 'loss/train': 0.4544278085231781} -09/20/2021 22:04:40 - INFO - __main__ - Step 35044: {'lr': 0.00019957842302764908, 'samples': 1121408, 'steps': 2190, 'loss/train': 1.9504636526107788} -09/20/2021 22:04:41 - INFO - __main__ - Step 35045: {'lr': 0.00019957842302764908, 'samples': 1121440, 'steps': 2190, 'loss/train': 0.7378022074699402} -09/20/2021 22:04:42 - INFO - __main__ - Step 35046: {'lr': 0.00019957842302764908, 'samples': 1121472, 'steps': 2190, 'loss/train': 3.050687551498413} -09/20/2021 22:04:43 - INFO - __main__ - Step 35047: {'lr': 0.00019957842302764908, 'samples': 1121504, 'steps': 2190, 'loss/train': 1.8392397165298462} -09/20/2021 22:04:43 - INFO - __main__ - Step 35048: {'lr': 0.00019957842302764908, 'samples': 1121536, 'steps': 2190, 'loss/train': 1.6281086206436157} -09/20/2021 22:04:44 - INFO - __main__ - Step 35049: {'lr': 0.00019957842302764908, 'samples': 1121568, 'steps': 2190, 'loss/train': 2.2675118446350098} -09/20/2021 22:04:45 - INFO - __main__ - Step 35050: {'lr': 0.00019957842302764908, 'samples': 1121600, 'steps': 2190, 'loss/train': 3.0066983699798584} -09/20/2021 22:04:46 - INFO - __main__ - Step 35051: {'lr': 0.00019957842302764908, 'samples': 1121632, 'steps': 2190, 'loss/train': 1.1195672750473022} -09/20/2021 22:04:46 - INFO - __main__ - Step 35052: {'lr': 0.00019957842302764908, 'samples': 1121664, 'steps': 2190, 'loss/train': 1.894845724105835} -09/20/2021 22:04:47 - INFO - __main__ - Step 35053: {'lr': 0.00019957842302764908, 'samples': 1121696, 'steps': 2190, 'loss/train': 2.8505828380584717} -09/20/2021 22:04:48 - INFO - __main__ - Step 35054: {'lr': 0.00019957842302764908, 'samples': 1121728, 'steps': 2190, 'loss/train': 1.9258745908737183} -09/20/2021 22:04:49 - INFO - __main__ - Step 35055: {'lr': 0.00019957842302764908, 'samples': 1121760, 'steps': 2190, 'loss/train': 1.3469661474227905} -09/20/2021 22:04:49 - INFO - __main__ - Step 35056: {'lr': 0.00019957842302764908, 'samples': 1121792, 'steps': 2190, 'loss/train': 1.3466287851333618} -09/20/2021 22:04:50 - INFO - __main__ - Step 35057: {'lr': 0.0001995778377132374, 'samples': 1121824, 'steps': 2191, 'loss/train': 1.8806947469711304} -09/20/2021 22:04:51 - INFO - __main__ - Step 35058: {'lr': 0.0001995778377132374, 'samples': 1121856, 'steps': 2191, 'loss/train': 1.8046363592147827} -09/20/2021 22:04:52 - INFO - __main__ - Step 35059: {'lr': 0.0001995778377132374, 'samples': 1121888, 'steps': 2191, 'loss/train': 0.23965148627758026} -09/20/2021 22:04:52 - INFO - __main__ - Step 35060: {'lr': 0.0001995778377132374, 'samples': 1121920, 'steps': 2191, 'loss/train': 0.27103811502456665} -09/20/2021 22:04:53 - INFO - __main__ - Step 35061: {'lr': 0.0001995778377132374, 'samples': 1121952, 'steps': 2191, 'loss/train': 0.2105943262577057} -09/20/2021 22:04:54 - INFO - __main__ - Step 35062: {'lr': 0.0001995778377132374, 'samples': 1121984, 'steps': 2191, 'loss/train': 2.407374143600464} -09/20/2021 22:04:55 - INFO - __main__ - Step 35063: {'lr': 0.0001995778377132374, 'samples': 1122016, 'steps': 2191, 'loss/train': 2.0990285873413086} -09/20/2021 22:04:55 - INFO - __main__ - Step 35064: {'lr': 0.0001995778377132374, 'samples': 1122048, 'steps': 2191, 'loss/train': 1.9411487579345703} -09/20/2021 22:04:56 - INFO - __main__ - Step 35065: {'lr': 0.0001995778377132374, 'samples': 1122080, 'steps': 2191, 'loss/train': 1.6325546503067017} -09/20/2021 22:04:57 - INFO - __main__ - Step 35066: {'lr': 0.0001995778377132374, 'samples': 1122112, 'steps': 2191, 'loss/train': 2.9716925621032715} -09/20/2021 22:04:58 - INFO - __main__ - Step 35067: {'lr': 0.0001995778377132374, 'samples': 1122144, 'steps': 2191, 'loss/train': 2.6959853172302246} -09/20/2021 22:04:58 - INFO - __main__ - Step 35068: {'lr': 0.0001995778377132374, 'samples': 1122176, 'steps': 2191, 'loss/train': 2.4214587211608887} -09/20/2021 22:04:59 - INFO - __main__ - Step 35069: {'lr': 0.0001995778377132374, 'samples': 1122208, 'steps': 2191, 'loss/train': 2.3968920707702637} -09/20/2021 22:05:01 - INFO - __main__ - Step 35070: {'lr': 0.0001995778377132374, 'samples': 1122240, 'steps': 2191, 'loss/train': 1.6652944087982178} -09/20/2021 22:05:01 - INFO - __main__ - Step 35071: {'lr': 0.0001995778377132374, 'samples': 1122272, 'steps': 2191, 'loss/train': 1.8159592151641846} -09/20/2021 22:05:02 - INFO - __main__ - Step 35072: {'lr': 0.0001995778377132374, 'samples': 1122304, 'steps': 2191, 'loss/train': 3.7657792568206787} -09/20/2021 22:05:03 - INFO - __main__ - Step 35073: {'lr': 0.00019957725199364385, 'samples': 1122336, 'steps': 2192, 'loss/train': 3.83941912651062} -09/20/2021 22:05:04 - INFO - __main__ - Step 35074: {'lr': 0.00019957725199364385, 'samples': 1122368, 'steps': 2192, 'loss/train': 2.908762216567993} -09/20/2021 22:05:04 - INFO - __main__ - Step 35075: {'lr': 0.00019957725199364385, 'samples': 1122400, 'steps': 2192, 'loss/train': 3.4756791591644287} -09/20/2021 22:05:05 - INFO - __main__ - Step 35076: {'lr': 0.00019957725199364385, 'samples': 1122432, 'steps': 2192, 'loss/train': 3.1110191345214844} -09/20/2021 22:05:06 - INFO - __main__ - Step 35077: {'lr': 0.00019957725199364385, 'samples': 1122464, 'steps': 2192, 'loss/train': 1.3736690282821655} -09/20/2021 22:05:07 - INFO - __main__ - Step 35078: {'lr': 0.00019957725199364385, 'samples': 1122496, 'steps': 2192, 'loss/train': 1.9925990104675293} -09/20/2021 22:05:07 - INFO - __main__ - Step 35079: {'lr': 0.00019957725199364385, 'samples': 1122528, 'steps': 2192, 'loss/train': 3.4644577503204346} -09/20/2021 22:05:08 - INFO - __main__ - Step 35080: {'lr': 0.00019957725199364385, 'samples': 1122560, 'steps': 2192, 'loss/train': 2.714130163192749} -09/20/2021 22:05:09 - INFO - __main__ - Step 35081: {'lr': 0.00019957725199364385, 'samples': 1122592, 'steps': 2192, 'loss/train': 2.741478204727173} -09/20/2021 22:05:10 - INFO - __main__ - Step 35082: {'lr': 0.00019957725199364385, 'samples': 1122624, 'steps': 2192, 'loss/train': 2.2446093559265137} -09/20/2021 22:05:10 - INFO - __main__ - Step 35083: {'lr': 0.00019957725199364385, 'samples': 1122656, 'steps': 2192, 'loss/train': 1.890702724456787} -09/20/2021 22:05:11 - INFO - __main__ - Step 35084: {'lr': 0.00019957725199364385, 'samples': 1122688, 'steps': 2192, 'loss/train': 3.5565457344055176} -09/20/2021 22:05:12 - INFO - __main__ - Step 35085: {'lr': 0.00019957725199364385, 'samples': 1122720, 'steps': 2192, 'loss/train': 1.6062495708465576} -09/20/2021 22:05:13 - INFO - __main__ - Step 35086: {'lr': 0.00019957725199364385, 'samples': 1122752, 'steps': 2192, 'loss/train': 2.4475338459014893} -09/20/2021 22:05:13 - INFO - __main__ - Step 35087: {'lr': 0.00019957725199364385, 'samples': 1122784, 'steps': 2192, 'loss/train': 2.6826369762420654} -09/20/2021 22:05:14 - INFO - __main__ - Step 35088: {'lr': 0.00019957725199364385, 'samples': 1122816, 'steps': 2192, 'loss/train': 1.8616505861282349} -09/20/2021 22:05:15 - INFO - __main__ - Step 35089: {'lr': 0.00019957666586887087, 'samples': 1122848, 'steps': 2193, 'loss/train': 2.1796445846557617} -09/20/2021 22:05:16 - INFO - __main__ - Step 35090: {'lr': 0.00019957666586887087, 'samples': 1122880, 'steps': 2193, 'loss/train': 0.8939707279205322} -09/20/2021 22:05:17 - INFO - __main__ - Step 35091: {'lr': 0.00019957666586887087, 'samples': 1122912, 'steps': 2193, 'loss/train': 0.39596328139305115} -09/20/2021 22:05:17 - INFO - __main__ - Step 35092: {'lr': 0.00019957666586887087, 'samples': 1122944, 'steps': 2193, 'loss/train': 2.685123920440674} -09/20/2021 22:05:18 - INFO - __main__ - Step 35093: {'lr': 0.00019957666586887087, 'samples': 1122976, 'steps': 2193, 'loss/train': 2.176940679550171} -09/20/2021 22:05:19 - INFO - __main__ - Step 35094: {'lr': 0.00019957666586887087, 'samples': 1123008, 'steps': 2193, 'loss/train': 2.3947629928588867} -09/20/2021 22:05:20 - INFO - __main__ - Step 35095: {'lr': 0.00019957666586887087, 'samples': 1123040, 'steps': 2193, 'loss/train': 0.47234827280044556} -09/20/2021 22:05:20 - INFO - __main__ - Step 35096: {'lr': 0.00019957666586887087, 'samples': 1123072, 'steps': 2193, 'loss/train': 0.6051680445671082} -09/20/2021 22:05:21 - INFO - __main__ - Step 35097: {'lr': 0.00019957666586887087, 'samples': 1123104, 'steps': 2193, 'loss/train': 2.463728189468384} -09/20/2021 22:05:22 - INFO - __main__ - Step 35098: {'lr': 0.00019957666586887087, 'samples': 1123136, 'steps': 2193, 'loss/train': 2.2464215755462646} -09/20/2021 22:05:23 - INFO - __main__ - Step 35099: {'lr': 0.00019957666586887087, 'samples': 1123168, 'steps': 2193, 'loss/train': 3.349790096282959} -09/20/2021 22:05:24 - INFO - __main__ - Step 35100: {'lr': 0.00019957666586887087, 'samples': 1123200, 'steps': 2193, 'loss/train': 2.0448811054229736} -09/20/2021 22:05:25 - INFO - __main__ - Step 35101: {'lr': 0.00019957666586887087, 'samples': 1123232, 'steps': 2193, 'loss/train': 3.036339282989502} -09/20/2021 22:05:26 - INFO - __main__ - Step 35102: {'lr': 0.00019957666586887087, 'samples': 1123264, 'steps': 2193, 'loss/train': 0.8773794174194336} -09/20/2021 22:05:27 - INFO - __main__ - Step 35103: {'lr': 0.00019957666586887087, 'samples': 1123296, 'steps': 2193, 'loss/train': 0.6757262349128723} -09/20/2021 22:05:27 - INFO - __main__ - Step 35104: {'lr': 0.00019957666586887087, 'samples': 1123328, 'steps': 2193, 'loss/train': 0.695658802986145} -09/20/2021 22:05:28 - INFO - __main__ - Step 35105: {'lr': 0.00019957607933892082, 'samples': 1123360, 'steps': 2194, 'loss/train': 0.7064849734306335} -09/20/2021 22:05:29 - INFO - __main__ - Step 35106: {'lr': 0.00019957607933892082, 'samples': 1123392, 'steps': 2194, 'loss/train': 0.48337048292160034} -09/20/2021 22:05:30 - INFO - __main__ - Step 35107: {'lr': 0.00019957607933892082, 'samples': 1123424, 'steps': 2194, 'loss/train': 0.504524290561676} -09/20/2021 22:05:30 - INFO - __main__ - Step 35108: {'lr': 0.00019957607933892082, 'samples': 1123456, 'steps': 2194, 'loss/train': 0.627244770526886} -09/20/2021 22:05:31 - INFO - __main__ - Step 35109: {'lr': 0.00019957607933892082, 'samples': 1123488, 'steps': 2194, 'loss/train': 0.6043880581855774} -09/20/2021 22:05:32 - INFO - __main__ - Step 35110: {'lr': 0.00019957607933892082, 'samples': 1123520, 'steps': 2194, 'loss/train': 0.6799054741859436} -09/20/2021 22:05:33 - INFO - __main__ - Step 35111: {'lr': 0.00019957607933892082, 'samples': 1123552, 'steps': 2194, 'loss/train': 1.602579951286316} -09/20/2021 22:05:33 - INFO - __main__ - Step 35112: {'lr': 0.00019957607933892082, 'samples': 1123584, 'steps': 2194, 'loss/train': 2.528127908706665} -09/20/2021 22:05:34 - INFO - __main__ - Step 35113: {'lr': 0.00019957607933892082, 'samples': 1123616, 'steps': 2194, 'loss/train': 1.7602311372756958} -09/20/2021 22:05:35 - INFO - __main__ - Step 35114: {'lr': 0.00019957607933892082, 'samples': 1123648, 'steps': 2194, 'loss/train': 2.280766010284424} -09/20/2021 22:05:36 - INFO - __main__ - Step 35115: {'lr': 0.00019957607933892082, 'samples': 1123680, 'steps': 2194, 'loss/train': 2.851393938064575} -09/20/2021 22:05:36 - INFO - __main__ - Step 35116: {'lr': 0.00019957607933892082, 'samples': 1123712, 'steps': 2194, 'loss/train': 1.5713070631027222} -09/20/2021 22:05:37 - INFO - __main__ - Step 35117: {'lr': 0.00019957607933892082, 'samples': 1123744, 'steps': 2194, 'loss/train': 0.6072992086410522} -09/20/2021 22:05:38 - INFO - __main__ - Step 35118: {'lr': 0.00019957607933892082, 'samples': 1123776, 'steps': 2194, 'loss/train': 2.0989465713500977} -09/20/2021 22:05:39 - INFO - __main__ - Step 35119: {'lr': 0.00019957607933892082, 'samples': 1123808, 'steps': 2194, 'loss/train': 2.3318734169006348} -09/20/2021 22:05:39 - INFO - __main__ - Step 35120: {'lr': 0.00019957607933892082, 'samples': 1123840, 'steps': 2194, 'loss/train': 2.2180490493774414} -09/20/2021 22:05:40 - INFO - __main__ - Step 35121: {'lr': 0.00019957549240379608, 'samples': 1123872, 'steps': 2195, 'loss/train': 1.9711977243423462} -09/20/2021 22:05:41 - INFO - __main__ - Step 35122: {'lr': 0.00019957549240379608, 'samples': 1123904, 'steps': 2195, 'loss/train': 2.0739099979400635} -09/20/2021 22:05:42 - INFO - __main__ - Step 35123: {'lr': 0.00019957549240379608, 'samples': 1123936, 'steps': 2195, 'loss/train': 3.366126775741577} -09/20/2021 22:05:43 - INFO - __main__ - Step 35124: {'lr': 0.00019957549240379608, 'samples': 1123968, 'steps': 2195, 'loss/train': 1.5213321447372437} -09/20/2021 22:05:43 - INFO - __main__ - Step 35125: {'lr': 0.00019957549240379608, 'samples': 1124000, 'steps': 2195, 'loss/train': 3.051467180252075} -09/20/2021 22:05:44 - INFO - __main__ - Step 35126: {'lr': 0.00019957549240379608, 'samples': 1124032, 'steps': 2195, 'loss/train': 2.4147064685821533} -09/20/2021 22:05:45 - INFO - __main__ - Step 35127: {'lr': 0.00019957549240379608, 'samples': 1124064, 'steps': 2195, 'loss/train': 2.5811963081359863} -09/20/2021 22:05:46 - INFO - __main__ - Step 35128: {'lr': 0.00019957549240379608, 'samples': 1124096, 'steps': 2195, 'loss/train': 2.308448076248169} -09/20/2021 22:05:46 - INFO - __main__ - Step 35129: {'lr': 0.00019957549240379608, 'samples': 1124128, 'steps': 2195, 'loss/train': 1.3000582456588745} -09/20/2021 22:05:47 - INFO - __main__ - Step 35130: {'lr': 0.00019957549240379608, 'samples': 1124160, 'steps': 2195, 'loss/train': 2.7103116512298584} -09/20/2021 22:05:48 - INFO - __main__ - Step 35131: {'lr': 0.00019957549240379608, 'samples': 1124192, 'steps': 2195, 'loss/train': 2.8133389949798584} -09/20/2021 22:05:49 - INFO - __main__ - Step 35132: {'lr': 0.00019957549240379608, 'samples': 1124224, 'steps': 2195, 'loss/train': 1.831621766090393} -09/20/2021 22:05:49 - INFO - __main__ - Step 35133: {'lr': 0.00019957549240379608, 'samples': 1124256, 'steps': 2195, 'loss/train': 2.8254384994506836} -09/20/2021 22:05:50 - INFO - __main__ - Step 35134: {'lr': 0.00019957549240379608, 'samples': 1124288, 'steps': 2195, 'loss/train': 2.990764856338501} -09/20/2021 22:05:51 - INFO - __main__ - Step 35135: {'lr': 0.00019957549240379608, 'samples': 1124320, 'steps': 2195, 'loss/train': 2.2891666889190674} -09/20/2021 22:05:52 - INFO - __main__ - Step 35136: {'lr': 0.00019957549240379608, 'samples': 1124352, 'steps': 2195, 'loss/train': 2.153975009918213} -09/20/2021 22:05:53 - INFO - __main__ - Step 35137: {'lr': 0.00019957490506349905, 'samples': 1124384, 'steps': 2196, 'loss/train': 2.4851789474487305} -09/20/2021 22:05:54 - INFO - __main__ - Step 35138: {'lr': 0.00019957490506349905, 'samples': 1124416, 'steps': 2196, 'loss/train': 1.2983282804489136} -09/20/2021 22:05:54 - INFO - __main__ - Step 35139: {'lr': 0.00019957490506349905, 'samples': 1124448, 'steps': 2196, 'loss/train': 1.6646355390548706} -09/20/2021 22:05:55 - INFO - __main__ - Step 35140: {'lr': 0.00019957490506349905, 'samples': 1124480, 'steps': 2196, 'loss/train': 1.4015480279922485} -09/20/2021 22:05:56 - INFO - __main__ - Step 35141: {'lr': 0.00019957490506349905, 'samples': 1124512, 'steps': 2196, 'loss/train': 2.758582830429077} -09/20/2021 22:05:57 - INFO - __main__ - Step 35142: {'lr': 0.00019957490506349905, 'samples': 1124544, 'steps': 2196, 'loss/train': 1.0859986543655396} -09/20/2021 22:05:57 - INFO - __main__ - Step 35143: {'lr': 0.00019957490506349905, 'samples': 1124576, 'steps': 2196, 'loss/train': 3.054499864578247} -09/20/2021 22:05:58 - INFO - __main__ - Step 35144: {'lr': 0.00019957490506349905, 'samples': 1124608, 'steps': 2196, 'loss/train': 2.289301872253418} -09/20/2021 22:05:59 - INFO - __main__ - Step 35145: {'lr': 0.00019957490506349905, 'samples': 1124640, 'steps': 2196, 'loss/train': 3.303614616394043} -09/20/2021 22:06:00 - INFO - __main__ - Step 35146: {'lr': 0.00019957490506349905, 'samples': 1124672, 'steps': 2196, 'loss/train': 2.678769588470459} -09/20/2021 22:06:00 - INFO - __main__ - Step 35147: {'lr': 0.00019957490506349905, 'samples': 1124704, 'steps': 2196, 'loss/train': 2.5865397453308105} -09/20/2021 22:06:01 - INFO - __main__ - Step 35148: {'lr': 0.00019957490506349905, 'samples': 1124736, 'steps': 2196, 'loss/train': 2.4260404109954834} -09/20/2021 22:06:02 - INFO - __main__ - Step 35149: {'lr': 0.00019957490506349905, 'samples': 1124768, 'steps': 2196, 'loss/train': 1.7656465768814087} -09/20/2021 22:06:03 - INFO - __main__ - Step 35150: {'lr': 0.00019957490506349905, 'samples': 1124800, 'steps': 2196, 'loss/train': 2.4802308082580566} -09/20/2021 22:06:03 - INFO - __main__ - Step 35151: {'lr': 0.00019957490506349905, 'samples': 1124832, 'steps': 2196, 'loss/train': 1.6844007968902588} -09/20/2021 22:06:04 - INFO - __main__ - Step 35152: {'lr': 0.00019957490506349905, 'samples': 1124864, 'steps': 2196, 'loss/train': 1.987675666809082} -09/20/2021 22:06:05 - INFO - __main__ - Step 35153: {'lr': 0.00019957431731803214, 'samples': 1124896, 'steps': 2197, 'loss/train': 2.1455395221710205} -09/20/2021 22:06:06 - INFO - __main__ - Step 35154: {'lr': 0.00019957431731803214, 'samples': 1124928, 'steps': 2197, 'loss/train': 2.225051164627075} -09/20/2021 22:06:07 - INFO - __main__ - Step 35155: {'lr': 0.00019957431731803214, 'samples': 1124960, 'steps': 2197, 'loss/train': 2.2553467750549316} -09/20/2021 22:06:07 - INFO - __main__ - Step 35156: {'lr': 0.00019957431731803214, 'samples': 1124992, 'steps': 2197, 'loss/train': 1.913399338722229} -09/20/2021 22:06:08 - INFO - __main__ - Step 35157: {'lr': 0.00019957431731803214, 'samples': 1125024, 'steps': 2197, 'loss/train': 1.7784757614135742} -09/20/2021 22:06:09 - INFO - __main__ - Step 35158: {'lr': 0.00019957431731803214, 'samples': 1125056, 'steps': 2197, 'loss/train': 2.493717670440674} -09/20/2021 22:06:10 - INFO - __main__ - Step 35159: {'lr': 0.00019957431731803214, 'samples': 1125088, 'steps': 2197, 'loss/train': 2.0020461082458496} -09/20/2021 22:06:10 - INFO - __main__ - Step 35160: {'lr': 0.00019957431731803214, 'samples': 1125120, 'steps': 2197, 'loss/train': 2.6122519969940186} -09/20/2021 22:06:11 - INFO - __main__ - Step 35161: {'lr': 0.00019957431731803214, 'samples': 1125152, 'steps': 2197, 'loss/train': 1.8333836793899536} -09/20/2021 22:06:12 - INFO - __main__ - Step 35162: {'lr': 0.00019957431731803214, 'samples': 1125184, 'steps': 2197, 'loss/train': 2.2277939319610596} -09/20/2021 22:06:13 - INFO - __main__ - Step 35163: {'lr': 0.00019957431731803214, 'samples': 1125216, 'steps': 2197, 'loss/train': 1.9198209047317505} -09/20/2021 22:06:13 - INFO - __main__ - Step 35164: {'lr': 0.00019957431731803214, 'samples': 1125248, 'steps': 2197, 'loss/train': 2.2636609077453613} -09/20/2021 22:06:14 - INFO - __main__ - Step 35165: {'lr': 0.00019957431731803214, 'samples': 1125280, 'steps': 2197, 'loss/train': 1.9032034873962402} -09/20/2021 22:06:15 - INFO - __main__ - Step 35166: {'lr': 0.00019957431731803214, 'samples': 1125312, 'steps': 2197, 'loss/train': 2.1328389644622803} -09/20/2021 22:06:16 - INFO - __main__ - Step 35167: {'lr': 0.00019957431731803214, 'samples': 1125344, 'steps': 2197, 'loss/train': 1.4587204456329346} -09/20/2021 22:06:17 - INFO - __main__ - Step 35168: {'lr': 0.00019957431731803214, 'samples': 1125376, 'steps': 2197, 'loss/train': 1.64397394657135} -09/20/2021 22:06:18 - INFO - __main__ - Step 35169: {'lr': 0.0001995737291673977, 'samples': 1125408, 'steps': 2198, 'loss/train': 2.025688409805298} -09/20/2021 22:06:19 - INFO - __main__ - Step 35170: {'lr': 0.0001995737291673977, 'samples': 1125440, 'steps': 2198, 'loss/train': 2.1841018199920654} -09/20/2021 22:06:19 - INFO - __main__ - Step 35171: {'lr': 0.0001995737291673977, 'samples': 1125472, 'steps': 2198, 'loss/train': 2.1806092262268066} -09/20/2021 22:06:20 - INFO - __main__ - Step 35172: {'lr': 0.0001995737291673977, 'samples': 1125504, 'steps': 2198, 'loss/train': 2.367356777191162} -09/20/2021 22:06:21 - INFO - __main__ - Step 35173: {'lr': 0.0001995737291673977, 'samples': 1125536, 'steps': 2198, 'loss/train': 1.7613641023635864} -09/20/2021 22:06:22 - INFO - __main__ - Step 35174: {'lr': 0.0001995737291673977, 'samples': 1125568, 'steps': 2198, 'loss/train': 1.4136812686920166} -09/20/2021 22:06:22 - INFO - __main__ - Step 35175: {'lr': 0.0001995737291673977, 'samples': 1125600, 'steps': 2198, 'loss/train': 2.837831974029541} -09/20/2021 22:06:23 - INFO - __main__ - Step 35176: {'lr': 0.0001995737291673977, 'samples': 1125632, 'steps': 2198, 'loss/train': 2.721849203109741} -09/20/2021 22:06:24 - INFO - __main__ - Step 35177: {'lr': 0.0001995737291673977, 'samples': 1125664, 'steps': 2198, 'loss/train': 3.2139506340026855} -09/20/2021 22:06:25 - INFO - __main__ - Step 35178: {'lr': 0.0001995737291673977, 'samples': 1125696, 'steps': 2198, 'loss/train': 2.391462564468384} -09/20/2021 22:06:25 - INFO - __main__ - Step 35179: {'lr': 0.0001995737291673977, 'samples': 1125728, 'steps': 2198, 'loss/train': 3.694723606109619} -09/20/2021 22:06:26 - INFO - __main__ - Step 35180: {'lr': 0.0001995737291673977, 'samples': 1125760, 'steps': 2198, 'loss/train': 2.762963056564331} -09/20/2021 22:06:27 - INFO - __main__ - Step 35181: {'lr': 0.0001995737291673977, 'samples': 1125792, 'steps': 2198, 'loss/train': 1.0175244808197021} -09/20/2021 22:06:28 - INFO - __main__ - Step 35182: {'lr': 0.0001995737291673977, 'samples': 1125824, 'steps': 2198, 'loss/train': 0.7420148849487305} -09/20/2021 22:06:28 - INFO - __main__ - Step 35183: {'lr': 0.0001995737291673977, 'samples': 1125856, 'steps': 2198, 'loss/train': 2.742802619934082} -09/20/2021 22:06:29 - INFO - __main__ - Step 35184: {'lr': 0.0001995737291673977, 'samples': 1125888, 'steps': 2198, 'loss/train': 2.3765547275543213} -09/20/2021 22:06:30 - INFO - __main__ - Step 35185: {'lr': 0.00019957314061159814, 'samples': 1125920, 'steps': 2199, 'loss/train': 1.8623470067977905} -09/20/2021 22:06:31 - INFO - __main__ - Step 35186: {'lr': 0.00019957314061159814, 'samples': 1125952, 'steps': 2199, 'loss/train': 3.02545428276062} -09/20/2021 22:06:31 - INFO - __main__ - Step 35187: {'lr': 0.00019957314061159814, 'samples': 1125984, 'steps': 2199, 'loss/train': 2.618884563446045} -09/20/2021 22:06:32 - INFO - __main__ - Step 35188: {'lr': 0.00019957314061159814, 'samples': 1126016, 'steps': 2199, 'loss/train': 2.57548189163208} -09/20/2021 22:06:33 - INFO - __main__ - Step 35189: {'lr': 0.00019957314061159814, 'samples': 1126048, 'steps': 2199, 'loss/train': 2.1296815872192383} -09/20/2021 22:06:34 - INFO - __main__ - Step 35190: {'lr': 0.00019957314061159814, 'samples': 1126080, 'steps': 2199, 'loss/train': 2.975797653198242} -09/20/2021 22:06:34 - INFO - __main__ - Step 35191: {'lr': 0.00019957314061159814, 'samples': 1126112, 'steps': 2199, 'loss/train': 2.050467014312744} -09/20/2021 22:06:35 - INFO - __main__ - Step 35192: {'lr': 0.00019957314061159814, 'samples': 1126144, 'steps': 2199, 'loss/train': 1.8213977813720703} -09/20/2021 22:06:36 - INFO - __main__ - Step 35193: {'lr': 0.00019957314061159814, 'samples': 1126176, 'steps': 2199, 'loss/train': 2.164088249206543} -09/20/2021 22:06:37 - INFO - __main__ - Step 35194: {'lr': 0.00019957314061159814, 'samples': 1126208, 'steps': 2199, 'loss/train': 1.8334839344024658} -09/20/2021 22:06:37 - INFO - __main__ - Step 35195: {'lr': 0.00019957314061159814, 'samples': 1126240, 'steps': 2199, 'loss/train': 3.2595608234405518} -09/20/2021 22:06:38 - INFO - __main__ - Step 35196: {'lr': 0.00019957314061159814, 'samples': 1126272, 'steps': 2199, 'loss/train': 2.985893726348877} -09/20/2021 22:06:39 - INFO - __main__ - Step 35197: {'lr': 0.00019957314061159814, 'samples': 1126304, 'steps': 2199, 'loss/train': 3.277674674987793} -09/20/2021 22:06:40 - INFO - __main__ - Step 35198: {'lr': 0.00019957314061159814, 'samples': 1126336, 'steps': 2199, 'loss/train': 2.1883299350738525} -09/20/2021 22:06:41 - INFO - __main__ - Step 35199: {'lr': 0.00019957314061159814, 'samples': 1126368, 'steps': 2199, 'loss/train': 0.6332858800888062} -09/20/2021 22:06:42 - INFO - __main__ - Step 35200: {'lr': 0.00019957314061159814, 'samples': 1126400, 'steps': 2199, 'loss/train': 2.0688347816467285} -09/20/2021 22:06:43 - INFO - __main__ - Step 35201: {'lr': 0.00019957255165063584, 'samples': 1126432, 'steps': 2200, 'loss/train': 1.6181319952011108} -09/20/2021 22:06:43 - INFO - __main__ - Step 35202: {'lr': 0.00019957255165063584, 'samples': 1126464, 'steps': 2200, 'loss/train': 2.8172450065612793} -09/20/2021 22:06:44 - INFO - __main__ - Step 35203: {'lr': 0.00019957255165063584, 'samples': 1126496, 'steps': 2200, 'loss/train': 2.288478136062622} -09/20/2021 22:06:45 - INFO - __main__ - Step 35204: {'lr': 0.00019957255165063584, 'samples': 1126528, 'steps': 2200, 'loss/train': 2.4889512062072754} -09/20/2021 22:06:46 - INFO - __main__ - Step 35205: {'lr': 0.00019957255165063584, 'samples': 1126560, 'steps': 2200, 'loss/train': 0.8890318870544434} -09/20/2021 22:06:46 - INFO - __main__ - Step 35206: {'lr': 0.00019957255165063584, 'samples': 1126592, 'steps': 2200, 'loss/train': 2.2794089317321777} -09/20/2021 22:06:47 - INFO - __main__ - Step 35207: {'lr': 0.00019957255165063584, 'samples': 1126624, 'steps': 2200, 'loss/train': 1.9132641553878784} -09/20/2021 22:06:48 - INFO - __main__ - Step 35208: {'lr': 0.00019957255165063584, 'samples': 1126656, 'steps': 2200, 'loss/train': 2.5647969245910645} -09/20/2021 22:06:49 - INFO - __main__ - Step 35209: {'lr': 0.00019957255165063584, 'samples': 1126688, 'steps': 2200, 'loss/train': 2.1517527103424072} -09/20/2021 22:06:49 - INFO - __main__ - Step 35210: {'lr': 0.00019957255165063584, 'samples': 1126720, 'steps': 2200, 'loss/train': 1.7988905906677246} -09/20/2021 22:06:50 - INFO - __main__ - Step 35211: {'lr': 0.00019957255165063584, 'samples': 1126752, 'steps': 2200, 'loss/train': 1.1622694730758667} -09/20/2021 22:06:51 - INFO - __main__ - Step 35212: {'lr': 0.00019957255165063584, 'samples': 1126784, 'steps': 2200, 'loss/train': 1.9395278692245483} -09/20/2021 22:06:52 - INFO - __main__ - Step 35213: {'lr': 0.00019957255165063584, 'samples': 1126816, 'steps': 2200, 'loss/train': 2.1831252574920654} -09/20/2021 22:06:52 - INFO - __main__ - Step 35214: {'lr': 0.00019957255165063584, 'samples': 1126848, 'steps': 2200, 'loss/train': 2.32391357421875} -09/20/2021 22:06:53 - INFO - __main__ - Step 35215: {'lr': 0.00019957255165063584, 'samples': 1126880, 'steps': 2200, 'loss/train': 2.0326249599456787} -09/20/2021 22:06:54 - INFO - __main__ - Step 35216: {'lr': 0.00019957255165063584, 'samples': 1126912, 'steps': 2200, 'loss/train': 2.343716859817505} -09/20/2021 22:06:55 - INFO - __main__ - Step 35217: {'lr': 0.00019957196228451325, 'samples': 1126944, 'steps': 2201, 'loss/train': 1.5802243947982788} -09/20/2021 22:06:55 - INFO - __main__ - Step 35218: {'lr': 0.00019957196228451325, 'samples': 1126976, 'steps': 2201, 'loss/train': 2.5521016120910645} -09/20/2021 22:06:56 - INFO - __main__ - Step 35219: {'lr': 0.00019957196228451325, 'samples': 1127008, 'steps': 2201, 'loss/train': 1.6627534627914429} -09/20/2021 22:06:57 - INFO - __main__ - Step 35220: {'lr': 0.00019957196228451325, 'samples': 1127040, 'steps': 2201, 'loss/train': 0.4484502077102661} -09/20/2021 22:06:58 - INFO - __main__ - Step 35221: {'lr': 0.00019957196228451325, 'samples': 1127072, 'steps': 2201, 'loss/train': 2.892374277114868} -09/20/2021 22:06:58 - INFO - __main__ - Step 35222: {'lr': 0.00019957196228451325, 'samples': 1127104, 'steps': 2201, 'loss/train': 2.2460110187530518} -09/20/2021 22:06:59 - INFO - __main__ - Step 35223: {'lr': 0.00019957196228451325, 'samples': 1127136, 'steps': 2201, 'loss/train': 2.1874823570251465} -09/20/2021 22:07:00 - INFO - __main__ - Step 35224: {'lr': 0.00019957196228451325, 'samples': 1127168, 'steps': 2201, 'loss/train': 2.367382049560547} -09/20/2021 22:07:01 - INFO - __main__ - Step 35225: {'lr': 0.00019957196228451325, 'samples': 1127200, 'steps': 2201, 'loss/train': 2.077867031097412} -09/20/2021 22:07:01 - INFO - __main__ - Step 35226: {'lr': 0.00019957196228451325, 'samples': 1127232, 'steps': 2201, 'loss/train': 2.444183588027954} -09/20/2021 22:07:02 - INFO - __main__ - Step 35227: {'lr': 0.00019957196228451325, 'samples': 1127264, 'steps': 2201, 'loss/train': 1.6089116334915161} -09/20/2021 22:07:03 - INFO - __main__ - Step 35228: {'lr': 0.00019957196228451325, 'samples': 1127296, 'steps': 2201, 'loss/train': 2.7361505031585693} -09/20/2021 22:07:05 - INFO - __main__ - Step 35229: {'lr': 0.00019957196228451325, 'samples': 1127328, 'steps': 2201, 'loss/train': 2.306537628173828} -09/20/2021 22:07:06 - INFO - __main__ - Step 35230: {'lr': 0.00019957196228451325, 'samples': 1127360, 'steps': 2201, 'loss/train': 2.6934733390808105} -09/20/2021 22:07:06 - INFO - __main__ - Step 35231: {'lr': 0.00019957196228451325, 'samples': 1127392, 'steps': 2201, 'loss/train': 2.9513866901397705} -09/20/2021 22:07:07 - INFO - __main__ - Step 35232: {'lr': 0.00019957196228451325, 'samples': 1127424, 'steps': 2201, 'loss/train': 2.1531870365142822} -09/20/2021 22:07:08 - INFO - __main__ - Step 35233: {'lr': 0.0001995713725132327, 'samples': 1127456, 'steps': 2202, 'loss/train': 0.8010947704315186} -09/20/2021 22:07:09 - INFO - __main__ - Step 35234: {'lr': 0.0001995713725132327, 'samples': 1127488, 'steps': 2202, 'loss/train': 1.240971565246582} -09/20/2021 22:07:09 - INFO - __main__ - Step 35235: {'lr': 0.0001995713725132327, 'samples': 1127520, 'steps': 2202, 'loss/train': 1.3694218397140503} -09/20/2021 22:07:10 - INFO - __main__ - Step 35236: {'lr': 0.0001995713725132327, 'samples': 1127552, 'steps': 2202, 'loss/train': 1.2298576831817627} -09/20/2021 22:07:11 - INFO - __main__ - Step 35237: {'lr': 0.0001995713725132327, 'samples': 1127584, 'steps': 2202, 'loss/train': 2.339902639389038} -09/20/2021 22:07:12 - INFO - __main__ - Step 35238: {'lr': 0.0001995713725132327, 'samples': 1127616, 'steps': 2202, 'loss/train': 1.9398579597473145} -09/20/2021 22:07:12 - INFO - __main__ - Step 35239: {'lr': 0.0001995713725132327, 'samples': 1127648, 'steps': 2202, 'loss/train': 0.5734779834747314} -09/20/2021 22:07:13 - INFO - __main__ - Step 35240: {'lr': 0.0001995713725132327, 'samples': 1127680, 'steps': 2202, 'loss/train': 2.205404043197632} -09/20/2021 22:07:14 - INFO - __main__ - Step 35241: {'lr': 0.0001995713725132327, 'samples': 1127712, 'steps': 2202, 'loss/train': 2.310875177383423} -09/20/2021 22:07:15 - INFO - __main__ - Step 35242: {'lr': 0.0001995713725132327, 'samples': 1127744, 'steps': 2202, 'loss/train': 2.2728114128112793} -09/20/2021 22:07:15 - INFO - __main__ - Step 35243: {'lr': 0.0001995713725132327, 'samples': 1127776, 'steps': 2202, 'loss/train': 1.9934780597686768} -09/20/2021 22:07:16 - INFO - __main__ - Step 35244: {'lr': 0.0001995713725132327, 'samples': 1127808, 'steps': 2202, 'loss/train': 1.728306770324707} -09/20/2021 22:07:17 - INFO - __main__ - Step 35245: {'lr': 0.0001995713725132327, 'samples': 1127840, 'steps': 2202, 'loss/train': 2.6499552726745605} -09/20/2021 22:07:18 - INFO - __main__ - Step 35246: {'lr': 0.0001995713725132327, 'samples': 1127872, 'steps': 2202, 'loss/train': 1.1229705810546875} -09/20/2021 22:07:18 - INFO - __main__ - Step 35247: {'lr': 0.0001995713725132327, 'samples': 1127904, 'steps': 2202, 'loss/train': 2.6732068061828613} -09/20/2021 22:07:19 - INFO - __main__ - Step 35248: {'lr': 0.0001995713725132327, 'samples': 1127936, 'steps': 2202, 'loss/train': 0.563072919845581} -09/20/2021 22:07:20 - INFO - __main__ - Step 35249: {'lr': 0.00019957078233679668, 'samples': 1127968, 'steps': 2203, 'loss/train': 1.7946058511734009} -09/20/2021 22:07:21 - INFO - __main__ - Step 35250: {'lr': 0.00019957078233679668, 'samples': 1128000, 'steps': 2203, 'loss/train': 1.7005348205566406} -09/20/2021 22:07:22 - INFO - __main__ - Step 35251: {'lr': 0.00019957078233679668, 'samples': 1128032, 'steps': 2203, 'loss/train': 2.2761545181274414} -09/20/2021 22:07:22 - INFO - __main__ - Step 35252: {'lr': 0.00019957078233679668, 'samples': 1128064, 'steps': 2203, 'loss/train': 2.39044451713562} -09/20/2021 22:07:23 - INFO - __main__ - Step 35253: {'lr': 0.00019957078233679668, 'samples': 1128096, 'steps': 2203, 'loss/train': 2.5180037021636963} -09/20/2021 22:07:24 - INFO - __main__ - Step 35254: {'lr': 0.00019957078233679668, 'samples': 1128128, 'steps': 2203, 'loss/train': 1.6003307104110718} -09/20/2021 22:07:25 - INFO - __main__ - Step 35255: {'lr': 0.00019957078233679668, 'samples': 1128160, 'steps': 2203, 'loss/train': 2.709178924560547} -09/20/2021 22:07:25 - INFO - __main__ - Step 35256: {'lr': 0.00019957078233679668, 'samples': 1128192, 'steps': 2203, 'loss/train': 0.574688196182251} -09/20/2021 22:07:26 - INFO - __main__ - Step 35257: {'lr': 0.00019957078233679668, 'samples': 1128224, 'steps': 2203, 'loss/train': 0.27494704723358154} -09/20/2021 22:07:27 - INFO - __main__ - Step 35258: {'lr': 0.00019957078233679668, 'samples': 1128256, 'steps': 2203, 'loss/train': 0.2696601152420044} -09/20/2021 22:07:28 - INFO - __main__ - Step 35259: {'lr': 0.00019957078233679668, 'samples': 1128288, 'steps': 2203, 'loss/train': 2.789696455001831} -09/20/2021 22:07:28 - INFO - __main__ - Step 35260: {'lr': 0.00019957078233679668, 'samples': 1128320, 'steps': 2203, 'loss/train': 2.5083789825439453} -09/20/2021 22:07:30 - INFO - __main__ - Step 35261: {'lr': 0.00019957078233679668, 'samples': 1128352, 'steps': 2203, 'loss/train': 0.6311272382736206} -09/20/2021 22:07:30 - INFO - __main__ - Step 35262: {'lr': 0.00019957078233679668, 'samples': 1128384, 'steps': 2203, 'loss/train': 2.0578277111053467} -09/20/2021 22:07:31 - INFO - __main__ - Step 35263: {'lr': 0.00019957078233679668, 'samples': 1128416, 'steps': 2203, 'loss/train': 3.155750274658203} -09/20/2021 22:07:32 - INFO - __main__ - Step 35264: {'lr': 0.00019957078233679668, 'samples': 1128448, 'steps': 2203, 'loss/train': 2.7959370613098145} -09/20/2021 22:07:33 - INFO - __main__ - Step 35265: {'lr': 0.00019957019175520749, 'samples': 1128480, 'steps': 2204, 'loss/train': 2.4346930980682373} -09/20/2021 22:07:34 - INFO - __main__ - Step 35266: {'lr': 0.00019957019175520749, 'samples': 1128512, 'steps': 2204, 'loss/train': 2.8421201705932617} -09/20/2021 22:07:34 - INFO - __main__ - Step 35267: {'lr': 0.00019957019175520749, 'samples': 1128544, 'steps': 2204, 'loss/train': 2.1080265045166016} -09/20/2021 22:07:35 - INFO - __main__ - Step 35268: {'lr': 0.00019957019175520749, 'samples': 1128576, 'steps': 2204, 'loss/train': 1.617448329925537} -09/20/2021 22:07:36 - INFO - __main__ - Step 35269: {'lr': 0.00019957019175520749, 'samples': 1128608, 'steps': 2204, 'loss/train': 2.0524466037750244} -09/20/2021 22:07:37 - INFO - __main__ - Step 35270: {'lr': 0.00019957019175520749, 'samples': 1128640, 'steps': 2204, 'loss/train': 2.1358273029327393} -09/20/2021 22:07:37 - INFO - __main__ - Step 35271: {'lr': 0.00019957019175520749, 'samples': 1128672, 'steps': 2204, 'loss/train': 2.194357395172119} -09/20/2021 22:07:38 - INFO - __main__ - Step 35272: {'lr': 0.00019957019175520749, 'samples': 1128704, 'steps': 2204, 'loss/train': 1.6915171146392822} -09/20/2021 22:07:39 - INFO - __main__ - Step 35273: {'lr': 0.00019957019175520749, 'samples': 1128736, 'steps': 2204, 'loss/train': 2.8064401149749756} -09/20/2021 22:07:40 - INFO - __main__ - Step 35274: {'lr': 0.00019957019175520749, 'samples': 1128768, 'steps': 2204, 'loss/train': 2.373079299926758} -09/20/2021 22:07:40 - INFO - __main__ - Step 35275: {'lr': 0.00019957019175520749, 'samples': 1128800, 'steps': 2204, 'loss/train': 2.8709652423858643} -09/20/2021 22:07:41 - INFO - __main__ - Step 35276: {'lr': 0.00019957019175520749, 'samples': 1128832, 'steps': 2204, 'loss/train': 2.0062451362609863} -09/20/2021 22:07:42 - INFO - __main__ - Step 35277: {'lr': 0.00019957019175520749, 'samples': 1128864, 'steps': 2204, 'loss/train': 2.6422107219696045} -09/20/2021 22:07:43 - INFO - __main__ - Step 35278: {'lr': 0.00019957019175520749, 'samples': 1128896, 'steps': 2204, 'loss/train': 2.529876947402954} -09/20/2021 22:07:43 - INFO - __main__ - Step 35279: {'lr': 0.00019957019175520749, 'samples': 1128928, 'steps': 2204, 'loss/train': 2.296520948410034} -09/20/2021 22:07:44 - INFO - __main__ - Step 35280: {'lr': 0.00019957019175520749, 'samples': 1128960, 'steps': 2204, 'loss/train': 2.0977938175201416} -09/20/2021 22:07:45 - INFO - __main__ - Step 35281: {'lr': 0.00019956960076846755, 'samples': 1128992, 'steps': 2205, 'loss/train': 2.580592155456543} -09/20/2021 22:07:46 - INFO - __main__ - Step 35282: {'lr': 0.00019956960076846755, 'samples': 1129024, 'steps': 2205, 'loss/train': 2.113576650619507} -09/20/2021 22:07:46 - INFO - __main__ - Step 35283: {'lr': 0.00019956960076846755, 'samples': 1129056, 'steps': 2205, 'loss/train': 1.5838539600372314} -09/20/2021 22:07:47 - INFO - __main__ - Step 35284: {'lr': 0.00019956960076846755, 'samples': 1129088, 'steps': 2205, 'loss/train': 2.423741102218628} -09/20/2021 22:07:48 - INFO - __main__ - Step 35285: {'lr': 0.00019956960076846755, 'samples': 1129120, 'steps': 2205, 'loss/train': 1.568947434425354} -09/20/2021 22:07:49 - INFO - __main__ - Step 35286: {'lr': 0.00019956960076846755, 'samples': 1129152, 'steps': 2205, 'loss/train': 2.964407205581665} -09/20/2021 22:07:49 - INFO - __main__ - Step 35287: {'lr': 0.00019956960076846755, 'samples': 1129184, 'steps': 2205, 'loss/train': 2.242239236831665} -09/20/2021 22:07:50 - INFO - __main__ - Step 35288: {'lr': 0.00019956960076846755, 'samples': 1129216, 'steps': 2205, 'loss/train': 2.6577539443969727} -09/20/2021 22:07:51 - INFO - __main__ - Step 35289: {'lr': 0.00019956960076846755, 'samples': 1129248, 'steps': 2205, 'loss/train': 2.5840039253234863} -09/20/2021 22:07:52 - INFO - __main__ - Step 35290: {'lr': 0.00019956960076846755, 'samples': 1129280, 'steps': 2205, 'loss/train': 1.8961589336395264} -09/20/2021 22:07:52 - INFO - __main__ - Step 35291: {'lr': 0.00019956960076846755, 'samples': 1129312, 'steps': 2205, 'loss/train': 2.3979079723358154} -09/20/2021 22:07:53 - INFO - __main__ - Step 35292: {'lr': 0.00019956960076846755, 'samples': 1129344, 'steps': 2205, 'loss/train': 2.309629440307617} -09/20/2021 22:07:55 - INFO - __main__ - Step 35293: {'lr': 0.00019956960076846755, 'samples': 1129376, 'steps': 2205, 'loss/train': 2.2669618129730225} -09/20/2021 22:07:55 - INFO - __main__ - Step 35294: {'lr': 0.00019956960076846755, 'samples': 1129408, 'steps': 2205, 'loss/train': 1.9962029457092285} -09/20/2021 22:07:56 - INFO - __main__ - Step 35295: {'lr': 0.00019956960076846755, 'samples': 1129440, 'steps': 2205, 'loss/train': 2.065401077270508} -09/20/2021 22:07:57 - INFO - __main__ - Step 35296: {'lr': 0.00019956960076846755, 'samples': 1129472, 'steps': 2205, 'loss/train': 2.3164899349212646} -09/20/2021 22:07:58 - INFO - __main__ - Step 35297: {'lr': 0.00019956900937657932, 'samples': 1129504, 'steps': 2206, 'loss/train': 2.738537073135376} -09/20/2021 22:07:58 - INFO - __main__ - Step 35298: {'lr': 0.00019956900937657932, 'samples': 1129536, 'steps': 2206, 'loss/train': 2.2351624965667725} -09/20/2021 22:07:59 - INFO - __main__ - Step 35299: {'lr': 0.00019956900937657932, 'samples': 1129568, 'steps': 2206, 'loss/train': 2.422780990600586} -09/20/2021 22:08:00 - INFO - __main__ - Step 35300: {'lr': 0.00019956900937657932, 'samples': 1129600, 'steps': 2206, 'loss/train': 2.43611216545105} -09/20/2021 22:08:01 - INFO - __main__ - Step 35301: {'lr': 0.00019956900937657932, 'samples': 1129632, 'steps': 2206, 'loss/train': 2.1482620239257812} -09/20/2021 22:08:01 - INFO - __main__ - Step 35302: {'lr': 0.00019956900937657932, 'samples': 1129664, 'steps': 2206, 'loss/train': 3.4551918506622314} -09/20/2021 22:08:02 - INFO - __main__ - Step 35303: {'lr': 0.00019956900937657932, 'samples': 1129696, 'steps': 2206, 'loss/train': 0.9505547881126404} -09/20/2021 22:08:03 - INFO - __main__ - Step 35304: {'lr': 0.00019956900937657932, 'samples': 1129728, 'steps': 2206, 'loss/train': 2.39849591255188} -09/20/2021 22:08:04 - INFO - __main__ - Step 35305: {'lr': 0.00019956900937657932, 'samples': 1129760, 'steps': 2206, 'loss/train': 1.4791098833084106} -09/20/2021 22:08:04 - INFO - __main__ - Step 35306: {'lr': 0.00019956900937657932, 'samples': 1129792, 'steps': 2206, 'loss/train': 1.9580943584442139} -09/20/2021 22:08:05 - INFO - __main__ - Step 35307: {'lr': 0.00019956900937657932, 'samples': 1129824, 'steps': 2206, 'loss/train': 2.4016571044921875} -09/20/2021 22:08:06 - INFO - __main__ - Step 35308: {'lr': 0.00019956900937657932, 'samples': 1129856, 'steps': 2206, 'loss/train': 1.3283028602600098} -09/20/2021 22:08:07 - INFO - __main__ - Step 35309: {'lr': 0.00019956900937657932, 'samples': 1129888, 'steps': 2206, 'loss/train': 2.828629493713379} -09/20/2021 22:08:07 - INFO - __main__ - Step 35310: {'lr': 0.00019956900937657932, 'samples': 1129920, 'steps': 2206, 'loss/train': 2.2918214797973633} -09/20/2021 22:08:08 - INFO - __main__ - Step 35311: {'lr': 0.00019956900937657932, 'samples': 1129952, 'steps': 2206, 'loss/train': 2.2581000328063965} -09/20/2021 22:08:09 - INFO - __main__ - Step 35312: {'lr': 0.00019956900937657932, 'samples': 1129984, 'steps': 2206, 'loss/train': 1.67086923122406} -09/20/2021 22:08:10 - INFO - __main__ - Step 35313: {'lr': 0.0001995684175795452, 'samples': 1130016, 'steps': 2207, 'loss/train': 2.2105941772460938} -09/20/2021 22:08:11 - INFO - __main__ - Step 35314: {'lr': 0.0001995684175795452, 'samples': 1130048, 'steps': 2207, 'loss/train': 4.788902282714844} -09/20/2021 22:08:11 - INFO - __main__ - Step 35315: {'lr': 0.0001995684175795452, 'samples': 1130080, 'steps': 2207, 'loss/train': 2.385730028152466} -09/20/2021 22:08:12 - INFO - __main__ - Step 35316: {'lr': 0.0001995684175795452, 'samples': 1130112, 'steps': 2207, 'loss/train': 2.6281955242156982} -09/20/2021 22:08:13 - INFO - __main__ - Step 35317: {'lr': 0.0001995684175795452, 'samples': 1130144, 'steps': 2207, 'loss/train': 0.18555693328380585} -09/20/2021 22:08:14 - INFO - __main__ - Step 35318: {'lr': 0.0001995684175795452, 'samples': 1130176, 'steps': 2207, 'loss/train': 0.15576358139514923} -09/20/2021 22:08:14 - INFO - __main__ - Step 35319: {'lr': 0.0001995684175795452, 'samples': 1130208, 'steps': 2207, 'loss/train': 0.21412226557731628} -09/20/2021 22:08:15 - INFO - __main__ - Step 35320: {'lr': 0.0001995684175795452, 'samples': 1130240, 'steps': 2207, 'loss/train': 1.958607792854309} -09/20/2021 22:08:16 - INFO - __main__ - Step 35321: {'lr': 0.0001995684175795452, 'samples': 1130272, 'steps': 2207, 'loss/train': 2.4765307903289795} -09/20/2021 22:08:17 - INFO - __main__ - Step 35322: {'lr': 0.0001995684175795452, 'samples': 1130304, 'steps': 2207, 'loss/train': 2.6890454292297363} -09/20/2021 22:08:18 - INFO - __main__ - Step 35323: {'lr': 0.0001995684175795452, 'samples': 1130336, 'steps': 2207, 'loss/train': 1.4680168628692627} -09/20/2021 22:08:19 - INFO - __main__ - Step 35324: {'lr': 0.0001995684175795452, 'samples': 1130368, 'steps': 2207, 'loss/train': 1.6307021379470825} -09/20/2021 22:08:19 - INFO - __main__ - Step 35325: {'lr': 0.0001995684175795452, 'samples': 1130400, 'steps': 2207, 'loss/train': 2.2571728229522705} -09/20/2021 22:08:20 - INFO - __main__ - Step 35326: {'lr': 0.0001995684175795452, 'samples': 1130432, 'steps': 2207, 'loss/train': 3.1768980026245117} -09/20/2021 22:08:21 - INFO - __main__ - Step 35327: {'lr': 0.0001995684175795452, 'samples': 1130464, 'steps': 2207, 'loss/train': 1.947058081626892} -09/20/2021 22:08:22 - INFO - __main__ - Step 35328: {'lr': 0.0001995684175795452, 'samples': 1130496, 'steps': 2207, 'loss/train': 2.285547971725464} -09/20/2021 22:08:23 - INFO - __main__ - Step 35329: {'lr': 0.00019956782537736752, 'samples': 1130528, 'steps': 2208, 'loss/train': 3.1324996948242188} -09/20/2021 22:08:23 - INFO - __main__ - Step 35330: {'lr': 0.00019956782537736752, 'samples': 1130560, 'steps': 2208, 'loss/train': 2.131359577178955} -09/20/2021 22:08:24 - INFO - __main__ - Step 35331: {'lr': 0.00019956782537736752, 'samples': 1130592, 'steps': 2208, 'loss/train': 1.8534069061279297} -09/20/2021 22:08:25 - INFO - __main__ - Step 35332: {'lr': 0.00019956782537736752, 'samples': 1130624, 'steps': 2208, 'loss/train': 1.6710975170135498} -09/20/2021 22:08:26 - INFO - __main__ - Step 35333: {'lr': 0.00019956782537736752, 'samples': 1130656, 'steps': 2208, 'loss/train': 3.2784955501556396} -09/20/2021 22:08:26 - INFO - __main__ - Step 35334: {'lr': 0.00019956782537736752, 'samples': 1130688, 'steps': 2208, 'loss/train': 2.3132193088531494} -09/20/2021 22:08:27 - INFO - __main__ - Step 35335: {'lr': 0.00019956782537736752, 'samples': 1130720, 'steps': 2208, 'loss/train': 3.102739095687866} -09/20/2021 22:08:28 - INFO - __main__ - Step 35336: {'lr': 0.00019956782537736752, 'samples': 1130752, 'steps': 2208, 'loss/train': 3.0970041751861572} -09/20/2021 22:08:29 - INFO - __main__ - Step 35337: {'lr': 0.00019956782537736752, 'samples': 1130784, 'steps': 2208, 'loss/train': 2.051417589187622} -09/20/2021 22:08:29 - INFO - __main__ - Step 35338: {'lr': 0.00019956782537736752, 'samples': 1130816, 'steps': 2208, 'loss/train': 1.374292254447937} -09/20/2021 22:08:30 - INFO - __main__ - Step 35339: {'lr': 0.00019956782537736752, 'samples': 1130848, 'steps': 2208, 'loss/train': 1.8000402450561523} -09/20/2021 22:08:31 - INFO - __main__ - Step 35340: {'lr': 0.00019956782537736752, 'samples': 1130880, 'steps': 2208, 'loss/train': 2.453496217727661} -09/20/2021 22:08:32 - INFO - __main__ - Step 35341: {'lr': 0.00019956782537736752, 'samples': 1130912, 'steps': 2208, 'loss/train': 1.453857660293579} -09/20/2021 22:08:32 - INFO - __main__ - Step 35342: {'lr': 0.00019956782537736752, 'samples': 1130944, 'steps': 2208, 'loss/train': 1.9345394372940063} -09/20/2021 22:08:33 - INFO - __main__ - Step 35343: {'lr': 0.00019956782537736752, 'samples': 1130976, 'steps': 2208, 'loss/train': 2.440842628479004} -09/20/2021 22:08:34 - INFO - __main__ - Step 35344: {'lr': 0.00019956782537736752, 'samples': 1131008, 'steps': 2208, 'loss/train': 2.6495511531829834} -09/20/2021 22:08:35 - INFO - __main__ - Step 35345: {'lr': 0.00019956723277004878, 'samples': 1131040, 'steps': 2209, 'loss/train': 0.7680556178092957} -09/20/2021 22:08:35 - INFO - __main__ - Step 35346: {'lr': 0.00019956723277004878, 'samples': 1131072, 'steps': 2209, 'loss/train': 2.3059144020080566} -09/20/2021 22:08:36 - INFO - __main__ - Step 35347: {'lr': 0.00019956723277004878, 'samples': 1131104, 'steps': 2209, 'loss/train': 2.739076852798462} -09/20/2021 22:08:37 - INFO - __main__ - Step 35348: {'lr': 0.00019956723277004878, 'samples': 1131136, 'steps': 2209, 'loss/train': 2.1865758895874023} -09/20/2021 22:08:38 - INFO - __main__ - Step 35349: {'lr': 0.00019956723277004878, 'samples': 1131168, 'steps': 2209, 'loss/train': 2.390861988067627} -09/20/2021 22:08:38 - INFO - __main__ - Step 35350: {'lr': 0.00019956723277004878, 'samples': 1131200, 'steps': 2209, 'loss/train': 2.821985960006714} -09/20/2021 22:08:39 - INFO - __main__ - Step 35351: {'lr': 0.00019956723277004878, 'samples': 1131232, 'steps': 2209, 'loss/train': 2.359462022781372} -09/20/2021 22:08:40 - INFO - __main__ - Step 35352: {'lr': 0.00019956723277004878, 'samples': 1131264, 'steps': 2209, 'loss/train': 2.184495449066162} -09/20/2021 22:08:41 - INFO - __main__ - Step 35353: {'lr': 0.00019956723277004878, 'samples': 1131296, 'steps': 2209, 'loss/train': 1.999915361404419} -09/20/2021 22:08:42 - INFO - __main__ - Step 35354: {'lr': 0.00019956723277004878, 'samples': 1131328, 'steps': 2209, 'loss/train': 2.436664342880249} -09/20/2021 22:08:43 - INFO - __main__ - Step 35355: {'lr': 0.00019956723277004878, 'samples': 1131360, 'steps': 2209, 'loss/train': 2.891995668411255} -09/20/2021 22:08:43 - INFO - __main__ - Step 35356: {'lr': 0.00019956723277004878, 'samples': 1131392, 'steps': 2209, 'loss/train': 2.275291919708252} -09/20/2021 22:08:44 - INFO - __main__ - Step 35357: {'lr': 0.00019956723277004878, 'samples': 1131424, 'steps': 2209, 'loss/train': 2.2705769538879395} -09/20/2021 22:08:45 - INFO - __main__ - Step 35358: {'lr': 0.00019956723277004878, 'samples': 1131456, 'steps': 2209, 'loss/train': 2.1904373168945312} -09/20/2021 22:08:46 - INFO - __main__ - Step 35359: {'lr': 0.00019956723277004878, 'samples': 1131488, 'steps': 2209, 'loss/train': 2.6902496814727783} -09/20/2021 22:08:46 - INFO - __main__ - Step 35360: {'lr': 0.00019956723277004878, 'samples': 1131520, 'steps': 2209, 'loss/train': 1.6564757823944092} -09/20/2021 22:08:47 - INFO - __main__ - Step 35361: {'lr': 0.00019956663975759136, 'samples': 1131552, 'steps': 2210, 'loss/train': 2.1786861419677734} -09/20/2021 22:08:48 - INFO - __main__ - Step 35362: {'lr': 0.00019956663975759136, 'samples': 1131584, 'steps': 2210, 'loss/train': 0.23868773877620697} -09/20/2021 22:08:49 - INFO - __main__ - Step 35363: {'lr': 0.00019956663975759136, 'samples': 1131616, 'steps': 2210, 'loss/train': 0.8121009469032288} -09/20/2021 22:08:50 - INFO - __main__ - Step 35364: {'lr': 0.00019956663975759136, 'samples': 1131648, 'steps': 2210, 'loss/train': 1.9527227878570557} -09/20/2021 22:08:50 - INFO - __main__ - Step 35365: {'lr': 0.00019956663975759136, 'samples': 1131680, 'steps': 2210, 'loss/train': 2.3165738582611084} -09/20/2021 22:08:51 - INFO - __main__ - Step 35366: {'lr': 0.00019956663975759136, 'samples': 1131712, 'steps': 2210, 'loss/train': 2.1753342151641846} -09/20/2021 22:08:52 - INFO - __main__ - Step 35367: {'lr': 0.00019956663975759136, 'samples': 1131744, 'steps': 2210, 'loss/train': 2.1689202785491943} -09/20/2021 22:08:53 - INFO - __main__ - Step 35368: {'lr': 0.00019956663975759136, 'samples': 1131776, 'steps': 2210, 'loss/train': 1.600338339805603} -09/20/2021 22:08:53 - INFO - __main__ - Step 35369: {'lr': 0.00019956663975759136, 'samples': 1131808, 'steps': 2210, 'loss/train': 3.3899829387664795} -09/20/2021 22:08:54 - INFO - __main__ - Step 35370: {'lr': 0.00019956663975759136, 'samples': 1131840, 'steps': 2210, 'loss/train': 2.2648284435272217} -09/20/2021 22:08:55 - INFO - __main__ - Step 35371: {'lr': 0.00019956663975759136, 'samples': 1131872, 'steps': 2210, 'loss/train': 2.9442005157470703} -09/20/2021 22:08:56 - INFO - __main__ - Step 35372: {'lr': 0.00019956663975759136, 'samples': 1131904, 'steps': 2210, 'loss/train': 2.524460792541504} -09/20/2021 22:08:56 - INFO - __main__ - Step 35373: {'lr': 0.00019956663975759136, 'samples': 1131936, 'steps': 2210, 'loss/train': 2.5353176593780518} -09/20/2021 22:08:57 - INFO - __main__ - Step 35374: {'lr': 0.00019956663975759136, 'samples': 1131968, 'steps': 2210, 'loss/train': 2.3265881538391113} -09/20/2021 22:08:58 - INFO - __main__ - Step 35375: {'lr': 0.00019956663975759136, 'samples': 1132000, 'steps': 2210, 'loss/train': 1.8038753271102905} -09/20/2021 22:08:59 - INFO - __main__ - Step 35376: {'lr': 0.00019956663975759136, 'samples': 1132032, 'steps': 2210, 'loss/train': 2.1413543224334717} -09/20/2021 22:09:00 - INFO - __main__ - Step 35377: {'lr': 0.00019956604633999768, 'samples': 1132064, 'steps': 2211, 'loss/train': 2.523167610168457} -09/20/2021 22:09:00 - INFO - __main__ - Step 35378: {'lr': 0.00019956604633999768, 'samples': 1132096, 'steps': 2211, 'loss/train': 2.2582733631134033} -09/20/2021 22:09:01 - INFO - __main__ - Step 35379: {'lr': 0.00019956604633999768, 'samples': 1132128, 'steps': 2211, 'loss/train': 1.8801263570785522} -09/20/2021 22:09:02 - INFO - __main__ - Step 35380: {'lr': 0.00019956604633999768, 'samples': 1132160, 'steps': 2211, 'loss/train': 2.2329764366149902} -09/20/2021 22:09:03 - INFO - __main__ - Step 35381: {'lr': 0.00019956604633999768, 'samples': 1132192, 'steps': 2211, 'loss/train': 2.706698417663574} -09/20/2021 22:09:03 - INFO - __main__ - Step 35382: {'lr': 0.00019956604633999768, 'samples': 1132224, 'steps': 2211, 'loss/train': 2.690215826034546} -09/20/2021 22:09:04 - INFO - __main__ - Step 35383: {'lr': 0.00019956604633999768, 'samples': 1132256, 'steps': 2211, 'loss/train': 2.627331256866455} -09/20/2021 22:09:05 - INFO - __main__ - Step 35384: {'lr': 0.00019956604633999768, 'samples': 1132288, 'steps': 2211, 'loss/train': 2.47676682472229} -09/20/2021 22:09:06 - INFO - __main__ - Step 35385: {'lr': 0.00019956604633999768, 'samples': 1132320, 'steps': 2211, 'loss/train': 2.5195229053497314} -09/20/2021 22:09:07 - INFO - __main__ - Step 35386: {'lr': 0.00019956604633999768, 'samples': 1132352, 'steps': 2211, 'loss/train': 3.0735769271850586} -09/20/2021 22:09:08 - INFO - __main__ - Step 35387: {'lr': 0.00019956604633999768, 'samples': 1132384, 'steps': 2211, 'loss/train': 2.282517910003662} -09/20/2021 22:09:09 - INFO - __main__ - Step 35388: {'lr': 0.00019956604633999768, 'samples': 1132416, 'steps': 2211, 'loss/train': 0.7998846173286438} -09/20/2021 22:09:09 - INFO - __main__ - Step 35389: {'lr': 0.00019956604633999768, 'samples': 1132448, 'steps': 2211, 'loss/train': 2.5042319297790527} -09/20/2021 22:09:10 - INFO - __main__ - Step 35390: {'lr': 0.00019956604633999768, 'samples': 1132480, 'steps': 2211, 'loss/train': 2.1819958686828613} -09/20/2021 22:09:11 - INFO - __main__ - Step 35391: {'lr': 0.00019956604633999768, 'samples': 1132512, 'steps': 2211, 'loss/train': 2.4777657985687256} -09/20/2021 22:09:12 - INFO - __main__ - Step 35392: {'lr': 0.00019956604633999768, 'samples': 1132544, 'steps': 2211, 'loss/train': 1.7898588180541992} -09/20/2021 22:09:12 - INFO - __main__ - Step 35393: {'lr': 0.0001995654525172701, 'samples': 1132576, 'steps': 2212, 'loss/train': 2.7592809200286865} -09/20/2021 22:09:13 - INFO - __main__ - Step 35394: {'lr': 0.0001995654525172701, 'samples': 1132608, 'steps': 2212, 'loss/train': 2.7132949829101562} -09/20/2021 22:09:14 - INFO - __main__ - Step 35395: {'lr': 0.0001995654525172701, 'samples': 1132640, 'steps': 2212, 'loss/train': 2.0792322158813477} -09/20/2021 22:09:15 - INFO - __main__ - Step 35396: {'lr': 0.0001995654525172701, 'samples': 1132672, 'steps': 2212, 'loss/train': 2.6240272521972656} -09/20/2021 22:09:15 - INFO - __main__ - Step 35397: {'lr': 0.0001995654525172701, 'samples': 1132704, 'steps': 2212, 'loss/train': 2.4147372245788574} -09/20/2021 22:09:16 - INFO - __main__ - Step 35398: {'lr': 0.0001995654525172701, 'samples': 1132736, 'steps': 2212, 'loss/train': 2.429676055908203} -09/20/2021 22:09:17 - INFO - __main__ - Step 35399: {'lr': 0.0001995654525172701, 'samples': 1132768, 'steps': 2212, 'loss/train': 1.5972611904144287} -09/20/2021 22:09:18 - INFO - __main__ - Step 35400: {'lr': 0.0001995654525172701, 'samples': 1132800, 'steps': 2212, 'loss/train': 0.9944718480110168} -09/20/2021 22:09:18 - INFO - __main__ - Step 35401: {'lr': 0.0001995654525172701, 'samples': 1132832, 'steps': 2212, 'loss/train': 2.330400228500366} -09/20/2021 22:09:19 - INFO - __main__ - Step 35402: {'lr': 0.0001995654525172701, 'samples': 1132864, 'steps': 2212, 'loss/train': 1.906624436378479} -09/20/2021 22:09:20 - INFO - __main__ - Step 35403: {'lr': 0.0001995654525172701, 'samples': 1132896, 'steps': 2212, 'loss/train': 1.6992077827453613} -09/20/2021 22:09:21 - INFO - __main__ - Step 35404: {'lr': 0.0001995654525172701, 'samples': 1132928, 'steps': 2212, 'loss/train': 1.858038306236267} -09/20/2021 22:09:21 - INFO - __main__ - Step 35405: {'lr': 0.0001995654525172701, 'samples': 1132960, 'steps': 2212, 'loss/train': 2.350639820098877} -09/20/2021 22:09:22 - INFO - __main__ - Step 35406: {'lr': 0.0001995654525172701, 'samples': 1132992, 'steps': 2212, 'loss/train': 2.069338798522949} -09/20/2021 22:09:23 - INFO - __main__ - Step 35407: {'lr': 0.0001995654525172701, 'samples': 1133024, 'steps': 2212, 'loss/train': 2.053434133529663} -09/20/2021 22:09:24 - INFO - __main__ - Step 35408: {'lr': 0.0001995654525172701, 'samples': 1133056, 'steps': 2212, 'loss/train': 1.9103883504867554} -09/20/2021 22:09:25 - INFO - __main__ - Step 35409: {'lr': 0.00019956485828941112, 'samples': 1133088, 'steps': 2213, 'loss/train': 2.4826507568359375} -09/20/2021 22:09:25 - INFO - __main__ - Step 35410: {'lr': 0.00019956485828941112, 'samples': 1133120, 'steps': 2213, 'loss/train': 0.5012027025222778} -09/20/2021 22:09:26 - INFO - __main__ - Step 35411: {'lr': 0.00019956485828941112, 'samples': 1133152, 'steps': 2213, 'loss/train': 2.161630153656006} -09/20/2021 22:09:27 - INFO - __main__ - Step 35412: {'lr': 0.00019956485828941112, 'samples': 1133184, 'steps': 2213, 'loss/train': 2.6744861602783203} -09/20/2021 22:09:28 - INFO - __main__ - Step 35413: {'lr': 0.00019956485828941112, 'samples': 1133216, 'steps': 2213, 'loss/train': 0.7773206233978271} -09/20/2021 22:09:28 - INFO - __main__ - Step 35414: {'lr': 0.00019956485828941112, 'samples': 1133248, 'steps': 2213, 'loss/train': 2.0516889095306396} -09/20/2021 22:09:29 - INFO - __main__ - Step 35415: {'lr': 0.00019956485828941112, 'samples': 1133280, 'steps': 2213, 'loss/train': 1.8494839668273926} -09/20/2021 22:09:30 - INFO - __main__ - Step 35416: {'lr': 0.00019956485828941112, 'samples': 1133312, 'steps': 2213, 'loss/train': 1.9819960594177246} -09/20/2021 22:09:31 - INFO - __main__ - Step 35417: {'lr': 0.00019956485828941112, 'samples': 1133344, 'steps': 2213, 'loss/train': 2.610391616821289} -09/20/2021 22:09:31 - INFO - __main__ - Step 35418: {'lr': 0.00019956485828941112, 'samples': 1133376, 'steps': 2213, 'loss/train': 2.685274362564087} -09/20/2021 22:09:32 - INFO - __main__ - Step 35419: {'lr': 0.00019956485828941112, 'samples': 1133408, 'steps': 2213, 'loss/train': 2.7747066020965576} -09/20/2021 22:09:33 - INFO - __main__ - Step 35420: {'lr': 0.00019956485828941112, 'samples': 1133440, 'steps': 2213, 'loss/train': 2.7513134479522705} -09/20/2021 22:09:34 - INFO - __main__ - Step 35421: {'lr': 0.00019956485828941112, 'samples': 1133472, 'steps': 2213, 'loss/train': 2.6621806621551514} -09/20/2021 22:09:34 - INFO - __main__ - Step 35422: {'lr': 0.00019956485828941112, 'samples': 1133504, 'steps': 2213, 'loss/train': 2.7715370655059814} -09/20/2021 22:09:36 - INFO - __main__ - Step 35423: {'lr': 0.00019956485828941112, 'samples': 1133536, 'steps': 2213, 'loss/train': 1.921438455581665} -09/20/2021 22:09:36 - INFO - __main__ - Step 35424: {'lr': 0.00019956485828941112, 'samples': 1133568, 'steps': 2213, 'loss/train': 2.054175615310669} -09/20/2021 22:09:37 - INFO - __main__ - Step 35425: {'lr': 0.00019956426365642309, 'samples': 1133600, 'steps': 2214, 'loss/train': 1.7333883047103882} -09/20/2021 22:09:38 - INFO - __main__ - Step 35426: {'lr': 0.00019956426365642309, 'samples': 1133632, 'steps': 2214, 'loss/train': 0.8911787271499634} -09/20/2021 22:09:39 - INFO - __main__ - Step 35427: {'lr': 0.00019956426365642309, 'samples': 1133664, 'steps': 2214, 'loss/train': 1.6296881437301636} -09/20/2021 22:09:40 - INFO - __main__ - Step 35428: {'lr': 0.00019956426365642309, 'samples': 1133696, 'steps': 2214, 'loss/train': 3.151604413986206} -09/20/2021 22:09:40 - INFO - __main__ - Step 35429: {'lr': 0.00019956426365642309, 'samples': 1133728, 'steps': 2214, 'loss/train': 2.0302536487579346} -09/20/2021 22:09:41 - INFO - __main__ - Step 35430: {'lr': 0.00019956426365642309, 'samples': 1133760, 'steps': 2214, 'loss/train': 2.5874061584472656} -09/20/2021 22:09:42 - INFO - __main__ - Step 35431: {'lr': 0.00019956426365642309, 'samples': 1133792, 'steps': 2214, 'loss/train': 0.9594652056694031} -09/20/2021 22:09:43 - INFO - __main__ - Step 35432: {'lr': 0.00019956426365642309, 'samples': 1133824, 'steps': 2214, 'loss/train': 1.9303615093231201} -09/20/2021 22:09:43 - INFO - __main__ - Step 35433: {'lr': 0.00019956426365642309, 'samples': 1133856, 'steps': 2214, 'loss/train': 1.8863587379455566} -09/20/2021 22:09:44 - INFO - __main__ - Step 35434: {'lr': 0.00019956426365642309, 'samples': 1133888, 'steps': 2214, 'loss/train': 2.732741117477417} -09/20/2021 22:09:45 - INFO - __main__ - Step 35435: {'lr': 0.00019956426365642309, 'samples': 1133920, 'steps': 2214, 'loss/train': 0.7249552607536316} -09/20/2021 22:09:46 - INFO - __main__ - Step 35436: {'lr': 0.00019956426365642309, 'samples': 1133952, 'steps': 2214, 'loss/train': 2.0249969959259033} -09/20/2021 22:09:46 - INFO - __main__ - Step 35437: {'lr': 0.00019956426365642309, 'samples': 1133984, 'steps': 2214, 'loss/train': 2.1800708770751953} -09/20/2021 22:09:47 - INFO - __main__ - Step 35438: {'lr': 0.00019956426365642309, 'samples': 1134016, 'steps': 2214, 'loss/train': 0.9946149587631226} -09/20/2021 22:09:48 - INFO - __main__ - Step 35439: {'lr': 0.00019956426365642309, 'samples': 1134048, 'steps': 2214, 'loss/train': 1.684057593345642} -09/20/2021 22:09:49 - INFO - __main__ - Step 35440: {'lr': 0.00019956426365642309, 'samples': 1134080, 'steps': 2214, 'loss/train': 2.013711452484131} -09/20/2021 22:09:49 - INFO - __main__ - Step 35441: {'lr': 0.0001995636686183085, 'samples': 1134112, 'steps': 2215, 'loss/train': 2.27451229095459} -09/20/2021 22:09:50 - INFO - __main__ - Step 35442: {'lr': 0.0001995636686183085, 'samples': 1134144, 'steps': 2215, 'loss/train': 2.6161906719207764} -09/20/2021 22:09:51 - INFO - __main__ - Step 35443: {'lr': 0.0001995636686183085, 'samples': 1134176, 'steps': 2215, 'loss/train': 0.7676188349723816} -09/20/2021 22:09:52 - INFO - __main__ - Step 35444: {'lr': 0.0001995636686183085, 'samples': 1134208, 'steps': 2215, 'loss/train': 2.059084892272949} -09/20/2021 22:09:52 - INFO - __main__ - Step 35445: {'lr': 0.0001995636686183085, 'samples': 1134240, 'steps': 2215, 'loss/train': 3.302854061126709} -09/20/2021 22:09:53 - INFO - __main__ - Step 35446: {'lr': 0.0001995636686183085, 'samples': 1134272, 'steps': 2215, 'loss/train': 3.0372567176818848} -09/20/2021 22:09:54 - INFO - __main__ - Step 35447: {'lr': 0.0001995636686183085, 'samples': 1134304, 'steps': 2215, 'loss/train': 2.4278724193573} -09/20/2021 22:09:55 - INFO - __main__ - Step 35448: {'lr': 0.0001995636686183085, 'samples': 1134336, 'steps': 2215, 'loss/train': 2.8832340240478516} -09/20/2021 22:09:55 - INFO - __main__ - Step 35449: {'lr': 0.0001995636686183085, 'samples': 1134368, 'steps': 2215, 'loss/train': 2.3155782222747803} -09/20/2021 22:09:56 - INFO - __main__ - Step 35450: {'lr': 0.0001995636686183085, 'samples': 1134400, 'steps': 2215, 'loss/train': 2.2471413612365723} -09/20/2021 22:09:57 - INFO - __main__ - Step 35451: {'lr': 0.0001995636686183085, 'samples': 1134432, 'steps': 2215, 'loss/train': 2.7472352981567383} -09/20/2021 22:09:58 - INFO - __main__ - Step 35452: {'lr': 0.0001995636686183085, 'samples': 1134464, 'steps': 2215, 'loss/train': 1.7475032806396484} -09/20/2021 22:09:58 - INFO - __main__ - Step 35453: {'lr': 0.0001995636686183085, 'samples': 1134496, 'steps': 2215, 'loss/train': 1.3392373323440552} -09/20/2021 22:10:01 - INFO - __main__ - Step 35454: {'lr': 0.0001995636686183085, 'samples': 1134528, 'steps': 2215, 'loss/train': 0.9328518509864807} -09/20/2021 22:10:01 - INFO - __main__ - Step 35455: {'lr': 0.0001995636686183085, 'samples': 1134560, 'steps': 2215, 'loss/train': 2.2391295433044434} -09/20/2021 22:10:02 - INFO - __main__ - Step 35456: {'lr': 0.0001995636686183085, 'samples': 1134592, 'steps': 2215, 'loss/train': 2.179749011993408} -09/20/2021 22:10:03 - INFO - __main__ - Step 35457: {'lr': 0.00019956307317506967, 'samples': 1134624, 'steps': 2216, 'loss/train': 2.6214439868927} -09/20/2021 22:10:04 - INFO - __main__ - Step 35458: {'lr': 0.00019956307317506967, 'samples': 1134656, 'steps': 2216, 'loss/train': 1.939626693725586} -09/20/2021 22:10:05 - INFO - __main__ - Step 35459: {'lr': 0.00019956307317506967, 'samples': 1134688, 'steps': 2216, 'loss/train': 2.4815573692321777} -09/20/2021 22:10:05 - INFO - __main__ - Step 35460: {'lr': 0.00019956307317506967, 'samples': 1134720, 'steps': 2216, 'loss/train': 2.2532691955566406} -09/20/2021 22:10:06 - INFO - __main__ - Step 35461: {'lr': 0.00019956307317506967, 'samples': 1134752, 'steps': 2216, 'loss/train': 2.2143330574035645} -09/20/2021 22:10:07 - INFO - __main__ - Step 35462: {'lr': 0.00019956307317506967, 'samples': 1134784, 'steps': 2216, 'loss/train': 2.2314131259918213} -09/20/2021 22:10:08 - INFO - __main__ - Step 35463: {'lr': 0.00019956307317506967, 'samples': 1134816, 'steps': 2216, 'loss/train': 2.02388072013855} -09/20/2021 22:10:08 - INFO - __main__ - Step 35464: {'lr': 0.00019956307317506967, 'samples': 1134848, 'steps': 2216, 'loss/train': 2.2088563442230225} -09/20/2021 22:10:09 - INFO - __main__ - Step 35465: {'lr': 0.00019956307317506967, 'samples': 1134880, 'steps': 2216, 'loss/train': 1.9647021293640137} -09/20/2021 22:10:10 - INFO - __main__ - Step 35466: {'lr': 0.00019956307317506967, 'samples': 1134912, 'steps': 2216, 'loss/train': 1.9510579109191895} -09/20/2021 22:10:11 - INFO - __main__ - Step 35467: {'lr': 0.00019956307317506967, 'samples': 1134944, 'steps': 2216, 'loss/train': 2.120842456817627} -09/20/2021 22:10:11 - INFO - __main__ - Step 35468: {'lr': 0.00019956307317506967, 'samples': 1134976, 'steps': 2216, 'loss/train': 2.2498788833618164} -09/20/2021 22:10:12 - INFO - __main__ - Step 35469: {'lr': 0.00019956307317506967, 'samples': 1135008, 'steps': 2216, 'loss/train': 2.0971240997314453} -09/20/2021 22:10:13 - INFO - __main__ - Step 35470: {'lr': 0.00019956307317506967, 'samples': 1135040, 'steps': 2216, 'loss/train': 2.065748453140259} -09/20/2021 22:10:14 - INFO - __main__ - Step 35471: {'lr': 0.00019956307317506967, 'samples': 1135072, 'steps': 2216, 'loss/train': 2.17441463470459} -09/20/2021 22:10:14 - INFO - __main__ - Step 35472: {'lr': 0.00019956307317506967, 'samples': 1135104, 'steps': 2216, 'loss/train': 2.014462947845459} -09/20/2021 22:10:15 - INFO - __main__ - Step 35473: {'lr': 0.0001995624773267091, 'samples': 1135136, 'steps': 2217, 'loss/train': 1.6673610210418701} -09/20/2021 22:10:16 - INFO - __main__ - Step 35474: {'lr': 0.0001995624773267091, 'samples': 1135168, 'steps': 2217, 'loss/train': 1.6575630903244019} -09/20/2021 22:10:17 - INFO - __main__ - Step 35475: {'lr': 0.0001995624773267091, 'samples': 1135200, 'steps': 2217, 'loss/train': 2.492152452468872} -09/20/2021 22:10:17 - INFO - __main__ - Step 35476: {'lr': 0.0001995624773267091, 'samples': 1135232, 'steps': 2217, 'loss/train': 1.828885793685913} -09/20/2021 22:10:18 - INFO - __main__ - Step 35477: {'lr': 0.0001995624773267091, 'samples': 1135264, 'steps': 2217, 'loss/train': 2.4827933311462402} -09/20/2021 22:10:19 - INFO - __main__ - Step 35478: {'lr': 0.0001995624773267091, 'samples': 1135296, 'steps': 2217, 'loss/train': 2.3317019939422607} -09/20/2021 22:10:20 - INFO - __main__ - Step 35479: {'lr': 0.0001995624773267091, 'samples': 1135328, 'steps': 2217, 'loss/train': 2.6844165325164795} -09/20/2021 22:10:20 - INFO - __main__ - Step 35480: {'lr': 0.0001995624773267091, 'samples': 1135360, 'steps': 2217, 'loss/train': 2.507009267807007} -09/20/2021 22:10:21 - INFO - __main__ - Step 35481: {'lr': 0.0001995624773267091, 'samples': 1135392, 'steps': 2217, 'loss/train': 2.348296880722046} -09/20/2021 22:10:22 - INFO - __main__ - Step 35482: {'lr': 0.0001995624773267091, 'samples': 1135424, 'steps': 2217, 'loss/train': 2.801726818084717} -09/20/2021 22:10:23 - INFO - __main__ - Step 35483: {'lr': 0.0001995624773267091, 'samples': 1135456, 'steps': 2217, 'loss/train': 1.291123628616333} -09/20/2021 22:10:23 - INFO - __main__ - Step 35484: {'lr': 0.0001995624773267091, 'samples': 1135488, 'steps': 2217, 'loss/train': 2.210292339324951} -09/20/2021 22:10:24 - INFO - __main__ - Step 35485: {'lr': 0.0001995624773267091, 'samples': 1135520, 'steps': 2217, 'loss/train': 2.236466884613037} -09/20/2021 22:10:25 - INFO - __main__ - Step 35486: {'lr': 0.0001995624773267091, 'samples': 1135552, 'steps': 2217, 'loss/train': 2.1448261737823486} -09/20/2021 22:10:26 - INFO - __main__ - Step 35487: {'lr': 0.0001995624773267091, 'samples': 1135584, 'steps': 2217, 'loss/train': 3.207026481628418} -09/20/2021 22:10:26 - INFO - __main__ - Step 35488: {'lr': 0.0001995624773267091, 'samples': 1135616, 'steps': 2217, 'loss/train': 0.694896399974823} -09/20/2021 22:10:27 - INFO - __main__ - Step 35489: {'lr': 0.00019956188107322925, 'samples': 1135648, 'steps': 2218, 'loss/train': 1.7517461776733398} -09/20/2021 22:10:28 - INFO - __main__ - Step 35490: {'lr': 0.00019956188107322925, 'samples': 1135680, 'steps': 2218, 'loss/train': 1.9961439371109009} -09/20/2021 22:10:30 - INFO - __main__ - Step 35491: {'lr': 0.00019956188107322925, 'samples': 1135712, 'steps': 2218, 'loss/train': 1.8974933624267578} -09/20/2021 22:10:30 - INFO - __main__ - Step 35492: {'lr': 0.00019956188107322925, 'samples': 1135744, 'steps': 2218, 'loss/train': 2.1319596767425537} -09/20/2021 22:10:31 - INFO - __main__ - Step 35493: {'lr': 0.00019956188107322925, 'samples': 1135776, 'steps': 2218, 'loss/train': 2.0068423748016357} -09/20/2021 22:10:32 - INFO - __main__ - Step 35494: {'lr': 0.00019956188107322925, 'samples': 1135808, 'steps': 2218, 'loss/train': 2.4488208293914795} -09/20/2021 22:10:33 - INFO - __main__ - Step 35495: {'lr': 0.00019956188107322925, 'samples': 1135840, 'steps': 2218, 'loss/train': 2.705721616744995} -09/20/2021 22:10:33 - INFO - __main__ - Step 35496: {'lr': 0.00019956188107322925, 'samples': 1135872, 'steps': 2218, 'loss/train': 2.9525060653686523} -09/20/2021 22:10:34 - INFO - __main__ - Step 35497: {'lr': 0.00019956188107322925, 'samples': 1135904, 'steps': 2218, 'loss/train': 2.197530746459961} -09/20/2021 22:10:35 - INFO - __main__ - Step 35498: {'lr': 0.00019956188107322925, 'samples': 1135936, 'steps': 2218, 'loss/train': 3.3320417404174805} -09/20/2021 22:10:36 - INFO - __main__ - Step 35499: {'lr': 0.00019956188107322925, 'samples': 1135968, 'steps': 2218, 'loss/train': 2.4217820167541504} -09/20/2021 22:10:36 - INFO - __main__ - Step 35500: {'lr': 0.00019956188107322925, 'samples': 1136000, 'steps': 2218, 'loss/train': 3.588761329650879} -09/20/2021 22:10:37 - INFO - __main__ - Step 35501: {'lr': 0.00019956188107322925, 'samples': 1136032, 'steps': 2218, 'loss/train': 2.968959093093872} -09/20/2021 22:10:38 - INFO - __main__ - Step 35502: {'lr': 0.00019956188107322925, 'samples': 1136064, 'steps': 2218, 'loss/train': 2.51124906539917} -09/20/2021 22:10:39 - INFO - __main__ - Step 35503: {'lr': 0.00019956188107322925, 'samples': 1136096, 'steps': 2218, 'loss/train': 3.8032548427581787} -09/20/2021 22:10:39 - INFO - __main__ - Step 35504: {'lr': 0.00019956188107322925, 'samples': 1136128, 'steps': 2218, 'loss/train': 2.483704090118408} -09/20/2021 22:10:40 - INFO - __main__ - Step 35505: {'lr': 0.00019956128441463245, 'samples': 1136160, 'steps': 2219, 'loss/train': 2.606870412826538} -09/20/2021 22:10:41 - INFO - __main__ - Step 35506: {'lr': 0.00019956128441463245, 'samples': 1136192, 'steps': 2219, 'loss/train': 1.6200746297836304} -09/20/2021 22:10:42 - INFO - __main__ - Step 35507: {'lr': 0.00019956128441463245, 'samples': 1136224, 'steps': 2219, 'loss/train': 2.3644447326660156} -09/20/2021 22:10:42 - INFO - __main__ - Step 35508: {'lr': 0.00019956128441463245, 'samples': 1136256, 'steps': 2219, 'loss/train': 1.9266941547393799} -09/20/2021 22:10:43 - INFO - __main__ - Step 35509: {'lr': 0.00019956128441463245, 'samples': 1136288, 'steps': 2219, 'loss/train': 2.40193247795105} -09/20/2021 22:10:44 - INFO - __main__ - Step 35510: {'lr': 0.00019956128441463245, 'samples': 1136320, 'steps': 2219, 'loss/train': 3.1055827140808105} -09/20/2021 22:10:45 - INFO - __main__ - Step 35511: {'lr': 0.00019956128441463245, 'samples': 1136352, 'steps': 2219, 'loss/train': 2.224277973175049} -09/20/2021 22:10:45 - INFO - __main__ - Step 35512: {'lr': 0.00019956128441463245, 'samples': 1136384, 'steps': 2219, 'loss/train': 2.846625566482544} -09/20/2021 22:10:46 - INFO - __main__ - Step 35513: {'lr': 0.00019956128441463245, 'samples': 1136416, 'steps': 2219, 'loss/train': 2.062692403793335} -09/20/2021 22:10:47 - INFO - __main__ - Step 35514: {'lr': 0.00019956128441463245, 'samples': 1136448, 'steps': 2219, 'loss/train': 2.407038450241089} -09/20/2021 22:10:48 - INFO - __main__ - Step 35515: {'lr': 0.00019956128441463245, 'samples': 1136480, 'steps': 2219, 'loss/train': 1.2455672025680542} -09/20/2021 22:10:48 - INFO - __main__ - Step 35516: {'lr': 0.00019956128441463245, 'samples': 1136512, 'steps': 2219, 'loss/train': 1.8422877788543701} -09/20/2021 22:10:49 - INFO - __main__ - Step 35517: {'lr': 0.00019956128441463245, 'samples': 1136544, 'steps': 2219, 'loss/train': 1.5948559045791626} -09/20/2021 22:10:50 - INFO - __main__ - Step 35518: {'lr': 0.00019956128441463245, 'samples': 1136576, 'steps': 2219, 'loss/train': 2.0731890201568604} -09/20/2021 22:10:51 - INFO - __main__ - Step 35519: {'lr': 0.00019956128441463245, 'samples': 1136608, 'steps': 2219, 'loss/train': 1.7730027437210083} -09/20/2021 22:10:51 - INFO - __main__ - Step 35520: {'lr': 0.00019956128441463245, 'samples': 1136640, 'steps': 2219, 'loss/train': 2.1481947898864746} -09/20/2021 22:10:52 - INFO - __main__ - Step 35521: {'lr': 0.00019956068735092116, 'samples': 1136672, 'steps': 2220, 'loss/train': 1.81497323513031} -09/20/2021 22:10:53 - INFO - __main__ - Step 35522: {'lr': 0.00019956068735092116, 'samples': 1136704, 'steps': 2220, 'loss/train': 1.8135696649551392} -09/20/2021 22:10:54 - INFO - __main__ - Step 35523: {'lr': 0.00019956068735092116, 'samples': 1136736, 'steps': 2220, 'loss/train': 1.7942500114440918} -09/20/2021 22:10:55 - INFO - __main__ - Step 35524: {'lr': 0.00019956068735092116, 'samples': 1136768, 'steps': 2220, 'loss/train': 1.9395345449447632} -09/20/2021 22:10:56 - INFO - __main__ - Step 35525: {'lr': 0.00019956068735092116, 'samples': 1136800, 'steps': 2220, 'loss/train': 2.2231481075286865} -09/20/2021 22:10:57 - INFO - __main__ - Step 35526: {'lr': 0.00019956068735092116, 'samples': 1136832, 'steps': 2220, 'loss/train': 2.3326776027679443} -09/20/2021 22:10:57 - INFO - __main__ - Step 35527: {'lr': 0.00019956068735092116, 'samples': 1136864, 'steps': 2220, 'loss/train': 1.747423529624939} -09/20/2021 22:10:58 - INFO - __main__ - Step 35528: {'lr': 0.00019956068735092116, 'samples': 1136896, 'steps': 2220, 'loss/train': 2.2209548950195312} -09/20/2021 22:10:59 - INFO - __main__ - Step 35529: {'lr': 0.00019956068735092116, 'samples': 1136928, 'steps': 2220, 'loss/train': 2.1310558319091797} -09/20/2021 22:11:00 - INFO - __main__ - Step 35530: {'lr': 0.00019956068735092116, 'samples': 1136960, 'steps': 2220, 'loss/train': 0.5413133502006531} -09/20/2021 22:11:00 - INFO - __main__ - Step 35531: {'lr': 0.00019956068735092116, 'samples': 1136992, 'steps': 2220, 'loss/train': 2.749861478805542} -09/20/2021 22:11:01 - INFO - __main__ - Step 35532: {'lr': 0.00019956068735092116, 'samples': 1137024, 'steps': 2220, 'loss/train': 2.7577054500579834} -09/20/2021 22:11:02 - INFO - __main__ - Step 35533: {'lr': 0.00019956068735092116, 'samples': 1137056, 'steps': 2220, 'loss/train': 2.1724693775177} -09/20/2021 22:11:03 - INFO - __main__ - Step 35534: {'lr': 0.00019956068735092116, 'samples': 1137088, 'steps': 2220, 'loss/train': 2.268657684326172} -09/20/2021 22:11:03 - INFO - __main__ - Step 35535: {'lr': 0.00019956068735092116, 'samples': 1137120, 'steps': 2220, 'loss/train': 2.197313070297241} -09/20/2021 22:11:04 - INFO - __main__ - Step 35536: {'lr': 0.00019956068735092116, 'samples': 1137152, 'steps': 2220, 'loss/train': 2.1133997440338135} -09/20/2021 22:11:05 - INFO - __main__ - Step 35537: {'lr': 0.00019956008988209782, 'samples': 1137184, 'steps': 2221, 'loss/train': 1.4474139213562012} -09/20/2021 22:11:06 - INFO - __main__ - Step 35538: {'lr': 0.00019956008988209782, 'samples': 1137216, 'steps': 2221, 'loss/train': 2.533658742904663} -09/20/2021 22:11:06 - INFO - __main__ - Step 35539: {'lr': 0.00019956008988209782, 'samples': 1137248, 'steps': 2221, 'loss/train': 3.4406397342681885} -09/20/2021 22:11:07 - INFO - __main__ - Step 35540: {'lr': 0.00019956008988209782, 'samples': 1137280, 'steps': 2221, 'loss/train': 2.078434705734253} -09/20/2021 22:11:08 - INFO - __main__ - Step 35541: {'lr': 0.00019956008988209782, 'samples': 1137312, 'steps': 2221, 'loss/train': 2.326032876968384} -09/20/2021 22:11:09 - INFO - __main__ - Step 35542: {'lr': 0.00019956008988209782, 'samples': 1137344, 'steps': 2221, 'loss/train': 1.6251897811889648} -09/20/2021 22:11:09 - INFO - __main__ - Step 35543: {'lr': 0.00019956008988209782, 'samples': 1137376, 'steps': 2221, 'loss/train': 1.9951257705688477} -09/20/2021 22:11:10 - INFO - __main__ - Step 35544: {'lr': 0.00019956008988209782, 'samples': 1137408, 'steps': 2221, 'loss/train': 1.5312951803207397} -09/20/2021 22:11:11 - INFO - __main__ - Step 35545: {'lr': 0.00019956008988209782, 'samples': 1137440, 'steps': 2221, 'loss/train': 3.562915086746216} -09/20/2021 22:11:12 - INFO - __main__ - Step 35546: {'lr': 0.00019956008988209782, 'samples': 1137472, 'steps': 2221, 'loss/train': 2.966763973236084} -09/20/2021 22:11:13 - INFO - __main__ - Step 35547: {'lr': 0.00019956008988209782, 'samples': 1137504, 'steps': 2221, 'loss/train': 2.0959229469299316} -09/20/2021 22:11:13 - INFO - __main__ - Step 35548: {'lr': 0.00019956008988209782, 'samples': 1137536, 'steps': 2221, 'loss/train': 0.8463618755340576} -09/20/2021 22:11:14 - INFO - __main__ - Step 35549: {'lr': 0.00019956008988209782, 'samples': 1137568, 'steps': 2221, 'loss/train': 1.2147542238235474} -09/20/2021 22:11:15 - INFO - __main__ - Step 35550: {'lr': 0.00019956008988209782, 'samples': 1137600, 'steps': 2221, 'loss/train': 3.6455607414245605} -09/20/2021 22:11:15 - INFO - __main__ - Step 35551: {'lr': 0.00019956008988209782, 'samples': 1137632, 'steps': 2221, 'loss/train': 2.240563154220581} -09/20/2021 22:11:16 - INFO - __main__ - Step 35552: {'lr': 0.00019956008988209782, 'samples': 1137664, 'steps': 2221, 'loss/train': 2.77101469039917} -09/20/2021 22:11:17 - INFO - __main__ - Step 35553: {'lr': 0.00019955949200816487, 'samples': 1137696, 'steps': 2222, 'loss/train': 2.3804731369018555} -09/20/2021 22:11:18 - INFO - __main__ - Step 35554: {'lr': 0.00019955949200816487, 'samples': 1137728, 'steps': 2222, 'loss/train': 1.7789238691329956} -09/20/2021 22:11:19 - INFO - __main__ - Step 35555: {'lr': 0.00019955949200816487, 'samples': 1137760, 'steps': 2222, 'loss/train': 2.089259147644043} -09/20/2021 22:11:19 - INFO - __main__ - Step 35556: {'lr': 0.00019955949200816487, 'samples': 1137792, 'steps': 2222, 'loss/train': 2.061084032058716} -09/20/2021 22:11:20 - INFO - __main__ - Step 35557: {'lr': 0.00019955949200816487, 'samples': 1137824, 'steps': 2222, 'loss/train': 2.0588390827178955} -09/20/2021 22:11:22 - INFO - __main__ - Step 35558: {'lr': 0.00019955949200816487, 'samples': 1137856, 'steps': 2222, 'loss/train': 3.112086296081543} -09/20/2021 22:11:23 - INFO - __main__ - Step 35559: {'lr': 0.00019955949200816487, 'samples': 1137888, 'steps': 2222, 'loss/train': 3.578164577484131} -09/20/2021 22:11:23 - INFO - __main__ - Step 35560: {'lr': 0.00019955949200816487, 'samples': 1137920, 'steps': 2222, 'loss/train': 2.845195770263672} -09/20/2021 22:11:24 - INFO - __main__ - Step 35561: {'lr': 0.00019955949200816487, 'samples': 1137952, 'steps': 2222, 'loss/train': 2.820542573928833} -09/20/2021 22:11:25 - INFO - __main__ - Step 35562: {'lr': 0.00019955949200816487, 'samples': 1137984, 'steps': 2222, 'loss/train': 1.9301691055297852} -09/20/2021 22:11:26 - INFO - __main__ - Step 35563: {'lr': 0.00019955949200816487, 'samples': 1138016, 'steps': 2222, 'loss/train': 1.6862601041793823} -09/20/2021 22:11:26 - INFO - __main__ - Step 35564: {'lr': 0.00019955949200816487, 'samples': 1138048, 'steps': 2222, 'loss/train': 2.561729669570923} -09/20/2021 22:11:27 - INFO - __main__ - Step 35565: {'lr': 0.00019955949200816487, 'samples': 1138080, 'steps': 2222, 'loss/train': 4.630419731140137} -09/20/2021 22:11:28 - INFO - __main__ - Step 35566: {'lr': 0.00019955949200816487, 'samples': 1138112, 'steps': 2222, 'loss/train': 2.3032784461975098} -09/20/2021 22:11:29 - INFO - __main__ - Step 35567: {'lr': 0.00019955949200816487, 'samples': 1138144, 'steps': 2222, 'loss/train': 2.4922409057617188} -09/20/2021 22:11:29 - INFO - __main__ - Step 35568: {'lr': 0.00019955949200816487, 'samples': 1138176, 'steps': 2222, 'loss/train': 2.1312663555145264} -09/20/2021 22:11:30 - INFO - __main__ - Step 35569: {'lr': 0.00019955889372912474, 'samples': 1138208, 'steps': 2223, 'loss/train': 2.42024827003479} -09/20/2021 22:11:31 - INFO - __main__ - Step 35570: {'lr': 0.00019955889372912474, 'samples': 1138240, 'steps': 2223, 'loss/train': 2.8343892097473145} -09/20/2021 22:11:32 - INFO - __main__ - Step 35571: {'lr': 0.00019955889372912474, 'samples': 1138272, 'steps': 2223, 'loss/train': 0.544512927532196} -09/20/2021 22:11:33 - INFO - __main__ - Step 35572: {'lr': 0.00019955889372912474, 'samples': 1138304, 'steps': 2223, 'loss/train': 2.3889331817626953} -09/20/2021 22:11:33 - INFO - __main__ - Step 35573: {'lr': 0.00019955889372912474, 'samples': 1138336, 'steps': 2223, 'loss/train': 3.2932534217834473} -09/20/2021 22:11:34 - INFO - __main__ - Step 35574: {'lr': 0.00019955889372912474, 'samples': 1138368, 'steps': 2223, 'loss/train': 0.7197346687316895} -09/20/2021 22:11:35 - INFO - __main__ - Step 35575: {'lr': 0.00019955889372912474, 'samples': 1138400, 'steps': 2223, 'loss/train': 2.268775701522827} -09/20/2021 22:11:36 - INFO - __main__ - Step 35576: {'lr': 0.00019955889372912474, 'samples': 1138432, 'steps': 2223, 'loss/train': 2.106844902038574} -09/20/2021 22:11:36 - INFO - __main__ - Step 35577: {'lr': 0.00019955889372912474, 'samples': 1138464, 'steps': 2223, 'loss/train': 2.117396831512451} -09/20/2021 22:11:37 - INFO - __main__ - Step 35578: {'lr': 0.00019955889372912474, 'samples': 1138496, 'steps': 2223, 'loss/train': 3.139765739440918} -09/20/2021 22:11:38 - INFO - __main__ - Step 35579: {'lr': 0.00019955889372912474, 'samples': 1138528, 'steps': 2223, 'loss/train': 2.161694049835205} -09/20/2021 22:11:39 - INFO - __main__ - Step 35580: {'lr': 0.00019955889372912474, 'samples': 1138560, 'steps': 2223, 'loss/train': 2.236468553543091} -09/20/2021 22:11:39 - INFO - __main__ - Step 35581: {'lr': 0.00019955889372912474, 'samples': 1138592, 'steps': 2223, 'loss/train': 2.4393603801727295} -09/20/2021 22:11:40 - INFO - __main__ - Step 35582: {'lr': 0.00019955889372912474, 'samples': 1138624, 'steps': 2223, 'loss/train': 2.0677287578582764} -09/20/2021 22:11:41 - INFO - __main__ - Step 35583: {'lr': 0.00019955889372912474, 'samples': 1138656, 'steps': 2223, 'loss/train': 1.5536048412322998} -09/20/2021 22:11:42 - INFO - __main__ - Step 35584: {'lr': 0.00019955889372912474, 'samples': 1138688, 'steps': 2223, 'loss/train': 2.9062716960906982} -09/20/2021 22:11:42 - INFO - __main__ - Step 35585: {'lr': 0.00019955829504497986, 'samples': 1138720, 'steps': 2224, 'loss/train': 2.2322640419006348} -09/20/2021 22:11:43 - INFO - __main__ - Step 35586: {'lr': 0.00019955829504497986, 'samples': 1138752, 'steps': 2224, 'loss/train': 2.4021596908569336} -09/20/2021 22:11:44 - INFO - __main__ - Step 35587: {'lr': 0.00019955829504497986, 'samples': 1138784, 'steps': 2224, 'loss/train': 1.802829623222351} -09/20/2021 22:11:45 - INFO - __main__ - Step 35588: {'lr': 0.00019955829504497986, 'samples': 1138816, 'steps': 2224, 'loss/train': 1.785854697227478} -09/20/2021 22:11:45 - INFO - __main__ - Step 35589: {'lr': 0.00019955829504497986, 'samples': 1138848, 'steps': 2224, 'loss/train': 2.300969362258911} -09/20/2021 22:11:47 - INFO - __main__ - Step 35590: {'lr': 0.00019955829504497986, 'samples': 1138880, 'steps': 2224, 'loss/train': 2.0178182125091553} -09/20/2021 22:11:48 - INFO - __main__ - Step 35591: {'lr': 0.00019955829504497986, 'samples': 1138912, 'steps': 2224, 'loss/train': 2.361923933029175} -09/20/2021 22:11:48 - INFO - __main__ - Step 35592: {'lr': 0.00019955829504497986, 'samples': 1138944, 'steps': 2224, 'loss/train': 1.6533782482147217} -09/20/2021 22:11:49 - INFO - __main__ - Step 35593: {'lr': 0.00019955829504497986, 'samples': 1138976, 'steps': 2224, 'loss/train': 2.698483943939209} -09/20/2021 22:11:50 - INFO - __main__ - Step 35594: {'lr': 0.00019955829504497986, 'samples': 1139008, 'steps': 2224, 'loss/train': 2.0613207817077637} -09/20/2021 22:11:51 - INFO - __main__ - Step 35595: {'lr': 0.00019955829504497986, 'samples': 1139040, 'steps': 2224, 'loss/train': 2.7527475357055664} -09/20/2021 22:11:51 - INFO - __main__ - Step 35596: {'lr': 0.00019955829504497986, 'samples': 1139072, 'steps': 2224, 'loss/train': 2.3266525268554688} -09/20/2021 22:11:52 - INFO - __main__ - Step 35597: {'lr': 0.00019955829504497986, 'samples': 1139104, 'steps': 2224, 'loss/train': 1.822649598121643} -09/20/2021 22:11:53 - INFO - __main__ - Step 35598: {'lr': 0.00019955829504497986, 'samples': 1139136, 'steps': 2224, 'loss/train': 2.673541784286499} -09/20/2021 22:11:54 - INFO - __main__ - Step 35599: {'lr': 0.00019955829504497986, 'samples': 1139168, 'steps': 2224, 'loss/train': 2.721350908279419} -09/20/2021 22:11:54 - INFO - __main__ - Step 35600: {'lr': 0.00019955829504497986, 'samples': 1139200, 'steps': 2224, 'loss/train': 2.063450813293457} -09/20/2021 22:11:55 - INFO - __main__ - Step 35601: {'lr': 0.00019955769595573263, 'samples': 1139232, 'steps': 2225, 'loss/train': 1.9320660829544067} -09/20/2021 22:11:56 - INFO - __main__ - Step 35602: {'lr': 0.00019955769595573263, 'samples': 1139264, 'steps': 2225, 'loss/train': 2.190807342529297} -09/20/2021 22:11:57 - INFO - __main__ - Step 35603: {'lr': 0.00019955769595573263, 'samples': 1139296, 'steps': 2225, 'loss/train': 1.6967413425445557} -09/20/2021 22:11:58 - INFO - __main__ - Step 35604: {'lr': 0.00019955769595573263, 'samples': 1139328, 'steps': 2225, 'loss/train': 2.1599645614624023} -09/20/2021 22:11:58 - INFO - __main__ - Step 35605: {'lr': 0.00019955769595573263, 'samples': 1139360, 'steps': 2225, 'loss/train': 2.4472556114196777} -09/20/2021 22:11:59 - INFO - __main__ - Step 35606: {'lr': 0.00019955769595573263, 'samples': 1139392, 'steps': 2225, 'loss/train': 2.5527050495147705} -09/20/2021 22:12:00 - INFO - __main__ - Step 35607: {'lr': 0.00019955769595573263, 'samples': 1139424, 'steps': 2225, 'loss/train': 2.8001554012298584} -09/20/2021 22:12:01 - INFO - __main__ - Step 35608: {'lr': 0.00019955769595573263, 'samples': 1139456, 'steps': 2225, 'loss/train': 2.1581010818481445} -09/20/2021 22:12:01 - INFO - __main__ - Step 35609: {'lr': 0.00019955769595573263, 'samples': 1139488, 'steps': 2225, 'loss/train': 2.6323094367980957} -09/20/2021 22:12:02 - INFO - __main__ - Step 35610: {'lr': 0.00019955769595573263, 'samples': 1139520, 'steps': 2225, 'loss/train': 2.277576446533203} -09/20/2021 22:12:03 - INFO - __main__ - Step 35611: {'lr': 0.00019955769595573263, 'samples': 1139552, 'steps': 2225, 'loss/train': 2.0000526905059814} -09/20/2021 22:12:04 - INFO - __main__ - Step 35612: {'lr': 0.00019955769595573263, 'samples': 1139584, 'steps': 2225, 'loss/train': 1.8894119262695312} -09/20/2021 22:12:04 - INFO - __main__ - Step 35613: {'lr': 0.00019955769595573263, 'samples': 1139616, 'steps': 2225, 'loss/train': 2.2990849018096924} -09/20/2021 22:12:05 - INFO - __main__ - Step 35614: {'lr': 0.00019955769595573263, 'samples': 1139648, 'steps': 2225, 'loss/train': 1.178667426109314} -09/20/2021 22:12:06 - INFO - __main__ - Step 35615: {'lr': 0.00019955769595573263, 'samples': 1139680, 'steps': 2225, 'loss/train': 1.9761862754821777} -09/20/2021 22:12:07 - INFO - __main__ - Step 35616: {'lr': 0.00019955769595573263, 'samples': 1139712, 'steps': 2225, 'loss/train': 1.9211416244506836} -09/20/2021 22:12:07 - INFO - __main__ - Step 35617: {'lr': 0.0001995570964613856, 'samples': 1139744, 'steps': 2226, 'loss/train': 1.714484691619873} -09/20/2021 22:12:08 - INFO - __main__ - Step 35618: {'lr': 0.0001995570964613856, 'samples': 1139776, 'steps': 2226, 'loss/train': 1.901296615600586} -09/20/2021 22:12:09 - INFO - __main__ - Step 35619: {'lr': 0.0001995570964613856, 'samples': 1139808, 'steps': 2226, 'loss/train': 1.5492080450057983} -09/20/2021 22:12:10 - INFO - __main__ - Step 35620: {'lr': 0.0001995570964613856, 'samples': 1139840, 'steps': 2226, 'loss/train': 1.398612141609192} -09/20/2021 22:12:10 - INFO - __main__ - Step 35621: {'lr': 0.0001995570964613856, 'samples': 1139872, 'steps': 2226, 'loss/train': 1.4532315731048584} -09/20/2021 22:12:12 - INFO - __main__ - Step 35622: {'lr': 0.0001995570964613856, 'samples': 1139904, 'steps': 2226, 'loss/train': 1.9660173654556274} -09/20/2021 22:12:13 - INFO - __main__ - Step 35623: {'lr': 0.0001995570964613856, 'samples': 1139936, 'steps': 2226, 'loss/train': 3.021756649017334} -09/20/2021 22:12:13 - INFO - __main__ - Step 35624: {'lr': 0.0001995570964613856, 'samples': 1139968, 'steps': 2226, 'loss/train': 2.6491620540618896} -09/20/2021 22:12:14 - INFO - __main__ - Step 35625: {'lr': 0.0001995570964613856, 'samples': 1140000, 'steps': 2226, 'loss/train': 2.8557145595550537} -09/20/2021 22:12:15 - INFO - __main__ - Step 35626: {'lr': 0.0001995570964613856, 'samples': 1140032, 'steps': 2226, 'loss/train': 1.780340313911438} -09/20/2021 22:12:16 - INFO - __main__ - Step 35627: {'lr': 0.0001995570964613856, 'samples': 1140064, 'steps': 2226, 'loss/train': 0.6148381233215332} -09/20/2021 22:12:16 - INFO - __main__ - Step 35628: {'lr': 0.0001995570964613856, 'samples': 1140096, 'steps': 2226, 'loss/train': 2.3146767616271973} -09/20/2021 22:12:17 - INFO - __main__ - Step 35629: {'lr': 0.0001995570964613856, 'samples': 1140128, 'steps': 2226, 'loss/train': 2.516026735305786} -09/20/2021 22:12:18 - INFO - __main__ - Step 35630: {'lr': 0.0001995570964613856, 'samples': 1140160, 'steps': 2226, 'loss/train': 2.388453722000122} -09/20/2021 22:12:19 - INFO - __main__ - Step 35631: {'lr': 0.0001995570964613856, 'samples': 1140192, 'steps': 2226, 'loss/train': 1.8104270696640015} -09/20/2021 22:12:19 - INFO - __main__ - Step 35632: {'lr': 0.0001995570964613856, 'samples': 1140224, 'steps': 2226, 'loss/train': 2.7195308208465576} -09/20/2021 22:12:20 - INFO - __main__ - Step 35633: {'lr': 0.00019955649656194107, 'samples': 1140256, 'steps': 2227, 'loss/train': 2.874835729598999} -09/20/2021 22:12:21 - INFO - __main__ - Step 35634: {'lr': 0.00019955649656194107, 'samples': 1140288, 'steps': 2227, 'loss/train': 2.865762710571289} -09/20/2021 22:12:22 - INFO - __main__ - Step 35635: {'lr': 0.00019955649656194107, 'samples': 1140320, 'steps': 2227, 'loss/train': 1.5889371633529663} -09/20/2021 22:12:22 - INFO - __main__ - Step 35636: {'lr': 0.00019955649656194107, 'samples': 1140352, 'steps': 2227, 'loss/train': 2.5906240940093994} -09/20/2021 22:12:23 - INFO - __main__ - Step 35637: {'lr': 0.00019955649656194107, 'samples': 1140384, 'steps': 2227, 'loss/train': 3.278353691101074} -09/20/2021 22:12:24 - INFO - __main__ - Step 35638: {'lr': 0.00019955649656194107, 'samples': 1140416, 'steps': 2227, 'loss/train': 6.108996868133545} -09/20/2021 22:12:25 - INFO - __main__ - Step 35639: {'lr': 0.00019955649656194107, 'samples': 1140448, 'steps': 2227, 'loss/train': 2.082659959793091} -09/20/2021 22:12:25 - INFO - __main__ - Step 35640: {'lr': 0.00019955649656194107, 'samples': 1140480, 'steps': 2227, 'loss/train': 2.3044662475585938} -09/20/2021 22:12:26 - INFO - __main__ - Step 35641: {'lr': 0.00019955649656194107, 'samples': 1140512, 'steps': 2227, 'loss/train': 2.195591688156128} -09/20/2021 22:12:27 - INFO - __main__ - Step 35642: {'lr': 0.00019955649656194107, 'samples': 1140544, 'steps': 2227, 'loss/train': 2.3969569206237793} -09/20/2021 22:12:28 - INFO - __main__ - Step 35643: {'lr': 0.00019955649656194107, 'samples': 1140576, 'steps': 2227, 'loss/train': 0.2361694574356079} -09/20/2021 22:12:28 - INFO - __main__ - Step 35644: {'lr': 0.00019955649656194107, 'samples': 1140608, 'steps': 2227, 'loss/train': 0.4677562117576599} -09/20/2021 22:12:29 - INFO - __main__ - Step 35645: {'lr': 0.00019955649656194107, 'samples': 1140640, 'steps': 2227, 'loss/train': 0.22545428574085236} -09/20/2021 22:12:30 - INFO - __main__ - Step 35646: {'lr': 0.00019955649656194107, 'samples': 1140672, 'steps': 2227, 'loss/train': 1.3030568361282349} -09/20/2021 22:12:31 - INFO - __main__ - Step 35647: {'lr': 0.00019955649656194107, 'samples': 1140704, 'steps': 2227, 'loss/train': 2.308929920196533} -09/20/2021 22:12:31 - INFO - __main__ - Step 35648: {'lr': 0.00019955649656194107, 'samples': 1140736, 'steps': 2227, 'loss/train': 2.501554012298584} -09/20/2021 22:12:32 - INFO - __main__ - Step 35649: {'lr': 0.00019955589625740152, 'samples': 1140768, 'steps': 2228, 'loss/train': 2.12310791015625} -09/20/2021 22:12:33 - INFO - __main__ - Step 35650: {'lr': 0.00019955589625740152, 'samples': 1140800, 'steps': 2228, 'loss/train': 3.3981454372406006} -09/20/2021 22:12:34 - INFO - __main__ - Step 35651: {'lr': 0.00019955589625740152, 'samples': 1140832, 'steps': 2228, 'loss/train': 2.1571035385131836} -09/20/2021 22:12:35 - INFO - __main__ - Step 35652: {'lr': 0.00019955589625740152, 'samples': 1140864, 'steps': 2228, 'loss/train': 3.1723926067352295} -09/20/2021 22:12:36 - INFO - __main__ - Step 35653: {'lr': 0.00019955589625740152, 'samples': 1140896, 'steps': 2228, 'loss/train': 1.9402310848236084} -09/20/2021 22:12:37 - INFO - __main__ - Step 35654: {'lr': 0.00019955589625740152, 'samples': 1140928, 'steps': 2228, 'loss/train': 1.9857406616210938} -09/20/2021 22:12:37 - INFO - __main__ - Step 35655: {'lr': 0.00019955589625740152, 'samples': 1140960, 'steps': 2228, 'loss/train': 1.9552621841430664} -09/20/2021 22:12:38 - INFO - __main__ - Step 35656: {'lr': 0.00019955589625740152, 'samples': 1140992, 'steps': 2228, 'loss/train': 2.784986972808838} -09/20/2021 22:12:39 - INFO - __main__ - Step 35657: {'lr': 0.00019955589625740152, 'samples': 1141024, 'steps': 2228, 'loss/train': 2.3166911602020264} -09/20/2021 22:12:40 - INFO - __main__ - Step 35658: {'lr': 0.00019955589625740152, 'samples': 1141056, 'steps': 2228, 'loss/train': 2.3424007892608643} -09/20/2021 22:12:40 - INFO - __main__ - Step 35659: {'lr': 0.00019955589625740152, 'samples': 1141088, 'steps': 2228, 'loss/train': 2.4566073417663574} -09/20/2021 22:12:41 - INFO - __main__ - Step 35660: {'lr': 0.00019955589625740152, 'samples': 1141120, 'steps': 2228, 'loss/train': 2.389122247695923} -09/20/2021 22:12:42 - INFO - __main__ - Step 35661: {'lr': 0.00019955589625740152, 'samples': 1141152, 'steps': 2228, 'loss/train': 2.870907783508301} -09/20/2021 22:12:43 - INFO - __main__ - Step 35662: {'lr': 0.00019955589625740152, 'samples': 1141184, 'steps': 2228, 'loss/train': 1.9766020774841309} -09/20/2021 22:12:43 - INFO - __main__ - Step 35663: {'lr': 0.00019955589625740152, 'samples': 1141216, 'steps': 2228, 'loss/train': 3.4993906021118164} -09/20/2021 22:12:44 - INFO - __main__ - Step 35664: {'lr': 0.00019955589625740152, 'samples': 1141248, 'steps': 2228, 'loss/train': 2.105740547180176} -09/20/2021 22:12:45 - INFO - __main__ - Step 35665: {'lr': 0.00019955529554776944, 'samples': 1141280, 'steps': 2229, 'loss/train': 2.499236822128296} -09/20/2021 22:12:46 - INFO - __main__ - Step 35666: {'lr': 0.00019955529554776944, 'samples': 1141312, 'steps': 2229, 'loss/train': 2.158372640609741} -09/20/2021 22:12:47 - INFO - __main__ - Step 35667: {'lr': 0.00019955529554776944, 'samples': 1141344, 'steps': 2229, 'loss/train': 0.802234947681427} -09/20/2021 22:12:47 - INFO - __main__ - Step 35668: {'lr': 0.00019955529554776944, 'samples': 1141376, 'steps': 2229, 'loss/train': 2.8618857860565186} -09/20/2021 22:12:48 - INFO - __main__ - Step 35669: {'lr': 0.00019955529554776944, 'samples': 1141408, 'steps': 2229, 'loss/train': 2.010087728500366} -09/20/2021 22:12:49 - INFO - __main__ - Step 35670: {'lr': 0.00019955529554776944, 'samples': 1141440, 'steps': 2229, 'loss/train': 1.7708086967468262} -09/20/2021 22:12:50 - INFO - __main__ - Step 35671: {'lr': 0.00019955529554776944, 'samples': 1141472, 'steps': 2229, 'loss/train': 2.5086913108825684} -09/20/2021 22:12:50 - INFO - __main__ - Step 35672: {'lr': 0.00019955529554776944, 'samples': 1141504, 'steps': 2229, 'loss/train': 2.7256596088409424} -09/20/2021 22:12:51 - INFO - __main__ - Step 35673: {'lr': 0.00019955529554776944, 'samples': 1141536, 'steps': 2229, 'loss/train': 1.8607772588729858} -09/20/2021 22:12:52 - INFO - __main__ - Step 35674: {'lr': 0.00019955529554776944, 'samples': 1141568, 'steps': 2229, 'loss/train': 2.4811272621154785} -09/20/2021 22:12:53 - INFO - __main__ - Step 35675: {'lr': 0.00019955529554776944, 'samples': 1141600, 'steps': 2229, 'loss/train': 2.4567320346832275} -09/20/2021 22:12:53 - INFO - __main__ - Step 35676: {'lr': 0.00019955529554776944, 'samples': 1141632, 'steps': 2229, 'loss/train': 2.0587174892425537} -09/20/2021 22:12:54 - INFO - __main__ - Step 35677: {'lr': 0.00019955529554776944, 'samples': 1141664, 'steps': 2229, 'loss/train': 2.4958534240722656} -09/20/2021 22:12:55 - INFO - __main__ - Step 35678: {'lr': 0.00019955529554776944, 'samples': 1141696, 'steps': 2229, 'loss/train': 0.9808833599090576} -09/20/2021 22:12:56 - INFO - __main__ - Step 35679: {'lr': 0.00019955529554776944, 'samples': 1141728, 'steps': 2229, 'loss/train': 0.74040687084198} -09/20/2021 22:12:56 - INFO - __main__ - Step 35680: {'lr': 0.00019955529554776944, 'samples': 1141760, 'steps': 2229, 'loss/train': 2.116481065750122} -09/20/2021 22:12:57 - INFO - __main__ - Step 35681: {'lr': 0.00019955469443304726, 'samples': 1141792, 'steps': 2230, 'loss/train': 1.646401286125183} -09/20/2021 22:12:58 - INFO - __main__ - Step 35682: {'lr': 0.00019955469443304726, 'samples': 1141824, 'steps': 2230, 'loss/train': 2.530057430267334} -09/20/2021 22:13:00 - INFO - __main__ - Step 35683: {'lr': 0.00019955469443304726, 'samples': 1141856, 'steps': 2230, 'loss/train': 1.91986882686615} -09/20/2021 22:13:00 - INFO - __main__ - Step 35684: {'lr': 0.00019955469443304726, 'samples': 1141888, 'steps': 2230, 'loss/train': 1.87936270236969} -09/20/2021 22:13:01 - INFO - __main__ - Step 35685: {'lr': 0.00019955469443304726, 'samples': 1141920, 'steps': 2230, 'loss/train': 3.8271901607513428} -09/20/2021 22:13:02 - INFO - __main__ - Step 35686: {'lr': 0.00019955469443304726, 'samples': 1141952, 'steps': 2230, 'loss/train': 2.656738042831421} -09/20/2021 22:13:03 - INFO - __main__ - Step 35687: {'lr': 0.00019955469443304726, 'samples': 1141984, 'steps': 2230, 'loss/train': 2.3004987239837646} -09/20/2021 22:13:03 - INFO - __main__ - Step 35688: {'lr': 0.00019955469443304726, 'samples': 1142016, 'steps': 2230, 'loss/train': 2.3315155506134033} -09/20/2021 22:13:04 - INFO - __main__ - Step 35689: {'lr': 0.00019955469443304726, 'samples': 1142048, 'steps': 2230, 'loss/train': 2.313704252243042} -09/20/2021 22:13:05 - INFO - __main__ - Step 35690: {'lr': 0.00019955469443304726, 'samples': 1142080, 'steps': 2230, 'loss/train': 2.2298359870910645} -09/20/2021 22:13:06 - INFO - __main__ - Step 35691: {'lr': 0.00019955469443304726, 'samples': 1142112, 'steps': 2230, 'loss/train': 2.216280460357666} -09/20/2021 22:13:06 - INFO - __main__ - Step 35692: {'lr': 0.00019955469443304726, 'samples': 1142144, 'steps': 2230, 'loss/train': 1.8977398872375488} -09/20/2021 22:13:07 - INFO - __main__ - Step 35693: {'lr': 0.00019955469443304726, 'samples': 1142176, 'steps': 2230, 'loss/train': 0.8498958945274353} -09/20/2021 22:13:08 - INFO - __main__ - Step 35694: {'lr': 0.00019955469443304726, 'samples': 1142208, 'steps': 2230, 'loss/train': 0.7656873464584351} -09/20/2021 22:13:09 - INFO - __main__ - Step 35695: {'lr': 0.00019955469443304726, 'samples': 1142240, 'steps': 2230, 'loss/train': 0.9090569615364075} -09/20/2021 22:13:09 - INFO - __main__ - Step 35696: {'lr': 0.00019955469443304726, 'samples': 1142272, 'steps': 2230, 'loss/train': 0.5871708393096924} -09/20/2021 22:13:10 - INFO - __main__ - Step 35697: {'lr': 0.00019955409291323744, 'samples': 1142304, 'steps': 2231, 'loss/train': 0.4613039195537567} -09/20/2021 22:13:11 - INFO - __main__ - Step 35698: {'lr': 0.00019955409291323744, 'samples': 1142336, 'steps': 2231, 'loss/train': 0.5461248159408569} -09/20/2021 22:13:12 - INFO - __main__ - Step 35699: {'lr': 0.00019955409291323744, 'samples': 1142368, 'steps': 2231, 'loss/train': 0.5708569884300232} -09/20/2021 22:13:12 - INFO - __main__ - Step 35700: {'lr': 0.00019955409291323744, 'samples': 1142400, 'steps': 2231, 'loss/train': 0.5182305574417114} -09/20/2021 22:13:13 - INFO - __main__ - Step 35701: {'lr': 0.00019955409291323744, 'samples': 1142432, 'steps': 2231, 'loss/train': 0.7978324890136719} -09/20/2021 22:13:14 - INFO - __main__ - Step 35702: {'lr': 0.00019955409291323744, 'samples': 1142464, 'steps': 2231, 'loss/train': 2.6097331047058105} -09/20/2021 22:13:15 - INFO - __main__ - Step 35703: {'lr': 0.00019955409291323744, 'samples': 1142496, 'steps': 2231, 'loss/train': 1.4668105840682983} -09/20/2021 22:13:15 - INFO - __main__ - Step 35704: {'lr': 0.00019955409291323744, 'samples': 1142528, 'steps': 2231, 'loss/train': 2.396655797958374} -09/20/2021 22:13:16 - INFO - __main__ - Step 35705: {'lr': 0.00019955409291323744, 'samples': 1142560, 'steps': 2231, 'loss/train': 2.6003758907318115} -09/20/2021 22:13:17 - INFO - __main__ - Step 35706: {'lr': 0.00019955409291323744, 'samples': 1142592, 'steps': 2231, 'loss/train': 1.9678806066513062} -09/20/2021 22:13:18 - INFO - __main__ - Step 35707: {'lr': 0.00019955409291323744, 'samples': 1142624, 'steps': 2231, 'loss/train': 2.6018640995025635} -09/20/2021 22:13:18 - INFO - __main__ - Step 35708: {'lr': 0.00019955409291323744, 'samples': 1142656, 'steps': 2231, 'loss/train': 2.1576147079467773} -09/20/2021 22:13:19 - INFO - __main__ - Step 35709: {'lr': 0.00019955409291323744, 'samples': 1142688, 'steps': 2231, 'loss/train': 1.7648742198944092} -09/20/2021 22:13:20 - INFO - __main__ - Step 35710: {'lr': 0.00019955409291323744, 'samples': 1142720, 'steps': 2231, 'loss/train': 1.9111160039901733} -09/20/2021 22:13:21 - INFO - __main__ - Step 35711: {'lr': 0.00019955409291323744, 'samples': 1142752, 'steps': 2231, 'loss/train': 1.7577942609786987} -09/20/2021 22:13:21 - INFO - __main__ - Step 35712: {'lr': 0.00019955409291323744, 'samples': 1142784, 'steps': 2231, 'loss/train': 2.586286783218384} -09/20/2021 22:13:22 - INFO - __main__ - Step 35713: {'lr': 0.00019955349098834234, 'samples': 1142816, 'steps': 2232, 'loss/train': 2.0858962535858154} -09/20/2021 22:13:23 - INFO - __main__ - Step 35714: {'lr': 0.00019955349098834234, 'samples': 1142848, 'steps': 2232, 'loss/train': 3.0286624431610107} -09/20/2021 22:13:24 - INFO - __main__ - Step 35715: {'lr': 0.00019955349098834234, 'samples': 1142880, 'steps': 2232, 'loss/train': 1.8046575784683228} -09/20/2021 22:13:25 - INFO - __main__ - Step 35716: {'lr': 0.00019955349098834234, 'samples': 1142912, 'steps': 2232, 'loss/train': 0.967968761920929} -09/20/2021 22:13:25 - INFO - __main__ - Step 35717: {'lr': 0.00019955349098834234, 'samples': 1142944, 'steps': 2232, 'loss/train': 2.509571075439453} -09/20/2021 22:13:26 - INFO - __main__ - Step 35718: {'lr': 0.00019955349098834234, 'samples': 1142976, 'steps': 2232, 'loss/train': 2.4953253269195557} -09/20/2021 22:13:27 - INFO - __main__ - Step 35719: {'lr': 0.00019955349098834234, 'samples': 1143008, 'steps': 2232, 'loss/train': 2.4603183269500732} -09/20/2021 22:13:28 - INFO - __main__ - Step 35720: {'lr': 0.00019955349098834234, 'samples': 1143040, 'steps': 2232, 'loss/train': 1.5888290405273438} -09/20/2021 22:13:29 - INFO - __main__ - Step 35721: {'lr': 0.00019955349098834234, 'samples': 1143072, 'steps': 2232, 'loss/train': 1.8793444633483887} -09/20/2021 22:13:30 - INFO - __main__ - Step 35722: {'lr': 0.00019955349098834234, 'samples': 1143104, 'steps': 2232, 'loss/train': 3.359203815460205} -09/20/2021 22:13:30 - INFO - __main__ - Step 35723: {'lr': 0.00019955349098834234, 'samples': 1143136, 'steps': 2232, 'loss/train': 2.6091349124908447} -09/20/2021 22:13:31 - INFO - __main__ - Step 35724: {'lr': 0.00019955349098834234, 'samples': 1143168, 'steps': 2232, 'loss/train': 2.450775384902954} -09/20/2021 22:13:32 - INFO - __main__ - Step 35725: {'lr': 0.00019955349098834234, 'samples': 1143200, 'steps': 2232, 'loss/train': 2.1964707374572754} -09/20/2021 22:13:33 - INFO - __main__ - Step 35726: {'lr': 0.00019955349098834234, 'samples': 1143232, 'steps': 2232, 'loss/train': 2.279637098312378} -09/20/2021 22:13:33 - INFO - __main__ - Step 35727: {'lr': 0.00019955349098834234, 'samples': 1143264, 'steps': 2232, 'loss/train': 2.644962787628174} -09/20/2021 22:13:34 - INFO - __main__ - Step 35728: {'lr': 0.00019955349098834234, 'samples': 1143296, 'steps': 2232, 'loss/train': 0.5920085906982422} -09/20/2021 22:13:35 - INFO - __main__ - Step 35729: {'lr': 0.0001995528886583645, 'samples': 1143328, 'steps': 2233, 'loss/train': 3.2285172939300537} -09/20/2021 22:13:36 - INFO - __main__ - Step 35730: {'lr': 0.0001995528886583645, 'samples': 1143360, 'steps': 2233, 'loss/train': 2.0955898761749268} -09/20/2021 22:13:36 - INFO - __main__ - Step 35731: {'lr': 0.0001995528886583645, 'samples': 1143392, 'steps': 2233, 'loss/train': 2.3314852714538574} -09/20/2021 22:13:37 - INFO - __main__ - Step 35732: {'lr': 0.0001995528886583645, 'samples': 1143424, 'steps': 2233, 'loss/train': 2.4392309188842773} -09/20/2021 22:13:38 - INFO - __main__ - Step 35733: {'lr': 0.0001995528886583645, 'samples': 1143456, 'steps': 2233, 'loss/train': 1.017917275428772} -09/20/2021 22:13:39 - INFO - __main__ - Step 35734: {'lr': 0.0001995528886583645, 'samples': 1143488, 'steps': 2233, 'loss/train': 1.5042612552642822} -09/20/2021 22:13:39 - INFO - __main__ - Step 35735: {'lr': 0.0001995528886583645, 'samples': 1143520, 'steps': 2233, 'loss/train': 2.8716928958892822} -09/20/2021 22:13:40 - INFO - __main__ - Step 35736: {'lr': 0.0001995528886583645, 'samples': 1143552, 'steps': 2233, 'loss/train': 2.8978981971740723} -09/20/2021 22:13:41 - INFO - __main__ - Step 35737: {'lr': 0.0001995528886583645, 'samples': 1143584, 'steps': 2233, 'loss/train': 2.2962899208068848} -09/20/2021 22:13:42 - INFO - __main__ - Step 35738: {'lr': 0.0001995528886583645, 'samples': 1143616, 'steps': 2233, 'loss/train': 2.250877857208252} -09/20/2021 22:13:42 - INFO - __main__ - Step 35739: {'lr': 0.0001995528886583645, 'samples': 1143648, 'steps': 2233, 'loss/train': 0.6755312085151672} -09/20/2021 22:13:43 - INFO - __main__ - Step 35740: {'lr': 0.0001995528886583645, 'samples': 1143680, 'steps': 2233, 'loss/train': 2.8549957275390625} -09/20/2021 22:13:44 - INFO - __main__ - Step 35741: {'lr': 0.0001995528886583645, 'samples': 1143712, 'steps': 2233, 'loss/train': 2.394479990005493} -09/20/2021 22:13:45 - INFO - __main__ - Step 35742: {'lr': 0.0001995528886583645, 'samples': 1143744, 'steps': 2233, 'loss/train': 1.9140703678131104} -09/20/2021 22:13:45 - INFO - __main__ - Step 35743: {'lr': 0.0001995528886583645, 'samples': 1143776, 'steps': 2233, 'loss/train': 1.8305485248565674} -09/20/2021 22:13:46 - INFO - __main__ - Step 35744: {'lr': 0.0001995528886583645, 'samples': 1143808, 'steps': 2233, 'loss/train': 0.9805300235748291} -09/20/2021 22:13:47 - INFO - __main__ - Step 35745: {'lr': 0.00019955228592330638, 'samples': 1143840, 'steps': 2234, 'loss/train': 1.7076114416122437} -09/20/2021 22:13:48 - INFO - __main__ - Step 35746: {'lr': 0.00019955228592330638, 'samples': 1143872, 'steps': 2234, 'loss/train': 1.3823660612106323} -09/20/2021 22:13:49 - INFO - __main__ - Step 35747: {'lr': 0.00019955228592330638, 'samples': 1143904, 'steps': 2234, 'loss/train': 1.8915619850158691} -09/20/2021 22:13:49 - INFO - __main__ - Step 35748: {'lr': 0.00019955228592330638, 'samples': 1143936, 'steps': 2234, 'loss/train': 1.6426656246185303} -09/20/2021 22:13:50 - INFO - __main__ - Step 35749: {'lr': 0.00019955228592330638, 'samples': 1143968, 'steps': 2234, 'loss/train': 1.8515971899032593} -09/20/2021 22:13:52 - INFO - __main__ - Step 35750: {'lr': 0.00019955228592330638, 'samples': 1144000, 'steps': 2234, 'loss/train': 2.7646827697753906} -09/20/2021 22:13:52 - INFO - __main__ - Step 35751: {'lr': 0.00019955228592330638, 'samples': 1144032, 'steps': 2234, 'loss/train': 2.8243534564971924} -09/20/2021 22:13:53 - INFO - __main__ - Step 35752: {'lr': 0.00019955228592330638, 'samples': 1144064, 'steps': 2234, 'loss/train': 2.2853081226348877} -09/20/2021 22:13:54 - INFO - __main__ - Step 35753: {'lr': 0.00019955228592330638, 'samples': 1144096, 'steps': 2234, 'loss/train': 1.9741325378417969} -09/20/2021 22:13:55 - INFO - __main__ - Step 35754: {'lr': 0.00019955228592330638, 'samples': 1144128, 'steps': 2234, 'loss/train': 2.08825421333313} -09/20/2021 22:13:55 - INFO - __main__ - Step 35755: {'lr': 0.00019955228592330638, 'samples': 1144160, 'steps': 2234, 'loss/train': 1.2748290300369263} -09/20/2021 22:13:56 - INFO - __main__ - Step 35756: {'lr': 0.00019955228592330638, 'samples': 1144192, 'steps': 2234, 'loss/train': 1.7266157865524292} -09/20/2021 22:13:57 - INFO - __main__ - Step 35757: {'lr': 0.00019955228592330638, 'samples': 1144224, 'steps': 2234, 'loss/train': 1.0885274410247803} -09/20/2021 22:13:58 - INFO - __main__ - Step 35758: {'lr': 0.00019955228592330638, 'samples': 1144256, 'steps': 2234, 'loss/train': 2.3648993968963623} -09/20/2021 22:13:58 - INFO - __main__ - Step 35759: {'lr': 0.00019955228592330638, 'samples': 1144288, 'steps': 2234, 'loss/train': 1.835855484008789} -09/20/2021 22:13:59 - INFO - __main__ - Step 35760: {'lr': 0.00019955228592330638, 'samples': 1144320, 'steps': 2234, 'loss/train': 2.4707560539245605} -09/20/2021 22:14:00 - INFO - __main__ - Step 35761: {'lr': 0.00019955168278317032, 'samples': 1144352, 'steps': 2235, 'loss/train': 0.3683721125125885} -09/20/2021 22:14:01 - INFO - __main__ - Step 35762: {'lr': 0.00019955168278317032, 'samples': 1144384, 'steps': 2235, 'loss/train': 0.20756927132606506} -09/20/2021 22:14:01 - INFO - __main__ - Step 35763: {'lr': 0.00019955168278317032, 'samples': 1144416, 'steps': 2235, 'loss/train': 0.16659726202487946} -09/20/2021 22:14:02 - INFO - __main__ - Step 35764: {'lr': 0.00019955168278317032, 'samples': 1144448, 'steps': 2235, 'loss/train': 0.35402312874794006} -09/20/2021 22:14:03 - INFO - __main__ - Step 35765: {'lr': 0.00019955168278317032, 'samples': 1144480, 'steps': 2235, 'loss/train': 1.811499834060669} -09/20/2021 22:14:04 - INFO - __main__ - Step 35766: {'lr': 0.00019955168278317032, 'samples': 1144512, 'steps': 2235, 'loss/train': 2.4184985160827637} -09/20/2021 22:14:04 - INFO - __main__ - Step 35767: {'lr': 0.00019955168278317032, 'samples': 1144544, 'steps': 2235, 'loss/train': 3.228558301925659} -09/20/2021 22:14:05 - INFO - __main__ - Step 35768: {'lr': 0.00019955168278317032, 'samples': 1144576, 'steps': 2235, 'loss/train': 1.9510847330093384} -09/20/2021 22:14:06 - INFO - __main__ - Step 35769: {'lr': 0.00019955168278317032, 'samples': 1144608, 'steps': 2235, 'loss/train': 2.7182321548461914} -09/20/2021 22:14:07 - INFO - __main__ - Step 35770: {'lr': 0.00019955168278317032, 'samples': 1144640, 'steps': 2235, 'loss/train': 1.7949849367141724} -09/20/2021 22:14:07 - INFO - __main__ - Step 35771: {'lr': 0.00019955168278317032, 'samples': 1144672, 'steps': 2235, 'loss/train': 2.4083807468414307} -09/20/2021 22:14:08 - INFO - __main__ - Step 35772: {'lr': 0.00019955168278317032, 'samples': 1144704, 'steps': 2235, 'loss/train': 2.090956449508667} -09/20/2021 22:14:09 - INFO - __main__ - Step 35773: {'lr': 0.00019955168278317032, 'samples': 1144736, 'steps': 2235, 'loss/train': 1.7724380493164062} -09/20/2021 22:14:10 - INFO - __main__ - Step 35774: {'lr': 0.00019955168278317032, 'samples': 1144768, 'steps': 2235, 'loss/train': 2.5439789295196533} -09/20/2021 22:14:10 - INFO - __main__ - Step 35775: {'lr': 0.00019955168278317032, 'samples': 1144800, 'steps': 2235, 'loss/train': 2.2931649684906006} -09/20/2021 22:14:11 - INFO - __main__ - Step 35776: {'lr': 0.00019955168278317032, 'samples': 1144832, 'steps': 2235, 'loss/train': 0.9944903254508972} -09/20/2021 22:14:12 - INFO - __main__ - Step 35777: {'lr': 0.0001995510792379589, 'samples': 1144864, 'steps': 2236, 'loss/train': 1.640394687652588} -09/20/2021 22:14:13 - INFO - __main__ - Step 35778: {'lr': 0.0001995510792379589, 'samples': 1144896, 'steps': 2236, 'loss/train': 2.593717098236084} -09/20/2021 22:14:14 - INFO - __main__ - Step 35779: {'lr': 0.0001995510792379589, 'samples': 1144928, 'steps': 2236, 'loss/train': 3.608654022216797} -09/20/2021 22:14:14 - INFO - __main__ - Step 35780: {'lr': 0.0001995510792379589, 'samples': 1144960, 'steps': 2236, 'loss/train': 3.0194075107574463} -09/20/2021 22:14:16 - INFO - __main__ - Step 35781: {'lr': 0.0001995510792379589, 'samples': 1144992, 'steps': 2236, 'loss/train': 2.2017338275909424} -09/20/2021 22:14:16 - INFO - __main__ - Step 35782: {'lr': 0.0001995510792379589, 'samples': 1145024, 'steps': 2236, 'loss/train': 1.8828853368759155} -09/20/2021 22:14:17 - INFO - __main__ - Step 35783: {'lr': 0.0001995510792379589, 'samples': 1145056, 'steps': 2236, 'loss/train': 1.7152655124664307} -09/20/2021 22:14:18 - INFO - __main__ - Step 35784: {'lr': 0.0001995510792379589, 'samples': 1145088, 'steps': 2236, 'loss/train': 2.0523521900177} -09/20/2021 22:14:19 - INFO - __main__ - Step 35785: {'lr': 0.0001995510792379589, 'samples': 1145120, 'steps': 2236, 'loss/train': 2.0390069484710693} -09/20/2021 22:14:19 - INFO - __main__ - Step 35786: {'lr': 0.0001995510792379589, 'samples': 1145152, 'steps': 2236, 'loss/train': 2.1073157787323} -09/20/2021 22:14:20 - INFO - __main__ - Step 35787: {'lr': 0.0001995510792379589, 'samples': 1145184, 'steps': 2236, 'loss/train': 3.7070460319519043} -09/20/2021 22:14:21 - INFO - __main__ - Step 35788: {'lr': 0.0001995510792379589, 'samples': 1145216, 'steps': 2236, 'loss/train': 1.4302228689193726} -09/20/2021 22:14:22 - INFO - __main__ - Step 35789: {'lr': 0.0001995510792379589, 'samples': 1145248, 'steps': 2236, 'loss/train': 2.3370869159698486} -09/20/2021 22:14:22 - INFO - __main__ - Step 35790: {'lr': 0.0001995510792379589, 'samples': 1145280, 'steps': 2236, 'loss/train': 1.9691543579101562} -09/20/2021 22:14:23 - INFO - __main__ - Step 35791: {'lr': 0.0001995510792379589, 'samples': 1145312, 'steps': 2236, 'loss/train': 2.417966842651367} -09/20/2021 22:14:24 - INFO - __main__ - Step 35792: {'lr': 0.0001995510792379589, 'samples': 1145344, 'steps': 2236, 'loss/train': 1.8062485456466675} -09/20/2021 22:14:25 - INFO - __main__ - Step 35793: {'lr': 0.00019955047528767453, 'samples': 1145376, 'steps': 2237, 'loss/train': 1.8444373607635498} -09/20/2021 22:14:26 - INFO - __main__ - Step 35794: {'lr': 0.00019955047528767453, 'samples': 1145408, 'steps': 2237, 'loss/train': 2.8230979442596436} -09/20/2021 22:14:26 - INFO - __main__ - Step 35795: {'lr': 0.00019955047528767453, 'samples': 1145440, 'steps': 2237, 'loss/train': 2.4168055057525635} -09/20/2021 22:14:27 - INFO - __main__ - Step 35796: {'lr': 0.00019955047528767453, 'samples': 1145472, 'steps': 2237, 'loss/train': 2.33063006401062} -09/20/2021 22:14:28 - INFO - __main__ - Step 35797: {'lr': 0.00019955047528767453, 'samples': 1145504, 'steps': 2237, 'loss/train': 2.0781188011169434} -09/20/2021 22:14:29 - INFO - __main__ - Step 35798: {'lr': 0.00019955047528767453, 'samples': 1145536, 'steps': 2237, 'loss/train': 2.662353992462158} -09/20/2021 22:14:29 - INFO - __main__ - Step 35799: {'lr': 0.00019955047528767453, 'samples': 1145568, 'steps': 2237, 'loss/train': 2.3836052417755127} -09/20/2021 22:14:30 - INFO - __main__ - Step 35800: {'lr': 0.00019955047528767453, 'samples': 1145600, 'steps': 2237, 'loss/train': 2.1356394290924072} -09/20/2021 22:14:31 - INFO - __main__ - Step 35801: {'lr': 0.00019955047528767453, 'samples': 1145632, 'steps': 2237, 'loss/train': 1.3926053047180176} -09/20/2021 22:14:32 - INFO - __main__ - Step 35802: {'lr': 0.00019955047528767453, 'samples': 1145664, 'steps': 2237, 'loss/train': 2.258060932159424} -09/20/2021 22:14:32 - INFO - __main__ - Step 35803: {'lr': 0.00019955047528767453, 'samples': 1145696, 'steps': 2237, 'loss/train': 2.5999083518981934} -09/20/2021 22:14:33 - INFO - __main__ - Step 35804: {'lr': 0.00019955047528767453, 'samples': 1145728, 'steps': 2237, 'loss/train': 3.431934356689453} -09/20/2021 22:14:34 - INFO - __main__ - Step 35805: {'lr': 0.00019955047528767453, 'samples': 1145760, 'steps': 2237, 'loss/train': 1.9690675735473633} -09/20/2021 22:14:35 - INFO - __main__ - Step 35806: {'lr': 0.00019955047528767453, 'samples': 1145792, 'steps': 2237, 'loss/train': 2.314631223678589} -09/20/2021 22:14:35 - INFO - __main__ - Step 35807: {'lr': 0.00019955047528767453, 'samples': 1145824, 'steps': 2237, 'loss/train': 2.0021655559539795} -09/20/2021 22:14:36 - INFO - __main__ - Step 35808: {'lr': 0.00019955047528767453, 'samples': 1145856, 'steps': 2237, 'loss/train': 2.3302550315856934} -09/20/2021 22:14:37 - INFO - __main__ - Step 35809: {'lr': 0.00019954987093231963, 'samples': 1145888, 'steps': 2238, 'loss/train': 1.953005075454712} -09/20/2021 22:14:38 - INFO - __main__ - Step 35810: {'lr': 0.00019954987093231963, 'samples': 1145920, 'steps': 2238, 'loss/train': 2.438185930252075} -09/20/2021 22:14:38 - INFO - __main__ - Step 35811: {'lr': 0.00019954987093231963, 'samples': 1145952, 'steps': 2238, 'loss/train': 1.9207147359848022} -09/20/2021 22:14:39 - INFO - __main__ - Step 35812: {'lr': 0.00019954987093231963, 'samples': 1145984, 'steps': 2238, 'loss/train': 2.326277494430542} -09/20/2021 22:14:40 - INFO - __main__ - Step 35813: {'lr': 0.00019954987093231963, 'samples': 1146016, 'steps': 2238, 'loss/train': 1.5374197959899902} -09/20/2021 22:14:41 - INFO - __main__ - Step 35814: {'lr': 0.00019954987093231963, 'samples': 1146048, 'steps': 2238, 'loss/train': 1.9116965532302856} -09/20/2021 22:14:42 - INFO - __main__ - Step 35815: {'lr': 0.00019954987093231963, 'samples': 1146080, 'steps': 2238, 'loss/train': 2.145076274871826} -09/20/2021 22:14:43 - INFO - __main__ - Step 35816: {'lr': 0.00019954987093231963, 'samples': 1146112, 'steps': 2238, 'loss/train': 2.02168869972229} -09/20/2021 22:14:43 - INFO - __main__ - Step 35817: {'lr': 0.00019954987093231963, 'samples': 1146144, 'steps': 2238, 'loss/train': 1.5847026109695435} -09/20/2021 22:14:44 - INFO - __main__ - Step 35818: {'lr': 0.00019954987093231963, 'samples': 1146176, 'steps': 2238, 'loss/train': 2.169010877609253} -09/20/2021 22:14:45 - INFO - __main__ - Step 35819: {'lr': 0.00019954987093231963, 'samples': 1146208, 'steps': 2238, 'loss/train': 2.751472234725952} -09/20/2021 22:14:46 - INFO - __main__ - Step 35820: {'lr': 0.00019954987093231963, 'samples': 1146240, 'steps': 2238, 'loss/train': 2.725717067718506} -09/20/2021 22:14:46 - INFO - __main__ - Step 35821: {'lr': 0.00019954987093231963, 'samples': 1146272, 'steps': 2238, 'loss/train': 2.0313520431518555} -09/20/2021 22:14:47 - INFO - __main__ - Step 35822: {'lr': 0.00019954987093231963, 'samples': 1146304, 'steps': 2238, 'loss/train': 2.279945135116577} -09/20/2021 22:14:48 - INFO - __main__ - Step 35823: {'lr': 0.00019954987093231963, 'samples': 1146336, 'steps': 2238, 'loss/train': 3.1742305755615234} -09/20/2021 22:14:49 - INFO - __main__ - Step 35824: {'lr': 0.00019954987093231963, 'samples': 1146368, 'steps': 2238, 'loss/train': 1.381105661392212} -09/20/2021 22:14:50 - INFO - __main__ - Step 35825: {'lr': 0.00019954926617189674, 'samples': 1146400, 'steps': 2239, 'loss/train': 1.8440840244293213} -09/20/2021 22:14:50 - INFO - __main__ - Step 35826: {'lr': 0.00019954926617189674, 'samples': 1146432, 'steps': 2239, 'loss/train': 2.600338935852051} -09/20/2021 22:14:51 - INFO - __main__ - Step 35827: {'lr': 0.00019954926617189674, 'samples': 1146464, 'steps': 2239, 'loss/train': 2.6422433853149414} -09/20/2021 22:14:52 - INFO - __main__ - Step 35828: {'lr': 0.00019954926617189674, 'samples': 1146496, 'steps': 2239, 'loss/train': 1.4560513496398926} -09/20/2021 22:14:53 - INFO - __main__ - Step 35829: {'lr': 0.00019954926617189674, 'samples': 1146528, 'steps': 2239, 'loss/train': 2.081021547317505} -09/20/2021 22:14:53 - INFO - __main__ - Step 35830: {'lr': 0.00019954926617189674, 'samples': 1146560, 'steps': 2239, 'loss/train': 2.682708501815796} -09/20/2021 22:14:54 - INFO - __main__ - Step 35831: {'lr': 0.00019954926617189674, 'samples': 1146592, 'steps': 2239, 'loss/train': 1.9008665084838867} -09/20/2021 22:14:55 - INFO - __main__ - Step 35832: {'lr': 0.00019954926617189674, 'samples': 1146624, 'steps': 2239, 'loss/train': 2.10785174369812} -09/20/2021 22:14:56 - INFO - __main__ - Step 35833: {'lr': 0.00019954926617189674, 'samples': 1146656, 'steps': 2239, 'loss/train': 3.1283459663391113} -09/20/2021 22:14:56 - INFO - __main__ - Step 35834: {'lr': 0.00019954926617189674, 'samples': 1146688, 'steps': 2239, 'loss/train': 1.6001402139663696} -09/20/2021 22:14:57 - INFO - __main__ - Step 35835: {'lr': 0.00019954926617189674, 'samples': 1146720, 'steps': 2239, 'loss/train': 2.190485715866089} -09/20/2021 22:14:58 - INFO - __main__ - Step 35836: {'lr': 0.00019954926617189674, 'samples': 1146752, 'steps': 2239, 'loss/train': 2.3864948749542236} -09/20/2021 22:14:59 - INFO - __main__ - Step 35837: {'lr': 0.00019954926617189674, 'samples': 1146784, 'steps': 2239, 'loss/train': 2.3368752002716064} -09/20/2021 22:14:59 - INFO - __main__ - Step 35838: {'lr': 0.00019954926617189674, 'samples': 1146816, 'steps': 2239, 'loss/train': 2.768463373184204} -09/20/2021 22:15:00 - INFO - __main__ - Step 35839: {'lr': 0.00019954926617189674, 'samples': 1146848, 'steps': 2239, 'loss/train': 2.3440284729003906} -09/20/2021 22:15:01 - INFO - __main__ - Step 35840: {'lr': 0.00019954926617189674, 'samples': 1146880, 'steps': 2239, 'loss/train': 2.5410261154174805} -09/20/2021 22:15:02 - INFO - __main__ - Step 35841: {'lr': 0.0001995486610064082, 'samples': 1146912, 'steps': 2240, 'loss/train': 1.9339652061462402} -09/20/2021 22:15:02 - INFO - __main__ - Step 35842: {'lr': 0.0001995486610064082, 'samples': 1146944, 'steps': 2240, 'loss/train': 1.9559402465820312} -09/20/2021 22:15:03 - INFO - __main__ - Step 35843: {'lr': 0.0001995486610064082, 'samples': 1146976, 'steps': 2240, 'loss/train': 2.2052440643310547} -09/20/2021 22:15:04 - INFO - __main__ - Step 35844: {'lr': 0.0001995486610064082, 'samples': 1147008, 'steps': 2240, 'loss/train': 2.3090367317199707} -09/20/2021 22:15:05 - INFO - __main__ - Step 35845: {'lr': 0.0001995486610064082, 'samples': 1147040, 'steps': 2240, 'loss/train': 1.4124078750610352} -09/20/2021 22:15:06 - INFO - __main__ - Step 35846: {'lr': 0.0001995486610064082, 'samples': 1147072, 'steps': 2240, 'loss/train': 1.5491001605987549} -09/20/2021 22:15:07 - INFO - __main__ - Step 35847: {'lr': 0.0001995486610064082, 'samples': 1147104, 'steps': 2240, 'loss/train': 1.9087833166122437} -09/20/2021 22:15:07 - INFO - __main__ - Step 35848: {'lr': 0.0001995486610064082, 'samples': 1147136, 'steps': 2240, 'loss/train': 2.1708831787109375} -09/20/2021 22:15:08 - INFO - __main__ - Step 35849: {'lr': 0.0001995486610064082, 'samples': 1147168, 'steps': 2240, 'loss/train': 2.514335870742798} -09/20/2021 22:15:09 - INFO - __main__ - Step 35850: {'lr': 0.0001995486610064082, 'samples': 1147200, 'steps': 2240, 'loss/train': 2.6754941940307617} -09/20/2021 22:15:10 - INFO - __main__ - Step 35851: {'lr': 0.0001995486610064082, 'samples': 1147232, 'steps': 2240, 'loss/train': 3.19071102142334} -09/20/2021 22:15:10 - INFO - __main__ - Step 35852: {'lr': 0.0001995486610064082, 'samples': 1147264, 'steps': 2240, 'loss/train': 3.1571781635284424} -09/20/2021 22:15:11 - INFO - __main__ - Step 35853: {'lr': 0.0001995486610064082, 'samples': 1147296, 'steps': 2240, 'loss/train': 1.73789644241333} -09/20/2021 22:15:12 - INFO - __main__ - Step 35854: {'lr': 0.0001995486610064082, 'samples': 1147328, 'steps': 2240, 'loss/train': 2.4131195545196533} -09/20/2021 22:15:13 - INFO - __main__ - Step 35855: {'lr': 0.0001995486610064082, 'samples': 1147360, 'steps': 2240, 'loss/train': 2.4870872497558594} -09/20/2021 22:15:13 - INFO - __main__ - Step 35856: {'lr': 0.0001995486610064082, 'samples': 1147392, 'steps': 2240, 'loss/train': 2.1264615058898926} -09/20/2021 22:15:14 - INFO - __main__ - Step 35857: {'lr': 0.00019954805543585658, 'samples': 1147424, 'steps': 2241, 'loss/train': 2.26157283782959} -09/20/2021 22:15:15 - INFO - __main__ - Step 35858: {'lr': 0.00019954805543585658, 'samples': 1147456, 'steps': 2241, 'loss/train': 3.1981372833251953} -09/20/2021 22:15:16 - INFO - __main__ - Step 35859: {'lr': 0.00019954805543585658, 'samples': 1147488, 'steps': 2241, 'loss/train': 1.4979863166809082} -09/20/2021 22:15:17 - INFO - __main__ - Step 35860: {'lr': 0.00019954805543585658, 'samples': 1147520, 'steps': 2241, 'loss/train': 1.6677441596984863} -09/20/2021 22:15:17 - INFO - __main__ - Step 35861: {'lr': 0.00019954805543585658, 'samples': 1147552, 'steps': 2241, 'loss/train': 2.0972843170166016} -09/20/2021 22:15:18 - INFO - __main__ - Step 35862: {'lr': 0.00019954805543585658, 'samples': 1147584, 'steps': 2241, 'loss/train': 2.145719528198242} -09/20/2021 22:15:19 - INFO - __main__ - Step 35863: {'lr': 0.00019954805543585658, 'samples': 1147616, 'steps': 2241, 'loss/train': 1.9568105936050415} -09/20/2021 22:15:20 - INFO - __main__ - Step 35864: {'lr': 0.00019954805543585658, 'samples': 1147648, 'steps': 2241, 'loss/train': 2.4763858318328857} -09/20/2021 22:15:20 - INFO - __main__ - Step 35865: {'lr': 0.00019954805543585658, 'samples': 1147680, 'steps': 2241, 'loss/train': 2.6144192218780518} -09/20/2021 22:15:21 - INFO - __main__ - Step 35866: {'lr': 0.00019954805543585658, 'samples': 1147712, 'steps': 2241, 'loss/train': 1.582417368888855} -09/20/2021 22:15:22 - INFO - __main__ - Step 35867: {'lr': 0.00019954805543585658, 'samples': 1147744, 'steps': 2241, 'loss/train': 3.062105417251587} -09/20/2021 22:15:23 - INFO - __main__ - Step 35868: {'lr': 0.00019954805543585658, 'samples': 1147776, 'steps': 2241, 'loss/train': 2.71834135055542} -09/20/2021 22:15:23 - INFO - __main__ - Step 35869: {'lr': 0.00019954805543585658, 'samples': 1147808, 'steps': 2241, 'loss/train': 2.8791568279266357} -09/20/2021 22:15:24 - INFO - __main__ - Step 35870: {'lr': 0.00019954805543585658, 'samples': 1147840, 'steps': 2241, 'loss/train': 1.8940907716751099} -09/20/2021 22:15:25 - INFO - __main__ - Step 35871: {'lr': 0.00019954805543585658, 'samples': 1147872, 'steps': 2241, 'loss/train': 1.7956997156143188} -09/20/2021 22:15:26 - INFO - __main__ - Step 35872: {'lr': 0.00019954805543585658, 'samples': 1147904, 'steps': 2241, 'loss/train': 1.1009169816970825} -09/20/2021 22:15:26 - INFO - __main__ - Step 35873: {'lr': 0.00019954744946024434, 'samples': 1147936, 'steps': 2242, 'loss/train': 2.839916467666626} -09/20/2021 22:15:27 - INFO - __main__ - Step 35874: {'lr': 0.00019954744946024434, 'samples': 1147968, 'steps': 2242, 'loss/train': 1.5744794607162476} -09/20/2021 22:15:29 - INFO - __main__ - Step 35875: {'lr': 0.00019954744946024434, 'samples': 1148000, 'steps': 2242, 'loss/train': 2.3456411361694336} -09/20/2021 22:15:29 - INFO - __main__ - Step 35876: {'lr': 0.00019954744946024434, 'samples': 1148032, 'steps': 2242, 'loss/train': 1.4165396690368652} -09/20/2021 22:15:30 - INFO - __main__ - Step 35877: {'lr': 0.00019954744946024434, 'samples': 1148064, 'steps': 2242, 'loss/train': 2.218515157699585} -09/20/2021 22:15:31 - INFO - __main__ - Step 35878: {'lr': 0.00019954744946024434, 'samples': 1148096, 'steps': 2242, 'loss/train': 1.8000675439834595} -09/20/2021 22:15:32 - INFO - __main__ - Step 35879: {'lr': 0.00019954744946024434, 'samples': 1148128, 'steps': 2242, 'loss/train': 2.0105583667755127} -09/20/2021 22:15:32 - INFO - __main__ - Step 35880: {'lr': 0.00019954744946024434, 'samples': 1148160, 'steps': 2242, 'loss/train': 1.849459171295166} -09/20/2021 22:15:33 - INFO - __main__ - Step 35881: {'lr': 0.00019954744946024434, 'samples': 1148192, 'steps': 2242, 'loss/train': 2.2923948764801025} -09/20/2021 22:15:34 - INFO - __main__ - Step 35882: {'lr': 0.00019954744946024434, 'samples': 1148224, 'steps': 2242, 'loss/train': 2.3512370586395264} -09/20/2021 22:15:35 - INFO - __main__ - Step 35883: {'lr': 0.00019954744946024434, 'samples': 1148256, 'steps': 2242, 'loss/train': 1.9569653272628784} -09/20/2021 22:15:35 - INFO - __main__ - Step 35884: {'lr': 0.00019954744946024434, 'samples': 1148288, 'steps': 2242, 'loss/train': 1.6239181756973267} -09/20/2021 22:15:36 - INFO - __main__ - Step 35885: {'lr': 0.00019954744946024434, 'samples': 1148320, 'steps': 2242, 'loss/train': 2.452874183654785} -09/20/2021 22:15:37 - INFO - __main__ - Step 35886: {'lr': 0.00019954744946024434, 'samples': 1148352, 'steps': 2242, 'loss/train': 2.76882266998291} -09/20/2021 22:15:38 - INFO - __main__ - Step 35887: {'lr': 0.00019954744946024434, 'samples': 1148384, 'steps': 2242, 'loss/train': 2.258192539215088} -09/20/2021 22:15:38 - INFO - __main__ - Step 35888: {'lr': 0.00019954744946024434, 'samples': 1148416, 'steps': 2242, 'loss/train': 2.638921022415161} -09/20/2021 22:15:39 - INFO - __main__ - Step 35889: {'lr': 0.0001995468430795739, 'samples': 1148448, 'steps': 2243, 'loss/train': 2.570420026779175} -09/20/2021 22:15:40 - INFO - __main__ - Step 35890: {'lr': 0.0001995468430795739, 'samples': 1148480, 'steps': 2243, 'loss/train': 1.9320755004882812} -09/20/2021 22:15:41 - INFO - __main__ - Step 35891: {'lr': 0.0001995468430795739, 'samples': 1148512, 'steps': 2243, 'loss/train': 2.849597215652466} -09/20/2021 22:15:41 - INFO - __main__ - Step 35892: {'lr': 0.0001995468430795739, 'samples': 1148544, 'steps': 2243, 'loss/train': 2.0490458011627197} -09/20/2021 22:15:42 - INFO - __main__ - Step 35893: {'lr': 0.0001995468430795739, 'samples': 1148576, 'steps': 2243, 'loss/train': 1.456010103225708} -09/20/2021 22:15:43 - INFO - __main__ - Step 35894: {'lr': 0.0001995468430795739, 'samples': 1148608, 'steps': 2243, 'loss/train': 2.823866605758667} -09/20/2021 22:15:44 - INFO - __main__ - Step 35895: {'lr': 0.0001995468430795739, 'samples': 1148640, 'steps': 2243, 'loss/train': 1.5564533472061157} -09/20/2021 22:15:44 - INFO - __main__ - Step 35896: {'lr': 0.0001995468430795739, 'samples': 1148672, 'steps': 2243, 'loss/train': 0.7384235262870789} -09/20/2021 22:15:45 - INFO - __main__ - Step 35897: {'lr': 0.0001995468430795739, 'samples': 1148704, 'steps': 2243, 'loss/train': 1.928403377532959} -09/20/2021 22:15:46 - INFO - __main__ - Step 35898: {'lr': 0.0001995468430795739, 'samples': 1148736, 'steps': 2243, 'loss/train': 2.2254860401153564} -09/20/2021 22:15:47 - INFO - __main__ - Step 35899: {'lr': 0.0001995468430795739, 'samples': 1148768, 'steps': 2243, 'loss/train': 2.9925174713134766} -09/20/2021 22:15:47 - INFO - __main__ - Step 35900: {'lr': 0.0001995468430795739, 'samples': 1148800, 'steps': 2243, 'loss/train': 2.16066312789917} -09/20/2021 22:15:48 - INFO - __main__ - Step 35901: {'lr': 0.0001995468430795739, 'samples': 1148832, 'steps': 2243, 'loss/train': 3.0426669120788574} -09/20/2021 22:15:49 - INFO - __main__ - Step 35902: {'lr': 0.0001995468430795739, 'samples': 1148864, 'steps': 2243, 'loss/train': 2.0359554290771484} -09/20/2021 22:15:50 - INFO - __main__ - Step 35903: {'lr': 0.0001995468430795739, 'samples': 1148896, 'steps': 2243, 'loss/train': 2.3056881427764893} -09/20/2021 22:15:50 - INFO - __main__ - Step 35904: {'lr': 0.0001995468430795739, 'samples': 1148928, 'steps': 2243, 'loss/train': 2.5098226070404053} -09/20/2021 22:15:52 - INFO - __main__ - Step 35905: {'lr': 0.00019954623629384773, 'samples': 1148960, 'steps': 2244, 'loss/train': 2.1928012371063232} -09/20/2021 22:15:53 - INFO - __main__ - Step 35906: {'lr': 0.00019954623629384773, 'samples': 1148992, 'steps': 2244, 'loss/train': 2.1412012577056885} -09/20/2021 22:15:54 - INFO - __main__ - Step 35907: {'lr': 0.00019954623629384773, 'samples': 1149024, 'steps': 2244, 'loss/train': 2.167433023452759} -09/20/2021 22:15:55 - INFO - __main__ - Step 35908: {'lr': 0.00019954623629384773, 'samples': 1149056, 'steps': 2244, 'loss/train': 2.5383143424987793} -09/20/2021 22:15:55 - INFO - __main__ - Step 35909: {'lr': 0.00019954623629384773, 'samples': 1149088, 'steps': 2244, 'loss/train': 2.8354573249816895} -09/20/2021 22:15:56 - INFO - __main__ - Step 35910: {'lr': 0.00019954623629384773, 'samples': 1149120, 'steps': 2244, 'loss/train': 2.8521835803985596} -09/20/2021 22:15:57 - INFO - __main__ - Step 35911: {'lr': 0.00019954623629384773, 'samples': 1149152, 'steps': 2244, 'loss/train': 2.2919392585754395} -09/20/2021 22:15:58 - INFO - __main__ - Step 35912: {'lr': 0.00019954623629384773, 'samples': 1149184, 'steps': 2244, 'loss/train': 1.8275023698806763} -09/20/2021 22:15:58 - INFO - __main__ - Step 35913: {'lr': 0.00019954623629384773, 'samples': 1149216, 'steps': 2244, 'loss/train': 2.900895357131958} -09/20/2021 22:15:59 - INFO - __main__ - Step 35914: {'lr': 0.00019954623629384773, 'samples': 1149248, 'steps': 2244, 'loss/train': 1.862916111946106} -09/20/2021 22:16:00 - INFO - __main__ - Step 35915: {'lr': 0.00019954623629384773, 'samples': 1149280, 'steps': 2244, 'loss/train': 1.1355372667312622} -09/20/2021 22:16:01 - INFO - __main__ - Step 35916: {'lr': 0.00019954623629384773, 'samples': 1149312, 'steps': 2244, 'loss/train': 2.7716004848480225} -09/20/2021 22:16:01 - INFO - __main__ - Step 35917: {'lr': 0.00019954623629384773, 'samples': 1149344, 'steps': 2244, 'loss/train': 1.989682912826538} -09/20/2021 22:16:02 - INFO - __main__ - Step 35918: {'lr': 0.00019954623629384773, 'samples': 1149376, 'steps': 2244, 'loss/train': 2.214116096496582} -09/20/2021 22:16:03 - INFO - __main__ - Step 35919: {'lr': 0.00019954623629384773, 'samples': 1149408, 'steps': 2244, 'loss/train': 1.9788801670074463} -09/20/2021 22:16:04 - INFO - __main__ - Step 35920: {'lr': 0.00019954623629384773, 'samples': 1149440, 'steps': 2244, 'loss/train': 2.9056568145751953} -09/20/2021 22:16:05 - INFO - __main__ - Step 35921: {'lr': 0.0001995456291030683, 'samples': 1149472, 'steps': 2245, 'loss/train': 1.694185495376587} -09/20/2021 22:16:05 - INFO - __main__ - Step 35922: {'lr': 0.0001995456291030683, 'samples': 1149504, 'steps': 2245, 'loss/train': 2.2013065814971924} -09/20/2021 22:16:06 - INFO - __main__ - Step 35923: {'lr': 0.0001995456291030683, 'samples': 1149536, 'steps': 2245, 'loss/train': 1.3175082206726074} -09/20/2021 22:16:07 - INFO - __main__ - Step 35924: {'lr': 0.0001995456291030683, 'samples': 1149568, 'steps': 2245, 'loss/train': 1.9089791774749756} -09/20/2021 22:16:08 - INFO - __main__ - Step 35925: {'lr': 0.0001995456291030683, 'samples': 1149600, 'steps': 2245, 'loss/train': 0.5325325727462769} -09/20/2021 22:16:08 - INFO - __main__ - Step 35926: {'lr': 0.0001995456291030683, 'samples': 1149632, 'steps': 2245, 'loss/train': 0.4652756154537201} -09/20/2021 22:16:09 - INFO - __main__ - Step 35927: {'lr': 0.0001995456291030683, 'samples': 1149664, 'steps': 2245, 'loss/train': 1.2056618928909302} -09/20/2021 22:16:10 - INFO - __main__ - Step 35928: {'lr': 0.0001995456291030683, 'samples': 1149696, 'steps': 2245, 'loss/train': 2.13759446144104} -09/20/2021 22:16:11 - INFO - __main__ - Step 35929: {'lr': 0.0001995456291030683, 'samples': 1149728, 'steps': 2245, 'loss/train': 1.7052419185638428} -09/20/2021 22:16:11 - INFO - __main__ - Step 35930: {'lr': 0.0001995456291030683, 'samples': 1149760, 'steps': 2245, 'loss/train': 3.2379844188690186} -09/20/2021 22:16:12 - INFO - __main__ - Step 35931: {'lr': 0.0001995456291030683, 'samples': 1149792, 'steps': 2245, 'loss/train': 2.0218403339385986} -09/20/2021 22:16:13 - INFO - __main__ - Step 35932: {'lr': 0.0001995456291030683, 'samples': 1149824, 'steps': 2245, 'loss/train': 2.4402945041656494} -09/20/2021 22:16:14 - INFO - __main__ - Step 35933: {'lr': 0.0001995456291030683, 'samples': 1149856, 'steps': 2245, 'loss/train': 1.9128282070159912} -09/20/2021 22:16:14 - INFO - __main__ - Step 35934: {'lr': 0.0001995456291030683, 'samples': 1149888, 'steps': 2245, 'loss/train': 2.1810498237609863} -09/20/2021 22:16:16 - INFO - __main__ - Step 35935: {'lr': 0.0001995456291030683, 'samples': 1149920, 'steps': 2245, 'loss/train': 2.2540276050567627} -09/20/2021 22:16:16 - INFO - __main__ - Step 35936: {'lr': 0.0001995456291030683, 'samples': 1149952, 'steps': 2245, 'loss/train': 1.6824954748153687} -09/20/2021 22:16:17 - INFO - __main__ - Step 35937: {'lr': 0.0001995450215072381, 'samples': 1149984, 'steps': 2246, 'loss/train': 2.4927170276641846} -09/20/2021 22:16:18 - INFO - __main__ - Step 35938: {'lr': 0.0001995450215072381, 'samples': 1150016, 'steps': 2246, 'loss/train': 4.102428913116455} -09/20/2021 22:16:19 - INFO - __main__ - Step 35939: {'lr': 0.0001995450215072381, 'samples': 1150048, 'steps': 2246, 'loss/train': 1.5204415321350098} -09/20/2021 22:16:19 - INFO - __main__ - Step 35940: {'lr': 0.0001995450215072381, 'samples': 1150080, 'steps': 2246, 'loss/train': 2.1964402198791504} -09/20/2021 22:16:20 - INFO - __main__ - Step 35941: {'lr': 0.0001995450215072381, 'samples': 1150112, 'steps': 2246, 'loss/train': 2.2465336322784424} -09/20/2021 22:16:21 - INFO - __main__ - Step 35942: {'lr': 0.0001995450215072381, 'samples': 1150144, 'steps': 2246, 'loss/train': 2.2371139526367188} -09/20/2021 22:16:22 - INFO - __main__ - Step 35943: {'lr': 0.0001995450215072381, 'samples': 1150176, 'steps': 2246, 'loss/train': 2.3665692806243896} -09/20/2021 22:16:22 - INFO - __main__ - Step 35944: {'lr': 0.0001995450215072381, 'samples': 1150208, 'steps': 2246, 'loss/train': 2.607699394226074} -09/20/2021 22:16:23 - INFO - __main__ - Step 35945: {'lr': 0.0001995450215072381, 'samples': 1150240, 'steps': 2246, 'loss/train': 0.41757211089134216} -09/20/2021 22:16:24 - INFO - __main__ - Step 35946: {'lr': 0.0001995450215072381, 'samples': 1150272, 'steps': 2246, 'loss/train': 1.7716702222824097} -09/20/2021 22:16:25 - INFO - __main__ - Step 35947: {'lr': 0.0001995450215072381, 'samples': 1150304, 'steps': 2246, 'loss/train': 2.5938615798950195} -09/20/2021 22:16:25 - INFO - __main__ - Step 35948: {'lr': 0.0001995450215072381, 'samples': 1150336, 'steps': 2246, 'loss/train': 1.2783114910125732} -09/20/2021 22:16:26 - INFO - __main__ - Step 35949: {'lr': 0.0001995450215072381, 'samples': 1150368, 'steps': 2246, 'loss/train': 2.6590538024902344} -09/20/2021 22:16:27 - INFO - __main__ - Step 35950: {'lr': 0.0001995450215072381, 'samples': 1150400, 'steps': 2246, 'loss/train': 1.9740116596221924} -09/20/2021 22:16:28 - INFO - __main__ - Step 35951: {'lr': 0.0001995450215072381, 'samples': 1150432, 'steps': 2246, 'loss/train': 2.5176315307617188} -09/20/2021 22:16:28 - INFO - __main__ - Step 35952: {'lr': 0.0001995450215072381, 'samples': 1150464, 'steps': 2246, 'loss/train': 2.225553035736084} -09/20/2021 22:16:29 - INFO - __main__ - Step 35953: {'lr': 0.0001995444135063596, 'samples': 1150496, 'steps': 2247, 'loss/train': 2.6253044605255127} -09/20/2021 22:16:30 - INFO - __main__ - Step 35954: {'lr': 0.0001995444135063596, 'samples': 1150528, 'steps': 2247, 'loss/train': 1.9224013090133667} -09/20/2021 22:16:31 - INFO - __main__ - Step 35955: {'lr': 0.0001995444135063596, 'samples': 1150560, 'steps': 2247, 'loss/train': 3.3446767330169678} -09/20/2021 22:16:32 - INFO - __main__ - Step 35956: {'lr': 0.0001995444135063596, 'samples': 1150592, 'steps': 2247, 'loss/train': 2.6354353427886963} -09/20/2021 22:16:32 - INFO - __main__ - Step 35957: {'lr': 0.0001995444135063596, 'samples': 1150624, 'steps': 2247, 'loss/train': 2.12070894241333} -09/20/2021 22:16:33 - INFO - __main__ - Step 35958: {'lr': 0.0001995444135063596, 'samples': 1150656, 'steps': 2247, 'loss/train': 0.813953161239624} -09/20/2021 22:16:34 - INFO - __main__ - Step 35959: {'lr': 0.0001995444135063596, 'samples': 1150688, 'steps': 2247, 'loss/train': 2.6345226764678955} -09/20/2021 22:16:35 - INFO - __main__ - Step 35960: {'lr': 0.0001995444135063596, 'samples': 1150720, 'steps': 2247, 'loss/train': 3.239147663116455} -09/20/2021 22:16:35 - INFO - __main__ - Step 35961: {'lr': 0.0001995444135063596, 'samples': 1150752, 'steps': 2247, 'loss/train': 2.5260372161865234} -09/20/2021 22:16:36 - INFO - __main__ - Step 35962: {'lr': 0.0001995444135063596, 'samples': 1150784, 'steps': 2247, 'loss/train': 1.984071135520935} -09/20/2021 22:16:37 - INFO - __main__ - Step 35963: {'lr': 0.0001995444135063596, 'samples': 1150816, 'steps': 2247, 'loss/train': 0.9401834607124329} -09/20/2021 22:16:38 - INFO - __main__ - Step 35964: {'lr': 0.0001995444135063596, 'samples': 1150848, 'steps': 2247, 'loss/train': 2.7442588806152344} -09/20/2021 22:16:38 - INFO - __main__ - Step 35965: {'lr': 0.0001995444135063596, 'samples': 1150880, 'steps': 2247, 'loss/train': 2.6758415699005127} -09/20/2021 22:16:40 - INFO - __main__ - Step 35966: {'lr': 0.0001995444135063596, 'samples': 1150912, 'steps': 2247, 'loss/train': 2.3475751876831055} -09/20/2021 22:16:40 - INFO - __main__ - Step 35967: {'lr': 0.0001995444135063596, 'samples': 1150944, 'steps': 2247, 'loss/train': 2.2163851261138916} -09/20/2021 22:16:41 - INFO - __main__ - Step 35968: {'lr': 0.0001995444135063596, 'samples': 1150976, 'steps': 2247, 'loss/train': 2.59212589263916} -09/20/2021 22:16:42 - INFO - __main__ - Step 35969: {'lr': 0.0001995438051004353, 'samples': 1151008, 'steps': 2248, 'loss/train': 2.1997230052948} -09/20/2021 22:16:43 - INFO - __main__ - Step 35970: {'lr': 0.0001995438051004353, 'samples': 1151040, 'steps': 2248, 'loss/train': 2.868237018585205} -09/20/2021 22:16:43 - INFO - __main__ - Step 35971: {'lr': 0.0001995438051004353, 'samples': 1151072, 'steps': 2248, 'loss/train': 2.53548526763916} -09/20/2021 22:16:44 - INFO - __main__ - Step 35972: {'lr': 0.0001995438051004353, 'samples': 1151104, 'steps': 2248, 'loss/train': 2.043212890625} -09/20/2021 22:16:45 - INFO - __main__ - Step 35973: {'lr': 0.0001995438051004353, 'samples': 1151136, 'steps': 2248, 'loss/train': 1.8021999597549438} -09/20/2021 22:16:46 - INFO - __main__ - Step 35974: {'lr': 0.0001995438051004353, 'samples': 1151168, 'steps': 2248, 'loss/train': 2.727936267852783} -09/20/2021 22:16:46 - INFO - __main__ - Step 35975: {'lr': 0.0001995438051004353, 'samples': 1151200, 'steps': 2248, 'loss/train': 2.537184000015259} -09/20/2021 22:16:47 - INFO - __main__ - Step 35976: {'lr': 0.0001995438051004353, 'samples': 1151232, 'steps': 2248, 'loss/train': 1.9712495803833008} -09/20/2021 22:16:48 - INFO - __main__ - Step 35977: {'lr': 0.0001995438051004353, 'samples': 1151264, 'steps': 2248, 'loss/train': 1.9708654880523682} -09/20/2021 22:16:49 - INFO - __main__ - Step 35978: {'lr': 0.0001995438051004353, 'samples': 1151296, 'steps': 2248, 'loss/train': 1.788269281387329} -09/20/2021 22:16:49 - INFO - __main__ - Step 35979: {'lr': 0.0001995438051004353, 'samples': 1151328, 'steps': 2248, 'loss/train': 2.0232832431793213} -09/20/2021 22:16:50 - INFO - __main__ - Step 35980: {'lr': 0.0001995438051004353, 'samples': 1151360, 'steps': 2248, 'loss/train': 1.8733975887298584} -09/20/2021 22:16:51 - INFO - __main__ - Step 35981: {'lr': 0.0001995438051004353, 'samples': 1151392, 'steps': 2248, 'loss/train': 2.7341954708099365} -09/20/2021 22:16:52 - INFO - __main__ - Step 35982: {'lr': 0.0001995438051004353, 'samples': 1151424, 'steps': 2248, 'loss/train': 2.335815191268921} -09/20/2021 22:16:52 - INFO - __main__ - Step 35983: {'lr': 0.0001995438051004353, 'samples': 1151456, 'steps': 2248, 'loss/train': 2.400216817855835} -09/20/2021 22:16:53 - INFO - __main__ - Step 35984: {'lr': 0.0001995438051004353, 'samples': 1151488, 'steps': 2248, 'loss/train': 1.975624442100525} -09/20/2021 22:16:54 - INFO - __main__ - Step 35985: {'lr': 0.0001995431962894676, 'samples': 1151520, 'steps': 2249, 'loss/train': 2.648162364959717} -09/20/2021 22:16:55 - INFO - __main__ - Step 35986: {'lr': 0.0001995431962894676, 'samples': 1151552, 'steps': 2249, 'loss/train': 2.6056418418884277} -09/20/2021 22:16:56 - INFO - __main__ - Step 35987: {'lr': 0.0001995431962894676, 'samples': 1151584, 'steps': 2249, 'loss/train': 1.808221697807312} -09/20/2021 22:16:56 - INFO - __main__ - Step 35988: {'lr': 0.0001995431962894676, 'samples': 1151616, 'steps': 2249, 'loss/train': 2.5056777000427246} -09/20/2021 22:16:57 - INFO - __main__ - Step 35989: {'lr': 0.0001995431962894676, 'samples': 1151648, 'steps': 2249, 'loss/train': 2.337735652923584} -09/20/2021 22:16:58 - INFO - __main__ - Step 35990: {'lr': 0.0001995431962894676, 'samples': 1151680, 'steps': 2249, 'loss/train': 2.434122323989868} -09/20/2021 22:16:59 - INFO - __main__ - Step 35991: {'lr': 0.0001995431962894676, 'samples': 1151712, 'steps': 2249, 'loss/train': 1.7025405168533325} -09/20/2021 22:16:59 - INFO - __main__ - Step 35992: {'lr': 0.0001995431962894676, 'samples': 1151744, 'steps': 2249, 'loss/train': 2.3130762577056885} -09/20/2021 22:17:00 - INFO - __main__ - Step 35993: {'lr': 0.0001995431962894676, 'samples': 1151776, 'steps': 2249, 'loss/train': 2.1101012229919434} -09/20/2021 22:17:01 - INFO - __main__ - Step 35994: {'lr': 0.0001995431962894676, 'samples': 1151808, 'steps': 2249, 'loss/train': 1.5557926893234253} -09/20/2021 22:17:02 - INFO - __main__ - Step 35995: {'lr': 0.0001995431962894676, 'samples': 1151840, 'steps': 2249, 'loss/train': 2.2947194576263428} -09/20/2021 22:17:02 - INFO - __main__ - Step 35996: {'lr': 0.0001995431962894676, 'samples': 1151872, 'steps': 2249, 'loss/train': 2.767549991607666} -09/20/2021 22:17:04 - INFO - __main__ - Step 35997: {'lr': 0.0001995431962894676, 'samples': 1151904, 'steps': 2249, 'loss/train': 1.83420991897583} -09/20/2021 22:17:04 - INFO - __main__ - Step 35998: {'lr': 0.0001995431962894676, 'samples': 1151936, 'steps': 2249, 'loss/train': 1.3355501890182495} -09/20/2021 22:17:05 - INFO - __main__ - Step 35999: {'lr': 0.0001995431962894676, 'samples': 1151968, 'steps': 2249, 'loss/train': 3.157470941543579} -09/20/2021 22:17:06 - INFO - __main__ - Step 36000: {'lr': 0.0001995431962894676, 'samples': 1152000, 'steps': 2249, 'loss/train': 1.6790632009506226} -09/20/2021 22:17:07 - INFO - __main__ - Step 36001: {'lr': 0.000199542587073459, 'samples': 1152032, 'steps': 2250, 'loss/train': 1.9715403318405151} -09/20/2021 22:17:08 - INFO - __main__ - Step 36002: {'lr': 0.000199542587073459, 'samples': 1152064, 'steps': 2250, 'loss/train': 1.7278227806091309} -09/20/2021 22:17:08 - INFO - __main__ - Step 36003: {'lr': 0.000199542587073459, 'samples': 1152096, 'steps': 2250, 'loss/train': 2.288104772567749} -09/20/2021 22:17:09 - INFO - __main__ - Step 36004: {'lr': 0.000199542587073459, 'samples': 1152128, 'steps': 2250, 'loss/train': 2.13484787940979} -09/20/2021 22:17:10 - INFO - __main__ - Step 36005: {'lr': 0.000199542587073459, 'samples': 1152160, 'steps': 2250, 'loss/train': 1.9571728706359863} -09/20/2021 22:17:11 - INFO - __main__ - Step 36006: {'lr': 0.000199542587073459, 'samples': 1152192, 'steps': 2250, 'loss/train': 2.95509672164917} -09/20/2021 22:17:11 - INFO - __main__ - Step 36007: {'lr': 0.000199542587073459, 'samples': 1152224, 'steps': 2250, 'loss/train': 2.276764392852783} -09/20/2021 22:17:12 - INFO - __main__ - Step 36008: {'lr': 0.000199542587073459, 'samples': 1152256, 'steps': 2250, 'loss/train': 0.6823796629905701} -09/20/2021 22:17:13 - INFO - __main__ - Step 36009: {'lr': 0.000199542587073459, 'samples': 1152288, 'steps': 2250, 'loss/train': 1.5118030309677124} -09/20/2021 22:17:14 - INFO - __main__ - Step 36010: {'lr': 0.000199542587073459, 'samples': 1152320, 'steps': 2250, 'loss/train': 2.9419267177581787} -09/20/2021 22:17:14 - INFO - __main__ - Step 36011: {'lr': 0.000199542587073459, 'samples': 1152352, 'steps': 2250, 'loss/train': 2.4254586696624756} -09/20/2021 22:17:15 - INFO - __main__ - Step 36012: {'lr': 0.000199542587073459, 'samples': 1152384, 'steps': 2250, 'loss/train': 1.9991042613983154} -09/20/2021 22:17:16 - INFO - __main__ - Step 36013: {'lr': 0.000199542587073459, 'samples': 1152416, 'steps': 2250, 'loss/train': 2.486572027206421} -09/20/2021 22:17:17 - INFO - __main__ - Step 36014: {'lr': 0.000199542587073459, 'samples': 1152448, 'steps': 2250, 'loss/train': 1.9481730461120605} -09/20/2021 22:17:17 - INFO - __main__ - Step 36015: {'lr': 0.000199542587073459, 'samples': 1152480, 'steps': 2250, 'loss/train': 2.263629913330078} -09/20/2021 22:17:18 - INFO - __main__ - Step 36016: {'lr': 0.000199542587073459, 'samples': 1152512, 'steps': 2250, 'loss/train': 3.007990598678589} -09/20/2021 22:17:19 - INFO - __main__ - Step 36017: {'lr': 0.00019954197745241205, 'samples': 1152544, 'steps': 2251, 'loss/train': 1.2578601837158203} -09/20/2021 22:17:20 - INFO - __main__ - Step 36018: {'lr': 0.00019954197745241205, 'samples': 1152576, 'steps': 2251, 'loss/train': 2.674943685531616} -09/20/2021 22:17:20 - INFO - __main__ - Step 36019: {'lr': 0.00019954197745241205, 'samples': 1152608, 'steps': 2251, 'loss/train': 1.7410000562667847} -09/20/2021 22:17:21 - INFO - __main__ - Step 36020: {'lr': 0.00019954197745241205, 'samples': 1152640, 'steps': 2251, 'loss/train': 2.9311411380767822} -09/20/2021 22:17:22 - INFO - __main__ - Step 36021: {'lr': 0.00019954197745241205, 'samples': 1152672, 'steps': 2251, 'loss/train': 2.3043055534362793} -09/20/2021 22:17:23 - INFO - __main__ - Step 36022: {'lr': 0.00019954197745241205, 'samples': 1152704, 'steps': 2251, 'loss/train': 0.37910234928131104} -09/20/2021 22:17:23 - INFO - __main__ - Step 36023: {'lr': 0.00019954197745241205, 'samples': 1152736, 'steps': 2251, 'loss/train': 0.2505241930484772} -09/20/2021 22:17:24 - INFO - __main__ - Step 36024: {'lr': 0.00019954197745241205, 'samples': 1152768, 'steps': 2251, 'loss/train': 2.9413857460021973} -09/20/2021 22:17:25 - INFO - __main__ - Step 36025: {'lr': 0.00019954197745241205, 'samples': 1152800, 'steps': 2251, 'loss/train': 1.043688178062439} -09/20/2021 22:17:26 - INFO - __main__ - Step 36026: {'lr': 0.00019954197745241205, 'samples': 1152832, 'steps': 2251, 'loss/train': 2.625046730041504} -09/20/2021 22:17:27 - INFO - __main__ - Step 36027: {'lr': 0.00019954197745241205, 'samples': 1152864, 'steps': 2251, 'loss/train': 1.3581123352050781} -09/20/2021 22:17:28 - INFO - __main__ - Step 36028: {'lr': 0.00019954197745241205, 'samples': 1152896, 'steps': 2251, 'loss/train': 2.6093225479125977} -09/20/2021 22:17:28 - INFO - __main__ - Step 36029: {'lr': 0.00019954197745241205, 'samples': 1152928, 'steps': 2251, 'loss/train': 1.8819754123687744} -09/20/2021 22:17:29 - INFO - __main__ - Step 36030: {'lr': 0.00019954197745241205, 'samples': 1152960, 'steps': 2251, 'loss/train': 2.474364757537842} -09/20/2021 22:17:30 - INFO - __main__ - Step 36031: {'lr': 0.00019954197745241205, 'samples': 1152992, 'steps': 2251, 'loss/train': 2.097780466079712} -09/20/2021 22:17:31 - INFO - __main__ - Step 36032: {'lr': 0.00019954197745241205, 'samples': 1153024, 'steps': 2251, 'loss/train': 1.7711538076400757} -09/20/2021 22:17:32 - INFO - __main__ - Step 36033: {'lr': 0.00019954136742632915, 'samples': 1153056, 'steps': 2252, 'loss/train': 2.1075563430786133} -09/20/2021 22:17:32 - INFO - __main__ - Step 36034: {'lr': 0.00019954136742632915, 'samples': 1153088, 'steps': 2252, 'loss/train': 2.3223211765289307} -09/20/2021 22:17:33 - INFO - __main__ - Step 36035: {'lr': 0.00019954136742632915, 'samples': 1153120, 'steps': 2252, 'loss/train': 2.5071349143981934} -09/20/2021 22:17:34 - INFO - __main__ - Step 36036: {'lr': 0.00019954136742632915, 'samples': 1153152, 'steps': 2252, 'loss/train': 1.4887111186981201} -09/20/2021 22:17:35 - INFO - __main__ - Step 36037: {'lr': 0.00019954136742632915, 'samples': 1153184, 'steps': 2252, 'loss/train': 1.6890850067138672} -09/20/2021 22:17:35 - INFO - __main__ - Step 36038: {'lr': 0.00019954136742632915, 'samples': 1153216, 'steps': 2252, 'loss/train': 1.8856565952301025} -09/20/2021 22:17:36 - INFO - __main__ - Step 36039: {'lr': 0.00019954136742632915, 'samples': 1153248, 'steps': 2252, 'loss/train': 1.6647837162017822} -09/20/2021 22:17:37 - INFO - __main__ - Step 36040: {'lr': 0.00019954136742632915, 'samples': 1153280, 'steps': 2252, 'loss/train': 2.128610849380493} -09/20/2021 22:17:38 - INFO - __main__ - Step 36041: {'lr': 0.00019954136742632915, 'samples': 1153312, 'steps': 2252, 'loss/train': 2.6392617225646973} -09/20/2021 22:17:38 - INFO - __main__ - Step 36042: {'lr': 0.00019954136742632915, 'samples': 1153344, 'steps': 2252, 'loss/train': 2.2356984615325928} -09/20/2021 22:17:39 - INFO - __main__ - Step 36043: {'lr': 0.00019954136742632915, 'samples': 1153376, 'steps': 2252, 'loss/train': 1.8911828994750977} -09/20/2021 22:17:40 - INFO - __main__ - Step 36044: {'lr': 0.00019954136742632915, 'samples': 1153408, 'steps': 2252, 'loss/train': 2.4861927032470703} -09/20/2021 22:17:41 - INFO - __main__ - Step 36045: {'lr': 0.00019954136742632915, 'samples': 1153440, 'steps': 2252, 'loss/train': 3.4177815914154053} -09/20/2021 22:17:41 - INFO - __main__ - Step 36046: {'lr': 0.00019954136742632915, 'samples': 1153472, 'steps': 2252, 'loss/train': 2.0525667667388916} -09/20/2021 22:17:42 - INFO - __main__ - Step 36047: {'lr': 0.00019954136742632915, 'samples': 1153504, 'steps': 2252, 'loss/train': 1.4537453651428223} -09/20/2021 22:17:43 - INFO - __main__ - Step 36048: {'lr': 0.00019954136742632915, 'samples': 1153536, 'steps': 2252, 'loss/train': 2.1813290119171143} -09/20/2021 22:17:44 - INFO - __main__ - Step 36049: {'lr': 0.00019954075699521283, 'samples': 1153568, 'steps': 2253, 'loss/train': 2.341846227645874} -09/20/2021 22:17:44 - INFO - __main__ - Step 36050: {'lr': 0.00019954075699521283, 'samples': 1153600, 'steps': 2253, 'loss/train': 2.0233705043792725} -09/20/2021 22:17:45 - INFO - __main__ - Step 36051: {'lr': 0.00019954075699521283, 'samples': 1153632, 'steps': 2253, 'loss/train': 1.6874113082885742} -09/20/2021 22:17:46 - INFO - __main__ - Step 36052: {'lr': 0.00019954075699521283, 'samples': 1153664, 'steps': 2253, 'loss/train': 1.4456497430801392} -09/20/2021 22:17:47 - INFO - __main__ - Step 36053: {'lr': 0.00019954075699521283, 'samples': 1153696, 'steps': 2253, 'loss/train': 2.1770546436309814} -09/20/2021 22:17:47 - INFO - __main__ - Step 36054: {'lr': 0.00019954075699521283, 'samples': 1153728, 'steps': 2253, 'loss/train': 1.0737149715423584} -09/20/2021 22:17:48 - INFO - __main__ - Step 36055: {'lr': 0.00019954075699521283, 'samples': 1153760, 'steps': 2253, 'loss/train': 2.1384739875793457} -09/20/2021 22:17:49 - INFO - __main__ - Step 36056: {'lr': 0.00019954075699521283, 'samples': 1153792, 'steps': 2253, 'loss/train': 2.9607598781585693} -09/20/2021 22:17:50 - INFO - __main__ - Step 36057: {'lr': 0.00019954075699521283, 'samples': 1153824, 'steps': 2253, 'loss/train': 2.7559499740600586} -09/20/2021 22:17:50 - INFO - __main__ - Step 36058: {'lr': 0.00019954075699521283, 'samples': 1153856, 'steps': 2253, 'loss/train': 1.7610065937042236} -09/20/2021 22:17:52 - INFO - __main__ - Step 36059: {'lr': 0.00019954075699521283, 'samples': 1153888, 'steps': 2253, 'loss/train': 2.2405498027801514} -09/20/2021 22:17:53 - INFO - __main__ - Step 36060: {'lr': 0.00019954075699521283, 'samples': 1153920, 'steps': 2253, 'loss/train': 2.208465814590454} -09/20/2021 22:17:53 - INFO - __main__ - Step 36061: {'lr': 0.00019954075699521283, 'samples': 1153952, 'steps': 2253, 'loss/train': 1.6752969026565552} -09/20/2021 22:17:54 - INFO - __main__ - Step 36062: {'lr': 0.00019954075699521283, 'samples': 1153984, 'steps': 2253, 'loss/train': 0.7304447293281555} -09/20/2021 22:17:55 - INFO - __main__ - Step 36063: {'lr': 0.00019954075699521283, 'samples': 1154016, 'steps': 2253, 'loss/train': 0.7817417979240417} -09/20/2021 22:17:56 - INFO - __main__ - Step 36064: {'lr': 0.00019954075699521283, 'samples': 1154048, 'steps': 2253, 'loss/train': 0.8118446469306946} -09/20/2021 22:17:57 - INFO - __main__ - Step 36065: {'lr': 0.00019954014615906554, 'samples': 1154080, 'steps': 2254, 'loss/train': 0.591041624546051} -09/20/2021 22:17:57 - INFO - __main__ - Step 36066: {'lr': 0.00019954014615906554, 'samples': 1154112, 'steps': 2254, 'loss/train': 3.429821729660034} -09/20/2021 22:17:58 - INFO - __main__ - Step 36067: {'lr': 0.00019954014615906554, 'samples': 1154144, 'steps': 2254, 'loss/train': 2.8198342323303223} -09/20/2021 22:17:59 - INFO - __main__ - Step 36068: {'lr': 0.00019954014615906554, 'samples': 1154176, 'steps': 2254, 'loss/train': 2.0374515056610107} -09/20/2021 22:18:00 - INFO - __main__ - Step 36069: {'lr': 0.00019954014615906554, 'samples': 1154208, 'steps': 2254, 'loss/train': 1.6957749128341675} -09/20/2021 22:18:00 - INFO - __main__ - Step 36070: {'lr': 0.00019954014615906554, 'samples': 1154240, 'steps': 2254, 'loss/train': 2.7355048656463623} -09/20/2021 22:18:01 - INFO - __main__ - Step 36071: {'lr': 0.00019954014615906554, 'samples': 1154272, 'steps': 2254, 'loss/train': 1.662119746208191} -09/20/2021 22:18:02 - INFO - __main__ - Step 36072: {'lr': 0.00019954014615906554, 'samples': 1154304, 'steps': 2254, 'loss/train': 2.4525866508483887} -09/20/2021 22:18:03 - INFO - __main__ - Step 36073: {'lr': 0.00019954014615906554, 'samples': 1154336, 'steps': 2254, 'loss/train': 3.9416165351867676} -09/20/2021 22:18:03 - INFO - __main__ - Step 36074: {'lr': 0.00019954014615906554, 'samples': 1154368, 'steps': 2254, 'loss/train': 2.592252731323242} -09/20/2021 22:18:04 - INFO - __main__ - Step 36075: {'lr': 0.00019954014615906554, 'samples': 1154400, 'steps': 2254, 'loss/train': 2.9269416332244873} -09/20/2021 22:18:05 - INFO - __main__ - Step 36076: {'lr': 0.00019954014615906554, 'samples': 1154432, 'steps': 2254, 'loss/train': 2.7078042030334473} -09/20/2021 22:18:06 - INFO - __main__ - Step 36077: {'lr': 0.00019954014615906554, 'samples': 1154464, 'steps': 2254, 'loss/train': 2.0250866413116455} -09/20/2021 22:18:06 - INFO - __main__ - Step 36078: {'lr': 0.00019954014615906554, 'samples': 1154496, 'steps': 2254, 'loss/train': 2.353771924972534} -09/20/2021 22:18:07 - INFO - __main__ - Step 36079: {'lr': 0.00019954014615906554, 'samples': 1154528, 'steps': 2254, 'loss/train': 2.140770435333252} -09/20/2021 22:18:08 - INFO - __main__ - Step 36080: {'lr': 0.00019954014615906554, 'samples': 1154560, 'steps': 2254, 'loss/train': 2.2795214653015137} -09/20/2021 22:18:09 - INFO - __main__ - Step 36081: {'lr': 0.00019953953491788978, 'samples': 1154592, 'steps': 2255, 'loss/train': 2.1041676998138428} -09/20/2021 22:18:09 - INFO - __main__ - Step 36082: {'lr': 0.00019953953491788978, 'samples': 1154624, 'steps': 2255, 'loss/train': 1.8959228992462158} -09/20/2021 22:18:10 - INFO - __main__ - Step 36083: {'lr': 0.00019953953491788978, 'samples': 1154656, 'steps': 2255, 'loss/train': 1.857370138168335} -09/20/2021 22:18:11 - INFO - __main__ - Step 36084: {'lr': 0.00019953953491788978, 'samples': 1154688, 'steps': 2255, 'loss/train': 3.2375781536102295} -09/20/2021 22:18:12 - INFO - __main__ - Step 36085: {'lr': 0.00019953953491788978, 'samples': 1154720, 'steps': 2255, 'loss/train': 3.2062811851501465} -09/20/2021 22:18:12 - INFO - __main__ - Step 36086: {'lr': 0.00019953953491788978, 'samples': 1154752, 'steps': 2255, 'loss/train': 0.9095586538314819} -09/20/2021 22:18:13 - INFO - __main__ - Step 36087: {'lr': 0.00019953953491788978, 'samples': 1154784, 'steps': 2255, 'loss/train': 2.049769878387451} -09/20/2021 22:18:14 - INFO - __main__ - Step 36088: {'lr': 0.00019953953491788978, 'samples': 1154816, 'steps': 2255, 'loss/train': 2.5625433921813965} -09/20/2021 22:18:15 - INFO - __main__ - Step 36089: {'lr': 0.00019953953491788978, 'samples': 1154848, 'steps': 2255, 'loss/train': 2.2707340717315674} -09/20/2021 22:18:15 - INFO - __main__ - Step 36090: {'lr': 0.00019953953491788978, 'samples': 1154880, 'steps': 2255, 'loss/train': 1.9894556999206543} -09/20/2021 22:18:17 - INFO - __main__ - Step 36091: {'lr': 0.00019953953491788978, 'samples': 1154912, 'steps': 2255, 'loss/train': 2.0423569679260254} -09/20/2021 22:18:17 - INFO - __main__ - Step 36092: {'lr': 0.00019953953491788978, 'samples': 1154944, 'steps': 2255, 'loss/train': 2.8023102283477783} -09/20/2021 22:18:18 - INFO - __main__ - Step 36093: {'lr': 0.00019953953491788978, 'samples': 1154976, 'steps': 2255, 'loss/train': 2.3893680572509766} -09/20/2021 22:18:19 - INFO - __main__ - Step 36094: {'lr': 0.00019953953491788978, 'samples': 1155008, 'steps': 2255, 'loss/train': 1.6832153797149658} -09/20/2021 22:18:20 - INFO - __main__ - Step 36095: {'lr': 0.00019953953491788978, 'samples': 1155040, 'steps': 2255, 'loss/train': 2.028113842010498} -09/20/2021 22:18:20 - INFO - __main__ - Step 36096: {'lr': 0.00019953953491788978, 'samples': 1155072, 'steps': 2255, 'loss/train': 2.134061574935913} -09/20/2021 22:18:21 - INFO - __main__ - Step 36097: {'lr': 0.00019953892327168805, 'samples': 1155104, 'steps': 2256, 'loss/train': 1.3480287790298462} -09/20/2021 22:18:22 - INFO - __main__ - Step 36098: {'lr': 0.00019953892327168805, 'samples': 1155136, 'steps': 2256, 'loss/train': 2.508298635482788} -09/20/2021 22:18:23 - INFO - __main__ - Step 36099: {'lr': 0.00019953892327168805, 'samples': 1155168, 'steps': 2256, 'loss/train': 1.8833431005477905} -09/20/2021 22:18:24 - INFO - __main__ - Step 36100: {'lr': 0.00019953892327168805, 'samples': 1155200, 'steps': 2256, 'loss/train': 2.3097856044769287} -09/20/2021 22:18:24 - INFO - __main__ - Step 36101: {'lr': 0.00019953892327168805, 'samples': 1155232, 'steps': 2256, 'loss/train': 2.3266913890838623} -09/20/2021 22:18:25 - INFO - __main__ - Step 36102: {'lr': 0.00019953892327168805, 'samples': 1155264, 'steps': 2256, 'loss/train': 1.8344733715057373} -09/20/2021 22:18:26 - INFO - __main__ - Step 36103: {'lr': 0.00019953892327168805, 'samples': 1155296, 'steps': 2256, 'loss/train': 2.350554943084717} -09/20/2021 22:18:27 - INFO - __main__ - Step 36104: {'lr': 0.00019953892327168805, 'samples': 1155328, 'steps': 2256, 'loss/train': 1.622697353363037} -09/20/2021 22:18:27 - INFO - __main__ - Step 36105: {'lr': 0.00019953892327168805, 'samples': 1155360, 'steps': 2256, 'loss/train': 1.2232164144515991} -09/20/2021 22:18:28 - INFO - __main__ - Step 36106: {'lr': 0.00019953892327168805, 'samples': 1155392, 'steps': 2256, 'loss/train': 2.3192880153656006} -09/20/2021 22:18:29 - INFO - __main__ - Step 36107: {'lr': 0.00019953892327168805, 'samples': 1155424, 'steps': 2256, 'loss/train': 1.3193014860153198} -09/20/2021 22:18:30 - INFO - __main__ - Step 36108: {'lr': 0.00019953892327168805, 'samples': 1155456, 'steps': 2256, 'loss/train': 2.8262784481048584} -09/20/2021 22:18:30 - INFO - __main__ - Step 36109: {'lr': 0.00019953892327168805, 'samples': 1155488, 'steps': 2256, 'loss/train': 2.955333709716797} -09/20/2021 22:18:31 - INFO - __main__ - Step 36110: {'lr': 0.00019953892327168805, 'samples': 1155520, 'steps': 2256, 'loss/train': 0.5630654692649841} -09/20/2021 22:18:32 - INFO - __main__ - Step 36111: {'lr': 0.00019953892327168805, 'samples': 1155552, 'steps': 2256, 'loss/train': 2.105526924133301} -09/20/2021 22:18:33 - INFO - __main__ - Step 36112: {'lr': 0.00019953892327168805, 'samples': 1155584, 'steps': 2256, 'loss/train': 2.5835978984832764} -09/20/2021 22:18:33 - INFO - __main__ - Step 36113: {'lr': 0.00019953831122046284, 'samples': 1155616, 'steps': 2257, 'loss/train': 2.2725279331207275} -09/20/2021 22:18:34 - INFO - __main__ - Step 36114: {'lr': 0.00019953831122046284, 'samples': 1155648, 'steps': 2257, 'loss/train': 1.923558235168457} -09/20/2021 22:18:35 - INFO - __main__ - Step 36115: {'lr': 0.00019953831122046284, 'samples': 1155680, 'steps': 2257, 'loss/train': 3.1297173500061035} -09/20/2021 22:18:36 - INFO - __main__ - Step 36116: {'lr': 0.00019953831122046284, 'samples': 1155712, 'steps': 2257, 'loss/train': 2.6306698322296143} -09/20/2021 22:18:36 - INFO - __main__ - Step 36117: {'lr': 0.00019953831122046284, 'samples': 1155744, 'steps': 2257, 'loss/train': 2.1376686096191406} -09/20/2021 22:18:37 - INFO - __main__ - Step 36118: {'lr': 0.00019953831122046284, 'samples': 1155776, 'steps': 2257, 'loss/train': 3.506300449371338} -09/20/2021 22:18:38 - INFO - __main__ - Step 36119: {'lr': 0.00019953831122046284, 'samples': 1155808, 'steps': 2257, 'loss/train': 2.593200445175171} -09/20/2021 22:18:39 - INFO - __main__ - Step 36120: {'lr': 0.00019953831122046284, 'samples': 1155840, 'steps': 2257, 'loss/train': 1.5905944108963013} -09/20/2021 22:18:39 - INFO - __main__ - Step 36121: {'lr': 0.00019953831122046284, 'samples': 1155872, 'steps': 2257, 'loss/train': 2.6732470989227295} -09/20/2021 22:18:41 - INFO - __main__ - Step 36122: {'lr': 0.00019953831122046284, 'samples': 1155904, 'steps': 2257, 'loss/train': 2.415726900100708} -09/20/2021 22:18:42 - INFO - __main__ - Step 36123: {'lr': 0.00019953831122046284, 'samples': 1155936, 'steps': 2257, 'loss/train': 2.431497573852539} -09/20/2021 22:18:42 - INFO - __main__ - Step 36124: {'lr': 0.00019953831122046284, 'samples': 1155968, 'steps': 2257, 'loss/train': 2.5740199089050293} -09/20/2021 22:18:43 - INFO - __main__ - Step 36125: {'lr': 0.00019953831122046284, 'samples': 1156000, 'steps': 2257, 'loss/train': 2.3865132331848145} -09/20/2021 22:18:44 - INFO - __main__ - Step 36126: {'lr': 0.00019953831122046284, 'samples': 1156032, 'steps': 2257, 'loss/train': 2.199100971221924} -09/20/2021 22:18:44 - INFO - __main__ - Step 36127: {'lr': 0.00019953831122046284, 'samples': 1156064, 'steps': 2257, 'loss/train': 1.4740948677062988} -09/20/2021 22:18:45 - INFO - __main__ - Step 36128: {'lr': 0.00019953831122046284, 'samples': 1156096, 'steps': 2257, 'loss/train': 3.1464598178863525} -09/20/2021 22:18:46 - INFO - __main__ - Step 36129: {'lr': 0.0001995376987642166, 'samples': 1156128, 'steps': 2258, 'loss/train': 1.9512395858764648} -09/20/2021 22:18:47 - INFO - __main__ - Step 36130: {'lr': 0.0001995376987642166, 'samples': 1156160, 'steps': 2258, 'loss/train': 1.993635892868042} -09/20/2021 22:18:48 - INFO - __main__ - Step 36131: {'lr': 0.0001995376987642166, 'samples': 1156192, 'steps': 2258, 'loss/train': 2.036942481994629} -09/20/2021 22:18:48 - INFO - __main__ - Step 36132: {'lr': 0.0001995376987642166, 'samples': 1156224, 'steps': 2258, 'loss/train': 1.7911638021469116} -09/20/2021 22:18:49 - INFO - __main__ - Step 36133: {'lr': 0.0001995376987642166, 'samples': 1156256, 'steps': 2258, 'loss/train': 3.3692965507507324} -09/20/2021 22:18:50 - INFO - __main__ - Step 36134: {'lr': 0.0001995376987642166, 'samples': 1156288, 'steps': 2258, 'loss/train': 2.1065239906311035} -09/20/2021 22:18:51 - INFO - __main__ - Step 36135: {'lr': 0.0001995376987642166, 'samples': 1156320, 'steps': 2258, 'loss/train': 3.44862699508667} -09/20/2021 22:18:51 - INFO - __main__ - Step 36136: {'lr': 0.0001995376987642166, 'samples': 1156352, 'steps': 2258, 'loss/train': 3.8105626106262207} -09/20/2021 22:18:52 - INFO - __main__ - Step 36137: {'lr': 0.0001995376987642166, 'samples': 1156384, 'steps': 2258, 'loss/train': 3.0918242931365967} -09/20/2021 22:18:53 - INFO - __main__ - Step 36138: {'lr': 0.0001995376987642166, 'samples': 1156416, 'steps': 2258, 'loss/train': 1.9431066513061523} -09/20/2021 22:18:54 - INFO - __main__ - Step 36139: {'lr': 0.0001995376987642166, 'samples': 1156448, 'steps': 2258, 'loss/train': 1.8769218921661377} -09/20/2021 22:18:54 - INFO - __main__ - Step 36140: {'lr': 0.0001995376987642166, 'samples': 1156480, 'steps': 2258, 'loss/train': 2.507145404815674} -09/20/2021 22:18:55 - INFO - __main__ - Step 36141: {'lr': 0.0001995376987642166, 'samples': 1156512, 'steps': 2258, 'loss/train': 3.110936164855957} -09/20/2021 22:18:56 - INFO - __main__ - Step 36142: {'lr': 0.0001995376987642166, 'samples': 1156544, 'steps': 2258, 'loss/train': 1.6553171873092651} -09/20/2021 22:18:57 - INFO - __main__ - Step 36143: {'lr': 0.0001995376987642166, 'samples': 1156576, 'steps': 2258, 'loss/train': 1.376177191734314} -09/20/2021 22:18:57 - INFO - __main__ - Step 36144: {'lr': 0.0001995376987642166, 'samples': 1156608, 'steps': 2258, 'loss/train': 2.9395675659179688} -09/20/2021 22:18:58 - INFO - __main__ - Step 36145: {'lr': 0.00019953708590295186, 'samples': 1156640, 'steps': 2259, 'loss/train': 1.6240568161010742} -09/20/2021 22:18:59 - INFO - __main__ - Step 36146: {'lr': 0.00019953708590295186, 'samples': 1156672, 'steps': 2259, 'loss/train': 2.1625096797943115} -09/20/2021 22:19:00 - INFO - __main__ - Step 36147: {'lr': 0.00019953708590295186, 'samples': 1156704, 'steps': 2259, 'loss/train': 1.5951584577560425} -09/20/2021 22:19:00 - INFO - __main__ - Step 36148: {'lr': 0.00019953708590295186, 'samples': 1156736, 'steps': 2259, 'loss/train': 1.5808221101760864} -09/20/2021 22:19:01 - INFO - __main__ - Step 36149: {'lr': 0.00019953708590295186, 'samples': 1156768, 'steps': 2259, 'loss/train': 1.9386097192764282} -09/20/2021 22:19:02 - INFO - __main__ - Step 36150: {'lr': 0.00019953708590295186, 'samples': 1156800, 'steps': 2259, 'loss/train': 2.348659038543701} -09/20/2021 22:19:03 - INFO - __main__ - Step 36151: {'lr': 0.00019953708590295186, 'samples': 1156832, 'steps': 2259, 'loss/train': 2.1558549404144287} -09/20/2021 22:19:04 - INFO - __main__ - Step 36152: {'lr': 0.00019953708590295186, 'samples': 1156864, 'steps': 2259, 'loss/train': 2.646435499191284} -09/20/2021 22:19:05 - INFO - __main__ - Step 36153: {'lr': 0.00019953708590295186, 'samples': 1156896, 'steps': 2259, 'loss/train': 2.619147300720215} -09/20/2021 22:19:06 - INFO - __main__ - Step 36154: {'lr': 0.00019953708590295186, 'samples': 1156928, 'steps': 2259, 'loss/train': 2.7243359088897705} -09/20/2021 22:19:06 - INFO - __main__ - Step 36155: {'lr': 0.00019953708590295186, 'samples': 1156960, 'steps': 2259, 'loss/train': 2.5352234840393066} -09/20/2021 22:19:07 - INFO - __main__ - Step 36156: {'lr': 0.00019953708590295186, 'samples': 1156992, 'steps': 2259, 'loss/train': 1.7828718423843384} -09/20/2021 22:19:08 - INFO - __main__ - Step 36157: {'lr': 0.00019953708590295186, 'samples': 1157024, 'steps': 2259, 'loss/train': 2.2952675819396973} -09/20/2021 22:19:09 - INFO - __main__ - Step 36158: {'lr': 0.00019953708590295186, 'samples': 1157056, 'steps': 2259, 'loss/train': 2.9944381713867188} -09/20/2021 22:19:09 - INFO - __main__ - Step 36159: {'lr': 0.00019953708590295186, 'samples': 1157088, 'steps': 2259, 'loss/train': 2.1231470108032227} -09/20/2021 22:19:10 - INFO - __main__ - Step 36160: {'lr': 0.00019953708590295186, 'samples': 1157120, 'steps': 2259, 'loss/train': 1.9065849781036377} -09/20/2021 22:19:11 - INFO - __main__ - Step 36161: {'lr': 0.00019953647263667112, 'samples': 1157152, 'steps': 2260, 'loss/train': 1.0081212520599365} -09/20/2021 22:19:12 - INFO - __main__ - Step 36162: {'lr': 0.00019953647263667112, 'samples': 1157184, 'steps': 2260, 'loss/train': 1.0633231401443481} -09/20/2021 22:19:12 - INFO - __main__ - Step 36163: {'lr': 0.00019953647263667112, 'samples': 1157216, 'steps': 2260, 'loss/train': 1.7964907884597778} -09/20/2021 22:19:13 - INFO - __main__ - Step 36164: {'lr': 0.00019953647263667112, 'samples': 1157248, 'steps': 2260, 'loss/train': 2.0684351921081543} -09/20/2021 22:19:14 - INFO - __main__ - Step 36165: {'lr': 0.00019953647263667112, 'samples': 1157280, 'steps': 2260, 'loss/train': 2.1354126930236816} -09/20/2021 22:19:15 - INFO - __main__ - Step 36166: {'lr': 0.00019953647263667112, 'samples': 1157312, 'steps': 2260, 'loss/train': 2.271963596343994} -09/20/2021 22:19:15 - INFO - __main__ - Step 36167: {'lr': 0.00019953647263667112, 'samples': 1157344, 'steps': 2260, 'loss/train': 1.5416555404663086} -09/20/2021 22:19:16 - INFO - __main__ - Step 36168: {'lr': 0.00019953647263667112, 'samples': 1157376, 'steps': 2260, 'loss/train': 2.0868897438049316} -09/20/2021 22:19:17 - INFO - __main__ - Step 36169: {'lr': 0.00019953647263667112, 'samples': 1157408, 'steps': 2260, 'loss/train': 1.775511622428894} -09/20/2021 22:19:18 - INFO - __main__ - Step 36170: {'lr': 0.00019953647263667112, 'samples': 1157440, 'steps': 2260, 'loss/train': 1.8322926759719849} -09/20/2021 22:19:18 - INFO - __main__ - Step 36171: {'lr': 0.00019953647263667112, 'samples': 1157472, 'steps': 2260, 'loss/train': 2.6246321201324463} -09/20/2021 22:19:19 - INFO - __main__ - Step 36172: {'lr': 0.00019953647263667112, 'samples': 1157504, 'steps': 2260, 'loss/train': 2.6405577659606934} -09/20/2021 22:19:20 - INFO - __main__ - Step 36173: {'lr': 0.00019953647263667112, 'samples': 1157536, 'steps': 2260, 'loss/train': 2.415403127670288} -09/20/2021 22:19:21 - INFO - __main__ - Step 36174: {'lr': 0.00019953647263667112, 'samples': 1157568, 'steps': 2260, 'loss/train': 2.0508921146392822} -09/20/2021 22:19:21 - INFO - __main__ - Step 36175: {'lr': 0.00019953647263667112, 'samples': 1157600, 'steps': 2260, 'loss/train': 2.1494970321655273} -09/20/2021 22:19:22 - INFO - __main__ - Step 36176: {'lr': 0.00019953647263667112, 'samples': 1157632, 'steps': 2260, 'loss/train': 2.4655048847198486} -09/20/2021 22:19:23 - INFO - __main__ - Step 36177: {'lr': 0.00019953585896537686, 'samples': 1157664, 'steps': 2261, 'loss/train': 1.704977035522461} -09/20/2021 22:19:24 - INFO - __main__ - Step 36178: {'lr': 0.00019953585896537686, 'samples': 1157696, 'steps': 2261, 'loss/train': 1.7565443515777588} -09/20/2021 22:19:25 - INFO - __main__ - Step 36179: {'lr': 0.00019953585896537686, 'samples': 1157728, 'steps': 2261, 'loss/train': 3.362797260284424} -09/20/2021 22:19:25 - INFO - __main__ - Step 36180: {'lr': 0.00019953585896537686, 'samples': 1157760, 'steps': 2261, 'loss/train': 6.159788608551025} -09/20/2021 22:19:26 - INFO - __main__ - Step 36181: {'lr': 0.00019953585896537686, 'samples': 1157792, 'steps': 2261, 'loss/train': 2.451934814453125} -09/20/2021 22:19:27 - INFO - __main__ - Step 36182: {'lr': 0.00019953585896537686, 'samples': 1157824, 'steps': 2261, 'loss/train': 2.358036756515503} -09/20/2021 22:19:28 - INFO - __main__ - Step 36183: {'lr': 0.00019953585896537686, 'samples': 1157856, 'steps': 2261, 'loss/train': 1.8945555686950684} -09/20/2021 22:19:29 - INFO - __main__ - Step 36184: {'lr': 0.00019953585896537686, 'samples': 1157888, 'steps': 2261, 'loss/train': 2.641209602355957} -09/20/2021 22:19:30 - INFO - __main__ - Step 36185: {'lr': 0.00019953585896537686, 'samples': 1157920, 'steps': 2261, 'loss/train': 2.273287534713745} -09/20/2021 22:19:30 - INFO - __main__ - Step 36186: {'lr': 0.00019953585896537686, 'samples': 1157952, 'steps': 2261, 'loss/train': 2.5428881645202637} -09/20/2021 22:19:31 - INFO - __main__ - Step 36187: {'lr': 0.00019953585896537686, 'samples': 1157984, 'steps': 2261, 'loss/train': 3.360027551651001} -09/20/2021 22:19:32 - INFO - __main__ - Step 36188: {'lr': 0.00019953585896537686, 'samples': 1158016, 'steps': 2261, 'loss/train': 2.7088069915771484} -09/20/2021 22:19:33 - INFO - __main__ - Step 36189: {'lr': 0.00019953585896537686, 'samples': 1158048, 'steps': 2261, 'loss/train': 2.3037688732147217} -09/20/2021 22:19:33 - INFO - __main__ - Step 36190: {'lr': 0.00019953585896537686, 'samples': 1158080, 'steps': 2261, 'loss/train': 1.6378318071365356} -09/20/2021 22:19:34 - INFO - __main__ - Step 36191: {'lr': 0.00019953585896537686, 'samples': 1158112, 'steps': 2261, 'loss/train': 2.181405782699585} -09/20/2021 22:19:35 - INFO - __main__ - Step 36192: {'lr': 0.00019953585896537686, 'samples': 1158144, 'steps': 2261, 'loss/train': 1.7031720876693726} -09/20/2021 22:19:36 - INFO - __main__ - Step 36193: {'lr': 0.00019953524488907154, 'samples': 1158176, 'steps': 2262, 'loss/train': 1.7415778636932373} -09/20/2021 22:19:37 - INFO - __main__ - Step 36194: {'lr': 0.00019953524488907154, 'samples': 1158208, 'steps': 2262, 'loss/train': 0.8506142497062683} -09/20/2021 22:19:37 - INFO - __main__ - Step 36195: {'lr': 0.00019953524488907154, 'samples': 1158240, 'steps': 2262, 'loss/train': 1.8548156023025513} -09/20/2021 22:19:38 - INFO - __main__ - Step 36196: {'lr': 0.00019953524488907154, 'samples': 1158272, 'steps': 2262, 'loss/train': 2.5220882892608643} -09/20/2021 22:19:39 - INFO - __main__ - Step 36197: {'lr': 0.00019953524488907154, 'samples': 1158304, 'steps': 2262, 'loss/train': 2.2346012592315674} -09/20/2021 22:19:40 - INFO - __main__ - Step 36198: {'lr': 0.00019953524488907154, 'samples': 1158336, 'steps': 2262, 'loss/train': 1.20236074924469} -09/20/2021 22:19:40 - INFO - __main__ - Step 36199: {'lr': 0.00019953524488907154, 'samples': 1158368, 'steps': 2262, 'loss/train': 0.37763068079948425} -09/20/2021 22:19:41 - INFO - __main__ - Step 36200: {'lr': 0.00019953524488907154, 'samples': 1158400, 'steps': 2262, 'loss/train': 2.4216811656951904} -09/20/2021 22:19:42 - INFO - __main__ - Step 36201: {'lr': 0.00019953524488907154, 'samples': 1158432, 'steps': 2262, 'loss/train': 3.093630313873291} -09/20/2021 22:19:43 - INFO - __main__ - Step 36202: {'lr': 0.00019953524488907154, 'samples': 1158464, 'steps': 2262, 'loss/train': 2.1497764587402344} -09/20/2021 22:19:43 - INFO - __main__ - Step 36203: {'lr': 0.00019953524488907154, 'samples': 1158496, 'steps': 2262, 'loss/train': 2.697545051574707} -09/20/2021 22:19:44 - INFO - __main__ - Step 36204: {'lr': 0.00019953524488907154, 'samples': 1158528, 'steps': 2262, 'loss/train': 2.191612482070923} -09/20/2021 22:19:45 - INFO - __main__ - Step 36205: {'lr': 0.00019953524488907154, 'samples': 1158560, 'steps': 2262, 'loss/train': 2.705845355987549} -09/20/2021 22:19:45 - INFO - __main__ - Step 36206: {'lr': 0.00019953524488907154, 'samples': 1158592, 'steps': 2262, 'loss/train': 1.9001173973083496} -09/20/2021 22:19:46 - INFO - __main__ - Step 36207: {'lr': 0.00019953524488907154, 'samples': 1158624, 'steps': 2262, 'loss/train': 2.4330039024353027} -09/20/2021 22:19:47 - INFO - __main__ - Step 36208: {'lr': 0.00019953524488907154, 'samples': 1158656, 'steps': 2262, 'loss/train': 1.814294695854187} -09/20/2021 22:19:48 - INFO - __main__ - Step 36209: {'lr': 0.00019953463040775772, 'samples': 1158688, 'steps': 2263, 'loss/train': 2.3746306896209717} -09/20/2021 22:19:49 - INFO - __main__ - Step 36210: {'lr': 0.00019953463040775772, 'samples': 1158720, 'steps': 2263, 'loss/train': 1.1539002656936646} -09/20/2021 22:19:49 - INFO - __main__ - Step 36211: {'lr': 0.00019953463040775772, 'samples': 1158752, 'steps': 2263, 'loss/train': 0.2435143142938614} -09/20/2021 22:19:50 - INFO - __main__ - Step 36212: {'lr': 0.00019953463040775772, 'samples': 1158784, 'steps': 2263, 'loss/train': 0.1797974407672882} -09/20/2021 22:19:52 - INFO - __main__ - Step 36213: {'lr': 0.00019953463040775772, 'samples': 1158816, 'steps': 2263, 'loss/train': 2.095797061920166} -09/20/2021 22:19:53 - INFO - __main__ - Step 36214: {'lr': 0.00019953463040775772, 'samples': 1158848, 'steps': 2263, 'loss/train': 2.857758045196533} -09/20/2021 22:19:54 - INFO - __main__ - Step 36215: {'lr': 0.00019953463040775772, 'samples': 1158880, 'steps': 2263, 'loss/train': 3.354748010635376} -09/20/2021 22:19:54 - INFO - __main__ - Step 36216: {'lr': 0.00019953463040775772, 'samples': 1158912, 'steps': 2263, 'loss/train': 1.597426176071167} -09/20/2021 22:19:55 - INFO - __main__ - Step 36217: {'lr': 0.00019953463040775772, 'samples': 1158944, 'steps': 2263, 'loss/train': 1.738211750984192} -09/20/2021 22:19:56 - INFO - __main__ - Step 36218: {'lr': 0.00019953463040775772, 'samples': 1158976, 'steps': 2263, 'loss/train': 2.336808443069458} -09/20/2021 22:19:57 - INFO - __main__ - Step 36219: {'lr': 0.00019953463040775772, 'samples': 1159008, 'steps': 2263, 'loss/train': 2.507676124572754} -09/20/2021 22:19:57 - INFO - __main__ - Step 36220: {'lr': 0.00019953463040775772, 'samples': 1159040, 'steps': 2263, 'loss/train': 1.946035623550415} -09/20/2021 22:19:58 - INFO - __main__ - Step 36221: {'lr': 0.00019953463040775772, 'samples': 1159072, 'steps': 2263, 'loss/train': 2.2361936569213867} -09/20/2021 22:19:59 - INFO - __main__ - Step 36222: {'lr': 0.00019953463040775772, 'samples': 1159104, 'steps': 2263, 'loss/train': 2.0294573307037354} -09/20/2021 22:20:00 - INFO - __main__ - Step 36223: {'lr': 0.00019953463040775772, 'samples': 1159136, 'steps': 2263, 'loss/train': 1.9098764657974243} -09/20/2021 22:20:00 - INFO - __main__ - Step 36224: {'lr': 0.00019953463040775772, 'samples': 1159168, 'steps': 2263, 'loss/train': 0.20201508700847626} -09/20/2021 22:20:01 - INFO - __main__ - Step 36225: {'lr': 0.00019953401552143789, 'samples': 1159200, 'steps': 2264, 'loss/train': 0.11178959906101227} -09/20/2021 22:20:02 - INFO - __main__ - Step 36226: {'lr': 0.00019953401552143789, 'samples': 1159232, 'steps': 2264, 'loss/train': 0.29175636172294617} -09/20/2021 22:20:03 - INFO - __main__ - Step 36227: {'lr': 0.00019953401552143789, 'samples': 1159264, 'steps': 2264, 'loss/train': 2.747380256652832} -09/20/2021 22:20:03 - INFO - __main__ - Step 36228: {'lr': 0.00019953401552143789, 'samples': 1159296, 'steps': 2264, 'loss/train': 2.286829948425293} -09/20/2021 22:20:04 - INFO - __main__ - Step 36229: {'lr': 0.00019953401552143789, 'samples': 1159328, 'steps': 2264, 'loss/train': 2.1541028022766113} -09/20/2021 22:20:05 - INFO - __main__ - Step 36230: {'lr': 0.00019953401552143789, 'samples': 1159360, 'steps': 2264, 'loss/train': 2.044167995452881} -09/20/2021 22:20:06 - INFO - __main__ - Step 36231: {'lr': 0.00019953401552143789, 'samples': 1159392, 'steps': 2264, 'loss/train': 1.1615617275238037} -09/20/2021 22:20:06 - INFO - __main__ - Step 36232: {'lr': 0.00019953401552143789, 'samples': 1159424, 'steps': 2264, 'loss/train': 2.032024621963501} -09/20/2021 22:20:07 - INFO - __main__ - Step 36233: {'lr': 0.00019953401552143789, 'samples': 1159456, 'steps': 2264, 'loss/train': 3.243511199951172} -09/20/2021 22:20:08 - INFO - __main__ - Step 36234: {'lr': 0.00019953401552143789, 'samples': 1159488, 'steps': 2264, 'loss/train': 1.8667161464691162} -09/20/2021 22:20:09 - INFO - __main__ - Step 36235: {'lr': 0.00019953401552143789, 'samples': 1159520, 'steps': 2264, 'loss/train': 2.15189266204834} -09/20/2021 22:20:09 - INFO - __main__ - Step 36236: {'lr': 0.00019953401552143789, 'samples': 1159552, 'steps': 2264, 'loss/train': 2.534824848175049} -09/20/2021 22:20:10 - INFO - __main__ - Step 36237: {'lr': 0.00019953401552143789, 'samples': 1159584, 'steps': 2264, 'loss/train': 2.083684206008911} -09/20/2021 22:20:11 - INFO - __main__ - Step 36238: {'lr': 0.00019953401552143789, 'samples': 1159616, 'steps': 2264, 'loss/train': 3.5652408599853516} -09/20/2021 22:20:12 - INFO - __main__ - Step 36239: {'lr': 0.00019953401552143789, 'samples': 1159648, 'steps': 2264, 'loss/train': 3.0052757263183594} -09/20/2021 22:20:12 - INFO - __main__ - Step 36240: {'lr': 0.00019953401552143789, 'samples': 1159680, 'steps': 2264, 'loss/train': 3.517463207244873} -09/20/2021 22:20:13 - INFO - __main__ - Step 36241: {'lr': 0.00019953340023011451, 'samples': 1159712, 'steps': 2265, 'loss/train': 2.1457762718200684} -09/20/2021 22:20:14 - INFO - __main__ - Step 36242: {'lr': 0.00019953340023011451, 'samples': 1159744, 'steps': 2265, 'loss/train': 2.237746000289917} -09/20/2021 22:20:15 - INFO - __main__ - Step 36243: {'lr': 0.00019953340023011451, 'samples': 1159776, 'steps': 2265, 'loss/train': 1.9494141340255737} -09/20/2021 22:20:16 - INFO - __main__ - Step 36244: {'lr': 0.00019953340023011451, 'samples': 1159808, 'steps': 2265, 'loss/train': 2.2666516304016113} -09/20/2021 22:20:17 - INFO - __main__ - Step 36245: {'lr': 0.00019953340023011451, 'samples': 1159840, 'steps': 2265, 'loss/train': 1.9702365398406982} -09/20/2021 22:20:18 - INFO - __main__ - Step 36246: {'lr': 0.00019953340023011451, 'samples': 1159872, 'steps': 2265, 'loss/train': 1.4117268323898315} -09/20/2021 22:20:18 - INFO - __main__ - Step 36247: {'lr': 0.00019953340023011451, 'samples': 1159904, 'steps': 2265, 'loss/train': 2.347166061401367} -09/20/2021 22:20:19 - INFO - __main__ - Step 36248: {'lr': 0.00019953340023011451, 'samples': 1159936, 'steps': 2265, 'loss/train': 3.800462245941162} -09/20/2021 22:20:20 - INFO - __main__ - Step 36249: {'lr': 0.00019953340023011451, 'samples': 1159968, 'steps': 2265, 'loss/train': 2.4029831886291504} -09/20/2021 22:20:21 - INFO - __main__ - Step 36250: {'lr': 0.00019953340023011451, 'samples': 1160000, 'steps': 2265, 'loss/train': 2.3047616481781006} -09/20/2021 22:20:21 - INFO - __main__ - Step 36251: {'lr': 0.00019953340023011451, 'samples': 1160032, 'steps': 2265, 'loss/train': 2.8570072650909424} -09/20/2021 22:20:22 - INFO - __main__ - Step 36252: {'lr': 0.00019953340023011451, 'samples': 1160064, 'steps': 2265, 'loss/train': 2.2088325023651123} -09/20/2021 22:20:23 - INFO - __main__ - Step 36253: {'lr': 0.00019953340023011451, 'samples': 1160096, 'steps': 2265, 'loss/train': 1.304269790649414} -09/20/2021 22:20:24 - INFO - __main__ - Step 36254: {'lr': 0.00019953340023011451, 'samples': 1160128, 'steps': 2265, 'loss/train': 2.4920966625213623} -09/20/2021 22:20:24 - INFO - __main__ - Step 36255: {'lr': 0.00019953340023011451, 'samples': 1160160, 'steps': 2265, 'loss/train': 1.8266438245773315} -09/20/2021 22:20:25 - INFO - __main__ - Step 36256: {'lr': 0.00019953340023011451, 'samples': 1160192, 'steps': 2265, 'loss/train': 2.2476067543029785} -09/20/2021 22:20:26 - INFO - __main__ - Step 36257: {'lr': 0.0001995327845337901, 'samples': 1160224, 'steps': 2266, 'loss/train': 2.7763490676879883} -09/20/2021 22:20:27 - INFO - __main__ - Step 36258: {'lr': 0.0001995327845337901, 'samples': 1160256, 'steps': 2266, 'loss/train': 0.4696868360042572} -09/20/2021 22:20:27 - INFO - __main__ - Step 36259: {'lr': 0.0001995327845337901, 'samples': 1160288, 'steps': 2266, 'loss/train': 2.527005910873413} -09/20/2021 22:20:28 - INFO - __main__ - Step 36260: {'lr': 0.0001995327845337901, 'samples': 1160320, 'steps': 2266, 'loss/train': 1.213718295097351} -09/20/2021 22:20:29 - INFO - __main__ - Step 36261: {'lr': 0.0001995327845337901, 'samples': 1160352, 'steps': 2266, 'loss/train': 1.341446876525879} -09/20/2021 22:20:30 - INFO - __main__ - Step 36262: {'lr': 0.0001995327845337901, 'samples': 1160384, 'steps': 2266, 'loss/train': 2.1021063327789307} -09/20/2021 22:20:30 - INFO - __main__ - Step 36263: {'lr': 0.0001995327845337901, 'samples': 1160416, 'steps': 2266, 'loss/train': 2.703502655029297} -09/20/2021 22:20:31 - INFO - __main__ - Step 36264: {'lr': 0.0001995327845337901, 'samples': 1160448, 'steps': 2266, 'loss/train': 2.025306224822998} -09/20/2021 22:20:32 - INFO - __main__ - Step 36265: {'lr': 0.0001995327845337901, 'samples': 1160480, 'steps': 2266, 'loss/train': 2.2501981258392334} -09/20/2021 22:20:33 - INFO - __main__ - Step 36266: {'lr': 0.0001995327845337901, 'samples': 1160512, 'steps': 2266, 'loss/train': 0.3453409671783447} -09/20/2021 22:20:33 - INFO - __main__ - Step 36267: {'lr': 0.0001995327845337901, 'samples': 1160544, 'steps': 2266, 'loss/train': 3.155503749847412} -09/20/2021 22:20:34 - INFO - __main__ - Step 36268: {'lr': 0.0001995327845337901, 'samples': 1160576, 'steps': 2266, 'loss/train': 2.107008457183838} -09/20/2021 22:20:35 - INFO - __main__ - Step 36269: {'lr': 0.0001995327845337901, 'samples': 1160608, 'steps': 2266, 'loss/train': 1.8231887817382812} -09/20/2021 22:20:36 - INFO - __main__ - Step 36270: {'lr': 0.0001995327845337901, 'samples': 1160640, 'steps': 2266, 'loss/train': 2.3021321296691895} -09/20/2021 22:20:36 - INFO - __main__ - Step 36271: {'lr': 0.0001995327845337901, 'samples': 1160672, 'steps': 2266, 'loss/train': 1.6726934909820557} -09/20/2021 22:20:37 - INFO - __main__ - Step 36272: {'lr': 0.0001995327845337901, 'samples': 1160704, 'steps': 2266, 'loss/train': 2.371570110321045} -09/20/2021 22:20:38 - INFO - __main__ - Step 36273: {'lr': 0.00019953216843246723, 'samples': 1160736, 'steps': 2267, 'loss/train': 3.1094000339508057} -09/20/2021 22:20:39 - INFO - __main__ - Step 36274: {'lr': 0.00019953216843246723, 'samples': 1160768, 'steps': 2267, 'loss/train': 2.6429812908172607} -09/20/2021 22:20:40 - INFO - __main__ - Step 36275: {'lr': 0.00019953216843246723, 'samples': 1160800, 'steps': 2267, 'loss/train': 1.5051630735397339} -09/20/2021 22:20:41 - INFO - __main__ - Step 36276: {'lr': 0.00019953216843246723, 'samples': 1160832, 'steps': 2267, 'loss/train': 1.993700623512268} -09/20/2021 22:20:42 - INFO - __main__ - Step 36277: {'lr': 0.00019953216843246723, 'samples': 1160864, 'steps': 2267, 'loss/train': 1.4642271995544434} -09/20/2021 22:20:42 - INFO - __main__ - Step 36278: {'lr': 0.00019953216843246723, 'samples': 1160896, 'steps': 2267, 'loss/train': 1.5767148733139038} -09/20/2021 22:20:43 - INFO - __main__ - Step 36279: {'lr': 0.00019953216843246723, 'samples': 1160928, 'steps': 2267, 'loss/train': 1.5053863525390625} -09/20/2021 22:20:44 - INFO - __main__ - Step 36280: {'lr': 0.00019953216843246723, 'samples': 1160960, 'steps': 2267, 'loss/train': 1.964728832244873} -09/20/2021 22:20:45 - INFO - __main__ - Step 36281: {'lr': 0.00019953216843246723, 'samples': 1160992, 'steps': 2267, 'loss/train': 2.115588665008545} -09/20/2021 22:20:45 - INFO - __main__ - Step 36282: {'lr': 0.00019953216843246723, 'samples': 1161024, 'steps': 2267, 'loss/train': 2.408903121948242} -09/20/2021 22:20:46 - INFO - __main__ - Step 36283: {'lr': 0.00019953216843246723, 'samples': 1161056, 'steps': 2267, 'loss/train': 2.1045401096343994} -09/20/2021 22:20:47 - INFO - __main__ - Step 36284: {'lr': 0.00019953216843246723, 'samples': 1161088, 'steps': 2267, 'loss/train': 2.47157621383667} -09/20/2021 22:20:48 - INFO - __main__ - Step 36285: {'lr': 0.00019953216843246723, 'samples': 1161120, 'steps': 2267, 'loss/train': 2.665266513824463} -09/20/2021 22:20:48 - INFO - __main__ - Step 36286: {'lr': 0.00019953216843246723, 'samples': 1161152, 'steps': 2267, 'loss/train': 2.3187649250030518} -09/20/2021 22:20:49 - INFO - __main__ - Step 36287: {'lr': 0.00019953216843246723, 'samples': 1161184, 'steps': 2267, 'loss/train': 2.834582805633545} -09/20/2021 22:20:50 - INFO - __main__ - Step 36288: {'lr': 0.00019953216843246723, 'samples': 1161216, 'steps': 2267, 'loss/train': 1.702940821647644} -09/20/2021 22:20:51 - INFO - __main__ - Step 36289: {'lr': 0.0001995315519261483, 'samples': 1161248, 'steps': 2268, 'loss/train': 1.6143362522125244} -09/20/2021 22:20:51 - INFO - __main__ - Step 36290: {'lr': 0.0001995315519261483, 'samples': 1161280, 'steps': 2268, 'loss/train': 3.1752500534057617} -09/20/2021 22:20:52 - INFO - __main__ - Step 36291: {'lr': 0.0001995315519261483, 'samples': 1161312, 'steps': 2268, 'loss/train': 2.313098907470703} -09/20/2021 22:20:53 - INFO - __main__ - Step 36292: {'lr': 0.0001995315519261483, 'samples': 1161344, 'steps': 2268, 'loss/train': 2.0084469318389893} -09/20/2021 22:20:54 - INFO - __main__ - Step 36293: {'lr': 0.0001995315519261483, 'samples': 1161376, 'steps': 2268, 'loss/train': 1.505721926689148} -09/20/2021 22:20:54 - INFO - __main__ - Step 36294: {'lr': 0.0001995315519261483, 'samples': 1161408, 'steps': 2268, 'loss/train': 2.392066717147827} -09/20/2021 22:20:55 - INFO - __main__ - Step 36295: {'lr': 0.0001995315519261483, 'samples': 1161440, 'steps': 2268, 'loss/train': 2.0297441482543945} -09/20/2021 22:20:56 - INFO - __main__ - Step 36296: {'lr': 0.0001995315519261483, 'samples': 1161472, 'steps': 2268, 'loss/train': 2.817976474761963} -09/20/2021 22:20:57 - INFO - __main__ - Step 36297: {'lr': 0.0001995315519261483, 'samples': 1161504, 'steps': 2268, 'loss/train': 2.4934592247009277} -09/20/2021 22:20:57 - INFO - __main__ - Step 36298: {'lr': 0.0001995315519261483, 'samples': 1161536, 'steps': 2268, 'loss/train': 1.7376731634140015} -09/20/2021 22:20:58 - INFO - __main__ - Step 36299: {'lr': 0.0001995315519261483, 'samples': 1161568, 'steps': 2268, 'loss/train': 2.046095848083496} -09/20/2021 22:20:59 - INFO - __main__ - Step 36300: {'lr': 0.0001995315519261483, 'samples': 1161600, 'steps': 2268, 'loss/train': 0.9765685796737671} -09/20/2021 22:21:00 - INFO - __main__ - Step 36301: {'lr': 0.0001995315519261483, 'samples': 1161632, 'steps': 2268, 'loss/train': 2.361020803451538} -09/20/2021 22:21:00 - INFO - __main__ - Step 36302: {'lr': 0.0001995315519261483, 'samples': 1161664, 'steps': 2268, 'loss/train': 2.5014965534210205} -09/20/2021 22:21:01 - INFO - __main__ - Step 36303: {'lr': 0.0001995315519261483, 'samples': 1161696, 'steps': 2268, 'loss/train': 2.1281208992004395} -09/20/2021 22:21:02 - INFO - __main__ - Step 36304: {'lr': 0.0001995315519261483, 'samples': 1161728, 'steps': 2268, 'loss/train': 2.171207904815674} -09/20/2021 22:21:03 - INFO - __main__ - Step 36305: {'lr': 0.0001995309350148359, 'samples': 1161760, 'steps': 2269, 'loss/train': 2.3054285049438477} -09/20/2021 22:21:04 - INFO - __main__ - Step 36306: {'lr': 0.0001995309350148359, 'samples': 1161792, 'steps': 2269, 'loss/train': 3.351832628250122} -09/20/2021 22:21:05 - INFO - __main__ - Step 36307: {'lr': 0.0001995309350148359, 'samples': 1161824, 'steps': 2269, 'loss/train': 4.49137544631958} -09/20/2021 22:21:06 - INFO - __main__ - Step 36308: {'lr': 0.0001995309350148359, 'samples': 1161856, 'steps': 2269, 'loss/train': 2.991304397583008} -09/20/2021 22:21:06 - INFO - __main__ - Step 36309: {'lr': 0.0001995309350148359, 'samples': 1161888, 'steps': 2269, 'loss/train': 2.4519941806793213} -09/20/2021 22:21:07 - INFO - __main__ - Step 36310: {'lr': 0.0001995309350148359, 'samples': 1161920, 'steps': 2269, 'loss/train': 2.228062152862549} -09/20/2021 22:21:08 - INFO - __main__ - Step 36311: {'lr': 0.0001995309350148359, 'samples': 1161952, 'steps': 2269, 'loss/train': 2.3897323608398438} -09/20/2021 22:21:09 - INFO - __main__ - Step 36312: {'lr': 0.0001995309350148359, 'samples': 1161984, 'steps': 2269, 'loss/train': 1.9837913513183594} -09/20/2021 22:21:09 - INFO - __main__ - Step 36313: {'lr': 0.0001995309350148359, 'samples': 1162016, 'steps': 2269, 'loss/train': 2.679518222808838} -09/20/2021 22:21:10 - INFO - __main__ - Step 36314: {'lr': 0.0001995309350148359, 'samples': 1162048, 'steps': 2269, 'loss/train': 2.695957899093628} -09/20/2021 22:21:11 - INFO - __main__ - Step 36315: {'lr': 0.0001995309350148359, 'samples': 1162080, 'steps': 2269, 'loss/train': 1.533138632774353} -09/20/2021 22:21:12 - INFO - __main__ - Step 36316: {'lr': 0.0001995309350148359, 'samples': 1162112, 'steps': 2269, 'loss/train': 1.5618089437484741} -09/20/2021 22:21:12 - INFO - __main__ - Step 36317: {'lr': 0.0001995309350148359, 'samples': 1162144, 'steps': 2269, 'loss/train': 2.307015895843506} -09/20/2021 22:21:13 - INFO - __main__ - Step 36318: {'lr': 0.0001995309350148359, 'samples': 1162176, 'steps': 2269, 'loss/train': 1.8870184421539307} -09/20/2021 22:21:14 - INFO - __main__ - Step 36319: {'lr': 0.0001995309350148359, 'samples': 1162208, 'steps': 2269, 'loss/train': 1.3749914169311523} -09/20/2021 22:21:15 - INFO - __main__ - Step 36320: {'lr': 0.0001995309350148359, 'samples': 1162240, 'steps': 2269, 'loss/train': 2.62203311920166} -09/20/2021 22:21:15 - INFO - __main__ - Step 36321: {'lr': 0.0001995303176985325, 'samples': 1162272, 'steps': 2270, 'loss/train': 2.9563987255096436} -09/20/2021 22:21:16 - INFO - __main__ - Step 36322: {'lr': 0.0001995303176985325, 'samples': 1162304, 'steps': 2270, 'loss/train': 3.0621676445007324} -09/20/2021 22:21:17 - INFO - __main__ - Step 36323: {'lr': 0.0001995303176985325, 'samples': 1162336, 'steps': 2270, 'loss/train': 2.3715145587921143} -09/20/2021 22:21:18 - INFO - __main__ - Step 36324: {'lr': 0.0001995303176985325, 'samples': 1162368, 'steps': 2270, 'loss/train': 1.9783434867858887} -09/20/2021 22:21:18 - INFO - __main__ - Step 36325: {'lr': 0.0001995303176985325, 'samples': 1162400, 'steps': 2270, 'loss/train': 2.3553223609924316} -09/20/2021 22:21:19 - INFO - __main__ - Step 36326: {'lr': 0.0001995303176985325, 'samples': 1162432, 'steps': 2270, 'loss/train': 2.1212215423583984} -09/20/2021 22:21:20 - INFO - __main__ - Step 36327: {'lr': 0.0001995303176985325, 'samples': 1162464, 'steps': 2270, 'loss/train': 3.0320589542388916} -09/20/2021 22:21:21 - INFO - __main__ - Step 36328: {'lr': 0.0001995303176985325, 'samples': 1162496, 'steps': 2270, 'loss/train': 2.6609065532684326} -09/20/2021 22:21:21 - INFO - __main__ - Step 36329: {'lr': 0.0001995303176985325, 'samples': 1162528, 'steps': 2270, 'loss/train': 2.513988494873047} -09/20/2021 22:21:22 - INFO - __main__ - Step 36330: {'lr': 0.0001995303176985325, 'samples': 1162560, 'steps': 2270, 'loss/train': 2.3751327991485596} -09/20/2021 22:21:23 - INFO - __main__ - Step 36331: {'lr': 0.0001995303176985325, 'samples': 1162592, 'steps': 2270, 'loss/train': 1.637293815612793} -09/20/2021 22:21:24 - INFO - __main__ - Step 36332: {'lr': 0.0001995303176985325, 'samples': 1162624, 'steps': 2270, 'loss/train': 2.712991714477539} -09/20/2021 22:21:24 - INFO - __main__ - Step 36333: {'lr': 0.0001995303176985325, 'samples': 1162656, 'steps': 2270, 'loss/train': 0.5045160055160522} -09/20/2021 22:21:25 - INFO - __main__ - Step 36334: {'lr': 0.0001995303176985325, 'samples': 1162688, 'steps': 2270, 'loss/train': 1.3124622106552124} -09/20/2021 22:21:26 - INFO - __main__ - Step 36335: {'lr': 0.0001995303176985325, 'samples': 1162720, 'steps': 2270, 'loss/train': 2.751887321472168} -09/20/2021 22:21:27 - INFO - __main__ - Step 36336: {'lr': 0.0001995303176985325, 'samples': 1162752, 'steps': 2270, 'loss/train': 1.2022312879562378} -09/20/2021 22:21:28 - INFO - __main__ - Step 36337: {'lr': 0.00019952969997724063, 'samples': 1162784, 'steps': 2271, 'loss/train': 2.323395252227783} -09/20/2021 22:21:29 - INFO - __main__ - Step 36338: {'lr': 0.00019952969997724063, 'samples': 1162816, 'steps': 2271, 'loss/train': 1.8118559122085571} -09/20/2021 22:21:30 - INFO - __main__ - Step 36339: {'lr': 0.00019952969997724063, 'samples': 1162848, 'steps': 2271, 'loss/train': 1.9213536977767944} -09/20/2021 22:21:30 - INFO - __main__ - Step 36340: {'lr': 0.00019952969997724063, 'samples': 1162880, 'steps': 2271, 'loss/train': 1.2521297931671143} -09/20/2021 22:21:31 - INFO - __main__ - Step 36341: {'lr': 0.00019952969997724063, 'samples': 1162912, 'steps': 2271, 'loss/train': 1.6500210762023926} -09/20/2021 22:21:32 - INFO - __main__ - Step 36342: {'lr': 0.00019952969997724063, 'samples': 1162944, 'steps': 2271, 'loss/train': 2.8895161151885986} -09/20/2021 22:21:33 - INFO - __main__ - Step 36343: {'lr': 0.00019952969997724063, 'samples': 1162976, 'steps': 2271, 'loss/train': 2.6054935455322266} -09/20/2021 22:21:33 - INFO - __main__ - Step 36344: {'lr': 0.00019952969997724063, 'samples': 1163008, 'steps': 2271, 'loss/train': 1.933394193649292} -09/20/2021 22:21:34 - INFO - __main__ - Step 36345: {'lr': 0.00019952969997724063, 'samples': 1163040, 'steps': 2271, 'loss/train': 3.6959683895111084} -09/20/2021 22:21:35 - INFO - __main__ - Step 36346: {'lr': 0.00019952969997724063, 'samples': 1163072, 'steps': 2271, 'loss/train': 1.8849269151687622} -09/20/2021 22:21:36 - INFO - __main__ - Step 36347: {'lr': 0.00019952969997724063, 'samples': 1163104, 'steps': 2271, 'loss/train': 1.6828197240829468} -09/20/2021 22:21:36 - INFO - __main__ - Step 36348: {'lr': 0.00019952969997724063, 'samples': 1163136, 'steps': 2271, 'loss/train': 2.0258800983428955} -09/20/2021 22:21:37 - INFO - __main__ - Step 36349: {'lr': 0.00019952969997724063, 'samples': 1163168, 'steps': 2271, 'loss/train': 1.7974340915679932} -09/20/2021 22:21:38 - INFO - __main__ - Step 36350: {'lr': 0.00019952969997724063, 'samples': 1163200, 'steps': 2271, 'loss/train': 1.8241760730743408} -09/20/2021 22:21:39 - INFO - __main__ - Step 36351: {'lr': 0.00019952969997724063, 'samples': 1163232, 'steps': 2271, 'loss/train': 1.8546611070632935} -09/20/2021 22:21:39 - INFO - __main__ - Step 36352: {'lr': 0.00019952969997724063, 'samples': 1163264, 'steps': 2271, 'loss/train': 2.8919036388397217} -09/20/2021 22:21:40 - INFO - __main__ - Step 36353: {'lr': 0.0001995290818509628, 'samples': 1163296, 'steps': 2272, 'loss/train': 1.9773889780044556} -09/20/2021 22:21:41 - INFO - __main__ - Step 36354: {'lr': 0.0001995290818509628, 'samples': 1163328, 'steps': 2272, 'loss/train': 2.0659375190734863} -09/20/2021 22:21:42 - INFO - __main__ - Step 36355: {'lr': 0.0001995290818509628, 'samples': 1163360, 'steps': 2272, 'loss/train': 3.1712372303009033} -09/20/2021 22:21:43 - INFO - __main__ - Step 36356: {'lr': 0.0001995290818509628, 'samples': 1163392, 'steps': 2272, 'loss/train': 1.3444099426269531} -09/20/2021 22:21:43 - INFO - __main__ - Step 36357: {'lr': 0.0001995290818509628, 'samples': 1163424, 'steps': 2272, 'loss/train': 1.2983838319778442} -09/20/2021 22:21:44 - INFO - __main__ - Step 36358: {'lr': 0.0001995290818509628, 'samples': 1163456, 'steps': 2272, 'loss/train': 1.3236910104751587} -09/20/2021 22:21:45 - INFO - __main__ - Step 36359: {'lr': 0.0001995290818509628, 'samples': 1163488, 'steps': 2272, 'loss/train': 2.8523590564727783} -09/20/2021 22:21:46 - INFO - __main__ - Step 36360: {'lr': 0.0001995290818509628, 'samples': 1163520, 'steps': 2272, 'loss/train': 2.796072006225586} -09/20/2021 22:21:46 - INFO - __main__ - Step 36361: {'lr': 0.0001995290818509628, 'samples': 1163552, 'steps': 2272, 'loss/train': 1.7501420974731445} -09/20/2021 22:21:47 - INFO - __main__ - Step 36362: {'lr': 0.0001995290818509628, 'samples': 1163584, 'steps': 2272, 'loss/train': 1.6144616603851318} -09/20/2021 22:21:48 - INFO - __main__ - Step 36363: {'lr': 0.0001995290818509628, 'samples': 1163616, 'steps': 2272, 'loss/train': 2.4905662536621094} -09/20/2021 22:21:49 - INFO - __main__ - Step 36364: {'lr': 0.0001995290818509628, 'samples': 1163648, 'steps': 2272, 'loss/train': 1.8801791667938232} -09/20/2021 22:21:49 - INFO - __main__ - Step 36365: {'lr': 0.0001995290818509628, 'samples': 1163680, 'steps': 2272, 'loss/train': 3.2015116214752197} -09/20/2021 22:21:51 - INFO - __main__ - Step 36366: {'lr': 0.0001995290818509628, 'samples': 1163712, 'steps': 2272, 'loss/train': 1.761014461517334} -09/20/2021 22:21:52 - INFO - __main__ - Step 36367: {'lr': 0.0001995290818509628, 'samples': 1163744, 'steps': 2272, 'loss/train': 2.1147255897521973} -09/20/2021 22:21:52 - INFO - __main__ - Step 36368: {'lr': 0.0001995290818509628, 'samples': 1163776, 'steps': 2272, 'loss/train': 1.8122228384017944} -09/20/2021 22:21:53 - INFO - __main__ - Step 36369: {'lr': 0.0001995284633197015, 'samples': 1163808, 'steps': 2273, 'loss/train': 2.5544631481170654} -09/20/2021 22:21:54 - INFO - __main__ - Step 36370: {'lr': 0.0001995284633197015, 'samples': 1163840, 'steps': 2273, 'loss/train': 2.751460075378418} -09/20/2021 22:21:55 - INFO - __main__ - Step 36371: {'lr': 0.0001995284633197015, 'samples': 1163872, 'steps': 2273, 'loss/train': 3.038198471069336} -09/20/2021 22:21:55 - INFO - __main__ - Step 36372: {'lr': 0.0001995284633197015, 'samples': 1163904, 'steps': 2273, 'loss/train': 2.0789690017700195} -09/20/2021 22:21:56 - INFO - __main__ - Step 36373: {'lr': 0.0001995284633197015, 'samples': 1163936, 'steps': 2273, 'loss/train': 2.3714137077331543} -09/20/2021 22:21:57 - INFO - __main__ - Step 36374: {'lr': 0.0001995284633197015, 'samples': 1163968, 'steps': 2273, 'loss/train': 3.3620662689208984} -09/20/2021 22:21:58 - INFO - __main__ - Step 36375: {'lr': 0.0001995284633197015, 'samples': 1164000, 'steps': 2273, 'loss/train': 2.65244722366333} -09/20/2021 22:21:58 - INFO - __main__ - Step 36376: {'lr': 0.0001995284633197015, 'samples': 1164032, 'steps': 2273, 'loss/train': 0.48599138855934143} -09/20/2021 22:21:59 - INFO - __main__ - Step 36377: {'lr': 0.0001995284633197015, 'samples': 1164064, 'steps': 2273, 'loss/train': 1.9106656312942505} -09/20/2021 22:22:00 - INFO - __main__ - Step 36378: {'lr': 0.0001995284633197015, 'samples': 1164096, 'steps': 2273, 'loss/train': 1.674284815788269} -09/20/2021 22:22:01 - INFO - __main__ - Step 36379: {'lr': 0.0001995284633197015, 'samples': 1164128, 'steps': 2273, 'loss/train': 1.9167217016220093} -09/20/2021 22:22:01 - INFO - __main__ - Step 36380: {'lr': 0.0001995284633197015, 'samples': 1164160, 'steps': 2273, 'loss/train': 2.3779220581054688} -09/20/2021 22:22:02 - INFO - __main__ - Step 36381: {'lr': 0.0001995284633197015, 'samples': 1164192, 'steps': 2273, 'loss/train': 2.2936534881591797} -09/20/2021 22:22:03 - INFO - __main__ - Step 36382: {'lr': 0.0001995284633197015, 'samples': 1164224, 'steps': 2273, 'loss/train': 2.0694475173950195} -09/20/2021 22:22:04 - INFO - __main__ - Step 36383: {'lr': 0.0001995284633197015, 'samples': 1164256, 'steps': 2273, 'loss/train': 2.3778460025787354} -09/20/2021 22:22:04 - INFO - __main__ - Step 36384: {'lr': 0.0001995284633197015, 'samples': 1164288, 'steps': 2273, 'loss/train': 2.053579092025757} -09/20/2021 22:22:05 - INFO - __main__ - Step 36385: {'lr': 0.0001995278443834593, 'samples': 1164320, 'steps': 2274, 'loss/train': 2.9385313987731934} -09/20/2021 22:22:06 - INFO - __main__ - Step 36386: {'lr': 0.0001995278443834593, 'samples': 1164352, 'steps': 2274, 'loss/train': 1.8729069232940674} -09/20/2021 22:22:07 - INFO - __main__ - Step 36387: {'lr': 0.0001995278443834593, 'samples': 1164384, 'steps': 2274, 'loss/train': 6.1213812828063965} -09/20/2021 22:22:08 - INFO - __main__ - Step 36388: {'lr': 0.0001995278443834593, 'samples': 1164416, 'steps': 2274, 'loss/train': 2.9842758178710938} -09/20/2021 22:22:08 - INFO - __main__ - Step 36389: {'lr': 0.0001995278443834593, 'samples': 1164448, 'steps': 2274, 'loss/train': 1.8174915313720703} -09/20/2021 22:22:09 - INFO - __main__ - Step 36390: {'lr': 0.0001995278443834593, 'samples': 1164480, 'steps': 2274, 'loss/train': 3.3606038093566895} -09/20/2021 22:22:10 - INFO - __main__ - Step 36391: {'lr': 0.0001995278443834593, 'samples': 1164512, 'steps': 2274, 'loss/train': 2.6200976371765137} -09/20/2021 22:22:11 - INFO - __main__ - Step 36392: {'lr': 0.0001995278443834593, 'samples': 1164544, 'steps': 2274, 'loss/train': 2.0229644775390625} -09/20/2021 22:22:11 - INFO - __main__ - Step 36393: {'lr': 0.0001995278443834593, 'samples': 1164576, 'steps': 2274, 'loss/train': 4.2891435623168945} -09/20/2021 22:22:12 - INFO - __main__ - Step 36394: {'lr': 0.0001995278443834593, 'samples': 1164608, 'steps': 2274, 'loss/train': 3.5268354415893555} -09/20/2021 22:22:13 - INFO - __main__ - Step 36395: {'lr': 0.0001995278443834593, 'samples': 1164640, 'steps': 2274, 'loss/train': 3.757615804672241} -09/20/2021 22:22:14 - INFO - __main__ - Step 36396: {'lr': 0.0001995278443834593, 'samples': 1164672, 'steps': 2274, 'loss/train': 3.4240410327911377} -09/20/2021 22:22:14 - INFO - __main__ - Step 36397: {'lr': 0.0001995278443834593, 'samples': 1164704, 'steps': 2274, 'loss/train': 1.957135796546936} -09/20/2021 22:22:15 - INFO - __main__ - Step 36398: {'lr': 0.0001995278443834593, 'samples': 1164736, 'steps': 2274, 'loss/train': 2.0776829719543457} -09/20/2021 22:22:16 - INFO - __main__ - Step 36399: {'lr': 0.0001995278443834593, 'samples': 1164768, 'steps': 2274, 'loss/train': 1.7965903282165527} -09/20/2021 22:22:17 - INFO - __main__ - Step 36400: {'lr': 0.0001995278443834593, 'samples': 1164800, 'steps': 2274, 'loss/train': 2.5427539348602295} -09/20/2021 22:22:18 - INFO - __main__ - Step 36401: {'lr': 0.00019952722504223866, 'samples': 1164832, 'steps': 2275, 'loss/train': 2.3119614124298096} -09/20/2021 22:22:19 - INFO - __main__ - Step 36402: {'lr': 0.00019952722504223866, 'samples': 1164864, 'steps': 2275, 'loss/train': 2.7840397357940674} -09/20/2021 22:22:19 - INFO - __main__ - Step 36403: {'lr': 0.00019952722504223866, 'samples': 1164896, 'steps': 2275, 'loss/train': 2.3354060649871826} -09/20/2021 22:22:20 - INFO - __main__ - Step 36404: {'lr': 0.00019952722504223866, 'samples': 1164928, 'steps': 2275, 'loss/train': 2.161641836166382} -09/20/2021 22:22:21 - INFO - __main__ - Step 36405: {'lr': 0.00019952722504223866, 'samples': 1164960, 'steps': 2275, 'loss/train': 2.431220531463623} -09/20/2021 22:22:22 - INFO - __main__ - Step 36406: {'lr': 0.00019952722504223866, 'samples': 1164992, 'steps': 2275, 'loss/train': 2.4625425338745117} -09/20/2021 22:22:22 - INFO - __main__ - Step 36407: {'lr': 0.00019952722504223866, 'samples': 1165024, 'steps': 2275, 'loss/train': 1.792759895324707} -09/20/2021 22:22:23 - INFO - __main__ - Step 36408: {'lr': 0.00019952722504223866, 'samples': 1165056, 'steps': 2275, 'loss/train': 1.8535783290863037} -09/20/2021 22:22:24 - INFO - __main__ - Step 36409: {'lr': 0.00019952722504223866, 'samples': 1165088, 'steps': 2275, 'loss/train': 2.129269599914551} -09/20/2021 22:22:25 - INFO - __main__ - Step 36410: {'lr': 0.00019952722504223866, 'samples': 1165120, 'steps': 2275, 'loss/train': 1.7283010482788086} -09/20/2021 22:22:25 - INFO - __main__ - Step 36411: {'lr': 0.00019952722504223866, 'samples': 1165152, 'steps': 2275, 'loss/train': 2.7736244201660156} -09/20/2021 22:22:26 - INFO - __main__ - Step 36412: {'lr': 0.00019952722504223866, 'samples': 1165184, 'steps': 2275, 'loss/train': 2.864224910736084} -09/20/2021 22:22:27 - INFO - __main__ - Step 36413: {'lr': 0.00019952722504223866, 'samples': 1165216, 'steps': 2275, 'loss/train': 2.2138354778289795} -09/20/2021 22:22:28 - INFO - __main__ - Step 36414: {'lr': 0.00019952722504223866, 'samples': 1165248, 'steps': 2275, 'loss/train': 2.2941970825195312} -09/20/2021 22:22:28 - INFO - __main__ - Step 36415: {'lr': 0.00019952722504223866, 'samples': 1165280, 'steps': 2275, 'loss/train': 2.0896477699279785} -09/20/2021 22:22:29 - INFO - __main__ - Step 36416: {'lr': 0.00019952722504223866, 'samples': 1165312, 'steps': 2275, 'loss/train': 1.8285804986953735} -09/20/2021 22:22:30 - INFO - __main__ - Step 36417: {'lr': 0.00019952660529604216, 'samples': 1165344, 'steps': 2276, 'loss/train': 2.2750837802886963} -09/20/2021 22:22:31 - INFO - __main__ - Step 36418: {'lr': 0.00019952660529604216, 'samples': 1165376, 'steps': 2276, 'loss/train': 2.2754647731781006} -09/20/2021 22:22:32 - INFO - __main__ - Step 36419: {'lr': 0.00019952660529604216, 'samples': 1165408, 'steps': 2276, 'loss/train': 1.0717657804489136} -09/20/2021 22:22:32 - INFO - __main__ - Step 36420: {'lr': 0.00019952660529604216, 'samples': 1165440, 'steps': 2276, 'loss/train': 1.6877597570419312} -09/20/2021 22:22:33 - INFO - __main__ - Step 36421: {'lr': 0.00019952660529604216, 'samples': 1165472, 'steps': 2276, 'loss/train': 2.54358172416687} -09/20/2021 22:22:34 - INFO - __main__ - Step 36422: {'lr': 0.00019952660529604216, 'samples': 1165504, 'steps': 2276, 'loss/train': 2.0241661071777344} -09/20/2021 22:22:35 - INFO - __main__ - Step 36423: {'lr': 0.00019952660529604216, 'samples': 1165536, 'steps': 2276, 'loss/train': 1.6419897079467773} -09/20/2021 22:22:35 - INFO - __main__ - Step 36424: {'lr': 0.00019952660529604216, 'samples': 1165568, 'steps': 2276, 'loss/train': 2.3978590965270996} -09/20/2021 22:22:36 - INFO - __main__ - Step 36425: {'lr': 0.00019952660529604216, 'samples': 1165600, 'steps': 2276, 'loss/train': 2.2424542903900146} -09/20/2021 22:22:37 - INFO - __main__ - Step 36426: {'lr': 0.00019952660529604216, 'samples': 1165632, 'steps': 2276, 'loss/train': 4.316222667694092} -09/20/2021 22:22:38 - INFO - __main__ - Step 36427: {'lr': 0.00019952660529604216, 'samples': 1165664, 'steps': 2276, 'loss/train': 2.170358180999756} -09/20/2021 22:22:38 - INFO - __main__ - Step 36428: {'lr': 0.00019952660529604216, 'samples': 1165696, 'steps': 2276, 'loss/train': 2.2688708305358887} -09/20/2021 22:22:40 - INFO - __main__ - Step 36429: {'lr': 0.00019952660529604216, 'samples': 1165728, 'steps': 2276, 'loss/train': 2.9035167694091797} -09/20/2021 22:22:40 - INFO - __main__ - Step 36430: {'lr': 0.00019952660529604216, 'samples': 1165760, 'steps': 2276, 'loss/train': 3.227285623550415} -09/20/2021 22:22:41 - INFO - __main__ - Step 36431: {'lr': 0.00019952660529604216, 'samples': 1165792, 'steps': 2276, 'loss/train': 2.614816904067993} -09/20/2021 22:22:42 - INFO - __main__ - Step 36432: {'lr': 0.00019952660529604216, 'samples': 1165824, 'steps': 2276, 'loss/train': 2.1337156295776367} -09/20/2021 22:22:43 - INFO - __main__ - Step 36433: {'lr': 0.00019952598514487227, 'samples': 1165856, 'steps': 2277, 'loss/train': 2.461585521697998} -09/20/2021 22:22:43 - INFO - __main__ - Step 36434: {'lr': 0.00019952598514487227, 'samples': 1165888, 'steps': 2277, 'loss/train': 2.9337589740753174} -09/20/2021 22:22:44 - INFO - __main__ - Step 36435: {'lr': 0.00019952598514487227, 'samples': 1165920, 'steps': 2277, 'loss/train': 2.05377197265625} -09/20/2021 22:22:45 - INFO - __main__ - Step 36436: {'lr': 0.00019952598514487227, 'samples': 1165952, 'steps': 2277, 'loss/train': 1.2523075342178345} -09/20/2021 22:22:46 - INFO - __main__ - Step 36437: {'lr': 0.00019952598514487227, 'samples': 1165984, 'steps': 2277, 'loss/train': 2.0828676223754883} -09/20/2021 22:22:46 - INFO - __main__ - Step 36438: {'lr': 0.00019952598514487227, 'samples': 1166016, 'steps': 2277, 'loss/train': 2.212956428527832} -09/20/2021 22:22:47 - INFO - __main__ - Step 36439: {'lr': 0.00019952598514487227, 'samples': 1166048, 'steps': 2277, 'loss/train': 1.789466142654419} -09/20/2021 22:22:48 - INFO - __main__ - Step 36440: {'lr': 0.00019952598514487227, 'samples': 1166080, 'steps': 2277, 'loss/train': 2.088043689727783} -09/20/2021 22:22:49 - INFO - __main__ - Step 36441: {'lr': 0.00019952598514487227, 'samples': 1166112, 'steps': 2277, 'loss/train': 2.564303398132324} -09/20/2021 22:22:49 - INFO - __main__ - Step 36442: {'lr': 0.00019952598514487227, 'samples': 1166144, 'steps': 2277, 'loss/train': 2.266721248626709} -09/20/2021 22:22:50 - INFO - __main__ - Step 36443: {'lr': 0.00019952598514487227, 'samples': 1166176, 'steps': 2277, 'loss/train': 0.9055644273757935} -09/20/2021 22:22:51 - INFO - __main__ - Step 36444: {'lr': 0.00019952598514487227, 'samples': 1166208, 'steps': 2277, 'loss/train': 2.3188390731811523} -09/20/2021 22:22:52 - INFO - __main__ - Step 36445: {'lr': 0.00019952598514487227, 'samples': 1166240, 'steps': 2277, 'loss/train': 3.119535446166992} -09/20/2021 22:22:52 - INFO - __main__ - Step 36446: {'lr': 0.00019952598514487227, 'samples': 1166272, 'steps': 2277, 'loss/train': 1.875491738319397} -09/20/2021 22:22:53 - INFO - __main__ - Step 36447: {'lr': 0.00019952598514487227, 'samples': 1166304, 'steps': 2277, 'loss/train': 2.4128520488739014} -09/20/2021 22:22:54 - INFO - __main__ - Step 36448: {'lr': 0.00019952598514487227, 'samples': 1166336, 'steps': 2277, 'loss/train': 2.456970453262329} -09/20/2021 22:22:55 - INFO - __main__ - Step 36449: {'lr': 0.00019952536458873153, 'samples': 1166368, 'steps': 2278, 'loss/train': 1.7143268585205078} -09/20/2021 22:22:56 - INFO - __main__ - Step 36450: {'lr': 0.00019952536458873153, 'samples': 1166400, 'steps': 2278, 'loss/train': 2.5165319442749023} -09/20/2021 22:22:56 - INFO - __main__ - Step 36451: {'lr': 0.00019952536458873153, 'samples': 1166432, 'steps': 2278, 'loss/train': 1.0100687742233276} -09/20/2021 22:22:57 - INFO - __main__ - Step 36452: {'lr': 0.00019952536458873153, 'samples': 1166464, 'steps': 2278, 'loss/train': 1.082865595817566} -09/20/2021 22:22:58 - INFO - __main__ - Step 36453: {'lr': 0.00019952536458873153, 'samples': 1166496, 'steps': 2278, 'loss/train': 2.455362558364868} -09/20/2021 22:22:59 - INFO - __main__ - Step 36454: {'lr': 0.00019952536458873153, 'samples': 1166528, 'steps': 2278, 'loss/train': 0.23814111948013306} -09/20/2021 22:22:59 - INFO - __main__ - Step 36455: {'lr': 0.00019952536458873153, 'samples': 1166560, 'steps': 2278, 'loss/train': 2.3232314586639404} -09/20/2021 22:23:00 - INFO - __main__ - Step 36456: {'lr': 0.00019952536458873153, 'samples': 1166592, 'steps': 2278, 'loss/train': 2.2412095069885254} -09/20/2021 22:23:01 - INFO - __main__ - Step 36457: {'lr': 0.00019952536458873153, 'samples': 1166624, 'steps': 2278, 'loss/train': 1.3800386190414429} -09/20/2021 22:23:02 - INFO - __main__ - Step 36458: {'lr': 0.00019952536458873153, 'samples': 1166656, 'steps': 2278, 'loss/train': 1.8911923170089722} -09/20/2021 22:23:02 - INFO - __main__ - Step 36459: {'lr': 0.00019952536458873153, 'samples': 1166688, 'steps': 2278, 'loss/train': 1.0314007997512817} -09/20/2021 22:23:04 - INFO - __main__ - Step 36460: {'lr': 0.00019952536458873153, 'samples': 1166720, 'steps': 2278, 'loss/train': 2.1176369190216064} -09/20/2021 22:23:04 - INFO - __main__ - Step 36461: {'lr': 0.00019952536458873153, 'samples': 1166752, 'steps': 2278, 'loss/train': 2.3795218467712402} -09/20/2021 22:23:05 - INFO - __main__ - Step 36462: {'lr': 0.00019952536458873153, 'samples': 1166784, 'steps': 2278, 'loss/train': 3.059208631515503} -09/20/2021 22:23:06 - INFO - __main__ - Step 36463: {'lr': 0.00019952536458873153, 'samples': 1166816, 'steps': 2278, 'loss/train': 2.5326719284057617} -09/20/2021 22:23:07 - INFO - __main__ - Step 36464: {'lr': 0.00019952536458873153, 'samples': 1166848, 'steps': 2278, 'loss/train': 2.5362093448638916} -09/20/2021 22:23:08 - INFO - __main__ - Step 36465: {'lr': 0.00019952474362762245, 'samples': 1166880, 'steps': 2279, 'loss/train': 1.7665910720825195} -09/20/2021 22:23:08 - INFO - __main__ - Step 36466: {'lr': 0.00019952474362762245, 'samples': 1166912, 'steps': 2279, 'loss/train': 1.9748220443725586} -09/20/2021 22:23:09 - INFO - __main__ - Step 36467: {'lr': 0.00019952474362762245, 'samples': 1166944, 'steps': 2279, 'loss/train': 2.5661778450012207} -09/20/2021 22:23:10 - INFO - __main__ - Step 36468: {'lr': 0.00019952474362762245, 'samples': 1166976, 'steps': 2279, 'loss/train': 2.0548009872436523} -09/20/2021 22:23:11 - INFO - __main__ - Step 36469: {'lr': 0.00019952474362762245, 'samples': 1167008, 'steps': 2279, 'loss/train': 2.3878653049468994} -09/20/2021 22:23:11 - INFO - __main__ - Step 36470: {'lr': 0.00019952474362762245, 'samples': 1167040, 'steps': 2279, 'loss/train': 1.5426617860794067} -09/20/2021 22:23:12 - INFO - __main__ - Step 36471: {'lr': 0.00019952474362762245, 'samples': 1167072, 'steps': 2279, 'loss/train': 2.5395779609680176} -09/20/2021 22:23:13 - INFO - __main__ - Step 36472: {'lr': 0.00019952474362762245, 'samples': 1167104, 'steps': 2279, 'loss/train': 0.7323537468910217} -09/20/2021 22:23:14 - INFO - __main__ - Step 36473: {'lr': 0.00019952474362762245, 'samples': 1167136, 'steps': 2279, 'loss/train': 3.507233142852783} -09/20/2021 22:23:14 - INFO - __main__ - Step 36474: {'lr': 0.00019952474362762245, 'samples': 1167168, 'steps': 2279, 'loss/train': 1.7572054862976074} -09/20/2021 22:23:15 - INFO - __main__ - Step 36475: {'lr': 0.00019952474362762245, 'samples': 1167200, 'steps': 2279, 'loss/train': 1.8870691061019897} -09/20/2021 22:23:16 - INFO - __main__ - Step 36476: {'lr': 0.00019952474362762245, 'samples': 1167232, 'steps': 2279, 'loss/train': 2.324847459793091} -09/20/2021 22:23:17 - INFO - __main__ - Step 36477: {'lr': 0.00019952474362762245, 'samples': 1167264, 'steps': 2279, 'loss/train': 2.431627035140991} -09/20/2021 22:23:17 - INFO - __main__ - Step 36478: {'lr': 0.00019952474362762245, 'samples': 1167296, 'steps': 2279, 'loss/train': 1.943352460861206} -09/20/2021 22:23:18 - INFO - __main__ - Step 36479: {'lr': 0.00019952474362762245, 'samples': 1167328, 'steps': 2279, 'loss/train': 0.4824930429458618} -09/20/2021 22:23:19 - INFO - __main__ - Step 36480: {'lr': 0.00019952474362762245, 'samples': 1167360, 'steps': 2279, 'loss/train': 1.3821053504943848} -09/20/2021 22:23:20 - INFO - __main__ - Step 36481: {'lr': 0.0001995241222615476, 'samples': 1167392, 'steps': 2280, 'loss/train': 1.8722835779190063} -09/20/2021 22:23:20 - INFO - __main__ - Step 36482: {'lr': 0.0001995241222615476, 'samples': 1167424, 'steps': 2280, 'loss/train': 2.034324884414673} -09/20/2021 22:23:21 - INFO - __main__ - Step 36483: {'lr': 0.0001995241222615476, 'samples': 1167456, 'steps': 2280, 'loss/train': 1.1835416555404663} -09/20/2021 22:23:22 - INFO - __main__ - Step 36484: {'lr': 0.0001995241222615476, 'samples': 1167488, 'steps': 2280, 'loss/train': 1.7646582126617432} -09/20/2021 22:23:23 - INFO - __main__ - Step 36485: {'lr': 0.0001995241222615476, 'samples': 1167520, 'steps': 2280, 'loss/train': 1.9027073383331299} -09/20/2021 22:23:23 - INFO - __main__ - Step 36486: {'lr': 0.0001995241222615476, 'samples': 1167552, 'steps': 2280, 'loss/train': 2.1372621059417725} -09/20/2021 22:23:24 - INFO - __main__ - Step 36487: {'lr': 0.0001995241222615476, 'samples': 1167584, 'steps': 2280, 'loss/train': 2.2817068099975586} -09/20/2021 22:23:25 - INFO - __main__ - Step 36488: {'lr': 0.0001995241222615476, 'samples': 1167616, 'steps': 2280, 'loss/train': 3.138707399368286} -09/20/2021 22:23:26 - INFO - __main__ - Step 36489: {'lr': 0.0001995241222615476, 'samples': 1167648, 'steps': 2280, 'loss/train': 2.7009947299957275} -09/20/2021 22:23:26 - INFO - __main__ - Step 36490: {'lr': 0.0001995241222615476, 'samples': 1167680, 'steps': 2280, 'loss/train': 1.6995816230773926} -09/20/2021 22:23:28 - INFO - __main__ - Step 36491: {'lr': 0.0001995241222615476, 'samples': 1167712, 'steps': 2280, 'loss/train': 2.960444927215576} -09/20/2021 22:23:29 - INFO - __main__ - Step 36492: {'lr': 0.0001995241222615476, 'samples': 1167744, 'steps': 2280, 'loss/train': 3.1889445781707764} -09/20/2021 22:23:29 - INFO - __main__ - Step 36493: {'lr': 0.0001995241222615476, 'samples': 1167776, 'steps': 2280, 'loss/train': 2.307173490524292} -09/20/2021 22:23:30 - INFO - __main__ - Step 36494: {'lr': 0.0001995241222615476, 'samples': 1167808, 'steps': 2280, 'loss/train': 1.6763397455215454} -09/20/2021 22:23:31 - INFO - __main__ - Step 36495: {'lr': 0.0001995241222615476, 'samples': 1167840, 'steps': 2280, 'loss/train': 2.477854013442993} -09/20/2021 22:23:32 - INFO - __main__ - Step 36496: {'lr': 0.0001995241222615476, 'samples': 1167872, 'steps': 2280, 'loss/train': 1.857216715812683} -09/20/2021 22:23:33 - INFO - __main__ - Step 36497: {'lr': 0.00019952350049050948, 'samples': 1167904, 'steps': 2281, 'loss/train': 2.0445497035980225} -09/20/2021 22:23:33 - INFO - __main__ - Step 36498: {'lr': 0.00019952350049050948, 'samples': 1167936, 'steps': 2281, 'loss/train': 2.6872024536132812} -09/20/2021 22:23:34 - INFO - __main__ - Step 36499: {'lr': 0.00019952350049050948, 'samples': 1167968, 'steps': 2281, 'loss/train': 2.1307966709136963} -09/20/2021 22:23:35 - INFO - __main__ - Step 36500: {'lr': 0.00019952350049050948, 'samples': 1168000, 'steps': 2281, 'loss/train': 1.9932843446731567} -09/20/2021 22:23:36 - INFO - __main__ - Step 36501: {'lr': 0.00019952350049050948, 'samples': 1168032, 'steps': 2281, 'loss/train': 0.2991548776626587} -09/20/2021 22:23:36 - INFO - __main__ - Step 36502: {'lr': 0.00019952350049050948, 'samples': 1168064, 'steps': 2281, 'loss/train': 0.13149288296699524} -09/20/2021 22:23:37 - INFO - __main__ - Step 36503: {'lr': 0.00019952350049050948, 'samples': 1168096, 'steps': 2281, 'loss/train': 2.429081439971924} -09/20/2021 22:23:38 - INFO - __main__ - Step 36504: {'lr': 0.00019952350049050948, 'samples': 1168128, 'steps': 2281, 'loss/train': 1.585347294807434} -09/20/2021 22:23:39 - INFO - __main__ - Step 36505: {'lr': 0.00019952350049050948, 'samples': 1168160, 'steps': 2281, 'loss/train': 2.460371255874634} -09/20/2021 22:23:39 - INFO - __main__ - Step 36506: {'lr': 0.00019952350049050948, 'samples': 1168192, 'steps': 2281, 'loss/train': 2.4798171520233154} -09/20/2021 22:23:40 - INFO - __main__ - Step 36507: {'lr': 0.00019952350049050948, 'samples': 1168224, 'steps': 2281, 'loss/train': 2.530930280685425} -09/20/2021 22:23:41 - INFO - __main__ - Step 36508: {'lr': 0.00019952350049050948, 'samples': 1168256, 'steps': 2281, 'loss/train': 2.5033257007598877} -09/20/2021 22:23:42 - INFO - __main__ - Step 36509: {'lr': 0.00019952350049050948, 'samples': 1168288, 'steps': 2281, 'loss/train': 2.5212109088897705} -09/20/2021 22:23:42 - INFO - __main__ - Step 36510: {'lr': 0.00019952350049050948, 'samples': 1168320, 'steps': 2281, 'loss/train': 2.4747872352600098} -09/20/2021 22:23:43 - INFO - __main__ - Step 36511: {'lr': 0.00019952350049050948, 'samples': 1168352, 'steps': 2281, 'loss/train': 2.4486136436462402} -09/20/2021 22:23:44 - INFO - __main__ - Step 36512: {'lr': 0.00019952350049050948, 'samples': 1168384, 'steps': 2281, 'loss/train': 2.1131176948547363} -09/20/2021 22:23:45 - INFO - __main__ - Step 36513: {'lr': 0.00019952287831451063, 'samples': 1168416, 'steps': 2282, 'loss/train': 1.6230130195617676} -09/20/2021 22:23:45 - INFO - __main__ - Step 36514: {'lr': 0.00019952287831451063, 'samples': 1168448, 'steps': 2282, 'loss/train': 0.8558287620544434} -09/20/2021 22:23:46 - INFO - __main__ - Step 36515: {'lr': 0.00019952287831451063, 'samples': 1168480, 'steps': 2282, 'loss/train': 0.9242494702339172} -09/20/2021 22:23:47 - INFO - __main__ - Step 36516: {'lr': 0.00019952287831451063, 'samples': 1168512, 'steps': 2282, 'loss/train': 2.3167402744293213} -09/20/2021 22:23:48 - INFO - __main__ - Step 36517: {'lr': 0.00019952287831451063, 'samples': 1168544, 'steps': 2282, 'loss/train': 2.846388578414917} -09/20/2021 22:23:48 - INFO - __main__ - Step 36518: {'lr': 0.00019952287831451063, 'samples': 1168576, 'steps': 2282, 'loss/train': 1.3558777570724487} -09/20/2021 22:23:49 - INFO - __main__ - Step 36519: {'lr': 0.00019952287831451063, 'samples': 1168608, 'steps': 2282, 'loss/train': 2.124929904937744} -09/20/2021 22:23:50 - INFO - __main__ - Step 36520: {'lr': 0.00019952287831451063, 'samples': 1168640, 'steps': 2282, 'loss/train': 2.702237129211426} -09/20/2021 22:23:51 - INFO - __main__ - Step 36521: {'lr': 0.00019952287831451063, 'samples': 1168672, 'steps': 2282, 'loss/train': 2.4398179054260254} -09/20/2021 22:23:51 - INFO - __main__ - Step 36522: {'lr': 0.00019952287831451063, 'samples': 1168704, 'steps': 2282, 'loss/train': 3.071857213973999} -09/20/2021 22:23:52 - INFO - __main__ - Step 36523: {'lr': 0.00019952287831451063, 'samples': 1168736, 'steps': 2282, 'loss/train': 2.2224771976470947} -09/20/2021 22:23:53 - INFO - __main__ - Step 36524: {'lr': 0.00019952287831451063, 'samples': 1168768, 'steps': 2282, 'loss/train': 1.8217694759368896} -09/20/2021 22:23:54 - INFO - __main__ - Step 36525: {'lr': 0.00019952287831451063, 'samples': 1168800, 'steps': 2282, 'loss/train': 2.6515588760375977} -09/20/2021 22:23:56 - INFO - __main__ - Step 36526: {'lr': 0.00019952287831451063, 'samples': 1168832, 'steps': 2282, 'loss/train': 2.3452980518341064} -09/20/2021 22:23:57 - INFO - __main__ - Step 36527: {'lr': 0.00019952287831451063, 'samples': 1168864, 'steps': 2282, 'loss/train': 3.060378313064575} -09/20/2021 22:23:57 - INFO - __main__ - Step 36528: {'lr': 0.00019952287831451063, 'samples': 1168896, 'steps': 2282, 'loss/train': 2.1644163131713867} -09/20/2021 22:23:58 - INFO - __main__ - Step 36529: {'lr': 0.00019952225573355357, 'samples': 1168928, 'steps': 2283, 'loss/train': 2.3053441047668457} -09/20/2021 22:23:59 - INFO - __main__ - Step 36530: {'lr': 0.00019952225573355357, 'samples': 1168960, 'steps': 2283, 'loss/train': 3.3691394329071045} -09/20/2021 22:24:00 - INFO - __main__ - Step 36531: {'lr': 0.00019952225573355357, 'samples': 1168992, 'steps': 2283, 'loss/train': 6.252074718475342} -09/20/2021 22:24:00 - INFO - __main__ - Step 36532: {'lr': 0.00019952225573355357, 'samples': 1169024, 'steps': 2283, 'loss/train': 2.0834152698516846} -09/20/2021 22:24:01 - INFO - __main__ - Step 36533: {'lr': 0.00019952225573355357, 'samples': 1169056, 'steps': 2283, 'loss/train': 1.3390305042266846} -09/20/2021 22:24:02 - INFO - __main__ - Step 36534: {'lr': 0.00019952225573355357, 'samples': 1169088, 'steps': 2283, 'loss/train': 1.9368427991867065} -09/20/2021 22:24:03 - INFO - __main__ - Step 36535: {'lr': 0.00019952225573355357, 'samples': 1169120, 'steps': 2283, 'loss/train': 2.4814772605895996} -09/20/2021 22:24:03 - INFO - __main__ - Step 36536: {'lr': 0.00019952225573355357, 'samples': 1169152, 'steps': 2283, 'loss/train': 2.501434087753296} -09/20/2021 22:24:04 - INFO - __main__ - Step 36537: {'lr': 0.00019952225573355357, 'samples': 1169184, 'steps': 2283, 'loss/train': 2.106513023376465} -09/20/2021 22:24:05 - INFO - __main__ - Step 36538: {'lr': 0.00019952225573355357, 'samples': 1169216, 'steps': 2283, 'loss/train': 3.443319082260132} -09/20/2021 22:24:06 - INFO - __main__ - Step 36539: {'lr': 0.00019952225573355357, 'samples': 1169248, 'steps': 2283, 'loss/train': 2.992077589035034} -09/20/2021 22:24:06 - INFO - __main__ - Step 36540: {'lr': 0.00019952225573355357, 'samples': 1169280, 'steps': 2283, 'loss/train': 2.661060333251953} -09/20/2021 22:24:07 - INFO - __main__ - Step 36541: {'lr': 0.00019952225573355357, 'samples': 1169312, 'steps': 2283, 'loss/train': 1.9791117906570435} -09/20/2021 22:24:08 - INFO - __main__ - Step 36542: {'lr': 0.00019952225573355357, 'samples': 1169344, 'steps': 2283, 'loss/train': 2.4196925163269043} -09/20/2021 22:24:09 - INFO - __main__ - Step 36543: {'lr': 0.00019952225573355357, 'samples': 1169376, 'steps': 2283, 'loss/train': 1.8298871517181396} -09/20/2021 22:24:09 - INFO - __main__ - Step 36544: {'lr': 0.00019952225573355357, 'samples': 1169408, 'steps': 2283, 'loss/train': 2.834779739379883} -09/20/2021 22:24:10 - INFO - __main__ - Step 36545: {'lr': 0.00019952163274764083, 'samples': 1169440, 'steps': 2284, 'loss/train': 1.8845301866531372} -09/20/2021 22:24:11 - INFO - __main__ - Step 36546: {'lr': 0.00019952163274764083, 'samples': 1169472, 'steps': 2284, 'loss/train': 0.19388572871685028} -09/20/2021 22:24:12 - INFO - __main__ - Step 36547: {'lr': 0.00019952163274764083, 'samples': 1169504, 'steps': 2284, 'loss/train': 0.15626345574855804} -09/20/2021 22:24:13 - INFO - __main__ - Step 36548: {'lr': 0.00019952163274764083, 'samples': 1169536, 'steps': 2284, 'loss/train': 1.1350085735321045} -09/20/2021 22:24:13 - INFO - __main__ - Step 36549: {'lr': 0.00019952163274764083, 'samples': 1169568, 'steps': 2284, 'loss/train': 1.0730475187301636} -09/20/2021 22:24:14 - INFO - __main__ - Step 36550: {'lr': 0.00019952163274764083, 'samples': 1169600, 'steps': 2284, 'loss/train': 2.5289578437805176} -09/20/2021 22:24:15 - INFO - __main__ - Step 36551: {'lr': 0.00019952163274764083, 'samples': 1169632, 'steps': 2284, 'loss/train': 2.415489912033081} -09/20/2021 22:24:16 - INFO - __main__ - Step 36552: {'lr': 0.00019952163274764083, 'samples': 1169664, 'steps': 2284, 'loss/train': 2.454026222229004} -09/20/2021 22:24:16 - INFO - __main__ - Step 36553: {'lr': 0.00019952163274764083, 'samples': 1169696, 'steps': 2284, 'loss/train': 2.253704309463501} -09/20/2021 22:24:17 - INFO - __main__ - Step 36554: {'lr': 0.00019952163274764083, 'samples': 1169728, 'steps': 2284, 'loss/train': 2.0503458976745605} -09/20/2021 22:24:18 - INFO - __main__ - Step 36555: {'lr': 0.00019952163274764083, 'samples': 1169760, 'steps': 2284, 'loss/train': 2.146909713745117} -09/20/2021 22:24:19 - INFO - __main__ - Step 36556: {'lr': 0.00019952163274764083, 'samples': 1169792, 'steps': 2284, 'loss/train': 2.194589376449585} -09/20/2021 22:24:19 - INFO - __main__ - Step 36557: {'lr': 0.00019952163274764083, 'samples': 1169824, 'steps': 2284, 'loss/train': 1.967680811882019} -09/20/2021 22:24:20 - INFO - __main__ - Step 36558: {'lr': 0.00019952163274764083, 'samples': 1169856, 'steps': 2284, 'loss/train': 2.3286821842193604} -09/20/2021 22:24:21 - INFO - __main__ - Step 36559: {'lr': 0.00019952163274764083, 'samples': 1169888, 'steps': 2284, 'loss/train': 2.181119203567505} -09/20/2021 22:24:22 - INFO - __main__ - Step 36560: {'lr': 0.00019952163274764083, 'samples': 1169920, 'steps': 2284, 'loss/train': 2.390639543533325} -09/20/2021 22:24:23 - INFO - __main__ - Step 36561: {'lr': 0.00019952100935677493, 'samples': 1169952, 'steps': 2285, 'loss/train': 1.9454715251922607} -09/20/2021 22:24:23 - INFO - __main__ - Step 36562: {'lr': 0.00019952100935677493, 'samples': 1169984, 'steps': 2285, 'loss/train': 2.0141208171844482} -09/20/2021 22:24:24 - INFO - __main__ - Step 36563: {'lr': 0.00019952100935677493, 'samples': 1170016, 'steps': 2285, 'loss/train': 2.0267930030822754} -09/20/2021 22:24:25 - INFO - __main__ - Step 36564: {'lr': 0.00019952100935677493, 'samples': 1170048, 'steps': 2285, 'loss/train': 1.9810327291488647} -09/20/2021 22:24:26 - INFO - __main__ - Step 36565: {'lr': 0.00019952100935677493, 'samples': 1170080, 'steps': 2285, 'loss/train': 1.7433511018753052} -09/20/2021 22:24:27 - INFO - __main__ - Step 36566: {'lr': 0.00019952100935677493, 'samples': 1170112, 'steps': 2285, 'loss/train': 2.051131248474121} -09/20/2021 22:24:28 - INFO - __main__ - Step 36567: {'lr': 0.00019952100935677493, 'samples': 1170144, 'steps': 2285, 'loss/train': 2.3258578777313232} -09/20/2021 22:24:29 - INFO - __main__ - Step 36568: {'lr': 0.00019952100935677493, 'samples': 1170176, 'steps': 2285, 'loss/train': 2.9398696422576904} -09/20/2021 22:24:30 - INFO - __main__ - Step 36569: {'lr': 0.00019952100935677493, 'samples': 1170208, 'steps': 2285, 'loss/train': 5.799499988555908} -09/20/2021 22:24:30 - INFO - __main__ - Step 36570: {'lr': 0.00019952100935677493, 'samples': 1170240, 'steps': 2285, 'loss/train': 2.894435405731201} -09/20/2021 22:24:31 - INFO - __main__ - Step 36571: {'lr': 0.00019952100935677493, 'samples': 1170272, 'steps': 2285, 'loss/train': 1.7341845035552979} -09/20/2021 22:24:32 - INFO - __main__ - Step 36572: {'lr': 0.00019952100935677493, 'samples': 1170304, 'steps': 2285, 'loss/train': 2.516695976257324} -09/20/2021 22:24:33 - INFO - __main__ - Step 36573: {'lr': 0.00019952100935677493, 'samples': 1170336, 'steps': 2285, 'loss/train': 0.6316594481468201} -09/20/2021 22:24:33 - INFO - __main__ - Step 36574: {'lr': 0.00019952100935677493, 'samples': 1170368, 'steps': 2285, 'loss/train': 2.0954010486602783} -09/20/2021 22:24:34 - INFO - __main__ - Step 36575: {'lr': 0.00019952100935677493, 'samples': 1170400, 'steps': 2285, 'loss/train': 2.049412250518799} -09/20/2021 22:24:35 - INFO - __main__ - Step 36576: {'lr': 0.00019952100935677493, 'samples': 1170432, 'steps': 2285, 'loss/train': 1.947569727897644} -09/20/2021 22:24:36 - INFO - __main__ - Step 36577: {'lr': 0.00019952038556095847, 'samples': 1170464, 'steps': 2286, 'loss/train': 1.455338716506958} -09/20/2021 22:24:36 - INFO - __main__ - Step 36578: {'lr': 0.00019952038556095847, 'samples': 1170496, 'steps': 2286, 'loss/train': 2.213909387588501} -09/20/2021 22:24:37 - INFO - __main__ - Step 36579: {'lr': 0.00019952038556095847, 'samples': 1170528, 'steps': 2286, 'loss/train': 1.8692128658294678} -09/20/2021 22:24:38 - INFO - __main__ - Step 36580: {'lr': 0.00019952038556095847, 'samples': 1170560, 'steps': 2286, 'loss/train': 2.2257912158966064} -09/20/2021 22:24:39 - INFO - __main__ - Step 36581: {'lr': 0.00019952038556095847, 'samples': 1170592, 'steps': 2286, 'loss/train': 0.18221142888069153} -09/20/2021 22:24:39 - INFO - __main__ - Step 36582: {'lr': 0.00019952038556095847, 'samples': 1170624, 'steps': 2286, 'loss/train': 0.314309298992157} -09/20/2021 22:24:40 - INFO - __main__ - Step 36583: {'lr': 0.00019952038556095847, 'samples': 1170656, 'steps': 2286, 'loss/train': 2.197366714477539} -09/20/2021 22:24:41 - INFO - __main__ - Step 36584: {'lr': 0.00019952038556095847, 'samples': 1170688, 'steps': 2286, 'loss/train': 2.145155906677246} -09/20/2021 22:24:42 - INFO - __main__ - Step 36585: {'lr': 0.00019952038556095847, 'samples': 1170720, 'steps': 2286, 'loss/train': 2.3143858909606934} -09/20/2021 22:24:42 - INFO - __main__ - Step 36586: {'lr': 0.00019952038556095847, 'samples': 1170752, 'steps': 2286, 'loss/train': 2.2658121585845947} -09/20/2021 22:24:43 - INFO - __main__ - Step 36587: {'lr': 0.00019952038556095847, 'samples': 1170784, 'steps': 2286, 'loss/train': 3.1693553924560547} -09/20/2021 22:24:44 - INFO - __main__ - Step 36588: {'lr': 0.00019952038556095847, 'samples': 1170816, 'steps': 2286, 'loss/train': 3.0082175731658936} -09/20/2021 22:24:45 - INFO - __main__ - Step 36589: {'lr': 0.00019952038556095847, 'samples': 1170848, 'steps': 2286, 'loss/train': 3.1412837505340576} -09/20/2021 22:24:45 - INFO - __main__ - Step 36590: {'lr': 0.00019952038556095847, 'samples': 1170880, 'steps': 2286, 'loss/train': 2.9826302528381348} -09/20/2021 22:24:46 - INFO - __main__ - Step 36591: {'lr': 0.00019952038556095847, 'samples': 1170912, 'steps': 2286, 'loss/train': 1.5194711685180664} -09/20/2021 22:24:47 - INFO - __main__ - Step 36592: {'lr': 0.00019952038556095847, 'samples': 1170944, 'steps': 2286, 'loss/train': 2.6503567695617676} -09/20/2021 22:24:48 - INFO - __main__ - Step 36593: {'lr': 0.00019951976136019394, 'samples': 1170976, 'steps': 2287, 'loss/train': 2.560046672821045} -09/20/2021 22:24:49 - INFO - __main__ - Step 36594: {'lr': 0.00019951976136019394, 'samples': 1171008, 'steps': 2287, 'loss/train': 2.298802375793457} -09/20/2021 22:24:49 - INFO - __main__ - Step 36595: {'lr': 0.00019951976136019394, 'samples': 1171040, 'steps': 2287, 'loss/train': 1.889609694480896} -09/20/2021 22:24:50 - INFO - __main__ - Step 36596: {'lr': 0.00019951976136019394, 'samples': 1171072, 'steps': 2287, 'loss/train': 3.346367835998535} -09/20/2021 22:24:52 - INFO - __main__ - Step 36597: {'lr': 0.00019951976136019394, 'samples': 1171104, 'steps': 2287, 'loss/train': 2.2202866077423096} -09/20/2021 22:24:52 - INFO - __main__ - Step 36598: {'lr': 0.00019951976136019394, 'samples': 1171136, 'steps': 2287, 'loss/train': 1.9980394840240479} -09/20/2021 22:24:53 - INFO - __main__ - Step 36599: {'lr': 0.00019951976136019394, 'samples': 1171168, 'steps': 2287, 'loss/train': 2.3787059783935547} -09/20/2021 22:24:54 - INFO - __main__ - Step 36600: {'lr': 0.00019951976136019394, 'samples': 1171200, 'steps': 2287, 'loss/train': 2.7070939540863037} -09/20/2021 22:24:54 - INFO - __main__ - Step 36601: {'lr': 0.00019951976136019394, 'samples': 1171232, 'steps': 2287, 'loss/train': 0.48276135325431824} -09/20/2021 22:24:55 - INFO - __main__ - Step 36602: {'lr': 0.00019951976136019394, 'samples': 1171264, 'steps': 2287, 'loss/train': 0.40600135922431946} -09/20/2021 22:24:56 - INFO - __main__ - Step 36603: {'lr': 0.00019951976136019394, 'samples': 1171296, 'steps': 2287, 'loss/train': 0.2011752724647522} -09/20/2021 22:24:57 - INFO - __main__ - Step 36604: {'lr': 0.00019951976136019394, 'samples': 1171328, 'steps': 2287, 'loss/train': 0.2241710126399994} -09/20/2021 22:24:58 - INFO - __main__ - Step 36605: {'lr': 0.00019951976136019394, 'samples': 1171360, 'steps': 2287, 'loss/train': 2.526517152786255} -09/20/2021 22:24:58 - INFO - __main__ - Step 36606: {'lr': 0.00019951976136019394, 'samples': 1171392, 'steps': 2287, 'loss/train': 1.6713497638702393} -09/20/2021 22:24:59 - INFO - __main__ - Step 36607: {'lr': 0.00019951976136019394, 'samples': 1171424, 'steps': 2287, 'loss/train': 2.733372688293457} -09/20/2021 22:25:00 - INFO - __main__ - Step 36608: {'lr': 0.00019951976136019394, 'samples': 1171456, 'steps': 2287, 'loss/train': 2.200993299484253} -09/20/2021 22:25:01 - INFO - __main__ - Step 36609: {'lr': 0.00019951913675448387, 'samples': 1171488, 'steps': 2288, 'loss/train': 2.4643566608428955} -09/20/2021 22:25:01 - INFO - __main__ - Step 36610: {'lr': 0.00019951913675448387, 'samples': 1171520, 'steps': 2288, 'loss/train': 2.0034704208374023} -09/20/2021 22:25:02 - INFO - __main__ - Step 36611: {'lr': 0.00019951913675448387, 'samples': 1171552, 'steps': 2288, 'loss/train': 1.8201881647109985} -09/20/2021 22:25:03 - INFO - __main__ - Step 36612: {'lr': 0.00019951913675448387, 'samples': 1171584, 'steps': 2288, 'loss/train': 1.9840441942214966} -09/20/2021 22:25:04 - INFO - __main__ - Step 36613: {'lr': 0.00019951913675448387, 'samples': 1171616, 'steps': 2288, 'loss/train': 2.2847654819488525} -09/20/2021 22:25:04 - INFO - __main__ - Step 36614: {'lr': 0.00019951913675448387, 'samples': 1171648, 'steps': 2288, 'loss/train': 2.229933977127075} -09/20/2021 22:25:05 - INFO - __main__ - Step 36615: {'lr': 0.00019951913675448387, 'samples': 1171680, 'steps': 2288, 'loss/train': 1.7063502073287964} -09/20/2021 22:25:06 - INFO - __main__ - Step 36616: {'lr': 0.00019951913675448387, 'samples': 1171712, 'steps': 2288, 'loss/train': 2.709972620010376} -09/20/2021 22:25:07 - INFO - __main__ - Step 36617: {'lr': 0.00019951913675448387, 'samples': 1171744, 'steps': 2288, 'loss/train': 2.526939630508423} -09/20/2021 22:25:07 - INFO - __main__ - Step 36618: {'lr': 0.00019951913675448387, 'samples': 1171776, 'steps': 2288, 'loss/train': 2.3323919773101807} -09/20/2021 22:25:08 - INFO - __main__ - Step 36619: {'lr': 0.00019951913675448387, 'samples': 1171808, 'steps': 2288, 'loss/train': 2.7139692306518555} -09/20/2021 22:25:09 - INFO - __main__ - Step 36620: {'lr': 0.00019951913675448387, 'samples': 1171840, 'steps': 2288, 'loss/train': 5.696954727172852} -09/20/2021 22:25:10 - INFO - __main__ - Step 36621: {'lr': 0.00019951913675448387, 'samples': 1171872, 'steps': 2288, 'loss/train': 5.465641021728516} -09/20/2021 22:25:10 - INFO - __main__ - Step 36622: {'lr': 0.00019951913675448387, 'samples': 1171904, 'steps': 2288, 'loss/train': 2.5403289794921875} -09/20/2021 22:25:11 - INFO - __main__ - Step 36623: {'lr': 0.00019951913675448387, 'samples': 1171936, 'steps': 2288, 'loss/train': 1.5835442543029785} -09/20/2021 22:25:12 - INFO - __main__ - Step 36624: {'lr': 0.00019951913675448387, 'samples': 1171968, 'steps': 2288, 'loss/train': 2.3023746013641357} -09/20/2021 22:25:13 - INFO - __main__ - Step 36625: {'lr': 0.00019951851174383083, 'samples': 1172000, 'steps': 2289, 'loss/train': 2.976649045944214} -09/20/2021 22:25:14 - INFO - __main__ - Step 36626: {'lr': 0.00019951851174383083, 'samples': 1172032, 'steps': 2289, 'loss/train': 2.29030704498291} -09/20/2021 22:25:14 - INFO - __main__ - Step 36627: {'lr': 0.00019951851174383083, 'samples': 1172064, 'steps': 2289, 'loss/train': 2.756807565689087} -09/20/2021 22:25:16 - INFO - __main__ - Step 36628: {'lr': 0.00019951851174383083, 'samples': 1172096, 'steps': 2289, 'loss/train': 2.805598020553589} -09/20/2021 22:25:16 - INFO - __main__ - Step 36629: {'lr': 0.00019951851174383083, 'samples': 1172128, 'steps': 2289, 'loss/train': 2.2833621501922607} -09/20/2021 22:25:17 - INFO - __main__ - Step 36630: {'lr': 0.00019951851174383083, 'samples': 1172160, 'steps': 2289, 'loss/train': 1.2037659883499146} -09/20/2021 22:25:18 - INFO - __main__ - Step 36631: {'lr': 0.00019951851174383083, 'samples': 1172192, 'steps': 2289, 'loss/train': 1.8619576692581177} -09/20/2021 22:25:19 - INFO - __main__ - Step 36632: {'lr': 0.00019951851174383083, 'samples': 1172224, 'steps': 2289, 'loss/train': 2.049484968185425} -09/20/2021 22:25:19 - INFO - __main__ - Step 36633: {'lr': 0.00019951851174383083, 'samples': 1172256, 'steps': 2289, 'loss/train': 2.8837459087371826} -09/20/2021 22:25:20 - INFO - __main__ - Step 36634: {'lr': 0.00019951851174383083, 'samples': 1172288, 'steps': 2289, 'loss/train': 2.513688087463379} -09/20/2021 22:25:21 - INFO - __main__ - Step 36635: {'lr': 0.00019951851174383083, 'samples': 1172320, 'steps': 2289, 'loss/train': 2.676378011703491} -09/20/2021 22:25:22 - INFO - __main__ - Step 36636: {'lr': 0.00019951851174383083, 'samples': 1172352, 'steps': 2289, 'loss/train': 2.3112409114837646} -09/20/2021 22:25:22 - INFO - __main__ - Step 36637: {'lr': 0.00019951851174383083, 'samples': 1172384, 'steps': 2289, 'loss/train': 1.7745492458343506} -09/20/2021 22:25:23 - INFO - __main__ - Step 36638: {'lr': 0.00019951851174383083, 'samples': 1172416, 'steps': 2289, 'loss/train': 2.038853883743286} -09/20/2021 22:25:24 - INFO - __main__ - Step 36639: {'lr': 0.00019951851174383083, 'samples': 1172448, 'steps': 2289, 'loss/train': 1.8086864948272705} -09/20/2021 22:25:25 - INFO - __main__ - Step 36640: {'lr': 0.00019951851174383083, 'samples': 1172480, 'steps': 2289, 'loss/train': 1.9504672288894653} -09/20/2021 22:25:25 - INFO - __main__ - Step 36641: {'lr': 0.00019951788632823733, 'samples': 1172512, 'steps': 2290, 'loss/train': 2.446627378463745} -09/20/2021 22:25:26 - INFO - __main__ - Step 36642: {'lr': 0.00019951788632823733, 'samples': 1172544, 'steps': 2290, 'loss/train': 2.9647059440612793} -09/20/2021 22:25:27 - INFO - __main__ - Step 36643: {'lr': 0.00019951788632823733, 'samples': 1172576, 'steps': 2290, 'loss/train': 1.6046526432037354} -09/20/2021 22:25:28 - INFO - __main__ - Step 36644: {'lr': 0.00019951788632823733, 'samples': 1172608, 'steps': 2290, 'loss/train': 1.5840225219726562} -09/20/2021 22:25:28 - INFO - __main__ - Step 36645: {'lr': 0.00019951788632823733, 'samples': 1172640, 'steps': 2290, 'loss/train': 1.344071626663208} -09/20/2021 22:25:29 - INFO - __main__ - Step 36646: {'lr': 0.00019951788632823733, 'samples': 1172672, 'steps': 2290, 'loss/train': 2.9566428661346436} -09/20/2021 22:25:30 - INFO - __main__ - Step 36647: {'lr': 0.00019951788632823733, 'samples': 1172704, 'steps': 2290, 'loss/train': 3.0463666915893555} -09/20/2021 22:25:31 - INFO - __main__ - Step 36648: {'lr': 0.00019951788632823733, 'samples': 1172736, 'steps': 2290, 'loss/train': 2.312116861343384} -09/20/2021 22:25:31 - INFO - __main__ - Step 36649: {'lr': 0.00019951788632823733, 'samples': 1172768, 'steps': 2290, 'loss/train': 1.3413584232330322} -09/20/2021 22:25:32 - INFO - __main__ - Step 36650: {'lr': 0.00019951788632823733, 'samples': 1172800, 'steps': 2290, 'loss/train': 2.411308526992798} -09/20/2021 22:25:33 - INFO - __main__ - Step 36651: {'lr': 0.00019951788632823733, 'samples': 1172832, 'steps': 2290, 'loss/train': 1.8239333629608154} -09/20/2021 22:25:34 - INFO - __main__ - Step 36652: {'lr': 0.00019951788632823733, 'samples': 1172864, 'steps': 2290, 'loss/train': 3.0037386417388916} -09/20/2021 22:25:34 - INFO - __main__ - Step 36653: {'lr': 0.00019951788632823733, 'samples': 1172896, 'steps': 2290, 'loss/train': 2.844146966934204} -09/20/2021 22:25:35 - INFO - __main__ - Step 36654: {'lr': 0.00019951788632823733, 'samples': 1172928, 'steps': 2290, 'loss/train': 1.5264705419540405} -09/20/2021 22:25:36 - INFO - __main__ - Step 36655: {'lr': 0.00019951788632823733, 'samples': 1172960, 'steps': 2290, 'loss/train': 2.0819404125213623} -09/20/2021 22:25:37 - INFO - __main__ - Step 36656: {'lr': 0.00019951788632823733, 'samples': 1172992, 'steps': 2290, 'loss/train': 2.240440607070923} -09/20/2021 22:25:38 - INFO - __main__ - Step 36657: {'lr': 0.00019951726050770598, 'samples': 1173024, 'steps': 2291, 'loss/train': 1.922670841217041} -09/20/2021 22:25:38 - INFO - __main__ - Step 36658: {'lr': 0.00019951726050770598, 'samples': 1173056, 'steps': 2291, 'loss/train': 2.5099687576293945} -09/20/2021 22:25:40 - INFO - __main__ - Step 36659: {'lr': 0.00019951726050770598, 'samples': 1173088, 'steps': 2291, 'loss/train': 2.3834660053253174} -09/20/2021 22:25:41 - INFO - __main__ - Step 36660: {'lr': 0.00019951726050770598, 'samples': 1173120, 'steps': 2291, 'loss/train': 3.0473153591156006} -09/20/2021 22:25:41 - INFO - __main__ - Step 36661: {'lr': 0.00019951726050770598, 'samples': 1173152, 'steps': 2291, 'loss/train': 2.4463186264038086} -09/20/2021 22:25:42 - INFO - __main__ - Step 36662: {'lr': 0.00019951726050770598, 'samples': 1173184, 'steps': 2291, 'loss/train': 2.9133381843566895} -09/20/2021 22:25:43 - INFO - __main__ - Step 36663: {'lr': 0.00019951726050770598, 'samples': 1173216, 'steps': 2291, 'loss/train': 2.717503070831299} -09/20/2021 22:25:44 - INFO - __main__ - Step 36664: {'lr': 0.00019951726050770598, 'samples': 1173248, 'steps': 2291, 'loss/train': 2.3745296001434326} -09/20/2021 22:25:44 - INFO - __main__ - Step 36665: {'lr': 0.00019951726050770598, 'samples': 1173280, 'steps': 2291, 'loss/train': 2.2393782138824463} -09/20/2021 22:25:45 - INFO - __main__ - Step 36666: {'lr': 0.00019951726050770598, 'samples': 1173312, 'steps': 2291, 'loss/train': 3.672868013381958} -09/20/2021 22:25:46 - INFO - __main__ - Step 36667: {'lr': 0.00019951726050770598, 'samples': 1173344, 'steps': 2291, 'loss/train': 3.6486685276031494} -09/20/2021 22:25:47 - INFO - __main__ - Step 36668: {'lr': 0.00019951726050770598, 'samples': 1173376, 'steps': 2291, 'loss/train': 1.8754773139953613} -09/20/2021 22:25:47 - INFO - __main__ - Step 36669: {'lr': 0.00019951726050770598, 'samples': 1173408, 'steps': 2291, 'loss/train': 1.9772242307662964} -09/20/2021 22:25:48 - INFO - __main__ - Step 36670: {'lr': 0.00019951726050770598, 'samples': 1173440, 'steps': 2291, 'loss/train': 0.15433910489082336} -09/20/2021 22:25:49 - INFO - __main__ - Step 36671: {'lr': 0.00019951726050770598, 'samples': 1173472, 'steps': 2291, 'loss/train': 0.18874166905879974} -09/20/2021 22:25:50 - INFO - __main__ - Step 36672: {'lr': 0.00019951726050770598, 'samples': 1173504, 'steps': 2291, 'loss/train': 0.350298136472702} -09/20/2021 22:25:50 - INFO - __main__ - Step 36673: {'lr': 0.00019951663428223926, 'samples': 1173536, 'steps': 2292, 'loss/train': 0.2630663514137268} -09/20/2021 22:25:51 - INFO - __main__ - Step 36674: {'lr': 0.00019951663428223926, 'samples': 1173568, 'steps': 2292, 'loss/train': 1.729101538658142} -09/20/2021 22:25:52 - INFO - __main__ - Step 36675: {'lr': 0.00019951663428223926, 'samples': 1173600, 'steps': 2292, 'loss/train': 1.0149253606796265} -09/20/2021 22:25:53 - INFO - __main__ - Step 36676: {'lr': 0.00019951663428223926, 'samples': 1173632, 'steps': 2292, 'loss/train': 0.6396934986114502} -09/20/2021 22:25:53 - INFO - __main__ - Step 36677: {'lr': 0.00019951663428223926, 'samples': 1173664, 'steps': 2292, 'loss/train': 0.9390486478805542} -09/20/2021 22:25:54 - INFO - __main__ - Step 36678: {'lr': 0.00019951663428223926, 'samples': 1173696, 'steps': 2292, 'loss/train': 2.216949462890625} -09/20/2021 22:25:55 - INFO - __main__ - Step 36679: {'lr': 0.00019951663428223926, 'samples': 1173728, 'steps': 2292, 'loss/train': 2.130474805831909} -09/20/2021 22:25:56 - INFO - __main__ - Step 36680: {'lr': 0.00019951663428223926, 'samples': 1173760, 'steps': 2292, 'loss/train': 0.18757124245166779} -09/20/2021 22:25:56 - INFO - __main__ - Step 36681: {'lr': 0.00019951663428223926, 'samples': 1173792, 'steps': 2292, 'loss/train': 0.24675549566745758} -09/20/2021 22:25:57 - INFO - __main__ - Step 36682: {'lr': 0.00019951663428223926, 'samples': 1173824, 'steps': 2292, 'loss/train': 0.2473347783088684} -09/20/2021 22:25:58 - INFO - __main__ - Step 36683: {'lr': 0.00019951663428223926, 'samples': 1173856, 'steps': 2292, 'loss/train': 2.7925498485565186} -09/20/2021 22:25:59 - INFO - __main__ - Step 36684: {'lr': 0.00019951663428223926, 'samples': 1173888, 'steps': 2292, 'loss/train': 2.5561485290527344} -09/20/2021 22:25:59 - INFO - __main__ - Step 36685: {'lr': 0.00019951663428223926, 'samples': 1173920, 'steps': 2292, 'loss/train': 1.0468223094940186} -09/20/2021 22:26:00 - INFO - __main__ - Step 36686: {'lr': 0.00019951663428223926, 'samples': 1173952, 'steps': 2292, 'loss/train': 2.9527781009674072} -09/20/2021 22:26:01 - INFO - __main__ - Step 36687: {'lr': 0.00019951663428223926, 'samples': 1173984, 'steps': 2292, 'loss/train': 2.3823366165161133} -09/20/2021 22:26:02 - INFO - __main__ - Step 36688: {'lr': 0.00019951663428223926, 'samples': 1174016, 'steps': 2292, 'loss/train': 2.0389485359191895} -09/20/2021 22:26:03 - INFO - __main__ - Step 36689: {'lr': 0.00019951600765183972, 'samples': 1174048, 'steps': 2293, 'loss/train': 2.947693347930908} -09/20/2021 22:26:03 - INFO - __main__ - Step 36690: {'lr': 0.00019951600765183972, 'samples': 1174080, 'steps': 2293, 'loss/train': 2.096932888031006} -09/20/2021 22:26:05 - INFO - __main__ - Step 36691: {'lr': 0.00019951600765183972, 'samples': 1174112, 'steps': 2293, 'loss/train': 2.0821385383605957} -09/20/2021 22:26:05 - INFO - __main__ - Step 36692: {'lr': 0.00019951600765183972, 'samples': 1174144, 'steps': 2293, 'loss/train': 2.430800199508667} -09/20/2021 22:26:06 - INFO - __main__ - Step 36693: {'lr': 0.00019951600765183972, 'samples': 1174176, 'steps': 2293, 'loss/train': 1.8682143688201904} -09/20/2021 22:26:07 - INFO - __main__ - Step 36694: {'lr': 0.00019951600765183972, 'samples': 1174208, 'steps': 2293, 'loss/train': 1.9408117532730103} -09/20/2021 22:26:08 - INFO - __main__ - Step 36695: {'lr': 0.00019951600765183972, 'samples': 1174240, 'steps': 2293, 'loss/train': 2.6931748390197754} -09/20/2021 22:26:08 - INFO - __main__ - Step 36696: {'lr': 0.00019951600765183972, 'samples': 1174272, 'steps': 2293, 'loss/train': 1.4824836254119873} -09/20/2021 22:26:09 - INFO - __main__ - Step 36697: {'lr': 0.00019951600765183972, 'samples': 1174304, 'steps': 2293, 'loss/train': 2.2933788299560547} -09/20/2021 22:26:10 - INFO - __main__ - Step 36698: {'lr': 0.00019951600765183972, 'samples': 1174336, 'steps': 2293, 'loss/train': 1.9442543983459473} -09/20/2021 22:26:11 - INFO - __main__ - Step 36699: {'lr': 0.00019951600765183972, 'samples': 1174368, 'steps': 2293, 'loss/train': 2.0600745677948} -09/20/2021 22:26:11 - INFO - __main__ - Step 36700: {'lr': 0.00019951600765183972, 'samples': 1174400, 'steps': 2293, 'loss/train': 2.571690797805786} -09/20/2021 22:26:12 - INFO - __main__ - Step 36701: {'lr': 0.00019951600765183972, 'samples': 1174432, 'steps': 2293, 'loss/train': 1.87307608127594} -09/20/2021 22:26:13 - INFO - __main__ - Step 36702: {'lr': 0.00019951600765183972, 'samples': 1174464, 'steps': 2293, 'loss/train': 1.7346515655517578} -09/20/2021 22:26:14 - INFO - __main__ - Step 36703: {'lr': 0.00019951600765183972, 'samples': 1174496, 'steps': 2293, 'loss/train': 2.0474555492401123} -09/20/2021 22:26:14 - INFO - __main__ - Step 36704: {'lr': 0.00019951600765183972, 'samples': 1174528, 'steps': 2293, 'loss/train': 2.3868167400360107} -09/20/2021 22:26:15 - INFO - __main__ - Step 36705: {'lr': 0.00019951538061650998, 'samples': 1174560, 'steps': 2294, 'loss/train': 2.423811197280884} -09/20/2021 22:26:16 - INFO - __main__ - Step 36706: {'lr': 0.00019951538061650998, 'samples': 1174592, 'steps': 2294, 'loss/train': 2.7689664363861084} -09/20/2021 22:26:17 - INFO - __main__ - Step 36707: {'lr': 0.00019951538061650998, 'samples': 1174624, 'steps': 2294, 'loss/train': 1.9687526226043701} -09/20/2021 22:26:18 - INFO - __main__ - Step 36708: {'lr': 0.00019951538061650998, 'samples': 1174656, 'steps': 2294, 'loss/train': 2.33652925491333} -09/20/2021 22:26:18 - INFO - __main__ - Step 36709: {'lr': 0.00019951538061650998, 'samples': 1174688, 'steps': 2294, 'loss/train': 2.4198544025421143} -09/20/2021 22:26:19 - INFO - __main__ - Step 36710: {'lr': 0.00019951538061650998, 'samples': 1174720, 'steps': 2294, 'loss/train': 2.13702392578125} -09/20/2021 22:26:20 - INFO - __main__ - Step 36711: {'lr': 0.00019951538061650998, 'samples': 1174752, 'steps': 2294, 'loss/train': 2.509652853012085} -09/20/2021 22:26:21 - INFO - __main__ - Step 36712: {'lr': 0.00019951538061650998, 'samples': 1174784, 'steps': 2294, 'loss/train': 2.1797850131988525} -09/20/2021 22:26:21 - INFO - __main__ - Step 36713: {'lr': 0.00019951538061650998, 'samples': 1174816, 'steps': 2294, 'loss/train': 2.2397279739379883} -09/20/2021 22:26:22 - INFO - __main__ - Step 36714: {'lr': 0.00019951538061650998, 'samples': 1174848, 'steps': 2294, 'loss/train': 2.354245662689209} -09/20/2021 22:26:23 - INFO - __main__ - Step 36715: {'lr': 0.00019951538061650998, 'samples': 1174880, 'steps': 2294, 'loss/train': 2.0748324394226074} -09/20/2021 22:26:24 - INFO - __main__ - Step 36716: {'lr': 0.00019951538061650998, 'samples': 1174912, 'steps': 2294, 'loss/train': 2.532498836517334} -09/20/2021 22:26:24 - INFO - __main__ - Step 36717: {'lr': 0.00019951538061650998, 'samples': 1174944, 'steps': 2294, 'loss/train': 2.3190016746520996} -09/20/2021 22:26:25 - INFO - __main__ - Step 36718: {'lr': 0.00019951538061650998, 'samples': 1174976, 'steps': 2294, 'loss/train': 2.3374083042144775} -09/20/2021 22:26:26 - INFO - __main__ - Step 36719: {'lr': 0.00019951538061650998, 'samples': 1175008, 'steps': 2294, 'loss/train': 1.5307122468948364} -09/20/2021 22:26:27 - INFO - __main__ - Step 36720: {'lr': 0.00019951538061650998, 'samples': 1175040, 'steps': 2294, 'loss/train': 2.5375678539276123} -09/20/2021 22:26:28 - INFO - __main__ - Step 36721: {'lr': 0.0001995147531762525, 'samples': 1175072, 'steps': 2295, 'loss/train': 1.496902585029602} -09/20/2021 22:26:29 - INFO - __main__ - Step 36722: {'lr': 0.0001995147531762525, 'samples': 1175104, 'steps': 2295, 'loss/train': 2.2443082332611084} -09/20/2021 22:26:29 - INFO - __main__ - Step 36723: {'lr': 0.0001995147531762525, 'samples': 1175136, 'steps': 2295, 'loss/train': 2.256924629211426} -09/20/2021 22:26:30 - INFO - __main__ - Step 36724: {'lr': 0.0001995147531762525, 'samples': 1175168, 'steps': 2295, 'loss/train': 1.514407753944397} -09/20/2021 22:26:31 - INFO - __main__ - Step 36725: {'lr': 0.0001995147531762525, 'samples': 1175200, 'steps': 2295, 'loss/train': 2.5873048305511475} -09/20/2021 22:26:32 - INFO - __main__ - Step 36726: {'lr': 0.0001995147531762525, 'samples': 1175232, 'steps': 2295, 'loss/train': 2.8079707622528076} -09/20/2021 22:26:32 - INFO - __main__ - Step 36727: {'lr': 0.0001995147531762525, 'samples': 1175264, 'steps': 2295, 'loss/train': 2.441810131072998} -09/20/2021 22:26:33 - INFO - __main__ - Step 36728: {'lr': 0.0001995147531762525, 'samples': 1175296, 'steps': 2295, 'loss/train': 2.306750535964966} -09/20/2021 22:26:34 - INFO - __main__ - Step 36729: {'lr': 0.0001995147531762525, 'samples': 1175328, 'steps': 2295, 'loss/train': 1.2569870948791504} -09/20/2021 22:26:35 - INFO - __main__ - Step 36730: {'lr': 0.0001995147531762525, 'samples': 1175360, 'steps': 2295, 'loss/train': 2.9539759159088135} -09/20/2021 22:26:35 - INFO - __main__ - Step 36731: {'lr': 0.0001995147531762525, 'samples': 1175392, 'steps': 2295, 'loss/train': 2.7732784748077393} -09/20/2021 22:26:36 - INFO - __main__ - Step 36732: {'lr': 0.0001995147531762525, 'samples': 1175424, 'steps': 2295, 'loss/train': 2.2221968173980713} -09/20/2021 22:26:37 - INFO - __main__ - Step 36733: {'lr': 0.0001995147531762525, 'samples': 1175456, 'steps': 2295, 'loss/train': 1.702162742614746} -09/20/2021 22:26:38 - INFO - __main__ - Step 36734: {'lr': 0.0001995147531762525, 'samples': 1175488, 'steps': 2295, 'loss/train': 1.1988203525543213} -09/20/2021 22:26:38 - INFO - __main__ - Step 36735: {'lr': 0.0001995147531762525, 'samples': 1175520, 'steps': 2295, 'loss/train': 0.6187059283256531} -09/20/2021 22:26:39 - INFO - __main__ - Step 36736: {'lr': 0.0001995147531762525, 'samples': 1175552, 'steps': 2295, 'loss/train': 2.0379812717437744} -09/20/2021 22:26:40 - INFO - __main__ - Step 36737: {'lr': 0.0001995141253310699, 'samples': 1175584, 'steps': 2296, 'loss/train': 1.9671684503555298} -09/20/2021 22:26:41 - INFO - __main__ - Step 36738: {'lr': 0.0001995141253310699, 'samples': 1175616, 'steps': 2296, 'loss/train': 1.575227975845337} -09/20/2021 22:26:42 - INFO - __main__ - Step 36739: {'lr': 0.0001995141253310699, 'samples': 1175648, 'steps': 2296, 'loss/train': 2.8979835510253906} -09/20/2021 22:26:42 - INFO - __main__ - Step 36740: {'lr': 0.0001995141253310699, 'samples': 1175680, 'steps': 2296, 'loss/train': 2.73341965675354} -09/20/2021 22:26:43 - INFO - __main__ - Step 36741: {'lr': 0.0001995141253310699, 'samples': 1175712, 'steps': 2296, 'loss/train': 3.0387814044952393} -09/20/2021 22:26:44 - INFO - __main__ - Step 36742: {'lr': 0.0001995141253310699, 'samples': 1175744, 'steps': 2296, 'loss/train': 2.257176160812378} -09/20/2021 22:26:45 - INFO - __main__ - Step 36743: {'lr': 0.0001995141253310699, 'samples': 1175776, 'steps': 2296, 'loss/train': 1.3558800220489502} -09/20/2021 22:26:45 - INFO - __main__ - Step 36744: {'lr': 0.0001995141253310699, 'samples': 1175808, 'steps': 2296, 'loss/train': 3.388061046600342} -09/20/2021 22:26:46 - INFO - __main__ - Step 36745: {'lr': 0.0001995141253310699, 'samples': 1175840, 'steps': 2296, 'loss/train': 2.050433397293091} -09/20/2021 22:26:47 - INFO - __main__ - Step 36746: {'lr': 0.0001995141253310699, 'samples': 1175872, 'steps': 2296, 'loss/train': 2.025865077972412} -09/20/2021 22:26:48 - INFO - __main__ - Step 36747: {'lr': 0.0001995141253310699, 'samples': 1175904, 'steps': 2296, 'loss/train': 2.9410064220428467} -09/20/2021 22:26:48 - INFO - __main__ - Step 36748: {'lr': 0.0001995141253310699, 'samples': 1175936, 'steps': 2296, 'loss/train': 2.9897196292877197} -09/20/2021 22:26:49 - INFO - __main__ - Step 36749: {'lr': 0.0001995141253310699, 'samples': 1175968, 'steps': 2296, 'loss/train': 1.7063690423965454} -09/20/2021 22:26:50 - INFO - __main__ - Step 36750: {'lr': 0.0001995141253310699, 'samples': 1176000, 'steps': 2296, 'loss/train': 2.3031721115112305} -09/20/2021 22:26:51 - INFO - __main__ - Step 36751: {'lr': 0.0001995141253310699, 'samples': 1176032, 'steps': 2296, 'loss/train': 0.9609403610229492} -09/20/2021 22:26:52 - INFO - __main__ - Step 36752: {'lr': 0.0001995141253310699, 'samples': 1176064, 'steps': 2296, 'loss/train': 2.2568325996398926} -09/20/2021 22:26:53 - INFO - __main__ - Step 36753: {'lr': 0.0001995134970809647, 'samples': 1176096, 'steps': 2297, 'loss/train': 1.5692657232284546} -09/20/2021 22:26:53 - INFO - __main__ - Step 36754: {'lr': 0.0001995134970809647, 'samples': 1176128, 'steps': 2297, 'loss/train': 1.8788301944732666} -09/20/2021 22:26:54 - INFO - __main__ - Step 36755: {'lr': 0.0001995134970809647, 'samples': 1176160, 'steps': 2297, 'loss/train': 1.5853629112243652} -09/20/2021 22:26:55 - INFO - __main__ - Step 36756: {'lr': 0.0001995134970809647, 'samples': 1176192, 'steps': 2297, 'loss/train': 2.069730520248413} -09/20/2021 22:26:56 - INFO - __main__ - Step 36757: {'lr': 0.0001995134970809647, 'samples': 1176224, 'steps': 2297, 'loss/train': 2.015500783920288} -09/20/2021 22:26:56 - INFO - __main__ - Step 36758: {'lr': 0.0001995134970809647, 'samples': 1176256, 'steps': 2297, 'loss/train': 1.9212781190872192} -09/20/2021 22:26:57 - INFO - __main__ - Step 36759: {'lr': 0.0001995134970809647, 'samples': 1176288, 'steps': 2297, 'loss/train': 1.71111261844635} -09/20/2021 22:26:58 - INFO - __main__ - Step 36760: {'lr': 0.0001995134970809647, 'samples': 1176320, 'steps': 2297, 'loss/train': 3.020672559738159} -09/20/2021 22:26:59 - INFO - __main__ - Step 36761: {'lr': 0.0001995134970809647, 'samples': 1176352, 'steps': 2297, 'loss/train': 2.170886993408203} -09/20/2021 22:26:59 - INFO - __main__ - Step 36762: {'lr': 0.0001995134970809647, 'samples': 1176384, 'steps': 2297, 'loss/train': 1.820667028427124} -09/20/2021 22:27:00 - INFO - __main__ - Step 36763: {'lr': 0.0001995134970809647, 'samples': 1176416, 'steps': 2297, 'loss/train': 2.2287418842315674} -09/20/2021 22:27:01 - INFO - __main__ - Step 36764: {'lr': 0.0001995134970809647, 'samples': 1176448, 'steps': 2297, 'loss/train': 1.7061585187911987} -09/20/2021 22:27:02 - INFO - __main__ - Step 36765: {'lr': 0.0001995134970809647, 'samples': 1176480, 'steps': 2297, 'loss/train': 2.108433246612549} -09/20/2021 22:27:02 - INFO - __main__ - Step 36766: {'lr': 0.0001995134970809647, 'samples': 1176512, 'steps': 2297, 'loss/train': 2.55381441116333} -09/20/2021 22:27:03 - INFO - __main__ - Step 36767: {'lr': 0.0001995134970809647, 'samples': 1176544, 'steps': 2297, 'loss/train': 1.153815746307373} -09/20/2021 22:27:04 - INFO - __main__ - Step 36768: {'lr': 0.0001995134970809647, 'samples': 1176576, 'steps': 2297, 'loss/train': 2.822230100631714} -09/20/2021 22:27:05 - INFO - __main__ - Step 36769: {'lr': 0.00019951286842593945, 'samples': 1176608, 'steps': 2298, 'loss/train': 2.0378849506378174} -09/20/2021 22:27:06 - INFO - __main__ - Step 36770: {'lr': 0.00019951286842593945, 'samples': 1176640, 'steps': 2298, 'loss/train': 2.0682287216186523} -09/20/2021 22:27:06 - INFO - __main__ - Step 36771: {'lr': 0.00019951286842593945, 'samples': 1176672, 'steps': 2298, 'loss/train': 1.7287441492080688} -09/20/2021 22:27:07 - INFO - __main__ - Step 36772: {'lr': 0.00019951286842593945, 'samples': 1176704, 'steps': 2298, 'loss/train': 2.6603052616119385} -09/20/2021 22:27:08 - INFO - __main__ - Step 36773: {'lr': 0.00019951286842593945, 'samples': 1176736, 'steps': 2298, 'loss/train': 1.2891467809677124} -09/20/2021 22:27:09 - INFO - __main__ - Step 36774: {'lr': 0.00019951286842593945, 'samples': 1176768, 'steps': 2298, 'loss/train': 2.4970574378967285} -09/20/2021 22:27:09 - INFO - __main__ - Step 36775: {'lr': 0.00019951286842593945, 'samples': 1176800, 'steps': 2298, 'loss/train': 2.2673275470733643} -09/20/2021 22:27:10 - INFO - __main__ - Step 36776: {'lr': 0.00019951286842593945, 'samples': 1176832, 'steps': 2298, 'loss/train': 1.66635000705719} -09/20/2021 22:27:11 - INFO - __main__ - Step 36777: {'lr': 0.00019951286842593945, 'samples': 1176864, 'steps': 2298, 'loss/train': 1.33997642993927} -09/20/2021 22:27:12 - INFO - __main__ - Step 36778: {'lr': 0.00019951286842593945, 'samples': 1176896, 'steps': 2298, 'loss/train': 0.923003077507019} -09/20/2021 22:27:12 - INFO - __main__ - Step 36779: {'lr': 0.00019951286842593945, 'samples': 1176928, 'steps': 2298, 'loss/train': 2.976271390914917} -09/20/2021 22:27:13 - INFO - __main__ - Step 36780: {'lr': 0.00019951286842593945, 'samples': 1176960, 'steps': 2298, 'loss/train': 1.7883204221725464} -09/20/2021 22:27:14 - INFO - __main__ - Step 36781: {'lr': 0.00019951286842593945, 'samples': 1176992, 'steps': 2298, 'loss/train': 2.0986578464508057} -09/20/2021 22:27:15 - INFO - __main__ - Step 36782: {'lr': 0.00019951286842593945, 'samples': 1177024, 'steps': 2298, 'loss/train': 1.9042867422103882} -09/20/2021 22:27:16 - INFO - __main__ - Step 36783: {'lr': 0.00019951286842593945, 'samples': 1177056, 'steps': 2298, 'loss/train': 1.9596954584121704} -09/20/2021 22:27:17 - INFO - __main__ - Step 36784: {'lr': 0.00019951286842593945, 'samples': 1177088, 'steps': 2298, 'loss/train': 2.6387112140655518} -09/20/2021 22:27:18 - INFO - __main__ - Step 36785: {'lr': 0.00019951223936599677, 'samples': 1177120, 'steps': 2299, 'loss/train': 2.3844316005706787} -09/20/2021 22:27:18 - INFO - __main__ - Step 36786: {'lr': 0.00019951223936599677, 'samples': 1177152, 'steps': 2299, 'loss/train': 2.934873342514038} -09/20/2021 22:27:19 - INFO - __main__ - Step 36787: {'lr': 0.00019951223936599677, 'samples': 1177184, 'steps': 2299, 'loss/train': 2.6782493591308594} -09/20/2021 22:27:20 - INFO - __main__ - Step 36788: {'lr': 0.00019951223936599677, 'samples': 1177216, 'steps': 2299, 'loss/train': 2.6914961338043213} -09/20/2021 22:27:21 - INFO - __main__ - Step 36789: {'lr': 0.00019951223936599677, 'samples': 1177248, 'steps': 2299, 'loss/train': 0.5791849493980408} -09/20/2021 22:27:21 - INFO - __main__ - Step 36790: {'lr': 0.00019951223936599677, 'samples': 1177280, 'steps': 2299, 'loss/train': 1.9950287342071533} -09/20/2021 22:27:22 - INFO - __main__ - Step 36791: {'lr': 0.00019951223936599677, 'samples': 1177312, 'steps': 2299, 'loss/train': 1.974664330482483} -09/20/2021 22:27:23 - INFO - __main__ - Step 36792: {'lr': 0.00019951223936599677, 'samples': 1177344, 'steps': 2299, 'loss/train': 3.0509514808654785} -09/20/2021 22:27:24 - INFO - __main__ - Step 36793: {'lr': 0.00019951223936599677, 'samples': 1177376, 'steps': 2299, 'loss/train': 2.0259430408477783} -09/20/2021 22:27:24 - INFO - __main__ - Step 36794: {'lr': 0.00019951223936599677, 'samples': 1177408, 'steps': 2299, 'loss/train': 0.9847284555435181} -09/20/2021 22:27:25 - INFO - __main__ - Step 36795: {'lr': 0.00019951223936599677, 'samples': 1177440, 'steps': 2299, 'loss/train': 2.514005184173584} -09/20/2021 22:27:26 - INFO - __main__ - Step 36796: {'lr': 0.00019951223936599677, 'samples': 1177472, 'steps': 2299, 'loss/train': 2.739478588104248} -09/20/2021 22:27:27 - INFO - __main__ - Step 36797: {'lr': 0.00019951223936599677, 'samples': 1177504, 'steps': 2299, 'loss/train': 1.926837682723999} -09/20/2021 22:27:27 - INFO - __main__ - Step 36798: {'lr': 0.00019951223936599677, 'samples': 1177536, 'steps': 2299, 'loss/train': 1.7503167390823364} -09/20/2021 22:27:28 - INFO - __main__ - Step 36799: {'lr': 0.00019951223936599677, 'samples': 1177568, 'steps': 2299, 'loss/train': 2.7234699726104736} -09/20/2021 22:27:29 - INFO - __main__ - Step 36800: {'lr': 0.00019951223936599677, 'samples': 1177600, 'steps': 2299, 'loss/train': 1.4650598764419556} -09/20/2021 22:27:30 - INFO - __main__ - Step 36801: {'lr': 0.00019951160990113912, 'samples': 1177632, 'steps': 2300, 'loss/train': 2.2509262561798096} -09/20/2021 22:27:30 - INFO - __main__ - Step 36802: {'lr': 0.00019951160990113912, 'samples': 1177664, 'steps': 2300, 'loss/train': 2.389171838760376} -09/20/2021 22:27:31 - INFO - __main__ - Step 36803: {'lr': 0.00019951160990113912, 'samples': 1177696, 'steps': 2300, 'loss/train': 2.2291979789733887} -09/20/2021 22:27:32 - INFO - __main__ - Step 36804: {'lr': 0.00019951160990113912, 'samples': 1177728, 'steps': 2300, 'loss/train': 1.7279393672943115} -09/20/2021 22:27:33 - INFO - __main__ - Step 36805: {'lr': 0.00019951160990113912, 'samples': 1177760, 'steps': 2300, 'loss/train': 2.544384241104126} -09/20/2021 22:27:33 - INFO - __main__ - Step 36806: {'lr': 0.00019951160990113912, 'samples': 1177792, 'steps': 2300, 'loss/train': 2.496236562728882} -09/20/2021 22:27:34 - INFO - __main__ - Step 36807: {'lr': 0.00019951160990113912, 'samples': 1177824, 'steps': 2300, 'loss/train': 1.6102697849273682} -09/20/2021 22:27:35 - INFO - __main__ - Step 36808: {'lr': 0.00019951160990113912, 'samples': 1177856, 'steps': 2300, 'loss/train': 2.9158384799957275} -09/20/2021 22:27:36 - INFO - __main__ - Step 36809: {'lr': 0.00019951160990113912, 'samples': 1177888, 'steps': 2300, 'loss/train': 2.3232243061065674} -09/20/2021 22:27:36 - INFO - __main__ - Step 36810: {'lr': 0.00019951160990113912, 'samples': 1177920, 'steps': 2300, 'loss/train': 1.3348970413208008} -09/20/2021 22:27:37 - INFO - __main__ - Step 36811: {'lr': 0.00019951160990113912, 'samples': 1177952, 'steps': 2300, 'loss/train': 2.5474321842193604} -09/20/2021 22:27:38 - INFO - __main__ - Step 36812: {'lr': 0.00019951160990113912, 'samples': 1177984, 'steps': 2300, 'loss/train': 1.8281490802764893} -09/20/2021 22:27:40 - INFO - __main__ - Step 36813: {'lr': 0.00019951160990113912, 'samples': 1178016, 'steps': 2300, 'loss/train': 1.8246403932571411} -09/20/2021 22:27:40 - INFO - __main__ - Step 36814: {'lr': 0.00019951160990113912, 'samples': 1178048, 'steps': 2300, 'loss/train': 2.147516965866089} -09/20/2021 22:27:41 - INFO - __main__ - Step 36815: {'lr': 0.00019951160990113912, 'samples': 1178080, 'steps': 2300, 'loss/train': 2.380370855331421} -09/20/2021 22:27:42 - INFO - __main__ - Step 36816: {'lr': 0.00019951160990113912, 'samples': 1178112, 'steps': 2300, 'loss/train': 2.3312811851501465} -09/20/2021 22:27:43 - INFO - __main__ - Step 36817: {'lr': 0.00019951098003136917, 'samples': 1178144, 'steps': 2301, 'loss/train': 7.116545677185059} -09/20/2021 22:27:43 - INFO - __main__ - Step 36818: {'lr': 0.00019951098003136917, 'samples': 1178176, 'steps': 2301, 'loss/train': 1.757141351699829} -09/20/2021 22:27:44 - INFO - __main__ - Step 36819: {'lr': 0.00019951098003136917, 'samples': 1178208, 'steps': 2301, 'loss/train': 2.2985963821411133} -09/20/2021 22:27:45 - INFO - __main__ - Step 36820: {'lr': 0.00019951098003136917, 'samples': 1178240, 'steps': 2301, 'loss/train': 2.316720485687256} -09/20/2021 22:27:46 - INFO - __main__ - Step 36821: {'lr': 0.00019951098003136917, 'samples': 1178272, 'steps': 2301, 'loss/train': 1.5643187761306763} -09/20/2021 22:27:46 - INFO - __main__ - Step 36822: {'lr': 0.00019951098003136917, 'samples': 1178304, 'steps': 2301, 'loss/train': 2.5597164630889893} -09/20/2021 22:27:47 - INFO - __main__ - Step 36823: {'lr': 0.00019951098003136917, 'samples': 1178336, 'steps': 2301, 'loss/train': 2.292144536972046} -09/20/2021 22:27:48 - INFO - __main__ - Step 36824: {'lr': 0.00019951098003136917, 'samples': 1178368, 'steps': 2301, 'loss/train': 0.33342891931533813} -09/20/2021 22:27:49 - INFO - __main__ - Step 36825: {'lr': 0.00019951098003136917, 'samples': 1178400, 'steps': 2301, 'loss/train': 3.063948631286621} -09/20/2021 22:27:49 - INFO - __main__ - Step 36826: {'lr': 0.00019951098003136917, 'samples': 1178432, 'steps': 2301, 'loss/train': 0.66388338804245} -09/20/2021 22:27:50 - INFO - __main__ - Step 36827: {'lr': 0.00019951098003136917, 'samples': 1178464, 'steps': 2301, 'loss/train': 1.5145217180252075} -09/20/2021 22:27:51 - INFO - __main__ - Step 36828: {'lr': 0.00019951098003136917, 'samples': 1178496, 'steps': 2301, 'loss/train': 1.184579849243164} -09/20/2021 22:27:52 - INFO - __main__ - Step 36829: {'lr': 0.00019951098003136917, 'samples': 1178528, 'steps': 2301, 'loss/train': 1.7412320375442505} -09/20/2021 22:27:52 - INFO - __main__ - Step 36830: {'lr': 0.00019951098003136917, 'samples': 1178560, 'steps': 2301, 'loss/train': 2.3796792030334473} -09/20/2021 22:27:53 - INFO - __main__ - Step 36831: {'lr': 0.00019951098003136917, 'samples': 1178592, 'steps': 2301, 'loss/train': 2.3960747718811035} -09/20/2021 22:27:54 - INFO - __main__ - Step 36832: {'lr': 0.00019951098003136917, 'samples': 1178624, 'steps': 2301, 'loss/train': 2.4829065799713135} -09/20/2021 22:27:55 - INFO - __main__ - Step 36833: {'lr': 0.0001995103497566894, 'samples': 1178656, 'steps': 2302, 'loss/train': 2.4267451763153076} -09/20/2021 22:27:56 - INFO - __main__ - Step 36834: {'lr': 0.0001995103497566894, 'samples': 1178688, 'steps': 2302, 'loss/train': 1.5760046243667603} -09/20/2021 22:27:56 - INFO - __main__ - Step 36835: {'lr': 0.0001995103497566894, 'samples': 1178720, 'steps': 2302, 'loss/train': 2.7896716594696045} -09/20/2021 22:27:57 - INFO - __main__ - Step 36836: {'lr': 0.0001995103497566894, 'samples': 1178752, 'steps': 2302, 'loss/train': 0.677612841129303} -09/20/2021 22:27:58 - INFO - __main__ - Step 36837: {'lr': 0.0001995103497566894, 'samples': 1178784, 'steps': 2302, 'loss/train': 0.6852595210075378} -09/20/2021 22:27:59 - INFO - __main__ - Step 36838: {'lr': 0.0001995103497566894, 'samples': 1178816, 'steps': 2302, 'loss/train': 0.60203617811203} -09/20/2021 22:27:59 - INFO - __main__ - Step 36839: {'lr': 0.0001995103497566894, 'samples': 1178848, 'steps': 2302, 'loss/train': 0.5960957407951355} -09/20/2021 22:28:00 - INFO - __main__ - Step 36840: {'lr': 0.0001995103497566894, 'samples': 1178880, 'steps': 2302, 'loss/train': 0.6741915941238403} -09/20/2021 22:28:01 - INFO - __main__ - Step 36841: {'lr': 0.0001995103497566894, 'samples': 1178912, 'steps': 2302, 'loss/train': 0.6488465070724487} -09/20/2021 22:28:02 - INFO - __main__ - Step 36842: {'lr': 0.0001995103497566894, 'samples': 1178944, 'steps': 2302, 'loss/train': 0.6712769269943237} -09/20/2021 22:28:02 - INFO - __main__ - Step 36843: {'lr': 0.0001995103497566894, 'samples': 1178976, 'steps': 2302, 'loss/train': 0.9962755441665649} -09/20/2021 22:28:03 - INFO - __main__ - Step 36844: {'lr': 0.0001995103497566894, 'samples': 1179008, 'steps': 2302, 'loss/train': 2.5103588104248047} -09/20/2021 22:28:04 - INFO - __main__ - Step 36845: {'lr': 0.0001995103497566894, 'samples': 1179040, 'steps': 2302, 'loss/train': 1.38399338722229} -09/20/2021 22:28:05 - INFO - __main__ - Step 36846: {'lr': 0.0001995103497566894, 'samples': 1179072, 'steps': 2302, 'loss/train': 1.3574341535568237} -09/20/2021 22:28:05 - INFO - __main__ - Step 36847: {'lr': 0.0001995103497566894, 'samples': 1179104, 'steps': 2302, 'loss/train': 2.701070547103882} -09/20/2021 22:28:06 - INFO - __main__ - Step 36848: {'lr': 0.0001995103497566894, 'samples': 1179136, 'steps': 2302, 'loss/train': 2.6320834159851074} -09/20/2021 22:28:07 - INFO - __main__ - Step 36849: {'lr': 0.0001995097190771024, 'samples': 1179168, 'steps': 2303, 'loss/train': 2.413989782333374} -09/20/2021 22:28:09 - INFO - __main__ - Step 36850: {'lr': 0.0001995097190771024, 'samples': 1179200, 'steps': 2303, 'loss/train': 2.9430723190307617} -09/20/2021 22:28:10 - INFO - __main__ - Step 36851: {'lr': 0.0001995097190771024, 'samples': 1179232, 'steps': 2303, 'loss/train': 1.1805789470672607} -09/20/2021 22:28:10 - INFO - __main__ - Step 36852: {'lr': 0.0001995097190771024, 'samples': 1179264, 'steps': 2303, 'loss/train': 2.455076217651367} -09/20/2021 22:28:11 - INFO - __main__ - Step 36853: {'lr': 0.0001995097190771024, 'samples': 1179296, 'steps': 2303, 'loss/train': 2.486970901489258} -09/20/2021 22:28:12 - INFO - __main__ - Step 36854: {'lr': 0.0001995097190771024, 'samples': 1179328, 'steps': 2303, 'loss/train': 2.7667815685272217} -09/20/2021 22:28:13 - INFO - __main__ - Step 36855: {'lr': 0.0001995097190771024, 'samples': 1179360, 'steps': 2303, 'loss/train': 2.7021007537841797} -09/20/2021 22:28:13 - INFO - __main__ - Step 36856: {'lr': 0.0001995097190771024, 'samples': 1179392, 'steps': 2303, 'loss/train': 2.1974070072174072} -09/20/2021 22:28:14 - INFO - __main__ - Step 36857: {'lr': 0.0001995097190771024, 'samples': 1179424, 'steps': 2303, 'loss/train': 1.287096619606018} -09/20/2021 22:28:15 - INFO - __main__ - Step 36858: {'lr': 0.0001995097190771024, 'samples': 1179456, 'steps': 2303, 'loss/train': 2.2720673084259033} -09/20/2021 22:28:16 - INFO - __main__ - Step 36859: {'lr': 0.0001995097190771024, 'samples': 1179488, 'steps': 2303, 'loss/train': 2.7118871212005615} -09/20/2021 22:28:16 - INFO - __main__ - Step 36860: {'lr': 0.0001995097190771024, 'samples': 1179520, 'steps': 2303, 'loss/train': 2.683093547821045} -09/20/2021 22:28:17 - INFO - __main__ - Step 36861: {'lr': 0.0001995097190771024, 'samples': 1179552, 'steps': 2303, 'loss/train': 2.949983835220337} -09/20/2021 22:28:18 - INFO - __main__ - Step 36862: {'lr': 0.0001995097190771024, 'samples': 1179584, 'steps': 2303, 'loss/train': 0.37542232871055603} -09/20/2021 22:28:19 - INFO - __main__ - Step 36863: {'lr': 0.0001995097190771024, 'samples': 1179616, 'steps': 2303, 'loss/train': 0.4479106366634369} -09/20/2021 22:28:19 - INFO - __main__ - Step 36864: {'lr': 0.0001995097190771024, 'samples': 1179648, 'steps': 2303, 'loss/train': 0.23775745928287506} -09/20/2021 22:28:20 - INFO - __main__ - Step 36865: {'lr': 0.00019950908799261073, 'samples': 1179680, 'steps': 2304, 'loss/train': 0.37152400612831116} -09/20/2021 22:28:21 - INFO - __main__ - Step 36866: {'lr': 0.00019950908799261073, 'samples': 1179712, 'steps': 2304, 'loss/train': 1.3879393339157104} -09/20/2021 22:28:22 - INFO - __main__ - Step 36867: {'lr': 0.00019950908799261073, 'samples': 1179744, 'steps': 2304, 'loss/train': 1.9953054189682007} -09/20/2021 22:28:22 - INFO - __main__ - Step 36868: {'lr': 0.00019950908799261073, 'samples': 1179776, 'steps': 2304, 'loss/train': 2.7894086837768555} -09/20/2021 22:28:23 - INFO - __main__ - Step 36869: {'lr': 0.00019950908799261073, 'samples': 1179808, 'steps': 2304, 'loss/train': 2.3100626468658447} -09/20/2021 22:28:24 - INFO - __main__ - Step 36870: {'lr': 0.00019950908799261073, 'samples': 1179840, 'steps': 2304, 'loss/train': 2.2930283546447754} -09/20/2021 22:28:25 - INFO - __main__ - Step 36871: {'lr': 0.00019950908799261073, 'samples': 1179872, 'steps': 2304, 'loss/train': 1.8755567073822021} -09/20/2021 22:28:25 - INFO - __main__ - Step 36872: {'lr': 0.00019950908799261073, 'samples': 1179904, 'steps': 2304, 'loss/train': 1.7504903078079224} -09/20/2021 22:28:26 - INFO - __main__ - Step 36873: {'lr': 0.00019950908799261073, 'samples': 1179936, 'steps': 2304, 'loss/train': 2.0629632472991943} -09/20/2021 22:28:27 - INFO - __main__ - Step 36874: {'lr': 0.00019950908799261073, 'samples': 1179968, 'steps': 2304, 'loss/train': 2.830981492996216} -09/20/2021 22:28:28 - INFO - __main__ - Step 36875: {'lr': 0.00019950908799261073, 'samples': 1180000, 'steps': 2304, 'loss/train': 5.058315753936768} -09/20/2021 22:28:28 - INFO - __main__ - Step 36876: {'lr': 0.00019950908799261073, 'samples': 1180032, 'steps': 2304, 'loss/train': 1.6665713787078857} -09/20/2021 22:28:29 - INFO - __main__ - Step 36877: {'lr': 0.00019950908799261073, 'samples': 1180064, 'steps': 2304, 'loss/train': 2.057396411895752} -09/20/2021 22:28:30 - INFO - __main__ - Step 36878: {'lr': 0.00019950908799261073, 'samples': 1180096, 'steps': 2304, 'loss/train': 1.96552312374115} -09/20/2021 22:28:31 - INFO - __main__ - Step 36879: {'lr': 0.00019950908799261073, 'samples': 1180128, 'steps': 2304, 'loss/train': 2.077418804168701} -09/20/2021 22:28:31 - INFO - __main__ - Step 36880: {'lr': 0.00019950908799261073, 'samples': 1180160, 'steps': 2304, 'loss/train': 1.637285590171814} -09/20/2021 22:28:32 - INFO - __main__ - Step 36881: {'lr': 0.000199508456503217, 'samples': 1180192, 'steps': 2305, 'loss/train': 0.32787081599235535} -09/20/2021 22:28:33 - INFO - __main__ - Step 36882: {'lr': 0.000199508456503217, 'samples': 1180224, 'steps': 2305, 'loss/train': 0.3290289342403412} -09/20/2021 22:28:35 - INFO - __main__ - Step 36883: {'lr': 0.000199508456503217, 'samples': 1180256, 'steps': 2305, 'loss/train': 0.19020670652389526} -09/20/2021 22:28:36 - INFO - __main__ - Step 36884: {'lr': 0.000199508456503217, 'samples': 1180288, 'steps': 2305, 'loss/train': 1.6720987558364868} -09/20/2021 22:28:36 - INFO - __main__ - Step 36885: {'lr': 0.000199508456503217, 'samples': 1180320, 'steps': 2305, 'loss/train': 2.396331310272217} -09/20/2021 22:28:37 - INFO - __main__ - Step 36886: {'lr': 0.000199508456503217, 'samples': 1180352, 'steps': 2305, 'loss/train': 3.409463882446289} -09/20/2021 22:28:38 - INFO - __main__ - Step 36887: {'lr': 0.000199508456503217, 'samples': 1180384, 'steps': 2305, 'loss/train': 1.6157101392745972} -09/20/2021 22:28:39 - INFO - __main__ - Step 36888: {'lr': 0.000199508456503217, 'samples': 1180416, 'steps': 2305, 'loss/train': 2.6895158290863037} -09/20/2021 22:28:39 - INFO - __main__ - Step 36889: {'lr': 0.000199508456503217, 'samples': 1180448, 'steps': 2305, 'loss/train': 2.202906608581543} -09/20/2021 22:28:40 - INFO - __main__ - Step 36890: {'lr': 0.000199508456503217, 'samples': 1180480, 'steps': 2305, 'loss/train': 1.5573641061782837} -09/20/2021 22:28:41 - INFO - __main__ - Step 36891: {'lr': 0.000199508456503217, 'samples': 1180512, 'steps': 2305, 'loss/train': 2.055788040161133} -09/20/2021 22:28:42 - INFO - __main__ - Step 36892: {'lr': 0.000199508456503217, 'samples': 1180544, 'steps': 2305, 'loss/train': 2.4433419704437256} -09/20/2021 22:28:42 - INFO - __main__ - Step 36893: {'lr': 0.000199508456503217, 'samples': 1180576, 'steps': 2305, 'loss/train': 3.289597511291504} -09/20/2021 22:28:43 - INFO - __main__ - Step 36894: {'lr': 0.000199508456503217, 'samples': 1180608, 'steps': 2305, 'loss/train': 1.469946026802063} -09/20/2021 22:28:44 - INFO - __main__ - Step 36895: {'lr': 0.000199508456503217, 'samples': 1180640, 'steps': 2305, 'loss/train': 2.990215539932251} -09/20/2021 22:28:45 - INFO - __main__ - Step 36896: {'lr': 0.000199508456503217, 'samples': 1180672, 'steps': 2305, 'loss/train': 2.9402031898498535} -09/20/2021 22:28:45 - INFO - __main__ - Step 36897: {'lr': 0.0001995078246089237, 'samples': 1180704, 'steps': 2306, 'loss/train': 2.154517412185669} -09/20/2021 22:28:46 - INFO - __main__ - Step 36898: {'lr': 0.0001995078246089237, 'samples': 1180736, 'steps': 2306, 'loss/train': 1.6510519981384277} -09/20/2021 22:28:47 - INFO - __main__ - Step 36899: {'lr': 0.0001995078246089237, 'samples': 1180768, 'steps': 2306, 'loss/train': 2.0783891677856445} -09/20/2021 22:28:48 - INFO - __main__ - Step 36900: {'lr': 0.0001995078246089237, 'samples': 1180800, 'steps': 2306, 'loss/train': 1.7153847217559814} -09/20/2021 22:28:48 - INFO - __main__ - Step 36901: {'lr': 0.0001995078246089237, 'samples': 1180832, 'steps': 2306, 'loss/train': 2.439913034439087} -09/20/2021 22:28:49 - INFO - __main__ - Step 36902: {'lr': 0.0001995078246089237, 'samples': 1180864, 'steps': 2306, 'loss/train': 1.7753777503967285} -09/20/2021 22:28:50 - INFO - __main__ - Step 36903: {'lr': 0.0001995078246089237, 'samples': 1180896, 'steps': 2306, 'loss/train': 1.5881116390228271} -09/20/2021 22:28:51 - INFO - __main__ - Step 36904: {'lr': 0.0001995078246089237, 'samples': 1180928, 'steps': 2306, 'loss/train': 1.390164852142334} -09/20/2021 22:28:51 - INFO - __main__ - Step 36905: {'lr': 0.0001995078246089237, 'samples': 1180960, 'steps': 2306, 'loss/train': 2.633345365524292} -09/20/2021 22:28:52 - INFO - __main__ - Step 36906: {'lr': 0.0001995078246089237, 'samples': 1180992, 'steps': 2306, 'loss/train': 2.791731834411621} -09/20/2021 22:28:53 - INFO - __main__ - Step 36907: {'lr': 0.0001995078246089237, 'samples': 1181024, 'steps': 2306, 'loss/train': 1.6168935298919678} -09/20/2021 22:28:54 - INFO - __main__ - Step 36908: {'lr': 0.0001995078246089237, 'samples': 1181056, 'steps': 2306, 'loss/train': 2.4930472373962402} -09/20/2021 22:28:54 - INFO - __main__ - Step 36909: {'lr': 0.0001995078246089237, 'samples': 1181088, 'steps': 2306, 'loss/train': 2.9729111194610596} -09/20/2021 22:28:55 - INFO - __main__ - Step 36910: {'lr': 0.0001995078246089237, 'samples': 1181120, 'steps': 2306, 'loss/train': 2.7134623527526855} -09/20/2021 22:28:56 - INFO - __main__ - Step 36911: {'lr': 0.0001995078246089237, 'samples': 1181152, 'steps': 2306, 'loss/train': 2.1310276985168457} -09/20/2021 22:28:57 - INFO - __main__ - Step 36912: {'lr': 0.0001995078246089237, 'samples': 1181184, 'steps': 2306, 'loss/train': 2.5783140659332275} -09/20/2021 22:28:58 - INFO - __main__ - Step 36913: {'lr': 0.00019950719230973349, 'samples': 1181216, 'steps': 2307, 'loss/train': 0.47835639119148254} -09/20/2021 22:28:58 - INFO - __main__ - Step 36914: {'lr': 0.00019950719230973349, 'samples': 1181248, 'steps': 2307, 'loss/train': 0.3690048158168793} -09/20/2021 22:28:59 - INFO - __main__ - Step 36915: {'lr': 0.00019950719230973349, 'samples': 1181280, 'steps': 2307, 'loss/train': 0.3044336140155792} -09/20/2021 22:29:00 - INFO - __main__ - Step 36916: {'lr': 0.00019950719230973349, 'samples': 1181312, 'steps': 2307, 'loss/train': 0.54073566198349} -09/20/2021 22:29:01 - INFO - __main__ - Step 36917: {'lr': 0.00019950719230973349, 'samples': 1181344, 'steps': 2307, 'loss/train': 0.4397168457508087} -09/20/2021 22:29:02 - INFO - __main__ - Step 36918: {'lr': 0.00019950719230973349, 'samples': 1181376, 'steps': 2307, 'loss/train': 0.42503517866134644} -09/20/2021 22:29:03 - INFO - __main__ - Step 36919: {'lr': 0.00019950719230973349, 'samples': 1181408, 'steps': 2307, 'loss/train': 2.9114816188812256} -09/20/2021 22:29:03 - INFO - __main__ - Step 36920: {'lr': 0.00019950719230973349, 'samples': 1181440, 'steps': 2307, 'loss/train': 2.8645267486572266} -09/20/2021 22:29:04 - INFO - __main__ - Step 36921: {'lr': 0.00019950719230973349, 'samples': 1181472, 'steps': 2307, 'loss/train': 2.1416351795196533} -09/20/2021 22:29:05 - INFO - __main__ - Step 36922: {'lr': 0.00019950719230973349, 'samples': 1181504, 'steps': 2307, 'loss/train': 1.9192215204238892} -09/20/2021 22:29:06 - INFO - __main__ - Step 36923: {'lr': 0.00019950719230973349, 'samples': 1181536, 'steps': 2307, 'loss/train': 2.10367488861084} -09/20/2021 22:29:06 - INFO - __main__ - Step 36924: {'lr': 0.00019950719230973349, 'samples': 1181568, 'steps': 2307, 'loss/train': 2.622363328933716} -09/20/2021 22:29:07 - INFO - __main__ - Step 36925: {'lr': 0.00019950719230973349, 'samples': 1181600, 'steps': 2307, 'loss/train': 2.445819139480591} -09/20/2021 22:29:08 - INFO - __main__ - Step 36926: {'lr': 0.00019950719230973349, 'samples': 1181632, 'steps': 2307, 'loss/train': 2.1496193408966064} -09/20/2021 22:29:09 - INFO - __main__ - Step 36927: {'lr': 0.00019950719230973349, 'samples': 1181664, 'steps': 2307, 'loss/train': 1.9300518035888672} -09/20/2021 22:29:09 - INFO - __main__ - Step 36928: {'lr': 0.00019950719230973349, 'samples': 1181696, 'steps': 2307, 'loss/train': 2.6059114933013916} -09/20/2021 22:29:10 - INFO - __main__ - Step 36929: {'lr': 0.00019950655960564889, 'samples': 1181728, 'steps': 2308, 'loss/train': 1.7833969593048096} -09/20/2021 22:29:11 - INFO - __main__ - Step 36930: {'lr': 0.00019950655960564889, 'samples': 1181760, 'steps': 2308, 'loss/train': 2.085671901702881} -09/20/2021 22:29:12 - INFO - __main__ - Step 36931: {'lr': 0.00019950655960564889, 'samples': 1181792, 'steps': 2308, 'loss/train': 2.0369324684143066} -09/20/2021 22:29:13 - INFO - __main__ - Step 36932: {'lr': 0.00019950655960564889, 'samples': 1181824, 'steps': 2308, 'loss/train': 2.382840633392334} -09/20/2021 22:29:13 - INFO - __main__ - Step 36933: {'lr': 0.00019950655960564889, 'samples': 1181856, 'steps': 2308, 'loss/train': 1.682417869567871} -09/20/2021 22:29:14 - INFO - __main__ - Step 36934: {'lr': 0.00019950655960564889, 'samples': 1181888, 'steps': 2308, 'loss/train': 2.6551969051361084} -09/20/2021 22:29:15 - INFO - __main__ - Step 36935: {'lr': 0.00019950655960564889, 'samples': 1181920, 'steps': 2308, 'loss/train': 2.199215888977051} -09/20/2021 22:29:16 - INFO - __main__ - Step 36936: {'lr': 0.00019950655960564889, 'samples': 1181952, 'steps': 2308, 'loss/train': 2.336611270904541} -09/20/2021 22:29:16 - INFO - __main__ - Step 36937: {'lr': 0.00019950655960564889, 'samples': 1181984, 'steps': 2308, 'loss/train': 1.9185199737548828} -09/20/2021 22:29:17 - INFO - __main__ - Step 36938: {'lr': 0.00019950655960564889, 'samples': 1182016, 'steps': 2308, 'loss/train': 0.9721820950508118} -09/20/2021 22:29:18 - INFO - __main__ - Step 36939: {'lr': 0.00019950655960564889, 'samples': 1182048, 'steps': 2308, 'loss/train': 6.206055164337158} -09/20/2021 22:29:19 - INFO - __main__ - Step 36940: {'lr': 0.00019950655960564889, 'samples': 1182080, 'steps': 2308, 'loss/train': 3.2316272258758545} -09/20/2021 22:29:19 - INFO - __main__ - Step 36941: {'lr': 0.00019950655960564889, 'samples': 1182112, 'steps': 2308, 'loss/train': 0.5809347629547119} -09/20/2021 22:29:20 - INFO - __main__ - Step 36942: {'lr': 0.00019950655960564889, 'samples': 1182144, 'steps': 2308, 'loss/train': 2.8531265258789062} -09/20/2021 22:29:21 - INFO - __main__ - Step 36943: {'lr': 0.00019950655960564889, 'samples': 1182176, 'steps': 2308, 'loss/train': 2.4328720569610596} -09/20/2021 22:29:22 - INFO - __main__ - Step 36944: {'lr': 0.00019950655960564889, 'samples': 1182208, 'steps': 2308, 'loss/train': 2.5563313961029053} -09/20/2021 22:29:22 - INFO - __main__ - Step 36945: {'lr': 0.00019950592649667245, 'samples': 1182240, 'steps': 2309, 'loss/train': 2.1397368907928467} -09/20/2021 22:29:23 - INFO - __main__ - Step 36946: {'lr': 0.00019950592649667245, 'samples': 1182272, 'steps': 2309, 'loss/train': 2.9066569805145264} -09/20/2021 22:29:24 - INFO - __main__ - Step 36947: {'lr': 0.00019950592649667245, 'samples': 1182304, 'steps': 2309, 'loss/train': 1.0090296268463135} -09/20/2021 22:29:25 - INFO - __main__ - Step 36948: {'lr': 0.00019950592649667245, 'samples': 1182336, 'steps': 2309, 'loss/train': 0.7327121496200562} -09/20/2021 22:29:26 - INFO - __main__ - Step 36949: {'lr': 0.00019950592649667245, 'samples': 1182368, 'steps': 2309, 'loss/train': 2.278682231903076} -09/20/2021 22:29:27 - INFO - __main__ - Step 36950: {'lr': 0.00019950592649667245, 'samples': 1182400, 'steps': 2309, 'loss/train': 1.6909925937652588} -09/20/2021 22:29:27 - INFO - __main__ - Step 36951: {'lr': 0.00019950592649667245, 'samples': 1182432, 'steps': 2309, 'loss/train': 2.161964178085327} -09/20/2021 22:29:28 - INFO - __main__ - Step 36952: {'lr': 0.00019950592649667245, 'samples': 1182464, 'steps': 2309, 'loss/train': 2.669299840927124} -09/20/2021 22:29:29 - INFO - __main__ - Step 36953: {'lr': 0.00019950592649667245, 'samples': 1182496, 'steps': 2309, 'loss/train': 2.2679474353790283} -09/20/2021 22:29:30 - INFO - __main__ - Step 36954: {'lr': 0.00019950592649667245, 'samples': 1182528, 'steps': 2309, 'loss/train': 1.3384416103363037} -09/20/2021 22:29:30 - INFO - __main__ - Step 36955: {'lr': 0.00019950592649667245, 'samples': 1182560, 'steps': 2309, 'loss/train': 1.4245713949203491} -09/20/2021 22:29:31 - INFO - __main__ - Step 36956: {'lr': 0.00019950592649667245, 'samples': 1182592, 'steps': 2309, 'loss/train': 1.219451665878296} -09/20/2021 22:29:32 - INFO - __main__ - Step 36957: {'lr': 0.00019950592649667245, 'samples': 1182624, 'steps': 2309, 'loss/train': 1.8057483434677124} -09/20/2021 22:29:33 - INFO - __main__ - Step 36958: {'lr': 0.00019950592649667245, 'samples': 1182656, 'steps': 2309, 'loss/train': 2.6104965209960938} -09/20/2021 22:29:33 - INFO - __main__ - Step 36959: {'lr': 0.00019950592649667245, 'samples': 1182688, 'steps': 2309, 'loss/train': 2.156461477279663} -09/20/2021 22:29:34 - INFO - __main__ - Step 36960: {'lr': 0.00019950592649667245, 'samples': 1182720, 'steps': 2309, 'loss/train': 3.3179497718811035} -09/20/2021 22:29:35 - INFO - __main__ - Step 36961: {'lr': 0.00019950529298280682, 'samples': 1182752, 'steps': 2310, 'loss/train': 2.419344902038574} -09/20/2021 22:29:36 - INFO - __main__ - Step 36962: {'lr': 0.00019950529298280682, 'samples': 1182784, 'steps': 2310, 'loss/train': 3.27730131149292} -09/20/2021 22:29:37 - INFO - __main__ - Step 36963: {'lr': 0.00019950529298280682, 'samples': 1182816, 'steps': 2310, 'loss/train': 2.790178060531616} -09/20/2021 22:29:37 - INFO - __main__ - Step 36964: {'lr': 0.00019950529298280682, 'samples': 1182848, 'steps': 2310, 'loss/train': 0.8929738998413086} -09/20/2021 22:29:38 - INFO - __main__ - Step 36965: {'lr': 0.00019950529298280682, 'samples': 1182880, 'steps': 2310, 'loss/train': 2.1794958114624023} -09/20/2021 22:29:39 - INFO - __main__ - Step 36966: {'lr': 0.00019950529298280682, 'samples': 1182912, 'steps': 2310, 'loss/train': 2.118513822555542} -09/20/2021 22:29:40 - INFO - __main__ - Step 36967: {'lr': 0.00019950529298280682, 'samples': 1182944, 'steps': 2310, 'loss/train': 2.6910006999969482} -09/20/2021 22:29:40 - INFO - __main__ - Step 36968: {'lr': 0.00019950529298280682, 'samples': 1182976, 'steps': 2310, 'loss/train': 2.1620676517486572} -09/20/2021 22:29:41 - INFO - __main__ - Step 36969: {'lr': 0.00019950529298280682, 'samples': 1183008, 'steps': 2310, 'loss/train': 2.758857488632202} -09/20/2021 22:29:42 - INFO - __main__ - Step 36970: {'lr': 0.00019950529298280682, 'samples': 1183040, 'steps': 2310, 'loss/train': 1.1083651781082153} -09/20/2021 22:29:43 - INFO - __main__ - Step 36971: {'lr': 0.00019950529298280682, 'samples': 1183072, 'steps': 2310, 'loss/train': 2.413910150527954} -09/20/2021 22:29:43 - INFO - __main__ - Step 36972: {'lr': 0.00019950529298280682, 'samples': 1183104, 'steps': 2310, 'loss/train': 2.614987373352051} -09/20/2021 22:29:44 - INFO - __main__ - Step 36973: {'lr': 0.00019950529298280682, 'samples': 1183136, 'steps': 2310, 'loss/train': 2.871166944503784} -09/20/2021 22:29:45 - INFO - __main__ - Step 36974: {'lr': 0.00019950529298280682, 'samples': 1183168, 'steps': 2310, 'loss/train': 2.4077930450439453} -09/20/2021 22:29:46 - INFO - __main__ - Step 36975: {'lr': 0.00019950529298280682, 'samples': 1183200, 'steps': 2310, 'loss/train': 2.479365825653076} -09/20/2021 22:29:46 - INFO - __main__ - Step 36976: {'lr': 0.00019950529298280682, 'samples': 1183232, 'steps': 2310, 'loss/train': 2.7464170455932617} -09/20/2021 22:29:47 - INFO - __main__ - Step 36977: {'lr': 0.00019950465906405453, 'samples': 1183264, 'steps': 2311, 'loss/train': 2.151771068572998} -09/20/2021 22:29:49 - INFO - __main__ - Step 36978: {'lr': 0.00019950465906405453, 'samples': 1183296, 'steps': 2311, 'loss/train': 1.9700921773910522} -09/20/2021 22:29:49 - INFO - __main__ - Step 36979: {'lr': 0.00019950465906405453, 'samples': 1183328, 'steps': 2311, 'loss/train': 1.9808874130249023} -09/20/2021 22:29:50 - INFO - __main__ - Step 36980: {'lr': 0.00019950465906405453, 'samples': 1183360, 'steps': 2311, 'loss/train': 2.8853261470794678} -09/20/2021 22:29:51 - INFO - __main__ - Step 36981: {'lr': 0.00019950465906405453, 'samples': 1183392, 'steps': 2311, 'loss/train': 0.4124436676502228} -09/20/2021 22:29:52 - INFO - __main__ - Step 36982: {'lr': 0.00019950465906405453, 'samples': 1183424, 'steps': 2311, 'loss/train': 2.416764259338379} -09/20/2021 22:29:52 - INFO - __main__ - Step 36983: {'lr': 0.00019950465906405453, 'samples': 1183456, 'steps': 2311, 'loss/train': 1.839063286781311} -09/20/2021 22:29:53 - INFO - __main__ - Step 36984: {'lr': 0.00019950465906405453, 'samples': 1183488, 'steps': 2311, 'loss/train': 3.240614175796509} -09/20/2021 22:29:54 - INFO - __main__ - Step 36985: {'lr': 0.00019950465906405453, 'samples': 1183520, 'steps': 2311, 'loss/train': 2.504323720932007} -09/20/2021 22:29:55 - INFO - __main__ - Step 36986: {'lr': 0.00019950465906405453, 'samples': 1183552, 'steps': 2311, 'loss/train': 1.9140065908432007} -09/20/2021 22:29:55 - INFO - __main__ - Step 36987: {'lr': 0.00019950465906405453, 'samples': 1183584, 'steps': 2311, 'loss/train': 1.7673747539520264} -09/20/2021 22:29:56 - INFO - __main__ - Step 36988: {'lr': 0.00019950465906405453, 'samples': 1183616, 'steps': 2311, 'loss/train': 2.4424071311950684} -09/20/2021 22:29:57 - INFO - __main__ - Step 36989: {'lr': 0.00019950465906405453, 'samples': 1183648, 'steps': 2311, 'loss/train': 2.9023289680480957} -09/20/2021 22:29:58 - INFO - __main__ - Step 36990: {'lr': 0.00019950465906405453, 'samples': 1183680, 'steps': 2311, 'loss/train': 2.2411179542541504} -09/20/2021 22:29:58 - INFO - __main__ - Step 36991: {'lr': 0.00019950465906405453, 'samples': 1183712, 'steps': 2311, 'loss/train': 1.9468756914138794} -09/20/2021 22:29:59 - INFO - __main__ - Step 36992: {'lr': 0.00019950465906405453, 'samples': 1183744, 'steps': 2311, 'loss/train': 2.0308752059936523} -09/20/2021 22:30:00 - INFO - __main__ - Step 36993: {'lr': 0.0001995040247404182, 'samples': 1183776, 'steps': 2312, 'loss/train': 2.103423833847046} -09/20/2021 22:30:01 - INFO - __main__ - Step 36994: {'lr': 0.0001995040247404182, 'samples': 1183808, 'steps': 2312, 'loss/train': 2.537952184677124} -09/20/2021 22:30:02 - INFO - __main__ - Step 36995: {'lr': 0.0001995040247404182, 'samples': 1183840, 'steps': 2312, 'loss/train': 2.4358460903167725} -09/20/2021 22:30:02 - INFO - __main__ - Step 36996: {'lr': 0.0001995040247404182, 'samples': 1183872, 'steps': 2312, 'loss/train': 2.4980366230010986} -09/20/2021 22:30:03 - INFO - __main__ - Step 36997: {'lr': 0.0001995040247404182, 'samples': 1183904, 'steps': 2312, 'loss/train': 1.7558706998825073} -09/20/2021 22:30:04 - INFO - __main__ - Step 36998: {'lr': 0.0001995040247404182, 'samples': 1183936, 'steps': 2312, 'loss/train': 1.575111985206604} -09/20/2021 22:30:05 - INFO - __main__ - Step 36999: {'lr': 0.0001995040247404182, 'samples': 1183968, 'steps': 2312, 'loss/train': 2.1389658451080322} -09/20/2021 22:30:05 - INFO - __main__ - Step 37000: {'lr': 0.0001995040247404182, 'samples': 1184000, 'steps': 2312, 'loss/train': 2.0352823734283447} -09/20/2021 22:30:06 - INFO - __main__ - Step 37001: {'lr': 0.0001995040247404182, 'samples': 1184032, 'steps': 2312, 'loss/train': 2.0899288654327393} -09/20/2021 22:30:07 - INFO - __main__ - Step 37002: {'lr': 0.0001995040247404182, 'samples': 1184064, 'steps': 2312, 'loss/train': 1.619226098060608} -09/20/2021 22:30:08 - INFO - __main__ - Step 37003: {'lr': 0.0001995040247404182, 'samples': 1184096, 'steps': 2312, 'loss/train': 0.3155755400657654} -09/20/2021 22:30:08 - INFO - __main__ - Step 37004: {'lr': 0.0001995040247404182, 'samples': 1184128, 'steps': 2312, 'loss/train': 0.3946026563644409} -09/20/2021 22:30:09 - INFO - __main__ - Step 37005: {'lr': 0.0001995040247404182, 'samples': 1184160, 'steps': 2312, 'loss/train': 0.2288421094417572} -09/20/2021 22:30:10 - INFO - __main__ - Step 37006: {'lr': 0.0001995040247404182, 'samples': 1184192, 'steps': 2312, 'loss/train': 0.4056825637817383} -09/20/2021 22:30:11 - INFO - __main__ - Step 37007: {'lr': 0.0001995040247404182, 'samples': 1184224, 'steps': 2312, 'loss/train': 3.0170271396636963} -09/20/2021 22:30:11 - INFO - __main__ - Step 37008: {'lr': 0.0001995040247404182, 'samples': 1184256, 'steps': 2312, 'loss/train': 2.2270750999450684} -09/20/2021 22:30:13 - INFO - __main__ - Step 37009: {'lr': 0.00019950339001190032, 'samples': 1184288, 'steps': 2313, 'loss/train': 2.327998161315918} -09/20/2021 22:30:14 - INFO - __main__ - Step 37010: {'lr': 0.00019950339001190032, 'samples': 1184320, 'steps': 2313, 'loss/train': 1.8317514657974243} -09/20/2021 22:30:14 - INFO - __main__ - Step 37011: {'lr': 0.00019950339001190032, 'samples': 1184352, 'steps': 2313, 'loss/train': 2.23630428314209} -09/20/2021 22:30:15 - INFO - __main__ - Step 37012: {'lr': 0.00019950339001190032, 'samples': 1184384, 'steps': 2313, 'loss/train': 1.8848330974578857} -09/20/2021 22:30:16 - INFO - __main__ - Step 37013: {'lr': 0.00019950339001190032, 'samples': 1184416, 'steps': 2313, 'loss/train': 2.725416660308838} -09/20/2021 22:30:17 - INFO - __main__ - Step 37014: {'lr': 0.00019950339001190032, 'samples': 1184448, 'steps': 2313, 'loss/train': 2.5440664291381836} -09/20/2021 22:30:17 - INFO - __main__ - Step 37015: {'lr': 0.00019950339001190032, 'samples': 1184480, 'steps': 2313, 'loss/train': 2.3939433097839355} -09/20/2021 22:30:18 - INFO - __main__ - Step 37016: {'lr': 0.00019950339001190032, 'samples': 1184512, 'steps': 2313, 'loss/train': 2.2036054134368896} -09/20/2021 22:30:19 - INFO - __main__ - Step 37017: {'lr': 0.00019950339001190032, 'samples': 1184544, 'steps': 2313, 'loss/train': 1.8340388536453247} -09/20/2021 22:30:20 - INFO - __main__ - Step 37018: {'lr': 0.00019950339001190032, 'samples': 1184576, 'steps': 2313, 'loss/train': 2.14327073097229} -09/20/2021 22:30:20 - INFO - __main__ - Step 37019: {'lr': 0.00019950339001190032, 'samples': 1184608, 'steps': 2313, 'loss/train': 1.9812802076339722} -09/20/2021 22:30:21 - INFO - __main__ - Step 37020: {'lr': 0.00019950339001190032, 'samples': 1184640, 'steps': 2313, 'loss/train': 3.020944833755493} -09/20/2021 22:30:22 - INFO - __main__ - Step 37021: {'lr': 0.00019950339001190032, 'samples': 1184672, 'steps': 2313, 'loss/train': 2.356302499771118} -09/20/2021 22:30:23 - INFO - __main__ - Step 37022: {'lr': 0.00019950339001190032, 'samples': 1184704, 'steps': 2313, 'loss/train': 2.1275289058685303} -09/20/2021 22:30:23 - INFO - __main__ - Step 37023: {'lr': 0.00019950339001190032, 'samples': 1184736, 'steps': 2313, 'loss/train': 1.7692149877548218} -09/20/2021 22:30:24 - INFO - __main__ - Step 37024: {'lr': 0.00019950339001190032, 'samples': 1184768, 'steps': 2313, 'loss/train': 0.6290568113327026} -09/20/2021 22:30:25 - INFO - __main__ - Step 37025: {'lr': 0.00019950275487850357, 'samples': 1184800, 'steps': 2314, 'loss/train': 1.1499062776565552} -09/20/2021 22:30:26 - INFO - __main__ - Step 37026: {'lr': 0.00019950275487850357, 'samples': 1184832, 'steps': 2314, 'loss/train': 2.1447267532348633} -09/20/2021 22:30:27 - INFO - __main__ - Step 37027: {'lr': 0.00019950275487850357, 'samples': 1184864, 'steps': 2314, 'loss/train': 2.319676637649536} -09/20/2021 22:30:27 - INFO - __main__ - Step 37028: {'lr': 0.00019950275487850357, 'samples': 1184896, 'steps': 2314, 'loss/train': 1.683861494064331} -09/20/2021 22:30:28 - INFO - __main__ - Step 37029: {'lr': 0.00019950275487850357, 'samples': 1184928, 'steps': 2314, 'loss/train': 4.495555400848389} -09/20/2021 22:30:29 - INFO - __main__ - Step 37030: {'lr': 0.00019950275487850357, 'samples': 1184960, 'steps': 2314, 'loss/train': 1.7872408628463745} -09/20/2021 22:30:30 - INFO - __main__ - Step 37031: {'lr': 0.00019950275487850357, 'samples': 1184992, 'steps': 2314, 'loss/train': 0.8267501592636108} -09/20/2021 22:30:30 - INFO - __main__ - Step 37032: {'lr': 0.00019950275487850357, 'samples': 1185024, 'steps': 2314, 'loss/train': 0.6261339783668518} -09/20/2021 22:30:31 - INFO - __main__ - Step 37033: {'lr': 0.00019950275487850357, 'samples': 1185056, 'steps': 2314, 'loss/train': 2.9208292961120605} -09/20/2021 22:30:32 - INFO - __main__ - Step 37034: {'lr': 0.00019950275487850357, 'samples': 1185088, 'steps': 2314, 'loss/train': 2.1479222774505615} -09/20/2021 22:30:33 - INFO - __main__ - Step 37035: {'lr': 0.00019950275487850357, 'samples': 1185120, 'steps': 2314, 'loss/train': 2.114333152770996} -09/20/2021 22:30:33 - INFO - __main__ - Step 37036: {'lr': 0.00019950275487850357, 'samples': 1185152, 'steps': 2314, 'loss/train': 3.128004312515259} -09/20/2021 22:30:34 - INFO - __main__ - Step 37037: {'lr': 0.00019950275487850357, 'samples': 1185184, 'steps': 2314, 'loss/train': 2.346832036972046} -09/20/2021 22:30:35 - INFO - __main__ - Step 37038: {'lr': 0.00019950275487850357, 'samples': 1185216, 'steps': 2314, 'loss/train': 2.136404275894165} -09/20/2021 22:30:36 - INFO - __main__ - Step 37039: {'lr': 0.00019950275487850357, 'samples': 1185248, 'steps': 2314, 'loss/train': 2.2670626640319824} -09/20/2021 22:30:37 - INFO - __main__ - Step 37040: {'lr': 0.00019950275487850357, 'samples': 1185280, 'steps': 2314, 'loss/train': 0.4344088137149811} -09/20/2021 22:30:38 - INFO - __main__ - Step 37041: {'lr': 0.0001995021193402305, 'samples': 1185312, 'steps': 2315, 'loss/train': 2.9160690307617188} -09/20/2021 22:30:39 - INFO - __main__ - Step 37042: {'lr': 0.0001995021193402305, 'samples': 1185344, 'steps': 2315, 'loss/train': 2.8204808235168457} -09/20/2021 22:30:40 - INFO - __main__ - Step 37043: {'lr': 0.0001995021193402305, 'samples': 1185376, 'steps': 2315, 'loss/train': 3.268021821975708} -09/20/2021 22:30:40 - INFO - __main__ - Step 37044: {'lr': 0.0001995021193402305, 'samples': 1185408, 'steps': 2315, 'loss/train': 2.334995746612549} -09/20/2021 22:30:41 - INFO - __main__ - Step 37045: {'lr': 0.0001995021193402305, 'samples': 1185440, 'steps': 2315, 'loss/train': 2.4356398582458496} -09/20/2021 22:30:42 - INFO - __main__ - Step 37046: {'lr': 0.0001995021193402305, 'samples': 1185472, 'steps': 2315, 'loss/train': 2.739071846008301} -09/20/2021 22:30:43 - INFO - __main__ - Step 37047: {'lr': 0.0001995021193402305, 'samples': 1185504, 'steps': 2315, 'loss/train': 1.977515697479248} -09/20/2021 22:30:43 - INFO - __main__ - Step 37048: {'lr': 0.0001995021193402305, 'samples': 1185536, 'steps': 2315, 'loss/train': 3.644619941711426} -09/20/2021 22:30:44 - INFO - __main__ - Step 37049: {'lr': 0.0001995021193402305, 'samples': 1185568, 'steps': 2315, 'loss/train': 1.1412931680679321} -09/20/2021 22:30:45 - INFO - __main__ - Step 37050: {'lr': 0.0001995021193402305, 'samples': 1185600, 'steps': 2315, 'loss/train': 2.5377767086029053} -09/20/2021 22:30:46 - INFO - __main__ - Step 37051: {'lr': 0.0001995021193402305, 'samples': 1185632, 'steps': 2315, 'loss/train': 2.9962658882141113} -09/20/2021 22:30:46 - INFO - __main__ - Step 37052: {'lr': 0.0001995021193402305, 'samples': 1185664, 'steps': 2315, 'loss/train': 2.778519630432129} -09/20/2021 22:30:47 - INFO - __main__ - Step 37053: {'lr': 0.0001995021193402305, 'samples': 1185696, 'steps': 2315, 'loss/train': 2.2812185287475586} -09/20/2021 22:30:48 - INFO - __main__ - Step 37054: {'lr': 0.0001995021193402305, 'samples': 1185728, 'steps': 2315, 'loss/train': 1.836717963218689} -09/20/2021 22:30:49 - INFO - __main__ - Step 37055: {'lr': 0.0001995021193402305, 'samples': 1185760, 'steps': 2315, 'loss/train': 1.8371260166168213} -09/20/2021 22:30:49 - INFO - __main__ - Step 37056: {'lr': 0.0001995021193402305, 'samples': 1185792, 'steps': 2315, 'loss/train': 1.8497822284698486} -09/20/2021 22:30:50 - INFO - __main__ - Step 37057: {'lr': 0.0001995014833970837, 'samples': 1185824, 'steps': 2316, 'loss/train': 1.9151601791381836} -09/20/2021 22:30:51 - INFO - __main__ - Step 37058: {'lr': 0.0001995014833970837, 'samples': 1185856, 'steps': 2316, 'loss/train': 1.2360249757766724} -09/20/2021 22:30:52 - INFO - __main__ - Step 37059: {'lr': 0.0001995014833970837, 'samples': 1185888, 'steps': 2316, 'loss/train': 2.95778489112854} -09/20/2021 22:30:52 - INFO - __main__ - Step 37060: {'lr': 0.0001995014833970837, 'samples': 1185920, 'steps': 2316, 'loss/train': 2.518138885498047} -09/20/2021 22:30:53 - INFO - __main__ - Step 37061: {'lr': 0.0001995014833970837, 'samples': 1185952, 'steps': 2316, 'loss/train': 2.0577805042266846} -09/20/2021 22:30:54 - INFO - __main__ - Step 37062: {'lr': 0.0001995014833970837, 'samples': 1185984, 'steps': 2316, 'loss/train': 0.5359758138656616} -09/20/2021 22:30:55 - INFO - __main__ - Step 37063: {'lr': 0.0001995014833970837, 'samples': 1186016, 'steps': 2316, 'loss/train': 0.18280147016048431} -09/20/2021 22:30:55 - INFO - __main__ - Step 37064: {'lr': 0.0001995014833970837, 'samples': 1186048, 'steps': 2316, 'loss/train': 0.5132797360420227} -09/20/2021 22:30:56 - INFO - __main__ - Step 37065: {'lr': 0.0001995014833970837, 'samples': 1186080, 'steps': 2316, 'loss/train': 0.18608269095420837} -09/20/2021 22:30:57 - INFO - __main__ - Step 37066: {'lr': 0.0001995014833970837, 'samples': 1186112, 'steps': 2316, 'loss/train': 0.3879016637802124} -09/20/2021 22:30:58 - INFO - __main__ - Step 37067: {'lr': 0.0001995014833970837, 'samples': 1186144, 'steps': 2316, 'loss/train': 0.2937532365322113} -09/20/2021 22:30:58 - INFO - __main__ - Step 37068: {'lr': 0.0001995014833970837, 'samples': 1186176, 'steps': 2316, 'loss/train': 1.6691343784332275} -09/20/2021 22:30:59 - INFO - __main__ - Step 37069: {'lr': 0.0001995014833970837, 'samples': 1186208, 'steps': 2316, 'loss/train': 2.465653657913208} -09/20/2021 22:31:01 - INFO - __main__ - Step 37070: {'lr': 0.0001995014833970837, 'samples': 1186240, 'steps': 2316, 'loss/train': 2.1870100498199463} -09/20/2021 22:31:02 - INFO - __main__ - Step 37071: {'lr': 0.0001995014833970837, 'samples': 1186272, 'steps': 2316, 'loss/train': 1.6803946495056152} -09/20/2021 22:31:03 - INFO - __main__ - Step 37072: {'lr': 0.0001995014833970837, 'samples': 1186304, 'steps': 2316, 'loss/train': 1.898516058921814} -09/20/2021 22:31:03 - INFO - __main__ - Step 37073: {'lr': 0.0001995008470490657, 'samples': 1186336, 'steps': 2317, 'loss/train': 2.536329746246338} -09/20/2021 22:31:04 - INFO - __main__ - Step 37074: {'lr': 0.0001995008470490657, 'samples': 1186368, 'steps': 2317, 'loss/train': 1.7087069749832153} -09/20/2021 22:31:05 - INFO - __main__ - Step 37075: {'lr': 0.0001995008470490657, 'samples': 1186400, 'steps': 2317, 'loss/train': 2.602463960647583} -09/20/2021 22:31:06 - INFO - __main__ - Step 37076: {'lr': 0.0001995008470490657, 'samples': 1186432, 'steps': 2317, 'loss/train': 1.5814517736434937} -09/20/2021 22:31:06 - INFO - __main__ - Step 37077: {'lr': 0.0001995008470490657, 'samples': 1186464, 'steps': 2317, 'loss/train': 1.223340392112732} -09/20/2021 22:31:07 - INFO - __main__ - Step 37078: {'lr': 0.0001995008470490657, 'samples': 1186496, 'steps': 2317, 'loss/train': 2.2432305812835693} -09/20/2021 22:31:08 - INFO - __main__ - Step 37079: {'lr': 0.0001995008470490657, 'samples': 1186528, 'steps': 2317, 'loss/train': 1.7930753231048584} -09/20/2021 22:31:09 - INFO - __main__ - Step 37080: {'lr': 0.0001995008470490657, 'samples': 1186560, 'steps': 2317, 'loss/train': 0.4122645854949951} -09/20/2021 22:31:09 - INFO - __main__ - Step 37081: {'lr': 0.0001995008470490657, 'samples': 1186592, 'steps': 2317, 'loss/train': 0.795714795589447} -09/20/2021 22:31:10 - INFO - __main__ - Step 37082: {'lr': 0.0001995008470490657, 'samples': 1186624, 'steps': 2317, 'loss/train': 0.6954382658004761} -09/20/2021 22:31:11 - INFO - __main__ - Step 37083: {'lr': 0.0001995008470490657, 'samples': 1186656, 'steps': 2317, 'loss/train': 2.7783026695251465} -09/20/2021 22:31:12 - INFO - __main__ - Step 37084: {'lr': 0.0001995008470490657, 'samples': 1186688, 'steps': 2317, 'loss/train': 2.520382881164551} -09/20/2021 22:31:12 - INFO - __main__ - Step 37085: {'lr': 0.0001995008470490657, 'samples': 1186720, 'steps': 2317, 'loss/train': 1.916652798652649} -09/20/2021 22:31:13 - INFO - __main__ - Step 37086: {'lr': 0.0001995008470490657, 'samples': 1186752, 'steps': 2317, 'loss/train': 1.846400499343872} -09/20/2021 22:31:14 - INFO - __main__ - Step 37087: {'lr': 0.0001995008470490657, 'samples': 1186784, 'steps': 2317, 'loss/train': 1.6038569211959839} -09/20/2021 22:31:15 - INFO - __main__ - Step 37088: {'lr': 0.0001995008470490657, 'samples': 1186816, 'steps': 2317, 'loss/train': 1.200553059577942} -09/20/2021 22:31:16 - INFO - __main__ - Step 37089: {'lr': 0.00019950021029617918, 'samples': 1186848, 'steps': 2318, 'loss/train': 2.402621269226074} -09/20/2021 22:31:16 - INFO - __main__ - Step 37090: {'lr': 0.00019950021029617918, 'samples': 1186880, 'steps': 2318, 'loss/train': 2.339186191558838} -09/20/2021 22:31:17 - INFO - __main__ - Step 37091: {'lr': 0.00019950021029617918, 'samples': 1186912, 'steps': 2318, 'loss/train': 1.4472978115081787} -09/20/2021 22:31:18 - INFO - __main__ - Step 37092: {'lr': 0.00019950021029617918, 'samples': 1186944, 'steps': 2318, 'loss/train': 2.5438449382781982} -09/20/2021 22:31:19 - INFO - __main__ - Step 37093: {'lr': 0.00019950021029617918, 'samples': 1186976, 'steps': 2318, 'loss/train': 2.027554988861084} -09/20/2021 22:31:19 - INFO - __main__ - Step 37094: {'lr': 0.00019950021029617918, 'samples': 1187008, 'steps': 2318, 'loss/train': 2.2472715377807617} -09/20/2021 22:31:20 - INFO - __main__ - Step 37095: {'lr': 0.00019950021029617918, 'samples': 1187040, 'steps': 2318, 'loss/train': 1.5197639465332031} -09/20/2021 22:31:21 - INFO - __main__ - Step 37096: {'lr': 0.00019950021029617918, 'samples': 1187072, 'steps': 2318, 'loss/train': 2.241884708404541} -09/20/2021 22:31:22 - INFO - __main__ - Step 37097: {'lr': 0.00019950021029617918, 'samples': 1187104, 'steps': 2318, 'loss/train': 2.553055763244629} -09/20/2021 22:31:22 - INFO - __main__ - Step 37098: {'lr': 0.00019950021029617918, 'samples': 1187136, 'steps': 2318, 'loss/train': 2.200139045715332} -09/20/2021 22:31:23 - INFO - __main__ - Step 37099: {'lr': 0.00019950021029617918, 'samples': 1187168, 'steps': 2318, 'loss/train': 1.8665056228637695} -09/20/2021 22:31:24 - INFO - __main__ - Step 37100: {'lr': 0.00019950021029617918, 'samples': 1187200, 'steps': 2318, 'loss/train': 0.26006707549095154} -09/20/2021 22:31:25 - INFO - __main__ - Step 37101: {'lr': 0.00019950021029617918, 'samples': 1187232, 'steps': 2318, 'loss/train': 0.20085224509239197} -09/20/2021 22:31:25 - INFO - __main__ - Step 37102: {'lr': 0.00019950021029617918, 'samples': 1187264, 'steps': 2318, 'loss/train': 0.194830983877182} -09/20/2021 22:31:26 - INFO - __main__ - Step 37103: {'lr': 0.00019950021029617918, 'samples': 1187296, 'steps': 2318, 'loss/train': 0.26279014348983765} -09/20/2021 22:31:27 - INFO - __main__ - Step 37104: {'lr': 0.00019950021029617918, 'samples': 1187328, 'steps': 2318, 'loss/train': 0.4635680317878723} -09/20/2021 22:31:28 - INFO - __main__ - Step 37105: {'lr': 0.0001994995731384267, 'samples': 1187360, 'steps': 2319, 'loss/train': 1.6757789850234985} -09/20/2021 22:31:29 - INFO - __main__ - Step 37106: {'lr': 0.0001994995731384267, 'samples': 1187392, 'steps': 2319, 'loss/train': 0.9501187801361084} -09/20/2021 22:31:30 - INFO - __main__ - Step 37107: {'lr': 0.0001994995731384267, 'samples': 1187424, 'steps': 2319, 'loss/train': 2.521113157272339} -09/20/2021 22:31:30 - INFO - __main__ - Step 37108: {'lr': 0.0001994995731384267, 'samples': 1187456, 'steps': 2319, 'loss/train': 2.730499267578125} -09/20/2021 22:31:31 - INFO - __main__ - Step 37109: {'lr': 0.0001994995731384267, 'samples': 1187488, 'steps': 2319, 'loss/train': 2.015465259552002} -09/20/2021 22:31:32 - INFO - __main__ - Step 37110: {'lr': 0.0001994995731384267, 'samples': 1187520, 'steps': 2319, 'loss/train': 1.664561152458191} -09/20/2021 22:31:33 - INFO - __main__ - Step 37111: {'lr': 0.0001994995731384267, 'samples': 1187552, 'steps': 2319, 'loss/train': 2.5198330879211426} -09/20/2021 22:31:33 - INFO - __main__ - Step 37112: {'lr': 0.0001994995731384267, 'samples': 1187584, 'steps': 2319, 'loss/train': 1.6533758640289307} -09/20/2021 22:31:34 - INFO - __main__ - Step 37113: {'lr': 0.0001994995731384267, 'samples': 1187616, 'steps': 2319, 'loss/train': 1.4971644878387451} -09/20/2021 22:31:35 - INFO - __main__ - Step 37114: {'lr': 0.0001994995731384267, 'samples': 1187648, 'steps': 2319, 'loss/train': 2.4867494106292725} -09/20/2021 22:31:36 - INFO - __main__ - Step 37115: {'lr': 0.0001994995731384267, 'samples': 1187680, 'steps': 2319, 'loss/train': 1.9251415729522705} -09/20/2021 22:31:36 - INFO - __main__ - Step 37116: {'lr': 0.0001994995731384267, 'samples': 1187712, 'steps': 2319, 'loss/train': 2.2576487064361572} -09/20/2021 22:31:37 - INFO - __main__ - Step 37117: {'lr': 0.0001994995731384267, 'samples': 1187744, 'steps': 2319, 'loss/train': 2.373190402984619} -09/20/2021 22:31:38 - INFO - __main__ - Step 37118: {'lr': 0.0001994995731384267, 'samples': 1187776, 'steps': 2319, 'loss/train': 3.3867127895355225} -09/20/2021 22:31:39 - INFO - __main__ - Step 37119: {'lr': 0.0001994995731384267, 'samples': 1187808, 'steps': 2319, 'loss/train': 0.7961713075637817} -09/20/2021 22:31:39 - INFO - __main__ - Step 37120: {'lr': 0.0001994995731384267, 'samples': 1187840, 'steps': 2319, 'loss/train': 2.790003776550293} -09/20/2021 22:31:40 - INFO - __main__ - Step 37121: {'lr': 0.00019949893557581077, 'samples': 1187872, 'steps': 2320, 'loss/train': 2.2459800243377686} -09/20/2021 22:31:41 - INFO - __main__ - Step 37122: {'lr': 0.00019949893557581077, 'samples': 1187904, 'steps': 2320, 'loss/train': 2.437079429626465} -09/20/2021 22:31:42 - INFO - __main__ - Step 37123: {'lr': 0.00019949893557581077, 'samples': 1187936, 'steps': 2320, 'loss/train': 2.2264792919158936} -09/20/2021 22:31:43 - INFO - __main__ - Step 37124: {'lr': 0.00019949893557581077, 'samples': 1187968, 'steps': 2320, 'loss/train': 1.771805763244629} -09/20/2021 22:31:43 - INFO - __main__ - Step 37125: {'lr': 0.00019949893557581077, 'samples': 1188000, 'steps': 2320, 'loss/train': 2.8490169048309326} -09/20/2021 22:31:44 - INFO - __main__ - Step 37126: {'lr': 0.00019949893557581077, 'samples': 1188032, 'steps': 2320, 'loss/train': 0.6490399241447449} -09/20/2021 22:31:45 - INFO - __main__ - Step 37127: {'lr': 0.00019949893557581077, 'samples': 1188064, 'steps': 2320, 'loss/train': 2.288717269897461} -09/20/2021 22:31:46 - INFO - __main__ - Step 37128: {'lr': 0.00019949893557581077, 'samples': 1188096, 'steps': 2320, 'loss/train': 1.7315901517868042} -09/20/2021 22:31:46 - INFO - __main__ - Step 37129: {'lr': 0.00019949893557581077, 'samples': 1188128, 'steps': 2320, 'loss/train': 2.260108470916748} -09/20/2021 22:31:47 - INFO - __main__ - Step 37130: {'lr': 0.00019949893557581077, 'samples': 1188160, 'steps': 2320, 'loss/train': 2.3806309700012207} -09/20/2021 22:31:48 - INFO - __main__ - Step 37131: {'lr': 0.00019949893557581077, 'samples': 1188192, 'steps': 2320, 'loss/train': 2.448225736618042} -09/20/2021 22:31:49 - INFO - __main__ - Step 37132: {'lr': 0.00019949893557581077, 'samples': 1188224, 'steps': 2320, 'loss/train': 2.2264950275421143} -09/20/2021 22:31:49 - INFO - __main__ - Step 37133: {'lr': 0.00019949893557581077, 'samples': 1188256, 'steps': 2320, 'loss/train': 1.965470552444458} -09/20/2021 22:31:50 - INFO - __main__ - Step 37134: {'lr': 0.00019949893557581077, 'samples': 1188288, 'steps': 2320, 'loss/train': 2.9306092262268066} -09/20/2021 22:31:51 - INFO - __main__ - Step 37135: {'lr': 0.00019949893557581077, 'samples': 1188320, 'steps': 2320, 'loss/train': 2.5666608810424805} -09/20/2021 22:31:52 - INFO - __main__ - Step 37136: {'lr': 0.00019949893557581077, 'samples': 1188352, 'steps': 2320, 'loss/train': 2.89210844039917} -09/20/2021 22:31:53 - INFO - __main__ - Step 37137: {'lr': 0.00019949829760833413, 'samples': 1188384, 'steps': 2321, 'loss/train': 2.7832136154174805} -09/20/2021 22:31:54 - INFO - __main__ - Step 37138: {'lr': 0.00019949829760833413, 'samples': 1188416, 'steps': 2321, 'loss/train': 2.8222815990448} -09/20/2021 22:31:55 - INFO - __main__ - Step 37139: {'lr': 0.00019949829760833413, 'samples': 1188448, 'steps': 2321, 'loss/train': 2.5779805183410645} -09/20/2021 22:31:56 - INFO - __main__ - Step 37140: {'lr': 0.00019949829760833413, 'samples': 1188480, 'steps': 2321, 'loss/train': 3.8148303031921387} -09/20/2021 22:31:56 - INFO - __main__ - Step 37141: {'lr': 0.00019949829760833413, 'samples': 1188512, 'steps': 2321, 'loss/train': 2.421367645263672} -09/20/2021 22:31:57 - INFO - __main__ - Step 37142: {'lr': 0.00019949829760833413, 'samples': 1188544, 'steps': 2321, 'loss/train': 2.1995718479156494} -09/20/2021 22:31:58 - INFO - __main__ - Step 37143: {'lr': 0.00019949829760833413, 'samples': 1188576, 'steps': 2321, 'loss/train': 1.9439058303833008} -09/20/2021 22:31:59 - INFO - __main__ - Step 37144: {'lr': 0.00019949829760833413, 'samples': 1188608, 'steps': 2321, 'loss/train': 3.380950689315796} -09/20/2021 22:31:59 - INFO - __main__ - Step 37145: {'lr': 0.00019949829760833413, 'samples': 1188640, 'steps': 2321, 'loss/train': 3.275573492050171} -09/20/2021 22:32:00 - INFO - __main__ - Step 37146: {'lr': 0.00019949829760833413, 'samples': 1188672, 'steps': 2321, 'loss/train': 3.296764373779297} -09/20/2021 22:32:01 - INFO - __main__ - Step 37147: {'lr': 0.00019949829760833413, 'samples': 1188704, 'steps': 2321, 'loss/train': 3.2924060821533203} -09/20/2021 22:32:02 - INFO - __main__ - Step 37148: {'lr': 0.00019949829760833413, 'samples': 1188736, 'steps': 2321, 'loss/train': 3.2674665451049805} -09/20/2021 22:32:02 - INFO - __main__ - Step 37149: {'lr': 0.00019949829760833413, 'samples': 1188768, 'steps': 2321, 'loss/train': 3.2738707065582275} -09/20/2021 22:32:03 - INFO - __main__ - Step 37150: {'lr': 0.00019949829760833413, 'samples': 1188800, 'steps': 2321, 'loss/train': 2.6989457607269287} -09/20/2021 22:32:04 - INFO - __main__ - Step 37151: {'lr': 0.00019949829760833413, 'samples': 1188832, 'steps': 2321, 'loss/train': 2.455105781555176} -09/20/2021 22:32:05 - INFO - __main__ - Step 37152: {'lr': 0.00019949829760833413, 'samples': 1188864, 'steps': 2321, 'loss/train': 2.812608003616333} -09/20/2021 22:32:05 - INFO - __main__ - Step 37153: {'lr': 0.0001994976592359993, 'samples': 1188896, 'steps': 2322, 'loss/train': 1.600669026374817} -09/20/2021 22:32:06 - INFO - __main__ - Step 37154: {'lr': 0.0001994976592359993, 'samples': 1188928, 'steps': 2322, 'loss/train': 2.1533424854278564} -09/20/2021 22:32:07 - INFO - __main__ - Step 37155: {'lr': 0.0001994976592359993, 'samples': 1188960, 'steps': 2322, 'loss/train': 2.1373164653778076} -09/20/2021 22:32:08 - INFO - __main__ - Step 37156: {'lr': 0.0001994976592359993, 'samples': 1188992, 'steps': 2322, 'loss/train': 1.7616496086120605} -09/20/2021 22:32:08 - INFO - __main__ - Step 37157: {'lr': 0.0001994976592359993, 'samples': 1189024, 'steps': 2322, 'loss/train': 1.7858607769012451} -09/20/2021 22:32:09 - INFO - __main__ - Step 37158: {'lr': 0.0001994976592359993, 'samples': 1189056, 'steps': 2322, 'loss/train': 1.6521337032318115} -09/20/2021 22:32:10 - INFO - __main__ - Step 37159: {'lr': 0.0001994976592359993, 'samples': 1189088, 'steps': 2322, 'loss/train': 2.5522537231445312} -09/20/2021 22:32:11 - INFO - __main__ - Step 37160: {'lr': 0.0001994976592359993, 'samples': 1189120, 'steps': 2322, 'loss/train': 2.6948297023773193} -09/20/2021 22:32:11 - INFO - __main__ - Step 37161: {'lr': 0.0001994976592359993, 'samples': 1189152, 'steps': 2322, 'loss/train': 2.735442876815796} -09/20/2021 22:32:12 - INFO - __main__ - Step 37162: {'lr': 0.0001994976592359993, 'samples': 1189184, 'steps': 2322, 'loss/train': 2.285011053085327} -09/20/2021 22:32:13 - INFO - __main__ - Step 37163: {'lr': 0.0001994976592359993, 'samples': 1189216, 'steps': 2322, 'loss/train': 2.5238378047943115} -09/20/2021 22:32:14 - INFO - __main__ - Step 37164: {'lr': 0.0001994976592359993, 'samples': 1189248, 'steps': 2322, 'loss/train': 2.43156099319458} -09/20/2021 22:32:14 - INFO - __main__ - Step 37165: {'lr': 0.0001994976592359993, 'samples': 1189280, 'steps': 2322, 'loss/train': 0.1841985285282135} -09/20/2021 22:32:15 - INFO - __main__ - Step 37166: {'lr': 0.0001994976592359993, 'samples': 1189312, 'steps': 2322, 'loss/train': 0.39870646595954895} -09/20/2021 22:32:16 - INFO - __main__ - Step 37167: {'lr': 0.0001994976592359993, 'samples': 1189344, 'steps': 2322, 'loss/train': 0.35745787620544434} -09/20/2021 22:32:17 - INFO - __main__ - Step 37168: {'lr': 0.0001994976592359993, 'samples': 1189376, 'steps': 2322, 'loss/train': 2.3932666778564453} -09/20/2021 22:32:18 - INFO - __main__ - Step 37169: {'lr': 0.00019949702045880886, 'samples': 1189408, 'steps': 2323, 'loss/train': 1.5030421018600464} -09/20/2021 22:32:19 - INFO - __main__ - Step 37170: {'lr': 0.00019949702045880886, 'samples': 1189440, 'steps': 2323, 'loss/train': 2.7211403846740723} -09/20/2021 22:32:20 - INFO - __main__ - Step 37171: {'lr': 0.00019949702045880886, 'samples': 1189472, 'steps': 2323, 'loss/train': 1.7625702619552612} -09/20/2021 22:32:20 - INFO - __main__ - Step 37172: {'lr': 0.00019949702045880886, 'samples': 1189504, 'steps': 2323, 'loss/train': 1.1216119527816772} -09/20/2021 22:32:21 - INFO - __main__ - Step 37173: {'lr': 0.00019949702045880886, 'samples': 1189536, 'steps': 2323, 'loss/train': 2.083205461502075} -09/20/2021 22:32:22 - INFO - __main__ - Step 37174: {'lr': 0.00019949702045880886, 'samples': 1189568, 'steps': 2323, 'loss/train': 2.2559664249420166} -09/20/2021 22:32:23 - INFO - __main__ - Step 37175: {'lr': 0.00019949702045880886, 'samples': 1189600, 'steps': 2323, 'loss/train': 0.7639403939247131} -09/20/2021 22:32:23 - INFO - __main__ - Step 37176: {'lr': 0.00019949702045880886, 'samples': 1189632, 'steps': 2323, 'loss/train': 1.617600679397583} -09/20/2021 22:32:24 - INFO - __main__ - Step 37177: {'lr': 0.00019949702045880886, 'samples': 1189664, 'steps': 2323, 'loss/train': 2.3845880031585693} -09/20/2021 22:32:25 - INFO - __main__ - Step 37178: {'lr': 0.00019949702045880886, 'samples': 1189696, 'steps': 2323, 'loss/train': 2.3798820972442627} -09/20/2021 22:32:26 - INFO - __main__ - Step 37179: {'lr': 0.00019949702045880886, 'samples': 1189728, 'steps': 2323, 'loss/train': 2.457012891769409} -09/20/2021 22:32:26 - INFO - __main__ - Step 37180: {'lr': 0.00019949702045880886, 'samples': 1189760, 'steps': 2323, 'loss/train': 2.725095272064209} -09/20/2021 22:32:27 - INFO - __main__ - Step 37181: {'lr': 0.00019949702045880886, 'samples': 1189792, 'steps': 2323, 'loss/train': 0.6722154021263123} -09/20/2021 22:32:28 - INFO - __main__ - Step 37182: {'lr': 0.00019949702045880886, 'samples': 1189824, 'steps': 2323, 'loss/train': 2.5400283336639404} -09/20/2021 22:32:29 - INFO - __main__ - Step 37183: {'lr': 0.00019949702045880886, 'samples': 1189856, 'steps': 2323, 'loss/train': 0.9644425511360168} -09/20/2021 22:32:29 - INFO - __main__ - Step 37184: {'lr': 0.00019949702045880886, 'samples': 1189888, 'steps': 2323, 'loss/train': 2.501290798187256} -09/20/2021 22:32:30 - INFO - __main__ - Step 37185: {'lr': 0.00019949638127676544, 'samples': 1189920, 'steps': 2324, 'loss/train': 2.6804134845733643} -09/20/2021 22:32:31 - INFO - __main__ - Step 37186: {'lr': 0.00019949638127676544, 'samples': 1189952, 'steps': 2324, 'loss/train': 1.5568406581878662} -09/20/2021 22:32:32 - INFO - __main__ - Step 37187: {'lr': 0.00019949638127676544, 'samples': 1189984, 'steps': 2324, 'loss/train': 0.4193529188632965} -09/20/2021 22:32:33 - INFO - __main__ - Step 37188: {'lr': 0.00019949638127676544, 'samples': 1190016, 'steps': 2324, 'loss/train': 1.2364305257797241} -09/20/2021 22:32:33 - INFO - __main__ - Step 37189: {'lr': 0.00019949638127676544, 'samples': 1190048, 'steps': 2324, 'loss/train': 0.47065746784210205} -09/20/2021 22:32:34 - INFO - __main__ - Step 37190: {'lr': 0.00019949638127676544, 'samples': 1190080, 'steps': 2324, 'loss/train': 1.4211399555206299} -09/20/2021 22:32:35 - INFO - __main__ - Step 37191: {'lr': 0.00019949638127676544, 'samples': 1190112, 'steps': 2324, 'loss/train': 1.9912323951721191} -09/20/2021 22:32:36 - INFO - __main__ - Step 37192: {'lr': 0.00019949638127676544, 'samples': 1190144, 'steps': 2324, 'loss/train': 2.0259835720062256} -09/20/2021 22:32:36 - INFO - __main__ - Step 37193: {'lr': 0.00019949638127676544, 'samples': 1190176, 'steps': 2324, 'loss/train': 2.164564371109009} -09/20/2021 22:32:37 - INFO - __main__ - Step 37194: {'lr': 0.00019949638127676544, 'samples': 1190208, 'steps': 2324, 'loss/train': 3.124910831451416} -09/20/2021 22:32:38 - INFO - __main__ - Step 37195: {'lr': 0.00019949638127676544, 'samples': 1190240, 'steps': 2324, 'loss/train': 1.8629891872406006} -09/20/2021 22:32:39 - INFO - __main__ - Step 37196: {'lr': 0.00019949638127676544, 'samples': 1190272, 'steps': 2324, 'loss/train': 2.2220804691314697} -09/20/2021 22:32:39 - INFO - __main__ - Step 37197: {'lr': 0.00019949638127676544, 'samples': 1190304, 'steps': 2324, 'loss/train': 2.830482006072998} -09/20/2021 22:32:40 - INFO - __main__ - Step 37198: {'lr': 0.00019949638127676544, 'samples': 1190336, 'steps': 2324, 'loss/train': 2.5373787879943848} -09/20/2021 22:32:41 - INFO - __main__ - Step 37199: {'lr': 0.00019949638127676544, 'samples': 1190368, 'steps': 2324, 'loss/train': 1.1984835863113403} -09/20/2021 22:32:42 - INFO - __main__ - Step 37200: {'lr': 0.00019949638127676544, 'samples': 1190400, 'steps': 2324, 'loss/train': 2.241088390350342} -09/20/2021 22:32:42 - INFO - __main__ - Step 37201: {'lr': 0.00019949574168987163, 'samples': 1190432, 'steps': 2325, 'loss/train': 2.755507469177246} -09/20/2021 22:32:44 - INFO - __main__ - Step 37202: {'lr': 0.00019949574168987163, 'samples': 1190464, 'steps': 2325, 'loss/train': 2.951795816421509} -09/20/2021 22:32:45 - INFO - __main__ - Step 37203: {'lr': 0.00019949574168987163, 'samples': 1190496, 'steps': 2325, 'loss/train': 0.2521500587463379} -09/20/2021 22:32:46 - INFO - __main__ - Step 37204: {'lr': 0.00019949574168987163, 'samples': 1190528, 'steps': 2325, 'loss/train': 0.2092658430337906} -09/20/2021 22:32:47 - INFO - __main__ - Step 37205: {'lr': 0.00019949574168987163, 'samples': 1190560, 'steps': 2325, 'loss/train': 0.23702594637870789} -09/20/2021 22:32:47 - INFO - __main__ - Step 37206: {'lr': 0.00019949574168987163, 'samples': 1190592, 'steps': 2325, 'loss/train': 2.808833122253418} -09/20/2021 22:32:48 - INFO - __main__ - Step 37207: {'lr': 0.00019949574168987163, 'samples': 1190624, 'steps': 2325, 'loss/train': 2.823845863342285} -09/20/2021 22:32:49 - INFO - __main__ - Step 37208: {'lr': 0.00019949574168987163, 'samples': 1190656, 'steps': 2325, 'loss/train': 2.439392328262329} -09/20/2021 22:32:50 - INFO - __main__ - Step 37209: {'lr': 0.00019949574168987163, 'samples': 1190688, 'steps': 2325, 'loss/train': 0.932277262210846} -09/20/2021 22:32:50 - INFO - __main__ - Step 37210: {'lr': 0.00019949574168987163, 'samples': 1190720, 'steps': 2325, 'loss/train': 2.285905361175537} -09/20/2021 22:32:51 - INFO - __main__ - Step 37211: {'lr': 0.00019949574168987163, 'samples': 1190752, 'steps': 2325, 'loss/train': 2.5284476280212402} -09/20/2021 22:32:52 - INFO - __main__ - Step 37212: {'lr': 0.00019949574168987163, 'samples': 1190784, 'steps': 2325, 'loss/train': 2.819770574569702} -09/20/2021 22:32:53 - INFO - __main__ - Step 37213: {'lr': 0.00019949574168987163, 'samples': 1190816, 'steps': 2325, 'loss/train': 2.5434634685516357} -09/20/2021 22:32:53 - INFO - __main__ - Step 37214: {'lr': 0.00019949574168987163, 'samples': 1190848, 'steps': 2325, 'loss/train': 2.826796293258667} -09/20/2021 22:32:54 - INFO - __main__ - Step 37215: {'lr': 0.00019949574168987163, 'samples': 1190880, 'steps': 2325, 'loss/train': 1.9496158361434937} -09/20/2021 22:32:55 - INFO - __main__ - Step 37216: {'lr': 0.00019949574168987163, 'samples': 1190912, 'steps': 2325, 'loss/train': 2.427696943283081} -09/20/2021 22:32:56 - INFO - __main__ - Step 37217: {'lr': 0.00019949510169813003, 'samples': 1190944, 'steps': 2326, 'loss/train': 1.6653614044189453} -09/20/2021 22:32:56 - INFO - __main__ - Step 37218: {'lr': 0.00019949510169813003, 'samples': 1190976, 'steps': 2326, 'loss/train': 1.3968082666397095} -09/20/2021 22:32:57 - INFO - __main__ - Step 37219: {'lr': 0.00019949510169813003, 'samples': 1191008, 'steps': 2326, 'loss/train': 2.0693225860595703} -09/20/2021 22:32:58 - INFO - __main__ - Step 37220: {'lr': 0.00019949510169813003, 'samples': 1191040, 'steps': 2326, 'loss/train': 2.3655622005462646} -09/20/2021 22:32:59 - INFO - __main__ - Step 37221: {'lr': 0.00019949510169813003, 'samples': 1191072, 'steps': 2326, 'loss/train': 2.3069140911102295} -09/20/2021 22:32:59 - INFO - __main__ - Step 37222: {'lr': 0.00019949510169813003, 'samples': 1191104, 'steps': 2326, 'loss/train': 2.068559408187866} -09/20/2021 22:33:00 - INFO - __main__ - Step 37223: {'lr': 0.00019949510169813003, 'samples': 1191136, 'steps': 2326, 'loss/train': 1.4536919593811035} -09/20/2021 22:33:01 - INFO - __main__ - Step 37224: {'lr': 0.00019949510169813003, 'samples': 1191168, 'steps': 2326, 'loss/train': 1.6511214971542358} -09/20/2021 22:33:02 - INFO - __main__ - Step 37225: {'lr': 0.00019949510169813003, 'samples': 1191200, 'steps': 2326, 'loss/train': 1.5048249959945679} -09/20/2021 22:33:02 - INFO - __main__ - Step 37226: {'lr': 0.00019949510169813003, 'samples': 1191232, 'steps': 2326, 'loss/train': 1.617907166481018} -09/20/2021 22:33:03 - INFO - __main__ - Step 37227: {'lr': 0.00019949510169813003, 'samples': 1191264, 'steps': 2326, 'loss/train': 1.9486435651779175} -09/20/2021 22:33:04 - INFO - __main__ - Step 37228: {'lr': 0.00019949510169813003, 'samples': 1191296, 'steps': 2326, 'loss/train': 2.519775390625} -09/20/2021 22:33:05 - INFO - __main__ - Step 37229: {'lr': 0.00019949510169813003, 'samples': 1191328, 'steps': 2326, 'loss/train': 2.458216905593872} -09/20/2021 22:33:05 - INFO - __main__ - Step 37230: {'lr': 0.00019949510169813003, 'samples': 1191360, 'steps': 2326, 'loss/train': 2.0896565914154053} -09/20/2021 22:33:06 - INFO - __main__ - Step 37231: {'lr': 0.00019949510169813003, 'samples': 1191392, 'steps': 2326, 'loss/train': 2.299375057220459} -09/20/2021 22:33:08 - INFO - __main__ - Step 37232: {'lr': 0.00019949510169813003, 'samples': 1191424, 'steps': 2326, 'loss/train': 2.3518428802490234} -09/20/2021 22:33:08 - INFO - __main__ - Step 37233: {'lr': 0.00019949446130154325, 'samples': 1191456, 'steps': 2327, 'loss/train': 1.5880417823791504} -09/20/2021 22:33:09 - INFO - __main__ - Step 37234: {'lr': 0.00019949446130154325, 'samples': 1191488, 'steps': 2327, 'loss/train': 2.620396375656128} -09/20/2021 22:33:10 - INFO - __main__ - Step 37235: {'lr': 0.00019949446130154325, 'samples': 1191520, 'steps': 2327, 'loss/train': 2.5478150844573975} -09/20/2021 22:33:11 - INFO - __main__ - Step 37236: {'lr': 0.00019949446130154325, 'samples': 1191552, 'steps': 2327, 'loss/train': 2.0282139778137207} -09/20/2021 22:33:11 - INFO - __main__ - Step 37237: {'lr': 0.00019949446130154325, 'samples': 1191584, 'steps': 2327, 'loss/train': 2.6745505332946777} -09/20/2021 22:33:12 - INFO - __main__ - Step 37238: {'lr': 0.00019949446130154325, 'samples': 1191616, 'steps': 2327, 'loss/train': 2.1039037704467773} -09/20/2021 22:33:13 - INFO - __main__ - Step 37239: {'lr': 0.00019949446130154325, 'samples': 1191648, 'steps': 2327, 'loss/train': 1.7080284357070923} -09/20/2021 22:33:14 - INFO - __main__ - Step 37240: {'lr': 0.00019949446130154325, 'samples': 1191680, 'steps': 2327, 'loss/train': 2.5317792892456055} -09/20/2021 22:33:14 - INFO - __main__ - Step 37241: {'lr': 0.00019949446130154325, 'samples': 1191712, 'steps': 2327, 'loss/train': 2.057309627532959} -09/20/2021 22:33:15 - INFO - __main__ - Step 37242: {'lr': 0.00019949446130154325, 'samples': 1191744, 'steps': 2327, 'loss/train': 1.7918308973312378} -09/20/2021 22:33:16 - INFO - __main__ - Step 37243: {'lr': 0.00019949446130154325, 'samples': 1191776, 'steps': 2327, 'loss/train': 1.9233129024505615} -09/20/2021 22:33:17 - INFO - __main__ - Step 37244: {'lr': 0.00019949446130154325, 'samples': 1191808, 'steps': 2327, 'loss/train': 1.8504925966262817} -09/20/2021 22:33:17 - INFO - __main__ - Step 37245: {'lr': 0.00019949446130154325, 'samples': 1191840, 'steps': 2327, 'loss/train': 3.292738199234009} -09/20/2021 22:33:18 - INFO - __main__ - Step 37246: {'lr': 0.00019949446130154325, 'samples': 1191872, 'steps': 2327, 'loss/train': 2.599344491958618} -09/20/2021 22:33:19 - INFO - __main__ - Step 37247: {'lr': 0.00019949446130154325, 'samples': 1191904, 'steps': 2327, 'loss/train': 1.5099267959594727} -09/20/2021 22:33:20 - INFO - __main__ - Step 37248: {'lr': 0.00019949446130154325, 'samples': 1191936, 'steps': 2327, 'loss/train': 2.4511380195617676} -09/20/2021 22:33:21 - INFO - __main__ - Step 37249: {'lr': 0.00019949382050011387, 'samples': 1191968, 'steps': 2328, 'loss/train': 2.188777446746826} -09/20/2021 22:33:21 - INFO - __main__ - Step 37250: {'lr': 0.00019949382050011387, 'samples': 1192000, 'steps': 2328, 'loss/train': 2.389641523361206} -09/20/2021 22:33:22 - INFO - __main__ - Step 37251: {'lr': 0.00019949382050011387, 'samples': 1192032, 'steps': 2328, 'loss/train': 2.3336970806121826} -09/20/2021 22:33:23 - INFO - __main__ - Step 37252: {'lr': 0.00019949382050011387, 'samples': 1192064, 'steps': 2328, 'loss/train': 3.0296013355255127} -09/20/2021 22:33:24 - INFO - __main__ - Step 37253: {'lr': 0.00019949382050011387, 'samples': 1192096, 'steps': 2328, 'loss/train': 3.0675837993621826} -09/20/2021 22:33:24 - INFO - __main__ - Step 37254: {'lr': 0.00019949382050011387, 'samples': 1192128, 'steps': 2328, 'loss/train': 2.2463581562042236} -09/20/2021 22:33:25 - INFO - __main__ - Step 37255: {'lr': 0.00019949382050011387, 'samples': 1192160, 'steps': 2328, 'loss/train': 1.9263615608215332} -09/20/2021 22:33:26 - INFO - __main__ - Step 37256: {'lr': 0.00019949382050011387, 'samples': 1192192, 'steps': 2328, 'loss/train': 2.1419639587402344} -09/20/2021 22:33:27 - INFO - __main__ - Step 37257: {'lr': 0.00019949382050011387, 'samples': 1192224, 'steps': 2328, 'loss/train': 5.240021228790283} -09/20/2021 22:33:27 - INFO - __main__ - Step 37258: {'lr': 0.00019949382050011387, 'samples': 1192256, 'steps': 2328, 'loss/train': 3.496762752532959} -09/20/2021 22:33:28 - INFO - __main__ - Step 37259: {'lr': 0.00019949382050011387, 'samples': 1192288, 'steps': 2328, 'loss/train': 1.9540181159973145} -09/20/2021 22:33:29 - INFO - __main__ - Step 37260: {'lr': 0.00019949382050011387, 'samples': 1192320, 'steps': 2328, 'loss/train': 3.003382921218872} -09/20/2021 22:33:30 - INFO - __main__ - Step 37261: {'lr': 0.00019949382050011387, 'samples': 1192352, 'steps': 2328, 'loss/train': 2.430565595626831} -09/20/2021 22:33:30 - INFO - __main__ - Step 37262: {'lr': 0.00019949382050011387, 'samples': 1192384, 'steps': 2328, 'loss/train': 2.3702735900878906} -09/20/2021 22:33:32 - INFO - __main__ - Step 37263: {'lr': 0.00019949382050011387, 'samples': 1192416, 'steps': 2328, 'loss/train': 2.890988826751709} -09/20/2021 22:33:32 - INFO - __main__ - Step 37264: {'lr': 0.00019949382050011387, 'samples': 1192448, 'steps': 2328, 'loss/train': 0.39480963349342346} -09/20/2021 22:33:33 - INFO - __main__ - Step 37265: {'lr': 0.00019949317929384455, 'samples': 1192480, 'steps': 2329, 'loss/train': 2.5685184001922607} -09/20/2021 22:33:34 - INFO - __main__ - Step 37266: {'lr': 0.00019949317929384455, 'samples': 1192512, 'steps': 2329, 'loss/train': 2.8794190883636475} -09/20/2021 22:33:35 - INFO - __main__ - Step 37267: {'lr': 0.00019949317929384455, 'samples': 1192544, 'steps': 2329, 'loss/train': 2.008247137069702} -09/20/2021 22:33:35 - INFO - __main__ - Step 37268: {'lr': 0.00019949317929384455, 'samples': 1192576, 'steps': 2329, 'loss/train': 1.5503122806549072} -09/20/2021 22:33:36 - INFO - __main__ - Step 37269: {'lr': 0.00019949317929384455, 'samples': 1192608, 'steps': 2329, 'loss/train': 2.4557173252105713} -09/20/2021 22:33:37 - INFO - __main__ - Step 37270: {'lr': 0.00019949317929384455, 'samples': 1192640, 'steps': 2329, 'loss/train': 2.717567205429077} -09/20/2021 22:33:38 - INFO - __main__ - Step 37271: {'lr': 0.00019949317929384455, 'samples': 1192672, 'steps': 2329, 'loss/train': 2.3849384784698486} -09/20/2021 22:33:38 - INFO - __main__ - Step 37272: {'lr': 0.00019949317929384455, 'samples': 1192704, 'steps': 2329, 'loss/train': 2.226231813430786} -09/20/2021 22:33:39 - INFO - __main__ - Step 37273: {'lr': 0.00019949317929384455, 'samples': 1192736, 'steps': 2329, 'loss/train': 1.4128780364990234} -09/20/2021 22:33:40 - INFO - __main__ - Step 37274: {'lr': 0.00019949317929384455, 'samples': 1192768, 'steps': 2329, 'loss/train': 2.5762462615966797} -09/20/2021 22:33:41 - INFO - __main__ - Step 37275: {'lr': 0.00019949317929384455, 'samples': 1192800, 'steps': 2329, 'loss/train': 1.7044416666030884} -09/20/2021 22:33:41 - INFO - __main__ - Step 37276: {'lr': 0.00019949317929384455, 'samples': 1192832, 'steps': 2329, 'loss/train': 1.2648146152496338} -09/20/2021 22:33:42 - INFO - __main__ - Step 37277: {'lr': 0.00019949317929384455, 'samples': 1192864, 'steps': 2329, 'loss/train': 2.1921136379241943} -09/20/2021 22:33:43 - INFO - __main__ - Step 37278: {'lr': 0.00019949317929384455, 'samples': 1192896, 'steps': 2329, 'loss/train': 0.6123780608177185} -09/20/2021 22:33:44 - INFO - __main__ - Step 37279: {'lr': 0.00019949317929384455, 'samples': 1192928, 'steps': 2329, 'loss/train': 2.2570719718933105} -09/20/2021 22:33:44 - INFO - __main__ - Step 37280: {'lr': 0.00019949317929384455, 'samples': 1192960, 'steps': 2329, 'loss/train': 0.9909029603004456} -09/20/2021 22:33:45 - INFO - __main__ - Step 37281: {'lr': 0.00019949253768273786, 'samples': 1192992, 'steps': 2330, 'loss/train': 2.4988110065460205} -09/20/2021 22:33:46 - INFO - __main__ - Step 37282: {'lr': 0.00019949253768273786, 'samples': 1193024, 'steps': 2330, 'loss/train': 1.1412363052368164} -09/20/2021 22:33:47 - INFO - __main__ - Step 37283: {'lr': 0.00019949253768273786, 'samples': 1193056, 'steps': 2330, 'loss/train': 1.060996651649475} -09/20/2021 22:33:48 - INFO - __main__ - Step 37284: {'lr': 0.00019949253768273786, 'samples': 1193088, 'steps': 2330, 'loss/train': 0.8099561929702759} -09/20/2021 22:33:48 - INFO - __main__ - Step 37285: {'lr': 0.00019949253768273786, 'samples': 1193120, 'steps': 2330, 'loss/train': 1.2339062690734863} -09/20/2021 22:33:49 - INFO - __main__ - Step 37286: {'lr': 0.00019949253768273786, 'samples': 1193152, 'steps': 2330, 'loss/train': 1.6698269844055176} -09/20/2021 22:33:50 - INFO - __main__ - Step 37287: {'lr': 0.00019949253768273786, 'samples': 1193184, 'steps': 2330, 'loss/train': 2.6283509731292725} -09/20/2021 22:33:51 - INFO - __main__ - Step 37288: {'lr': 0.00019949253768273786, 'samples': 1193216, 'steps': 2330, 'loss/train': 2.261676073074341} -09/20/2021 22:33:51 - INFO - __main__ - Step 37289: {'lr': 0.00019949253768273786, 'samples': 1193248, 'steps': 2330, 'loss/train': 1.6543560028076172} -09/20/2021 22:33:52 - INFO - __main__ - Step 37290: {'lr': 0.00019949253768273786, 'samples': 1193280, 'steps': 2330, 'loss/train': 2.536900520324707} -09/20/2021 22:33:53 - INFO - __main__ - Step 37291: {'lr': 0.00019949253768273786, 'samples': 1193312, 'steps': 2330, 'loss/train': 2.8599870204925537} -09/20/2021 22:33:54 - INFO - __main__ - Step 37292: {'lr': 0.00019949253768273786, 'samples': 1193344, 'steps': 2330, 'loss/train': 2.2082784175872803} -09/20/2021 22:33:54 - INFO - __main__ - Step 37293: {'lr': 0.00019949253768273786, 'samples': 1193376, 'steps': 2330, 'loss/train': 2.845876693725586} -09/20/2021 22:33:55 - INFO - __main__ - Step 37294: {'lr': 0.00019949253768273786, 'samples': 1193408, 'steps': 2330, 'loss/train': 1.9275314807891846} -09/20/2021 22:33:56 - INFO - __main__ - Step 37295: {'lr': 0.00019949253768273786, 'samples': 1193440, 'steps': 2330, 'loss/train': 1.36782968044281} -09/20/2021 22:33:57 - INFO - __main__ - Step 37296: {'lr': 0.00019949253768273786, 'samples': 1193472, 'steps': 2330, 'loss/train': 2.1071767807006836} -09/20/2021 22:33:58 - INFO - __main__ - Step 37297: {'lr': 0.00019949189566679642, 'samples': 1193504, 'steps': 2331, 'loss/train': 2.0131003856658936} -09/20/2021 22:33:59 - INFO - __main__ - Step 37298: {'lr': 0.00019949189566679642, 'samples': 1193536, 'steps': 2331, 'loss/train': 2.7623822689056396} -09/20/2021 22:34:00 - INFO - __main__ - Step 37299: {'lr': 0.00019949189566679642, 'samples': 1193568, 'steps': 2331, 'loss/train': 0.7439407110214233} -09/20/2021 22:34:00 - INFO - __main__ - Step 37300: {'lr': 0.00019949189566679642, 'samples': 1193600, 'steps': 2331, 'loss/train': 3.064901113510132} -09/20/2021 22:34:01 - INFO - __main__ - Step 37301: {'lr': 0.00019949189566679642, 'samples': 1193632, 'steps': 2331, 'loss/train': 2.0030179023742676} -09/20/2021 22:34:02 - INFO - __main__ - Step 37302: {'lr': 0.00019949189566679642, 'samples': 1193664, 'steps': 2331, 'loss/train': 0.5181025862693787} -09/20/2021 22:34:03 - INFO - __main__ - Step 37303: {'lr': 0.00019949189566679642, 'samples': 1193696, 'steps': 2331, 'loss/train': 1.97951340675354} -09/20/2021 22:34:03 - INFO - __main__ - Step 37304: {'lr': 0.00019949189566679642, 'samples': 1193728, 'steps': 2331, 'loss/train': 2.799898147583008} -09/20/2021 22:34:04 - INFO - __main__ - Step 37305: {'lr': 0.00019949189566679642, 'samples': 1193760, 'steps': 2331, 'loss/train': 2.28407883644104} -09/20/2021 22:34:05 - INFO - __main__ - Step 37306: {'lr': 0.00019949189566679642, 'samples': 1193792, 'steps': 2331, 'loss/train': 1.7509288787841797} -09/20/2021 22:34:06 - INFO - __main__ - Step 37307: {'lr': 0.00019949189566679642, 'samples': 1193824, 'steps': 2331, 'loss/train': 1.7493374347686768} -09/20/2021 22:34:06 - INFO - __main__ - Step 37308: {'lr': 0.00019949189566679642, 'samples': 1193856, 'steps': 2331, 'loss/train': 2.421994209289551} -09/20/2021 22:34:07 - INFO - __main__ - Step 37309: {'lr': 0.00019949189566679642, 'samples': 1193888, 'steps': 2331, 'loss/train': 3.1816580295562744} -09/20/2021 22:34:08 - INFO - __main__ - Step 37310: {'lr': 0.00019949189566679642, 'samples': 1193920, 'steps': 2331, 'loss/train': 2.311765670776367} -09/20/2021 22:34:09 - INFO - __main__ - Step 37311: {'lr': 0.00019949189566679642, 'samples': 1193952, 'steps': 2331, 'loss/train': 2.827024459838867} -09/20/2021 22:34:09 - INFO - __main__ - Step 37312: {'lr': 0.00019949189566679642, 'samples': 1193984, 'steps': 2331, 'loss/train': 2.3141374588012695} -09/20/2021 22:34:10 - INFO - __main__ - Step 37313: {'lr': 0.00019949125324602286, 'samples': 1194016, 'steps': 2332, 'loss/train': 2.2451674938201904} -09/20/2021 22:34:11 - INFO - __main__ - Step 37314: {'lr': 0.00019949125324602286, 'samples': 1194048, 'steps': 2332, 'loss/train': 2.2616519927978516} -09/20/2021 22:34:12 - INFO - __main__ - Step 37315: {'lr': 0.00019949125324602286, 'samples': 1194080, 'steps': 2332, 'loss/train': 2.557131052017212} -09/20/2021 22:34:12 - INFO - __main__ - Step 37316: {'lr': 0.00019949125324602286, 'samples': 1194112, 'steps': 2332, 'loss/train': 2.7472176551818848} -09/20/2021 22:34:13 - INFO - __main__ - Step 37317: {'lr': 0.00019949125324602286, 'samples': 1194144, 'steps': 2332, 'loss/train': 2.751044988632202} -09/20/2021 22:34:14 - INFO - __main__ - Step 37318: {'lr': 0.00019949125324602286, 'samples': 1194176, 'steps': 2332, 'loss/train': 2.428318738937378} -09/20/2021 22:34:15 - INFO - __main__ - Step 37319: {'lr': 0.00019949125324602286, 'samples': 1194208, 'steps': 2332, 'loss/train': 2.7228941917419434} -09/20/2021 22:34:15 - INFO - __main__ - Step 37320: {'lr': 0.00019949125324602286, 'samples': 1194240, 'steps': 2332, 'loss/train': 1.7402009963989258} -09/20/2021 22:34:16 - INFO - __main__ - Step 37321: {'lr': 0.00019949125324602286, 'samples': 1194272, 'steps': 2332, 'loss/train': 0.6884371638298035} -09/20/2021 22:34:17 - INFO - __main__ - Step 37322: {'lr': 0.00019949125324602286, 'samples': 1194304, 'steps': 2332, 'loss/train': 2.271016836166382} -09/20/2021 22:34:18 - INFO - __main__ - Step 37323: {'lr': 0.00019949125324602286, 'samples': 1194336, 'steps': 2332, 'loss/train': 2.6929545402526855} -09/20/2021 22:34:18 - INFO - __main__ - Step 37324: {'lr': 0.00019949125324602286, 'samples': 1194368, 'steps': 2332, 'loss/train': 2.3453519344329834} -09/20/2021 22:34:19 - INFO - __main__ - Step 37325: {'lr': 0.00019949125324602286, 'samples': 1194400, 'steps': 2332, 'loss/train': 3.4341793060302734} -09/20/2021 22:34:20 - INFO - __main__ - Step 37326: {'lr': 0.00019949125324602286, 'samples': 1194432, 'steps': 2332, 'loss/train': 2.618805408477783} -09/20/2021 22:34:21 - INFO - __main__ - Step 37327: {'lr': 0.00019949125324602286, 'samples': 1194464, 'steps': 2332, 'loss/train': 2.207814931869507} -09/20/2021 22:34:22 - INFO - __main__ - Step 37328: {'lr': 0.00019949125324602286, 'samples': 1194496, 'steps': 2332, 'loss/train': 2.5448741912841797} -09/20/2021 22:34:23 - INFO - __main__ - Step 37329: {'lr': 0.00019949061042041975, 'samples': 1194528, 'steps': 2333, 'loss/train': 2.9390478134155273} -09/20/2021 22:34:24 - INFO - __main__ - Step 37330: {'lr': 0.00019949061042041975, 'samples': 1194560, 'steps': 2333, 'loss/train': 2.2167866230010986} -09/20/2021 22:34:24 - INFO - __main__ - Step 37331: {'lr': 0.00019949061042041975, 'samples': 1194592, 'steps': 2333, 'loss/train': 1.7795528173446655} -09/20/2021 22:34:25 - INFO - __main__ - Step 37332: {'lr': 0.00019949061042041975, 'samples': 1194624, 'steps': 2333, 'loss/train': 2.833843231201172} -09/20/2021 22:34:26 - INFO - __main__ - Step 37333: {'lr': 0.00019949061042041975, 'samples': 1194656, 'steps': 2333, 'loss/train': 1.9572069644927979} -09/20/2021 22:34:27 - INFO - __main__ - Step 37334: {'lr': 0.00019949061042041975, 'samples': 1194688, 'steps': 2333, 'loss/train': 1.9075474739074707} -09/20/2021 22:34:27 - INFO - __main__ - Step 37335: {'lr': 0.00019949061042041975, 'samples': 1194720, 'steps': 2333, 'loss/train': 3.258721113204956} -09/20/2021 22:34:28 - INFO - __main__ - Step 37336: {'lr': 0.00019949061042041975, 'samples': 1194752, 'steps': 2333, 'loss/train': 1.6136436462402344} -09/20/2021 22:34:29 - INFO - __main__ - Step 37337: {'lr': 0.00019949061042041975, 'samples': 1194784, 'steps': 2333, 'loss/train': 2.6145498752593994} -09/20/2021 22:34:30 - INFO - __main__ - Step 37338: {'lr': 0.00019949061042041975, 'samples': 1194816, 'steps': 2333, 'loss/train': 0.8668856620788574} -09/20/2021 22:34:30 - INFO - __main__ - Step 37339: {'lr': 0.00019949061042041975, 'samples': 1194848, 'steps': 2333, 'loss/train': 2.6283812522888184} -09/20/2021 22:34:31 - INFO - __main__ - Step 37340: {'lr': 0.00019949061042041975, 'samples': 1194880, 'steps': 2333, 'loss/train': 2.070979595184326} -09/20/2021 22:34:32 - INFO - __main__ - Step 37341: {'lr': 0.00019949061042041975, 'samples': 1194912, 'steps': 2333, 'loss/train': 2.3348209857940674} -09/20/2021 22:34:33 - INFO - __main__ - Step 37342: {'lr': 0.00019949061042041975, 'samples': 1194944, 'steps': 2333, 'loss/train': 1.7217624187469482} -09/20/2021 22:34:33 - INFO - __main__ - Step 37343: {'lr': 0.00019949061042041975, 'samples': 1194976, 'steps': 2333, 'loss/train': 2.2016777992248535} -09/20/2021 22:34:34 - INFO - __main__ - Step 37344: {'lr': 0.00019949061042041975, 'samples': 1195008, 'steps': 2333, 'loss/train': 1.451278805732727} -09/20/2021 22:34:35 - INFO - __main__ - Step 37345: {'lr': 0.00019948996718998973, 'samples': 1195040, 'steps': 2334, 'loss/train': 1.9660756587982178} -09/20/2021 22:34:36 - INFO - __main__ - Step 37346: {'lr': 0.00019948996718998973, 'samples': 1195072, 'steps': 2334, 'loss/train': 2.894491195678711} -09/20/2021 22:34:36 - INFO - __main__ - Step 37347: {'lr': 0.00019948996718998973, 'samples': 1195104, 'steps': 2334, 'loss/train': 2.778505563735962} -09/20/2021 22:34:37 - INFO - __main__ - Step 37348: {'lr': 0.00019948996718998973, 'samples': 1195136, 'steps': 2334, 'loss/train': 1.5714592933654785} -09/20/2021 22:34:38 - INFO - __main__ - Step 37349: {'lr': 0.00019948996718998973, 'samples': 1195168, 'steps': 2334, 'loss/train': 2.313737392425537} -09/20/2021 22:34:39 - INFO - __main__ - Step 37350: {'lr': 0.00019948996718998973, 'samples': 1195200, 'steps': 2334, 'loss/train': 2.405717134475708} -09/20/2021 22:34:39 - INFO - __main__ - Step 37351: {'lr': 0.00019948996718998973, 'samples': 1195232, 'steps': 2334, 'loss/train': 2.42207407951355} -09/20/2021 22:34:40 - INFO - __main__ - Step 37352: {'lr': 0.00019948996718998973, 'samples': 1195264, 'steps': 2334, 'loss/train': 1.6911733150482178} -09/20/2021 22:34:41 - INFO - __main__ - Step 37353: {'lr': 0.00019948996718998973, 'samples': 1195296, 'steps': 2334, 'loss/train': 2.364846706390381} -09/20/2021 22:34:42 - INFO - __main__ - Step 37354: {'lr': 0.00019948996718998973, 'samples': 1195328, 'steps': 2334, 'loss/train': 2.1687448024749756} -09/20/2021 22:34:42 - INFO - __main__ - Step 37355: {'lr': 0.00019948996718998973, 'samples': 1195360, 'steps': 2334, 'loss/train': 2.6663150787353516} -09/20/2021 22:34:43 - INFO - __main__ - Step 37356: {'lr': 0.00019948996718998973, 'samples': 1195392, 'steps': 2334, 'loss/train': 2.146495819091797} -09/20/2021 22:34:44 - INFO - __main__ - Step 37357: {'lr': 0.00019948996718998973, 'samples': 1195424, 'steps': 2334, 'loss/train': 1.9470981359481812} -09/20/2021 22:34:45 - INFO - __main__ - Step 37358: {'lr': 0.00019948996718998973, 'samples': 1195456, 'steps': 2334, 'loss/train': 2.0569097995758057} -09/20/2021 22:34:46 - INFO - __main__ - Step 37359: {'lr': 0.00019948996718998973, 'samples': 1195488, 'steps': 2334, 'loss/train': 0.5681872963905334} -09/20/2021 22:34:47 - INFO - __main__ - Step 37360: {'lr': 0.00019948996718998973, 'samples': 1195520, 'steps': 2334, 'loss/train': 1.878335952758789} -09/20/2021 22:34:48 - INFO - __main__ - Step 37361: {'lr': 0.00019948932355473545, 'samples': 1195552, 'steps': 2335, 'loss/train': 2.1556661128997803} -09/20/2021 22:34:48 - INFO - __main__ - Step 37362: {'lr': 0.00019948932355473545, 'samples': 1195584, 'steps': 2335, 'loss/train': 1.3343312740325928} -09/20/2021 22:34:49 - INFO - __main__ - Step 37363: {'lr': 0.00019948932355473545, 'samples': 1195616, 'steps': 2335, 'loss/train': 1.4313644170761108} -09/20/2021 22:34:50 - INFO - __main__ - Step 37364: {'lr': 0.00019948932355473545, 'samples': 1195648, 'steps': 2335, 'loss/train': 2.251049757003784} -09/20/2021 22:34:51 - INFO - __main__ - Step 37365: {'lr': 0.00019948932355473545, 'samples': 1195680, 'steps': 2335, 'loss/train': 2.065142869949341} -09/20/2021 22:34:51 - INFO - __main__ - Step 37366: {'lr': 0.00019948932355473545, 'samples': 1195712, 'steps': 2335, 'loss/train': 1.4937715530395508} -09/20/2021 22:34:52 - INFO - __main__ - Step 37367: {'lr': 0.00019948932355473545, 'samples': 1195744, 'steps': 2335, 'loss/train': 2.340733289718628} -09/20/2021 22:34:53 - INFO - __main__ - Step 37368: {'lr': 0.00019948932355473545, 'samples': 1195776, 'steps': 2335, 'loss/train': 2.1354830265045166} -09/20/2021 22:34:54 - INFO - __main__ - Step 37369: {'lr': 0.00019948932355473545, 'samples': 1195808, 'steps': 2335, 'loss/train': 2.179929494857788} -09/20/2021 22:34:54 - INFO - __main__ - Step 37370: {'lr': 0.00019948932355473545, 'samples': 1195840, 'steps': 2335, 'loss/train': 1.5499080419540405} -09/20/2021 22:34:55 - INFO - __main__ - Step 37371: {'lr': 0.00019948932355473545, 'samples': 1195872, 'steps': 2335, 'loss/train': 1.9546397924423218} -09/20/2021 22:34:56 - INFO - __main__ - Step 37372: {'lr': 0.00019948932355473545, 'samples': 1195904, 'steps': 2335, 'loss/train': 2.779299020767212} -09/20/2021 22:34:57 - INFO - __main__ - Step 37373: {'lr': 0.00019948932355473545, 'samples': 1195936, 'steps': 2335, 'loss/train': 1.4424742460250854} -09/20/2021 22:34:57 - INFO - __main__ - Step 37374: {'lr': 0.00019948932355473545, 'samples': 1195968, 'steps': 2335, 'loss/train': 2.439516305923462} -09/20/2021 22:34:58 - INFO - __main__ - Step 37375: {'lr': 0.00019948932355473545, 'samples': 1196000, 'steps': 2335, 'loss/train': 2.05901837348938} -09/20/2021 22:34:59 - INFO - __main__ - Step 37376: {'lr': 0.00019948932355473545, 'samples': 1196032, 'steps': 2335, 'loss/train': 2.113912343978882} -09/20/2021 22:35:00 - INFO - __main__ - Step 37377: {'lr': 0.00019948867951465946, 'samples': 1196064, 'steps': 2336, 'loss/train': 2.9350976943969727} -09/20/2021 22:35:00 - INFO - __main__ - Step 37378: {'lr': 0.00019948867951465946, 'samples': 1196096, 'steps': 2336, 'loss/train': 2.105691909790039} -09/20/2021 22:35:01 - INFO - __main__ - Step 37379: {'lr': 0.00019948867951465946, 'samples': 1196128, 'steps': 2336, 'loss/train': 0.4656647741794586} -09/20/2021 22:35:02 - INFO - __main__ - Step 37380: {'lr': 0.00019948867951465946, 'samples': 1196160, 'steps': 2336, 'loss/train': 1.8488030433654785} -09/20/2021 22:35:03 - INFO - __main__ - Step 37381: {'lr': 0.00019948867951465946, 'samples': 1196192, 'steps': 2336, 'loss/train': 2.0183606147766113} -09/20/2021 22:35:03 - INFO - __main__ - Step 37382: {'lr': 0.00019948867951465946, 'samples': 1196224, 'steps': 2336, 'loss/train': 2.4527430534362793} -09/20/2021 22:35:04 - INFO - __main__ - Step 37383: {'lr': 0.00019948867951465946, 'samples': 1196256, 'steps': 2336, 'loss/train': 2.3793511390686035} -09/20/2021 22:35:05 - INFO - __main__ - Step 37384: {'lr': 0.00019948867951465946, 'samples': 1196288, 'steps': 2336, 'loss/train': 0.9658355116844177} -09/20/2021 22:35:06 - INFO - __main__ - Step 37385: {'lr': 0.00019948867951465946, 'samples': 1196320, 'steps': 2336, 'loss/train': 2.9754655361175537} -09/20/2021 22:35:06 - INFO - __main__ - Step 37386: {'lr': 0.00019948867951465946, 'samples': 1196352, 'steps': 2336, 'loss/train': 2.1922435760498047} -09/20/2021 22:35:07 - INFO - __main__ - Step 37387: {'lr': 0.00019948867951465946, 'samples': 1196384, 'steps': 2336, 'loss/train': 2.4445760250091553} -09/20/2021 22:35:08 - INFO - __main__ - Step 37388: {'lr': 0.00019948867951465946, 'samples': 1196416, 'steps': 2336, 'loss/train': 2.4470715522766113} -09/20/2021 22:35:09 - INFO - __main__ - Step 37389: {'lr': 0.00019948867951465946, 'samples': 1196448, 'steps': 2336, 'loss/train': 2.8703038692474365} -09/20/2021 22:35:10 - INFO - __main__ - Step 37390: {'lr': 0.00019948867951465946, 'samples': 1196480, 'steps': 2336, 'loss/train': 2.0513715744018555} -09/20/2021 22:35:11 - INFO - __main__ - Step 37391: {'lr': 0.00019948867951465946, 'samples': 1196512, 'steps': 2336, 'loss/train': 1.7053205966949463} -09/20/2021 22:35:11 - INFO - __main__ - Step 37392: {'lr': 0.00019948867951465946, 'samples': 1196544, 'steps': 2336, 'loss/train': 1.9211678504943848} -09/20/2021 22:35:12 - INFO - __main__ - Step 37393: {'lr': 0.00019948803506976445, 'samples': 1196576, 'steps': 2337, 'loss/train': 2.5155491828918457} -09/20/2021 22:35:13 - INFO - __main__ - Step 37394: {'lr': 0.00019948803506976445, 'samples': 1196608, 'steps': 2337, 'loss/train': 2.237123727798462} -09/20/2021 22:35:14 - INFO - __main__ - Step 37395: {'lr': 0.00019948803506976445, 'samples': 1196640, 'steps': 2337, 'loss/train': 3.113758087158203} -09/20/2021 22:35:15 - INFO - __main__ - Step 37396: {'lr': 0.00019948803506976445, 'samples': 1196672, 'steps': 2337, 'loss/train': 3.472276210784912} -09/20/2021 22:35:15 - INFO - __main__ - Step 37397: {'lr': 0.00019948803506976445, 'samples': 1196704, 'steps': 2337, 'loss/train': 2.722304344177246} -09/20/2021 22:35:16 - INFO - __main__ - Step 37398: {'lr': 0.00019948803506976445, 'samples': 1196736, 'steps': 2337, 'loss/train': 2.241886615753174} -09/20/2021 22:35:17 - INFO - __main__ - Step 37399: {'lr': 0.00019948803506976445, 'samples': 1196768, 'steps': 2337, 'loss/train': 2.777174472808838} -09/20/2021 22:35:18 - INFO - __main__ - Step 37400: {'lr': 0.00019948803506976445, 'samples': 1196800, 'steps': 2337, 'loss/train': 2.5592479705810547} -09/20/2021 22:35:18 - INFO - __main__ - Step 37401: {'lr': 0.00019948803506976445, 'samples': 1196832, 'steps': 2337, 'loss/train': 3.557770013809204} -09/20/2021 22:35:19 - INFO - __main__ - Step 37402: {'lr': 0.00019948803506976445, 'samples': 1196864, 'steps': 2337, 'loss/train': 1.9837111234664917} -09/20/2021 22:35:20 - INFO - __main__ - Step 37403: {'lr': 0.00019948803506976445, 'samples': 1196896, 'steps': 2337, 'loss/train': 2.082746982574463} -09/20/2021 22:35:21 - INFO - __main__ - Step 37404: {'lr': 0.00019948803506976445, 'samples': 1196928, 'steps': 2337, 'loss/train': 2.7345380783081055} -09/20/2021 22:35:21 - INFO - __main__ - Step 37405: {'lr': 0.00019948803506976445, 'samples': 1196960, 'steps': 2337, 'loss/train': 2.3971428871154785} -09/20/2021 22:35:22 - INFO - __main__ - Step 37406: {'lr': 0.00019948803506976445, 'samples': 1196992, 'steps': 2337, 'loss/train': 1.829336404800415} -09/20/2021 22:35:23 - INFO - __main__ - Step 37407: {'lr': 0.00019948803506976445, 'samples': 1197024, 'steps': 2337, 'loss/train': 2.672351360321045} -09/20/2021 22:35:24 - INFO - __main__ - Step 37408: {'lr': 0.00019948803506976445, 'samples': 1197056, 'steps': 2337, 'loss/train': 2.008805990219116} -09/20/2021 22:35:25 - INFO - __main__ - Step 37409: {'lr': 0.000199487390220053, 'samples': 1197088, 'steps': 2338, 'loss/train': 1.3414065837860107} -09/20/2021 22:35:25 - INFO - __main__ - Step 37410: {'lr': 0.000199487390220053, 'samples': 1197120, 'steps': 2338, 'loss/train': 3.666663646697998} -09/20/2021 22:35:26 - INFO - __main__ - Step 37411: {'lr': 0.000199487390220053, 'samples': 1197152, 'steps': 2338, 'loss/train': 2.848435878753662} -09/20/2021 22:35:27 - INFO - __main__ - Step 37412: {'lr': 0.000199487390220053, 'samples': 1197184, 'steps': 2338, 'loss/train': 2.4417572021484375} -09/20/2021 22:35:28 - INFO - __main__ - Step 37413: {'lr': 0.000199487390220053, 'samples': 1197216, 'steps': 2338, 'loss/train': 2.5303499698638916} -09/20/2021 22:35:28 - INFO - __main__ - Step 37414: {'lr': 0.000199487390220053, 'samples': 1197248, 'steps': 2338, 'loss/train': 2.173419237136841} -09/20/2021 22:35:29 - INFO - __main__ - Step 37415: {'lr': 0.000199487390220053, 'samples': 1197280, 'steps': 2338, 'loss/train': 1.1876933574676514} -09/20/2021 22:35:30 - INFO - __main__ - Step 37416: {'lr': 0.000199487390220053, 'samples': 1197312, 'steps': 2338, 'loss/train': 2.7931594848632812} -09/20/2021 22:35:31 - INFO - __main__ - Step 37417: {'lr': 0.000199487390220053, 'samples': 1197344, 'steps': 2338, 'loss/train': 3.2540626525878906} -09/20/2021 22:35:31 - INFO - __main__ - Step 37418: {'lr': 0.000199487390220053, 'samples': 1197376, 'steps': 2338, 'loss/train': 2.850029945373535} -09/20/2021 22:35:33 - INFO - __main__ - Step 37419: {'lr': 0.000199487390220053, 'samples': 1197408, 'steps': 2338, 'loss/train': 2.216944932937622} -09/20/2021 22:35:33 - INFO - __main__ - Step 37420: {'lr': 0.000199487390220053, 'samples': 1197440, 'steps': 2338, 'loss/train': 2.584777593612671} -09/20/2021 22:35:34 - INFO - __main__ - Step 37421: {'lr': 0.000199487390220053, 'samples': 1197472, 'steps': 2338, 'loss/train': 2.0939197540283203} -09/20/2021 22:35:35 - INFO - __main__ - Step 37422: {'lr': 0.000199487390220053, 'samples': 1197504, 'steps': 2338, 'loss/train': 2.9320199489593506} -09/20/2021 22:35:36 - INFO - __main__ - Step 37423: {'lr': 0.000199487390220053, 'samples': 1197536, 'steps': 2338, 'loss/train': 2.880953073501587} -09/20/2021 22:35:36 - INFO - __main__ - Step 37424: {'lr': 0.000199487390220053, 'samples': 1197568, 'steps': 2338, 'loss/train': 2.127427577972412} -09/20/2021 22:35:37 - INFO - __main__ - Step 37425: {'lr': 0.00019948674496552776, 'samples': 1197600, 'steps': 2339, 'loss/train': 2.2020676136016846} -09/20/2021 22:35:38 - INFO - __main__ - Step 37426: {'lr': 0.00019948674496552776, 'samples': 1197632, 'steps': 2339, 'loss/train': 2.693129777908325} -09/20/2021 22:35:39 - INFO - __main__ - Step 37427: {'lr': 0.00019948674496552776, 'samples': 1197664, 'steps': 2339, 'loss/train': 1.0235954523086548} -09/20/2021 22:35:39 - INFO - __main__ - Step 37428: {'lr': 0.00019948674496552776, 'samples': 1197696, 'steps': 2339, 'loss/train': 2.0317559242248535} -09/20/2021 22:35:40 - INFO - __main__ - Step 37429: {'lr': 0.00019948674496552776, 'samples': 1197728, 'steps': 2339, 'loss/train': 2.1792664527893066} -09/20/2021 22:35:41 - INFO - __main__ - Step 37430: {'lr': 0.00019948674496552776, 'samples': 1197760, 'steps': 2339, 'loss/train': 2.158630847930908} -09/20/2021 22:35:42 - INFO - __main__ - Step 37431: {'lr': 0.00019948674496552776, 'samples': 1197792, 'steps': 2339, 'loss/train': 1.922264814376831} -09/20/2021 22:35:42 - INFO - __main__ - Step 37432: {'lr': 0.00019948674496552776, 'samples': 1197824, 'steps': 2339, 'loss/train': 3.2035863399505615} -09/20/2021 22:35:43 - INFO - __main__ - Step 37433: {'lr': 0.00019948674496552776, 'samples': 1197856, 'steps': 2339, 'loss/train': 2.618983268737793} -09/20/2021 22:35:44 - INFO - __main__ - Step 37434: {'lr': 0.00019948674496552776, 'samples': 1197888, 'steps': 2339, 'loss/train': 1.9488166570663452} -09/20/2021 22:35:45 - INFO - __main__ - Step 37435: {'lr': 0.00019948674496552776, 'samples': 1197920, 'steps': 2339, 'loss/train': 2.270374298095703} -09/20/2021 22:35:45 - INFO - __main__ - Step 37436: {'lr': 0.00019948674496552776, 'samples': 1197952, 'steps': 2339, 'loss/train': 2.3388023376464844} -09/20/2021 22:35:46 - INFO - __main__ - Step 37437: {'lr': 0.00019948674496552776, 'samples': 1197984, 'steps': 2339, 'loss/train': 3.9295787811279297} -09/20/2021 22:35:47 - INFO - __main__ - Step 37438: {'lr': 0.00019948674496552776, 'samples': 1198016, 'steps': 2339, 'loss/train': 3.24535870552063} -09/20/2021 22:35:48 - INFO - __main__ - Step 37439: {'lr': 0.00019948674496552776, 'samples': 1198048, 'steps': 2339, 'loss/train': 2.0344977378845215} -09/20/2021 22:35:48 - INFO - __main__ - Step 37440: {'lr': 0.00019948674496552776, 'samples': 1198080, 'steps': 2339, 'loss/train': 3.000016927719116} -09/20/2021 22:35:49 - INFO - __main__ - Step 37441: {'lr': 0.00019948609930619133, 'samples': 1198112, 'steps': 2340, 'loss/train': 2.2968528270721436} -09/20/2021 22:35:50 - INFO - __main__ - Step 37442: {'lr': 0.00019948609930619133, 'samples': 1198144, 'steps': 2340, 'loss/train': 3.1190454959869385} -09/20/2021 22:35:51 - INFO - __main__ - Step 37443: {'lr': 0.00019948609930619133, 'samples': 1198176, 'steps': 2340, 'loss/train': 1.6139308214187622} -09/20/2021 22:35:52 - INFO - __main__ - Step 37444: {'lr': 0.00019948609930619133, 'samples': 1198208, 'steps': 2340, 'loss/train': 2.147350311279297} -09/20/2021 22:35:52 - INFO - __main__ - Step 37445: {'lr': 0.00019948609930619133, 'samples': 1198240, 'steps': 2340, 'loss/train': 2.8369638919830322} -09/20/2021 22:35:53 - INFO - __main__ - Step 37446: {'lr': 0.00019948609930619133, 'samples': 1198272, 'steps': 2340, 'loss/train': 2.4308815002441406} -09/20/2021 22:35:54 - INFO - __main__ - Step 37447: {'lr': 0.00019948609930619133, 'samples': 1198304, 'steps': 2340, 'loss/train': 1.8467437028884888} -09/20/2021 22:35:55 - INFO - __main__ - Step 37448: {'lr': 0.00019948609930619133, 'samples': 1198336, 'steps': 2340, 'loss/train': 2.4223010540008545} -09/20/2021 22:35:56 - INFO - __main__ - Step 37449: {'lr': 0.00019948609930619133, 'samples': 1198368, 'steps': 2340, 'loss/train': 2.1746151447296143} -09/20/2021 22:35:57 - INFO - __main__ - Step 37450: {'lr': 0.00019948609930619133, 'samples': 1198400, 'steps': 2340, 'loss/train': 1.505321741104126} -09/20/2021 22:35:57 - INFO - __main__ - Step 37451: {'lr': 0.00019948609930619133, 'samples': 1198432, 'steps': 2340, 'loss/train': 1.2233657836914062} -09/20/2021 22:35:58 - INFO - __main__ - Step 37452: {'lr': 0.00019948609930619133, 'samples': 1198464, 'steps': 2340, 'loss/train': 1.1503057479858398} -09/20/2021 22:35:59 - INFO - __main__ - Step 37453: {'lr': 0.00019948609930619133, 'samples': 1198496, 'steps': 2340, 'loss/train': 1.2704432010650635} -09/20/2021 22:36:00 - INFO - __main__ - Step 37454: {'lr': 0.00019948609930619133, 'samples': 1198528, 'steps': 2340, 'loss/train': 1.4536411762237549} -09/20/2021 22:36:00 - INFO - __main__ - Step 37455: {'lr': 0.00019948609930619133, 'samples': 1198560, 'steps': 2340, 'loss/train': 2.0471529960632324} -09/20/2021 22:36:01 - INFO - __main__ - Step 37456: {'lr': 0.00019948609930619133, 'samples': 1198592, 'steps': 2340, 'loss/train': 2.452991008758545} -09/20/2021 22:36:02 - INFO - __main__ - Step 37457: {'lr': 0.00019948545324204636, 'samples': 1198624, 'steps': 2341, 'loss/train': 2.6179418563842773} -09/20/2021 22:36:03 - INFO - __main__ - Step 37458: {'lr': 0.00019948545324204636, 'samples': 1198656, 'steps': 2341, 'loss/train': 1.896181583404541} -09/20/2021 22:36:03 - INFO - __main__ - Step 37459: {'lr': 0.00019948545324204636, 'samples': 1198688, 'steps': 2341, 'loss/train': 1.1119478940963745} -09/20/2021 22:36:04 - INFO - __main__ - Step 37460: {'lr': 0.00019948545324204636, 'samples': 1198720, 'steps': 2341, 'loss/train': 2.134955644607544} -09/20/2021 22:36:05 - INFO - __main__ - Step 37461: {'lr': 0.00019948545324204636, 'samples': 1198752, 'steps': 2341, 'loss/train': 2.4629650115966797} -09/20/2021 22:36:06 - INFO - __main__ - Step 37462: {'lr': 0.00019948545324204636, 'samples': 1198784, 'steps': 2341, 'loss/train': 1.2198351621627808} -09/20/2021 22:36:06 - INFO - __main__ - Step 37463: {'lr': 0.00019948545324204636, 'samples': 1198816, 'steps': 2341, 'loss/train': 2.3756723403930664} -09/20/2021 22:36:07 - INFO - __main__ - Step 37464: {'lr': 0.00019948545324204636, 'samples': 1198848, 'steps': 2341, 'loss/train': 2.032930850982666} -09/20/2021 22:36:08 - INFO - __main__ - Step 37465: {'lr': 0.00019948545324204636, 'samples': 1198880, 'steps': 2341, 'loss/train': 2.5301897525787354} -09/20/2021 22:36:09 - INFO - __main__ - Step 37466: {'lr': 0.00019948545324204636, 'samples': 1198912, 'steps': 2341, 'loss/train': 1.7571803331375122} -09/20/2021 22:36:09 - INFO - __main__ - Step 37467: {'lr': 0.00019948545324204636, 'samples': 1198944, 'steps': 2341, 'loss/train': 2.6197996139526367} -09/20/2021 22:36:10 - INFO - __main__ - Step 37468: {'lr': 0.00019948545324204636, 'samples': 1198976, 'steps': 2341, 'loss/train': 2.6666011810302734} -09/20/2021 22:36:11 - INFO - __main__ - Step 37469: {'lr': 0.00019948545324204636, 'samples': 1199008, 'steps': 2341, 'loss/train': 2.820756196975708} -09/20/2021 22:36:12 - INFO - __main__ - Step 37470: {'lr': 0.00019948545324204636, 'samples': 1199040, 'steps': 2341, 'loss/train': 1.672816514968872} -09/20/2021 22:36:12 - INFO - __main__ - Step 37471: {'lr': 0.00019948545324204636, 'samples': 1199072, 'steps': 2341, 'loss/train': 2.7457735538482666} -09/20/2021 22:36:13 - INFO - __main__ - Step 37472: {'lr': 0.00019948545324204636, 'samples': 1199104, 'steps': 2341, 'loss/train': 2.856842279434204} -09/20/2021 22:36:14 - INFO - __main__ - Step 37473: {'lr': 0.00019948480677309542, 'samples': 1199136, 'steps': 2342, 'loss/train': 1.9392259120941162} -09/20/2021 22:36:15 - INFO - __main__ - Step 37474: {'lr': 0.00019948480677309542, 'samples': 1199168, 'steps': 2342, 'loss/train': 0.5916040539741516} -09/20/2021 22:36:16 - INFO - __main__ - Step 37475: {'lr': 0.00019948480677309542, 'samples': 1199200, 'steps': 2342, 'loss/train': 1.6295746564865112} -09/20/2021 22:36:16 - INFO - __main__ - Step 37476: {'lr': 0.00019948480677309542, 'samples': 1199232, 'steps': 2342, 'loss/train': 1.0617763996124268} -09/20/2021 22:36:17 - INFO - __main__ - Step 37477: {'lr': 0.00019948480677309542, 'samples': 1199264, 'steps': 2342, 'loss/train': 1.9689619541168213} -09/20/2021 22:36:18 - INFO - __main__ - Step 37478: {'lr': 0.00019948480677309542, 'samples': 1199296, 'steps': 2342, 'loss/train': 1.8726308345794678} -09/20/2021 22:36:19 - INFO - __main__ - Step 37479: {'lr': 0.00019948480677309542, 'samples': 1199328, 'steps': 2342, 'loss/train': 2.0787909030914307} -09/20/2021 22:36:20 - INFO - __main__ - Step 37480: {'lr': 0.00019948480677309542, 'samples': 1199360, 'steps': 2342, 'loss/train': 2.154043436050415} -09/20/2021 22:36:21 - INFO - __main__ - Step 37481: {'lr': 0.00019948480677309542, 'samples': 1199392, 'steps': 2342, 'loss/train': 0.8643302917480469} -09/20/2021 22:36:21 - INFO - __main__ - Step 37482: {'lr': 0.00019948480677309542, 'samples': 1199424, 'steps': 2342, 'loss/train': 1.786258339881897} -09/20/2021 22:36:22 - INFO - __main__ - Step 37483: {'lr': 0.00019948480677309542, 'samples': 1199456, 'steps': 2342, 'loss/train': 3.382189989089966} -09/20/2021 22:36:23 - INFO - __main__ - Step 37484: {'lr': 0.00019948480677309542, 'samples': 1199488, 'steps': 2342, 'loss/train': 1.1374404430389404} -09/20/2021 22:36:24 - INFO - __main__ - Step 37485: {'lr': 0.00019948480677309542, 'samples': 1199520, 'steps': 2342, 'loss/train': 3.359008550643921} -09/20/2021 22:36:24 - INFO - __main__ - Step 37486: {'lr': 0.00019948480677309542, 'samples': 1199552, 'steps': 2342, 'loss/train': 2.896221160888672} -09/20/2021 22:36:25 - INFO - __main__ - Step 37487: {'lr': 0.00019948480677309542, 'samples': 1199584, 'steps': 2342, 'loss/train': 1.8551348447799683} -09/20/2021 22:36:26 - INFO - __main__ - Step 37488: {'lr': 0.00019948480677309542, 'samples': 1199616, 'steps': 2342, 'loss/train': 3.1403472423553467} -09/20/2021 22:36:27 - INFO - __main__ - Step 37489: {'lr': 0.00019948415989934123, 'samples': 1199648, 'steps': 2343, 'loss/train': 1.5485306978225708} -09/20/2021 22:36:27 - INFO - __main__ - Step 37490: {'lr': 0.00019948415989934123, 'samples': 1199680, 'steps': 2343, 'loss/train': 1.220573902130127} -09/20/2021 22:36:28 - INFO - __main__ - Step 37491: {'lr': 0.00019948415989934123, 'samples': 1199712, 'steps': 2343, 'loss/train': 2.2547659873962402} -09/20/2021 22:36:29 - INFO - __main__ - Step 37492: {'lr': 0.00019948415989934123, 'samples': 1199744, 'steps': 2343, 'loss/train': 1.9708442687988281} -09/20/2021 22:36:30 - INFO - __main__ - Step 37493: {'lr': 0.00019948415989934123, 'samples': 1199776, 'steps': 2343, 'loss/train': 2.437739610671997} -09/20/2021 22:36:30 - INFO - __main__ - Step 37494: {'lr': 0.00019948415989934123, 'samples': 1199808, 'steps': 2343, 'loss/train': 2.9674794673919678} -09/20/2021 22:36:31 - INFO - __main__ - Step 37495: {'lr': 0.00019948415989934123, 'samples': 1199840, 'steps': 2343, 'loss/train': 0.9341135025024414} -09/20/2021 22:36:32 - INFO - __main__ - Step 37496: {'lr': 0.00019948415989934123, 'samples': 1199872, 'steps': 2343, 'loss/train': 2.1265807151794434} -09/20/2021 22:36:33 - INFO - __main__ - Step 37497: {'lr': 0.00019948415989934123, 'samples': 1199904, 'steps': 2343, 'loss/train': 2.453650951385498} -09/20/2021 22:36:33 - INFO - __main__ - Step 37498: {'lr': 0.00019948415989934123, 'samples': 1199936, 'steps': 2343, 'loss/train': 3.390075445175171} -09/20/2021 22:36:34 - INFO - __main__ - Step 37499: {'lr': 0.00019948415989934123, 'samples': 1199968, 'steps': 2343, 'loss/train': 2.6019039154052734} -09/20/2021 22:36:35 - INFO - __main__ - Step 37500: {'lr': 0.00019948415989934123, 'samples': 1200000, 'steps': 2343, 'loss/train': 1.6070277690887451} -09/20/2021 22:36:36 - INFO - __main__ - Step 37501: {'lr': 0.00019948415989934123, 'samples': 1200032, 'steps': 2343, 'loss/train': 2.1496448516845703} -09/20/2021 22:36:37 - INFO - __main__ - Step 37502: {'lr': 0.00019948415989934123, 'samples': 1200064, 'steps': 2343, 'loss/train': 1.550202488899231} -09/20/2021 22:36:37 - INFO - __main__ - Step 37503: {'lr': 0.00019948415989934123, 'samples': 1200096, 'steps': 2343, 'loss/train': 1.7705295085906982} -09/20/2021 22:36:38 - INFO - __main__ - Step 37504: {'lr': 0.00019948415989934123, 'samples': 1200128, 'steps': 2343, 'loss/train': 2.2291295528411865} -09/20/2021 22:36:39 - INFO - __main__ - Step 37505: {'lr': 0.00019948351262078634, 'samples': 1200160, 'steps': 2344, 'loss/train': 1.2696993350982666} -09/20/2021 22:36:40 - INFO - __main__ - Step 37506: {'lr': 0.00019948351262078634, 'samples': 1200192, 'steps': 2344, 'loss/train': 2.1802802085876465} -09/20/2021 22:36:40 - INFO - __main__ - Step 37507: {'lr': 0.00019948351262078634, 'samples': 1200224, 'steps': 2344, 'loss/train': 1.3557476997375488} -09/20/2021 22:36:41 - INFO - __main__ - Step 37508: {'lr': 0.00019948351262078634, 'samples': 1200256, 'steps': 2344, 'loss/train': 1.9815493822097778} -09/20/2021 22:36:42 - INFO - __main__ - Step 37509: {'lr': 0.00019948351262078634, 'samples': 1200288, 'steps': 2344, 'loss/train': 2.2817747592926025} -09/20/2021 22:36:43 - INFO - __main__ - Step 37510: {'lr': 0.00019948351262078634, 'samples': 1200320, 'steps': 2344, 'loss/train': 2.444185495376587} -09/20/2021 22:36:44 - INFO - __main__ - Step 37511: {'lr': 0.00019948351262078634, 'samples': 1200352, 'steps': 2344, 'loss/train': 1.5269603729248047} -09/20/2021 22:36:45 - INFO - __main__ - Step 37512: {'lr': 0.00019948351262078634, 'samples': 1200384, 'steps': 2344, 'loss/train': 1.6218310594558716} -09/20/2021 22:36:46 - INFO - __main__ - Step 37513: {'lr': 0.00019948351262078634, 'samples': 1200416, 'steps': 2344, 'loss/train': 1.7488223314285278} -09/20/2021 22:36:46 - INFO - __main__ - Step 37514: {'lr': 0.00019948351262078634, 'samples': 1200448, 'steps': 2344, 'loss/train': 1.9354791641235352} -09/20/2021 22:36:47 - INFO - __main__ - Step 37515: {'lr': 0.00019948351262078634, 'samples': 1200480, 'steps': 2344, 'loss/train': 1.6696529388427734} -09/20/2021 22:36:48 - INFO - __main__ - Step 37516: {'lr': 0.00019948351262078634, 'samples': 1200512, 'steps': 2344, 'loss/train': 1.1046134233474731} -09/20/2021 22:36:49 - INFO - __main__ - Step 37517: {'lr': 0.00019948351262078634, 'samples': 1200544, 'steps': 2344, 'loss/train': 0.99893718957901} -09/20/2021 22:36:49 - INFO - __main__ - Step 37518: {'lr': 0.00019948351262078634, 'samples': 1200576, 'steps': 2344, 'loss/train': 2.2726056575775146} -09/20/2021 22:36:50 - INFO - __main__ - Step 37519: {'lr': 0.00019948351262078634, 'samples': 1200608, 'steps': 2344, 'loss/train': 0.5948994159698486} -09/20/2021 22:36:51 - INFO - __main__ - Step 37520: {'lr': 0.00019948351262078634, 'samples': 1200640, 'steps': 2344, 'loss/train': 2.8305609226226807} -09/20/2021 22:36:52 - INFO - __main__ - Step 37521: {'lr': 0.00019948286493743348, 'samples': 1200672, 'steps': 2345, 'loss/train': 2.235565662384033} -09/20/2021 22:36:52 - INFO - __main__ - Step 37522: {'lr': 0.00019948286493743348, 'samples': 1200704, 'steps': 2345, 'loss/train': 1.8658910989761353} -09/20/2021 22:36:53 - INFO - __main__ - Step 37523: {'lr': 0.00019948286493743348, 'samples': 1200736, 'steps': 2345, 'loss/train': 2.8847553730010986} -09/20/2021 22:36:54 - INFO - __main__ - Step 37524: {'lr': 0.00019948286493743348, 'samples': 1200768, 'steps': 2345, 'loss/train': 2.9212183952331543} -09/20/2021 22:36:55 - INFO - __main__ - Step 37525: {'lr': 0.00019948286493743348, 'samples': 1200800, 'steps': 2345, 'loss/train': 2.8584365844726562} -09/20/2021 22:36:55 - INFO - __main__ - Step 37526: {'lr': 0.00019948286493743348, 'samples': 1200832, 'steps': 2345, 'loss/train': 3.3809144496917725} -09/20/2021 22:36:56 - INFO - __main__ - Step 37527: {'lr': 0.00019948286493743348, 'samples': 1200864, 'steps': 2345, 'loss/train': 3.6727442741394043} -09/20/2021 22:36:57 - INFO - __main__ - Step 37528: {'lr': 0.00019948286493743348, 'samples': 1200896, 'steps': 2345, 'loss/train': 2.5441808700561523} -09/20/2021 22:36:58 - INFO - __main__ - Step 37529: {'lr': 0.00019948286493743348, 'samples': 1200928, 'steps': 2345, 'loss/train': 1.9750328063964844} -09/20/2021 22:36:58 - INFO - __main__ - Step 37530: {'lr': 0.00019948286493743348, 'samples': 1200960, 'steps': 2345, 'loss/train': 2.7753381729125977} -09/20/2021 22:36:59 - INFO - __main__ - Step 37531: {'lr': 0.00019948286493743348, 'samples': 1200992, 'steps': 2345, 'loss/train': 3.2280004024505615} -09/20/2021 22:37:00 - INFO - __main__ - Step 37532: {'lr': 0.00019948286493743348, 'samples': 1201024, 'steps': 2345, 'loss/train': 2.701355457305908} -09/20/2021 22:37:01 - INFO - __main__ - Step 37533: {'lr': 0.00019948286493743348, 'samples': 1201056, 'steps': 2345, 'loss/train': 1.7909802198410034} -09/20/2021 22:37:01 - INFO - __main__ - Step 37534: {'lr': 0.00019948286493743348, 'samples': 1201088, 'steps': 2345, 'loss/train': 2.68987774848938} -09/20/2021 22:37:02 - INFO - __main__ - Step 37535: {'lr': 0.00019948286493743348, 'samples': 1201120, 'steps': 2345, 'loss/train': 1.6673088073730469} -09/20/2021 22:37:03 - INFO - __main__ - Step 37536: {'lr': 0.00019948286493743348, 'samples': 1201152, 'steps': 2345, 'loss/train': 1.967328429222107} -09/20/2021 22:37:04 - INFO - __main__ - Step 37537: {'lr': 0.00019948221684928518, 'samples': 1201184, 'steps': 2346, 'loss/train': 1.5843819379806519} -09/20/2021 22:37:05 - INFO - __main__ - Step 37538: {'lr': 0.00019948221684928518, 'samples': 1201216, 'steps': 2346, 'loss/train': 2.1095433235168457} -09/20/2021 22:37:05 - INFO - __main__ - Step 37539: {'lr': 0.00019948221684928518, 'samples': 1201248, 'steps': 2346, 'loss/train': 1.8340381383895874} -09/20/2021 22:37:07 - INFO - __main__ - Step 37540: {'lr': 0.00019948221684928518, 'samples': 1201280, 'steps': 2346, 'loss/train': 1.836475133895874} -09/20/2021 22:37:08 - INFO - __main__ - Step 37541: {'lr': 0.00019948221684928518, 'samples': 1201312, 'steps': 2346, 'loss/train': 1.8665105104446411} -09/20/2021 22:37:09 - INFO - __main__ - Step 37542: {'lr': 0.00019948221684928518, 'samples': 1201344, 'steps': 2346, 'loss/train': 1.836332082748413} -09/20/2021 22:37:09 - INFO - __main__ - Step 37543: {'lr': 0.00019948221684928518, 'samples': 1201376, 'steps': 2346, 'loss/train': 1.7753363847732544} -09/20/2021 22:37:10 - INFO - __main__ - Step 37544: {'lr': 0.00019948221684928518, 'samples': 1201408, 'steps': 2346, 'loss/train': 1.935394048690796} -09/20/2021 22:37:11 - INFO - __main__ - Step 37545: {'lr': 0.00019948221684928518, 'samples': 1201440, 'steps': 2346, 'loss/train': 3.11142897605896} -09/20/2021 22:37:12 - INFO - __main__ - Step 37546: {'lr': 0.00019948221684928518, 'samples': 1201472, 'steps': 2346, 'loss/train': 2.9887044429779053} -09/20/2021 22:37:12 - INFO - __main__ - Step 37547: {'lr': 0.00019948221684928518, 'samples': 1201504, 'steps': 2346, 'loss/train': 2.075324535369873} -09/20/2021 22:37:13 - INFO - __main__ - Step 37548: {'lr': 0.00019948221684928518, 'samples': 1201536, 'steps': 2346, 'loss/train': 1.9790637493133545} -09/20/2021 22:37:14 - INFO - __main__ - Step 37549: {'lr': 0.00019948221684928518, 'samples': 1201568, 'steps': 2346, 'loss/train': 1.5775558948516846} -09/20/2021 22:37:15 - INFO - __main__ - Step 37550: {'lr': 0.00019948221684928518, 'samples': 1201600, 'steps': 2346, 'loss/train': 1.8177732229232788} -09/20/2021 22:37:15 - INFO - __main__ - Step 37551: {'lr': 0.00019948221684928518, 'samples': 1201632, 'steps': 2346, 'loss/train': 2.92515230178833} -09/20/2021 22:37:16 - INFO - __main__ - Step 37552: {'lr': 0.00019948221684928518, 'samples': 1201664, 'steps': 2346, 'loss/train': 1.7772326469421387} -09/20/2021 22:37:17 - INFO - __main__ - Step 37553: {'lr': 0.00019948156835634416, 'samples': 1201696, 'steps': 2347, 'loss/train': 2.9371609687805176} -09/20/2021 22:37:18 - INFO - __main__ - Step 37554: {'lr': 0.00019948156835634416, 'samples': 1201728, 'steps': 2347, 'loss/train': 2.047398328781128} -09/20/2021 22:37:18 - INFO - __main__ - Step 37555: {'lr': 0.00019948156835634416, 'samples': 1201760, 'steps': 2347, 'loss/train': 0.39320841431617737} -09/20/2021 22:37:19 - INFO - __main__ - Step 37556: {'lr': 0.00019948156835634416, 'samples': 1201792, 'steps': 2347, 'loss/train': 2.319852828979492} -09/20/2021 22:37:20 - INFO - __main__ - Step 37557: {'lr': 0.00019948156835634416, 'samples': 1201824, 'steps': 2347, 'loss/train': 1.5100325345993042} -09/20/2021 22:37:21 - INFO - __main__ - Step 37558: {'lr': 0.00019948156835634416, 'samples': 1201856, 'steps': 2347, 'loss/train': 2.5160694122314453} -09/20/2021 22:37:21 - INFO - __main__ - Step 37559: {'lr': 0.00019948156835634416, 'samples': 1201888, 'steps': 2347, 'loss/train': 1.8162320852279663} -09/20/2021 22:37:22 - INFO - __main__ - Step 37560: {'lr': 0.00019948156835634416, 'samples': 1201920, 'steps': 2347, 'loss/train': 2.1382713317871094} -09/20/2021 22:37:23 - INFO - __main__ - Step 37561: {'lr': 0.00019948156835634416, 'samples': 1201952, 'steps': 2347, 'loss/train': 2.334388494491577} -09/20/2021 22:37:24 - INFO - __main__ - Step 37562: {'lr': 0.00019948156835634416, 'samples': 1201984, 'steps': 2347, 'loss/train': 2.1730058193206787} -09/20/2021 22:37:24 - INFO - __main__ - Step 37563: {'lr': 0.00019948156835634416, 'samples': 1202016, 'steps': 2347, 'loss/train': 2.1830153465270996} -09/20/2021 22:37:25 - INFO - __main__ - Step 37564: {'lr': 0.00019948156835634416, 'samples': 1202048, 'steps': 2347, 'loss/train': 2.073326349258423} -09/20/2021 22:37:26 - INFO - __main__ - Step 37565: {'lr': 0.00019948156835634416, 'samples': 1202080, 'steps': 2347, 'loss/train': 1.8622519969940186} -09/20/2021 22:37:27 - INFO - __main__ - Step 37566: {'lr': 0.00019948156835634416, 'samples': 1202112, 'steps': 2347, 'loss/train': 3.08418869972229} -09/20/2021 22:37:27 - INFO - __main__ - Step 37567: {'lr': 0.00019948156835634416, 'samples': 1202144, 'steps': 2347, 'loss/train': 1.9745686054229736} -09/20/2021 22:37:28 - INFO - __main__ - Step 37568: {'lr': 0.00019948156835634416, 'samples': 1202176, 'steps': 2347, 'loss/train': 2.629483938217163} -09/20/2021 22:37:29 - INFO - __main__ - Step 37569: {'lr': 0.00019948091945861301, 'samples': 1202208, 'steps': 2348, 'loss/train': 1.875488042831421} -09/20/2021 22:37:30 - INFO - __main__ - Step 37570: {'lr': 0.00019948091945861301, 'samples': 1202240, 'steps': 2348, 'loss/train': 2.4865238666534424} -09/20/2021 22:37:31 - INFO - __main__ - Step 37571: {'lr': 0.00019948091945861301, 'samples': 1202272, 'steps': 2348, 'loss/train': 2.5251059532165527} -09/20/2021 22:37:32 - INFO - __main__ - Step 37572: {'lr': 0.00019948091945861301, 'samples': 1202304, 'steps': 2348, 'loss/train': 1.9516685009002686} -09/20/2021 22:37:33 - INFO - __main__ - Step 37573: {'lr': 0.00019948091945861301, 'samples': 1202336, 'steps': 2348, 'loss/train': 2.5482819080352783} -09/20/2021 22:37:33 - INFO - __main__ - Step 37574: {'lr': 0.00019948091945861301, 'samples': 1202368, 'steps': 2348, 'loss/train': 2.1461257934570312} -09/20/2021 22:37:34 - INFO - __main__ - Step 37575: {'lr': 0.00019948091945861301, 'samples': 1202400, 'steps': 2348, 'loss/train': 2.1626193523406982} -09/20/2021 22:37:35 - INFO - __main__ - Step 37576: {'lr': 0.00019948091945861301, 'samples': 1202432, 'steps': 2348, 'loss/train': 1.876960039138794} -09/20/2021 22:37:36 - INFO - __main__ - Step 37577: {'lr': 0.00019948091945861301, 'samples': 1202464, 'steps': 2348, 'loss/train': 2.5936005115509033} -09/20/2021 22:37:36 - INFO - __main__ - Step 37578: {'lr': 0.00019948091945861301, 'samples': 1202496, 'steps': 2348, 'loss/train': 2.0572617053985596} -09/20/2021 22:37:37 - INFO - __main__ - Step 37579: {'lr': 0.00019948091945861301, 'samples': 1202528, 'steps': 2348, 'loss/train': 0.5308538675308228} -09/20/2021 22:37:38 - INFO - __main__ - Step 37580: {'lr': 0.00019948091945861301, 'samples': 1202560, 'steps': 2348, 'loss/train': 2.1667118072509766} -09/20/2021 22:37:39 - INFO - __main__ - Step 37581: {'lr': 0.00019948091945861301, 'samples': 1202592, 'steps': 2348, 'loss/train': 2.1408121585845947} -09/20/2021 22:37:39 - INFO - __main__ - Step 37582: {'lr': 0.00019948091945861301, 'samples': 1202624, 'steps': 2348, 'loss/train': 2.1817805767059326} -09/20/2021 22:37:40 - INFO - __main__ - Step 37583: {'lr': 0.00019948091945861301, 'samples': 1202656, 'steps': 2348, 'loss/train': 1.609431266784668} -09/20/2021 22:37:41 - INFO - __main__ - Step 37584: {'lr': 0.00019948091945861301, 'samples': 1202688, 'steps': 2348, 'loss/train': 1.2007312774658203} -09/20/2021 22:37:42 - INFO - __main__ - Step 37585: {'lr': 0.00019948027015609442, 'samples': 1202720, 'steps': 2349, 'loss/train': 1.861230492591858} -09/20/2021 22:37:43 - INFO - __main__ - Step 37586: {'lr': 0.00019948027015609442, 'samples': 1202752, 'steps': 2349, 'loss/train': 1.4580633640289307} -09/20/2021 22:37:43 - INFO - __main__ - Step 37587: {'lr': 0.00019948027015609442, 'samples': 1202784, 'steps': 2349, 'loss/train': 2.706115245819092} -09/20/2021 22:37:44 - INFO - __main__ - Step 37588: {'lr': 0.00019948027015609442, 'samples': 1202816, 'steps': 2349, 'loss/train': 3.001302719116211} -09/20/2021 22:37:45 - INFO - __main__ - Step 37589: {'lr': 0.00019948027015609442, 'samples': 1202848, 'steps': 2349, 'loss/train': 2.1165990829467773} -09/20/2021 22:37:46 - INFO - __main__ - Step 37590: {'lr': 0.00019948027015609442, 'samples': 1202880, 'steps': 2349, 'loss/train': 2.443525791168213} -09/20/2021 22:37:46 - INFO - __main__ - Step 37591: {'lr': 0.00019948027015609442, 'samples': 1202912, 'steps': 2349, 'loss/train': 1.5554989576339722} -09/20/2021 22:37:47 - INFO - __main__ - Step 37592: {'lr': 0.00019948027015609442, 'samples': 1202944, 'steps': 2349, 'loss/train': 0.9857234358787537} -09/20/2021 22:37:48 - INFO - __main__ - Step 37593: {'lr': 0.00019948027015609442, 'samples': 1202976, 'steps': 2349, 'loss/train': 2.6239283084869385} -09/20/2021 22:37:49 - INFO - __main__ - Step 37594: {'lr': 0.00019948027015609442, 'samples': 1203008, 'steps': 2349, 'loss/train': 3.1029000282287598} -09/20/2021 22:37:49 - INFO - __main__ - Step 37595: {'lr': 0.00019948027015609442, 'samples': 1203040, 'steps': 2349, 'loss/train': 2.083200454711914} -09/20/2021 22:37:50 - INFO - __main__ - Step 37596: {'lr': 0.00019948027015609442, 'samples': 1203072, 'steps': 2349, 'loss/train': 2.1658356189727783} -09/20/2021 22:37:51 - INFO - __main__ - Step 37597: {'lr': 0.00019948027015609442, 'samples': 1203104, 'steps': 2349, 'loss/train': 1.8018786907196045} -09/20/2021 22:37:52 - INFO - __main__ - Step 37598: {'lr': 0.00019948027015609442, 'samples': 1203136, 'steps': 2349, 'loss/train': 2.8430888652801514} -09/20/2021 22:37:52 - INFO - __main__ - Step 37599: {'lr': 0.00019948027015609442, 'samples': 1203168, 'steps': 2349, 'loss/train': 2.1185479164123535} -09/20/2021 22:37:53 - INFO - __main__ - Step 37600: {'lr': 0.00019948027015609442, 'samples': 1203200, 'steps': 2349, 'loss/train': 2.322054386138916} -09/20/2021 22:37:54 - INFO - __main__ - Step 37601: {'lr': 0.00019947962044879094, 'samples': 1203232, 'steps': 2350, 'loss/train': 1.9909908771514893} -09/20/2021 22:37:55 - INFO - __main__ - Step 37602: {'lr': 0.00019947962044879094, 'samples': 1203264, 'steps': 2350, 'loss/train': 1.778879165649414} -09/20/2021 22:37:56 - INFO - __main__ - Step 37603: {'lr': 0.00019947962044879094, 'samples': 1203296, 'steps': 2350, 'loss/train': 2.419832944869995} -09/20/2021 22:37:57 - INFO - __main__ - Step 37604: {'lr': 0.00019947962044879094, 'samples': 1203328, 'steps': 2350, 'loss/train': 2.9796199798583984} -09/20/2021 22:37:57 - INFO - __main__ - Step 37605: {'lr': 0.00019947962044879094, 'samples': 1203360, 'steps': 2350, 'loss/train': 2.8794362545013428} -09/20/2021 22:37:58 - INFO - __main__ - Step 37606: {'lr': 0.00019947962044879094, 'samples': 1203392, 'steps': 2350, 'loss/train': 1.1409395933151245} -09/20/2021 22:37:59 - INFO - __main__ - Step 37607: {'lr': 0.00019947962044879094, 'samples': 1203424, 'steps': 2350, 'loss/train': 2.844897985458374} -09/20/2021 22:38:00 - INFO - __main__ - Step 37608: {'lr': 0.00019947962044879094, 'samples': 1203456, 'steps': 2350, 'loss/train': 3.0358963012695312} -09/20/2021 22:38:00 - INFO - __main__ - Step 37609: {'lr': 0.00019947962044879094, 'samples': 1203488, 'steps': 2350, 'loss/train': 2.2477850914001465} -09/20/2021 22:38:01 - INFO - __main__ - Step 37610: {'lr': 0.00019947962044879094, 'samples': 1203520, 'steps': 2350, 'loss/train': 2.606221914291382} -09/20/2021 22:38:02 - INFO - __main__ - Step 37611: {'lr': 0.00019947962044879094, 'samples': 1203552, 'steps': 2350, 'loss/train': 2.6598901748657227} -09/20/2021 22:38:03 - INFO - __main__ - Step 37612: {'lr': 0.00019947962044879094, 'samples': 1203584, 'steps': 2350, 'loss/train': 2.5201597213745117} -09/20/2021 22:38:03 - INFO - __main__ - Step 37613: {'lr': 0.00019947962044879094, 'samples': 1203616, 'steps': 2350, 'loss/train': 2.4208755493164062} -09/20/2021 22:38:04 - INFO - __main__ - Step 37614: {'lr': 0.00019947962044879094, 'samples': 1203648, 'steps': 2350, 'loss/train': 2.1972265243530273} -09/20/2021 22:38:05 - INFO - __main__ - Step 37615: {'lr': 0.00019947962044879094, 'samples': 1203680, 'steps': 2350, 'loss/train': 2.453782796859741} -09/20/2021 22:38:06 - INFO - __main__ - Step 37616: {'lr': 0.00019947962044879094, 'samples': 1203712, 'steps': 2350, 'loss/train': 2.7214694023132324} -09/20/2021 22:38:07 - INFO - __main__ - Step 37617: {'lr': 0.0001994789703367053, 'samples': 1203744, 'steps': 2351, 'loss/train': 1.3508646488189697} -09/20/2021 22:38:07 - INFO - __main__ - Step 37618: {'lr': 0.0001994789703367053, 'samples': 1203776, 'steps': 2351, 'loss/train': 2.4970781803131104} -09/20/2021 22:38:08 - INFO - __main__ - Step 37619: {'lr': 0.0001994789703367053, 'samples': 1203808, 'steps': 2351, 'loss/train': 1.5521981716156006} -09/20/2021 22:38:09 - INFO - __main__ - Step 37620: {'lr': 0.0001994789703367053, 'samples': 1203840, 'steps': 2351, 'loss/train': 0.7414994835853577} -09/20/2021 22:38:10 - INFO - __main__ - Step 37621: {'lr': 0.0001994789703367053, 'samples': 1203872, 'steps': 2351, 'loss/train': 2.5212936401367188} -09/20/2021 22:38:10 - INFO - __main__ - Step 37622: {'lr': 0.0001994789703367053, 'samples': 1203904, 'steps': 2351, 'loss/train': 2.84005069732666} -09/20/2021 22:38:11 - INFO - __main__ - Step 37623: {'lr': 0.0001994789703367053, 'samples': 1203936, 'steps': 2351, 'loss/train': 1.7818747758865356} -09/20/2021 22:38:12 - INFO - __main__ - Step 37624: {'lr': 0.0001994789703367053, 'samples': 1203968, 'steps': 2351, 'loss/train': 1.8722895383834839} -09/20/2021 22:38:13 - INFO - __main__ - Step 37625: {'lr': 0.0001994789703367053, 'samples': 1204000, 'steps': 2351, 'loss/train': 2.971848487854004} -09/20/2021 22:38:13 - INFO - __main__ - Step 37626: {'lr': 0.0001994789703367053, 'samples': 1204032, 'steps': 2351, 'loss/train': 2.4709908962249756} -09/20/2021 22:38:14 - INFO - __main__ - Step 37627: {'lr': 0.0001994789703367053, 'samples': 1204064, 'steps': 2351, 'loss/train': 2.8949356079101562} -09/20/2021 22:38:15 - INFO - __main__ - Step 37628: {'lr': 0.0001994789703367053, 'samples': 1204096, 'steps': 2351, 'loss/train': 2.4676551818847656} -09/20/2021 22:38:16 - INFO - __main__ - Step 37629: {'lr': 0.0001994789703367053, 'samples': 1204128, 'steps': 2351, 'loss/train': 2.56136417388916} -09/20/2021 22:38:16 - INFO - __main__ - Step 37630: {'lr': 0.0001994789703367053, 'samples': 1204160, 'steps': 2351, 'loss/train': 1.9373588562011719} -09/20/2021 22:38:17 - INFO - __main__ - Step 37631: {'lr': 0.0001994789703367053, 'samples': 1204192, 'steps': 2351, 'loss/train': 1.9447948932647705} -09/20/2021 22:38:18 - INFO - __main__ - Step 37632: {'lr': 0.0001994789703367053, 'samples': 1204224, 'steps': 2351, 'loss/train': 2.562901258468628} -09/20/2021 22:38:19 - INFO - __main__ - Step 37633: {'lr': 0.0001994783198198401, 'samples': 1204256, 'steps': 2352, 'loss/train': 2.25223708152771} -09/20/2021 22:38:20 - INFO - __main__ - Step 37634: {'lr': 0.0001994783198198401, 'samples': 1204288, 'steps': 2352, 'loss/train': 2.0728702545166016} -09/20/2021 22:38:21 - INFO - __main__ - Step 37635: {'lr': 0.0001994783198198401, 'samples': 1204320, 'steps': 2352, 'loss/train': 2.5081262588500977} -09/20/2021 22:38:22 - INFO - __main__ - Step 37636: {'lr': 0.0001994783198198401, 'samples': 1204352, 'steps': 2352, 'loss/train': 1.5691471099853516} -09/20/2021 22:38:22 - INFO - __main__ - Step 37637: {'lr': 0.0001994783198198401, 'samples': 1204384, 'steps': 2352, 'loss/train': 2.145007371902466} -09/20/2021 22:38:23 - INFO - __main__ - Step 37638: {'lr': 0.0001994783198198401, 'samples': 1204416, 'steps': 2352, 'loss/train': 2.8345251083374023} -09/20/2021 22:38:24 - INFO - __main__ - Step 37639: {'lr': 0.0001994783198198401, 'samples': 1204448, 'steps': 2352, 'loss/train': 2.522859811782837} -09/20/2021 22:38:25 - INFO - __main__ - Step 37640: {'lr': 0.0001994783198198401, 'samples': 1204480, 'steps': 2352, 'loss/train': 2.2556915283203125} -09/20/2021 22:38:25 - INFO - __main__ - Step 37641: {'lr': 0.0001994783198198401, 'samples': 1204512, 'steps': 2352, 'loss/train': 2.3906989097595215} -09/20/2021 22:38:26 - INFO - __main__ - Step 37642: {'lr': 0.0001994783198198401, 'samples': 1204544, 'steps': 2352, 'loss/train': 3.3201518058776855} -09/20/2021 22:38:27 - INFO - __main__ - Step 37643: {'lr': 0.0001994783198198401, 'samples': 1204576, 'steps': 2352, 'loss/train': 2.3893556594848633} -09/20/2021 22:38:28 - INFO - __main__ - Step 37644: {'lr': 0.0001994783198198401, 'samples': 1204608, 'steps': 2352, 'loss/train': 2.356642484664917} -09/20/2021 22:38:28 - INFO - __main__ - Step 37645: {'lr': 0.0001994783198198401, 'samples': 1204640, 'steps': 2352, 'loss/train': 2.0036942958831787} -09/20/2021 22:38:29 - INFO - __main__ - Step 37646: {'lr': 0.0001994783198198401, 'samples': 1204672, 'steps': 2352, 'loss/train': 2.190356731414795} -09/20/2021 22:38:30 - INFO - __main__ - Step 37647: {'lr': 0.0001994783198198401, 'samples': 1204704, 'steps': 2352, 'loss/train': 1.471555471420288} -09/20/2021 22:38:31 - INFO - __main__ - Step 37648: {'lr': 0.0001994783198198401, 'samples': 1204736, 'steps': 2352, 'loss/train': 2.0574135780334473} -09/20/2021 22:38:31 - INFO - __main__ - Step 37649: {'lr': 0.00019947766889819802, 'samples': 1204768, 'steps': 2353, 'loss/train': 2.1056597232818604} -09/20/2021 22:38:32 - INFO - __main__ - Step 37650: {'lr': 0.00019947766889819802, 'samples': 1204800, 'steps': 2353, 'loss/train': 1.9289034605026245} -09/20/2021 22:38:33 - INFO - __main__ - Step 37651: {'lr': 0.00019947766889819802, 'samples': 1204832, 'steps': 2353, 'loss/train': 2.2933566570281982} -09/20/2021 22:38:34 - INFO - __main__ - Step 37652: {'lr': 0.00019947766889819802, 'samples': 1204864, 'steps': 2353, 'loss/train': 2.317882776260376} -09/20/2021 22:38:34 - INFO - __main__ - Step 37653: {'lr': 0.00019947766889819802, 'samples': 1204896, 'steps': 2353, 'loss/train': 1.8720253705978394} -09/20/2021 22:38:35 - INFO - __main__ - Step 37654: {'lr': 0.00019947766889819802, 'samples': 1204928, 'steps': 2353, 'loss/train': 2.960569143295288} -09/20/2021 22:38:36 - INFO - __main__ - Step 37655: {'lr': 0.00019947766889819802, 'samples': 1204960, 'steps': 2353, 'loss/train': 3.0819036960601807} -09/20/2021 22:38:37 - INFO - __main__ - Step 37656: {'lr': 0.00019947766889819802, 'samples': 1204992, 'steps': 2353, 'loss/train': 1.4412577152252197} -09/20/2021 22:38:37 - INFO - __main__ - Step 37657: {'lr': 0.00019947766889819802, 'samples': 1205024, 'steps': 2353, 'loss/train': 2.521707534790039} -09/20/2021 22:38:38 - INFO - __main__ - Step 37658: {'lr': 0.00019947766889819802, 'samples': 1205056, 'steps': 2353, 'loss/train': 1.8041408061981201} -09/20/2021 22:38:39 - INFO - __main__ - Step 37659: {'lr': 0.00019947766889819802, 'samples': 1205088, 'steps': 2353, 'loss/train': 1.7245652675628662} -09/20/2021 22:38:40 - INFO - __main__ - Step 37660: {'lr': 0.00019947766889819802, 'samples': 1205120, 'steps': 2353, 'loss/train': 2.1574673652648926} -09/20/2021 22:38:40 - INFO - __main__ - Step 37661: {'lr': 0.00019947766889819802, 'samples': 1205152, 'steps': 2353, 'loss/train': 2.203484535217285} -09/20/2021 22:38:41 - INFO - __main__ - Step 37662: {'lr': 0.00019947766889819802, 'samples': 1205184, 'steps': 2353, 'loss/train': 2.459378480911255} -09/20/2021 22:38:42 - INFO - __main__ - Step 37663: {'lr': 0.00019947766889819802, 'samples': 1205216, 'steps': 2353, 'loss/train': 2.1880457401275635} -09/20/2021 22:38:43 - INFO - __main__ - Step 37664: {'lr': 0.00019947766889819802, 'samples': 1205248, 'steps': 2353, 'loss/train': 2.277374505996704} -09/20/2021 22:38:44 - INFO - __main__ - Step 37665: {'lr': 0.00019947701757178166, 'samples': 1205280, 'steps': 2354, 'loss/train': 2.629242181777954} -09/20/2021 22:38:45 - INFO - __main__ - Step 37666: {'lr': 0.00019947701757178166, 'samples': 1205312, 'steps': 2354, 'loss/train': 1.8618968725204468} -09/20/2021 22:38:46 - INFO - __main__ - Step 37667: {'lr': 0.00019947701757178166, 'samples': 1205344, 'steps': 2354, 'loss/train': 2.469097137451172} -09/20/2021 22:38:46 - INFO - __main__ - Step 37668: {'lr': 0.00019947701757178166, 'samples': 1205376, 'steps': 2354, 'loss/train': 2.2844133377075195} -09/20/2021 22:38:47 - INFO - __main__ - Step 37669: {'lr': 0.00019947701757178166, 'samples': 1205408, 'steps': 2354, 'loss/train': 2.359016180038452} -09/20/2021 22:38:48 - INFO - __main__ - Step 37670: {'lr': 0.00019947701757178166, 'samples': 1205440, 'steps': 2354, 'loss/train': 2.2899069786071777} -09/20/2021 22:38:49 - INFO - __main__ - Step 37671: {'lr': 0.00019947701757178166, 'samples': 1205472, 'steps': 2354, 'loss/train': 1.7864348888397217} -09/20/2021 22:38:49 - INFO - __main__ - Step 37672: {'lr': 0.00019947701757178166, 'samples': 1205504, 'steps': 2354, 'loss/train': 2.5539071559906006} -09/20/2021 22:38:50 - INFO - __main__ - Step 37673: {'lr': 0.00019947701757178166, 'samples': 1205536, 'steps': 2354, 'loss/train': 1.350190281867981} -09/20/2021 22:38:51 - INFO - __main__ - Step 37674: {'lr': 0.00019947701757178166, 'samples': 1205568, 'steps': 2354, 'loss/train': 1.181350827217102} -09/20/2021 22:38:52 - INFO - __main__ - Step 37675: {'lr': 0.00019947701757178166, 'samples': 1205600, 'steps': 2354, 'loss/train': 2.6758546829223633} -09/20/2021 22:38:52 - INFO - __main__ - Step 37676: {'lr': 0.00019947701757178166, 'samples': 1205632, 'steps': 2354, 'loss/train': 3.0194528102874756} -09/20/2021 22:38:53 - INFO - __main__ - Step 37677: {'lr': 0.00019947701757178166, 'samples': 1205664, 'steps': 2354, 'loss/train': 1.9311683177947998} -09/20/2021 22:38:54 - INFO - __main__ - Step 37678: {'lr': 0.00019947701757178166, 'samples': 1205696, 'steps': 2354, 'loss/train': 1.7855377197265625} -09/20/2021 22:38:55 - INFO - __main__ - Step 37679: {'lr': 0.00019947701757178166, 'samples': 1205728, 'steps': 2354, 'loss/train': 1.8681880235671997} -09/20/2021 22:38:55 - INFO - __main__ - Step 37680: {'lr': 0.00019947701757178166, 'samples': 1205760, 'steps': 2354, 'loss/train': 2.448497772216797} -09/20/2021 22:38:56 - INFO - __main__ - Step 37681: {'lr': 0.00019947636584059374, 'samples': 1205792, 'steps': 2355, 'loss/train': 2.276094436645508} -09/20/2021 22:38:57 - INFO - __main__ - Step 37682: {'lr': 0.00019947636584059374, 'samples': 1205824, 'steps': 2355, 'loss/train': 1.378698468208313} -09/20/2021 22:38:58 - INFO - __main__ - Step 37683: {'lr': 0.00019947636584059374, 'samples': 1205856, 'steps': 2355, 'loss/train': 3.3640575408935547} -09/20/2021 22:38:59 - INFO - __main__ - Step 37684: {'lr': 0.00019947636584059374, 'samples': 1205888, 'steps': 2355, 'loss/train': 2.036844491958618} -09/20/2021 22:38:59 - INFO - __main__ - Step 37685: {'lr': 0.00019947636584059374, 'samples': 1205920, 'steps': 2355, 'loss/train': 1.8323835134506226} -09/20/2021 22:39:00 - INFO - __main__ - Step 37686: {'lr': 0.00019947636584059374, 'samples': 1205952, 'steps': 2355, 'loss/train': 2.2531731128692627} -09/20/2021 22:39:01 - INFO - __main__ - Step 37687: {'lr': 0.00019947636584059374, 'samples': 1205984, 'steps': 2355, 'loss/train': 2.496647596359253} -09/20/2021 22:39:02 - INFO - __main__ - Step 37688: {'lr': 0.00019947636584059374, 'samples': 1206016, 'steps': 2355, 'loss/train': 2.1493642330169678} -09/20/2021 22:39:02 - INFO - __main__ - Step 37689: {'lr': 0.00019947636584059374, 'samples': 1206048, 'steps': 2355, 'loss/train': 1.6618869304656982} -09/20/2021 22:39:03 - INFO - __main__ - Step 37690: {'lr': 0.00019947636584059374, 'samples': 1206080, 'steps': 2355, 'loss/train': 2.8611831665039062} -09/20/2021 22:39:04 - INFO - __main__ - Step 37691: {'lr': 0.00019947636584059374, 'samples': 1206112, 'steps': 2355, 'loss/train': 1.9252873659133911} -09/20/2021 22:39:05 - INFO - __main__ - Step 37692: {'lr': 0.00019947636584059374, 'samples': 1206144, 'steps': 2355, 'loss/train': 1.835592269897461} -09/20/2021 22:39:05 - INFO - __main__ - Step 37693: {'lr': 0.00019947636584059374, 'samples': 1206176, 'steps': 2355, 'loss/train': 0.9207303524017334} -09/20/2021 22:39:06 - INFO - __main__ - Step 37694: {'lr': 0.00019947636584059374, 'samples': 1206208, 'steps': 2355, 'loss/train': 2.2954587936401367} -09/20/2021 22:39:07 - INFO - __main__ - Step 37695: {'lr': 0.00019947636584059374, 'samples': 1206240, 'steps': 2355, 'loss/train': 2.3751370906829834} -09/20/2021 22:39:08 - INFO - __main__ - Step 37696: {'lr': 0.00019947636584059374, 'samples': 1206272, 'steps': 2355, 'loss/train': 2.0925402641296387} -09/20/2021 22:39:09 - INFO - __main__ - Step 37697: {'lr': 0.00019947571370463688, 'samples': 1206304, 'steps': 2356, 'loss/train': 1.4811036586761475} -09/20/2021 22:39:10 - INFO - __main__ - Step 37698: {'lr': 0.00019947571370463688, 'samples': 1206336, 'steps': 2356, 'loss/train': 2.464674949645996} -09/20/2021 22:39:10 - INFO - __main__ - Step 37699: {'lr': 0.00019947571370463688, 'samples': 1206368, 'steps': 2356, 'loss/train': 2.1651647090911865} -09/20/2021 22:39:11 - INFO - __main__ - Step 37700: {'lr': 0.00019947571370463688, 'samples': 1206400, 'steps': 2356, 'loss/train': 2.1023454666137695} -09/20/2021 22:39:12 - INFO - __main__ - Step 37701: {'lr': 0.00019947571370463688, 'samples': 1206432, 'steps': 2356, 'loss/train': 1.5014005899429321} -09/20/2021 22:39:13 - INFO - __main__ - Step 37702: {'lr': 0.00019947571370463688, 'samples': 1206464, 'steps': 2356, 'loss/train': 2.057880163192749} -09/20/2021 22:39:13 - INFO - __main__ - Step 37703: {'lr': 0.00019947571370463688, 'samples': 1206496, 'steps': 2356, 'loss/train': 1.6143786907196045} -09/20/2021 22:39:14 - INFO - __main__ - Step 37704: {'lr': 0.00019947571370463688, 'samples': 1206528, 'steps': 2356, 'loss/train': 2.14421010017395} -09/20/2021 22:39:15 - INFO - __main__ - Step 37705: {'lr': 0.00019947571370463688, 'samples': 1206560, 'steps': 2356, 'loss/train': 3.3423995971679688} -09/20/2021 22:39:16 - INFO - __main__ - Step 37706: {'lr': 0.00019947571370463688, 'samples': 1206592, 'steps': 2356, 'loss/train': 2.0928995609283447} -09/20/2021 22:39:16 - INFO - __main__ - Step 37707: {'lr': 0.00019947571370463688, 'samples': 1206624, 'steps': 2356, 'loss/train': 2.9027740955352783} -09/20/2021 22:39:17 - INFO - __main__ - Step 37708: {'lr': 0.00019947571370463688, 'samples': 1206656, 'steps': 2356, 'loss/train': 1.6054528951644897} -09/20/2021 22:39:18 - INFO - __main__ - Step 37709: {'lr': 0.00019947571370463688, 'samples': 1206688, 'steps': 2356, 'loss/train': 2.4780139923095703} -09/20/2021 22:39:19 - INFO - __main__ - Step 37710: {'lr': 0.00019947571370463688, 'samples': 1206720, 'steps': 2356, 'loss/train': 2.3262534141540527} -09/20/2021 22:39:19 - INFO - __main__ - Step 37711: {'lr': 0.00019947571370463688, 'samples': 1206752, 'steps': 2356, 'loss/train': 1.6975302696228027} -09/20/2021 22:39:20 - INFO - __main__ - Step 37712: {'lr': 0.00019947571370463688, 'samples': 1206784, 'steps': 2356, 'loss/train': 1.9724479913711548} -09/20/2021 22:39:21 - INFO - __main__ - Step 37713: {'lr': 0.0001994750611639137, 'samples': 1206816, 'steps': 2357, 'loss/train': 2.391503095626831} -09/20/2021 22:39:22 - INFO - __main__ - Step 37714: {'lr': 0.0001994750611639137, 'samples': 1206848, 'steps': 2357, 'loss/train': 2.9834513664245605} -09/20/2021 22:39:23 - INFO - __main__ - Step 37715: {'lr': 0.0001994750611639137, 'samples': 1206880, 'steps': 2357, 'loss/train': 2.1193060874938965} -09/20/2021 22:39:23 - INFO - __main__ - Step 37716: {'lr': 0.0001994750611639137, 'samples': 1206912, 'steps': 2357, 'loss/train': 3.046213388442993} -09/20/2021 22:39:24 - INFO - __main__ - Step 37717: {'lr': 0.0001994750611639137, 'samples': 1206944, 'steps': 2357, 'loss/train': 2.150465965270996} -09/20/2021 22:39:25 - INFO - __main__ - Step 37718: {'lr': 0.0001994750611639137, 'samples': 1206976, 'steps': 2357, 'loss/train': 2.604088068008423} -09/20/2021 22:39:26 - INFO - __main__ - Step 37719: {'lr': 0.0001994750611639137, 'samples': 1207008, 'steps': 2357, 'loss/train': 1.9745618104934692} -09/20/2021 22:39:26 - INFO - __main__ - Step 37720: {'lr': 0.0001994750611639137, 'samples': 1207040, 'steps': 2357, 'loss/train': 2.309189796447754} -09/20/2021 22:39:27 - INFO - __main__ - Step 37721: {'lr': 0.0001994750611639137, 'samples': 1207072, 'steps': 2357, 'loss/train': 1.7184712886810303} -09/20/2021 22:39:28 - INFO - __main__ - Step 37722: {'lr': 0.0001994750611639137, 'samples': 1207104, 'steps': 2357, 'loss/train': 2.1007742881774902} -09/20/2021 22:39:29 - INFO - __main__ - Step 37723: {'lr': 0.0001994750611639137, 'samples': 1207136, 'steps': 2357, 'loss/train': 2.4061851501464844} -09/20/2021 22:39:29 - INFO - __main__ - Step 37724: {'lr': 0.0001994750611639137, 'samples': 1207168, 'steps': 2357, 'loss/train': 2.6319658756256104} -09/20/2021 22:39:31 - INFO - __main__ - Step 37725: {'lr': 0.0001994750611639137, 'samples': 1207200, 'steps': 2357, 'loss/train': 2.3283071517944336} -09/20/2021 22:39:31 - INFO - __main__ - Step 37726: {'lr': 0.0001994750611639137, 'samples': 1207232, 'steps': 2357, 'loss/train': 2.7523064613342285} -09/20/2021 22:39:32 - INFO - __main__ - Step 37727: {'lr': 0.0001994750611639137, 'samples': 1207264, 'steps': 2357, 'loss/train': 1.921033501625061} -09/20/2021 22:39:33 - INFO - __main__ - Step 37728: {'lr': 0.0001994750611639137, 'samples': 1207296, 'steps': 2357, 'loss/train': 1.9155912399291992} -09/20/2021 22:39:34 - INFO - __main__ - Step 37729: {'lr': 0.00019947440821842686, 'samples': 1207328, 'steps': 2358, 'loss/train': 2.7932980060577393} -09/20/2021 22:39:35 - INFO - __main__ - Step 37730: {'lr': 0.00019947440821842686, 'samples': 1207360, 'steps': 2358, 'loss/train': 1.7547909021377563} -09/20/2021 22:39:35 - INFO - __main__ - Step 37731: {'lr': 0.00019947440821842686, 'samples': 1207392, 'steps': 2358, 'loss/train': 1.1861292123794556} -09/20/2021 22:39:36 - INFO - __main__ - Step 37732: {'lr': 0.00019947440821842686, 'samples': 1207424, 'steps': 2358, 'loss/train': 1.9381145238876343} -09/20/2021 22:39:37 - INFO - __main__ - Step 37733: {'lr': 0.00019947440821842686, 'samples': 1207456, 'steps': 2358, 'loss/train': 1.5582600831985474} -09/20/2021 22:39:38 - INFO - __main__ - Step 37734: {'lr': 0.00019947440821842686, 'samples': 1207488, 'steps': 2358, 'loss/train': 1.7070484161376953} -09/20/2021 22:39:38 - INFO - __main__ - Step 37735: {'lr': 0.00019947440821842686, 'samples': 1207520, 'steps': 2358, 'loss/train': 2.0431907176971436} -09/20/2021 22:39:39 - INFO - __main__ - Step 37736: {'lr': 0.00019947440821842686, 'samples': 1207552, 'steps': 2358, 'loss/train': 1.512825608253479} -09/20/2021 22:39:40 - INFO - __main__ - Step 37737: {'lr': 0.00019947440821842686, 'samples': 1207584, 'steps': 2358, 'loss/train': 2.470749855041504} -09/20/2021 22:39:41 - INFO - __main__ - Step 37738: {'lr': 0.00019947440821842686, 'samples': 1207616, 'steps': 2358, 'loss/train': 2.4889538288116455} -09/20/2021 22:39:41 - INFO - __main__ - Step 37739: {'lr': 0.00019947440821842686, 'samples': 1207648, 'steps': 2358, 'loss/train': 2.437778949737549} -09/20/2021 22:39:42 - INFO - __main__ - Step 37740: {'lr': 0.00019947440821842686, 'samples': 1207680, 'steps': 2358, 'loss/train': 1.609511375427246} -09/20/2021 22:39:43 - INFO - __main__ - Step 37741: {'lr': 0.00019947440821842686, 'samples': 1207712, 'steps': 2358, 'loss/train': 1.4846482276916504} -09/20/2021 22:39:44 - INFO - __main__ - Step 37742: {'lr': 0.00019947440821842686, 'samples': 1207744, 'steps': 2358, 'loss/train': 1.8197731971740723} -09/20/2021 22:39:44 - INFO - __main__ - Step 37743: {'lr': 0.00019947440821842686, 'samples': 1207776, 'steps': 2358, 'loss/train': 2.194905996322632} -09/20/2021 22:39:45 - INFO - __main__ - Step 37744: {'lr': 0.00019947440821842686, 'samples': 1207808, 'steps': 2358, 'loss/train': 2.6022789478302} -09/20/2021 22:39:46 - INFO - __main__ - Step 37745: {'lr': 0.0001994737548681791, 'samples': 1207840, 'steps': 2359, 'loss/train': 2.8486690521240234} -09/20/2021 22:39:47 - INFO - __main__ - Step 37746: {'lr': 0.0001994737548681791, 'samples': 1207872, 'steps': 2359, 'loss/train': 1.328084945678711} -09/20/2021 22:39:47 - INFO - __main__ - Step 37747: {'lr': 0.0001994737548681791, 'samples': 1207904, 'steps': 2359, 'loss/train': 1.0732128620147705} -09/20/2021 22:39:48 - INFO - __main__ - Step 37748: {'lr': 0.0001994737548681791, 'samples': 1207936, 'steps': 2359, 'loss/train': 2.4002928733825684} -09/20/2021 22:39:49 - INFO - __main__ - Step 37749: {'lr': 0.0001994737548681791, 'samples': 1207968, 'steps': 2359, 'loss/train': 2.4710257053375244} -09/20/2021 22:39:50 - INFO - __main__ - Step 37750: {'lr': 0.0001994737548681791, 'samples': 1208000, 'steps': 2359, 'loss/train': 2.182802200317383} -09/20/2021 22:39:50 - INFO - __main__ - Step 37751: {'lr': 0.0001994737548681791, 'samples': 1208032, 'steps': 2359, 'loss/train': 0.5792672634124756} -09/20/2021 22:39:51 - INFO - __main__ - Step 37752: {'lr': 0.0001994737548681791, 'samples': 1208064, 'steps': 2359, 'loss/train': 1.755230188369751} -09/20/2021 22:39:52 - INFO - __main__ - Step 37753: {'lr': 0.0001994737548681791, 'samples': 1208096, 'steps': 2359, 'loss/train': 2.1259827613830566} -09/20/2021 22:39:53 - INFO - __main__ - Step 37754: {'lr': 0.0001994737548681791, 'samples': 1208128, 'steps': 2359, 'loss/train': 2.619537115097046} -09/20/2021 22:39:53 - INFO - __main__ - Step 37755: {'lr': 0.0001994737548681791, 'samples': 1208160, 'steps': 2359, 'loss/train': 2.3237462043762207} -09/20/2021 22:39:55 - INFO - __main__ - Step 37756: {'lr': 0.0001994737548681791, 'samples': 1208192, 'steps': 2359, 'loss/train': 1.6637866497039795} -09/20/2021 22:39:56 - INFO - __main__ - Step 37757: {'lr': 0.0001994737548681791, 'samples': 1208224, 'steps': 2359, 'loss/train': 1.6807746887207031} -09/20/2021 22:39:56 - INFO - __main__ - Step 37758: {'lr': 0.0001994737548681791, 'samples': 1208256, 'steps': 2359, 'loss/train': 2.1027274131774902} -09/20/2021 22:39:57 - INFO - __main__ - Step 37759: {'lr': 0.0001994737548681791, 'samples': 1208288, 'steps': 2359, 'loss/train': 1.5100842714309692} -09/20/2021 22:39:58 - INFO - __main__ - Step 37760: {'lr': 0.0001994737548681791, 'samples': 1208320, 'steps': 2359, 'loss/train': 2.470857620239258} -09/20/2021 22:39:59 - INFO - __main__ - Step 37761: {'lr': 0.00019947310111317296, 'samples': 1208352, 'steps': 2360, 'loss/train': 2.2998528480529785} -09/20/2021 22:40:00 - INFO - __main__ - Step 37762: {'lr': 0.00019947310111317296, 'samples': 1208384, 'steps': 2360, 'loss/train': 2.474195718765259} -09/20/2021 22:40:00 - INFO - __main__ - Step 37763: {'lr': 0.00019947310111317296, 'samples': 1208416, 'steps': 2360, 'loss/train': 1.6152403354644775} -09/20/2021 22:40:01 - INFO - __main__ - Step 37764: {'lr': 0.00019947310111317296, 'samples': 1208448, 'steps': 2360, 'loss/train': 2.3016581535339355} -09/20/2021 22:40:02 - INFO - __main__ - Step 37765: {'lr': 0.00019947310111317296, 'samples': 1208480, 'steps': 2360, 'loss/train': 1.4928951263427734} -09/20/2021 22:40:03 - INFO - __main__ - Step 37766: {'lr': 0.00019947310111317296, 'samples': 1208512, 'steps': 2360, 'loss/train': 1.5530661344528198} -09/20/2021 22:40:03 - INFO - __main__ - Step 37767: {'lr': 0.00019947310111317296, 'samples': 1208544, 'steps': 2360, 'loss/train': 1.9454991817474365} -09/20/2021 22:40:04 - INFO - __main__ - Step 37768: {'lr': 0.00019947310111317296, 'samples': 1208576, 'steps': 2360, 'loss/train': 2.0321204662323} -09/20/2021 22:40:05 - INFO - __main__ - Step 37769: {'lr': 0.00019947310111317296, 'samples': 1208608, 'steps': 2360, 'loss/train': 2.0087392330169678} -09/20/2021 22:40:06 - INFO - __main__ - Step 37770: {'lr': 0.00019947310111317296, 'samples': 1208640, 'steps': 2360, 'loss/train': 1.922488808631897} -09/20/2021 22:40:06 - INFO - __main__ - Step 37771: {'lr': 0.00019947310111317296, 'samples': 1208672, 'steps': 2360, 'loss/train': 2.2773616313934326} -09/20/2021 22:40:07 - INFO - __main__ - Step 37772: {'lr': 0.00019947310111317296, 'samples': 1208704, 'steps': 2360, 'loss/train': 2.2187047004699707} -09/20/2021 22:40:08 - INFO - __main__ - Step 37773: {'lr': 0.00019947310111317296, 'samples': 1208736, 'steps': 2360, 'loss/train': 2.5840868949890137} -09/20/2021 22:40:09 - INFO - __main__ - Step 37774: {'lr': 0.00019947310111317296, 'samples': 1208768, 'steps': 2360, 'loss/train': 2.886248826980591} -09/20/2021 22:40:09 - INFO - __main__ - Step 37775: {'lr': 0.00019947310111317296, 'samples': 1208800, 'steps': 2360, 'loss/train': 2.021592378616333} -09/20/2021 22:40:10 - INFO - __main__ - Step 37776: {'lr': 0.00019947310111317296, 'samples': 1208832, 'steps': 2360, 'loss/train': 2.054772138595581} -09/20/2021 22:40:11 - INFO - __main__ - Step 37777: {'lr': 0.00019947244695341118, 'samples': 1208864, 'steps': 2361, 'loss/train': 1.9011415243148804} -09/20/2021 22:40:12 - INFO - __main__ - Step 37778: {'lr': 0.00019947244695341118, 'samples': 1208896, 'steps': 2361, 'loss/train': 1.8346848487854004} -09/20/2021 22:40:12 - INFO - __main__ - Step 37779: {'lr': 0.00019947244695341118, 'samples': 1208928, 'steps': 2361, 'loss/train': 1.1930451393127441} -09/20/2021 22:40:13 - INFO - __main__ - Step 37780: {'lr': 0.00019947244695341118, 'samples': 1208960, 'steps': 2361, 'loss/train': 1.3328156471252441} -09/20/2021 22:40:14 - INFO - __main__ - Step 37781: {'lr': 0.00019947244695341118, 'samples': 1208992, 'steps': 2361, 'loss/train': 2.6981778144836426} -09/20/2021 22:40:15 - INFO - __main__ - Step 37782: {'lr': 0.00019947244695341118, 'samples': 1209024, 'steps': 2361, 'loss/train': 1.9045335054397583} -09/20/2021 22:40:15 - INFO - __main__ - Step 37783: {'lr': 0.00019947244695341118, 'samples': 1209056, 'steps': 2361, 'loss/train': 2.3534069061279297} -09/20/2021 22:40:16 - INFO - __main__ - Step 37784: {'lr': 0.00019947244695341118, 'samples': 1209088, 'steps': 2361, 'loss/train': 2.5159385204315186} -09/20/2021 22:40:17 - INFO - __main__ - Step 37785: {'lr': 0.00019947244695341118, 'samples': 1209120, 'steps': 2361, 'loss/train': 2.712033271789551} -09/20/2021 22:40:18 - INFO - __main__ - Step 37786: {'lr': 0.00019947244695341118, 'samples': 1209152, 'steps': 2361, 'loss/train': 2.1603105068206787} -09/20/2021 22:40:18 - INFO - __main__ - Step 37787: {'lr': 0.00019947244695341118, 'samples': 1209184, 'steps': 2361, 'loss/train': 3.0769128799438477} -09/20/2021 22:40:19 - INFO - __main__ - Step 37788: {'lr': 0.00019947244695341118, 'samples': 1209216, 'steps': 2361, 'loss/train': 2.035776138305664} -09/20/2021 22:40:20 - INFO - __main__ - Step 37789: {'lr': 0.00019947244695341118, 'samples': 1209248, 'steps': 2361, 'loss/train': 2.280062675476074} -09/20/2021 22:40:21 - INFO - __main__ - Step 37790: {'lr': 0.00019947244695341118, 'samples': 1209280, 'steps': 2361, 'loss/train': 1.9818538427352905} -09/20/2021 22:40:21 - INFO - __main__ - Step 37791: {'lr': 0.00019947244695341118, 'samples': 1209312, 'steps': 2361, 'loss/train': 4.632205963134766} -09/20/2021 22:40:23 - INFO - __main__ - Step 37792: {'lr': 0.00019947244695341118, 'samples': 1209344, 'steps': 2361, 'loss/train': 3.708033561706543} -09/20/2021 22:40:24 - INFO - __main__ - Step 37793: {'lr': 0.00019947179238889642, 'samples': 1209376, 'steps': 2362, 'loss/train': 0.2418796569108963} -09/20/2021 22:40:24 - INFO - __main__ - Step 37794: {'lr': 0.00019947179238889642, 'samples': 1209408, 'steps': 2362, 'loss/train': 0.17522960901260376} -09/20/2021 22:40:25 - INFO - __main__ - Step 37795: {'lr': 0.00019947179238889642, 'samples': 1209440, 'steps': 2362, 'loss/train': 0.3642621338367462} -09/20/2021 22:40:26 - INFO - __main__ - Step 37796: {'lr': 0.00019947179238889642, 'samples': 1209472, 'steps': 2362, 'loss/train': 0.1337370127439499} -09/20/2021 22:40:27 - INFO - __main__ - Step 37797: {'lr': 0.00019947179238889642, 'samples': 1209504, 'steps': 2362, 'loss/train': 0.38325196504592896} -09/20/2021 22:40:27 - INFO - __main__ - Step 37798: {'lr': 0.00019947179238889642, 'samples': 1209536, 'steps': 2362, 'loss/train': 1.6666500568389893} -09/20/2021 22:40:28 - INFO - __main__ - Step 37799: {'lr': 0.00019947179238889642, 'samples': 1209568, 'steps': 2362, 'loss/train': 1.5674327611923218} -09/20/2021 22:40:29 - INFO - __main__ - Step 37800: {'lr': 0.00019947179238889642, 'samples': 1209600, 'steps': 2362, 'loss/train': 2.7609288692474365} -09/20/2021 22:40:30 - INFO - __main__ - Step 37801: {'lr': 0.00019947179238889642, 'samples': 1209632, 'steps': 2362, 'loss/train': 1.9203170537948608} -09/20/2021 22:40:30 - INFO - __main__ - Step 37802: {'lr': 0.00019947179238889642, 'samples': 1209664, 'steps': 2362, 'loss/train': 1.7695902585983276} -09/20/2021 22:40:31 - INFO - __main__ - Step 37803: {'lr': 0.00019947179238889642, 'samples': 1209696, 'steps': 2362, 'loss/train': 2.1483075618743896} -09/20/2021 22:40:32 - INFO - __main__ - Step 37804: {'lr': 0.00019947179238889642, 'samples': 1209728, 'steps': 2362, 'loss/train': 2.280168294906616} -09/20/2021 22:40:33 - INFO - __main__ - Step 37805: {'lr': 0.00019947179238889642, 'samples': 1209760, 'steps': 2362, 'loss/train': 2.1626975536346436} -09/20/2021 22:40:33 - INFO - __main__ - Step 37806: {'lr': 0.00019947179238889642, 'samples': 1209792, 'steps': 2362, 'loss/train': 2.519185781478882} -09/20/2021 22:40:34 - INFO - __main__ - Step 37807: {'lr': 0.00019947179238889642, 'samples': 1209824, 'steps': 2362, 'loss/train': 2.079038619995117} -09/20/2021 22:40:35 - INFO - __main__ - Step 37808: {'lr': 0.00019947179238889642, 'samples': 1209856, 'steps': 2362, 'loss/train': 2.327944040298462} -09/20/2021 22:40:36 - INFO - __main__ - Step 37809: {'lr': 0.0001994711374196313, 'samples': 1209888, 'steps': 2363, 'loss/train': 1.4507153034210205} -09/20/2021 22:40:37 - INFO - __main__ - Step 37810: {'lr': 0.0001994711374196313, 'samples': 1209920, 'steps': 2363, 'loss/train': 1.432961106300354} -09/20/2021 22:40:37 - INFO - __main__ - Step 37811: {'lr': 0.0001994711374196313, 'samples': 1209952, 'steps': 2363, 'loss/train': 0.37714940309524536} -09/20/2021 22:40:38 - INFO - __main__ - Step 37812: {'lr': 0.0001994711374196313, 'samples': 1209984, 'steps': 2363, 'loss/train': 2.155813217163086} -09/20/2021 22:40:39 - INFO - __main__ - Step 37813: {'lr': 0.0001994711374196313, 'samples': 1210016, 'steps': 2363, 'loss/train': 0.5374304056167603} -09/20/2021 22:40:40 - INFO - __main__ - Step 37814: {'lr': 0.0001994711374196313, 'samples': 1210048, 'steps': 2363, 'loss/train': 2.5226361751556396} -09/20/2021 22:40:40 - INFO - __main__ - Step 37815: {'lr': 0.0001994711374196313, 'samples': 1210080, 'steps': 2363, 'loss/train': 0.63106769323349} -09/20/2021 22:40:41 - INFO - __main__ - Step 37816: {'lr': 0.0001994711374196313, 'samples': 1210112, 'steps': 2363, 'loss/train': 1.397774338722229} -09/20/2021 22:40:42 - INFO - __main__ - Step 37817: {'lr': 0.0001994711374196313, 'samples': 1210144, 'steps': 2363, 'loss/train': 1.8245844841003418} -09/20/2021 22:40:43 - INFO - __main__ - Step 37818: {'lr': 0.0001994711374196313, 'samples': 1210176, 'steps': 2363, 'loss/train': 2.7484564781188965} -09/20/2021 22:40:43 - INFO - __main__ - Step 37819: {'lr': 0.0001994711374196313, 'samples': 1210208, 'steps': 2363, 'loss/train': 2.306077003479004} -09/20/2021 22:40:44 - INFO - __main__ - Step 37820: {'lr': 0.0001994711374196313, 'samples': 1210240, 'steps': 2363, 'loss/train': 1.9603500366210938} -09/20/2021 22:40:45 - INFO - __main__ - Step 37821: {'lr': 0.0001994711374196313, 'samples': 1210272, 'steps': 2363, 'loss/train': 2.91563081741333} -09/20/2021 22:40:46 - INFO - __main__ - Step 37822: {'lr': 0.0001994711374196313, 'samples': 1210304, 'steps': 2363, 'loss/train': 3.0405497550964355} -09/20/2021 22:40:46 - INFO - __main__ - Step 37823: {'lr': 0.0001994711374196313, 'samples': 1210336, 'steps': 2363, 'loss/train': 0.3601324260234833} -09/20/2021 22:40:48 - INFO - __main__ - Step 37824: {'lr': 0.0001994711374196313, 'samples': 1210368, 'steps': 2363, 'loss/train': 0.46449437737464905} -09/20/2021 22:40:49 - INFO - __main__ - Step 37825: {'lr': 0.00019947048204561852, 'samples': 1210400, 'steps': 2364, 'loss/train': 2.0184850692749023} -09/20/2021 22:40:49 - INFO - __main__ - Step 37826: {'lr': 0.00019947048204561852, 'samples': 1210432, 'steps': 2364, 'loss/train': 2.3406314849853516} -09/20/2021 22:40:50 - INFO - __main__ - Step 37827: {'lr': 0.00019947048204561852, 'samples': 1210464, 'steps': 2364, 'loss/train': 1.965713620185852} -09/20/2021 22:40:51 - INFO - __main__ - Step 37828: {'lr': 0.00019947048204561852, 'samples': 1210496, 'steps': 2364, 'loss/train': 2.355626344680786} -09/20/2021 22:40:52 - INFO - __main__ - Step 37829: {'lr': 0.00019947048204561852, 'samples': 1210528, 'steps': 2364, 'loss/train': 2.480332374572754} -09/20/2021 22:40:52 - INFO - __main__ - Step 37830: {'lr': 0.00019947048204561852, 'samples': 1210560, 'steps': 2364, 'loss/train': 2.42830753326416} -09/20/2021 22:40:53 - INFO - __main__ - Step 37831: {'lr': 0.00019947048204561852, 'samples': 1210592, 'steps': 2364, 'loss/train': 2.2864556312561035} -09/20/2021 22:40:54 - INFO - __main__ - Step 37832: {'lr': 0.00019947048204561852, 'samples': 1210624, 'steps': 2364, 'loss/train': 2.3343241214752197} -09/20/2021 22:40:55 - INFO - __main__ - Step 37833: {'lr': 0.00019947048204561852, 'samples': 1210656, 'steps': 2364, 'loss/train': 2.563478469848633} -09/20/2021 22:40:55 - INFO - __main__ - Step 37834: {'lr': 0.00019947048204561852, 'samples': 1210688, 'steps': 2364, 'loss/train': 2.401798725128174} -09/20/2021 22:40:56 - INFO - __main__ - Step 37835: {'lr': 0.00019947048204561852, 'samples': 1210720, 'steps': 2364, 'loss/train': 3.4262197017669678} -09/20/2021 22:40:57 - INFO - __main__ - Step 37836: {'lr': 0.00019947048204561852, 'samples': 1210752, 'steps': 2364, 'loss/train': 2.290377378463745} -09/20/2021 22:40:58 - INFO - __main__ - Step 37837: {'lr': 0.00019947048204561852, 'samples': 1210784, 'steps': 2364, 'loss/train': 2.746145009994507} -09/20/2021 22:40:58 - INFO - __main__ - Step 37838: {'lr': 0.00019947048204561852, 'samples': 1210816, 'steps': 2364, 'loss/train': 1.0388928651809692} -09/20/2021 22:40:59 - INFO - __main__ - Step 37839: {'lr': 0.00019947048204561852, 'samples': 1210848, 'steps': 2364, 'loss/train': 2.5556066036224365} -09/20/2021 22:41:00 - INFO - __main__ - Step 37840: {'lr': 0.00019947048204561852, 'samples': 1210880, 'steps': 2364, 'loss/train': 2.66719388961792} -09/20/2021 22:41:01 - INFO - __main__ - Step 37841: {'lr': 0.00019946982626686073, 'samples': 1210912, 'steps': 2365, 'loss/train': 1.8344568014144897} -09/20/2021 22:41:01 - INFO - __main__ - Step 37842: {'lr': 0.00019946982626686073, 'samples': 1210944, 'steps': 2365, 'loss/train': 2.3919715881347656} -09/20/2021 22:41:02 - INFO - __main__ - Step 37843: {'lr': 0.00019946982626686073, 'samples': 1210976, 'steps': 2365, 'loss/train': 2.1931018829345703} -09/20/2021 22:41:03 - INFO - __main__ - Step 37844: {'lr': 0.00019946982626686073, 'samples': 1211008, 'steps': 2365, 'loss/train': 0.5637112855911255} -09/20/2021 22:41:04 - INFO - __main__ - Step 37845: {'lr': 0.00019946982626686073, 'samples': 1211040, 'steps': 2365, 'loss/train': 2.097673177719116} -09/20/2021 22:41:04 - INFO - __main__ - Step 37846: {'lr': 0.00019946982626686073, 'samples': 1211072, 'steps': 2365, 'loss/train': 2.3214378356933594} -09/20/2021 22:41:05 - INFO - __main__ - Step 37847: {'lr': 0.00019946982626686073, 'samples': 1211104, 'steps': 2365, 'loss/train': 2.804849624633789} -09/20/2021 22:41:06 - INFO - __main__ - Step 37848: {'lr': 0.00019946982626686073, 'samples': 1211136, 'steps': 2365, 'loss/train': 2.3437936305999756} -09/20/2021 22:41:07 - INFO - __main__ - Step 37849: {'lr': 0.00019946982626686073, 'samples': 1211168, 'steps': 2365, 'loss/train': 2.266341209411621} -09/20/2021 22:41:07 - INFO - __main__ - Step 37850: {'lr': 0.00019946982626686073, 'samples': 1211200, 'steps': 2365, 'loss/train': 1.6666624546051025} -09/20/2021 22:41:08 - INFO - __main__ - Step 37851: {'lr': 0.00019946982626686073, 'samples': 1211232, 'steps': 2365, 'loss/train': 2.435892343521118} -09/20/2021 22:41:09 - INFO - __main__ - Step 37852: {'lr': 0.00019946982626686073, 'samples': 1211264, 'steps': 2365, 'loss/train': 1.442787528038025} -09/20/2021 22:41:10 - INFO - __main__ - Step 37853: {'lr': 0.00019946982626686073, 'samples': 1211296, 'steps': 2365, 'loss/train': 1.3911769390106201} -09/20/2021 22:41:10 - INFO - __main__ - Step 37854: {'lr': 0.00019946982626686073, 'samples': 1211328, 'steps': 2365, 'loss/train': 1.5345326662063599} -09/20/2021 22:41:11 - INFO - __main__ - Step 37855: {'lr': 0.00019946982626686073, 'samples': 1211360, 'steps': 2365, 'loss/train': 2.4982500076293945} -09/20/2021 22:41:13 - INFO - __main__ - Step 37856: {'lr': 0.00019946982626686073, 'samples': 1211392, 'steps': 2365, 'loss/train': 2.655451536178589} -09/20/2021 22:41:14 - INFO - __main__ - Step 37857: {'lr': 0.0001994691700833606, 'samples': 1211424, 'steps': 2366, 'loss/train': 2.3537518978118896} -09/20/2021 22:41:15 - INFO - __main__ - Step 37858: {'lr': 0.0001994691700833606, 'samples': 1211456, 'steps': 2366, 'loss/train': 1.9569565057754517} -09/20/2021 22:41:16 - INFO - __main__ - Step 37859: {'lr': 0.0001994691700833606, 'samples': 1211488, 'steps': 2366, 'loss/train': 1.8448684215545654} -09/20/2021 22:41:16 - INFO - __main__ - Step 37860: {'lr': 0.0001994691700833606, 'samples': 1211520, 'steps': 2366, 'loss/train': 2.3477773666381836} -09/20/2021 22:41:17 - INFO - __main__ - Step 37861: {'lr': 0.0001994691700833606, 'samples': 1211552, 'steps': 2366, 'loss/train': 2.179483652114868} -09/20/2021 22:41:18 - INFO - __main__ - Step 37862: {'lr': 0.0001994691700833606, 'samples': 1211584, 'steps': 2366, 'loss/train': 2.543814182281494} -09/20/2021 22:41:19 - INFO - __main__ - Step 37863: {'lr': 0.0001994691700833606, 'samples': 1211616, 'steps': 2366, 'loss/train': 2.706674814224243} -09/20/2021 22:41:19 - INFO - __main__ - Step 37864: {'lr': 0.0001994691700833606, 'samples': 1211648, 'steps': 2366, 'loss/train': 2.142000675201416} -09/20/2021 22:41:20 - INFO - __main__ - Step 37865: {'lr': 0.0001994691700833606, 'samples': 1211680, 'steps': 2366, 'loss/train': 1.3577661514282227} -09/20/2021 22:41:21 - INFO - __main__ - Step 37866: {'lr': 0.0001994691700833606, 'samples': 1211712, 'steps': 2366, 'loss/train': 1.8388793468475342} -09/20/2021 22:41:22 - INFO - __main__ - Step 37867: {'lr': 0.0001994691700833606, 'samples': 1211744, 'steps': 2366, 'loss/train': 3.345323324203491} -09/20/2021 22:41:23 - INFO - __main__ - Step 37868: {'lr': 0.0001994691700833606, 'samples': 1211776, 'steps': 2366, 'loss/train': 1.7535299062728882} -09/20/2021 22:41:23 - INFO - __main__ - Step 37869: {'lr': 0.0001994691700833606, 'samples': 1211808, 'steps': 2366, 'loss/train': 1.7459133863449097} -09/20/2021 22:41:24 - INFO - __main__ - Step 37870: {'lr': 0.0001994691700833606, 'samples': 1211840, 'steps': 2366, 'loss/train': 2.8883986473083496} -09/20/2021 22:41:25 - INFO - __main__ - Step 37871: {'lr': 0.0001994691700833606, 'samples': 1211872, 'steps': 2366, 'loss/train': 2.6242613792419434} -09/20/2021 22:41:26 - INFO - __main__ - Step 37872: {'lr': 0.0001994691700833606, 'samples': 1211904, 'steps': 2366, 'loss/train': 1.8878309726715088} -09/20/2021 22:41:26 - INFO - __main__ - Step 37873: {'lr': 0.0001994685134951208, 'samples': 1211936, 'steps': 2367, 'loss/train': 2.220355272293091} -09/20/2021 22:41:27 - INFO - __main__ - Step 37874: {'lr': 0.0001994685134951208, 'samples': 1211968, 'steps': 2367, 'loss/train': 1.8668535947799683} -09/20/2021 22:41:28 - INFO - __main__ - Step 37875: {'lr': 0.0001994685134951208, 'samples': 1212000, 'steps': 2367, 'loss/train': 2.2773876190185547} -09/20/2021 22:41:29 - INFO - __main__ - Step 37876: {'lr': 0.0001994685134951208, 'samples': 1212032, 'steps': 2367, 'loss/train': 0.7419587969779968} -09/20/2021 22:41:29 - INFO - __main__ - Step 37877: {'lr': 0.0001994685134951208, 'samples': 1212064, 'steps': 2367, 'loss/train': 0.8416272401809692} -09/20/2021 22:41:30 - INFO - __main__ - Step 37878: {'lr': 0.0001994685134951208, 'samples': 1212096, 'steps': 2367, 'loss/train': 0.20868085324764252} -09/20/2021 22:41:31 - INFO - __main__ - Step 37879: {'lr': 0.0001994685134951208, 'samples': 1212128, 'steps': 2367, 'loss/train': 0.24591787159442902} -09/20/2021 22:41:32 - INFO - __main__ - Step 37880: {'lr': 0.0001994685134951208, 'samples': 1212160, 'steps': 2367, 'loss/train': 0.5406654477119446} -09/20/2021 22:41:32 - INFO - __main__ - Step 37881: {'lr': 0.0001994685134951208, 'samples': 1212192, 'steps': 2367, 'loss/train': 0.30687132477760315} -09/20/2021 22:41:33 - INFO - __main__ - Step 37882: {'lr': 0.0001994685134951208, 'samples': 1212224, 'steps': 2367, 'loss/train': 0.4096651077270508} -09/20/2021 22:41:34 - INFO - __main__ - Step 37883: {'lr': 0.0001994685134951208, 'samples': 1212256, 'steps': 2367, 'loss/train': 1.8442916870117188} -09/20/2021 22:41:35 - INFO - __main__ - Step 37884: {'lr': 0.0001994685134951208, 'samples': 1212288, 'steps': 2367, 'loss/train': 2.240985631942749} -09/20/2021 22:41:35 - INFO - __main__ - Step 37885: {'lr': 0.0001994685134951208, 'samples': 1212320, 'steps': 2367, 'loss/train': 2.5581212043762207} -09/20/2021 22:41:36 - INFO - __main__ - Step 37886: {'lr': 0.0001994685134951208, 'samples': 1212352, 'steps': 2367, 'loss/train': 1.8634694814682007} -09/20/2021 22:41:37 - INFO - __main__ - Step 37887: {'lr': 0.0001994685134951208, 'samples': 1212384, 'steps': 2367, 'loss/train': 2.040199041366577} -09/20/2021 22:41:38 - INFO - __main__ - Step 37888: {'lr': 0.0001994685134951208, 'samples': 1212416, 'steps': 2367, 'loss/train': 3.099691152572632} -09/20/2021 22:41:39 - INFO - __main__ - Step 37889: {'lr': 0.000199467856502144, 'samples': 1212448, 'steps': 2368, 'loss/train': 1.9667092561721802} -09/20/2021 22:41:40 - INFO - __main__ - Step 37890: {'lr': 0.000199467856502144, 'samples': 1212480, 'steps': 2368, 'loss/train': 2.0549228191375732} -09/20/2021 22:41:41 - INFO - __main__ - Step 37891: {'lr': 0.000199467856502144, 'samples': 1212512, 'steps': 2368, 'loss/train': 1.9080044031143188} -09/20/2021 22:41:41 - INFO - __main__ - Step 37892: {'lr': 0.000199467856502144, 'samples': 1212544, 'steps': 2368, 'loss/train': 2.3004226684570312} -09/20/2021 22:41:42 - INFO - __main__ - Step 37893: {'lr': 0.000199467856502144, 'samples': 1212576, 'steps': 2368, 'loss/train': 1.7941396236419678} -09/20/2021 22:41:43 - INFO - __main__ - Step 37894: {'lr': 0.000199467856502144, 'samples': 1212608, 'steps': 2368, 'loss/train': 1.653560757637024} -09/20/2021 22:41:44 - INFO - __main__ - Step 37895: {'lr': 0.000199467856502144, 'samples': 1212640, 'steps': 2368, 'loss/train': 1.6976587772369385} -09/20/2021 22:41:44 - INFO - __main__ - Step 37896: {'lr': 0.000199467856502144, 'samples': 1212672, 'steps': 2368, 'loss/train': 2.508504867553711} -09/20/2021 22:41:45 - INFO - __main__ - Step 37897: {'lr': 0.000199467856502144, 'samples': 1212704, 'steps': 2368, 'loss/train': 3.0768144130706787} -09/20/2021 22:41:46 - INFO - __main__ - Step 37898: {'lr': 0.000199467856502144, 'samples': 1212736, 'steps': 2368, 'loss/train': 2.555922031402588} -09/20/2021 22:41:47 - INFO - __main__ - Step 37899: {'lr': 0.000199467856502144, 'samples': 1212768, 'steps': 2368, 'loss/train': 2.3529906272888184} -09/20/2021 22:41:47 - INFO - __main__ - Step 37900: {'lr': 0.000199467856502144, 'samples': 1212800, 'steps': 2368, 'loss/train': 1.819877028465271} -09/20/2021 22:41:48 - INFO - __main__ - Step 37901: {'lr': 0.000199467856502144, 'samples': 1212832, 'steps': 2368, 'loss/train': 2.3460853099823} -09/20/2021 22:41:49 - INFO - __main__ - Step 37902: {'lr': 0.000199467856502144, 'samples': 1212864, 'steps': 2368, 'loss/train': 3.588068723678589} -09/20/2021 22:41:50 - INFO - __main__ - Step 37903: {'lr': 0.000199467856502144, 'samples': 1212896, 'steps': 2368, 'loss/train': 2.42378568649292} -09/20/2021 22:41:50 - INFO - __main__ - Step 37904: {'lr': 0.000199467856502144, 'samples': 1212928, 'steps': 2368, 'loss/train': 2.753868579864502} -09/20/2021 22:41:51 - INFO - __main__ - Step 37905: {'lr': 0.00019946719910443288, 'samples': 1212960, 'steps': 2369, 'loss/train': 2.097705364227295} -09/20/2021 22:41:52 - INFO - __main__ - Step 37906: {'lr': 0.00019946719910443288, 'samples': 1212992, 'steps': 2369, 'loss/train': 0.14144642651081085} -09/20/2021 22:41:53 - INFO - __main__ - Step 37907: {'lr': 0.00019946719910443288, 'samples': 1213024, 'steps': 2369, 'loss/train': 0.41937708854675293} -09/20/2021 22:41:53 - INFO - __main__ - Step 37908: {'lr': 0.00019946719910443288, 'samples': 1213056, 'steps': 2369, 'loss/train': 0.4272522032260895} -09/20/2021 22:41:54 - INFO - __main__ - Step 37909: {'lr': 0.00019946719910443288, 'samples': 1213088, 'steps': 2369, 'loss/train': 2.9466965198516846} -09/20/2021 22:41:55 - INFO - __main__ - Step 37910: {'lr': 0.00019946719910443288, 'samples': 1213120, 'steps': 2369, 'loss/train': 1.320312261581421} -09/20/2021 22:41:56 - INFO - __main__ - Step 37911: {'lr': 0.00019946719910443288, 'samples': 1213152, 'steps': 2369, 'loss/train': 2.1572413444519043} -09/20/2021 22:41:57 - INFO - __main__ - Step 37912: {'lr': 0.00019946719910443288, 'samples': 1213184, 'steps': 2369, 'loss/train': 2.1537632942199707} -09/20/2021 22:41:57 - INFO - __main__ - Step 37913: {'lr': 0.00019946719910443288, 'samples': 1213216, 'steps': 2369, 'loss/train': 2.5904312133789062} -09/20/2021 22:41:58 - INFO - __main__ - Step 37914: {'lr': 0.00019946719910443288, 'samples': 1213248, 'steps': 2369, 'loss/train': 2.579957962036133} -09/20/2021 22:41:59 - INFO - __main__ - Step 37915: {'lr': 0.00019946719910443288, 'samples': 1213280, 'steps': 2369, 'loss/train': 2.4560739994049072} -09/20/2021 22:42:00 - INFO - __main__ - Step 37916: {'lr': 0.00019946719910443288, 'samples': 1213312, 'steps': 2369, 'loss/train': 2.40339732170105} -09/20/2021 22:42:00 - INFO - __main__ - Step 37917: {'lr': 0.00019946719910443288, 'samples': 1213344, 'steps': 2369, 'loss/train': 1.8939493894577026} -09/20/2021 22:42:02 - INFO - __main__ - Step 37918: {'lr': 0.00019946719910443288, 'samples': 1213376, 'steps': 2369, 'loss/train': 2.468156337738037} -09/20/2021 22:42:02 - INFO - __main__ - Step 37919: {'lr': 0.00019946719910443288, 'samples': 1213408, 'steps': 2369, 'loss/train': 1.4732273817062378} -09/20/2021 22:42:03 - INFO - __main__ - Step 37920: {'lr': 0.00019946719910443288, 'samples': 1213440, 'steps': 2369, 'loss/train': 2.3176307678222656} -09/20/2021 22:42:04 - INFO - __main__ - Step 37921: {'lr': 0.00019946654130199013, 'samples': 1213472, 'steps': 2370, 'loss/train': 1.9512532949447632} -09/20/2021 22:42:05 - INFO - __main__ - Step 37922: {'lr': 0.00019946654130199013, 'samples': 1213504, 'steps': 2370, 'loss/train': 2.692857503890991} -09/20/2021 22:42:06 - INFO - __main__ - Step 37923: {'lr': 0.00019946654130199013, 'samples': 1213536, 'steps': 2370, 'loss/train': 1.9585472345352173} -09/20/2021 22:42:06 - INFO - __main__ - Step 37924: {'lr': 0.00019946654130199013, 'samples': 1213568, 'steps': 2370, 'loss/train': 2.142153024673462} -09/20/2021 22:42:07 - INFO - __main__ - Step 37925: {'lr': 0.00019946654130199013, 'samples': 1213600, 'steps': 2370, 'loss/train': 1.6149617433547974} -09/20/2021 22:42:08 - INFO - __main__ - Step 37926: {'lr': 0.00019946654130199013, 'samples': 1213632, 'steps': 2370, 'loss/train': 1.5101274251937866} -09/20/2021 22:42:09 - INFO - __main__ - Step 37927: {'lr': 0.00019946654130199013, 'samples': 1213664, 'steps': 2370, 'loss/train': 1.7024354934692383} -09/20/2021 22:42:09 - INFO - __main__ - Step 37928: {'lr': 0.00019946654130199013, 'samples': 1213696, 'steps': 2370, 'loss/train': 3.280639171600342} -09/20/2021 22:42:10 - INFO - __main__ - Step 37929: {'lr': 0.00019946654130199013, 'samples': 1213728, 'steps': 2370, 'loss/train': 2.2967281341552734} -09/20/2021 22:42:11 - INFO - __main__ - Step 37930: {'lr': 0.00019946654130199013, 'samples': 1213760, 'steps': 2370, 'loss/train': 1.6311018466949463} -09/20/2021 22:42:12 - INFO - __main__ - Step 37931: {'lr': 0.00019946654130199013, 'samples': 1213792, 'steps': 2370, 'loss/train': 2.4810354709625244} -09/20/2021 22:42:12 - INFO - __main__ - Step 37932: {'lr': 0.00019946654130199013, 'samples': 1213824, 'steps': 2370, 'loss/train': 2.72634220123291} -09/20/2021 22:42:13 - INFO - __main__ - Step 37933: {'lr': 0.00019946654130199013, 'samples': 1213856, 'steps': 2370, 'loss/train': 2.4968032836914062} -09/20/2021 22:42:14 - INFO - __main__ - Step 37934: {'lr': 0.00019946654130199013, 'samples': 1213888, 'steps': 2370, 'loss/train': 2.0866458415985107} -09/20/2021 22:42:15 - INFO - __main__ - Step 37935: {'lr': 0.00019946654130199013, 'samples': 1213920, 'steps': 2370, 'loss/train': 1.656402826309204} -09/20/2021 22:42:15 - INFO - __main__ - Step 37936: {'lr': 0.00019946654130199013, 'samples': 1213952, 'steps': 2370, 'loss/train': 1.8590425252914429} -09/20/2021 22:42:16 - INFO - __main__ - Step 37937: {'lr': 0.0001994658830948184, 'samples': 1213984, 'steps': 2371, 'loss/train': 2.0250277519226074} -09/20/2021 22:42:17 - INFO - __main__ - Step 37938: {'lr': 0.0001994658830948184, 'samples': 1214016, 'steps': 2371, 'loss/train': 2.428302526473999} -09/20/2021 22:42:18 - INFO - __main__ - Step 37939: {'lr': 0.0001994658830948184, 'samples': 1214048, 'steps': 2371, 'loss/train': 2.659227132797241} -09/20/2021 22:42:18 - INFO - __main__ - Step 37940: {'lr': 0.0001994658830948184, 'samples': 1214080, 'steps': 2371, 'loss/train': 1.6066538095474243} -09/20/2021 22:42:19 - INFO - __main__ - Step 37941: {'lr': 0.0001994658830948184, 'samples': 1214112, 'steps': 2371, 'loss/train': 1.1570261716842651} -09/20/2021 22:42:20 - INFO - __main__ - Step 37942: {'lr': 0.0001994658830948184, 'samples': 1214144, 'steps': 2371, 'loss/train': 2.35536789894104} -09/20/2021 22:42:21 - INFO - __main__ - Step 37943: {'lr': 0.0001994658830948184, 'samples': 1214176, 'steps': 2371, 'loss/train': 1.9129648208618164} -09/20/2021 22:42:21 - INFO - __main__ - Step 37944: {'lr': 0.0001994658830948184, 'samples': 1214208, 'steps': 2371, 'loss/train': 0.8649541139602661} -09/20/2021 22:42:22 - INFO - __main__ - Step 37945: {'lr': 0.0001994658830948184, 'samples': 1214240, 'steps': 2371, 'loss/train': 2.474010944366455} -09/20/2021 22:42:23 - INFO - __main__ - Step 37946: {'lr': 0.0001994658830948184, 'samples': 1214272, 'steps': 2371, 'loss/train': 1.6685924530029297} -09/20/2021 22:42:24 - INFO - __main__ - Step 37947: {'lr': 0.0001994658830948184, 'samples': 1214304, 'steps': 2371, 'loss/train': 2.503716230392456} -09/20/2021 22:42:24 - INFO - __main__ - Step 37948: {'lr': 0.0001994658830948184, 'samples': 1214336, 'steps': 2371, 'loss/train': 2.2599263191223145} -09/20/2021 22:42:26 - INFO - __main__ - Step 37949: {'lr': 0.0001994658830948184, 'samples': 1214368, 'steps': 2371, 'loss/train': 2.3796775341033936} -09/20/2021 22:42:26 - INFO - __main__ - Step 37950: {'lr': 0.0001994658830948184, 'samples': 1214400, 'steps': 2371, 'loss/train': 1.8829572200775146} -09/20/2021 22:42:27 - INFO - __main__ - Step 37951: {'lr': 0.0001994658830948184, 'samples': 1214432, 'steps': 2371, 'loss/train': 2.5183510780334473} -09/20/2021 22:42:28 - INFO - __main__ - Step 37952: {'lr': 0.0001994658830948184, 'samples': 1214464, 'steps': 2371, 'loss/train': 2.518653392791748} -09/20/2021 22:42:29 - INFO - __main__ - Step 37953: {'lr': 0.00019946522448292039, 'samples': 1214496, 'steps': 2372, 'loss/train': 1.6538618803024292} -09/20/2021 22:42:30 - INFO - __main__ - Step 37954: {'lr': 0.00019946522448292039, 'samples': 1214528, 'steps': 2372, 'loss/train': 1.9263811111450195} -09/20/2021 22:42:30 - INFO - __main__ - Step 37955: {'lr': 0.00019946522448292039, 'samples': 1214560, 'steps': 2372, 'loss/train': 2.8367230892181396} -09/20/2021 22:42:31 - INFO - __main__ - Step 37956: {'lr': 0.00019946522448292039, 'samples': 1214592, 'steps': 2372, 'loss/train': 1.173738956451416} -09/20/2021 22:42:32 - INFO - __main__ - Step 37957: {'lr': 0.00019946522448292039, 'samples': 1214624, 'steps': 2372, 'loss/train': 1.512326717376709} -09/20/2021 22:42:33 - INFO - __main__ - Step 37958: {'lr': 0.00019946522448292039, 'samples': 1214656, 'steps': 2372, 'loss/train': 2.1177163124084473} -09/20/2021 22:42:33 - INFO - __main__ - Step 37959: {'lr': 0.00019946522448292039, 'samples': 1214688, 'steps': 2372, 'loss/train': 2.609461545944214} -09/20/2021 22:42:34 - INFO - __main__ - Step 37960: {'lr': 0.00019946522448292039, 'samples': 1214720, 'steps': 2372, 'loss/train': 1.3865822553634644} -09/20/2021 22:42:35 - INFO - __main__ - Step 37961: {'lr': 0.00019946522448292039, 'samples': 1214752, 'steps': 2372, 'loss/train': 1.9676709175109863} -09/20/2021 22:42:36 - INFO - __main__ - Step 37962: {'lr': 0.00019946522448292039, 'samples': 1214784, 'steps': 2372, 'loss/train': 2.784796953201294} -09/20/2021 22:42:36 - INFO - __main__ - Step 37963: {'lr': 0.00019946522448292039, 'samples': 1214816, 'steps': 2372, 'loss/train': 2.5885448455810547} -09/20/2021 22:42:37 - INFO - __main__ - Step 37964: {'lr': 0.00019946522448292039, 'samples': 1214848, 'steps': 2372, 'loss/train': 1.7888864278793335} -09/20/2021 22:42:38 - INFO - __main__ - Step 37965: {'lr': 0.00019946522448292039, 'samples': 1214880, 'steps': 2372, 'loss/train': 2.4631290435791016} -09/20/2021 22:42:39 - INFO - __main__ - Step 37966: {'lr': 0.00019946522448292039, 'samples': 1214912, 'steps': 2372, 'loss/train': 2.0685713291168213} -09/20/2021 22:42:39 - INFO - __main__ - Step 37967: {'lr': 0.00019946522448292039, 'samples': 1214944, 'steps': 2372, 'loss/train': 0.6756879091262817} -09/20/2021 22:42:40 - INFO - __main__ - Step 37968: {'lr': 0.00019946522448292039, 'samples': 1214976, 'steps': 2372, 'loss/train': 1.1870639324188232} -09/20/2021 22:42:41 - INFO - __main__ - Step 37969: {'lr': 0.00019946456546629873, 'samples': 1215008, 'steps': 2373, 'loss/train': 2.1128664016723633} -09/20/2021 22:42:42 - INFO - __main__ - Step 37970: {'lr': 0.00019946456546629873, 'samples': 1215040, 'steps': 2373, 'loss/train': 2.213639497756958} -09/20/2021 22:42:42 - INFO - __main__ - Step 37971: {'lr': 0.00019946456546629873, 'samples': 1215072, 'steps': 2373, 'loss/train': 1.5152263641357422} -09/20/2021 22:42:43 - INFO - __main__ - Step 37972: {'lr': 0.00019946456546629873, 'samples': 1215104, 'steps': 2373, 'loss/train': 2.4302971363067627} -09/20/2021 22:42:44 - INFO - __main__ - Step 37973: {'lr': 0.00019946456546629873, 'samples': 1215136, 'steps': 2373, 'loss/train': 1.7009811401367188} -09/20/2021 22:42:45 - INFO - __main__ - Step 37974: {'lr': 0.00019946456546629873, 'samples': 1215168, 'steps': 2373, 'loss/train': 2.564484119415283} -09/20/2021 22:42:45 - INFO - __main__ - Step 37975: {'lr': 0.00019946456546629873, 'samples': 1215200, 'steps': 2373, 'loss/train': 1.5378215312957764} -09/20/2021 22:42:46 - INFO - __main__ - Step 37976: {'lr': 0.00019946456546629873, 'samples': 1215232, 'steps': 2373, 'loss/train': 2.8014140129089355} -09/20/2021 22:42:47 - INFO - __main__ - Step 37977: {'lr': 0.00019946456546629873, 'samples': 1215264, 'steps': 2373, 'loss/train': 2.6796586513519287} -09/20/2021 22:42:48 - INFO - __main__ - Step 37978: {'lr': 0.00019946456546629873, 'samples': 1215296, 'steps': 2373, 'loss/train': 2.472449779510498} -09/20/2021 22:42:49 - INFO - __main__ - Step 37979: {'lr': 0.00019946456546629873, 'samples': 1215328, 'steps': 2373, 'loss/train': 1.980561375617981} -09/20/2021 22:42:50 - INFO - __main__ - Step 37980: {'lr': 0.00019946456546629873, 'samples': 1215360, 'steps': 2373, 'loss/train': 1.0881584882736206} -09/20/2021 22:42:50 - INFO - __main__ - Step 37981: {'lr': 0.00019946456546629873, 'samples': 1215392, 'steps': 2373, 'loss/train': 1.711112141609192} -09/20/2021 22:42:51 - INFO - __main__ - Step 37982: {'lr': 0.00019946456546629873, 'samples': 1215424, 'steps': 2373, 'loss/train': 1.600182056427002} -09/20/2021 22:42:52 - INFO - __main__ - Step 37983: {'lr': 0.00019946456546629873, 'samples': 1215456, 'steps': 2373, 'loss/train': 2.3748018741607666} -09/20/2021 22:42:53 - INFO - __main__ - Step 37984: {'lr': 0.00019946456546629873, 'samples': 1215488, 'steps': 2373, 'loss/train': 2.243413209915161} -09/20/2021 22:42:54 - INFO - __main__ - Step 37985: {'lr': 0.00019946390604495617, 'samples': 1215520, 'steps': 2374, 'loss/train': 1.8305115699768066} -09/20/2021 22:42:54 - INFO - __main__ - Step 37986: {'lr': 0.00019946390604495617, 'samples': 1215552, 'steps': 2374, 'loss/train': 0.5244085192680359} -09/20/2021 22:42:55 - INFO - __main__ - Step 37987: {'lr': 0.00019946390604495617, 'samples': 1215584, 'steps': 2374, 'loss/train': 2.2348411083221436} -09/20/2021 22:42:56 - INFO - __main__ - Step 37988: {'lr': 0.00019946390604495617, 'samples': 1215616, 'steps': 2374, 'loss/train': 2.7033307552337646} -09/20/2021 22:42:57 - INFO - __main__ - Step 37989: {'lr': 0.00019946390604495617, 'samples': 1215648, 'steps': 2374, 'loss/train': 3.4291138648986816} -09/20/2021 22:42:57 - INFO - __main__ - Step 37990: {'lr': 0.00019946390604495617, 'samples': 1215680, 'steps': 2374, 'loss/train': 2.230107307434082} -09/20/2021 22:42:58 - INFO - __main__ - Step 37991: {'lr': 0.00019946390604495617, 'samples': 1215712, 'steps': 2374, 'loss/train': 2.495068073272705} -09/20/2021 22:42:59 - INFO - __main__ - Step 37992: {'lr': 0.00019946390604495617, 'samples': 1215744, 'steps': 2374, 'loss/train': 2.221801519393921} -09/20/2021 22:43:00 - INFO - __main__ - Step 37993: {'lr': 0.00019946390604495617, 'samples': 1215776, 'steps': 2374, 'loss/train': 2.077430486679077} -09/20/2021 22:43:00 - INFO - __main__ - Step 37994: {'lr': 0.00019946390604495617, 'samples': 1215808, 'steps': 2374, 'loss/train': 1.175343632698059} -09/20/2021 22:43:01 - INFO - __main__ - Step 37995: {'lr': 0.00019946390604495617, 'samples': 1215840, 'steps': 2374, 'loss/train': 2.5413482189178467} -09/20/2021 22:43:02 - INFO - __main__ - Step 37996: {'lr': 0.00019946390604495617, 'samples': 1215872, 'steps': 2374, 'loss/train': 1.460758924484253} -09/20/2021 22:43:03 - INFO - __main__ - Step 37997: {'lr': 0.00019946390604495617, 'samples': 1215904, 'steps': 2374, 'loss/train': 2.509611129760742} -09/20/2021 22:43:03 - INFO - __main__ - Step 37998: {'lr': 0.00019946390604495617, 'samples': 1215936, 'steps': 2374, 'loss/train': 2.1883087158203125} -09/20/2021 22:43:04 - INFO - __main__ - Step 37999: {'lr': 0.00019946390604495617, 'samples': 1215968, 'steps': 2374, 'loss/train': 1.541595220565796} -09/20/2021 22:43:05 - INFO - __main__ - Step 38000: {'lr': 0.00019946390604495617, 'samples': 1216000, 'steps': 2374, 'loss/train': 1.2594845294952393} -09/20/2021 22:43:06 - INFO - __main__ - Step 38001: {'lr': 0.00019946324621889535, 'samples': 1216032, 'steps': 2375, 'loss/train': 2.835869312286377} -09/20/2021 22:43:06 - INFO - __main__ - Step 38002: {'lr': 0.00019946324621889535, 'samples': 1216064, 'steps': 2375, 'loss/train': 1.6464574337005615} -09/20/2021 22:43:07 - INFO - __main__ - Step 38003: {'lr': 0.00019946324621889535, 'samples': 1216096, 'steps': 2375, 'loss/train': 1.878480315208435} -09/20/2021 22:43:08 - INFO - __main__ - Step 38004: {'lr': 0.00019946324621889535, 'samples': 1216128, 'steps': 2375, 'loss/train': 3.1977310180664062} -09/20/2021 22:43:09 - INFO - __main__ - Step 38005: {'lr': 0.00019946324621889535, 'samples': 1216160, 'steps': 2375, 'loss/train': 2.7171802520751953} -09/20/2021 22:43:09 - INFO - __main__ - Step 38006: {'lr': 0.00019946324621889535, 'samples': 1216192, 'steps': 2375, 'loss/train': 2.335264205932617} -09/20/2021 22:43:10 - INFO - __main__ - Step 38007: {'lr': 0.00019946324621889535, 'samples': 1216224, 'steps': 2375, 'loss/train': 2.498325824737549} -09/20/2021 22:43:11 - INFO - __main__ - Step 38008: {'lr': 0.00019946324621889535, 'samples': 1216256, 'steps': 2375, 'loss/train': 1.8992623090744019} -09/20/2021 22:43:12 - INFO - __main__ - Step 38009: {'lr': 0.00019946324621889535, 'samples': 1216288, 'steps': 2375, 'loss/train': 2.2317118644714355} -09/20/2021 22:43:13 - INFO - __main__ - Step 38010: {'lr': 0.00019946324621889535, 'samples': 1216320, 'steps': 2375, 'loss/train': 2.1563925743103027} -09/20/2021 22:43:14 - INFO - __main__ - Step 38011: {'lr': 0.00019946324621889535, 'samples': 1216352, 'steps': 2375, 'loss/train': 2.265622138977051} -09/20/2021 22:43:14 - INFO - __main__ - Step 38012: {'lr': 0.00019946324621889535, 'samples': 1216384, 'steps': 2375, 'loss/train': 1.8325330018997192} -09/20/2021 22:43:15 - INFO - __main__ - Step 38013: {'lr': 0.00019946324621889535, 'samples': 1216416, 'steps': 2375, 'loss/train': 2.5710582733154297} -09/20/2021 22:43:16 - INFO - __main__ - Step 38014: {'lr': 0.00019946324621889535, 'samples': 1216448, 'steps': 2375, 'loss/train': 1.2302711009979248} -09/20/2021 22:43:17 - INFO - __main__ - Step 38015: {'lr': 0.00019946324621889535, 'samples': 1216480, 'steps': 2375, 'loss/train': 0.8668976426124573} -09/20/2021 22:43:17 - INFO - __main__ - Step 38016: {'lr': 0.00019946324621889535, 'samples': 1216512, 'steps': 2375, 'loss/train': 3.5269172191619873} -09/20/2021 22:43:18 - INFO - __main__ - Step 38017: {'lr': 0.00019946258598811897, 'samples': 1216544, 'steps': 2376, 'loss/train': 2.0426933765411377} -09/20/2021 22:43:19 - INFO - __main__ - Step 38018: {'lr': 0.00019946258598811897, 'samples': 1216576, 'steps': 2376, 'loss/train': 1.5866389274597168} -09/20/2021 22:43:20 - INFO - __main__ - Step 38019: {'lr': 0.00019946258598811897, 'samples': 1216608, 'steps': 2376, 'loss/train': 1.4382377862930298} -09/20/2021 22:43:21 - INFO - __main__ - Step 38020: {'lr': 0.00019946258598811897, 'samples': 1216640, 'steps': 2376, 'loss/train': 1.924060344696045} -09/20/2021 22:43:21 - INFO - __main__ - Step 38021: {'lr': 0.00019946258598811897, 'samples': 1216672, 'steps': 2376, 'loss/train': 2.571850538253784} -09/20/2021 22:43:22 - INFO - __main__ - Step 38022: {'lr': 0.00019946258598811897, 'samples': 1216704, 'steps': 2376, 'loss/train': 2.721968412399292} -09/20/2021 22:43:23 - INFO - __main__ - Step 38023: {'lr': 0.00019946258598811897, 'samples': 1216736, 'steps': 2376, 'loss/train': 1.8163479566574097} -09/20/2021 22:43:24 - INFO - __main__ - Step 38024: {'lr': 0.00019946258598811897, 'samples': 1216768, 'steps': 2376, 'loss/train': 2.0873172283172607} -09/20/2021 22:43:24 - INFO - __main__ - Step 38025: {'lr': 0.00019946258598811897, 'samples': 1216800, 'steps': 2376, 'loss/train': 2.155305862426758} -09/20/2021 22:43:25 - INFO - __main__ - Step 38026: {'lr': 0.00019946258598811897, 'samples': 1216832, 'steps': 2376, 'loss/train': 1.9822413921356201} -09/20/2021 22:43:26 - INFO - __main__ - Step 38027: {'lr': 0.00019946258598811897, 'samples': 1216864, 'steps': 2376, 'loss/train': 1.2322059869766235} -09/20/2021 22:43:27 - INFO - __main__ - Step 38028: {'lr': 0.00019946258598811897, 'samples': 1216896, 'steps': 2376, 'loss/train': 2.181455612182617} -09/20/2021 22:43:27 - INFO - __main__ - Step 38029: {'lr': 0.00019946258598811897, 'samples': 1216928, 'steps': 2376, 'loss/train': 1.52262544631958} -09/20/2021 22:43:28 - INFO - __main__ - Step 38030: {'lr': 0.00019946258598811897, 'samples': 1216960, 'steps': 2376, 'loss/train': 2.3264102935791016} -09/20/2021 22:43:29 - INFO - __main__ - Step 38031: {'lr': 0.00019946258598811897, 'samples': 1216992, 'steps': 2376, 'loss/train': 2.081554651260376} -09/20/2021 22:43:30 - INFO - __main__ - Step 38032: {'lr': 0.00019946258598811897, 'samples': 1217024, 'steps': 2376, 'loss/train': 2.197190046310425} -09/20/2021 22:43:31 - INFO - __main__ - Step 38033: {'lr': 0.00019946192535262973, 'samples': 1217056, 'steps': 2377, 'loss/train': 1.8735281229019165} -09/20/2021 22:43:31 - INFO - __main__ - Step 38034: {'lr': 0.00019946192535262973, 'samples': 1217088, 'steps': 2377, 'loss/train': 2.1368861198425293} -09/20/2021 22:43:32 - INFO - __main__ - Step 38035: {'lr': 0.00019946192535262973, 'samples': 1217120, 'steps': 2377, 'loss/train': 0.7794325947761536} -09/20/2021 22:43:33 - INFO - __main__ - Step 38036: {'lr': 0.00019946192535262973, 'samples': 1217152, 'steps': 2377, 'loss/train': 2.0943500995635986} -09/20/2021 22:43:34 - INFO - __main__ - Step 38037: {'lr': 0.00019946192535262973, 'samples': 1217184, 'steps': 2377, 'loss/train': 1.5985196828842163} -09/20/2021 22:43:34 - INFO - __main__ - Step 38038: {'lr': 0.00019946192535262973, 'samples': 1217216, 'steps': 2377, 'loss/train': 2.339979410171509} -09/20/2021 22:43:35 - INFO - __main__ - Step 38039: {'lr': 0.00019946192535262973, 'samples': 1217248, 'steps': 2377, 'loss/train': 1.678371787071228} -09/20/2021 22:43:36 - INFO - __main__ - Step 38040: {'lr': 0.00019946192535262973, 'samples': 1217280, 'steps': 2377, 'loss/train': 2.44594407081604} -09/20/2021 22:43:37 - INFO - __main__ - Step 38041: {'lr': 0.00019946192535262973, 'samples': 1217312, 'steps': 2377, 'loss/train': 0.7460276484489441} -09/20/2021 22:43:38 - INFO - __main__ - Step 38042: {'lr': 0.00019946192535262973, 'samples': 1217344, 'steps': 2377, 'loss/train': 0.7910380363464355} -09/20/2021 22:43:39 - INFO - __main__ - Step 38043: {'lr': 0.00019946192535262973, 'samples': 1217376, 'steps': 2377, 'loss/train': 2.5597870349884033} -09/20/2021 22:43:40 - INFO - __main__ - Step 38044: {'lr': 0.00019946192535262973, 'samples': 1217408, 'steps': 2377, 'loss/train': 1.9693647623062134} -09/20/2021 22:43:40 - INFO - __main__ - Step 38045: {'lr': 0.00019946192535262973, 'samples': 1217440, 'steps': 2377, 'loss/train': 0.21815557777881622} -09/20/2021 22:43:41 - INFO - __main__ - Step 38046: {'lr': 0.00019946192535262973, 'samples': 1217472, 'steps': 2377, 'loss/train': 0.25391247868537903} -09/20/2021 22:43:42 - INFO - __main__ - Step 38047: {'lr': 0.00019946192535262973, 'samples': 1217504, 'steps': 2377, 'loss/train': 0.21522961556911469} -09/20/2021 22:43:43 - INFO - __main__ - Step 38048: {'lr': 0.00019946192535262973, 'samples': 1217536, 'steps': 2377, 'loss/train': 2.539867639541626} -09/20/2021 22:43:44 - INFO - __main__ - Step 38049: {'lr': 0.0001994612643124303, 'samples': 1217568, 'steps': 2378, 'loss/train': 2.72778582572937} -09/20/2021 22:43:44 - INFO - __main__ - Step 38050: {'lr': 0.0001994612643124303, 'samples': 1217600, 'steps': 2378, 'loss/train': 2.5705690383911133} -09/20/2021 22:43:45 - INFO - __main__ - Step 38051: {'lr': 0.0001994612643124303, 'samples': 1217632, 'steps': 2378, 'loss/train': 2.4356324672698975} -09/20/2021 22:43:46 - INFO - __main__ - Step 38052: {'lr': 0.0001994612643124303, 'samples': 1217664, 'steps': 2378, 'loss/train': 1.4723198413848877} -09/20/2021 22:43:47 - INFO - __main__ - Step 38053: {'lr': 0.0001994612643124303, 'samples': 1217696, 'steps': 2378, 'loss/train': 2.388178825378418} -09/20/2021 22:43:47 - INFO - __main__ - Step 38054: {'lr': 0.0001994612643124303, 'samples': 1217728, 'steps': 2378, 'loss/train': 3.108919143676758} -09/20/2021 22:43:48 - INFO - __main__ - Step 38055: {'lr': 0.0001994612643124303, 'samples': 1217760, 'steps': 2378, 'loss/train': 2.582123041152954} -09/20/2021 22:43:49 - INFO - __main__ - Step 38056: {'lr': 0.0001994612643124303, 'samples': 1217792, 'steps': 2378, 'loss/train': 1.1762568950653076} -09/20/2021 22:43:50 - INFO - __main__ - Step 38057: {'lr': 0.0001994612643124303, 'samples': 1217824, 'steps': 2378, 'loss/train': 3.1609578132629395} -09/20/2021 22:43:50 - INFO - __main__ - Step 38058: {'lr': 0.0001994612643124303, 'samples': 1217856, 'steps': 2378, 'loss/train': 1.3009446859359741} -09/20/2021 22:43:51 - INFO - __main__ - Step 38059: {'lr': 0.0001994612643124303, 'samples': 1217888, 'steps': 2378, 'loss/train': 1.1217306852340698} -09/20/2021 22:43:52 - INFO - __main__ - Step 38060: {'lr': 0.0001994612643124303, 'samples': 1217920, 'steps': 2378, 'loss/train': 1.5797443389892578} -09/20/2021 22:43:53 - INFO - __main__ - Step 38061: {'lr': 0.0001994612643124303, 'samples': 1217952, 'steps': 2378, 'loss/train': 2.7280824184417725} -09/20/2021 22:43:53 - INFO - __main__ - Step 38062: {'lr': 0.0001994612643124303, 'samples': 1217984, 'steps': 2378, 'loss/train': 2.410473346710205} -09/20/2021 22:43:54 - INFO - __main__ - Step 38063: {'lr': 0.0001994612643124303, 'samples': 1218016, 'steps': 2378, 'loss/train': 1.8440724611282349} -09/20/2021 22:43:55 - INFO - __main__ - Step 38064: {'lr': 0.0001994612643124303, 'samples': 1218048, 'steps': 2378, 'loss/train': 1.599223017692566} -09/20/2021 22:43:56 - INFO - __main__ - Step 38065: {'lr': 0.00019946060286752334, 'samples': 1218080, 'steps': 2379, 'loss/train': 1.6883114576339722} -09/20/2021 22:43:56 - INFO - __main__ - Step 38066: {'lr': 0.00019946060286752334, 'samples': 1218112, 'steps': 2379, 'loss/train': 1.9688208103179932} -09/20/2021 22:43:57 - INFO - __main__ - Step 38067: {'lr': 0.00019946060286752334, 'samples': 1218144, 'steps': 2379, 'loss/train': 2.2137486934661865} -09/20/2021 22:43:58 - INFO - __main__ - Step 38068: {'lr': 0.00019946060286752334, 'samples': 1218176, 'steps': 2379, 'loss/train': 3.3852732181549072} -09/20/2021 22:43:59 - INFO - __main__ - Step 38069: {'lr': 0.00019946060286752334, 'samples': 1218208, 'steps': 2379, 'loss/train': 1.6489890813827515} -09/20/2021 22:43:59 - INFO - __main__ - Step 38070: {'lr': 0.00019946060286752334, 'samples': 1218240, 'steps': 2379, 'loss/train': 0.6231203079223633} -09/20/2021 22:44:00 - INFO - __main__ - Step 38071: {'lr': 0.00019946060286752334, 'samples': 1218272, 'steps': 2379, 'loss/train': 0.5225957632064819} -09/20/2021 22:44:01 - INFO - __main__ - Step 38072: {'lr': 0.00019946060286752334, 'samples': 1218304, 'steps': 2379, 'loss/train': 0.546221911907196} -09/20/2021 22:44:02 - INFO - __main__ - Step 38073: {'lr': 0.00019946060286752334, 'samples': 1218336, 'steps': 2379, 'loss/train': 0.2888262867927551} -09/20/2021 22:44:02 - INFO - __main__ - Step 38074: {'lr': 0.00019946060286752334, 'samples': 1218368, 'steps': 2379, 'loss/train': 0.5076727867126465} -09/20/2021 22:44:03 - INFO - __main__ - Step 38075: {'lr': 0.00019946060286752334, 'samples': 1218400, 'steps': 2379, 'loss/train': 0.15865080058574677} -09/20/2021 22:44:05 - INFO - __main__ - Step 38076: {'lr': 0.00019946060286752334, 'samples': 1218432, 'steps': 2379, 'loss/train': 0.5187078714370728} -09/20/2021 22:44:06 - INFO - __main__ - Step 38077: {'lr': 0.00019946060286752334, 'samples': 1218464, 'steps': 2379, 'loss/train': 2.0390844345092773} -09/20/2021 22:44:06 - INFO - __main__ - Step 38078: {'lr': 0.00019946060286752334, 'samples': 1218496, 'steps': 2379, 'loss/train': 0.15519648790359497} -09/20/2021 22:44:07 - INFO - __main__ - Step 38079: {'lr': 0.00019946060286752334, 'samples': 1218528, 'steps': 2379, 'loss/train': 0.15139934420585632} -09/20/2021 22:44:08 - INFO - __main__ - Step 38080: {'lr': 0.00019946060286752334, 'samples': 1218560, 'steps': 2379, 'loss/train': 1.523316502571106} -09/20/2021 22:44:09 - INFO - __main__ - Step 38081: {'lr': 0.0001994599410179116, 'samples': 1218592, 'steps': 2380, 'loss/train': 0.4972608685493469} -09/20/2021 22:44:09 - INFO - __main__ - Step 38082: {'lr': 0.0001994599410179116, 'samples': 1218624, 'steps': 2380, 'loss/train': 3.0683579444885254} -09/20/2021 22:44:10 - INFO - __main__ - Step 38083: {'lr': 0.0001994599410179116, 'samples': 1218656, 'steps': 2380, 'loss/train': 2.8465323448181152} -09/20/2021 22:44:11 - INFO - __main__ - Step 38084: {'lr': 0.0001994599410179116, 'samples': 1218688, 'steps': 2380, 'loss/train': 2.2597479820251465} -09/20/2021 22:44:12 - INFO - __main__ - Step 38085: {'lr': 0.0001994599410179116, 'samples': 1218720, 'steps': 2380, 'loss/train': 0.8877872228622437} -09/20/2021 22:44:12 - INFO - __main__ - Step 38086: {'lr': 0.0001994599410179116, 'samples': 1218752, 'steps': 2380, 'loss/train': 0.7662012577056885} -09/20/2021 22:44:13 - INFO - __main__ - Step 38087: {'lr': 0.0001994599410179116, 'samples': 1218784, 'steps': 2380, 'loss/train': 0.8977095484733582} -09/20/2021 22:44:14 - INFO - __main__ - Step 38088: {'lr': 0.0001994599410179116, 'samples': 1218816, 'steps': 2380, 'loss/train': 1.3162695169448853} -09/20/2021 22:44:15 - INFO - __main__ - Step 38089: {'lr': 0.0001994599410179116, 'samples': 1218848, 'steps': 2380, 'loss/train': 2.1380398273468018} -09/20/2021 22:44:15 - INFO - __main__ - Step 38090: {'lr': 0.0001994599410179116, 'samples': 1218880, 'steps': 2380, 'loss/train': 0.25117143988609314} -09/20/2021 22:44:16 - INFO - __main__ - Step 38091: {'lr': 0.0001994599410179116, 'samples': 1218912, 'steps': 2380, 'loss/train': 0.3958739936351776} -09/20/2021 22:44:17 - INFO - __main__ - Step 38092: {'lr': 0.0001994599410179116, 'samples': 1218944, 'steps': 2380, 'loss/train': 0.18870079517364502} -09/20/2021 22:44:18 - INFO - __main__ - Step 38093: {'lr': 0.0001994599410179116, 'samples': 1218976, 'steps': 2380, 'loss/train': 1.7648885250091553} -09/20/2021 22:44:18 - INFO - __main__ - Step 38094: {'lr': 0.0001994599410179116, 'samples': 1219008, 'steps': 2380, 'loss/train': 2.8655645847320557} -09/20/2021 22:44:19 - INFO - __main__ - Step 38095: {'lr': 0.0001994599410179116, 'samples': 1219040, 'steps': 2380, 'loss/train': 2.7190845012664795} -09/20/2021 22:44:20 - INFO - __main__ - Step 38096: {'lr': 0.0001994599410179116, 'samples': 1219072, 'steps': 2380, 'loss/train': 0.927524745464325} -09/20/2021 22:44:21 - INFO - __main__ - Step 38097: {'lr': 0.00019945927876359774, 'samples': 1219104, 'steps': 2381, 'loss/train': 2.3281397819519043} -09/20/2021 22:44:22 - INFO - __main__ - Step 38098: {'lr': 0.00019945927876359774, 'samples': 1219136, 'steps': 2381, 'loss/train': 0.1410224735736847} -09/20/2021 22:44:22 - INFO - __main__ - Step 38099: {'lr': 0.00019945927876359774, 'samples': 1219168, 'steps': 2381, 'loss/train': 0.2685947120189667} -09/20/2021 22:44:23 - INFO - __main__ - Step 38100: {'lr': 0.00019945927876359774, 'samples': 1219200, 'steps': 2381, 'loss/train': 0.13666878640651703} -09/20/2021 22:44:24 - INFO - __main__ - Step 38101: {'lr': 0.00019945927876359774, 'samples': 1219232, 'steps': 2381, 'loss/train': 0.15465639531612396} -09/20/2021 22:44:25 - INFO - __main__ - Step 38102: {'lr': 0.00019945927876359774, 'samples': 1219264, 'steps': 2381, 'loss/train': 0.25261569023132324} -09/20/2021 22:44:25 - INFO - __main__ - Step 38103: {'lr': 0.00019945927876359774, 'samples': 1219296, 'steps': 2381, 'loss/train': 1.3744843006134033} -09/20/2021 22:44:26 - INFO - __main__ - Step 38104: {'lr': 0.00019945927876359774, 'samples': 1219328, 'steps': 2381, 'loss/train': 1.328797698020935} -09/20/2021 22:44:27 - INFO - __main__ - Step 38105: {'lr': 0.00019945927876359774, 'samples': 1219360, 'steps': 2381, 'loss/train': 1.3724608421325684} -09/20/2021 22:44:28 - INFO - __main__ - Step 38106: {'lr': 0.00019945927876359774, 'samples': 1219392, 'steps': 2381, 'loss/train': 1.3407618999481201} -09/20/2021 22:44:28 - INFO - __main__ - Step 38107: {'lr': 0.00019945927876359774, 'samples': 1219424, 'steps': 2381, 'loss/train': 2.4842236042022705} -09/20/2021 22:44:30 - INFO - __main__ - Step 38108: {'lr': 0.00019945927876359774, 'samples': 1219456, 'steps': 2381, 'loss/train': 1.9891993999481201} -09/20/2021 22:44:30 - INFO - __main__ - Step 38109: {'lr': 0.00019945927876359774, 'samples': 1219488, 'steps': 2381, 'loss/train': 1.6354715824127197} -09/20/2021 22:44:31 - INFO - __main__ - Step 38110: {'lr': 0.00019945927876359774, 'samples': 1219520, 'steps': 2381, 'loss/train': 2.5806336402893066} -09/20/2021 22:44:32 - INFO - __main__ - Step 38111: {'lr': 0.00019945927876359774, 'samples': 1219552, 'steps': 2381, 'loss/train': 0.7468742728233337} -09/20/2021 22:44:33 - INFO - __main__ - Step 38112: {'lr': 0.00019945927876359774, 'samples': 1219584, 'steps': 2381, 'loss/train': 2.171156644821167} -09/20/2021 22:44:33 - INFO - __main__ - Step 38113: {'lr': 0.00019945861610458446, 'samples': 1219616, 'steps': 2382, 'loss/train': 2.8337748050689697} -09/20/2021 22:44:34 - INFO - __main__ - Step 38114: {'lr': 0.00019945861610458446, 'samples': 1219648, 'steps': 2382, 'loss/train': 1.6818897724151611} -09/20/2021 22:44:35 - INFO - __main__ - Step 38115: {'lr': 0.00019945861610458446, 'samples': 1219680, 'steps': 2382, 'loss/train': 2.389758825302124} -09/20/2021 22:44:36 - INFO - __main__ - Step 38116: {'lr': 0.00019945861610458446, 'samples': 1219712, 'steps': 2382, 'loss/train': 2.3430068492889404} -09/20/2021 22:44:36 - INFO - __main__ - Step 38117: {'lr': 0.00019945861610458446, 'samples': 1219744, 'steps': 2382, 'loss/train': 3.2272262573242188} -09/20/2021 22:44:37 - INFO - __main__ - Step 38118: {'lr': 0.00019945861610458446, 'samples': 1219776, 'steps': 2382, 'loss/train': 2.503911018371582} -09/20/2021 22:44:38 - INFO - __main__ - Step 38119: {'lr': 0.00019945861610458446, 'samples': 1219808, 'steps': 2382, 'loss/train': 2.994560718536377} -09/20/2021 22:44:39 - INFO - __main__ - Step 38120: {'lr': 0.00019945861610458446, 'samples': 1219840, 'steps': 2382, 'loss/train': 2.2343201637268066} -09/20/2021 22:44:39 - INFO - __main__ - Step 38121: {'lr': 0.00019945861610458446, 'samples': 1219872, 'steps': 2382, 'loss/train': 1.406255841255188} -09/20/2021 22:44:40 - INFO - __main__ - Step 38122: {'lr': 0.00019945861610458446, 'samples': 1219904, 'steps': 2382, 'loss/train': 1.6653523445129395} -09/20/2021 22:44:41 - INFO - __main__ - Step 38123: {'lr': 0.00019945861610458446, 'samples': 1219936, 'steps': 2382, 'loss/train': 1.1333649158477783} -09/20/2021 22:44:42 - INFO - __main__ - Step 38124: {'lr': 0.00019945861610458446, 'samples': 1219968, 'steps': 2382, 'loss/train': 2.535858631134033} -09/20/2021 22:44:42 - INFO - __main__ - Step 38125: {'lr': 0.00019945861610458446, 'samples': 1220000, 'steps': 2382, 'loss/train': 1.2581820487976074} -09/20/2021 22:44:43 - INFO - __main__ - Step 38126: {'lr': 0.00019945861610458446, 'samples': 1220032, 'steps': 2382, 'loss/train': 0.5744725465774536} -09/20/2021 22:44:44 - INFO - __main__ - Step 38127: {'lr': 0.00019945861610458446, 'samples': 1220064, 'steps': 2382, 'loss/train': 2.413151741027832} -09/20/2021 22:44:45 - INFO - __main__ - Step 38128: {'lr': 0.00019945861610458446, 'samples': 1220096, 'steps': 2382, 'loss/train': 3.2931840419769287} -09/20/2021 22:44:46 - INFO - __main__ - Step 38129: {'lr': 0.00019945795304087443, 'samples': 1220128, 'steps': 2383, 'loss/train': 1.6219024658203125} -09/20/2021 22:44:46 - INFO - __main__ - Step 38130: {'lr': 0.00019945795304087443, 'samples': 1220160, 'steps': 2383, 'loss/train': 2.3529984951019287} -09/20/2021 22:44:47 - INFO - __main__ - Step 38131: {'lr': 0.00019945795304087443, 'samples': 1220192, 'steps': 2383, 'loss/train': 2.084503412246704} -09/20/2021 22:44:48 - INFO - __main__ - Step 38132: {'lr': 0.00019945795304087443, 'samples': 1220224, 'steps': 2383, 'loss/train': 1.054067611694336} -09/20/2021 22:44:49 - INFO - __main__ - Step 38133: {'lr': 0.00019945795304087443, 'samples': 1220256, 'steps': 2383, 'loss/train': 2.5468320846557617} -09/20/2021 22:44:49 - INFO - __main__ - Step 38134: {'lr': 0.00019945795304087443, 'samples': 1220288, 'steps': 2383, 'loss/train': 1.8927732706069946} -09/20/2021 22:44:50 - INFO - __main__ - Step 38135: {'lr': 0.00019945795304087443, 'samples': 1220320, 'steps': 2383, 'loss/train': 2.2015938758850098} -09/20/2021 22:44:51 - INFO - __main__ - Step 38136: {'lr': 0.00019945795304087443, 'samples': 1220352, 'steps': 2383, 'loss/train': 2.2161343097686768} -09/20/2021 22:44:52 - INFO - __main__ - Step 38137: {'lr': 0.00019945795304087443, 'samples': 1220384, 'steps': 2383, 'loss/train': 2.406304359436035} -09/20/2021 22:44:53 - INFO - __main__ - Step 38138: {'lr': 0.00019945795304087443, 'samples': 1220416, 'steps': 2383, 'loss/train': 2.556103467941284} -09/20/2021 22:44:54 - INFO - __main__ - Step 38139: {'lr': 0.00019945795304087443, 'samples': 1220448, 'steps': 2383, 'loss/train': 1.8432245254516602} -09/20/2021 22:44:55 - INFO - __main__ - Step 38140: {'lr': 0.00019945795304087443, 'samples': 1220480, 'steps': 2383, 'loss/train': 1.3835740089416504} -09/20/2021 22:44:56 - INFO - __main__ - Step 38141: {'lr': 0.00019945795304087443, 'samples': 1220512, 'steps': 2383, 'loss/train': 2.7063207626342773} -09/20/2021 22:44:56 - INFO - __main__ - Step 38142: {'lr': 0.00019945795304087443, 'samples': 1220544, 'steps': 2383, 'loss/train': 2.5345442295074463} -09/20/2021 22:44:57 - INFO - __main__ - Step 38143: {'lr': 0.00019945795304087443, 'samples': 1220576, 'steps': 2383, 'loss/train': 1.5200588703155518} -09/20/2021 22:44:58 - INFO - __main__ - Step 38144: {'lr': 0.00019945795304087443, 'samples': 1220608, 'steps': 2383, 'loss/train': 1.7270742654800415} -09/20/2021 22:44:59 - INFO - __main__ - Step 38145: {'lr': 0.00019945728957247044, 'samples': 1220640, 'steps': 2384, 'loss/train': 1.3940118551254272} -09/20/2021 22:45:00 - INFO - __main__ - Step 38146: {'lr': 0.00019945728957247044, 'samples': 1220672, 'steps': 2384, 'loss/train': 2.399733543395996} -09/20/2021 22:45:00 - INFO - __main__ - Step 38147: {'lr': 0.00019945728957247044, 'samples': 1220704, 'steps': 2384, 'loss/train': 1.7890444993972778} -09/20/2021 22:45:01 - INFO - __main__ - Step 38148: {'lr': 0.00019945728957247044, 'samples': 1220736, 'steps': 2384, 'loss/train': 2.556424140930176} -09/20/2021 22:45:02 - INFO - __main__ - Step 38149: {'lr': 0.00019945728957247044, 'samples': 1220768, 'steps': 2384, 'loss/train': 2.5361530780792236} -09/20/2021 22:45:03 - INFO - __main__ - Step 38150: {'lr': 0.00019945728957247044, 'samples': 1220800, 'steps': 2384, 'loss/train': 2.216306209564209} -09/20/2021 22:45:03 - INFO - __main__ - Step 38151: {'lr': 0.00019945728957247044, 'samples': 1220832, 'steps': 2384, 'loss/train': 1.3439298868179321} -09/20/2021 22:45:04 - INFO - __main__ - Step 38152: {'lr': 0.00019945728957247044, 'samples': 1220864, 'steps': 2384, 'loss/train': 2.88555645942688} -09/20/2021 22:45:05 - INFO - __main__ - Step 38153: {'lr': 0.00019945728957247044, 'samples': 1220896, 'steps': 2384, 'loss/train': 2.5502376556396484} -09/20/2021 22:45:06 - INFO - __main__ - Step 38154: {'lr': 0.00019945728957247044, 'samples': 1220928, 'steps': 2384, 'loss/train': 0.8575791716575623} -09/20/2021 22:45:06 - INFO - __main__ - Step 38155: {'lr': 0.00019945728957247044, 'samples': 1220960, 'steps': 2384, 'loss/train': 2.2389795780181885} -09/20/2021 22:45:07 - INFO - __main__ - Step 38156: {'lr': 0.00019945728957247044, 'samples': 1220992, 'steps': 2384, 'loss/train': 2.0800909996032715} -09/20/2021 22:45:08 - INFO - __main__ - Step 38157: {'lr': 0.00019945728957247044, 'samples': 1221024, 'steps': 2384, 'loss/train': 2.5105319023132324} -09/20/2021 22:45:09 - INFO - __main__ - Step 38158: {'lr': 0.00019945728957247044, 'samples': 1221056, 'steps': 2384, 'loss/train': 1.7920852899551392} -09/20/2021 22:45:09 - INFO - __main__ - Step 38159: {'lr': 0.00019945728957247044, 'samples': 1221088, 'steps': 2384, 'loss/train': 1.9336161613464355} -09/20/2021 22:45:10 - INFO - __main__ - Step 38160: {'lr': 0.00019945728957247044, 'samples': 1221120, 'steps': 2384, 'loss/train': 1.8943614959716797} -09/20/2021 22:45:11 - INFO - __main__ - Step 38161: {'lr': 0.00019945662569937505, 'samples': 1221152, 'steps': 2385, 'loss/train': 2.1333584785461426} -09/20/2021 22:45:12 - INFO - __main__ - Step 38162: {'lr': 0.00019945662569937505, 'samples': 1221184, 'steps': 2385, 'loss/train': 2.1660470962524414} -09/20/2021 22:45:12 - INFO - __main__ - Step 38163: {'lr': 0.00019945662569937505, 'samples': 1221216, 'steps': 2385, 'loss/train': 2.1468489170074463} -09/20/2021 22:45:13 - INFO - __main__ - Step 38164: {'lr': 0.00019945662569937505, 'samples': 1221248, 'steps': 2385, 'loss/train': 2.111912727355957} -09/20/2021 22:45:14 - INFO - __main__ - Step 38165: {'lr': 0.00019945662569937505, 'samples': 1221280, 'steps': 2385, 'loss/train': 2.1459763050079346} -09/20/2021 22:45:15 - INFO - __main__ - Step 38166: {'lr': 0.00019945662569937505, 'samples': 1221312, 'steps': 2385, 'loss/train': 2.133540391921997} -09/20/2021 22:45:15 - INFO - __main__ - Step 38167: {'lr': 0.00019945662569937505, 'samples': 1221344, 'steps': 2385, 'loss/train': 2.0970828533172607} -09/20/2021 22:45:16 - INFO - __main__ - Step 38168: {'lr': 0.00019945662569937505, 'samples': 1221376, 'steps': 2385, 'loss/train': 2.14831280708313} -09/20/2021 22:45:17 - INFO - __main__ - Step 38169: {'lr': 0.00019945662569937505, 'samples': 1221408, 'steps': 2385, 'loss/train': 2.314727544784546} -09/20/2021 22:45:18 - INFO - __main__ - Step 38170: {'lr': 0.00019945662569937505, 'samples': 1221440, 'steps': 2385, 'loss/train': 0.910568356513977} -09/20/2021 22:45:18 - INFO - __main__ - Step 38171: {'lr': 0.00019945662569937505, 'samples': 1221472, 'steps': 2385, 'loss/train': 1.7531037330627441} -09/20/2021 22:45:19 - INFO - __main__ - Step 38172: {'lr': 0.00019945662569937505, 'samples': 1221504, 'steps': 2385, 'loss/train': 2.241570234298706} -09/20/2021 22:45:20 - INFO - __main__ - Step 38173: {'lr': 0.00019945662569937505, 'samples': 1221536, 'steps': 2385, 'loss/train': 2.2233097553253174} -09/20/2021 22:45:21 - INFO - __main__ - Step 38174: {'lr': 0.00019945662569937505, 'samples': 1221568, 'steps': 2385, 'loss/train': 2.6405696868896484} -09/20/2021 22:45:21 - INFO - __main__ - Step 38175: {'lr': 0.00019945662569937505, 'samples': 1221600, 'steps': 2385, 'loss/train': 0.3035544455051422} -09/20/2021 22:45:22 - INFO - __main__ - Step 38176: {'lr': 0.00019945662569937505, 'samples': 1221632, 'steps': 2385, 'loss/train': 0.2903272211551666} -09/20/2021 22:45:23 - INFO - __main__ - Step 38177: {'lr': 0.0001994559614215911, 'samples': 1221664, 'steps': 2386, 'loss/train': 0.3815220594406128} -09/20/2021 22:45:24 - INFO - __main__ - Step 38178: {'lr': 0.0001994559614215911, 'samples': 1221696, 'steps': 2386, 'loss/train': 0.1855926364660263} -09/20/2021 22:45:25 - INFO - __main__ - Step 38179: {'lr': 0.0001994559614215911, 'samples': 1221728, 'steps': 2386, 'loss/train': 0.19120430946350098} -09/20/2021 22:45:25 - INFO - __main__ - Step 38180: {'lr': 0.0001994559614215911, 'samples': 1221760, 'steps': 2386, 'loss/train': 0.7221275568008423} -09/20/2021 22:45:27 - INFO - __main__ - Step 38181: {'lr': 0.0001994559614215911, 'samples': 1221792, 'steps': 2386, 'loss/train': 0.5259423851966858} -09/20/2021 22:45:28 - INFO - __main__ - Step 38182: {'lr': 0.0001994559614215911, 'samples': 1221824, 'steps': 2386, 'loss/train': 2.3397982120513916} -09/20/2021 22:45:29 - INFO - __main__ - Step 38183: {'lr': 0.0001994559614215911, 'samples': 1221856, 'steps': 2386, 'loss/train': 2.3133163452148438} -09/20/2021 22:45:29 - INFO - __main__ - Step 38184: {'lr': 0.0001994559614215911, 'samples': 1221888, 'steps': 2386, 'loss/train': 1.7401572465896606} -09/20/2021 22:45:30 - INFO - __main__ - Step 38185: {'lr': 0.0001994559614215911, 'samples': 1221920, 'steps': 2386, 'loss/train': 1.8526180982589722} -09/20/2021 22:45:31 - INFO - __main__ - Step 38186: {'lr': 0.0001994559614215911, 'samples': 1221952, 'steps': 2386, 'loss/train': 2.252549886703491} -09/20/2021 22:45:32 - INFO - __main__ - Step 38187: {'lr': 0.0001994559614215911, 'samples': 1221984, 'steps': 2386, 'loss/train': 1.2566152811050415} -09/20/2021 22:45:32 - INFO - __main__ - Step 38188: {'lr': 0.0001994559614215911, 'samples': 1222016, 'steps': 2386, 'loss/train': 2.47731876373291} -09/20/2021 22:45:33 - INFO - __main__ - Step 38189: {'lr': 0.0001994559614215911, 'samples': 1222048, 'steps': 2386, 'loss/train': 1.1370929479599} -09/20/2021 22:45:34 - INFO - __main__ - Step 38190: {'lr': 0.0001994559614215911, 'samples': 1222080, 'steps': 2386, 'loss/train': 0.5319451093673706} -09/20/2021 22:45:35 - INFO - __main__ - Step 38191: {'lr': 0.0001994559614215911, 'samples': 1222112, 'steps': 2386, 'loss/train': 3.08126163482666} -09/20/2021 22:45:35 - INFO - __main__ - Step 38192: {'lr': 0.0001994559614215911, 'samples': 1222144, 'steps': 2386, 'loss/train': 2.4231479167938232} -09/20/2021 22:45:36 - INFO - __main__ - Step 38193: {'lr': 0.0001994552967391212, 'samples': 1222176, 'steps': 2387, 'loss/train': 1.985894799232483} -09/20/2021 22:45:37 - INFO - __main__ - Step 38194: {'lr': 0.0001994552967391212, 'samples': 1222208, 'steps': 2387, 'loss/train': 2.369802474975586} -09/20/2021 22:45:38 - INFO - __main__ - Step 38195: {'lr': 0.0001994552967391212, 'samples': 1222240, 'steps': 2387, 'loss/train': 1.3630667924880981} -09/20/2021 22:45:38 - INFO - __main__ - Step 38196: {'lr': 0.0001994552967391212, 'samples': 1222272, 'steps': 2387, 'loss/train': 2.5953617095947266} -09/20/2021 22:45:39 - INFO - __main__ - Step 38197: {'lr': 0.0001994552967391212, 'samples': 1222304, 'steps': 2387, 'loss/train': 1.521527647972107} -09/20/2021 22:45:40 - INFO - __main__ - Step 38198: {'lr': 0.0001994552967391212, 'samples': 1222336, 'steps': 2387, 'loss/train': 1.8263767957687378} -09/20/2021 22:45:41 - INFO - __main__ - Step 38199: {'lr': 0.0001994552967391212, 'samples': 1222368, 'steps': 2387, 'loss/train': 3.0409932136535645} -09/20/2021 22:45:41 - INFO - __main__ - Step 38200: {'lr': 0.0001994552967391212, 'samples': 1222400, 'steps': 2387, 'loss/train': 2.3012497425079346} -09/20/2021 22:45:42 - INFO - __main__ - Step 38201: {'lr': 0.0001994552967391212, 'samples': 1222432, 'steps': 2387, 'loss/train': 2.181359052658081} -09/20/2021 22:45:43 - INFO - __main__ - Step 38202: {'lr': 0.0001994552967391212, 'samples': 1222464, 'steps': 2387, 'loss/train': 2.6994800567626953} -09/20/2021 22:45:44 - INFO - __main__ - Step 38203: {'lr': 0.0001994552967391212, 'samples': 1222496, 'steps': 2387, 'loss/train': 2.41259503364563} -09/20/2021 22:45:44 - INFO - __main__ - Step 38204: {'lr': 0.0001994552967391212, 'samples': 1222528, 'steps': 2387, 'loss/train': 1.9033527374267578} -09/20/2021 22:45:45 - INFO - __main__ - Step 38205: {'lr': 0.0001994552967391212, 'samples': 1222560, 'steps': 2387, 'loss/train': 2.1259169578552246} -09/20/2021 22:45:46 - INFO - __main__ - Step 38206: {'lr': 0.0001994552967391212, 'samples': 1222592, 'steps': 2387, 'loss/train': 3.24887752532959} -09/20/2021 22:45:47 - INFO - __main__ - Step 38207: {'lr': 0.0001994552967391212, 'samples': 1222624, 'steps': 2387, 'loss/train': 2.236973285675049} -09/20/2021 22:45:47 - INFO - __main__ - Step 38208: {'lr': 0.0001994552967391212, 'samples': 1222656, 'steps': 2387, 'loss/train': 2.1139724254608154} -09/20/2021 22:45:48 - INFO - __main__ - Step 38209: {'lr': 0.0001994546316519681, 'samples': 1222688, 'steps': 2388, 'loss/train': 1.566475510597229} -09/20/2021 22:45:49 - INFO - __main__ - Step 38210: {'lr': 0.0001994546316519681, 'samples': 1222720, 'steps': 2388, 'loss/train': 2.2864367961883545} -09/20/2021 22:45:50 - INFO - __main__ - Step 38211: {'lr': 0.0001994546316519681, 'samples': 1222752, 'steps': 2388, 'loss/train': 2.875755548477173} -09/20/2021 22:45:51 - INFO - __main__ - Step 38212: {'lr': 0.0001994546316519681, 'samples': 1222784, 'steps': 2388, 'loss/train': 1.9478105306625366} -09/20/2021 22:45:52 - INFO - __main__ - Step 38213: {'lr': 0.0001994546316519681, 'samples': 1222816, 'steps': 2388, 'loss/train': 1.986578345298767} -09/20/2021 22:45:53 - INFO - __main__ - Step 38214: {'lr': 0.0001994546316519681, 'samples': 1222848, 'steps': 2388, 'loss/train': 1.6534509658813477} -09/20/2021 22:45:53 - INFO - __main__ - Step 38215: {'lr': 0.0001994546316519681, 'samples': 1222880, 'steps': 2388, 'loss/train': 1.8670542240142822} -09/20/2021 22:45:54 - INFO - __main__ - Step 38216: {'lr': 0.0001994546316519681, 'samples': 1222912, 'steps': 2388, 'loss/train': 3.463505744934082} -09/20/2021 22:45:55 - INFO - __main__ - Step 38217: {'lr': 0.0001994546316519681, 'samples': 1222944, 'steps': 2388, 'loss/train': 2.468106508255005} -09/20/2021 22:45:56 - INFO - __main__ - Step 38218: {'lr': 0.0001994546316519681, 'samples': 1222976, 'steps': 2388, 'loss/train': 1.7174779176712036} -09/20/2021 22:45:56 - INFO - __main__ - Step 38219: {'lr': 0.0001994546316519681, 'samples': 1223008, 'steps': 2388, 'loss/train': 2.2975916862487793} -09/20/2021 22:45:57 - INFO - __main__ - Step 38220: {'lr': 0.0001994546316519681, 'samples': 1223040, 'steps': 2388, 'loss/train': 2.1491334438323975} -09/20/2021 22:45:58 - INFO - __main__ - Step 38221: {'lr': 0.0001994546316519681, 'samples': 1223072, 'steps': 2388, 'loss/train': 2.955591917037964} -09/20/2021 22:45:59 - INFO - __main__ - Step 38222: {'lr': 0.0001994546316519681, 'samples': 1223104, 'steps': 2388, 'loss/train': 2.0187485218048096} -09/20/2021 22:45:59 - INFO - __main__ - Step 38223: {'lr': 0.0001994546316519681, 'samples': 1223136, 'steps': 2388, 'loss/train': 2.104377031326294} -09/20/2021 22:46:00 - INFO - __main__ - Step 38224: {'lr': 0.0001994546316519681, 'samples': 1223168, 'steps': 2388, 'loss/train': 2.0090556144714355} -09/20/2021 22:46:01 - INFO - __main__ - Step 38225: {'lr': 0.00019945396616013444, 'samples': 1223200, 'steps': 2389, 'loss/train': 2.4226136207580566} -09/20/2021 22:46:02 - INFO - __main__ - Step 38226: {'lr': 0.00019945396616013444, 'samples': 1223232, 'steps': 2389, 'loss/train': 2.3797855377197266} -09/20/2021 22:46:02 - INFO - __main__ - Step 38227: {'lr': 0.00019945396616013444, 'samples': 1223264, 'steps': 2389, 'loss/train': 2.773134469985962} -09/20/2021 22:46:03 - INFO - __main__ - Step 38228: {'lr': 0.00019945396616013444, 'samples': 1223296, 'steps': 2389, 'loss/train': 1.8679814338684082} -09/20/2021 22:46:04 - INFO - __main__ - Step 38229: {'lr': 0.00019945396616013444, 'samples': 1223328, 'steps': 2389, 'loss/train': 1.5750699043273926} -09/20/2021 22:46:05 - INFO - __main__ - Step 38230: {'lr': 0.00019945396616013444, 'samples': 1223360, 'steps': 2389, 'loss/train': 2.5495965480804443} -09/20/2021 22:46:05 - INFO - __main__ - Step 38231: {'lr': 0.00019945396616013444, 'samples': 1223392, 'steps': 2389, 'loss/train': 0.7378814220428467} -09/20/2021 22:46:06 - INFO - __main__ - Step 38232: {'lr': 0.00019945396616013444, 'samples': 1223424, 'steps': 2389, 'loss/train': 2.5355706214904785} -09/20/2021 22:46:07 - INFO - __main__ - Step 38233: {'lr': 0.00019945396616013444, 'samples': 1223456, 'steps': 2389, 'loss/train': 1.3119072914123535} -09/20/2021 22:46:08 - INFO - __main__ - Step 38234: {'lr': 0.00019945396616013444, 'samples': 1223488, 'steps': 2389, 'loss/train': 2.0994739532470703} -09/20/2021 22:46:09 - INFO - __main__ - Step 38235: {'lr': 0.00019945396616013444, 'samples': 1223520, 'steps': 2389, 'loss/train': 1.8245418071746826} -09/20/2021 22:46:09 - INFO - __main__ - Step 38236: {'lr': 0.00019945396616013444, 'samples': 1223552, 'steps': 2389, 'loss/train': 1.976036787033081} -09/20/2021 22:46:10 - INFO - __main__ - Step 38237: {'lr': 0.00019945396616013444, 'samples': 1223584, 'steps': 2389, 'loss/train': 1.2300560474395752} -09/20/2021 22:46:11 - INFO - __main__ - Step 38238: {'lr': 0.00019945396616013444, 'samples': 1223616, 'steps': 2389, 'loss/train': 2.2481210231781006} -09/20/2021 22:46:12 - INFO - __main__ - Step 38239: {'lr': 0.00019945396616013444, 'samples': 1223648, 'steps': 2389, 'loss/train': 2.2881171703338623} -09/20/2021 22:46:12 - INFO - __main__ - Step 38240: {'lr': 0.00019945396616013444, 'samples': 1223680, 'steps': 2389, 'loss/train': 2.4084441661834717} -09/20/2021 22:46:14 - INFO - __main__ - Step 38241: {'lr': 0.00019945330026362304, 'samples': 1223712, 'steps': 2390, 'loss/train': 1.6750956773757935} -09/20/2021 22:46:15 - INFO - __main__ - Step 38242: {'lr': 0.00019945330026362304, 'samples': 1223744, 'steps': 2390, 'loss/train': 1.8383746147155762} -09/20/2021 22:46:15 - INFO - __main__ - Step 38243: {'lr': 0.00019945330026362304, 'samples': 1223776, 'steps': 2390, 'loss/train': 2.1551647186279297} -09/20/2021 22:46:16 - INFO - __main__ - Step 38244: {'lr': 0.00019945330026362304, 'samples': 1223808, 'steps': 2390, 'loss/train': 2.532869338989258} -09/20/2021 22:46:17 - INFO - __main__ - Step 38245: {'lr': 0.00019945330026362304, 'samples': 1223840, 'steps': 2390, 'loss/train': 1.7356488704681396} -09/20/2021 22:46:18 - INFO - __main__ - Step 38246: {'lr': 0.00019945330026362304, 'samples': 1223872, 'steps': 2390, 'loss/train': 2.7152702808380127} -09/20/2021 22:46:18 - INFO - __main__ - Step 38247: {'lr': 0.00019945330026362304, 'samples': 1223904, 'steps': 2390, 'loss/train': 1.8495476245880127} -09/20/2021 22:46:19 - INFO - __main__ - Step 38248: {'lr': 0.00019945330026362304, 'samples': 1223936, 'steps': 2390, 'loss/train': 2.443051815032959} -09/20/2021 22:46:20 - INFO - __main__ - Step 38249: {'lr': 0.00019945330026362304, 'samples': 1223968, 'steps': 2390, 'loss/train': 2.1684377193450928} -09/20/2021 22:46:21 - INFO - __main__ - Step 38250: {'lr': 0.00019945330026362304, 'samples': 1224000, 'steps': 2390, 'loss/train': 1.9656803607940674} -09/20/2021 22:46:21 - INFO - __main__ - Step 38251: {'lr': 0.00019945330026362304, 'samples': 1224032, 'steps': 2390, 'loss/train': 2.1475813388824463} -09/20/2021 22:46:22 - INFO - __main__ - Step 38252: {'lr': 0.00019945330026362304, 'samples': 1224064, 'steps': 2390, 'loss/train': 2.3516275882720947} -09/20/2021 22:46:23 - INFO - __main__ - Step 38253: {'lr': 0.00019945330026362304, 'samples': 1224096, 'steps': 2390, 'loss/train': 2.1963815689086914} -09/20/2021 22:46:24 - INFO - __main__ - Step 38254: {'lr': 0.00019945330026362304, 'samples': 1224128, 'steps': 2390, 'loss/train': 0.1997244507074356} -09/20/2021 22:46:24 - INFO - __main__ - Step 38255: {'lr': 0.00019945330026362304, 'samples': 1224160, 'steps': 2390, 'loss/train': 0.10606106370687485} -09/20/2021 22:46:25 - INFO - __main__ - Step 38256: {'lr': 0.00019945330026362304, 'samples': 1224192, 'steps': 2390, 'loss/train': 0.12548349797725677} -09/20/2021 22:46:26 - INFO - __main__ - Step 38257: {'lr': 0.00019945263396243653, 'samples': 1224224, 'steps': 2391, 'loss/train': 2.0197300910949707} -09/20/2021 22:46:27 - INFO - __main__ - Step 38258: {'lr': 0.00019945263396243653, 'samples': 1224256, 'steps': 2391, 'loss/train': 2.1712889671325684} -09/20/2021 22:46:27 - INFO - __main__ - Step 38259: {'lr': 0.00019945263396243653, 'samples': 1224288, 'steps': 2391, 'loss/train': 2.1830546855926514} -09/20/2021 22:46:28 - INFO - __main__ - Step 38260: {'lr': 0.00019945263396243653, 'samples': 1224320, 'steps': 2391, 'loss/train': 1.6850320100784302} -09/20/2021 22:46:29 - INFO - __main__ - Step 38261: {'lr': 0.00019945263396243653, 'samples': 1224352, 'steps': 2391, 'loss/train': 2.2330336570739746} -09/20/2021 22:46:30 - INFO - __main__ - Step 38262: {'lr': 0.00019945263396243653, 'samples': 1224384, 'steps': 2391, 'loss/train': 1.714386224746704} -09/20/2021 22:46:30 - INFO - __main__ - Step 38263: {'lr': 0.00019945263396243653, 'samples': 1224416, 'steps': 2391, 'loss/train': 2.3337297439575195} -09/20/2021 22:46:31 - INFO - __main__ - Step 38264: {'lr': 0.00019945263396243653, 'samples': 1224448, 'steps': 2391, 'loss/train': 2.790071487426758} -09/20/2021 22:46:32 - INFO - __main__ - Step 38265: {'lr': 0.00019945263396243653, 'samples': 1224480, 'steps': 2391, 'loss/train': 2.689363479614258} -09/20/2021 22:46:33 - INFO - __main__ - Step 38266: {'lr': 0.00019945263396243653, 'samples': 1224512, 'steps': 2391, 'loss/train': 1.1942603588104248} -09/20/2021 22:46:33 - INFO - __main__ - Step 38267: {'lr': 0.00019945263396243653, 'samples': 1224544, 'steps': 2391, 'loss/train': 0.7750887274742126} -09/20/2021 22:46:34 - INFO - __main__ - Step 38268: {'lr': 0.00019945263396243653, 'samples': 1224576, 'steps': 2391, 'loss/train': 3.3601224422454834} -09/20/2021 22:46:35 - INFO - __main__ - Step 38269: {'lr': 0.00019945263396243653, 'samples': 1224608, 'steps': 2391, 'loss/train': 2.7507541179656982} -09/20/2021 22:46:36 - INFO - __main__ - Step 38270: {'lr': 0.00019945263396243653, 'samples': 1224640, 'steps': 2391, 'loss/train': 2.0998573303222656} -09/20/2021 22:46:37 - INFO - __main__ - Step 38271: {'lr': 0.00019945263396243653, 'samples': 1224672, 'steps': 2391, 'loss/train': 1.9175018072128296} -09/20/2021 22:46:38 - INFO - __main__ - Step 38272: {'lr': 0.00019945263396243653, 'samples': 1224704, 'steps': 2391, 'loss/train': 2.2657382488250732} -09/20/2021 22:46:39 - INFO - __main__ - Step 38273: {'lr': 0.0001994519672565776, 'samples': 1224736, 'steps': 2392, 'loss/train': 1.265843152999878} -09/20/2021 22:46:39 - INFO - __main__ - Step 38274: {'lr': 0.0001994519672565776, 'samples': 1224768, 'steps': 2392, 'loss/train': 1.942421793937683} -09/20/2021 22:46:40 - INFO - __main__ - Step 38275: {'lr': 0.0001994519672565776, 'samples': 1224800, 'steps': 2392, 'loss/train': 2.0572264194488525} -09/20/2021 22:46:41 - INFO - __main__ - Step 38276: {'lr': 0.0001994519672565776, 'samples': 1224832, 'steps': 2392, 'loss/train': 3.5997118949890137} -09/20/2021 22:46:42 - INFO - __main__ - Step 38277: {'lr': 0.0001994519672565776, 'samples': 1224864, 'steps': 2392, 'loss/train': 3.011408567428589} -09/20/2021 22:46:42 - INFO - __main__ - Step 38278: {'lr': 0.0001994519672565776, 'samples': 1224896, 'steps': 2392, 'loss/train': 3.018653392791748} -09/20/2021 22:46:43 - INFO - __main__ - Step 38279: {'lr': 0.0001994519672565776, 'samples': 1224928, 'steps': 2392, 'loss/train': 2.211357831954956} -09/20/2021 22:46:44 - INFO - __main__ - Step 38280: {'lr': 0.0001994519672565776, 'samples': 1224960, 'steps': 2392, 'loss/train': 2.2086265087127686} -09/20/2021 22:46:45 - INFO - __main__ - Step 38281: {'lr': 0.0001994519672565776, 'samples': 1224992, 'steps': 2392, 'loss/train': 0.6690268516540527} -09/20/2021 22:46:45 - INFO - __main__ - Step 38282: {'lr': 0.0001994519672565776, 'samples': 1225024, 'steps': 2392, 'loss/train': 1.8269767761230469} -09/20/2021 22:46:46 - INFO - __main__ - Step 38283: {'lr': 0.0001994519672565776, 'samples': 1225056, 'steps': 2392, 'loss/train': 2.165578603744507} -09/20/2021 22:46:47 - INFO - __main__ - Step 38284: {'lr': 0.0001994519672565776, 'samples': 1225088, 'steps': 2392, 'loss/train': 1.7227368354797363} -09/20/2021 22:46:48 - INFO - __main__ - Step 38285: {'lr': 0.0001994519672565776, 'samples': 1225120, 'steps': 2392, 'loss/train': 2.5422792434692383} -09/20/2021 22:46:48 - INFO - __main__ - Step 38286: {'lr': 0.0001994519672565776, 'samples': 1225152, 'steps': 2392, 'loss/train': 3.5866918563842773} -09/20/2021 22:46:49 - INFO - __main__ - Step 38287: {'lr': 0.0001994519672565776, 'samples': 1225184, 'steps': 2392, 'loss/train': 1.6136053800582886} -09/20/2021 22:46:50 - INFO - __main__ - Step 38288: {'lr': 0.0001994519672565776, 'samples': 1225216, 'steps': 2392, 'loss/train': 1.3881243467330933} -09/20/2021 22:46:51 - INFO - __main__ - Step 38289: {'lr': 0.00019945130014604906, 'samples': 1225248, 'steps': 2393, 'loss/train': 1.4641329050064087} -09/20/2021 22:46:51 - INFO - __main__ - Step 38290: {'lr': 0.00019945130014604906, 'samples': 1225280, 'steps': 2393, 'loss/train': 1.3164070844650269} -09/20/2021 22:46:52 - INFO - __main__ - Step 38291: {'lr': 0.00019945130014604906, 'samples': 1225312, 'steps': 2393, 'loss/train': 2.9264864921569824} -09/20/2021 22:46:53 - INFO - __main__ - Step 38292: {'lr': 0.00019945130014604906, 'samples': 1225344, 'steps': 2393, 'loss/train': 0.531509280204773} -09/20/2021 22:46:54 - INFO - __main__ - Step 38293: {'lr': 0.00019945130014604906, 'samples': 1225376, 'steps': 2393, 'loss/train': 2.191898822784424} -09/20/2021 22:46:54 - INFO - __main__ - Step 38294: {'lr': 0.00019945130014604906, 'samples': 1225408, 'steps': 2393, 'loss/train': 2.403836250305176} -09/20/2021 22:46:55 - INFO - __main__ - Step 38295: {'lr': 0.00019945130014604906, 'samples': 1225440, 'steps': 2393, 'loss/train': 2.375312566757202} -09/20/2021 22:46:56 - INFO - __main__ - Step 38296: {'lr': 0.00019945130014604906, 'samples': 1225472, 'steps': 2393, 'loss/train': 2.138570547103882} -09/20/2021 22:46:57 - INFO - __main__ - Step 38297: {'lr': 0.00019945130014604906, 'samples': 1225504, 'steps': 2393, 'loss/train': 2.604156255722046} -09/20/2021 22:46:57 - INFO - __main__ - Step 38298: {'lr': 0.00019945130014604906, 'samples': 1225536, 'steps': 2393, 'loss/train': 3.335598945617676} -09/20/2021 22:46:58 - INFO - __main__ - Step 38299: {'lr': 0.00019945130014604906, 'samples': 1225568, 'steps': 2393, 'loss/train': 2.214259386062622} -09/20/2021 22:46:59 - INFO - __main__ - Step 38300: {'lr': 0.00019945130014604906, 'samples': 1225600, 'steps': 2393, 'loss/train': 1.4324787855148315} -09/20/2021 22:47:00 - INFO - __main__ - Step 38301: {'lr': 0.00019945130014604906, 'samples': 1225632, 'steps': 2393, 'loss/train': 1.3670988082885742} -09/20/2021 22:47:01 - INFO - __main__ - Step 38302: {'lr': 0.00019945130014604906, 'samples': 1225664, 'steps': 2393, 'loss/train': 2.752094030380249} -09/20/2021 22:47:02 - INFO - __main__ - Step 38303: {'lr': 0.00019945130014604906, 'samples': 1225696, 'steps': 2393, 'loss/train': 2.173447608947754} -09/20/2021 22:47:03 - INFO - __main__ - Step 38304: {'lr': 0.00019945130014604906, 'samples': 1225728, 'steps': 2393, 'loss/train': 2.102489471435547} -09/20/2021 22:47:03 - INFO - __main__ - Step 38305: {'lr': 0.00019945063263085352, 'samples': 1225760, 'steps': 2394, 'loss/train': 1.2755342721939087} -09/20/2021 22:47:04 - INFO - __main__ - Step 38306: {'lr': 0.00019945063263085352, 'samples': 1225792, 'steps': 2394, 'loss/train': 2.0907063484191895} -09/20/2021 22:47:05 - INFO - __main__ - Step 38307: {'lr': 0.00019945063263085352, 'samples': 1225824, 'steps': 2394, 'loss/train': 2.678772211074829} -09/20/2021 22:47:06 - INFO - __main__ - Step 38308: {'lr': 0.00019945063263085352, 'samples': 1225856, 'steps': 2394, 'loss/train': 1.9563226699829102} -09/20/2021 22:47:06 - INFO - __main__ - Step 38309: {'lr': 0.00019945063263085352, 'samples': 1225888, 'steps': 2394, 'loss/train': 2.1125147342681885} -09/20/2021 22:47:07 - INFO - __main__ - Step 38310: {'lr': 0.00019945063263085352, 'samples': 1225920, 'steps': 2394, 'loss/train': 2.5365355014801025} -09/20/2021 22:47:08 - INFO - __main__ - Step 38311: {'lr': 0.00019945063263085352, 'samples': 1225952, 'steps': 2394, 'loss/train': 2.6069018840789795} -09/20/2021 22:47:09 - INFO - __main__ - Step 38312: {'lr': 0.00019945063263085352, 'samples': 1225984, 'steps': 2394, 'loss/train': 2.404020309448242} -09/20/2021 22:47:09 - INFO - __main__ - Step 38313: {'lr': 0.00019945063263085352, 'samples': 1226016, 'steps': 2394, 'loss/train': 2.614718437194824} -09/20/2021 22:47:10 - INFO - __main__ - Step 38314: {'lr': 0.00019945063263085352, 'samples': 1226048, 'steps': 2394, 'loss/train': 2.1081085205078125} -09/20/2021 22:47:11 - INFO - __main__ - Step 38315: {'lr': 0.00019945063263085352, 'samples': 1226080, 'steps': 2394, 'loss/train': 2.185906410217285} -09/20/2021 22:47:12 - INFO - __main__ - Step 38316: {'lr': 0.00019945063263085352, 'samples': 1226112, 'steps': 2394, 'loss/train': 2.1056692600250244} -09/20/2021 22:47:12 - INFO - __main__ - Step 38317: {'lr': 0.00019945063263085352, 'samples': 1226144, 'steps': 2394, 'loss/train': 2.377614974975586} -09/20/2021 22:47:13 - INFO - __main__ - Step 38318: {'lr': 0.00019945063263085352, 'samples': 1226176, 'steps': 2394, 'loss/train': 1.6035956144332886} -09/20/2021 22:47:14 - INFO - __main__ - Step 38319: {'lr': 0.00019945063263085352, 'samples': 1226208, 'steps': 2394, 'loss/train': 1.7411909103393555} -09/20/2021 22:47:15 - INFO - __main__ - Step 38320: {'lr': 0.00019945063263085352, 'samples': 1226240, 'steps': 2394, 'loss/train': 2.0366814136505127} -09/20/2021 22:47:16 - INFO - __main__ - Step 38321: {'lr': 0.00019944996471099374, 'samples': 1226272, 'steps': 2395, 'loss/train': 2.021714448928833} -09/20/2021 22:47:16 - INFO - __main__ - Step 38322: {'lr': 0.00019944996471099374, 'samples': 1226304, 'steps': 2395, 'loss/train': 0.3783864378929138} -09/20/2021 22:47:17 - INFO - __main__ - Step 38323: {'lr': 0.00019944996471099374, 'samples': 1226336, 'steps': 2395, 'loss/train': 2.3562495708465576} -09/20/2021 22:47:18 - INFO - __main__ - Step 38324: {'lr': 0.00019944996471099374, 'samples': 1226368, 'steps': 2395, 'loss/train': 1.2202847003936768} -09/20/2021 22:47:19 - INFO - __main__ - Step 38325: {'lr': 0.00019944996471099374, 'samples': 1226400, 'steps': 2395, 'loss/train': 2.263643264770508} -09/20/2021 22:47:19 - INFO - __main__ - Step 38326: {'lr': 0.00019944996471099374, 'samples': 1226432, 'steps': 2395, 'loss/train': 1.3726540803909302} -09/20/2021 22:47:20 - INFO - __main__ - Step 38327: {'lr': 0.00019944996471099374, 'samples': 1226464, 'steps': 2395, 'loss/train': 2.015817880630493} -09/20/2021 22:47:21 - INFO - __main__ - Step 38328: {'lr': 0.00019944996471099374, 'samples': 1226496, 'steps': 2395, 'loss/train': 2.1260485649108887} -09/20/2021 22:47:22 - INFO - __main__ - Step 38329: {'lr': 0.00019944996471099374, 'samples': 1226528, 'steps': 2395, 'loss/train': 1.057600498199463} -09/20/2021 22:47:22 - INFO - __main__ - Step 38330: {'lr': 0.00019944996471099374, 'samples': 1226560, 'steps': 2395, 'loss/train': 4.0302839279174805} -09/20/2021 22:47:23 - INFO - __main__ - Step 38331: {'lr': 0.00019944996471099374, 'samples': 1226592, 'steps': 2395, 'loss/train': 1.4794145822525024} -09/20/2021 22:47:24 - INFO - __main__ - Step 38332: {'lr': 0.00019944996471099374, 'samples': 1226624, 'steps': 2395, 'loss/train': 2.417684555053711} -09/20/2021 22:47:25 - INFO - __main__ - Step 38333: {'lr': 0.00019944996471099374, 'samples': 1226656, 'steps': 2395, 'loss/train': 1.6651763916015625} -09/20/2021 22:47:26 - INFO - __main__ - Step 38334: {'lr': 0.00019944996471099374, 'samples': 1226688, 'steps': 2395, 'loss/train': 1.997559905052185} -09/20/2021 22:47:27 - INFO - __main__ - Step 38335: {'lr': 0.00019944996471099374, 'samples': 1226720, 'steps': 2395, 'loss/train': 2.106353521347046} -09/20/2021 22:47:27 - INFO - __main__ - Step 38336: {'lr': 0.00019944996471099374, 'samples': 1226752, 'steps': 2395, 'loss/train': 3.4635090827941895} -09/20/2021 22:47:28 - INFO - __main__ - Step 38337: {'lr': 0.00019944929638647247, 'samples': 1226784, 'steps': 2396, 'loss/train': 2.9147415161132812} -09/20/2021 22:47:29 - INFO - __main__ - Step 38338: {'lr': 0.00019944929638647247, 'samples': 1226816, 'steps': 2396, 'loss/train': 2.443420648574829} -09/20/2021 22:47:30 - INFO - __main__ - Step 38339: {'lr': 0.00019944929638647247, 'samples': 1226848, 'steps': 2396, 'loss/train': 1.8544949293136597} -09/20/2021 22:47:30 - INFO - __main__ - Step 38340: {'lr': 0.00019944929638647247, 'samples': 1226880, 'steps': 2396, 'loss/train': 2.622974395751953} -09/20/2021 22:47:31 - INFO - __main__ - Step 38341: {'lr': 0.00019944929638647247, 'samples': 1226912, 'steps': 2396, 'loss/train': 2.6206772327423096} -09/20/2021 22:47:32 - INFO - __main__ - Step 38342: {'lr': 0.00019944929638647247, 'samples': 1226944, 'steps': 2396, 'loss/train': 1.5332329273223877} -09/20/2021 22:47:33 - INFO - __main__ - Step 38343: {'lr': 0.00019944929638647247, 'samples': 1226976, 'steps': 2396, 'loss/train': 2.732938289642334} -09/20/2021 22:47:33 - INFO - __main__ - Step 38344: {'lr': 0.00019944929638647247, 'samples': 1227008, 'steps': 2396, 'loss/train': 2.731509208679199} -09/20/2021 22:47:34 - INFO - __main__ - Step 38345: {'lr': 0.00019944929638647247, 'samples': 1227040, 'steps': 2396, 'loss/train': 1.7092249393463135} -09/20/2021 22:47:35 - INFO - __main__ - Step 38346: {'lr': 0.00019944929638647247, 'samples': 1227072, 'steps': 2396, 'loss/train': 2.219196081161499} -09/20/2021 22:47:36 - INFO - __main__ - Step 38347: {'lr': 0.00019944929638647247, 'samples': 1227104, 'steps': 2396, 'loss/train': 1.5166339874267578} -09/20/2021 22:47:36 - INFO - __main__ - Step 38348: {'lr': 0.00019944929638647247, 'samples': 1227136, 'steps': 2396, 'loss/train': 2.2131245136260986} -09/20/2021 22:47:37 - INFO - __main__ - Step 38349: {'lr': 0.00019944929638647247, 'samples': 1227168, 'steps': 2396, 'loss/train': 2.0707955360412598} -09/20/2021 22:47:38 - INFO - __main__ - Step 38350: {'lr': 0.00019944929638647247, 'samples': 1227200, 'steps': 2396, 'loss/train': 2.581744432449341} -09/20/2021 22:47:39 - INFO - __main__ - Step 38351: {'lr': 0.00019944929638647247, 'samples': 1227232, 'steps': 2396, 'loss/train': 2.049722909927368} -09/20/2021 22:47:39 - INFO - __main__ - Step 38352: {'lr': 0.00019944929638647247, 'samples': 1227264, 'steps': 2396, 'loss/train': 1.5010926723480225} -09/20/2021 22:47:40 - INFO - __main__ - Step 38353: {'lr': 0.0001994486276572924, 'samples': 1227296, 'steps': 2397, 'loss/train': 2.8770105838775635} -09/20/2021 22:47:41 - INFO - __main__ - Step 38354: {'lr': 0.0001994486276572924, 'samples': 1227328, 'steps': 2397, 'loss/train': 1.191314458847046} -09/20/2021 22:47:42 - INFO - __main__ - Step 38355: {'lr': 0.0001994486276572924, 'samples': 1227360, 'steps': 2397, 'loss/train': 1.64564847946167} -09/20/2021 22:47:43 - INFO - __main__ - Step 38356: {'lr': 0.0001994486276572924, 'samples': 1227392, 'steps': 2397, 'loss/train': 2.1515214443206787} -09/20/2021 22:47:43 - INFO - __main__ - Step 38357: {'lr': 0.0001994486276572924, 'samples': 1227424, 'steps': 2397, 'loss/train': 1.5727827548980713} -09/20/2021 22:47:44 - INFO - __main__ - Step 38358: {'lr': 0.0001994486276572924, 'samples': 1227456, 'steps': 2397, 'loss/train': 2.804257869720459} -09/20/2021 22:47:45 - INFO - __main__ - Step 38359: {'lr': 0.0001994486276572924, 'samples': 1227488, 'steps': 2397, 'loss/train': 0.6724240183830261} -09/20/2021 22:47:46 - INFO - __main__ - Step 38360: {'lr': 0.0001994486276572924, 'samples': 1227520, 'steps': 2397, 'loss/train': 1.7415889501571655} -09/20/2021 22:47:46 - INFO - __main__ - Step 38361: {'lr': 0.0001994486276572924, 'samples': 1227552, 'steps': 2397, 'loss/train': 2.037846803665161} -09/20/2021 22:47:47 - INFO - __main__ - Step 38362: {'lr': 0.0001994486276572924, 'samples': 1227584, 'steps': 2397, 'loss/train': 1.7911494970321655} -09/20/2021 22:47:48 - INFO - __main__ - Step 38363: {'lr': 0.0001994486276572924, 'samples': 1227616, 'steps': 2397, 'loss/train': 2.638400077819824} -09/20/2021 22:47:49 - INFO - __main__ - Step 38364: {'lr': 0.0001994486276572924, 'samples': 1227648, 'steps': 2397, 'loss/train': 2.1181399822235107} -09/20/2021 22:47:50 - INFO - __main__ - Step 38365: {'lr': 0.0001994486276572924, 'samples': 1227680, 'steps': 2397, 'loss/train': 2.0833661556243896} -09/20/2021 22:47:51 - INFO - __main__ - Step 38366: {'lr': 0.0001994486276572924, 'samples': 1227712, 'steps': 2397, 'loss/train': 1.1986427307128906} -09/20/2021 22:47:51 - INFO - __main__ - Step 38367: {'lr': 0.0001994486276572924, 'samples': 1227744, 'steps': 2397, 'loss/train': 2.066084623336792} -09/20/2021 22:47:52 - INFO - __main__ - Step 38368: {'lr': 0.0001994486276572924, 'samples': 1227776, 'steps': 2397, 'loss/train': 3.1221580505371094} -09/20/2021 22:47:53 - INFO - __main__ - Step 38369: {'lr': 0.00019944795852345625, 'samples': 1227808, 'steps': 2398, 'loss/train': 1.3921074867248535} -09/20/2021 22:47:54 - INFO - __main__ - Step 38370: {'lr': 0.00019944795852345625, 'samples': 1227840, 'steps': 2398, 'loss/train': 1.5537832975387573} -09/20/2021 22:47:54 - INFO - __main__ - Step 38371: {'lr': 0.00019944795852345625, 'samples': 1227872, 'steps': 2398, 'loss/train': 1.8078136444091797} -09/20/2021 22:47:55 - INFO - __main__ - Step 38372: {'lr': 0.00019944795852345625, 'samples': 1227904, 'steps': 2398, 'loss/train': 1.5011329650878906} -09/20/2021 22:47:56 - INFO - __main__ - Step 38373: {'lr': 0.00019944795852345625, 'samples': 1227936, 'steps': 2398, 'loss/train': 2.5557634830474854} -09/20/2021 22:47:57 - INFO - __main__ - Step 38374: {'lr': 0.00019944795852345625, 'samples': 1227968, 'steps': 2398, 'loss/train': 1.085740089416504} -09/20/2021 22:47:57 - INFO - __main__ - Step 38375: {'lr': 0.00019944795852345625, 'samples': 1228000, 'steps': 2398, 'loss/train': 2.6256086826324463} -09/20/2021 22:47:58 - INFO - __main__ - Step 38376: {'lr': 0.00019944795852345625, 'samples': 1228032, 'steps': 2398, 'loss/train': 2.7506630420684814} -09/20/2021 22:47:59 - INFO - __main__ - Step 38377: {'lr': 0.00019944795852345625, 'samples': 1228064, 'steps': 2398, 'loss/train': 2.745990037918091} -09/20/2021 22:48:00 - INFO - __main__ - Step 38378: {'lr': 0.00019944795852345625, 'samples': 1228096, 'steps': 2398, 'loss/train': 2.7662856578826904} -09/20/2021 22:48:00 - INFO - __main__ - Step 38379: {'lr': 0.00019944795852345625, 'samples': 1228128, 'steps': 2398, 'loss/train': 1.6717808246612549} -09/20/2021 22:48:01 - INFO - __main__ - Step 38380: {'lr': 0.00019944795852345625, 'samples': 1228160, 'steps': 2398, 'loss/train': 2.9338412284851074} -09/20/2021 22:48:02 - INFO - __main__ - Step 38381: {'lr': 0.00019944795852345625, 'samples': 1228192, 'steps': 2398, 'loss/train': 2.2584824562072754} -09/20/2021 22:48:03 - INFO - __main__ - Step 38382: {'lr': 0.00019944795852345625, 'samples': 1228224, 'steps': 2398, 'loss/train': 2.1962890625} -09/20/2021 22:48:03 - INFO - __main__ - Step 38383: {'lr': 0.00019944795852345625, 'samples': 1228256, 'steps': 2398, 'loss/train': 2.585646390914917} -09/20/2021 22:48:04 - INFO - __main__ - Step 38384: {'lr': 0.00019944795852345625, 'samples': 1228288, 'steps': 2398, 'loss/train': 2.7455646991729736} -09/20/2021 22:48:05 - INFO - __main__ - Step 38385: {'lr': 0.00019944728898496668, 'samples': 1228320, 'steps': 2399, 'loss/train': 2.184314012527466} -09/20/2021 22:48:06 - INFO - __main__ - Step 38386: {'lr': 0.00019944728898496668, 'samples': 1228352, 'steps': 2399, 'loss/train': 1.966115951538086} -09/20/2021 22:48:07 - INFO - __main__ - Step 38387: {'lr': 0.00019944728898496668, 'samples': 1228384, 'steps': 2399, 'loss/train': 2.2617526054382324} -09/20/2021 22:48:07 - INFO - __main__ - Step 38388: {'lr': 0.00019944728898496668, 'samples': 1228416, 'steps': 2399, 'loss/train': 0.6460198760032654} -09/20/2021 22:48:08 - INFO - __main__ - Step 38389: {'lr': 0.00019944728898496668, 'samples': 1228448, 'steps': 2399, 'loss/train': 1.7081382274627686} -09/20/2021 22:48:09 - INFO - __main__ - Step 38390: {'lr': 0.00019944728898496668, 'samples': 1228480, 'steps': 2399, 'loss/train': 0.45379558205604553} -09/20/2021 22:48:10 - INFO - __main__ - Step 38391: {'lr': 0.00019944728898496668, 'samples': 1228512, 'steps': 2399, 'loss/train': 2.2328786849975586} -09/20/2021 22:48:10 - INFO - __main__ - Step 38392: {'lr': 0.00019944728898496668, 'samples': 1228544, 'steps': 2399, 'loss/train': 2.010892629623413} -09/20/2021 22:48:11 - INFO - __main__ - Step 38393: {'lr': 0.00019944728898496668, 'samples': 1228576, 'steps': 2399, 'loss/train': 2.448296308517456} -09/20/2021 22:48:12 - INFO - __main__ - Step 38394: {'lr': 0.00019944728898496668, 'samples': 1228608, 'steps': 2399, 'loss/train': 0.8542489409446716} -09/20/2021 22:48:13 - INFO - __main__ - Step 38395: {'lr': 0.00019944728898496668, 'samples': 1228640, 'steps': 2399, 'loss/train': 2.0344436168670654} -09/20/2021 22:48:14 - INFO - __main__ - Step 38396: {'lr': 0.00019944728898496668, 'samples': 1228672, 'steps': 2399, 'loss/train': 3.640050172805786} -09/20/2021 22:48:15 - INFO - __main__ - Step 38397: {'lr': 0.00019944728898496668, 'samples': 1228704, 'steps': 2399, 'loss/train': 2.0030405521392822} -09/20/2021 22:48:15 - INFO - __main__ - Step 38398: {'lr': 0.00019944728898496668, 'samples': 1228736, 'steps': 2399, 'loss/train': 3.194864273071289} -09/20/2021 22:48:16 - INFO - __main__ - Step 38399: {'lr': 0.00019944728898496668, 'samples': 1228768, 'steps': 2399, 'loss/train': 2.5814239978790283} -09/20/2021 22:48:17 - INFO - __main__ - Step 38400: {'lr': 0.00019944728898496668, 'samples': 1228800, 'steps': 2399, 'loss/train': 1.36338472366333} -09/20/2021 22:48:18 - INFO - __main__ - Step 38401: {'lr': 0.00019944661904182655, 'samples': 1228832, 'steps': 2400, 'loss/train': 1.9803597927093506} -09/20/2021 22:48:19 - INFO - __main__ - Step 38402: {'lr': 0.00019944661904182655, 'samples': 1228864, 'steps': 2400, 'loss/train': 2.141803026199341} -09/20/2021 22:48:19 - INFO - __main__ - Step 38403: {'lr': 0.00019944661904182655, 'samples': 1228896, 'steps': 2400, 'loss/train': 2.2310760021209717} -09/20/2021 22:48:20 - INFO - __main__ - Step 38404: {'lr': 0.00019944661904182655, 'samples': 1228928, 'steps': 2400, 'loss/train': 3.171926975250244} -09/20/2021 22:48:21 - INFO - __main__ - Step 38405: {'lr': 0.00019944661904182655, 'samples': 1228960, 'steps': 2400, 'loss/train': 3.174753427505493} -09/20/2021 22:48:22 - INFO - __main__ - Step 38406: {'lr': 0.00019944661904182655, 'samples': 1228992, 'steps': 2400, 'loss/train': 1.5743111371994019} -09/20/2021 22:48:22 - INFO - __main__ - Step 38407: {'lr': 0.00019944661904182655, 'samples': 1229024, 'steps': 2400, 'loss/train': 2.657195568084717} -09/20/2021 22:48:23 - INFO - __main__ - Step 38408: {'lr': 0.00019944661904182655, 'samples': 1229056, 'steps': 2400, 'loss/train': 1.641024112701416} -09/20/2021 22:48:24 - INFO - __main__ - Step 38409: {'lr': 0.00019944661904182655, 'samples': 1229088, 'steps': 2400, 'loss/train': 1.4691137075424194} -09/20/2021 22:48:25 - INFO - __main__ - Step 38410: {'lr': 0.00019944661904182655, 'samples': 1229120, 'steps': 2400, 'loss/train': 1.4348537921905518} -09/20/2021 22:48:25 - INFO - __main__ - Step 38411: {'lr': 0.00019944661904182655, 'samples': 1229152, 'steps': 2400, 'loss/train': 1.9502917528152466} -09/20/2021 22:48:26 - INFO - __main__ - Step 38412: {'lr': 0.00019944661904182655, 'samples': 1229184, 'steps': 2400, 'loss/train': 2.28424072265625} -09/20/2021 22:48:27 - INFO - __main__ - Step 38413: {'lr': 0.00019944661904182655, 'samples': 1229216, 'steps': 2400, 'loss/train': 2.1366026401519775} -09/20/2021 22:48:28 - INFO - __main__ - Step 38414: {'lr': 0.00019944661904182655, 'samples': 1229248, 'steps': 2400, 'loss/train': 1.2238140106201172} -09/20/2021 22:48:28 - INFO - __main__ - Step 38415: {'lr': 0.00019944661904182655, 'samples': 1229280, 'steps': 2400, 'loss/train': 3.262690782546997} -09/20/2021 22:48:29 - INFO - __main__ - Step 38416: {'lr': 0.00019944661904182655, 'samples': 1229312, 'steps': 2400, 'loss/train': 1.9908090829849243} -09/20/2021 22:48:30 - INFO - __main__ - Step 38417: {'lr': 0.0001994459486940385, 'samples': 1229344, 'steps': 2401, 'loss/train': 1.9887570142745972} -09/20/2021 22:48:31 - INFO - __main__ - Step 38418: {'lr': 0.0001994459486940385, 'samples': 1229376, 'steps': 2401, 'loss/train': 2.359488010406494} -09/20/2021 22:48:31 - INFO - __main__ - Step 38419: {'lr': 0.0001994459486940385, 'samples': 1229408, 'steps': 2401, 'loss/train': 0.825180172920227} -09/20/2021 22:48:32 - INFO - __main__ - Step 38420: {'lr': 0.0001994459486940385, 'samples': 1229440, 'steps': 2401, 'loss/train': 3.2208688259124756} -09/20/2021 22:48:33 - INFO - __main__ - Step 38421: {'lr': 0.0001994459486940385, 'samples': 1229472, 'steps': 2401, 'loss/train': 4.743980884552002} -09/20/2021 22:48:34 - INFO - __main__ - Step 38422: {'lr': 0.0001994459486940385, 'samples': 1229504, 'steps': 2401, 'loss/train': 2.135918140411377} -09/20/2021 22:48:34 - INFO - __main__ - Step 38423: {'lr': 0.0001994459486940385, 'samples': 1229536, 'steps': 2401, 'loss/train': 2.6000547409057617} -09/20/2021 22:48:35 - INFO - __main__ - Step 38424: {'lr': 0.0001994459486940385, 'samples': 1229568, 'steps': 2401, 'loss/train': 2.5978665351867676} -09/20/2021 22:48:36 - INFO - __main__ - Step 38425: {'lr': 0.0001994459486940385, 'samples': 1229600, 'steps': 2401, 'loss/train': 2.294158935546875} -09/20/2021 22:48:37 - INFO - __main__ - Step 38426: {'lr': 0.0001994459486940385, 'samples': 1229632, 'steps': 2401, 'loss/train': 2.7034308910369873} -09/20/2021 22:48:38 - INFO - __main__ - Step 38427: {'lr': 0.0001994459486940385, 'samples': 1229664, 'steps': 2401, 'loss/train': 2.1662516593933105} -09/20/2021 22:48:39 - INFO - __main__ - Step 38428: {'lr': 0.0001994459486940385, 'samples': 1229696, 'steps': 2401, 'loss/train': 2.633009672164917} -09/20/2021 22:48:39 - INFO - __main__ - Step 38429: {'lr': 0.0001994459486940385, 'samples': 1229728, 'steps': 2401, 'loss/train': 1.7364572286605835} -09/20/2021 22:48:40 - INFO - __main__ - Step 38430: {'lr': 0.0001994459486940385, 'samples': 1229760, 'steps': 2401, 'loss/train': 2.1950876712799072} -09/20/2021 22:48:41 - INFO - __main__ - Step 38431: {'lr': 0.0001994459486940385, 'samples': 1229792, 'steps': 2401, 'loss/train': 2.6420226097106934} -09/20/2021 22:48:42 - INFO - __main__ - Step 38432: {'lr': 0.0001994459486940385, 'samples': 1229824, 'steps': 2401, 'loss/train': 2.8789684772491455} -09/20/2021 22:48:43 - INFO - __main__ - Step 38433: {'lr': 0.00019944527794160525, 'samples': 1229856, 'steps': 2402, 'loss/train': 2.007558584213257} -09/20/2021 22:48:43 - INFO - __main__ - Step 38434: {'lr': 0.00019944527794160525, 'samples': 1229888, 'steps': 2402, 'loss/train': 2.343454122543335} -09/20/2021 22:48:44 - INFO - __main__ - Step 38435: {'lr': 0.00019944527794160525, 'samples': 1229920, 'steps': 2402, 'loss/train': 3.050133466720581} -09/20/2021 22:48:45 - INFO - __main__ - Step 38436: {'lr': 0.00019944527794160525, 'samples': 1229952, 'steps': 2402, 'loss/train': 2.001106023788452} -09/20/2021 22:48:46 - INFO - __main__ - Step 38437: {'lr': 0.00019944527794160525, 'samples': 1229984, 'steps': 2402, 'loss/train': 2.2014803886413574} -09/20/2021 22:48:46 - INFO - __main__ - Step 38438: {'lr': 0.00019944527794160525, 'samples': 1230016, 'steps': 2402, 'loss/train': 2.1624507904052734} -09/20/2021 22:48:47 - INFO - __main__ - Step 38439: {'lr': 0.00019944527794160525, 'samples': 1230048, 'steps': 2402, 'loss/train': 1.50975501537323} -09/20/2021 22:48:48 - INFO - __main__ - Step 38440: {'lr': 0.00019944527794160525, 'samples': 1230080, 'steps': 2402, 'loss/train': 2.2176311016082764} -09/20/2021 22:48:49 - INFO - __main__ - Step 38441: {'lr': 0.00019944527794160525, 'samples': 1230112, 'steps': 2402, 'loss/train': 2.8011834621429443} -09/20/2021 22:48:49 - INFO - __main__ - Step 38442: {'lr': 0.00019944527794160525, 'samples': 1230144, 'steps': 2402, 'loss/train': 1.7959883213043213} -09/20/2021 22:48:50 - INFO - __main__ - Step 38443: {'lr': 0.00019944527794160525, 'samples': 1230176, 'steps': 2402, 'loss/train': 1.6040513515472412} -09/20/2021 22:48:51 - INFO - __main__ - Step 38444: {'lr': 0.00019944527794160525, 'samples': 1230208, 'steps': 2402, 'loss/train': 1.9286857843399048} -09/20/2021 22:48:52 - INFO - __main__ - Step 38445: {'lr': 0.00019944527794160525, 'samples': 1230240, 'steps': 2402, 'loss/train': 6.057656288146973} -09/20/2021 22:48:52 - INFO - __main__ - Step 38446: {'lr': 0.00019944527794160525, 'samples': 1230272, 'steps': 2402, 'loss/train': 1.0144678354263306} -09/20/2021 22:48:53 - INFO - __main__ - Step 38447: {'lr': 0.00019944527794160525, 'samples': 1230304, 'steps': 2402, 'loss/train': 0.8560815453529358} -09/20/2021 22:48:54 - INFO - __main__ - Step 38448: {'lr': 0.00019944527794160525, 'samples': 1230336, 'steps': 2402, 'loss/train': 2.297544002532959} -09/20/2021 22:48:55 - INFO - __main__ - Step 38449: {'lr': 0.00019944460678452956, 'samples': 1230368, 'steps': 2403, 'loss/train': 2.5051980018615723} -09/20/2021 22:48:55 - INFO - __main__ - Step 38450: {'lr': 0.00019944460678452956, 'samples': 1230400, 'steps': 2403, 'loss/train': 2.4687366485595703} -09/20/2021 22:48:56 - INFO - __main__ - Step 38451: {'lr': 0.00019944460678452956, 'samples': 1230432, 'steps': 2403, 'loss/train': 2.2741503715515137} -09/20/2021 22:48:57 - INFO - __main__ - Step 38452: {'lr': 0.00019944460678452956, 'samples': 1230464, 'steps': 2403, 'loss/train': 3.602104425430298} -09/20/2021 22:48:58 - INFO - __main__ - Step 38453: {'lr': 0.00019944460678452956, 'samples': 1230496, 'steps': 2403, 'loss/train': 1.9751091003417969} -09/20/2021 22:48:58 - INFO - __main__ - Step 38454: {'lr': 0.00019944460678452956, 'samples': 1230528, 'steps': 2403, 'loss/train': 1.4617944955825806} -09/20/2021 22:48:59 - INFO - __main__ - Step 38455: {'lr': 0.00019944460678452956, 'samples': 1230560, 'steps': 2403, 'loss/train': 2.2082512378692627} -09/20/2021 22:49:00 - INFO - __main__ - Step 38456: {'lr': 0.00019944460678452956, 'samples': 1230592, 'steps': 2403, 'loss/train': 2.193674325942993} -09/20/2021 22:49:01 - INFO - __main__ - Step 38457: {'lr': 0.00019944460678452956, 'samples': 1230624, 'steps': 2403, 'loss/train': 2.56553053855896} -09/20/2021 22:49:02 - INFO - __main__ - Step 38458: {'lr': 0.00019944460678452956, 'samples': 1230656, 'steps': 2403, 'loss/train': 1.6441891193389893} -09/20/2021 22:49:03 - INFO - __main__ - Step 38459: {'lr': 0.00019944460678452956, 'samples': 1230688, 'steps': 2403, 'loss/train': 1.7817134857177734} -09/20/2021 22:49:03 - INFO - __main__ - Step 38460: {'lr': 0.00019944460678452956, 'samples': 1230720, 'steps': 2403, 'loss/train': 2.116271734237671} -09/20/2021 22:49:04 - INFO - __main__ - Step 38461: {'lr': 0.00019944460678452956, 'samples': 1230752, 'steps': 2403, 'loss/train': 1.7964246273040771} -09/20/2021 22:49:05 - INFO - __main__ - Step 38462: {'lr': 0.00019944460678452956, 'samples': 1230784, 'steps': 2403, 'loss/train': 2.2068002223968506} -09/20/2021 22:49:06 - INFO - __main__ - Step 38463: {'lr': 0.00019944460678452956, 'samples': 1230816, 'steps': 2403, 'loss/train': 1.5633502006530762} -09/20/2021 22:49:06 - INFO - __main__ - Step 38464: {'lr': 0.00019944460678452956, 'samples': 1230848, 'steps': 2403, 'loss/train': 2.5733296871185303} -09/20/2021 22:49:07 - INFO - __main__ - Step 38465: {'lr': 0.00019944393522281414, 'samples': 1230880, 'steps': 2404, 'loss/train': 3.0188279151916504} -09/20/2021 22:49:08 - INFO - __main__ - Step 38466: {'lr': 0.00019944393522281414, 'samples': 1230912, 'steps': 2404, 'loss/train': 2.062807083129883} -09/20/2021 22:49:09 - INFO - __main__ - Step 38467: {'lr': 0.00019944393522281414, 'samples': 1230944, 'steps': 2404, 'loss/train': 2.4702987670898438} -09/20/2021 22:49:10 - INFO - __main__ - Step 38468: {'lr': 0.00019944393522281414, 'samples': 1230976, 'steps': 2404, 'loss/train': 1.8479126691818237} -09/20/2021 22:49:10 - INFO - __main__ - Step 38469: {'lr': 0.00019944393522281414, 'samples': 1231008, 'steps': 2404, 'loss/train': 1.6692067384719849} -09/20/2021 22:49:11 - INFO - __main__ - Step 38470: {'lr': 0.00019944393522281414, 'samples': 1231040, 'steps': 2404, 'loss/train': 1.5840001106262207} -09/20/2021 22:49:12 - INFO - __main__ - Step 38471: {'lr': 0.00019944393522281414, 'samples': 1231072, 'steps': 2404, 'loss/train': 2.478255033493042} -09/20/2021 22:49:13 - INFO - __main__ - Step 38472: {'lr': 0.00019944393522281414, 'samples': 1231104, 'steps': 2404, 'loss/train': 1.657037615776062} -09/20/2021 22:49:13 - INFO - __main__ - Step 38473: {'lr': 0.00019944393522281414, 'samples': 1231136, 'steps': 2404, 'loss/train': 1.901384949684143} -09/20/2021 22:49:14 - INFO - __main__ - Step 38474: {'lr': 0.00019944393522281414, 'samples': 1231168, 'steps': 2404, 'loss/train': 0.6520915627479553} -09/20/2021 22:49:15 - INFO - __main__ - Step 38475: {'lr': 0.00019944393522281414, 'samples': 1231200, 'steps': 2404, 'loss/train': 2.0390233993530273} -09/20/2021 22:49:16 - INFO - __main__ - Step 38476: {'lr': 0.00019944393522281414, 'samples': 1231232, 'steps': 2404, 'loss/train': 1.9941195249557495} -09/20/2021 22:49:16 - INFO - __main__ - Step 38477: {'lr': 0.00019944393522281414, 'samples': 1231264, 'steps': 2404, 'loss/train': 1.9727768898010254} -09/20/2021 22:49:17 - INFO - __main__ - Step 38478: {'lr': 0.00019944393522281414, 'samples': 1231296, 'steps': 2404, 'loss/train': 1.6448135375976562} -09/20/2021 22:49:18 - INFO - __main__ - Step 38479: {'lr': 0.00019944393522281414, 'samples': 1231328, 'steps': 2404, 'loss/train': 2.73931884765625} -09/20/2021 22:49:19 - INFO - __main__ - Step 38480: {'lr': 0.00019944393522281414, 'samples': 1231360, 'steps': 2404, 'loss/train': 2.3375537395477295} -09/20/2021 22:49:19 - INFO - __main__ - Step 38481: {'lr': 0.00019944326325646174, 'samples': 1231392, 'steps': 2405, 'loss/train': 2.609213352203369} -09/20/2021 22:49:20 - INFO - __main__ - Step 38482: {'lr': 0.00019944326325646174, 'samples': 1231424, 'steps': 2405, 'loss/train': 2.4481446743011475} -09/20/2021 22:49:21 - INFO - __main__ - Step 38483: {'lr': 0.00019944326325646174, 'samples': 1231456, 'steps': 2405, 'loss/train': 2.203531503677368} -09/20/2021 22:49:22 - INFO - __main__ - Step 38484: {'lr': 0.00019944326325646174, 'samples': 1231488, 'steps': 2405, 'loss/train': 2.3713388442993164} -09/20/2021 22:49:22 - INFO - __main__ - Step 38485: {'lr': 0.00019944326325646174, 'samples': 1231520, 'steps': 2405, 'loss/train': 1.9373226165771484} -09/20/2021 22:49:23 - INFO - __main__ - Step 38486: {'lr': 0.00019944326325646174, 'samples': 1231552, 'steps': 2405, 'loss/train': 1.7198915481567383} -09/20/2021 22:49:25 - INFO - __main__ - Step 38487: {'lr': 0.00019944326325646174, 'samples': 1231584, 'steps': 2405, 'loss/train': 2.3479669094085693} -09/20/2021 22:49:26 - INFO - __main__ - Step 38488: {'lr': 0.00019944326325646174, 'samples': 1231616, 'steps': 2405, 'loss/train': 2.721616506576538} -09/20/2021 22:49:26 - INFO - __main__ - Step 38489: {'lr': 0.00019944326325646174, 'samples': 1231648, 'steps': 2405, 'loss/train': 2.3970108032226562} -09/20/2021 22:49:27 - INFO - __main__ - Step 38490: {'lr': 0.00019944326325646174, 'samples': 1231680, 'steps': 2405, 'loss/train': 2.181877613067627} -09/20/2021 22:49:28 - INFO - __main__ - Step 38491: {'lr': 0.00019944326325646174, 'samples': 1231712, 'steps': 2405, 'loss/train': 2.216273546218872} -09/20/2021 22:49:29 - INFO - __main__ - Step 38492: {'lr': 0.00019944326325646174, 'samples': 1231744, 'steps': 2405, 'loss/train': 2.2493669986724854} -09/20/2021 22:49:29 - INFO - __main__ - Step 38493: {'lr': 0.00019944326325646174, 'samples': 1231776, 'steps': 2405, 'loss/train': 1.9771214723587036} -09/20/2021 22:49:30 - INFO - __main__ - Step 38494: {'lr': 0.00019944326325646174, 'samples': 1231808, 'steps': 2405, 'loss/train': 1.9244115352630615} -09/20/2021 22:49:31 - INFO - __main__ - Step 38495: {'lr': 0.00019944326325646174, 'samples': 1231840, 'steps': 2405, 'loss/train': 1.963206171989441} -09/20/2021 22:49:32 - INFO - __main__ - Step 38496: {'lr': 0.00019944326325646174, 'samples': 1231872, 'steps': 2405, 'loss/train': 1.8884774446487427} -09/20/2021 22:49:33 - INFO - __main__ - Step 38497: {'lr': 0.00019944259088547513, 'samples': 1231904, 'steps': 2406, 'loss/train': 1.5837783813476562} -09/20/2021 22:49:33 - INFO - __main__ - Step 38498: {'lr': 0.00019944259088547513, 'samples': 1231936, 'steps': 2406, 'loss/train': 2.823072910308838} -09/20/2021 22:49:34 - INFO - __main__ - Step 38499: {'lr': 0.00019944259088547513, 'samples': 1231968, 'steps': 2406, 'loss/train': 1.7339566946029663} -09/20/2021 22:49:35 - INFO - __main__ - Step 38500: {'lr': 0.00019944259088547513, 'samples': 1232000, 'steps': 2406, 'loss/train': 2.2408199310302734} -09/20/2021 22:49:36 - INFO - __main__ - Step 38501: {'lr': 0.00019944259088547513, 'samples': 1232032, 'steps': 2406, 'loss/train': 2.8204710483551025} -09/20/2021 22:49:36 - INFO - __main__ - Step 38502: {'lr': 0.00019944259088547513, 'samples': 1232064, 'steps': 2406, 'loss/train': 2.399324655532837} -09/20/2021 22:49:37 - INFO - __main__ - Step 38503: {'lr': 0.00019944259088547513, 'samples': 1232096, 'steps': 2406, 'loss/train': 1.6748602390289307} -09/20/2021 22:49:38 - INFO - __main__ - Step 38504: {'lr': 0.00019944259088547513, 'samples': 1232128, 'steps': 2406, 'loss/train': 2.2161378860473633} -09/20/2021 22:49:39 - INFO - __main__ - Step 38505: {'lr': 0.00019944259088547513, 'samples': 1232160, 'steps': 2406, 'loss/train': 3.21401309967041} -09/20/2021 22:49:39 - INFO - __main__ - Step 38506: {'lr': 0.00019944259088547513, 'samples': 1232192, 'steps': 2406, 'loss/train': 1.7962318658828735} -09/20/2021 22:49:40 - INFO - __main__ - Step 38507: {'lr': 0.00019944259088547513, 'samples': 1232224, 'steps': 2406, 'loss/train': 2.27034854888916} -09/20/2021 22:49:41 - INFO - __main__ - Step 38508: {'lr': 0.00019944259088547513, 'samples': 1232256, 'steps': 2406, 'loss/train': 1.4500318765640259} -09/20/2021 22:49:42 - INFO - __main__ - Step 38509: {'lr': 0.00019944259088547513, 'samples': 1232288, 'steps': 2406, 'loss/train': 3.0353968143463135} -09/20/2021 22:49:42 - INFO - __main__ - Step 38510: {'lr': 0.00019944259088547513, 'samples': 1232320, 'steps': 2406, 'loss/train': 2.1544835567474365} -09/20/2021 22:49:43 - INFO - __main__ - Step 38511: {'lr': 0.00019944259088547513, 'samples': 1232352, 'steps': 2406, 'loss/train': 1.429587483406067} -09/20/2021 22:49:44 - INFO - __main__ - Step 38512: {'lr': 0.00019944259088547513, 'samples': 1232384, 'steps': 2406, 'loss/train': 2.7909488677978516} -09/20/2021 22:49:45 - INFO - __main__ - Step 38513: {'lr': 0.00019944191810985693, 'samples': 1232416, 'steps': 2407, 'loss/train': 0.6624940633773804} -09/20/2021 22:49:45 - INFO - __main__ - Step 38514: {'lr': 0.00019944191810985693, 'samples': 1232448, 'steps': 2407, 'loss/train': 2.7455172538757324} -09/20/2021 22:49:46 - INFO - __main__ - Step 38515: {'lr': 0.00019944191810985693, 'samples': 1232480, 'steps': 2407, 'loss/train': 2.5259408950805664} -09/20/2021 22:49:47 - INFO - __main__ - Step 38516: {'lr': 0.00019944191810985693, 'samples': 1232512, 'steps': 2407, 'loss/train': 2.6879820823669434} -09/20/2021 22:49:48 - INFO - __main__ - Step 38517: {'lr': 0.00019944191810985693, 'samples': 1232544, 'steps': 2407, 'loss/train': 1.7084707021713257} -09/20/2021 22:49:49 - INFO - __main__ - Step 38518: {'lr': 0.00019944191810985693, 'samples': 1232576, 'steps': 2407, 'loss/train': 2.2628488540649414} -09/20/2021 22:49:50 - INFO - __main__ - Step 38519: {'lr': 0.00019944191810985693, 'samples': 1232608, 'steps': 2407, 'loss/train': 2.074462413787842} -09/20/2021 22:49:51 - INFO - __main__ - Step 38520: {'lr': 0.00019944191810985693, 'samples': 1232640, 'steps': 2407, 'loss/train': 2.1053531169891357} -09/20/2021 22:49:51 - INFO - __main__ - Step 38521: {'lr': 0.00019944191810985693, 'samples': 1232672, 'steps': 2407, 'loss/train': 3.871722936630249} -09/20/2021 22:49:52 - INFO - __main__ - Step 38522: {'lr': 0.00019944191810985693, 'samples': 1232704, 'steps': 2407, 'loss/train': 2.0755856037139893} -09/20/2021 22:49:53 - INFO - __main__ - Step 38523: {'lr': 0.00019944191810985693, 'samples': 1232736, 'steps': 2407, 'loss/train': 2.011399745941162} -09/20/2021 22:49:54 - INFO - __main__ - Step 38524: {'lr': 0.00019944191810985693, 'samples': 1232768, 'steps': 2407, 'loss/train': 1.4953633546829224} -09/20/2021 22:49:54 - INFO - __main__ - Step 38525: {'lr': 0.00019944191810985693, 'samples': 1232800, 'steps': 2407, 'loss/train': 0.1952272653579712} -09/20/2021 22:49:55 - INFO - __main__ - Step 38526: {'lr': 0.00019944191810985693, 'samples': 1232832, 'steps': 2407, 'loss/train': 0.10323891043663025} -09/20/2021 22:49:56 - INFO - __main__ - Step 38527: {'lr': 0.00019944191810985693, 'samples': 1232864, 'steps': 2407, 'loss/train': 0.2918945550918579} -09/20/2021 22:49:57 - INFO - __main__ - Step 38528: {'lr': 0.00019944191810985693, 'samples': 1232896, 'steps': 2407, 'loss/train': 1.9939031600952148} -09/20/2021 22:49:57 - INFO - __main__ - Step 38529: {'lr': 0.00019944124492961, 'samples': 1232928, 'steps': 2408, 'loss/train': 1.0527215003967285} -09/20/2021 22:49:58 - INFO - __main__ - Step 38530: {'lr': 0.00019944124492961, 'samples': 1232960, 'steps': 2408, 'loss/train': 2.300264835357666} -09/20/2021 22:49:59 - INFO - __main__ - Step 38531: {'lr': 0.00019944124492961, 'samples': 1232992, 'steps': 2408, 'loss/train': 2.1938650608062744} -09/20/2021 22:50:00 - INFO - __main__ - Step 38532: {'lr': 0.00019944124492961, 'samples': 1233024, 'steps': 2408, 'loss/train': 2.2587039470672607} -09/20/2021 22:50:00 - INFO - __main__ - Step 38533: {'lr': 0.00019944124492961, 'samples': 1233056, 'steps': 2408, 'loss/train': 2.534527063369751} -09/20/2021 22:50:01 - INFO - __main__ - Step 38534: {'lr': 0.00019944124492961, 'samples': 1233088, 'steps': 2408, 'loss/train': 2.004249334335327} -09/20/2021 22:50:02 - INFO - __main__ - Step 38535: {'lr': 0.00019944124492961, 'samples': 1233120, 'steps': 2408, 'loss/train': 2.7898736000061035} -09/20/2021 22:50:03 - INFO - __main__ - Step 38536: {'lr': 0.00019944124492961, 'samples': 1233152, 'steps': 2408, 'loss/train': 3.1568984985351562} -09/20/2021 22:50:03 - INFO - __main__ - Step 38537: {'lr': 0.00019944124492961, 'samples': 1233184, 'steps': 2408, 'loss/train': 2.434108257293701} -09/20/2021 22:50:04 - INFO - __main__ - Step 38538: {'lr': 0.00019944124492961, 'samples': 1233216, 'steps': 2408, 'loss/train': 2.6442902088165283} -09/20/2021 22:50:05 - INFO - __main__ - Step 38539: {'lr': 0.00019944124492961, 'samples': 1233248, 'steps': 2408, 'loss/train': 1.3366681337356567} -09/20/2021 22:50:06 - INFO - __main__ - Step 38540: {'lr': 0.00019944124492961, 'samples': 1233280, 'steps': 2408, 'loss/train': 2.218970537185669} -09/20/2021 22:50:06 - INFO - __main__ - Step 38541: {'lr': 0.00019944124492961, 'samples': 1233312, 'steps': 2408, 'loss/train': 2.4467506408691406} -09/20/2021 22:50:07 - INFO - __main__ - Step 38542: {'lr': 0.00019944124492961, 'samples': 1233344, 'steps': 2408, 'loss/train': 1.6638683080673218} -09/20/2021 22:50:08 - INFO - __main__ - Step 38543: {'lr': 0.00019944124492961, 'samples': 1233376, 'steps': 2408, 'loss/train': 3.095461368560791} -09/20/2021 22:50:09 - INFO - __main__ - Step 38544: {'lr': 0.00019944124492961, 'samples': 1233408, 'steps': 2408, 'loss/train': 1.2573131322860718} -09/20/2021 22:50:10 - INFO - __main__ - Step 38545: {'lr': 0.000199440571344737, 'samples': 1233440, 'steps': 2409, 'loss/train': 2.440164804458618} -09/20/2021 22:50:10 - INFO - __main__ - Step 38546: {'lr': 0.000199440571344737, 'samples': 1233472, 'steps': 2409, 'loss/train': 1.549380898475647} -09/20/2021 22:50:11 - INFO - __main__ - Step 38547: {'lr': 0.000199440571344737, 'samples': 1233504, 'steps': 2409, 'loss/train': 2.7982001304626465} -09/20/2021 22:50:12 - INFO - __main__ - Step 38548: {'lr': 0.000199440571344737, 'samples': 1233536, 'steps': 2409, 'loss/train': 1.05253005027771} -09/20/2021 22:50:13 - INFO - __main__ - Step 38549: {'lr': 0.000199440571344737, 'samples': 1233568, 'steps': 2409, 'loss/train': 1.8208035230636597} -09/20/2021 22:50:14 - INFO - __main__ - Step 38550: {'lr': 0.000199440571344737, 'samples': 1233600, 'steps': 2409, 'loss/train': 2.762392997741699} -09/20/2021 22:50:15 - INFO - __main__ - Step 38551: {'lr': 0.000199440571344737, 'samples': 1233632, 'steps': 2409, 'loss/train': 0.4922037720680237} -09/20/2021 22:50:15 - INFO - __main__ - Step 38552: {'lr': 0.000199440571344737, 'samples': 1233664, 'steps': 2409, 'loss/train': 1.0676747560501099} -09/20/2021 22:50:16 - INFO - __main__ - Step 38553: {'lr': 0.000199440571344737, 'samples': 1233696, 'steps': 2409, 'loss/train': 0.9509314894676208} -09/20/2021 22:50:17 - INFO - __main__ - Step 38554: {'lr': 0.000199440571344737, 'samples': 1233728, 'steps': 2409, 'loss/train': 1.525402307510376} -09/20/2021 22:50:18 - INFO - __main__ - Step 38555: {'lr': 0.000199440571344737, 'samples': 1233760, 'steps': 2409, 'loss/train': 2.0912249088287354} -09/20/2021 22:50:18 - INFO - __main__ - Step 38556: {'lr': 0.000199440571344737, 'samples': 1233792, 'steps': 2409, 'loss/train': 2.3600499629974365} -09/20/2021 22:50:19 - INFO - __main__ - Step 38557: {'lr': 0.000199440571344737, 'samples': 1233824, 'steps': 2409, 'loss/train': 2.1975913047790527} -09/20/2021 22:50:20 - INFO - __main__ - Step 38558: {'lr': 0.000199440571344737, 'samples': 1233856, 'steps': 2409, 'loss/train': 2.0312747955322266} -09/20/2021 22:50:21 - INFO - __main__ - Step 38559: {'lr': 0.000199440571344737, 'samples': 1233888, 'steps': 2409, 'loss/train': 2.302649736404419} -09/20/2021 22:50:21 - INFO - __main__ - Step 38560: {'lr': 0.000199440571344737, 'samples': 1233920, 'steps': 2409, 'loss/train': 1.7377865314483643} -09/20/2021 22:50:22 - INFO - __main__ - Step 38561: {'lr': 0.00019943989735524075, 'samples': 1233952, 'steps': 2410, 'loss/train': 2.2772862911224365} -09/20/2021 22:50:23 - INFO - __main__ - Step 38562: {'lr': 0.00019943989735524075, 'samples': 1233984, 'steps': 2410, 'loss/train': 2.1996302604675293} -09/20/2021 22:50:24 - INFO - __main__ - Step 38563: {'lr': 0.00019943989735524075, 'samples': 1234016, 'steps': 2410, 'loss/train': 1.5823525190353394} -09/20/2021 22:50:24 - INFO - __main__ - Step 38564: {'lr': 0.00019943989735524075, 'samples': 1234048, 'steps': 2410, 'loss/train': 1.3685346841812134} -09/20/2021 22:50:25 - INFO - __main__ - Step 38565: {'lr': 0.00019943989735524075, 'samples': 1234080, 'steps': 2410, 'loss/train': 2.6102356910705566} -09/20/2021 22:50:26 - INFO - __main__ - Step 38566: {'lr': 0.00019943989735524075, 'samples': 1234112, 'steps': 2410, 'loss/train': 1.547286868095398} -09/20/2021 22:50:27 - INFO - __main__ - Step 38567: {'lr': 0.00019943989735524075, 'samples': 1234144, 'steps': 2410, 'loss/train': 2.1767544746398926} -09/20/2021 22:50:27 - INFO - __main__ - Step 38568: {'lr': 0.00019943989735524075, 'samples': 1234176, 'steps': 2410, 'loss/train': 2.295900583267212} -09/20/2021 22:50:28 - INFO - __main__ - Step 38569: {'lr': 0.00019943989735524075, 'samples': 1234208, 'steps': 2410, 'loss/train': 1.3034719228744507} -09/20/2021 22:50:29 - INFO - __main__ - Step 38570: {'lr': 0.00019943989735524075, 'samples': 1234240, 'steps': 2410, 'loss/train': 1.8152172565460205} -09/20/2021 22:50:30 - INFO - __main__ - Step 38571: {'lr': 0.00019943989735524075, 'samples': 1234272, 'steps': 2410, 'loss/train': 3.239763021469116} -09/20/2021 22:50:30 - INFO - __main__ - Step 38572: {'lr': 0.00019943989735524075, 'samples': 1234304, 'steps': 2410, 'loss/train': 2.177530527114868} -09/20/2021 22:50:31 - INFO - __main__ - Step 38573: {'lr': 0.00019943989735524075, 'samples': 1234336, 'steps': 2410, 'loss/train': 1.0147825479507446} -09/20/2021 22:50:32 - INFO - __main__ - Step 38574: {'lr': 0.00019943989735524075, 'samples': 1234368, 'steps': 2410, 'loss/train': 2.0276668071746826} -09/20/2021 22:50:33 - INFO - __main__ - Step 38575: {'lr': 0.00019943989735524075, 'samples': 1234400, 'steps': 2410, 'loss/train': 1.4507544040679932} -09/20/2021 22:50:33 - INFO - __main__ - Step 38576: {'lr': 0.00019943989735524075, 'samples': 1234432, 'steps': 2410, 'loss/train': 2.161832571029663} -09/20/2021 22:50:34 - INFO - __main__ - Step 38577: {'lr': 0.0001994392229611239, 'samples': 1234464, 'steps': 2411, 'loss/train': 1.9360735416412354} -09/20/2021 22:50:35 - INFO - __main__ - Step 38578: {'lr': 0.0001994392229611239, 'samples': 1234496, 'steps': 2411, 'loss/train': 1.0233958959579468} -09/20/2021 22:50:37 - INFO - __main__ - Step 38579: {'lr': 0.0001994392229611239, 'samples': 1234528, 'steps': 2411, 'loss/train': 2.5698909759521484} -09/20/2021 22:50:37 - INFO - __main__ - Step 38580: {'lr': 0.0001994392229611239, 'samples': 1234560, 'steps': 2411, 'loss/train': 2.500319242477417} -09/20/2021 22:50:38 - INFO - __main__ - Step 38581: {'lr': 0.0001994392229611239, 'samples': 1234592, 'steps': 2411, 'loss/train': 1.2080495357513428} -09/20/2021 22:50:39 - INFO - __main__ - Step 38582: {'lr': 0.0001994392229611239, 'samples': 1234624, 'steps': 2411, 'loss/train': 2.4999096393585205} -09/20/2021 22:50:40 - INFO - __main__ - Step 38583: {'lr': 0.0001994392229611239, 'samples': 1234656, 'steps': 2411, 'loss/train': 2.3204567432403564} -09/20/2021 22:50:40 - INFO - __main__ - Step 38584: {'lr': 0.0001994392229611239, 'samples': 1234688, 'steps': 2411, 'loss/train': 1.7856237888336182} -09/20/2021 22:50:41 - INFO - __main__ - Step 38585: {'lr': 0.0001994392229611239, 'samples': 1234720, 'steps': 2411, 'loss/train': 2.2805726528167725} -09/20/2021 22:50:42 - INFO - __main__ - Step 38586: {'lr': 0.0001994392229611239, 'samples': 1234752, 'steps': 2411, 'loss/train': 1.8901342153549194} -09/20/2021 22:50:43 - INFO - __main__ - Step 38587: {'lr': 0.0001994392229611239, 'samples': 1234784, 'steps': 2411, 'loss/train': 2.2892940044403076} -09/20/2021 22:50:43 - INFO - __main__ - Step 38588: {'lr': 0.0001994392229611239, 'samples': 1234816, 'steps': 2411, 'loss/train': 1.5360651016235352} -09/20/2021 22:50:44 - INFO - __main__ - Step 38589: {'lr': 0.0001994392229611239, 'samples': 1234848, 'steps': 2411, 'loss/train': 2.6852195262908936} -09/20/2021 22:50:45 - INFO - __main__ - Step 38590: {'lr': 0.0001994392229611239, 'samples': 1234880, 'steps': 2411, 'loss/train': 2.2525081634521484} -09/20/2021 22:50:46 - INFO - __main__ - Step 38591: {'lr': 0.0001994392229611239, 'samples': 1234912, 'steps': 2411, 'loss/train': 1.836268424987793} -09/20/2021 22:50:46 - INFO - __main__ - Step 38592: {'lr': 0.0001994392229611239, 'samples': 1234944, 'steps': 2411, 'loss/train': 1.83729088306427} -09/20/2021 22:50:47 - INFO - __main__ - Step 38593: {'lr': 0.00019943854816238926, 'samples': 1234976, 'steps': 2412, 'loss/train': 2.0786805152893066} -09/20/2021 22:50:48 - INFO - __main__ - Step 38594: {'lr': 0.00019943854816238926, 'samples': 1235008, 'steps': 2412, 'loss/train': 2.2572824954986572} -09/20/2021 22:50:49 - INFO - __main__ - Step 38595: {'lr': 0.00019943854816238926, 'samples': 1235040, 'steps': 2412, 'loss/train': 1.2469068765640259} -09/20/2021 22:50:49 - INFO - __main__ - Step 38596: {'lr': 0.00019943854816238926, 'samples': 1235072, 'steps': 2412, 'loss/train': 2.2582738399505615} -09/20/2021 22:50:50 - INFO - __main__ - Step 38597: {'lr': 0.00019943854816238926, 'samples': 1235104, 'steps': 2412, 'loss/train': 1.7085729837417603} -09/20/2021 22:50:51 - INFO - __main__ - Step 38598: {'lr': 0.00019943854816238926, 'samples': 1235136, 'steps': 2412, 'loss/train': 2.4674582481384277} -09/20/2021 22:50:52 - INFO - __main__ - Step 38599: {'lr': 0.00019943854816238926, 'samples': 1235168, 'steps': 2412, 'loss/train': 2.231276273727417} -09/20/2021 22:50:52 - INFO - __main__ - Step 38600: {'lr': 0.00019943854816238926, 'samples': 1235200, 'steps': 2412, 'loss/train': 1.790772557258606} -09/20/2021 22:50:53 - INFO - __main__ - Step 38601: {'lr': 0.00019943854816238926, 'samples': 1235232, 'steps': 2412, 'loss/train': 0.9732401967048645} -09/20/2021 22:50:54 - INFO - __main__ - Step 38602: {'lr': 0.00019943854816238926, 'samples': 1235264, 'steps': 2412, 'loss/train': 2.934387683868408} -09/20/2021 22:50:55 - INFO - __main__ - Step 38603: {'lr': 0.00019943854816238926, 'samples': 1235296, 'steps': 2412, 'loss/train': 2.173046827316284} -09/20/2021 22:50:55 - INFO - __main__ - Step 38604: {'lr': 0.00019943854816238926, 'samples': 1235328, 'steps': 2412, 'loss/train': 2.3887851238250732} -09/20/2021 22:50:56 - INFO - __main__ - Step 38605: {'lr': 0.00019943854816238926, 'samples': 1235360, 'steps': 2412, 'loss/train': 3.630993604660034} -09/20/2021 22:50:57 - INFO - __main__ - Step 38606: {'lr': 0.00019943854816238926, 'samples': 1235392, 'steps': 2412, 'loss/train': 3.697709798812866} -09/20/2021 22:50:58 - INFO - __main__ - Step 38607: {'lr': 0.00019943854816238926, 'samples': 1235424, 'steps': 2412, 'loss/train': 3.3328566551208496} -09/20/2021 22:50:58 - INFO - __main__ - Step 38608: {'lr': 0.00019943854816238926, 'samples': 1235456, 'steps': 2412, 'loss/train': 3.4021615982055664} -09/20/2021 22:50:59 - INFO - __main__ - Step 38609: {'lr': 0.00019943787295903954, 'samples': 1235488, 'steps': 2413, 'loss/train': 4.70005464553833} -09/20/2021 22:51:02 - INFO - __main__ - Step 38610: {'lr': 0.00019943787295903954, 'samples': 1235520, 'steps': 2413, 'loss/train': 2.4273762702941895} -09/20/2021 22:51:02 - INFO - __main__ - Step 38611: {'lr': 0.00019943787295903954, 'samples': 1235552, 'steps': 2413, 'loss/train': 1.164976716041565} -09/20/2021 22:51:03 - INFO - __main__ - Step 38612: {'lr': 0.00019943787295903954, 'samples': 1235584, 'steps': 2413, 'loss/train': 2.3832626342773438} -09/20/2021 22:51:04 - INFO - __main__ - Step 38613: {'lr': 0.00019943787295903954, 'samples': 1235616, 'steps': 2413, 'loss/train': 2.2803707122802734} -09/20/2021 22:51:05 - INFO - __main__ - Step 38614: {'lr': 0.00019943787295903954, 'samples': 1235648, 'steps': 2413, 'loss/train': 2.5498476028442383} -09/20/2021 22:51:05 - INFO - __main__ - Step 38615: {'lr': 0.00019943787295903954, 'samples': 1235680, 'steps': 2413, 'loss/train': 0.195208340883255} -09/20/2021 22:51:06 - INFO - __main__ - Step 38616: {'lr': 0.00019943787295903954, 'samples': 1235712, 'steps': 2413, 'loss/train': 0.3395998775959015} -09/20/2021 22:51:07 - INFO - __main__ - Step 38617: {'lr': 0.00019943787295903954, 'samples': 1235744, 'steps': 2413, 'loss/train': 0.12741757929325104} -09/20/2021 22:51:08 - INFO - __main__ - Step 38618: {'lr': 0.00019943787295903954, 'samples': 1235776, 'steps': 2413, 'loss/train': 1.6069672107696533} -09/20/2021 22:51:08 - INFO - __main__ - Step 38619: {'lr': 0.00019943787295903954, 'samples': 1235808, 'steps': 2413, 'loss/train': 1.953700065612793} -09/20/2021 22:51:09 - INFO - __main__ - Step 38620: {'lr': 0.00019943787295903954, 'samples': 1235840, 'steps': 2413, 'loss/train': 3.093606472015381} -09/20/2021 22:51:10 - INFO - __main__ - Step 38621: {'lr': 0.00019943787295903954, 'samples': 1235872, 'steps': 2413, 'loss/train': 3.004749298095703} -09/20/2021 22:51:11 - INFO - __main__ - Step 38622: {'lr': 0.00019943787295903954, 'samples': 1235904, 'steps': 2413, 'loss/train': 2.5857882499694824} -09/20/2021 22:51:11 - INFO - __main__ - Step 38623: {'lr': 0.00019943787295903954, 'samples': 1235936, 'steps': 2413, 'loss/train': 2.3025078773498535} -09/20/2021 22:51:12 - INFO - __main__ - Step 38624: {'lr': 0.00019943787295903954, 'samples': 1235968, 'steps': 2413, 'loss/train': 1.4899251461029053} -09/20/2021 22:51:13 - INFO - __main__ - Step 38625: {'lr': 0.0001994371973510775, 'samples': 1236000, 'steps': 2414, 'loss/train': 2.3568227291107178} -09/20/2021 22:51:14 - INFO - __main__ - Step 38626: {'lr': 0.0001994371973510775, 'samples': 1236032, 'steps': 2414, 'loss/train': 1.672200322151184} -09/20/2021 22:51:14 - INFO - __main__ - Step 38627: {'lr': 0.0001994371973510775, 'samples': 1236064, 'steps': 2414, 'loss/train': 1.7059258222579956} -09/20/2021 22:51:15 - INFO - __main__ - Step 38628: {'lr': 0.0001994371973510775, 'samples': 1236096, 'steps': 2414, 'loss/train': 1.5723381042480469} -09/20/2021 22:51:16 - INFO - __main__ - Step 38629: {'lr': 0.0001994371973510775, 'samples': 1236128, 'steps': 2414, 'loss/train': 1.8000197410583496} -09/20/2021 22:51:17 - INFO - __main__ - Step 38630: {'lr': 0.0001994371973510775, 'samples': 1236160, 'steps': 2414, 'loss/train': 2.2145838737487793} -09/20/2021 22:51:17 - INFO - __main__ - Step 38631: {'lr': 0.0001994371973510775, 'samples': 1236192, 'steps': 2414, 'loss/train': 2.311958074569702} -09/20/2021 22:51:18 - INFO - __main__ - Step 38632: {'lr': 0.0001994371973510775, 'samples': 1236224, 'steps': 2414, 'loss/train': 1.8054938316345215} -09/20/2021 22:51:19 - INFO - __main__ - Step 38633: {'lr': 0.0001994371973510775, 'samples': 1236256, 'steps': 2414, 'loss/train': 1.3824265003204346} -09/20/2021 22:51:20 - INFO - __main__ - Step 38634: {'lr': 0.0001994371973510775, 'samples': 1236288, 'steps': 2414, 'loss/train': 1.7376383543014526} -09/20/2021 22:51:20 - INFO - __main__ - Step 38635: {'lr': 0.0001994371973510775, 'samples': 1236320, 'steps': 2414, 'loss/train': 1.3442918062210083} -09/20/2021 22:51:21 - INFO - __main__ - Step 38636: {'lr': 0.0001994371973510775, 'samples': 1236352, 'steps': 2414, 'loss/train': 1.4884053468704224} -09/20/2021 22:51:22 - INFO - __main__ - Step 38637: {'lr': 0.0001994371973510775, 'samples': 1236384, 'steps': 2414, 'loss/train': 1.5004663467407227} -09/20/2021 22:51:23 - INFO - __main__ - Step 38638: {'lr': 0.0001994371973510775, 'samples': 1236416, 'steps': 2414, 'loss/train': 1.6488423347473145} -09/20/2021 22:51:23 - INFO - __main__ - Step 38639: {'lr': 0.0001994371973510775, 'samples': 1236448, 'steps': 2414, 'loss/train': 1.3747142553329468} -09/20/2021 22:51:24 - INFO - __main__ - Step 38640: {'lr': 0.0001994371973510775, 'samples': 1236480, 'steps': 2414, 'loss/train': 1.6376279592514038} -09/20/2021 22:51:25 - INFO - __main__ - Step 38641: {'lr': 0.0001994365213385059, 'samples': 1236512, 'steps': 2415, 'loss/train': 1.2115036249160767} -09/20/2021 22:51:26 - INFO - __main__ - Step 38642: {'lr': 0.0001994365213385059, 'samples': 1236544, 'steps': 2415, 'loss/train': 1.1712599992752075} -09/20/2021 22:51:27 - INFO - __main__ - Step 38643: {'lr': 0.0001994365213385059, 'samples': 1236576, 'steps': 2415, 'loss/train': 1.1033422946929932} -09/20/2021 22:51:27 - INFO - __main__ - Step 38644: {'lr': 0.0001994365213385059, 'samples': 1236608, 'steps': 2415, 'loss/train': 1.236196756362915} -09/20/2021 22:51:28 - INFO - __main__ - Step 38645: {'lr': 0.0001994365213385059, 'samples': 1236640, 'steps': 2415, 'loss/train': 0.9928369522094727} -09/20/2021 22:51:29 - INFO - __main__ - Step 38646: {'lr': 0.0001994365213385059, 'samples': 1236672, 'steps': 2415, 'loss/train': 1.2257143259048462} -09/20/2021 22:51:30 - INFO - __main__ - Step 38647: {'lr': 0.0001994365213385059, 'samples': 1236704, 'steps': 2415, 'loss/train': 1.495031476020813} -09/20/2021 22:51:30 - INFO - __main__ - Step 38648: {'lr': 0.0001994365213385059, 'samples': 1236736, 'steps': 2415, 'loss/train': 2.791499137878418} -09/20/2021 22:51:32 - INFO - __main__ - Step 38649: {'lr': 0.0001994365213385059, 'samples': 1236768, 'steps': 2415, 'loss/train': 1.8403133153915405} -09/20/2021 22:51:32 - INFO - __main__ - Step 38650: {'lr': 0.0001994365213385059, 'samples': 1236800, 'steps': 2415, 'loss/train': 2.4485552310943604} -09/20/2021 22:51:33 - INFO - __main__ - Step 38651: {'lr': 0.0001994365213385059, 'samples': 1236832, 'steps': 2415, 'loss/train': 2.6159520149230957} -09/20/2021 22:51:34 - INFO - __main__ - Step 38652: {'lr': 0.0001994365213385059, 'samples': 1236864, 'steps': 2415, 'loss/train': 2.055665969848633} -09/20/2021 22:51:35 - INFO - __main__ - Step 38653: {'lr': 0.0001994365213385059, 'samples': 1236896, 'steps': 2415, 'loss/train': 2.201991081237793} -09/20/2021 22:51:35 - INFO - __main__ - Step 38654: {'lr': 0.0001994365213385059, 'samples': 1236928, 'steps': 2415, 'loss/train': 2.8489041328430176} -09/20/2021 22:51:36 - INFO - __main__ - Step 38655: {'lr': 0.0001994365213385059, 'samples': 1236960, 'steps': 2415, 'loss/train': 2.3317368030548096} -09/20/2021 22:51:37 - INFO - __main__ - Step 38656: {'lr': 0.0001994365213385059, 'samples': 1236992, 'steps': 2415, 'loss/train': 1.4168754816055298} -09/20/2021 22:51:38 - INFO - __main__ - Step 38657: {'lr': 0.0001994358449213275, 'samples': 1237024, 'steps': 2416, 'loss/train': 2.0747361183166504} -09/20/2021 22:51:39 - INFO - __main__ - Step 38658: {'lr': 0.0001994358449213275, 'samples': 1237056, 'steps': 2416, 'loss/train': 2.3002333641052246} -09/20/2021 22:51:39 - INFO - __main__ - Step 38659: {'lr': 0.0001994358449213275, 'samples': 1237088, 'steps': 2416, 'loss/train': 3.125584363937378} -09/20/2021 22:51:40 - INFO - __main__ - Step 38660: {'lr': 0.0001994358449213275, 'samples': 1237120, 'steps': 2416, 'loss/train': 1.8160040378570557} -09/20/2021 22:51:41 - INFO - __main__ - Step 38661: {'lr': 0.0001994358449213275, 'samples': 1237152, 'steps': 2416, 'loss/train': 1.7684714794158936} -09/20/2021 22:51:42 - INFO - __main__ - Step 38662: {'lr': 0.0001994358449213275, 'samples': 1237184, 'steps': 2416, 'loss/train': 1.690813660621643} -09/20/2021 22:51:42 - INFO - __main__ - Step 38663: {'lr': 0.0001994358449213275, 'samples': 1237216, 'steps': 2416, 'loss/train': 2.1156904697418213} -09/20/2021 22:51:43 - INFO - __main__ - Step 38664: {'lr': 0.0001994358449213275, 'samples': 1237248, 'steps': 2416, 'loss/train': 2.17768931388855} -09/20/2021 22:51:44 - INFO - __main__ - Step 38665: {'lr': 0.0001994358449213275, 'samples': 1237280, 'steps': 2416, 'loss/train': 1.215514063835144} -09/20/2021 22:51:45 - INFO - __main__ - Step 38666: {'lr': 0.0001994358449213275, 'samples': 1237312, 'steps': 2416, 'loss/train': 2.7089874744415283} -09/20/2021 22:51:45 - INFO - __main__ - Step 38667: {'lr': 0.0001994358449213275, 'samples': 1237344, 'steps': 2416, 'loss/train': 1.302564024925232} -09/20/2021 22:51:46 - INFO - __main__ - Step 38668: {'lr': 0.0001994358449213275, 'samples': 1237376, 'steps': 2416, 'loss/train': 3.1711196899414062} -09/20/2021 22:51:47 - INFO - __main__ - Step 38669: {'lr': 0.0001994358449213275, 'samples': 1237408, 'steps': 2416, 'loss/train': 2.8423190116882324} -09/20/2021 22:51:48 - INFO - __main__ - Step 38670: {'lr': 0.0001994358449213275, 'samples': 1237440, 'steps': 2416, 'loss/train': 2.5581345558166504} -09/20/2021 22:51:48 - INFO - __main__ - Step 38671: {'lr': 0.0001994358449213275, 'samples': 1237472, 'steps': 2416, 'loss/train': 2.4995057582855225} -09/20/2021 22:51:49 - INFO - __main__ - Step 38672: {'lr': 0.0001994358449213275, 'samples': 1237504, 'steps': 2416, 'loss/train': 1.841124176979065} -09/20/2021 22:51:50 - INFO - __main__ - Step 38673: {'lr': 0.00019943516809954498, 'samples': 1237536, 'steps': 2417, 'loss/train': 1.8249095678329468} -09/20/2021 22:51:51 - INFO - __main__ - Step 38674: {'lr': 0.00019943516809954498, 'samples': 1237568, 'steps': 2417, 'loss/train': 1.7910771369934082} -09/20/2021 22:51:51 - INFO - __main__ - Step 38675: {'lr': 0.00019943516809954498, 'samples': 1237600, 'steps': 2417, 'loss/train': 1.378029227256775} -09/20/2021 22:51:52 - INFO - __main__ - Step 38676: {'lr': 0.00019943516809954498, 'samples': 1237632, 'steps': 2417, 'loss/train': 2.3673770427703857} -09/20/2021 22:51:53 - INFO - __main__ - Step 38677: {'lr': 0.00019943516809954498, 'samples': 1237664, 'steps': 2417, 'loss/train': 1.62478768825531} -09/20/2021 22:51:54 - INFO - __main__ - Step 38678: {'lr': 0.00019943516809954498, 'samples': 1237696, 'steps': 2417, 'loss/train': 3.0184617042541504} -09/20/2021 22:51:54 - INFO - __main__ - Step 38679: {'lr': 0.00019943516809954498, 'samples': 1237728, 'steps': 2417, 'loss/train': 1.8596465587615967} -09/20/2021 22:51:56 - INFO - __main__ - Step 38680: {'lr': 0.00019943516809954498, 'samples': 1237760, 'steps': 2417, 'loss/train': 2.5235092639923096} -09/20/2021 22:51:56 - INFO - __main__ - Step 38681: {'lr': 0.00019943516809954498, 'samples': 1237792, 'steps': 2417, 'loss/train': 1.386931300163269} -09/20/2021 22:51:57 - INFO - __main__ - Step 38682: {'lr': 0.00019943516809954498, 'samples': 1237824, 'steps': 2417, 'loss/train': 1.5846067667007446} -09/20/2021 22:51:58 - INFO - __main__ - Step 38683: {'lr': 0.00019943516809954498, 'samples': 1237856, 'steps': 2417, 'loss/train': 2.441650152206421} -09/20/2021 22:51:59 - INFO - __main__ - Step 38684: {'lr': 0.00019943516809954498, 'samples': 1237888, 'steps': 2417, 'loss/train': 1.150457501411438} -09/20/2021 22:51:59 - INFO - __main__ - Step 38685: {'lr': 0.00019943516809954498, 'samples': 1237920, 'steps': 2417, 'loss/train': 2.162627696990967} -09/20/2021 22:52:00 - INFO - __main__ - Step 38686: {'lr': 0.00019943516809954498, 'samples': 1237952, 'steps': 2417, 'loss/train': 5.24540901184082} -09/20/2021 22:52:01 - INFO - __main__ - Step 38687: {'lr': 0.00019943516809954498, 'samples': 1237984, 'steps': 2417, 'loss/train': 2.1296069622039795} -09/20/2021 22:52:02 - INFO - __main__ - Step 38688: {'lr': 0.00019943516809954498, 'samples': 1238016, 'steps': 2417, 'loss/train': 1.590425968170166} -09/20/2021 22:52:03 - INFO - __main__ - Step 38689: {'lr': 0.00019943449087316117, 'samples': 1238048, 'steps': 2418, 'loss/train': 1.5895746946334839} -09/20/2021 22:52:03 - INFO - __main__ - Step 38690: {'lr': 0.00019943449087316117, 'samples': 1238080, 'steps': 2418, 'loss/train': 2.1723368167877197} -09/20/2021 22:52:04 - INFO - __main__ - Step 38691: {'lr': 0.00019943449087316117, 'samples': 1238112, 'steps': 2418, 'loss/train': 3.0008928775787354} -09/20/2021 22:52:05 - INFO - __main__ - Step 38692: {'lr': 0.00019943449087316117, 'samples': 1238144, 'steps': 2418, 'loss/train': 2.217872381210327} -09/20/2021 22:52:06 - INFO - __main__ - Step 38693: {'lr': 0.00019943449087316117, 'samples': 1238176, 'steps': 2418, 'loss/train': 2.106553077697754} -09/20/2021 22:52:06 - INFO - __main__ - Step 38694: {'lr': 0.00019943449087316117, 'samples': 1238208, 'steps': 2418, 'loss/train': 2.683635950088501} -09/20/2021 22:52:07 - INFO - __main__ - Step 38695: {'lr': 0.00019943449087316117, 'samples': 1238240, 'steps': 2418, 'loss/train': 1.661390781402588} -09/20/2021 22:52:08 - INFO - __main__ - Step 38696: {'lr': 0.00019943449087316117, 'samples': 1238272, 'steps': 2418, 'loss/train': 1.8555974960327148} -09/20/2021 22:52:09 - INFO - __main__ - Step 38697: {'lr': 0.00019943449087316117, 'samples': 1238304, 'steps': 2418, 'loss/train': 2.5457510948181152} -09/20/2021 22:52:09 - INFO - __main__ - Step 38698: {'lr': 0.00019943449087316117, 'samples': 1238336, 'steps': 2418, 'loss/train': 1.9373332262039185} -09/20/2021 22:52:10 - INFO - __main__ - Step 38699: {'lr': 0.00019943449087316117, 'samples': 1238368, 'steps': 2418, 'loss/train': 2.931009531021118} -09/20/2021 22:52:11 - INFO - __main__ - Step 38700: {'lr': 0.00019943449087316117, 'samples': 1238400, 'steps': 2418, 'loss/train': 1.4369025230407715} -09/20/2021 22:52:12 - INFO - __main__ - Step 38701: {'lr': 0.00019943449087316117, 'samples': 1238432, 'steps': 2418, 'loss/train': 2.075230836868286} -09/20/2021 22:52:12 - INFO - __main__ - Step 38702: {'lr': 0.00019943449087316117, 'samples': 1238464, 'steps': 2418, 'loss/train': 2.328461170196533} -09/20/2021 22:52:13 - INFO - __main__ - Step 38703: {'lr': 0.00019943449087316117, 'samples': 1238496, 'steps': 2418, 'loss/train': 1.9358429908752441} -09/20/2021 22:52:14 - INFO - __main__ - Step 38704: {'lr': 0.00019943449087316117, 'samples': 1238528, 'steps': 2418, 'loss/train': 0.5835780501365662} -09/20/2021 22:52:15 - INFO - __main__ - Step 38705: {'lr': 0.0001994338132421788, 'samples': 1238560, 'steps': 2419, 'loss/train': 1.711938500404358} -09/20/2021 22:52:15 - INFO - __main__ - Step 38706: {'lr': 0.0001994338132421788, 'samples': 1238592, 'steps': 2419, 'loss/train': 2.287417411804199} -09/20/2021 22:52:16 - INFO - __main__ - Step 38707: {'lr': 0.0001994338132421788, 'samples': 1238624, 'steps': 2419, 'loss/train': 3.0230188369750977} -09/20/2021 22:52:17 - INFO - __main__ - Step 38708: {'lr': 0.0001994338132421788, 'samples': 1238656, 'steps': 2419, 'loss/train': 1.9887752532958984} -09/20/2021 22:52:18 - INFO - __main__ - Step 38709: {'lr': 0.0001994338132421788, 'samples': 1238688, 'steps': 2419, 'loss/train': 1.1363519430160522} -09/20/2021 22:52:18 - INFO - __main__ - Step 38710: {'lr': 0.0001994338132421788, 'samples': 1238720, 'steps': 2419, 'loss/train': 0.7342553734779358} -09/20/2021 22:52:20 - INFO - __main__ - Step 38711: {'lr': 0.0001994338132421788, 'samples': 1238752, 'steps': 2419, 'loss/train': 2.4318430423736572} -09/20/2021 22:52:21 - INFO - __main__ - Step 38712: {'lr': 0.0001994338132421788, 'samples': 1238784, 'steps': 2419, 'loss/train': 1.9761394262313843} -09/20/2021 22:52:21 - INFO - __main__ - Step 38713: {'lr': 0.0001994338132421788, 'samples': 1238816, 'steps': 2419, 'loss/train': 0.578491747379303} -09/20/2021 22:52:22 - INFO - __main__ - Step 38714: {'lr': 0.0001994338132421788, 'samples': 1238848, 'steps': 2419, 'loss/train': 0.6948642134666443} -09/20/2021 22:52:23 - INFO - __main__ - Step 38715: {'lr': 0.0001994338132421788, 'samples': 1238880, 'steps': 2419, 'loss/train': 0.665041983127594} -09/20/2021 22:52:24 - INFO - __main__ - Step 38716: {'lr': 0.0001994338132421788, 'samples': 1238912, 'steps': 2419, 'loss/train': 1.9317188262939453} -09/20/2021 22:52:24 - INFO - __main__ - Step 38717: {'lr': 0.0001994338132421788, 'samples': 1238944, 'steps': 2419, 'loss/train': 1.2203195095062256} -09/20/2021 22:52:25 - INFO - __main__ - Step 38718: {'lr': 0.0001994338132421788, 'samples': 1238976, 'steps': 2419, 'loss/train': 2.0626559257507324} -09/20/2021 22:52:26 - INFO - __main__ - Step 38719: {'lr': 0.0001994338132421788, 'samples': 1239008, 'steps': 2419, 'loss/train': 3.1313772201538086} -09/20/2021 22:52:27 - INFO - __main__ - Step 38720: {'lr': 0.0001994338132421788, 'samples': 1239040, 'steps': 2419, 'loss/train': 1.399372935295105} -09/20/2021 22:52:28 - INFO - __main__ - Step 38721: {'lr': 0.00019943313520660066, 'samples': 1239072, 'steps': 2420, 'loss/train': 1.940401315689087} -09/20/2021 22:52:28 - INFO - __main__ - Step 38722: {'lr': 0.00019943313520660066, 'samples': 1239104, 'steps': 2420, 'loss/train': 2.034057140350342} -09/20/2021 22:52:29 - INFO - __main__ - Step 38723: {'lr': 0.00019943313520660066, 'samples': 1239136, 'steps': 2420, 'loss/train': 2.257404327392578} -09/20/2021 22:52:30 - INFO - __main__ - Step 38724: {'lr': 0.00019943313520660066, 'samples': 1239168, 'steps': 2420, 'loss/train': 0.3759215772151947} -09/20/2021 22:52:31 - INFO - __main__ - Step 38725: {'lr': 0.00019943313520660066, 'samples': 1239200, 'steps': 2420, 'loss/train': 3.0701544284820557} -09/20/2021 22:52:31 - INFO - __main__ - Step 38726: {'lr': 0.00019943313520660066, 'samples': 1239232, 'steps': 2420, 'loss/train': 2.229126453399658} -09/20/2021 22:52:32 - INFO - __main__ - Step 38727: {'lr': 0.00019943313520660066, 'samples': 1239264, 'steps': 2420, 'loss/train': 2.3728973865509033} -09/20/2021 22:52:33 - INFO - __main__ - Step 38728: {'lr': 0.00019943313520660066, 'samples': 1239296, 'steps': 2420, 'loss/train': 3.103275775909424} -09/20/2021 22:52:34 - INFO - __main__ - Step 38729: {'lr': 0.00019943313520660066, 'samples': 1239328, 'steps': 2420, 'loss/train': 3.1180577278137207} -09/20/2021 22:52:34 - INFO - __main__ - Step 38730: {'lr': 0.00019943313520660066, 'samples': 1239360, 'steps': 2420, 'loss/train': 1.753650188446045} -09/20/2021 22:52:35 - INFO - __main__ - Step 38731: {'lr': 0.00019943313520660066, 'samples': 1239392, 'steps': 2420, 'loss/train': 2.835639715194702} -09/20/2021 22:52:36 - INFO - __main__ - Step 38732: {'lr': 0.00019943313520660066, 'samples': 1239424, 'steps': 2420, 'loss/train': 1.0117133855819702} -09/20/2021 22:52:37 - INFO - __main__ - Step 38733: {'lr': 0.00019943313520660066, 'samples': 1239456, 'steps': 2420, 'loss/train': 2.52595591545105} -09/20/2021 22:52:37 - INFO - __main__ - Step 38734: {'lr': 0.00019943313520660066, 'samples': 1239488, 'steps': 2420, 'loss/train': 2.401242971420288} -09/20/2021 22:52:38 - INFO - __main__ - Step 38735: {'lr': 0.00019943313520660066, 'samples': 1239520, 'steps': 2420, 'loss/train': 2.49810528755188} -09/20/2021 22:52:39 - INFO - __main__ - Step 38736: {'lr': 0.00019943313520660066, 'samples': 1239552, 'steps': 2420, 'loss/train': 2.0716934204101562} -09/20/2021 22:52:40 - INFO - __main__ - Step 38737: {'lr': 0.00019943245676642946, 'samples': 1239584, 'steps': 2421, 'loss/train': 2.057185649871826} -09/20/2021 22:52:40 - INFO - __main__ - Step 38738: {'lr': 0.00019943245676642946, 'samples': 1239616, 'steps': 2421, 'loss/train': 2.297481060028076} -09/20/2021 22:52:41 - INFO - __main__ - Step 38739: {'lr': 0.00019943245676642946, 'samples': 1239648, 'steps': 2421, 'loss/train': 1.2506356239318848} -09/20/2021 22:52:42 - INFO - __main__ - Step 38740: {'lr': 0.00019943245676642946, 'samples': 1239680, 'steps': 2421, 'loss/train': 2.5228095054626465} -09/20/2021 22:52:43 - INFO - __main__ - Step 38741: {'lr': 0.00019943245676642946, 'samples': 1239712, 'steps': 2421, 'loss/train': 1.4294718503952026} -09/20/2021 22:52:44 - INFO - __main__ - Step 38742: {'lr': 0.00019943245676642946, 'samples': 1239744, 'steps': 2421, 'loss/train': 2.612705707550049} -09/20/2021 22:52:45 - INFO - __main__ - Step 38743: {'lr': 0.00019943245676642946, 'samples': 1239776, 'steps': 2421, 'loss/train': 1.4718562364578247} -09/20/2021 22:52:45 - INFO - __main__ - Step 38744: {'lr': 0.00019943245676642946, 'samples': 1239808, 'steps': 2421, 'loss/train': 3.0379223823547363} -09/20/2021 22:52:46 - INFO - __main__ - Step 38745: {'lr': 0.00019943245676642946, 'samples': 1239840, 'steps': 2421, 'loss/train': 2.758594512939453} -09/20/2021 22:52:47 - INFO - __main__ - Step 38746: {'lr': 0.00019943245676642946, 'samples': 1239872, 'steps': 2421, 'loss/train': 2.631063938140869} -09/20/2021 22:52:48 - INFO - __main__ - Step 38747: {'lr': 0.00019943245676642946, 'samples': 1239904, 'steps': 2421, 'loss/train': 1.976832628250122} -09/20/2021 22:52:48 - INFO - __main__ - Step 38748: {'lr': 0.00019943245676642946, 'samples': 1239936, 'steps': 2421, 'loss/train': 0.4199032485485077} -09/20/2021 22:52:49 - INFO - __main__ - Step 38749: {'lr': 0.00019943245676642946, 'samples': 1239968, 'steps': 2421, 'loss/train': 1.970790147781372} -09/20/2021 22:52:50 - INFO - __main__ - Step 38750: {'lr': 0.00019943245676642946, 'samples': 1240000, 'steps': 2421, 'loss/train': 1.9774287939071655} -09/20/2021 22:52:51 - INFO - __main__ - Step 38751: {'lr': 0.00019943245676642946, 'samples': 1240032, 'steps': 2421, 'loss/train': 2.366753339767456} -09/20/2021 22:52:51 - INFO - __main__ - Step 38752: {'lr': 0.00019943245676642946, 'samples': 1240064, 'steps': 2421, 'loss/train': 1.5620230436325073} -09/20/2021 22:52:52 - INFO - __main__ - Step 38753: {'lr': 0.00019943177792166797, 'samples': 1240096, 'steps': 2422, 'loss/train': 0.8253918290138245} -09/20/2021 22:52:53 - INFO - __main__ - Step 38754: {'lr': 0.00019943177792166797, 'samples': 1240128, 'steps': 2422, 'loss/train': 2.182889938354492} -09/20/2021 22:52:54 - INFO - __main__ - Step 38755: {'lr': 0.00019943177792166797, 'samples': 1240160, 'steps': 2422, 'loss/train': 2.2987446784973145} -09/20/2021 22:52:55 - INFO - __main__ - Step 38756: {'lr': 0.00019943177792166797, 'samples': 1240192, 'steps': 2422, 'loss/train': 2.029616355895996} -09/20/2021 22:52:55 - INFO - __main__ - Step 38757: {'lr': 0.00019943177792166797, 'samples': 1240224, 'steps': 2422, 'loss/train': 2.30777645111084} -09/20/2021 22:52:56 - INFO - __main__ - Step 38758: {'lr': 0.00019943177792166797, 'samples': 1240256, 'steps': 2422, 'loss/train': 2.3336756229400635} -09/20/2021 22:52:57 - INFO - __main__ - Step 38759: {'lr': 0.00019943177792166797, 'samples': 1240288, 'steps': 2422, 'loss/train': 1.895197868347168} -09/20/2021 22:52:58 - INFO - __main__ - Step 38760: {'lr': 0.00019943177792166797, 'samples': 1240320, 'steps': 2422, 'loss/train': 3.119971513748169} -09/20/2021 22:52:58 - INFO - __main__ - Step 38761: {'lr': 0.00019943177792166797, 'samples': 1240352, 'steps': 2422, 'loss/train': 2.5516483783721924} -09/20/2021 22:52:59 - INFO - __main__ - Step 38762: {'lr': 0.00019943177792166797, 'samples': 1240384, 'steps': 2422, 'loss/train': 2.194180488586426} -09/20/2021 22:53:00 - INFO - __main__ - Step 38763: {'lr': 0.00019943177792166797, 'samples': 1240416, 'steps': 2422, 'loss/train': 2.5424346923828125} -09/20/2021 22:53:01 - INFO - __main__ - Step 38764: {'lr': 0.00019943177792166797, 'samples': 1240448, 'steps': 2422, 'loss/train': 1.066537618637085} -09/20/2021 22:53:01 - INFO - __main__ - Step 38765: {'lr': 0.00019943177792166797, 'samples': 1240480, 'steps': 2422, 'loss/train': 2.2012789249420166} -09/20/2021 22:53:02 - INFO - __main__ - Step 38766: {'lr': 0.00019943177792166797, 'samples': 1240512, 'steps': 2422, 'loss/train': 2.853285312652588} -09/20/2021 22:53:03 - INFO - __main__ - Step 38767: {'lr': 0.00019943177792166797, 'samples': 1240544, 'steps': 2422, 'loss/train': 2.9701309204101562} -09/20/2021 22:53:04 - INFO - __main__ - Step 38768: {'lr': 0.00019943177792166797, 'samples': 1240576, 'steps': 2422, 'loss/train': 2.429616689682007} -09/20/2021 22:53:04 - INFO - __main__ - Step 38769: {'lr': 0.00019943109867231895, 'samples': 1240608, 'steps': 2423, 'loss/train': 2.249328374862671} -09/20/2021 22:53:05 - INFO - __main__ - Step 38770: {'lr': 0.00019943109867231895, 'samples': 1240640, 'steps': 2423, 'loss/train': 2.2934184074401855} -09/20/2021 22:53:06 - INFO - __main__ - Step 38771: {'lr': 0.00019943109867231895, 'samples': 1240672, 'steps': 2423, 'loss/train': 2.429051637649536} -09/20/2021 22:53:07 - INFO - __main__ - Step 38772: {'lr': 0.00019943109867231895, 'samples': 1240704, 'steps': 2423, 'loss/train': 1.6652233600616455} -09/20/2021 22:53:08 - INFO - __main__ - Step 38773: {'lr': 0.00019943109867231895, 'samples': 1240736, 'steps': 2423, 'loss/train': 2.66424298286438} -09/20/2021 22:53:09 - INFO - __main__ - Step 38774: {'lr': 0.00019943109867231895, 'samples': 1240768, 'steps': 2423, 'loss/train': 1.5315781831741333} -09/20/2021 22:53:09 - INFO - __main__ - Step 38775: {'lr': 0.00019943109867231895, 'samples': 1240800, 'steps': 2423, 'loss/train': 3.700272560119629} -09/20/2021 22:53:10 - INFO - __main__ - Step 38776: {'lr': 0.00019943109867231895, 'samples': 1240832, 'steps': 2423, 'loss/train': 2.246835708618164} -09/20/2021 22:53:11 - INFO - __main__ - Step 38777: {'lr': 0.00019943109867231895, 'samples': 1240864, 'steps': 2423, 'loss/train': 1.8494353294372559} -09/20/2021 22:53:12 - INFO - __main__ - Step 38778: {'lr': 0.00019943109867231895, 'samples': 1240896, 'steps': 2423, 'loss/train': 2.357671022415161} -09/20/2021 22:53:12 - INFO - __main__ - Step 38779: {'lr': 0.00019943109867231895, 'samples': 1240928, 'steps': 2423, 'loss/train': 2.55481219291687} -09/20/2021 22:53:13 - INFO - __main__ - Step 38780: {'lr': 0.00019943109867231895, 'samples': 1240960, 'steps': 2423, 'loss/train': 2.3780710697174072} -09/20/2021 22:53:14 - INFO - __main__ - Step 38781: {'lr': 0.00019943109867231895, 'samples': 1240992, 'steps': 2423, 'loss/train': 1.4033348560333252} -09/20/2021 22:53:15 - INFO - __main__ - Step 38782: {'lr': 0.00019943109867231895, 'samples': 1241024, 'steps': 2423, 'loss/train': 2.2192604541778564} -09/20/2021 22:53:15 - INFO - __main__ - Step 38783: {'lr': 0.00019943109867231895, 'samples': 1241056, 'steps': 2423, 'loss/train': 2.1573023796081543} -09/20/2021 22:53:16 - INFO - __main__ - Step 38784: {'lr': 0.00019943109867231895, 'samples': 1241088, 'steps': 2423, 'loss/train': 2.1460156440734863} -09/20/2021 22:53:17 - INFO - __main__ - Step 38785: {'lr': 0.0001994304190183852, 'samples': 1241120, 'steps': 2424, 'loss/train': 0.4021831154823303} -09/20/2021 22:53:18 - INFO - __main__ - Step 38786: {'lr': 0.0001994304190183852, 'samples': 1241152, 'steps': 2424, 'loss/train': 2.577364444732666} -09/20/2021 22:53:19 - INFO - __main__ - Step 38787: {'lr': 0.0001994304190183852, 'samples': 1241184, 'steps': 2424, 'loss/train': 1.1581284999847412} -09/20/2021 22:53:19 - INFO - __main__ - Step 38788: {'lr': 0.0001994304190183852, 'samples': 1241216, 'steps': 2424, 'loss/train': 2.2397725582122803} -09/20/2021 22:53:20 - INFO - __main__ - Step 38789: {'lr': 0.0001994304190183852, 'samples': 1241248, 'steps': 2424, 'loss/train': 1.8228158950805664} -09/20/2021 22:53:21 - INFO - __main__ - Step 38790: {'lr': 0.0001994304190183852, 'samples': 1241280, 'steps': 2424, 'loss/train': 1.38878333568573} -09/20/2021 22:53:22 - INFO - __main__ - Step 38791: {'lr': 0.0001994304190183852, 'samples': 1241312, 'steps': 2424, 'loss/train': 1.3542550802230835} -09/20/2021 22:53:22 - INFO - __main__ - Step 38792: {'lr': 0.0001994304190183852, 'samples': 1241344, 'steps': 2424, 'loss/train': 1.8997291326522827} -09/20/2021 22:53:23 - INFO - __main__ - Step 38793: {'lr': 0.0001994304190183852, 'samples': 1241376, 'steps': 2424, 'loss/train': 3.059879779815674} -09/20/2021 22:53:24 - INFO - __main__ - Step 38794: {'lr': 0.0001994304190183852, 'samples': 1241408, 'steps': 2424, 'loss/train': 0.969836950302124} -09/20/2021 22:53:25 - INFO - __main__ - Step 38795: {'lr': 0.0001994304190183852, 'samples': 1241440, 'steps': 2424, 'loss/train': 2.3750503063201904} -09/20/2021 22:53:25 - INFO - __main__ - Step 38796: {'lr': 0.0001994304190183852, 'samples': 1241472, 'steps': 2424, 'loss/train': 0.952845573425293} -09/20/2021 22:53:26 - INFO - __main__ - Step 38797: {'lr': 0.0001994304190183852, 'samples': 1241504, 'steps': 2424, 'loss/train': 1.8617199659347534} -09/20/2021 22:53:27 - INFO - __main__ - Step 38798: {'lr': 0.0001994304190183852, 'samples': 1241536, 'steps': 2424, 'loss/train': 2.455819606781006} -09/20/2021 22:53:28 - INFO - __main__ - Step 38799: {'lr': 0.0001994304190183852, 'samples': 1241568, 'steps': 2424, 'loss/train': 2.0143423080444336} -09/20/2021 22:53:28 - INFO - __main__ - Step 38800: {'lr': 0.0001994304190183852, 'samples': 1241600, 'steps': 2424, 'loss/train': 2.325852155685425} -09/20/2021 22:53:29 - INFO - __main__ - Step 38801: {'lr': 0.00019942973895986944, 'samples': 1241632, 'steps': 2425, 'loss/train': 0.1962355673313141} -09/20/2021 22:53:30 - INFO - __main__ - Step 38802: {'lr': 0.00019942973895986944, 'samples': 1241664, 'steps': 2425, 'loss/train': 0.4287523329257965} -09/20/2021 22:53:31 - INFO - __main__ - Step 38803: {'lr': 0.00019942973895986944, 'samples': 1241696, 'steps': 2425, 'loss/train': 0.15628156065940857} -09/20/2021 22:53:32 - INFO - __main__ - Step 38804: {'lr': 0.00019942973895986944, 'samples': 1241728, 'steps': 2425, 'loss/train': 1.9459341764450073} -09/20/2021 22:53:33 - INFO - __main__ - Step 38805: {'lr': 0.00019942973895986944, 'samples': 1241760, 'steps': 2425, 'loss/train': 2.5470824241638184} -09/20/2021 22:53:34 - INFO - __main__ - Step 38806: {'lr': 0.00019942973895986944, 'samples': 1241792, 'steps': 2425, 'loss/train': 1.3261163234710693} -09/20/2021 22:53:34 - INFO - __main__ - Step 38807: {'lr': 0.00019942973895986944, 'samples': 1241824, 'steps': 2425, 'loss/train': 2.0138165950775146} -09/20/2021 22:53:35 - INFO - __main__ - Step 38808: {'lr': 0.00019942973895986944, 'samples': 1241856, 'steps': 2425, 'loss/train': 2.0729780197143555} -09/20/2021 22:53:36 - INFO - __main__ - Step 38809: {'lr': 0.00019942973895986944, 'samples': 1241888, 'steps': 2425, 'loss/train': 2.267305612564087} -09/20/2021 22:53:37 - INFO - __main__ - Step 38810: {'lr': 0.00019942973895986944, 'samples': 1241920, 'steps': 2425, 'loss/train': 1.4727765321731567} -09/20/2021 22:53:37 - INFO - __main__ - Step 38811: {'lr': 0.00019942973895986944, 'samples': 1241952, 'steps': 2425, 'loss/train': 2.177565097808838} -09/20/2021 22:53:38 - INFO - __main__ - Step 38812: {'lr': 0.00019942973895986944, 'samples': 1241984, 'steps': 2425, 'loss/train': 2.2147607803344727} -09/20/2021 22:53:39 - INFO - __main__ - Step 38813: {'lr': 0.00019942973895986944, 'samples': 1242016, 'steps': 2425, 'loss/train': 2.1961100101470947} -09/20/2021 22:53:40 - INFO - __main__ - Step 38814: {'lr': 0.00019942973895986944, 'samples': 1242048, 'steps': 2425, 'loss/train': 2.5684409141540527} -09/20/2021 22:53:40 - INFO - __main__ - Step 38815: {'lr': 0.00019942973895986944, 'samples': 1242080, 'steps': 2425, 'loss/train': 1.196199655532837} -09/20/2021 22:53:41 - INFO - __main__ - Step 38816: {'lr': 0.00019942973895986944, 'samples': 1242112, 'steps': 2425, 'loss/train': 2.235440254211426} -09/20/2021 22:53:42 - INFO - __main__ - Step 38817: {'lr': 0.0001994290584967745, 'samples': 1242144, 'steps': 2426, 'loss/train': 1.046288251876831} -09/20/2021 22:53:43 - INFO - __main__ - Step 38818: {'lr': 0.0001994290584967745, 'samples': 1242176, 'steps': 2426, 'loss/train': 2.295637845993042} -09/20/2021 22:53:43 - INFO - __main__ - Step 38819: {'lr': 0.0001994290584967745, 'samples': 1242208, 'steps': 2426, 'loss/train': 3.28214430809021} -09/20/2021 22:53:44 - INFO - __main__ - Step 38820: {'lr': 0.0001994290584967745, 'samples': 1242240, 'steps': 2426, 'loss/train': 2.440648078918457} -09/20/2021 22:53:45 - INFO - __main__ - Step 38821: {'lr': 0.0001994290584967745, 'samples': 1242272, 'steps': 2426, 'loss/train': 1.938346266746521} -09/20/2021 22:53:46 - INFO - __main__ - Step 38822: {'lr': 0.0001994290584967745, 'samples': 1242304, 'steps': 2426, 'loss/train': 2.06874418258667} -09/20/2021 22:53:46 - INFO - __main__ - Step 38823: {'lr': 0.0001994290584967745, 'samples': 1242336, 'steps': 2426, 'loss/train': 1.9834195375442505} -09/20/2021 22:53:47 - INFO - __main__ - Step 38824: {'lr': 0.0001994290584967745, 'samples': 1242368, 'steps': 2426, 'loss/train': 2.482919454574585} -09/20/2021 22:53:48 - INFO - __main__ - Step 38825: {'lr': 0.0001994290584967745, 'samples': 1242400, 'steps': 2426, 'loss/train': 0.5560184717178345} -09/20/2021 22:53:49 - INFO - __main__ - Step 38826: {'lr': 0.0001994290584967745, 'samples': 1242432, 'steps': 2426, 'loss/train': 2.8200626373291016} -09/20/2021 22:53:49 - INFO - __main__ - Step 38827: {'lr': 0.0001994290584967745, 'samples': 1242464, 'steps': 2426, 'loss/train': 1.9623472690582275} -09/20/2021 22:53:50 - INFO - __main__ - Step 38828: {'lr': 0.0001994290584967745, 'samples': 1242496, 'steps': 2426, 'loss/train': 2.050318717956543} -09/20/2021 22:53:51 - INFO - __main__ - Step 38829: {'lr': 0.0001994290584967745, 'samples': 1242528, 'steps': 2426, 'loss/train': 3.0974791049957275} -09/20/2021 22:53:52 - INFO - __main__ - Step 38830: {'lr': 0.0001994290584967745, 'samples': 1242560, 'steps': 2426, 'loss/train': 4.8364763259887695} -09/20/2021 22:53:52 - INFO - __main__ - Step 38831: {'lr': 0.0001994290584967745, 'samples': 1242592, 'steps': 2426, 'loss/train': 1.7583034038543701} -09/20/2021 22:53:53 - INFO - __main__ - Step 38832: {'lr': 0.0001994290584967745, 'samples': 1242624, 'steps': 2426, 'loss/train': 1.9506325721740723} -09/20/2021 22:53:54 - INFO - __main__ - Step 38833: {'lr': 0.00019942837762910304, 'samples': 1242656, 'steps': 2427, 'loss/train': 1.7047233581542969} -09/20/2021 22:53:55 - INFO - __main__ - Step 38834: {'lr': 0.00019942837762910304, 'samples': 1242688, 'steps': 2427, 'loss/train': 2.228142499923706} -09/20/2021 22:53:56 - INFO - __main__ - Step 38835: {'lr': 0.00019942837762910304, 'samples': 1242720, 'steps': 2427, 'loss/train': 2.275561809539795} -09/20/2021 22:53:58 - INFO - __main__ - Step 38836: {'lr': 0.00019942837762910304, 'samples': 1242752, 'steps': 2427, 'loss/train': 2.1848902702331543} -09/20/2021 22:53:59 - INFO - __main__ - Step 38837: {'lr': 0.00019942837762910304, 'samples': 1242784, 'steps': 2427, 'loss/train': 1.9485206604003906} -09/20/2021 22:53:59 - INFO - __main__ - Step 38838: {'lr': 0.00019942837762910304, 'samples': 1242816, 'steps': 2427, 'loss/train': 1.7905828952789307} -09/20/2021 22:54:00 - INFO - __main__ - Step 38839: {'lr': 0.00019942837762910304, 'samples': 1242848, 'steps': 2427, 'loss/train': 1.5351243019104004} -09/20/2021 22:54:01 - INFO - __main__ - Step 38840: {'lr': 0.00019942837762910304, 'samples': 1242880, 'steps': 2427, 'loss/train': 1.724814772605896} -09/20/2021 22:54:02 - INFO - __main__ - Step 38841: {'lr': 0.00019942837762910304, 'samples': 1242912, 'steps': 2427, 'loss/train': 1.4048677682876587} -09/20/2021 22:54:02 - INFO - __main__ - Step 38842: {'lr': 0.00019942837762910304, 'samples': 1242944, 'steps': 2427, 'loss/train': 2.66987943649292} -09/20/2021 22:54:03 - INFO - __main__ - Step 38843: {'lr': 0.00019942837762910304, 'samples': 1242976, 'steps': 2427, 'loss/train': 2.9686405658721924} -09/20/2021 22:54:04 - INFO - __main__ - Step 38844: {'lr': 0.00019942837762910304, 'samples': 1243008, 'steps': 2427, 'loss/train': 1.4383177757263184} -09/20/2021 22:54:05 - INFO - __main__ - Step 38845: {'lr': 0.00019942837762910304, 'samples': 1243040, 'steps': 2427, 'loss/train': 2.108339309692383} -09/20/2021 22:54:05 - INFO - __main__ - Step 38846: {'lr': 0.00019942837762910304, 'samples': 1243072, 'steps': 2427, 'loss/train': 3.0377681255340576} -09/20/2021 22:54:06 - INFO - __main__ - Step 38847: {'lr': 0.00019942837762910304, 'samples': 1243104, 'steps': 2427, 'loss/train': 2.1900734901428223} -09/20/2021 22:54:07 - INFO - __main__ - Step 38848: {'lr': 0.00019942837762910304, 'samples': 1243136, 'steps': 2427, 'loss/train': 2.1641087532043457} -09/20/2021 22:54:08 - INFO - __main__ - Step 38849: {'lr': 0.00019942769635685793, 'samples': 1243168, 'steps': 2428, 'loss/train': 1.5982890129089355} -09/20/2021 22:54:08 - INFO - __main__ - Step 38850: {'lr': 0.00019942769635685793, 'samples': 1243200, 'steps': 2428, 'loss/train': 2.6784048080444336} -09/20/2021 22:54:09 - INFO - __main__ - Step 38851: {'lr': 0.00019942769635685793, 'samples': 1243232, 'steps': 2428, 'loss/train': 2.7374982833862305} -09/20/2021 22:54:10 - INFO - __main__ - Step 38852: {'lr': 0.00019942769635685793, 'samples': 1243264, 'steps': 2428, 'loss/train': 2.1879374980926514} -09/20/2021 22:54:11 - INFO - __main__ - Step 38853: {'lr': 0.00019942769635685793, 'samples': 1243296, 'steps': 2428, 'loss/train': 2.2877705097198486} -09/20/2021 22:54:11 - INFO - __main__ - Step 38854: {'lr': 0.00019942769635685793, 'samples': 1243328, 'steps': 2428, 'loss/train': 0.8896512389183044} -09/20/2021 22:54:12 - INFO - __main__ - Step 38855: {'lr': 0.00019942769635685793, 'samples': 1243360, 'steps': 2428, 'loss/train': 0.6450305581092834} -09/20/2021 22:54:13 - INFO - __main__ - Step 38856: {'lr': 0.00019942769635685793, 'samples': 1243392, 'steps': 2428, 'loss/train': 1.9430744647979736} -09/20/2021 22:54:14 - INFO - __main__ - Step 38857: {'lr': 0.00019942769635685793, 'samples': 1243424, 'steps': 2428, 'loss/train': 1.2092368602752686} -09/20/2021 22:54:14 - INFO - __main__ - Step 38858: {'lr': 0.00019942769635685793, 'samples': 1243456, 'steps': 2428, 'loss/train': 2.8236706256866455} -09/20/2021 22:54:15 - INFO - __main__ - Step 38859: {'lr': 0.00019942769635685793, 'samples': 1243488, 'steps': 2428, 'loss/train': 0.9755412340164185} -09/20/2021 22:54:16 - INFO - __main__ - Step 38860: {'lr': 0.00019942769635685793, 'samples': 1243520, 'steps': 2428, 'loss/train': 0.7225189208984375} -09/20/2021 22:54:17 - INFO - __main__ - Step 38861: {'lr': 0.00019942769635685793, 'samples': 1243552, 'steps': 2428, 'loss/train': 0.6345390677452087} -09/20/2021 22:54:17 - INFO - __main__ - Step 38862: {'lr': 0.00019942769635685793, 'samples': 1243584, 'steps': 2428, 'loss/train': 1.1664807796478271} -09/20/2021 22:54:18 - INFO - __main__ - Step 38863: {'lr': 0.00019942769635685793, 'samples': 1243616, 'steps': 2428, 'loss/train': 0.6806764602661133} -09/20/2021 22:54:19 - INFO - __main__ - Step 38864: {'lr': 0.00019942769635685793, 'samples': 1243648, 'steps': 2428, 'loss/train': 1.001360297203064} -09/20/2021 22:54:20 - INFO - __main__ - Step 38865: {'lr': 0.00019942701468004194, 'samples': 1243680, 'steps': 2429, 'loss/train': 0.6467605233192444} -09/20/2021 22:54:21 - INFO - __main__ - Step 38866: {'lr': 0.00019942701468004194, 'samples': 1243712, 'steps': 2429, 'loss/train': 0.6167780756950378} -09/20/2021 22:54:21 - INFO - __main__ - Step 38867: {'lr': 0.00019942701468004194, 'samples': 1243744, 'steps': 2429, 'loss/train': 1.6399784088134766} -09/20/2021 22:54:22 - INFO - __main__ - Step 38868: {'lr': 0.00019942701468004194, 'samples': 1243776, 'steps': 2429, 'loss/train': 2.2594282627105713} -09/20/2021 22:54:23 - INFO - __main__ - Step 38869: {'lr': 0.00019942701468004194, 'samples': 1243808, 'steps': 2429, 'loss/train': 3.159024715423584} -09/20/2021 22:54:24 - INFO - __main__ - Step 38870: {'lr': 0.00019942701468004194, 'samples': 1243840, 'steps': 2429, 'loss/train': 2.05517578125} -09/20/2021 22:54:24 - INFO - __main__ - Step 38871: {'lr': 0.00019942701468004194, 'samples': 1243872, 'steps': 2429, 'loss/train': 2.9481117725372314} -09/20/2021 22:54:26 - INFO - __main__ - Step 38872: {'lr': 0.00019942701468004194, 'samples': 1243904, 'steps': 2429, 'loss/train': 3.1528549194335938} -09/20/2021 22:54:27 - INFO - __main__ - Step 38873: {'lr': 0.00019942701468004194, 'samples': 1243936, 'steps': 2429, 'loss/train': 1.5618014335632324} -09/20/2021 22:54:27 - INFO - __main__ - Step 38874: {'lr': 0.00019942701468004194, 'samples': 1243968, 'steps': 2429, 'loss/train': 0.6202369332313538} -09/20/2021 22:54:28 - INFO - __main__ - Step 38875: {'lr': 0.00019942701468004194, 'samples': 1244000, 'steps': 2429, 'loss/train': 0.5336000919342041} -09/20/2021 22:54:29 - INFO - __main__ - Step 38876: {'lr': 0.00019942701468004194, 'samples': 1244032, 'steps': 2429, 'loss/train': 0.44398340582847595} -09/20/2021 22:54:30 - INFO - __main__ - Step 38877: {'lr': 0.00019942701468004194, 'samples': 1244064, 'steps': 2429, 'loss/train': 0.6050159335136414} -09/20/2021 22:54:30 - INFO - __main__ - Step 38878: {'lr': 0.00019942701468004194, 'samples': 1244096, 'steps': 2429, 'loss/train': 0.695357084274292} -09/20/2021 22:54:31 - INFO - __main__ - Step 38879: {'lr': 0.00019942701468004194, 'samples': 1244128, 'steps': 2429, 'loss/train': 0.5485756993293762} -09/20/2021 22:54:32 - INFO - __main__ - Step 38880: {'lr': 0.00019942701468004194, 'samples': 1244160, 'steps': 2429, 'loss/train': 0.5900508165359497} -09/20/2021 22:54:33 - INFO - __main__ - Step 38881: {'lr': 0.0001994263325986578, 'samples': 1244192, 'steps': 2430, 'loss/train': 0.5085539817810059} -09/20/2021 22:54:33 - INFO - __main__ - Step 38882: {'lr': 0.0001994263325986578, 'samples': 1244224, 'steps': 2430, 'loss/train': 1.679089069366455} -09/20/2021 22:54:34 - INFO - __main__ - Step 38883: {'lr': 0.0001994263325986578, 'samples': 1244256, 'steps': 2430, 'loss/train': 2.5746312141418457} -09/20/2021 22:54:35 - INFO - __main__ - Step 38884: {'lr': 0.0001994263325986578, 'samples': 1244288, 'steps': 2430, 'loss/train': 2.8174819946289062} -09/20/2021 22:54:36 - INFO - __main__ - Step 38885: {'lr': 0.0001994263325986578, 'samples': 1244320, 'steps': 2430, 'loss/train': 1.6564176082611084} -09/20/2021 22:54:36 - INFO - __main__ - Step 38886: {'lr': 0.0001994263325986578, 'samples': 1244352, 'steps': 2430, 'loss/train': 2.8206186294555664} -09/20/2021 22:54:37 - INFO - __main__ - Step 38887: {'lr': 0.0001994263325986578, 'samples': 1244384, 'steps': 2430, 'loss/train': 2.2450170516967773} -09/20/2021 22:54:38 - INFO - __main__ - Step 38888: {'lr': 0.0001994263325986578, 'samples': 1244416, 'steps': 2430, 'loss/train': 2.662504196166992} -09/20/2021 22:54:39 - INFO - __main__ - Step 38889: {'lr': 0.0001994263325986578, 'samples': 1244448, 'steps': 2430, 'loss/train': 3.055341958999634} -09/20/2021 22:54:39 - INFO - __main__ - Step 38890: {'lr': 0.0001994263325986578, 'samples': 1244480, 'steps': 2430, 'loss/train': 2.225442409515381} -09/20/2021 22:54:40 - INFO - __main__ - Step 38891: {'lr': 0.0001994263325986578, 'samples': 1244512, 'steps': 2430, 'loss/train': 2.174384593963623} -09/20/2021 22:54:41 - INFO - __main__ - Step 38892: {'lr': 0.0001994263325986578, 'samples': 1244544, 'steps': 2430, 'loss/train': 2.262136220932007} -09/20/2021 22:54:42 - INFO - __main__ - Step 38893: {'lr': 0.0001994263325986578, 'samples': 1244576, 'steps': 2430, 'loss/train': 2.2551043033599854} -09/20/2021 22:54:42 - INFO - __main__ - Step 38894: {'lr': 0.0001994263325986578, 'samples': 1244608, 'steps': 2430, 'loss/train': 2.4943172931671143} -09/20/2021 22:54:43 - INFO - __main__ - Step 38895: {'lr': 0.0001994263325986578, 'samples': 1244640, 'steps': 2430, 'loss/train': 1.5448051691055298} -09/20/2021 22:54:44 - INFO - __main__ - Step 38896: {'lr': 0.0001994263325986578, 'samples': 1244672, 'steps': 2430, 'loss/train': 1.9215714931488037} -09/20/2021 22:54:45 - INFO - __main__ - Step 38897: {'lr': 0.00019942565011270825, 'samples': 1244704, 'steps': 2431, 'loss/train': 2.049154758453369} -09/20/2021 22:54:46 - INFO - __main__ - Step 38898: {'lr': 0.00019942565011270825, 'samples': 1244736, 'steps': 2431, 'loss/train': 1.468914270401001} -09/20/2021 22:54:46 - INFO - __main__ - Step 38899: {'lr': 0.00019942565011270825, 'samples': 1244768, 'steps': 2431, 'loss/train': 2.6634247303009033} -09/20/2021 22:54:47 - INFO - __main__ - Step 38900: {'lr': 0.00019942565011270825, 'samples': 1244800, 'steps': 2431, 'loss/train': 2.689342498779297} -09/20/2021 22:54:48 - INFO - __main__ - Step 38901: {'lr': 0.00019942565011270825, 'samples': 1244832, 'steps': 2431, 'loss/train': 0.826637864112854} -09/20/2021 22:54:49 - INFO - __main__ - Step 38902: {'lr': 0.00019942565011270825, 'samples': 1244864, 'steps': 2431, 'loss/train': 2.520237684249878} -09/20/2021 22:54:49 - INFO - __main__ - Step 38903: {'lr': 0.00019942565011270825, 'samples': 1244896, 'steps': 2431, 'loss/train': 2.0157623291015625} -09/20/2021 22:54:50 - INFO - __main__ - Step 38904: {'lr': 0.00019942565011270825, 'samples': 1244928, 'steps': 2431, 'loss/train': 1.3934885263442993} -09/20/2021 22:54:51 - INFO - __main__ - Step 38905: {'lr': 0.00019942565011270825, 'samples': 1244960, 'steps': 2431, 'loss/train': 0.8226352334022522} -09/20/2021 22:54:52 - INFO - __main__ - Step 38906: {'lr': 0.00019942565011270825, 'samples': 1244992, 'steps': 2431, 'loss/train': 2.6504502296447754} -09/20/2021 22:54:52 - INFO - __main__ - Step 38907: {'lr': 0.00019942565011270825, 'samples': 1245024, 'steps': 2431, 'loss/train': 1.8717820644378662} -09/20/2021 22:54:53 - INFO - __main__ - Step 38908: {'lr': 0.00019942565011270825, 'samples': 1245056, 'steps': 2431, 'loss/train': 1.9927189350128174} -09/20/2021 22:54:54 - INFO - __main__ - Step 38909: {'lr': 0.00019942565011270825, 'samples': 1245088, 'steps': 2431, 'loss/train': 2.6300549507141113} -09/20/2021 22:54:55 - INFO - __main__ - Step 38910: {'lr': 0.00019942565011270825, 'samples': 1245120, 'steps': 2431, 'loss/train': 3.6466829776763916} -09/20/2021 22:54:56 - INFO - __main__ - Step 38911: {'lr': 0.00019942565011270825, 'samples': 1245152, 'steps': 2431, 'loss/train': 1.7469418048858643} -09/20/2021 22:54:57 - INFO - __main__ - Step 38912: {'lr': 0.00019942565011270825, 'samples': 1245184, 'steps': 2431, 'loss/train': 1.8167213201522827} -09/20/2021 22:54:58 - INFO - __main__ - Step 38913: {'lr': 0.00019942496722219618, 'samples': 1245216, 'steps': 2432, 'loss/train': 2.3278415203094482} -09/20/2021 22:54:58 - INFO - __main__ - Step 38914: {'lr': 0.00019942496722219618, 'samples': 1245248, 'steps': 2432, 'loss/train': 2.8996620178222656} -09/20/2021 22:54:59 - INFO - __main__ - Step 38915: {'lr': 0.00019942496722219618, 'samples': 1245280, 'steps': 2432, 'loss/train': 1.0568958520889282} -09/20/2021 22:55:00 - INFO - __main__ - Step 38916: {'lr': 0.00019942496722219618, 'samples': 1245312, 'steps': 2432, 'loss/train': 1.8769553899765015} -09/20/2021 22:55:01 - INFO - __main__ - Step 38917: {'lr': 0.00019942496722219618, 'samples': 1245344, 'steps': 2432, 'loss/train': 2.3577380180358887} -09/20/2021 22:55:01 - INFO - __main__ - Step 38918: {'lr': 0.00019942496722219618, 'samples': 1245376, 'steps': 2432, 'loss/train': 1.3813220262527466} -09/20/2021 22:55:02 - INFO - __main__ - Step 38919: {'lr': 0.00019942496722219618, 'samples': 1245408, 'steps': 2432, 'loss/train': 2.291642665863037} -09/20/2021 22:55:03 - INFO - __main__ - Step 38920: {'lr': 0.00019942496722219618, 'samples': 1245440, 'steps': 2432, 'loss/train': 1.8628371953964233} -09/20/2021 22:55:04 - INFO - __main__ - Step 38921: {'lr': 0.00019942496722219618, 'samples': 1245472, 'steps': 2432, 'loss/train': 2.2357194423675537} -09/20/2021 22:55:04 - INFO - __main__ - Step 38922: {'lr': 0.00019942496722219618, 'samples': 1245504, 'steps': 2432, 'loss/train': 1.9065587520599365} -09/20/2021 22:55:05 - INFO - __main__ - Step 38923: {'lr': 0.00019942496722219618, 'samples': 1245536, 'steps': 2432, 'loss/train': 2.315967559814453} -09/20/2021 22:55:06 - INFO - __main__ - Step 38924: {'lr': 0.00019942496722219618, 'samples': 1245568, 'steps': 2432, 'loss/train': 2.0243616104125977} -09/20/2021 22:55:07 - INFO - __main__ - Step 38925: {'lr': 0.00019942496722219618, 'samples': 1245600, 'steps': 2432, 'loss/train': 2.087265968322754} -09/20/2021 22:55:07 - INFO - __main__ - Step 38926: {'lr': 0.00019942496722219618, 'samples': 1245632, 'steps': 2432, 'loss/train': 2.4014699459075928} -09/20/2021 22:55:08 - INFO - __main__ - Step 38927: {'lr': 0.00019942496722219618, 'samples': 1245664, 'steps': 2432, 'loss/train': 2.5785772800445557} -09/20/2021 22:55:09 - INFO - __main__ - Step 38928: {'lr': 0.00019942496722219618, 'samples': 1245696, 'steps': 2432, 'loss/train': 2.7534704208374023} -09/20/2021 22:55:10 - INFO - __main__ - Step 38929: {'lr': 0.00019942428392712426, 'samples': 1245728, 'steps': 2433, 'loss/train': 1.7304767370224} -09/20/2021 22:55:10 - INFO - __main__ - Step 38930: {'lr': 0.00019942428392712426, 'samples': 1245760, 'steps': 2433, 'loss/train': 1.513129711151123} -09/20/2021 22:55:11 - INFO - __main__ - Step 38931: {'lr': 0.00019942428392712426, 'samples': 1245792, 'steps': 2433, 'loss/train': 3.881673574447632} -09/20/2021 22:55:12 - INFO - __main__ - Step 38932: {'lr': 0.00019942428392712426, 'samples': 1245824, 'steps': 2433, 'loss/train': 2.3233211040496826} -09/20/2021 22:55:13 - INFO - __main__ - Step 38933: {'lr': 0.00019942428392712426, 'samples': 1245856, 'steps': 2433, 'loss/train': 2.285003900527954} -09/20/2021 22:55:13 - INFO - __main__ - Step 38934: {'lr': 0.00019942428392712426, 'samples': 1245888, 'steps': 2433, 'loss/train': 2.612534284591675} -09/20/2021 22:55:14 - INFO - __main__ - Step 38935: {'lr': 0.00019942428392712426, 'samples': 1245920, 'steps': 2433, 'loss/train': 2.94179630279541} -09/20/2021 22:55:15 - INFO - __main__ - Step 38936: {'lr': 0.00019942428392712426, 'samples': 1245952, 'steps': 2433, 'loss/train': 2.5273869037628174} -09/20/2021 22:55:16 - INFO - __main__ - Step 38937: {'lr': 0.00019942428392712426, 'samples': 1245984, 'steps': 2433, 'loss/train': 2.6630258560180664} -09/20/2021 22:55:16 - INFO - __main__ - Step 38938: {'lr': 0.00019942428392712426, 'samples': 1246016, 'steps': 2433, 'loss/train': 0.5245691537857056} -09/20/2021 22:55:17 - INFO - __main__ - Step 38939: {'lr': 0.00019942428392712426, 'samples': 1246048, 'steps': 2433, 'loss/train': 2.7907602787017822} -09/20/2021 22:55:18 - INFO - __main__ - Step 38940: {'lr': 0.00019942428392712426, 'samples': 1246080, 'steps': 2433, 'loss/train': 3.9484407901763916} -09/20/2021 22:55:20 - INFO - __main__ - Step 38941: {'lr': 0.00019942428392712426, 'samples': 1246112, 'steps': 2433, 'loss/train': 2.6960649490356445} -09/20/2021 22:55:20 - INFO - __main__ - Step 38942: {'lr': 0.00019942428392712426, 'samples': 1246144, 'steps': 2433, 'loss/train': 1.3776671886444092} -09/20/2021 22:55:21 - INFO - __main__ - Step 38943: {'lr': 0.00019942428392712426, 'samples': 1246176, 'steps': 2433, 'loss/train': 2.2692372798919678} -09/20/2021 22:55:22 - INFO - __main__ - Step 38944: {'lr': 0.00019942428392712426, 'samples': 1246208, 'steps': 2433, 'loss/train': 2.2843892574310303} -09/20/2021 22:55:23 - INFO - __main__ - Step 38945: {'lr': 0.00019942360022749534, 'samples': 1246240, 'steps': 2434, 'loss/train': 1.7564842700958252} -09/20/2021 22:55:24 - INFO - __main__ - Step 38946: {'lr': 0.00019942360022749534, 'samples': 1246272, 'steps': 2434, 'loss/train': 2.366612434387207} -09/20/2021 22:55:24 - INFO - __main__ - Step 38947: {'lr': 0.00019942360022749534, 'samples': 1246304, 'steps': 2434, 'loss/train': 2.251887083053589} -09/20/2021 22:55:25 - INFO - __main__ - Step 38948: {'lr': 0.00019942360022749534, 'samples': 1246336, 'steps': 2434, 'loss/train': 2.7329001426696777} -09/20/2021 22:55:26 - INFO - __main__ - Step 38949: {'lr': 0.00019942360022749534, 'samples': 1246368, 'steps': 2434, 'loss/train': 0.45245471596717834} -09/20/2021 22:55:27 - INFO - __main__ - Step 38950: {'lr': 0.00019942360022749534, 'samples': 1246400, 'steps': 2434, 'loss/train': 0.2937794327735901} -09/20/2021 22:55:27 - INFO - __main__ - Step 38951: {'lr': 0.00019942360022749534, 'samples': 1246432, 'steps': 2434, 'loss/train': 0.24295702576637268} -09/20/2021 22:55:28 - INFO - __main__ - Step 38952: {'lr': 0.00019942360022749534, 'samples': 1246464, 'steps': 2434, 'loss/train': 0.2802872359752655} -09/20/2021 22:55:29 - INFO - __main__ - Step 38953: {'lr': 0.00019942360022749534, 'samples': 1246496, 'steps': 2434, 'loss/train': 0.6054017543792725} -09/20/2021 22:55:30 - INFO - __main__ - Step 38954: {'lr': 0.00019942360022749534, 'samples': 1246528, 'steps': 2434, 'loss/train': 2.5971672534942627} -09/20/2021 22:55:30 - INFO - __main__ - Step 38955: {'lr': 0.00019942360022749534, 'samples': 1246560, 'steps': 2434, 'loss/train': 2.3643276691436768} -09/20/2021 22:55:31 - INFO - __main__ - Step 38956: {'lr': 0.00019942360022749534, 'samples': 1246592, 'steps': 2434, 'loss/train': 2.1316099166870117} -09/20/2021 22:55:32 - INFO - __main__ - Step 38957: {'lr': 0.00019942360022749534, 'samples': 1246624, 'steps': 2434, 'loss/train': 2.14730167388916} -09/20/2021 22:55:33 - INFO - __main__ - Step 38958: {'lr': 0.00019942360022749534, 'samples': 1246656, 'steps': 2434, 'loss/train': 2.502230167388916} -09/20/2021 22:55:33 - INFO - __main__ - Step 38959: {'lr': 0.00019942360022749534, 'samples': 1246688, 'steps': 2434, 'loss/train': 2.279242992401123} -09/20/2021 22:55:34 - INFO - __main__ - Step 38960: {'lr': 0.00019942360022749534, 'samples': 1246720, 'steps': 2434, 'loss/train': 0.8631714582443237} -09/20/2021 22:55:35 - INFO - __main__ - Step 38961: {'lr': 0.00019942291612331218, 'samples': 1246752, 'steps': 2435, 'loss/train': 1.2280632257461548} -09/20/2021 22:55:36 - INFO - __main__ - Step 38962: {'lr': 0.00019942291612331218, 'samples': 1246784, 'steps': 2435, 'loss/train': 3.2844724655151367} -09/20/2021 22:55:36 - INFO - __main__ - Step 38963: {'lr': 0.00019942291612331218, 'samples': 1246816, 'steps': 2435, 'loss/train': 2.4696288108825684} -09/20/2021 22:55:37 - INFO - __main__ - Step 38964: {'lr': 0.00019942291612331218, 'samples': 1246848, 'steps': 2435, 'loss/train': 2.5419530868530273} -09/20/2021 22:55:38 - INFO - __main__ - Step 38965: {'lr': 0.00019942291612331218, 'samples': 1246880, 'steps': 2435, 'loss/train': 3.196974992752075} -09/20/2021 22:55:39 - INFO - __main__ - Step 38966: {'lr': 0.00019942291612331218, 'samples': 1246912, 'steps': 2435, 'loss/train': 1.585267424583435} -09/20/2021 22:55:39 - INFO - __main__ - Step 38967: {'lr': 0.00019942291612331218, 'samples': 1246944, 'steps': 2435, 'loss/train': 2.252718925476074} -09/20/2021 22:55:40 - INFO - __main__ - Step 38968: {'lr': 0.00019942291612331218, 'samples': 1246976, 'steps': 2435, 'loss/train': 2.0002965927124023} -09/20/2021 22:55:41 - INFO - __main__ - Step 38969: {'lr': 0.00019942291612331218, 'samples': 1247008, 'steps': 2435, 'loss/train': 0.9293336272239685} -09/20/2021 22:55:42 - INFO - __main__ - Step 38970: {'lr': 0.00019942291612331218, 'samples': 1247040, 'steps': 2435, 'loss/train': 0.792346179485321} -09/20/2021 22:55:42 - INFO - __main__ - Step 38971: {'lr': 0.00019942291612331218, 'samples': 1247072, 'steps': 2435, 'loss/train': 0.3648759126663208} -09/20/2021 22:55:43 - INFO - __main__ - Step 38972: {'lr': 0.00019942291612331218, 'samples': 1247104, 'steps': 2435, 'loss/train': 0.32878950238227844} -09/20/2021 22:55:44 - INFO - __main__ - Step 38973: {'lr': 0.00019942291612331218, 'samples': 1247136, 'steps': 2435, 'loss/train': 0.17220240831375122} -09/20/2021 22:55:45 - INFO - __main__ - Step 38974: {'lr': 0.00019942291612331218, 'samples': 1247168, 'steps': 2435, 'loss/train': 0.6166651844978333} -09/20/2021 22:55:46 - INFO - __main__ - Step 38975: {'lr': 0.00019942291612331218, 'samples': 1247200, 'steps': 2435, 'loss/train': 0.2772200107574463} -09/20/2021 22:55:47 - INFO - __main__ - Step 38976: {'lr': 0.00019942291612331218, 'samples': 1247232, 'steps': 2435, 'loss/train': 2.1099865436553955} -09/20/2021 22:55:48 - INFO - __main__ - Step 38977: {'lr': 0.00019942223161457755, 'samples': 1247264, 'steps': 2436, 'loss/train': 2.0369865894317627} -09/20/2021 22:55:49 - INFO - __main__ - Step 38978: {'lr': 0.00019942223161457755, 'samples': 1247296, 'steps': 2436, 'loss/train': 2.2357680797576904} -09/20/2021 22:55:50 - INFO - __main__ - Step 38979: {'lr': 0.00019942223161457755, 'samples': 1247328, 'steps': 2436, 'loss/train': 2.177044630050659} -09/20/2021 22:55:50 - INFO - __main__ - Step 38980: {'lr': 0.00019942223161457755, 'samples': 1247360, 'steps': 2436, 'loss/train': 2.222238302230835} -09/20/2021 22:55:51 - INFO - __main__ - Step 38981: {'lr': 0.00019942223161457755, 'samples': 1247392, 'steps': 2436, 'loss/train': 2.187570095062256} -09/20/2021 22:55:52 - INFO - __main__ - Step 38982: {'lr': 0.00019942223161457755, 'samples': 1247424, 'steps': 2436, 'loss/train': 2.188938617706299} -09/20/2021 22:55:53 - INFO - __main__ - Step 38983: {'lr': 0.00019942223161457755, 'samples': 1247456, 'steps': 2436, 'loss/train': 2.070232391357422} -09/20/2021 22:55:53 - INFO - __main__ - Step 38984: {'lr': 0.00019942223161457755, 'samples': 1247488, 'steps': 2436, 'loss/train': 2.123120069503784} -09/20/2021 22:55:54 - INFO - __main__ - Step 38985: {'lr': 0.00019942223161457755, 'samples': 1247520, 'steps': 2436, 'loss/train': 2.2143421173095703} -09/20/2021 22:55:55 - INFO - __main__ - Step 38986: {'lr': 0.00019942223161457755, 'samples': 1247552, 'steps': 2436, 'loss/train': 2.161571741104126} -09/20/2021 22:55:56 - INFO - __main__ - Step 38987: {'lr': 0.00019942223161457755, 'samples': 1247584, 'steps': 2436, 'loss/train': 2.1431915760040283} -09/20/2021 22:55:56 - INFO - __main__ - Step 38988: {'lr': 0.00019942223161457755, 'samples': 1247616, 'steps': 2436, 'loss/train': 1.1715202331542969} -09/20/2021 22:55:57 - INFO - __main__ - Step 38989: {'lr': 0.00019942223161457755, 'samples': 1247648, 'steps': 2436, 'loss/train': 1.5590440034866333} -09/20/2021 22:55:58 - INFO - __main__ - Step 38990: {'lr': 0.00019942223161457755, 'samples': 1247680, 'steps': 2436, 'loss/train': 1.642472267150879} -09/20/2021 22:55:59 - INFO - __main__ - Step 38991: {'lr': 0.00019942223161457755, 'samples': 1247712, 'steps': 2436, 'loss/train': 2.005037546157837} -09/20/2021 22:55:59 - INFO - __main__ - Step 38992: {'lr': 0.00019942223161457755, 'samples': 1247744, 'steps': 2436, 'loss/train': 2.619652271270752} -09/20/2021 22:56:00 - INFO - __main__ - Step 38993: {'lr': 0.00019942154670129423, 'samples': 1247776, 'steps': 2437, 'loss/train': 2.5435714721679688} -09/20/2021 22:56:01 - INFO - __main__ - Step 38994: {'lr': 0.00019942154670129423, 'samples': 1247808, 'steps': 2437, 'loss/train': 1.9108954668045044} -09/20/2021 22:56:02 - INFO - __main__ - Step 38995: {'lr': 0.00019942154670129423, 'samples': 1247840, 'steps': 2437, 'loss/train': 3.0292227268218994} -09/20/2021 22:56:02 - INFO - __main__ - Step 38996: {'lr': 0.00019942154670129423, 'samples': 1247872, 'steps': 2437, 'loss/train': 2.8008289337158203} -09/20/2021 22:56:03 - INFO - __main__ - Step 38997: {'lr': 0.00019942154670129423, 'samples': 1247904, 'steps': 2437, 'loss/train': 0.464123010635376} -09/20/2021 22:56:04 - INFO - __main__ - Step 38998: {'lr': 0.00019942154670129423, 'samples': 1247936, 'steps': 2437, 'loss/train': 2.152276039123535} -09/20/2021 22:56:05 - INFO - __main__ - Step 38999: {'lr': 0.00019942154670129423, 'samples': 1247968, 'steps': 2437, 'loss/train': 1.6798595190048218} -09/20/2021 22:56:05 - INFO - __main__ - Step 39000: {'lr': 0.00019942154670129423, 'samples': 1248000, 'steps': 2437, 'loss/train': 3.128596544265747} -09/20/2021 22:56:06 - INFO - __main__ - Step 39001: {'lr': 0.00019942154670129423, 'samples': 1248032, 'steps': 2437, 'loss/train': 2.2209396362304688} -09/20/2021 22:56:07 - INFO - __main__ - Step 39002: {'lr': 0.00019942154670129423, 'samples': 1248064, 'steps': 2437, 'loss/train': 2.0346550941467285} -09/20/2021 22:56:08 - INFO - __main__ - Step 39003: {'lr': 0.00019942154670129423, 'samples': 1248096, 'steps': 2437, 'loss/train': 1.1549997329711914} -09/20/2021 22:56:08 - INFO - __main__ - Step 39004: {'lr': 0.00019942154670129423, 'samples': 1248128, 'steps': 2437, 'loss/train': 2.0433428287506104} -09/20/2021 22:56:09 - INFO - __main__ - Step 39005: {'lr': 0.00019942154670129423, 'samples': 1248160, 'steps': 2437, 'loss/train': 1.899658441543579} -09/20/2021 22:56:10 - INFO - __main__ - Step 39006: {'lr': 0.00019942154670129423, 'samples': 1248192, 'steps': 2437, 'loss/train': 0.9517035484313965} -09/20/2021 22:56:11 - INFO - __main__ - Step 39007: {'lr': 0.00019942154670129423, 'samples': 1248224, 'steps': 2437, 'loss/train': 2.0313072204589844} -09/20/2021 22:56:11 - INFO - __main__ - Step 39008: {'lr': 0.00019942154670129423, 'samples': 1248256, 'steps': 2437, 'loss/train': 1.7564142942428589} -09/20/2021 22:56:12 - INFO - __main__ - Step 39009: {'lr': 0.00019942086138346506, 'samples': 1248288, 'steps': 2438, 'loss/train': 2.0536787509918213} -09/20/2021 22:56:13 - INFO - __main__ - Step 39010: {'lr': 0.00019942086138346506, 'samples': 1248320, 'steps': 2438, 'loss/train': 1.8257272243499756} -09/20/2021 22:56:14 - INFO - __main__ - Step 39011: {'lr': 0.00019942086138346506, 'samples': 1248352, 'steps': 2438, 'loss/train': 2.1733639240264893} -09/20/2021 22:56:15 - INFO - __main__ - Step 39012: {'lr': 0.00019942086138346506, 'samples': 1248384, 'steps': 2438, 'loss/train': 1.9354991912841797} -09/20/2021 22:56:16 - INFO - __main__ - Step 39013: {'lr': 0.00019942086138346506, 'samples': 1248416, 'steps': 2438, 'loss/train': 1.3133385181427002} -09/20/2021 22:56:17 - INFO - __main__ - Step 39014: {'lr': 0.00019942086138346506, 'samples': 1248448, 'steps': 2438, 'loss/train': 2.2507877349853516} -09/20/2021 22:56:17 - INFO - __main__ - Step 39015: {'lr': 0.00019942086138346506, 'samples': 1248480, 'steps': 2438, 'loss/train': 1.826418161392212} -09/20/2021 22:56:18 - INFO - __main__ - Step 39016: {'lr': 0.00019942086138346506, 'samples': 1248512, 'steps': 2438, 'loss/train': 1.9335837364196777} -09/20/2021 22:56:19 - INFO - __main__ - Step 39017: {'lr': 0.00019942086138346506, 'samples': 1248544, 'steps': 2438, 'loss/train': 2.8090202808380127} -09/20/2021 22:56:20 - INFO - __main__ - Step 39018: {'lr': 0.00019942086138346506, 'samples': 1248576, 'steps': 2438, 'loss/train': 1.5890085697174072} -09/20/2021 22:56:20 - INFO - __main__ - Step 39019: {'lr': 0.00019942086138346506, 'samples': 1248608, 'steps': 2438, 'loss/train': 1.637917160987854} -09/20/2021 22:56:21 - INFO - __main__ - Step 39020: {'lr': 0.00019942086138346506, 'samples': 1248640, 'steps': 2438, 'loss/train': 1.5029716491699219} -09/20/2021 22:56:22 - INFO - __main__ - Step 39021: {'lr': 0.00019942086138346506, 'samples': 1248672, 'steps': 2438, 'loss/train': 1.928551435470581} -09/20/2021 22:56:23 - INFO - __main__ - Step 39022: {'lr': 0.00019942086138346506, 'samples': 1248704, 'steps': 2438, 'loss/train': 3.1483325958251953} -09/20/2021 22:56:23 - INFO - __main__ - Step 39023: {'lr': 0.00019942086138346506, 'samples': 1248736, 'steps': 2438, 'loss/train': 3.4730007648468018} -09/20/2021 22:56:24 - INFO - __main__ - Step 39024: {'lr': 0.00019942086138346506, 'samples': 1248768, 'steps': 2438, 'loss/train': 2.2806684970855713} -09/20/2021 22:56:25 - INFO - __main__ - Step 39025: {'lr': 0.00019942017566109278, 'samples': 1248800, 'steps': 2439, 'loss/train': 2.256923198699951} -09/20/2021 22:56:26 - INFO - __main__ - Step 39026: {'lr': 0.00019942017566109278, 'samples': 1248832, 'steps': 2439, 'loss/train': 1.9003316164016724} -09/20/2021 22:56:26 - INFO - __main__ - Step 39027: {'lr': 0.00019942017566109278, 'samples': 1248864, 'steps': 2439, 'loss/train': 1.590947151184082} -09/20/2021 22:56:27 - INFO - __main__ - Step 39028: {'lr': 0.00019942017566109278, 'samples': 1248896, 'steps': 2439, 'loss/train': 2.4669580459594727} -09/20/2021 22:56:28 - INFO - __main__ - Step 39029: {'lr': 0.00019942017566109278, 'samples': 1248928, 'steps': 2439, 'loss/train': 2.2636146545410156} -09/20/2021 22:56:29 - INFO - __main__ - Step 39030: {'lr': 0.00019942017566109278, 'samples': 1248960, 'steps': 2439, 'loss/train': 2.2769150733947754} -09/20/2021 22:56:29 - INFO - __main__ - Step 39031: {'lr': 0.00019942017566109278, 'samples': 1248992, 'steps': 2439, 'loss/train': 2.1165058612823486} -09/20/2021 22:56:30 - INFO - __main__ - Step 39032: {'lr': 0.00019942017566109278, 'samples': 1249024, 'steps': 2439, 'loss/train': 2.077179431915283} -09/20/2021 22:56:31 - INFO - __main__ - Step 39033: {'lr': 0.00019942017566109278, 'samples': 1249056, 'steps': 2439, 'loss/train': 1.5593003034591675} -09/20/2021 22:56:32 - INFO - __main__ - Step 39034: {'lr': 0.00019942017566109278, 'samples': 1249088, 'steps': 2439, 'loss/train': 2.5603623390197754} -09/20/2021 22:56:32 - INFO - __main__ - Step 39035: {'lr': 0.00019942017566109278, 'samples': 1249120, 'steps': 2439, 'loss/train': 1.3287830352783203} -09/20/2021 22:56:33 - INFO - __main__ - Step 39036: {'lr': 0.00019942017566109278, 'samples': 1249152, 'steps': 2439, 'loss/train': 1.8509695529937744} -09/20/2021 22:56:34 - INFO - __main__ - Step 39037: {'lr': 0.00019942017566109278, 'samples': 1249184, 'steps': 2439, 'loss/train': 2.9083728790283203} -09/20/2021 22:56:35 - INFO - __main__ - Step 39038: {'lr': 0.00019942017566109278, 'samples': 1249216, 'steps': 2439, 'loss/train': 2.4762768745422363} -09/20/2021 22:56:35 - INFO - __main__ - Step 39039: {'lr': 0.00019942017566109278, 'samples': 1249248, 'steps': 2439, 'loss/train': 3.000596284866333} -09/20/2021 22:56:36 - INFO - __main__ - Step 39040: {'lr': 0.00019942017566109278, 'samples': 1249280, 'steps': 2439, 'loss/train': 2.340019941329956} -09/20/2021 22:56:37 - INFO - __main__ - Step 39041: {'lr': 0.00019941948953418014, 'samples': 1249312, 'steps': 2440, 'loss/train': 1.76030433177948} -09/20/2021 22:56:38 - INFO - __main__ - Step 39042: {'lr': 0.00019941948953418014, 'samples': 1249344, 'steps': 2440, 'loss/train': 2.230775833129883} -09/20/2021 22:56:39 - INFO - __main__ - Step 39043: {'lr': 0.00019941948953418014, 'samples': 1249376, 'steps': 2440, 'loss/train': 2.3835275173187256} -09/20/2021 22:56:40 - INFO - __main__ - Step 39044: {'lr': 0.00019941948953418014, 'samples': 1249408, 'steps': 2440, 'loss/train': 2.9141316413879395} -09/20/2021 22:56:41 - INFO - __main__ - Step 39045: {'lr': 0.00019941948953418014, 'samples': 1249440, 'steps': 2440, 'loss/train': 1.9798592329025269} -09/20/2021 22:56:41 - INFO - __main__ - Step 39046: {'lr': 0.00019941948953418014, 'samples': 1249472, 'steps': 2440, 'loss/train': 1.82035493850708} -09/20/2021 22:56:42 - INFO - __main__ - Step 39047: {'lr': 0.00019941948953418014, 'samples': 1249504, 'steps': 2440, 'loss/train': 2.6554043292999268} -09/20/2021 22:56:43 - INFO - __main__ - Step 39048: {'lr': 0.00019941948953418014, 'samples': 1249536, 'steps': 2440, 'loss/train': 2.677588701248169} -09/20/2021 22:56:44 - INFO - __main__ - Step 39049: {'lr': 0.00019941948953418014, 'samples': 1249568, 'steps': 2440, 'loss/train': 1.3833569288253784} -09/20/2021 22:56:44 - INFO - __main__ - Step 39050: {'lr': 0.00019941948953418014, 'samples': 1249600, 'steps': 2440, 'loss/train': 2.06596302986145} -09/20/2021 22:56:45 - INFO - __main__ - Step 39051: {'lr': 0.00019941948953418014, 'samples': 1249632, 'steps': 2440, 'loss/train': 1.7405904531478882} -09/20/2021 22:56:46 - INFO - __main__ - Step 39052: {'lr': 0.00019941948953418014, 'samples': 1249664, 'steps': 2440, 'loss/train': 2.1715548038482666} -09/20/2021 22:56:47 - INFO - __main__ - Step 39053: {'lr': 0.00019941948953418014, 'samples': 1249696, 'steps': 2440, 'loss/train': 3.499619960784912} -09/20/2021 22:56:47 - INFO - __main__ - Step 39054: {'lr': 0.00019941948953418014, 'samples': 1249728, 'steps': 2440, 'loss/train': 2.67541766166687} -09/20/2021 22:56:48 - INFO - __main__ - Step 39055: {'lr': 0.00019941948953418014, 'samples': 1249760, 'steps': 2440, 'loss/train': 2.571272134780884} -09/20/2021 22:56:49 - INFO - __main__ - Step 39056: {'lr': 0.00019941948953418014, 'samples': 1249792, 'steps': 2440, 'loss/train': 2.5733227729797363} -09/20/2021 22:56:50 - INFO - __main__ - Step 39057: {'lr': 0.00019941880300273005, 'samples': 1249824, 'steps': 2441, 'loss/train': 2.6400835514068604} -09/20/2021 22:56:51 - INFO - __main__ - Step 39058: {'lr': 0.00019941880300273005, 'samples': 1249856, 'steps': 2441, 'loss/train': 2.497591018676758} -09/20/2021 22:56:51 - INFO - __main__ - Step 39059: {'lr': 0.00019941880300273005, 'samples': 1249888, 'steps': 2441, 'loss/train': 2.3782427310943604} -09/20/2021 22:56:52 - INFO - __main__ - Step 39060: {'lr': 0.00019941880300273005, 'samples': 1249920, 'steps': 2441, 'loss/train': 1.9073798656463623} -09/20/2021 22:56:53 - INFO - __main__ - Step 39061: {'lr': 0.00019941880300273005, 'samples': 1249952, 'steps': 2441, 'loss/train': 2.3777124881744385} -09/20/2021 22:56:54 - INFO - __main__ - Step 39062: {'lr': 0.00019941880300273005, 'samples': 1249984, 'steps': 2441, 'loss/train': 1.9430522918701172} -09/20/2021 22:56:54 - INFO - __main__ - Step 39063: {'lr': 0.00019941880300273005, 'samples': 1250016, 'steps': 2441, 'loss/train': 1.4641807079315186} -09/20/2021 22:56:55 - INFO - __main__ - Step 39064: {'lr': 0.00019941880300273005, 'samples': 1250048, 'steps': 2441, 'loss/train': 1.9656057357788086} -09/20/2021 22:56:56 - INFO - __main__ - Step 39065: {'lr': 0.00019941880300273005, 'samples': 1250080, 'steps': 2441, 'loss/train': 1.943403720855713} -09/20/2021 22:56:57 - INFO - __main__ - Step 39066: {'lr': 0.00019941880300273005, 'samples': 1250112, 'steps': 2441, 'loss/train': 0.3484153151512146} -09/20/2021 22:56:57 - INFO - __main__ - Step 39067: {'lr': 0.00019941880300273005, 'samples': 1250144, 'steps': 2441, 'loss/train': 3.1943490505218506} -09/20/2021 22:56:58 - INFO - __main__ - Step 39068: {'lr': 0.00019941880300273005, 'samples': 1250176, 'steps': 2441, 'loss/train': 1.609876036643982} -09/20/2021 22:56:59 - INFO - __main__ - Step 39069: {'lr': 0.00019941880300273005, 'samples': 1250208, 'steps': 2441, 'loss/train': 1.7433550357818604} -09/20/2021 22:57:00 - INFO - __main__ - Step 39070: {'lr': 0.00019941880300273005, 'samples': 1250240, 'steps': 2441, 'loss/train': 1.2073625326156616} -09/20/2021 22:57:00 - INFO - __main__ - Step 39071: {'lr': 0.00019941880300273005, 'samples': 1250272, 'steps': 2441, 'loss/train': 1.112979531288147} -09/20/2021 22:57:01 - INFO - __main__ - Step 39072: {'lr': 0.00019941880300273005, 'samples': 1250304, 'steps': 2441, 'loss/train': 1.2664748430252075} -09/20/2021 22:57:02 - INFO - __main__ - Step 39073: {'lr': 0.0001994181160667452, 'samples': 1250336, 'steps': 2442, 'loss/train': 1.0074455738067627} -09/20/2021 22:57:03 - INFO - __main__ - Step 39074: {'lr': 0.0001994181160667452, 'samples': 1250368, 'steps': 2442, 'loss/train': 2.7954752445220947} -09/20/2021 22:57:04 - INFO - __main__ - Step 39075: {'lr': 0.0001994181160667452, 'samples': 1250400, 'steps': 2442, 'loss/train': 0.4682176411151886} -09/20/2021 22:57:05 - INFO - __main__ - Step 39076: {'lr': 0.0001994181160667452, 'samples': 1250432, 'steps': 2442, 'loss/train': 2.3703672885894775} -09/20/2021 22:57:06 - INFO - __main__ - Step 39077: {'lr': 0.0001994181160667452, 'samples': 1250464, 'steps': 2442, 'loss/train': 2.7427103519439697} -09/20/2021 22:57:06 - INFO - __main__ - Step 39078: {'lr': 0.0001994181160667452, 'samples': 1250496, 'steps': 2442, 'loss/train': 2.3476240634918213} -09/20/2021 22:57:07 - INFO - __main__ - Step 39079: {'lr': 0.0001994181160667452, 'samples': 1250528, 'steps': 2442, 'loss/train': 1.8110765218734741} -09/20/2021 22:57:08 - INFO - __main__ - Step 39080: {'lr': 0.0001994181160667452, 'samples': 1250560, 'steps': 2442, 'loss/train': 2.0719027519226074} -09/20/2021 22:57:09 - INFO - __main__ - Step 39081: {'lr': 0.0001994181160667452, 'samples': 1250592, 'steps': 2442, 'loss/train': 2.0251448154449463} -09/20/2021 22:57:09 - INFO - __main__ - Step 39082: {'lr': 0.0001994181160667452, 'samples': 1250624, 'steps': 2442, 'loss/train': 2.228104829788208} -09/20/2021 22:57:10 - INFO - __main__ - Step 39083: {'lr': 0.0001994181160667452, 'samples': 1250656, 'steps': 2442, 'loss/train': 3.051239252090454} -09/20/2021 22:57:11 - INFO - __main__ - Step 39084: {'lr': 0.0001994181160667452, 'samples': 1250688, 'steps': 2442, 'loss/train': 2.9569380283355713} -09/20/2021 22:57:12 - INFO - __main__ - Step 39085: {'lr': 0.0001994181160667452, 'samples': 1250720, 'steps': 2442, 'loss/train': 1.4906699657440186} -09/20/2021 22:57:12 - INFO - __main__ - Step 39086: {'lr': 0.0001994181160667452, 'samples': 1250752, 'steps': 2442, 'loss/train': 2.5710079669952393} -09/20/2021 22:57:13 - INFO - __main__ - Step 39087: {'lr': 0.0001994181160667452, 'samples': 1250784, 'steps': 2442, 'loss/train': 2.112417697906494} -09/20/2021 22:57:14 - INFO - __main__ - Step 39088: {'lr': 0.0001994181160667452, 'samples': 1250816, 'steps': 2442, 'loss/train': 2.562861204147339} -09/20/2021 22:57:15 - INFO - __main__ - Step 39089: {'lr': 0.00019941742872622842, 'samples': 1250848, 'steps': 2443, 'loss/train': 1.4957703351974487} -09/20/2021 22:57:15 - INFO - __main__ - Step 39090: {'lr': 0.00019941742872622842, 'samples': 1250880, 'steps': 2443, 'loss/train': 2.7103183269500732} -09/20/2021 22:57:16 - INFO - __main__ - Step 39091: {'lr': 0.00019941742872622842, 'samples': 1250912, 'steps': 2443, 'loss/train': 2.9832186698913574} -09/20/2021 22:57:17 - INFO - __main__ - Step 39092: {'lr': 0.00019941742872622842, 'samples': 1250944, 'steps': 2443, 'loss/train': 2.2863874435424805} -09/20/2021 22:57:18 - INFO - __main__ - Step 39093: {'lr': 0.00019941742872622842, 'samples': 1250976, 'steps': 2443, 'loss/train': 1.9014016389846802} -09/20/2021 22:57:18 - INFO - __main__ - Step 39094: {'lr': 0.00019941742872622842, 'samples': 1251008, 'steps': 2443, 'loss/train': 3.2278897762298584} -09/20/2021 22:57:19 - INFO - __main__ - Step 39095: {'lr': 0.00019941742872622842, 'samples': 1251040, 'steps': 2443, 'loss/train': 2.166271924972534} -09/20/2021 22:57:20 - INFO - __main__ - Step 39096: {'lr': 0.00019941742872622842, 'samples': 1251072, 'steps': 2443, 'loss/train': 2.162388801574707} -09/20/2021 22:57:21 - INFO - __main__ - Step 39097: {'lr': 0.00019941742872622842, 'samples': 1251104, 'steps': 2443, 'loss/train': 1.1090707778930664} -09/20/2021 22:57:21 - INFO - __main__ - Step 39098: {'lr': 0.00019941742872622842, 'samples': 1251136, 'steps': 2443, 'loss/train': 1.9247777462005615} -09/20/2021 22:57:22 - INFO - __main__ - Step 39099: {'lr': 0.00019941742872622842, 'samples': 1251168, 'steps': 2443, 'loss/train': 2.7144174575805664} -09/20/2021 22:57:23 - INFO - __main__ - Step 39100: {'lr': 0.00019941742872622842, 'samples': 1251200, 'steps': 2443, 'loss/train': 1.7496392726898193} -09/20/2021 22:57:24 - INFO - __main__ - Step 39101: {'lr': 0.00019941742872622842, 'samples': 1251232, 'steps': 2443, 'loss/train': 1.969122052192688} -09/20/2021 22:57:24 - INFO - __main__ - Step 39102: {'lr': 0.00019941742872622842, 'samples': 1251264, 'steps': 2443, 'loss/train': 3.3025448322296143} -09/20/2021 22:57:25 - INFO - __main__ - Step 39103: {'lr': 0.00019941742872622842, 'samples': 1251296, 'steps': 2443, 'loss/train': 2.164236068725586} -09/20/2021 22:57:26 - INFO - __main__ - Step 39104: {'lr': 0.00019941742872622842, 'samples': 1251328, 'steps': 2443, 'loss/train': 2.8366005420684814} -09/20/2021 22:57:27 - INFO - __main__ - Step 39105: {'lr': 0.0001994167409811825, 'samples': 1251360, 'steps': 2444, 'loss/train': 0.2713623642921448} -09/20/2021 22:57:28 - INFO - __main__ - Step 39106: {'lr': 0.0001994167409811825, 'samples': 1251392, 'steps': 2444, 'loss/train': 0.1322234719991684} -09/20/2021 22:57:29 - INFO - __main__ - Step 39107: {'lr': 0.0001994167409811825, 'samples': 1251424, 'steps': 2444, 'loss/train': 0.47383180260658264} -09/20/2021 22:57:30 - INFO - __main__ - Step 39108: {'lr': 0.0001994167409811825, 'samples': 1251456, 'steps': 2444, 'loss/train': 1.9775220155715942} -09/20/2021 22:57:30 - INFO - __main__ - Step 39109: {'lr': 0.0001994167409811825, 'samples': 1251488, 'steps': 2444, 'loss/train': 1.9879111051559448} -09/20/2021 22:57:31 - INFO - __main__ - Step 39110: {'lr': 0.0001994167409811825, 'samples': 1251520, 'steps': 2444, 'loss/train': 2.313138008117676} -09/20/2021 22:57:32 - INFO - __main__ - Step 39111: {'lr': 0.0001994167409811825, 'samples': 1251552, 'steps': 2444, 'loss/train': 1.8099409341812134} -09/20/2021 22:57:33 - INFO - __main__ - Step 39112: {'lr': 0.0001994167409811825, 'samples': 1251584, 'steps': 2444, 'loss/train': 2.3848094940185547} -09/20/2021 22:57:33 - INFO - __main__ - Step 39113: {'lr': 0.0001994167409811825, 'samples': 1251616, 'steps': 2444, 'loss/train': 2.884364604949951} -09/20/2021 22:57:34 - INFO - __main__ - Step 39114: {'lr': 0.0001994167409811825, 'samples': 1251648, 'steps': 2444, 'loss/train': 1.7066595554351807} -09/20/2021 22:57:35 - INFO - __main__ - Step 39115: {'lr': 0.0001994167409811825, 'samples': 1251680, 'steps': 2444, 'loss/train': 1.6136780977249146} -09/20/2021 22:57:36 - INFO - __main__ - Step 39116: {'lr': 0.0001994167409811825, 'samples': 1251712, 'steps': 2444, 'loss/train': 2.0395894050598145} -09/20/2021 22:57:36 - INFO - __main__ - Step 39117: {'lr': 0.0001994167409811825, 'samples': 1251744, 'steps': 2444, 'loss/train': 2.2076258659362793} -09/20/2021 22:57:37 - INFO - __main__ - Step 39118: {'lr': 0.0001994167409811825, 'samples': 1251776, 'steps': 2444, 'loss/train': 2.3083136081695557} -09/20/2021 22:57:38 - INFO - __main__ - Step 39119: {'lr': 0.0001994167409811825, 'samples': 1251808, 'steps': 2444, 'loss/train': 2.6719863414764404} -09/20/2021 22:57:39 - INFO - __main__ - Step 39120: {'lr': 0.0001994167409811825, 'samples': 1251840, 'steps': 2444, 'loss/train': 2.2442514896392822} -09/20/2021 22:57:39 - INFO - __main__ - Step 39121: {'lr': 0.0001994160528316103, 'samples': 1251872, 'steps': 2445, 'loss/train': 1.61607027053833} -09/20/2021 22:57:40 - INFO - __main__ - Step 39122: {'lr': 0.0001994160528316103, 'samples': 1251904, 'steps': 2445, 'loss/train': 2.134852409362793} -09/20/2021 22:57:41 - INFO - __main__ - Step 39123: {'lr': 0.0001994160528316103, 'samples': 1251936, 'steps': 2445, 'loss/train': 2.4017672538757324} -09/20/2021 22:57:42 - INFO - __main__ - Step 39124: {'lr': 0.0001994160528316103, 'samples': 1251968, 'steps': 2445, 'loss/train': 1.3438334465026855} -09/20/2021 22:57:43 - INFO - __main__ - Step 39125: {'lr': 0.0001994160528316103, 'samples': 1252000, 'steps': 2445, 'loss/train': 2.406996488571167} -09/20/2021 22:57:43 - INFO - __main__ - Step 39126: {'lr': 0.0001994160528316103, 'samples': 1252032, 'steps': 2445, 'loss/train': 1.8993169069290161} -09/20/2021 22:57:44 - INFO - __main__ - Step 39127: {'lr': 0.0001994160528316103, 'samples': 1252064, 'steps': 2445, 'loss/train': 1.6604784727096558} -09/20/2021 22:57:45 - INFO - __main__ - Step 39128: {'lr': 0.0001994160528316103, 'samples': 1252096, 'steps': 2445, 'loss/train': 1.9302250146865845} -09/20/2021 22:57:46 - INFO - __main__ - Step 39129: {'lr': 0.0001994160528316103, 'samples': 1252128, 'steps': 2445, 'loss/train': 1.6753243207931519} -09/20/2021 22:57:46 - INFO - __main__ - Step 39130: {'lr': 0.0001994160528316103, 'samples': 1252160, 'steps': 2445, 'loss/train': 2.72251558303833} -09/20/2021 22:57:47 - INFO - __main__ - Step 39131: {'lr': 0.0001994160528316103, 'samples': 1252192, 'steps': 2445, 'loss/train': 2.5807228088378906} -09/20/2021 22:57:48 - INFO - __main__ - Step 39132: {'lr': 0.0001994160528316103, 'samples': 1252224, 'steps': 2445, 'loss/train': 2.0273258686065674} -09/20/2021 22:57:49 - INFO - __main__ - Step 39133: {'lr': 0.0001994160528316103, 'samples': 1252256, 'steps': 2445, 'loss/train': 1.6249051094055176} -09/20/2021 22:57:49 - INFO - __main__ - Step 39134: {'lr': 0.0001994160528316103, 'samples': 1252288, 'steps': 2445, 'loss/train': 2.45540452003479} -09/20/2021 22:57:50 - INFO - __main__ - Step 39135: {'lr': 0.0001994160528316103, 'samples': 1252320, 'steps': 2445, 'loss/train': 2.780933380126953} -09/20/2021 22:57:51 - INFO - __main__ - Step 39136: {'lr': 0.0001994160528316103, 'samples': 1252352, 'steps': 2445, 'loss/train': 2.191678285598755} -09/20/2021 22:57:52 - INFO - __main__ - Step 39137: {'lr': 0.0001994153642775145, 'samples': 1252384, 'steps': 2446, 'loss/train': 2.1506412029266357} -09/20/2021 22:57:53 - INFO - __main__ - Step 39138: {'lr': 0.0001994153642775145, 'samples': 1252416, 'steps': 2446, 'loss/train': 2.6040401458740234} -09/20/2021 22:57:54 - INFO - __main__ - Step 39139: {'lr': 0.0001994153642775145, 'samples': 1252448, 'steps': 2446, 'loss/train': 2.015763521194458} -09/20/2021 22:57:54 - INFO - __main__ - Step 39140: {'lr': 0.0001994153642775145, 'samples': 1252480, 'steps': 2446, 'loss/train': 2.492258071899414} -09/20/2021 22:57:55 - INFO - __main__ - Step 39141: {'lr': 0.0001994153642775145, 'samples': 1252512, 'steps': 2446, 'loss/train': 2.4818780422210693} -09/20/2021 22:57:56 - INFO - __main__ - Step 39142: {'lr': 0.0001994153642775145, 'samples': 1252544, 'steps': 2446, 'loss/train': 1.5095582008361816} -09/20/2021 22:57:57 - INFO - __main__ - Step 39143: {'lr': 0.0001994153642775145, 'samples': 1252576, 'steps': 2446, 'loss/train': 1.7635492086410522} -09/20/2021 22:57:57 - INFO - __main__ - Step 39144: {'lr': 0.0001994153642775145, 'samples': 1252608, 'steps': 2446, 'loss/train': 2.13207745552063} -09/20/2021 22:57:58 - INFO - __main__ - Step 39145: {'lr': 0.0001994153642775145, 'samples': 1252640, 'steps': 2446, 'loss/train': 2.0265731811523438} -09/20/2021 22:57:59 - INFO - __main__ - Step 39146: {'lr': 0.0001994153642775145, 'samples': 1252672, 'steps': 2446, 'loss/train': 2.4114856719970703} -09/20/2021 22:58:00 - INFO - __main__ - Step 39147: {'lr': 0.0001994153642775145, 'samples': 1252704, 'steps': 2446, 'loss/train': 2.7209455966949463} -09/20/2021 22:58:00 - INFO - __main__ - Step 39148: {'lr': 0.0001994153642775145, 'samples': 1252736, 'steps': 2446, 'loss/train': 1.7889084815979004} -09/20/2021 22:58:01 - INFO - __main__ - Step 39149: {'lr': 0.0001994153642775145, 'samples': 1252768, 'steps': 2446, 'loss/train': 1.7906261682510376} -09/20/2021 22:58:02 - INFO - __main__ - Step 39150: {'lr': 0.0001994153642775145, 'samples': 1252800, 'steps': 2446, 'loss/train': 1.2973179817199707} -09/20/2021 22:58:03 - INFO - __main__ - Step 39151: {'lr': 0.0001994153642775145, 'samples': 1252832, 'steps': 2446, 'loss/train': 2.7997236251831055} -09/20/2021 22:58:03 - INFO - __main__ - Step 39152: {'lr': 0.0001994153642775145, 'samples': 1252864, 'steps': 2446, 'loss/train': 2.1069324016571045} -09/20/2021 22:58:04 - INFO - __main__ - Step 39153: {'lr': 0.00019941467531889802, 'samples': 1252896, 'steps': 2447, 'loss/train': 1.1839925050735474} -09/20/2021 22:58:05 - INFO - __main__ - Step 39154: {'lr': 0.00019941467531889802, 'samples': 1252928, 'steps': 2447, 'loss/train': 2.4602935314178467} -09/20/2021 22:58:06 - INFO - __main__ - Step 39155: {'lr': 0.00019941467531889802, 'samples': 1252960, 'steps': 2447, 'loss/train': 1.991212248802185} -09/20/2021 22:58:07 - INFO - __main__ - Step 39156: {'lr': 0.00019941467531889802, 'samples': 1252992, 'steps': 2447, 'loss/train': 2.283262252807617} -09/20/2021 22:58:07 - INFO - __main__ - Step 39157: {'lr': 0.00019941467531889802, 'samples': 1253024, 'steps': 2447, 'loss/train': 2.4114532470703125} -09/20/2021 22:58:08 - INFO - __main__ - Step 39158: {'lr': 0.00019941467531889802, 'samples': 1253056, 'steps': 2447, 'loss/train': 0.8359308242797852} -09/20/2021 22:58:09 - INFO - __main__ - Step 39159: {'lr': 0.00019941467531889802, 'samples': 1253088, 'steps': 2447, 'loss/train': 0.6816631555557251} -09/20/2021 22:58:10 - INFO - __main__ - Step 39160: {'lr': 0.00019941467531889802, 'samples': 1253120, 'steps': 2447, 'loss/train': 2.406878709793091} -09/20/2021 22:58:10 - INFO - __main__ - Step 39161: {'lr': 0.00019941467531889802, 'samples': 1253152, 'steps': 2447, 'loss/train': 1.9004546403884888} -09/20/2021 22:58:11 - INFO - __main__ - Step 39162: {'lr': 0.00019941467531889802, 'samples': 1253184, 'steps': 2447, 'loss/train': 2.141981840133667} -09/20/2021 22:58:12 - INFO - __main__ - Step 39163: {'lr': 0.00019941467531889802, 'samples': 1253216, 'steps': 2447, 'loss/train': 1.741616129875183} -09/20/2021 22:58:13 - INFO - __main__ - Step 39164: {'lr': 0.00019941467531889802, 'samples': 1253248, 'steps': 2447, 'loss/train': 1.9630382061004639} -09/20/2021 22:58:13 - INFO - __main__ - Step 39165: {'lr': 0.00019941467531889802, 'samples': 1253280, 'steps': 2447, 'loss/train': 2.223994255065918} -09/20/2021 22:58:14 - INFO - __main__ - Step 39166: {'lr': 0.00019941467531889802, 'samples': 1253312, 'steps': 2447, 'loss/train': 2.4528326988220215} -09/20/2021 22:58:16 - INFO - __main__ - Step 39167: {'lr': 0.00019941467531889802, 'samples': 1253344, 'steps': 2447, 'loss/train': 2.558478832244873} -09/20/2021 22:58:17 - INFO - __main__ - Step 39168: {'lr': 0.00019941467531889802, 'samples': 1253376, 'steps': 2447, 'loss/train': 1.8758604526519775} -09/20/2021 22:58:18 - INFO - __main__ - Step 39169: {'lr': 0.0001994139859557636, 'samples': 1253408, 'steps': 2448, 'loss/train': 0.5126200914382935} -09/20/2021 22:58:18 - INFO - __main__ - Step 39170: {'lr': 0.0001994139859557636, 'samples': 1253440, 'steps': 2448, 'loss/train': 0.17947900295257568} -09/20/2021 22:58:19 - INFO - __main__ - Step 39171: {'lr': 0.0001994139859557636, 'samples': 1253472, 'steps': 2448, 'loss/train': 0.2955796718597412} -09/20/2021 22:58:20 - INFO - __main__ - Step 39172: {'lr': 0.0001994139859557636, 'samples': 1253504, 'steps': 2448, 'loss/train': 1.9009686708450317} -09/20/2021 22:58:21 - INFO - __main__ - Step 39173: {'lr': 0.0001994139859557636, 'samples': 1253536, 'steps': 2448, 'loss/train': 2.4427216053009033} -09/20/2021 22:58:21 - INFO - __main__ - Step 39174: {'lr': 0.0001994139859557636, 'samples': 1253568, 'steps': 2448, 'loss/train': 2.695406913757324} -09/20/2021 22:58:22 - INFO - __main__ - Step 39175: {'lr': 0.0001994139859557636, 'samples': 1253600, 'steps': 2448, 'loss/train': 1.7687265872955322} -09/20/2021 22:58:23 - INFO - __main__ - Step 39176: {'lr': 0.0001994139859557636, 'samples': 1253632, 'steps': 2448, 'loss/train': 1.9368376731872559} -09/20/2021 22:58:24 - INFO - __main__ - Step 39177: {'lr': 0.0001994139859557636, 'samples': 1253664, 'steps': 2448, 'loss/train': 2.601811170578003} -09/20/2021 22:58:24 - INFO - __main__ - Step 39178: {'lr': 0.0001994139859557636, 'samples': 1253696, 'steps': 2448, 'loss/train': 1.045715570449829} -09/20/2021 22:58:25 - INFO - __main__ - Step 39179: {'lr': 0.0001994139859557636, 'samples': 1253728, 'steps': 2448, 'loss/train': 2.093733072280884} -09/20/2021 22:58:26 - INFO - __main__ - Step 39180: {'lr': 0.0001994139859557636, 'samples': 1253760, 'steps': 2448, 'loss/train': 2.728896141052246} -09/20/2021 22:58:27 - INFO - __main__ - Step 39181: {'lr': 0.0001994139859557636, 'samples': 1253792, 'steps': 2448, 'loss/train': 3.7734081745147705} -09/20/2021 22:58:27 - INFO - __main__ - Step 39182: {'lr': 0.0001994139859557636, 'samples': 1253824, 'steps': 2448, 'loss/train': 1.3475209474563599} -09/20/2021 22:58:28 - INFO - __main__ - Step 39183: {'lr': 0.0001994139859557636, 'samples': 1253856, 'steps': 2448, 'loss/train': 1.3569788932800293} -09/20/2021 22:58:29 - INFO - __main__ - Step 39184: {'lr': 0.0001994139859557636, 'samples': 1253888, 'steps': 2448, 'loss/train': 2.0107860565185547} -09/20/2021 22:58:30 - INFO - __main__ - Step 39185: {'lr': 0.00019941329618811403, 'samples': 1253920, 'steps': 2449, 'loss/train': 1.6768280267715454} -09/20/2021 22:58:30 - INFO - __main__ - Step 39186: {'lr': 0.00019941329618811403, 'samples': 1253952, 'steps': 2449, 'loss/train': 2.6300065517425537} -09/20/2021 22:58:31 - INFO - __main__ - Step 39187: {'lr': 0.00019941329618811403, 'samples': 1253984, 'steps': 2449, 'loss/train': 2.6532883644104004} -09/20/2021 22:58:32 - INFO - __main__ - Step 39188: {'lr': 0.00019941329618811403, 'samples': 1254016, 'steps': 2449, 'loss/train': 2.6380231380462646} -09/20/2021 22:58:33 - INFO - __main__ - Step 39189: {'lr': 0.00019941329618811403, 'samples': 1254048, 'steps': 2449, 'loss/train': 2.6252834796905518} -09/20/2021 22:58:33 - INFO - __main__ - Step 39190: {'lr': 0.00019941329618811403, 'samples': 1254080, 'steps': 2449, 'loss/train': 2.2727015018463135} -09/20/2021 22:58:34 - INFO - __main__ - Step 39191: {'lr': 0.00019941329618811403, 'samples': 1254112, 'steps': 2449, 'loss/train': 2.6083810329437256} -09/20/2021 22:58:35 - INFO - __main__ - Step 39192: {'lr': 0.00019941329618811403, 'samples': 1254144, 'steps': 2449, 'loss/train': 0.2833653688430786} -09/20/2021 22:58:36 - INFO - __main__ - Step 39193: {'lr': 0.00019941329618811403, 'samples': 1254176, 'steps': 2449, 'loss/train': 2.869945764541626} -09/20/2021 22:58:36 - INFO - __main__ - Step 39194: {'lr': 0.00019941329618811403, 'samples': 1254208, 'steps': 2449, 'loss/train': 2.2293238639831543} -09/20/2021 22:58:37 - INFO - __main__ - Step 39195: {'lr': 0.00019941329618811403, 'samples': 1254240, 'steps': 2449, 'loss/train': 2.5931711196899414} -09/20/2021 22:58:38 - INFO - __main__ - Step 39196: {'lr': 0.00019941329618811403, 'samples': 1254272, 'steps': 2449, 'loss/train': 2.201979875564575} -09/20/2021 22:58:40 - INFO - __main__ - Step 39197: {'lr': 0.00019941329618811403, 'samples': 1254304, 'steps': 2449, 'loss/train': 1.9147380590438843} -09/20/2021 22:58:40 - INFO - __main__ - Step 39198: {'lr': 0.00019941329618811403, 'samples': 1254336, 'steps': 2449, 'loss/train': 3.172839879989624} -09/20/2021 22:58:41 - INFO - __main__ - Step 39199: {'lr': 0.00019941329618811403, 'samples': 1254368, 'steps': 2449, 'loss/train': 2.7939603328704834} -09/20/2021 22:58:42 - INFO - __main__ - Step 39200: {'lr': 0.00019941329618811403, 'samples': 1254400, 'steps': 2449, 'loss/train': 0.8460861444473267} -09/20/2021 22:58:43 - INFO - __main__ - Step 39201: {'lr': 0.00019941260601595218, 'samples': 1254432, 'steps': 2450, 'loss/train': 1.8909369707107544} -09/20/2021 22:58:44 - INFO - __main__ - Step 39202: {'lr': 0.00019941260601595218, 'samples': 1254464, 'steps': 2450, 'loss/train': 1.9404292106628418} -09/20/2021 22:58:44 - INFO - __main__ - Step 39203: {'lr': 0.00019941260601595218, 'samples': 1254496, 'steps': 2450, 'loss/train': 1.9295554161071777} -09/20/2021 22:58:45 - INFO - __main__ - Step 39204: {'lr': 0.00019941260601595218, 'samples': 1254528, 'steps': 2450, 'loss/train': 1.5292619466781616} -09/20/2021 22:58:46 - INFO - __main__ - Step 39205: {'lr': 0.00019941260601595218, 'samples': 1254560, 'steps': 2450, 'loss/train': 1.8088891506195068} -09/20/2021 22:58:47 - INFO - __main__ - Step 39206: {'lr': 0.00019941260601595218, 'samples': 1254592, 'steps': 2450, 'loss/train': 1.4870564937591553} -09/20/2021 22:58:47 - INFO - __main__ - Step 39207: {'lr': 0.00019941260601595218, 'samples': 1254624, 'steps': 2450, 'loss/train': 2.126716375350952} -09/20/2021 22:58:48 - INFO - __main__ - Step 39208: {'lr': 0.00019941260601595218, 'samples': 1254656, 'steps': 2450, 'loss/train': 1.9416327476501465} -09/20/2021 22:58:49 - INFO - __main__ - Step 39209: {'lr': 0.00019941260601595218, 'samples': 1254688, 'steps': 2450, 'loss/train': 2.128319501876831} -09/20/2021 22:58:50 - INFO - __main__ - Step 39210: {'lr': 0.00019941260601595218, 'samples': 1254720, 'steps': 2450, 'loss/train': 2.926360607147217} -09/20/2021 22:58:50 - INFO - __main__ - Step 39211: {'lr': 0.00019941260601595218, 'samples': 1254752, 'steps': 2450, 'loss/train': 1.9892067909240723} -09/20/2021 22:58:51 - INFO - __main__ - Step 39212: {'lr': 0.00019941260601595218, 'samples': 1254784, 'steps': 2450, 'loss/train': 2.5476667881011963} -09/20/2021 22:58:52 - INFO - __main__ - Step 39213: {'lr': 0.00019941260601595218, 'samples': 1254816, 'steps': 2450, 'loss/train': 1.219546914100647} -09/20/2021 22:58:53 - INFO - __main__ - Step 39214: {'lr': 0.00019941260601595218, 'samples': 1254848, 'steps': 2450, 'loss/train': 3.7425730228424072} -09/20/2021 22:58:53 - INFO - __main__ - Step 39215: {'lr': 0.00019941260601595218, 'samples': 1254880, 'steps': 2450, 'loss/train': 3.345874071121216} -09/20/2021 22:58:54 - INFO - __main__ - Step 39216: {'lr': 0.00019941260601595218, 'samples': 1254912, 'steps': 2450, 'loss/train': 3.327622890472412} -09/20/2021 22:58:55 - INFO - __main__ - Step 39217: {'lr': 0.00019941191543928078, 'samples': 1254944, 'steps': 2451, 'loss/train': 1.3732136487960815} -09/20/2021 22:58:56 - INFO - __main__ - Step 39218: {'lr': 0.00019941191543928078, 'samples': 1254976, 'steps': 2451, 'loss/train': 3.2852299213409424} -09/20/2021 22:58:56 - INFO - __main__ - Step 39219: {'lr': 0.00019941191543928078, 'samples': 1255008, 'steps': 2451, 'loss/train': 1.6825655698776245} -09/20/2021 22:58:57 - INFO - __main__ - Step 39220: {'lr': 0.00019941191543928078, 'samples': 1255040, 'steps': 2451, 'loss/train': 2.117384195327759} -09/20/2021 22:58:58 - INFO - __main__ - Step 39221: {'lr': 0.00019941191543928078, 'samples': 1255072, 'steps': 2451, 'loss/train': 2.565218687057495} -09/20/2021 22:58:59 - INFO - __main__ - Step 39222: {'lr': 0.00019941191543928078, 'samples': 1255104, 'steps': 2451, 'loss/train': 2.0871450901031494} -09/20/2021 22:58:59 - INFO - __main__ - Step 39223: {'lr': 0.00019941191543928078, 'samples': 1255136, 'steps': 2451, 'loss/train': 1.5654197931289673} -09/20/2021 22:59:00 - INFO - __main__ - Step 39224: {'lr': 0.00019941191543928078, 'samples': 1255168, 'steps': 2451, 'loss/train': 2.0356221199035645} -09/20/2021 22:59:01 - INFO - __main__ - Step 39225: {'lr': 0.00019941191543928078, 'samples': 1255200, 'steps': 2451, 'loss/train': 2.7985587120056152} -09/20/2021 22:59:02 - INFO - __main__ - Step 39226: {'lr': 0.00019941191543928078, 'samples': 1255232, 'steps': 2451, 'loss/train': 1.957076072692871} -09/20/2021 22:59:02 - INFO - __main__ - Step 39227: {'lr': 0.00019941191543928078, 'samples': 1255264, 'steps': 2451, 'loss/train': 1.0053620338439941} -09/20/2021 22:59:03 - INFO - __main__ - Step 39228: {'lr': 0.00019941191543928078, 'samples': 1255296, 'steps': 2451, 'loss/train': 1.1160482168197632} -09/20/2021 22:59:04 - INFO - __main__ - Step 39229: {'lr': 0.00019941191543928078, 'samples': 1255328, 'steps': 2451, 'loss/train': 0.8338621258735657} -09/20/2021 22:59:05 - INFO - __main__ - Step 39230: {'lr': 0.00019941191543928078, 'samples': 1255360, 'steps': 2451, 'loss/train': 0.7885697484016418} -09/20/2021 22:59:05 - INFO - __main__ - Step 39231: {'lr': 0.00019941191543928078, 'samples': 1255392, 'steps': 2451, 'loss/train': 0.7546660900115967} -09/20/2021 22:59:06 - INFO - __main__ - Step 39232: {'lr': 0.00019941191543928078, 'samples': 1255424, 'steps': 2451, 'loss/train': 0.8392519354820251} -09/20/2021 22:59:07 - INFO - __main__ - Step 39233: {'lr': 0.00019941122445810272, 'samples': 1255456, 'steps': 2452, 'loss/train': 0.5006834268569946} -09/20/2021 22:59:08 - INFO - __main__ - Step 39234: {'lr': 0.00019941122445810272, 'samples': 1255488, 'steps': 2452, 'loss/train': 0.6018502116203308} -09/20/2021 22:59:09 - INFO - __main__ - Step 39235: {'lr': 0.00019941122445810272, 'samples': 1255520, 'steps': 2452, 'loss/train': 1.0547611713409424} -09/20/2021 22:59:10 - INFO - __main__ - Step 39236: {'lr': 0.00019941122445810272, 'samples': 1255552, 'steps': 2452, 'loss/train': 1.8668407201766968} -09/20/2021 22:59:11 - INFO - __main__ - Step 39237: {'lr': 0.00019941122445810272, 'samples': 1255584, 'steps': 2452, 'loss/train': 0.5714860558509827} -09/20/2021 22:59:11 - INFO - __main__ - Step 39238: {'lr': 0.00019941122445810272, 'samples': 1255616, 'steps': 2452, 'loss/train': 2.9890847206115723} -09/20/2021 22:59:12 - INFO - __main__ - Step 39239: {'lr': 0.00019941122445810272, 'samples': 1255648, 'steps': 2452, 'loss/train': 2.1019506454467773} -09/20/2021 22:59:13 - INFO - __main__ - Step 39240: {'lr': 0.00019941122445810272, 'samples': 1255680, 'steps': 2452, 'loss/train': 2.9336888790130615} -09/20/2021 22:59:14 - INFO - __main__ - Step 39241: {'lr': 0.00019941122445810272, 'samples': 1255712, 'steps': 2452, 'loss/train': 1.8568618297576904} -09/20/2021 22:59:14 - INFO - __main__ - Step 39242: {'lr': 0.00019941122445810272, 'samples': 1255744, 'steps': 2452, 'loss/train': 2.3064842224121094} -09/20/2021 22:59:15 - INFO - __main__ - Step 39243: {'lr': 0.00019941122445810272, 'samples': 1255776, 'steps': 2452, 'loss/train': 2.9301857948303223} -09/20/2021 22:59:16 - INFO - __main__ - Step 39244: {'lr': 0.00019941122445810272, 'samples': 1255808, 'steps': 2452, 'loss/train': 2.2593138217926025} -09/20/2021 22:59:17 - INFO - __main__ - Step 39245: {'lr': 0.00019941122445810272, 'samples': 1255840, 'steps': 2452, 'loss/train': 1.1543986797332764} -09/20/2021 22:59:17 - INFO - __main__ - Step 39246: {'lr': 0.00019941122445810272, 'samples': 1255872, 'steps': 2452, 'loss/train': 2.019789934158325} -09/20/2021 22:59:18 - INFO - __main__ - Step 39247: {'lr': 0.00019941122445810272, 'samples': 1255904, 'steps': 2452, 'loss/train': 2.0709218978881836} -09/20/2021 22:59:19 - INFO - __main__ - Step 39248: {'lr': 0.00019941122445810272, 'samples': 1255936, 'steps': 2452, 'loss/train': 1.7333478927612305} -09/20/2021 22:59:20 - INFO - __main__ - Step 39249: {'lr': 0.00019941053307242075, 'samples': 1255968, 'steps': 2453, 'loss/train': 1.402142882347107} -09/20/2021 22:59:20 - INFO - __main__ - Step 39250: {'lr': 0.00019941053307242075, 'samples': 1256000, 'steps': 2453, 'loss/train': 1.8112750053405762} -09/20/2021 22:59:21 - INFO - __main__ - Step 39251: {'lr': 0.00019941053307242075, 'samples': 1256032, 'steps': 2453, 'loss/train': 2.520895004272461} -09/20/2021 22:59:22 - INFO - __main__ - Step 39252: {'lr': 0.00019941053307242075, 'samples': 1256064, 'steps': 2453, 'loss/train': 1.855506181716919} -09/20/2021 22:59:23 - INFO - __main__ - Step 39253: {'lr': 0.00019941053307242075, 'samples': 1256096, 'steps': 2453, 'loss/train': 1.6873239278793335} -09/20/2021 22:59:23 - INFO - __main__ - Step 39254: {'lr': 0.00019941053307242075, 'samples': 1256128, 'steps': 2453, 'loss/train': 1.8021860122680664} -09/20/2021 22:59:24 - INFO - __main__ - Step 39255: {'lr': 0.00019941053307242075, 'samples': 1256160, 'steps': 2453, 'loss/train': 0.44417664408683777} -09/20/2021 22:59:25 - INFO - __main__ - Step 39256: {'lr': 0.00019941053307242075, 'samples': 1256192, 'steps': 2453, 'loss/train': 2.315558433532715} -09/20/2021 22:59:26 - INFO - __main__ - Step 39257: {'lr': 0.00019941053307242075, 'samples': 1256224, 'steps': 2453, 'loss/train': 1.434093713760376} -09/20/2021 22:59:26 - INFO - __main__ - Step 39258: {'lr': 0.00019941053307242075, 'samples': 1256256, 'steps': 2453, 'loss/train': 2.110515832901001} -09/20/2021 22:59:27 - INFO - __main__ - Step 39259: {'lr': 0.00019941053307242075, 'samples': 1256288, 'steps': 2453, 'loss/train': 1.6800730228424072} -09/20/2021 22:59:28 - INFO - __main__ - Step 39260: {'lr': 0.00019941053307242075, 'samples': 1256320, 'steps': 2453, 'loss/train': 2.497673511505127} -09/20/2021 22:59:29 - INFO - __main__ - Step 39261: {'lr': 0.00019941053307242075, 'samples': 1256352, 'steps': 2453, 'loss/train': 2.3366806507110596} -09/20/2021 22:59:29 - INFO - __main__ - Step 39262: {'lr': 0.00019941053307242075, 'samples': 1256384, 'steps': 2453, 'loss/train': 1.602041482925415} -09/20/2021 22:59:30 - INFO - __main__ - Step 39263: {'lr': 0.00019941053307242075, 'samples': 1256416, 'steps': 2453, 'loss/train': 1.8719435930252075} -09/20/2021 22:59:31 - INFO - __main__ - Step 39264: {'lr': 0.00019941053307242075, 'samples': 1256448, 'steps': 2453, 'loss/train': 2.0675384998321533} -09/20/2021 22:59:32 - INFO - __main__ - Step 39265: {'lr': 0.00019940984128223775, 'samples': 1256480, 'steps': 2454, 'loss/train': 1.6441189050674438} -09/20/2021 22:59:33 - INFO - __main__ - Step 39266: {'lr': 0.00019940984128223775, 'samples': 1256512, 'steps': 2454, 'loss/train': 0.3283960521221161} -09/20/2021 22:59:34 - INFO - __main__ - Step 39267: {'lr': 0.00019940984128223775, 'samples': 1256544, 'steps': 2454, 'loss/train': 1.7645152807235718} -09/20/2021 22:59:35 - INFO - __main__ - Step 39268: {'lr': 0.00019940984128223775, 'samples': 1256576, 'steps': 2454, 'loss/train': 2.202216863632202} -09/20/2021 22:59:35 - INFO - __main__ - Step 39269: {'lr': 0.00019940984128223775, 'samples': 1256608, 'steps': 2454, 'loss/train': 2.310549259185791} -09/20/2021 22:59:36 - INFO - __main__ - Step 39270: {'lr': 0.00019940984128223775, 'samples': 1256640, 'steps': 2454, 'loss/train': 2.695888042449951} -09/20/2021 22:59:37 - INFO - __main__ - Step 39271: {'lr': 0.00019940984128223775, 'samples': 1256672, 'steps': 2454, 'loss/train': 2.2863965034484863} -09/20/2021 22:59:38 - INFO - __main__ - Step 39272: {'lr': 0.00019940984128223775, 'samples': 1256704, 'steps': 2454, 'loss/train': 2.355604887008667} -09/20/2021 22:59:38 - INFO - __main__ - Step 39273: {'lr': 0.00019940984128223775, 'samples': 1256736, 'steps': 2454, 'loss/train': 2.4250316619873047} -09/20/2021 22:59:39 - INFO - __main__ - Step 39274: {'lr': 0.00019940984128223775, 'samples': 1256768, 'steps': 2454, 'loss/train': 0.7255918979644775} -09/20/2021 22:59:40 - INFO - __main__ - Step 39275: {'lr': 0.00019940984128223775, 'samples': 1256800, 'steps': 2454, 'loss/train': 2.194606304168701} -09/20/2021 22:59:41 - INFO - __main__ - Step 39276: {'lr': 0.00019940984128223775, 'samples': 1256832, 'steps': 2454, 'loss/train': 1.806969404220581} -09/20/2021 22:59:41 - INFO - __main__ - Step 39277: {'lr': 0.00019940984128223775, 'samples': 1256864, 'steps': 2454, 'loss/train': 1.6475539207458496} -09/20/2021 22:59:42 - INFO - __main__ - Step 39278: {'lr': 0.00019940984128223775, 'samples': 1256896, 'steps': 2454, 'loss/train': 2.7848026752471924} -09/20/2021 22:59:43 - INFO - __main__ - Step 39279: {'lr': 0.00019940984128223775, 'samples': 1256928, 'steps': 2454, 'loss/train': 2.354095220565796} -09/20/2021 22:59:44 - INFO - __main__ - Step 39280: {'lr': 0.00019940984128223775, 'samples': 1256960, 'steps': 2454, 'loss/train': 2.1131107807159424} -09/20/2021 22:59:45 - INFO - __main__ - Step 39281: {'lr': 0.00019940914908755643, 'samples': 1256992, 'steps': 2455, 'loss/train': 0.6367318630218506} -09/20/2021 22:59:45 - INFO - __main__ - Step 39282: {'lr': 0.00019940914908755643, 'samples': 1257024, 'steps': 2455, 'loss/train': 1.2329128980636597} -09/20/2021 22:59:46 - INFO - __main__ - Step 39283: {'lr': 0.00019940914908755643, 'samples': 1257056, 'steps': 2455, 'loss/train': 1.0786361694335938} -09/20/2021 22:59:47 - INFO - __main__ - Step 39284: {'lr': 0.00019940914908755643, 'samples': 1257088, 'steps': 2455, 'loss/train': 0.9468652606010437} -09/20/2021 22:59:48 - INFO - __main__ - Step 39285: {'lr': 0.00019940914908755643, 'samples': 1257120, 'steps': 2455, 'loss/train': 1.5874831676483154} -09/20/2021 22:59:48 - INFO - __main__ - Step 39286: {'lr': 0.00019940914908755643, 'samples': 1257152, 'steps': 2455, 'loss/train': 2.4695088863372803} -09/20/2021 22:59:49 - INFO - __main__ - Step 39287: {'lr': 0.00019940914908755643, 'samples': 1257184, 'steps': 2455, 'loss/train': 1.849776268005371} -09/20/2021 22:59:50 - INFO - __main__ - Step 39288: {'lr': 0.00019940914908755643, 'samples': 1257216, 'steps': 2455, 'loss/train': 1.719133973121643} -09/20/2021 22:59:51 - INFO - __main__ - Step 39289: {'lr': 0.00019940914908755643, 'samples': 1257248, 'steps': 2455, 'loss/train': 0.6926193237304688} -09/20/2021 22:59:51 - INFO - __main__ - Step 39290: {'lr': 0.00019940914908755643, 'samples': 1257280, 'steps': 2455, 'loss/train': 1.9792147874832153} -09/20/2021 22:59:52 - INFO - __main__ - Step 39291: {'lr': 0.00019940914908755643, 'samples': 1257312, 'steps': 2455, 'loss/train': 1.904662013053894} -09/20/2021 22:59:53 - INFO - __main__ - Step 39292: {'lr': 0.00019940914908755643, 'samples': 1257344, 'steps': 2455, 'loss/train': 2.8148348331451416} -09/20/2021 22:59:54 - INFO - __main__ - Step 39293: {'lr': 0.00019940914908755643, 'samples': 1257376, 'steps': 2455, 'loss/train': 1.7365258932113647} -09/20/2021 22:59:54 - INFO - __main__ - Step 39294: {'lr': 0.00019940914908755643, 'samples': 1257408, 'steps': 2455, 'loss/train': 1.6766656637191772} -09/20/2021 22:59:55 - INFO - __main__ - Step 39295: {'lr': 0.00019940914908755643, 'samples': 1257440, 'steps': 2455, 'loss/train': 1.6162952184677124} -09/20/2021 22:59:56 - INFO - __main__ - Step 39296: {'lr': 0.00019940914908755643, 'samples': 1257472, 'steps': 2455, 'loss/train': 2.693483352661133} -09/20/2021 22:59:57 - INFO - __main__ - Step 39297: {'lr': 0.00019940845648837972, 'samples': 1257504, 'steps': 2456, 'loss/train': 1.8928916454315186} -09/20/2021 22:59:58 - INFO - __main__ - Step 39298: {'lr': 0.00019940845648837972, 'samples': 1257536, 'steps': 2456, 'loss/train': 1.7813212871551514} -09/20/2021 22:59:59 - INFO - __main__ - Step 39299: {'lr': 0.00019940845648837972, 'samples': 1257568, 'steps': 2456, 'loss/train': 2.270815849304199} -09/20/2021 23:00:00 - INFO - __main__ - Step 39300: {'lr': 0.00019940845648837972, 'samples': 1257600, 'steps': 2456, 'loss/train': 2.191861391067505} -09/20/2021 23:00:00 - INFO - __main__ - Step 39301: {'lr': 0.00019940845648837972, 'samples': 1257632, 'steps': 2456, 'loss/train': 1.4814887046813965} -09/20/2021 23:00:01 - INFO - __main__ - Step 39302: {'lr': 0.00019940845648837972, 'samples': 1257664, 'steps': 2456, 'loss/train': 2.422257423400879} -09/20/2021 23:00:02 - INFO - __main__ - Step 39303: {'lr': 0.00019940845648837972, 'samples': 1257696, 'steps': 2456, 'loss/train': 2.2507529258728027} -09/20/2021 23:00:03 - INFO - __main__ - Step 39304: {'lr': 0.00019940845648837972, 'samples': 1257728, 'steps': 2456, 'loss/train': 3.4056437015533447} -09/20/2021 23:00:03 - INFO - __main__ - Step 39305: {'lr': 0.00019940845648837972, 'samples': 1257760, 'steps': 2456, 'loss/train': 2.1099178791046143} -09/20/2021 23:00:04 - INFO - __main__ - Step 39306: {'lr': 0.00019940845648837972, 'samples': 1257792, 'steps': 2456, 'loss/train': 4.436611175537109} -09/20/2021 23:00:05 - INFO - __main__ - Step 39307: {'lr': 0.00019940845648837972, 'samples': 1257824, 'steps': 2456, 'loss/train': 1.8503329753875732} -09/20/2021 23:00:06 - INFO - __main__ - Step 39308: {'lr': 0.00019940845648837972, 'samples': 1257856, 'steps': 2456, 'loss/train': 2.8158504962921143} -09/20/2021 23:00:06 - INFO - __main__ - Step 39309: {'lr': 0.00019940845648837972, 'samples': 1257888, 'steps': 2456, 'loss/train': 2.0622575283050537} -09/20/2021 23:00:07 - INFO - __main__ - Step 39310: {'lr': 0.00019940845648837972, 'samples': 1257920, 'steps': 2456, 'loss/train': 2.188080072402954} -09/20/2021 23:00:08 - INFO - __main__ - Step 39311: {'lr': 0.00019940845648837972, 'samples': 1257952, 'steps': 2456, 'loss/train': 1.6965423822402954} -09/20/2021 23:00:09 - INFO - __main__ - Step 39312: {'lr': 0.00019940845648837972, 'samples': 1257984, 'steps': 2456, 'loss/train': 1.5885170698165894} -09/20/2021 23:00:09 - INFO - __main__ - Step 39313: {'lr': 0.00019940776348471035, 'samples': 1258016, 'steps': 2457, 'loss/train': 2.174729824066162} -09/20/2021 23:00:10 - INFO - __main__ - Step 39314: {'lr': 0.00019940776348471035, 'samples': 1258048, 'steps': 2457, 'loss/train': 2.5574162006378174} -09/20/2021 23:00:11 - INFO - __main__ - Step 39315: {'lr': 0.00019940776348471035, 'samples': 1258080, 'steps': 2457, 'loss/train': 2.018113851547241} -09/20/2021 23:00:12 - INFO - __main__ - Step 39316: {'lr': 0.00019940776348471035, 'samples': 1258112, 'steps': 2457, 'loss/train': 2.773972988128662} -09/20/2021 23:00:12 - INFO - __main__ - Step 39317: {'lr': 0.00019940776348471035, 'samples': 1258144, 'steps': 2457, 'loss/train': 2.891730546951294} -09/20/2021 23:00:13 - INFO - __main__ - Step 39318: {'lr': 0.00019940776348471035, 'samples': 1258176, 'steps': 2457, 'loss/train': 1.187881588935852} -09/20/2021 23:00:14 - INFO - __main__ - Step 39319: {'lr': 0.00019940776348471035, 'samples': 1258208, 'steps': 2457, 'loss/train': 1.3230534791946411} -09/20/2021 23:00:15 - INFO - __main__ - Step 39320: {'lr': 0.00019940776348471035, 'samples': 1258240, 'steps': 2457, 'loss/train': 1.8305225372314453} -09/20/2021 23:00:15 - INFO - __main__ - Step 39321: {'lr': 0.00019940776348471035, 'samples': 1258272, 'steps': 2457, 'loss/train': 1.8470193147659302} -09/20/2021 23:00:16 - INFO - __main__ - Step 39322: {'lr': 0.00019940776348471035, 'samples': 1258304, 'steps': 2457, 'loss/train': 1.958223819732666} -09/20/2021 23:00:17 - INFO - __main__ - Step 39323: {'lr': 0.00019940776348471035, 'samples': 1258336, 'steps': 2457, 'loss/train': 1.947834849357605} -09/20/2021 23:00:18 - INFO - __main__ - Step 39324: {'lr': 0.00019940776348471035, 'samples': 1258368, 'steps': 2457, 'loss/train': 1.6587674617767334} -09/20/2021 23:00:18 - INFO - __main__ - Step 39325: {'lr': 0.00019940776348471035, 'samples': 1258400, 'steps': 2457, 'loss/train': 2.5481069087982178} -09/20/2021 23:00:19 - INFO - __main__ - Step 39326: {'lr': 0.00019940776348471035, 'samples': 1258432, 'steps': 2457, 'loss/train': 1.9144717454910278} -09/20/2021 23:00:20 - INFO - __main__ - Step 39327: {'lr': 0.00019940776348471035, 'samples': 1258464, 'steps': 2457, 'loss/train': 2.1832973957061768} -09/20/2021 23:00:21 - INFO - __main__ - Step 39328: {'lr': 0.00019940776348471035, 'samples': 1258496, 'steps': 2457, 'loss/train': 2.283059597015381} -09/20/2021 23:00:22 - INFO - __main__ - Step 39329: {'lr': 0.00019940707007655117, 'samples': 1258528, 'steps': 2458, 'loss/train': 2.064851760864258} -09/20/2021 23:00:23 - INFO - __main__ - Step 39330: {'lr': 0.00019940707007655117, 'samples': 1258560, 'steps': 2458, 'loss/train': 1.799355149269104} -09/20/2021 23:00:24 - INFO - __main__ - Step 39331: {'lr': 0.00019940707007655117, 'samples': 1258592, 'steps': 2458, 'loss/train': 2.4233484268188477} -09/20/2021 23:00:24 - INFO - __main__ - Step 39332: {'lr': 0.00019940707007655117, 'samples': 1258624, 'steps': 2458, 'loss/train': 2.3019328117370605} -09/20/2021 23:00:25 - INFO - __main__ - Step 39333: {'lr': 0.00019940707007655117, 'samples': 1258656, 'steps': 2458, 'loss/train': 2.9225239753723145} -09/20/2021 23:00:26 - INFO - __main__ - Step 39334: {'lr': 0.00019940707007655117, 'samples': 1258688, 'steps': 2458, 'loss/train': 1.317747950553894} -09/20/2021 23:00:27 - INFO - __main__ - Step 39335: {'lr': 0.00019940707007655117, 'samples': 1258720, 'steps': 2458, 'loss/train': 1.525661587715149} -09/20/2021 23:00:27 - INFO - __main__ - Step 39336: {'lr': 0.00019940707007655117, 'samples': 1258752, 'steps': 2458, 'loss/train': 2.001814603805542} -09/20/2021 23:00:28 - INFO - __main__ - Step 39337: {'lr': 0.00019940707007655117, 'samples': 1258784, 'steps': 2458, 'loss/train': 1.4563267230987549} -09/20/2021 23:00:29 - INFO - __main__ - Step 39338: {'lr': 0.00019940707007655117, 'samples': 1258816, 'steps': 2458, 'loss/train': 2.3825931549072266} -09/20/2021 23:00:30 - INFO - __main__ - Step 39339: {'lr': 0.00019940707007655117, 'samples': 1258848, 'steps': 2458, 'loss/train': 1.8492958545684814} -09/20/2021 23:00:30 - INFO - __main__ - Step 39340: {'lr': 0.00019940707007655117, 'samples': 1258880, 'steps': 2458, 'loss/train': 2.2534687519073486} -09/20/2021 23:00:31 - INFO - __main__ - Step 39341: {'lr': 0.00019940707007655117, 'samples': 1258912, 'steps': 2458, 'loss/train': 1.6948049068450928} -09/20/2021 23:00:32 - INFO - __main__ - Step 39342: {'lr': 0.00019940707007655117, 'samples': 1258944, 'steps': 2458, 'loss/train': 2.4775991439819336} -09/20/2021 23:00:33 - INFO - __main__ - Step 39343: {'lr': 0.00019940707007655117, 'samples': 1258976, 'steps': 2458, 'loss/train': 1.8614007234573364} -09/20/2021 23:00:33 - INFO - __main__ - Step 39344: {'lr': 0.00019940707007655117, 'samples': 1259008, 'steps': 2458, 'loss/train': 0.2020336091518402} -09/20/2021 23:00:34 - INFO - __main__ - Step 39345: {'lr': 0.00019940637626390502, 'samples': 1259040, 'steps': 2459, 'loss/train': 0.33656591176986694} -09/20/2021 23:00:35 - INFO - __main__ - Step 39346: {'lr': 0.00019940637626390502, 'samples': 1259072, 'steps': 2459, 'loss/train': 2.5835399627685547} -09/20/2021 23:00:36 - INFO - __main__ - Step 39347: {'lr': 0.00019940637626390502, 'samples': 1259104, 'steps': 2459, 'loss/train': 2.513179063796997} -09/20/2021 23:00:37 - INFO - __main__ - Step 39348: {'lr': 0.00019940637626390502, 'samples': 1259136, 'steps': 2459, 'loss/train': 2.1064915657043457} -09/20/2021 23:00:37 - INFO - __main__ - Step 39349: {'lr': 0.00019940637626390502, 'samples': 1259168, 'steps': 2459, 'loss/train': 1.2320886850357056} -09/20/2021 23:00:38 - INFO - __main__ - Step 39350: {'lr': 0.00019940637626390502, 'samples': 1259200, 'steps': 2459, 'loss/train': 2.410975694656372} -09/20/2021 23:00:39 - INFO - __main__ - Step 39351: {'lr': 0.00019940637626390502, 'samples': 1259232, 'steps': 2459, 'loss/train': 1.8494536876678467} -09/20/2021 23:00:40 - INFO - __main__ - Step 39352: {'lr': 0.00019940637626390502, 'samples': 1259264, 'steps': 2459, 'loss/train': 2.3179848194122314} -09/20/2021 23:00:40 - INFO - __main__ - Step 39353: {'lr': 0.00019940637626390502, 'samples': 1259296, 'steps': 2459, 'loss/train': 2.0341038703918457} -09/20/2021 23:00:41 - INFO - __main__ - Step 39354: {'lr': 0.00019940637626390502, 'samples': 1259328, 'steps': 2459, 'loss/train': 2.6524033546447754} -09/20/2021 23:00:42 - INFO - __main__ - Step 39355: {'lr': 0.00019940637626390502, 'samples': 1259360, 'steps': 2459, 'loss/train': 2.537944793701172} -09/20/2021 23:00:43 - INFO - __main__ - Step 39356: {'lr': 0.00019940637626390502, 'samples': 1259392, 'steps': 2459, 'loss/train': 2.5330700874328613} -09/20/2021 23:00:43 - INFO - __main__ - Step 39357: {'lr': 0.00019940637626390502, 'samples': 1259424, 'steps': 2459, 'loss/train': 2.9095990657806396} -09/20/2021 23:00:44 - INFO - __main__ - Step 39358: {'lr': 0.00019940637626390502, 'samples': 1259456, 'steps': 2459, 'loss/train': 2.7688724994659424} -09/20/2021 23:00:45 - INFO - __main__ - Step 39359: {'lr': 0.00019940637626390502, 'samples': 1259488, 'steps': 2459, 'loss/train': 2.411388874053955} -09/20/2021 23:00:46 - INFO - __main__ - Step 39360: {'lr': 0.00019940637626390502, 'samples': 1259520, 'steps': 2459, 'loss/train': 2.117537021636963} -09/20/2021 23:00:47 - INFO - __main__ - Step 39361: {'lr': 0.00019940568204677474, 'samples': 1259552, 'steps': 2460, 'loss/train': 1.1950559616088867} -09/20/2021 23:00:48 - INFO - __main__ - Step 39362: {'lr': 0.00019940568204677474, 'samples': 1259584, 'steps': 2460, 'loss/train': 2.056952714920044} -09/20/2021 23:00:49 - INFO - __main__ - Step 39363: {'lr': 0.00019940568204677474, 'samples': 1259616, 'steps': 2460, 'loss/train': 1.7631351947784424} -09/20/2021 23:00:49 - INFO - __main__ - Step 39364: {'lr': 0.00019940568204677474, 'samples': 1259648, 'steps': 2460, 'loss/train': 2.0555319786071777} -09/20/2021 23:00:50 - INFO - __main__ - Step 39365: {'lr': 0.00019940568204677474, 'samples': 1259680, 'steps': 2460, 'loss/train': 2.6785616874694824} -09/20/2021 23:00:51 - INFO - __main__ - Step 39366: {'lr': 0.00019940568204677474, 'samples': 1259712, 'steps': 2460, 'loss/train': 1.8799940347671509} -09/20/2021 23:00:52 - INFO - __main__ - Step 39367: {'lr': 0.00019940568204677474, 'samples': 1259744, 'steps': 2460, 'loss/train': 2.0580763816833496} -09/20/2021 23:00:52 - INFO - __main__ - Step 39368: {'lr': 0.00019940568204677474, 'samples': 1259776, 'steps': 2460, 'loss/train': 2.21174955368042} -09/20/2021 23:00:53 - INFO - __main__ - Step 39369: {'lr': 0.00019940568204677474, 'samples': 1259808, 'steps': 2460, 'loss/train': 2.388925790786743} -09/20/2021 23:00:54 - INFO - __main__ - Step 39370: {'lr': 0.00019940568204677474, 'samples': 1259840, 'steps': 2460, 'loss/train': 2.11722731590271} -09/20/2021 23:00:55 - INFO - __main__ - Step 39371: {'lr': 0.00019940568204677474, 'samples': 1259872, 'steps': 2460, 'loss/train': 1.8226728439331055} -09/20/2021 23:00:55 - INFO - __main__ - Step 39372: {'lr': 0.00019940568204677474, 'samples': 1259904, 'steps': 2460, 'loss/train': 0.2523401081562042} -09/20/2021 23:00:56 - INFO - __main__ - Step 39373: {'lr': 0.00019940568204677474, 'samples': 1259936, 'steps': 2460, 'loss/train': 0.1732766181230545} -09/20/2021 23:00:57 - INFO - __main__ - Step 39374: {'lr': 0.00019940568204677474, 'samples': 1259968, 'steps': 2460, 'loss/train': 0.3422086238861084} -09/20/2021 23:00:58 - INFO - __main__ - Step 39375: {'lr': 0.00019940568204677474, 'samples': 1260000, 'steps': 2460, 'loss/train': 0.3635479807853699} -09/20/2021 23:00:58 - INFO - __main__ - Step 39376: {'lr': 0.00019940568204677474, 'samples': 1260032, 'steps': 2460, 'loss/train': 1.1399890184402466} -09/20/2021 23:00:59 - INFO - __main__ - Step 39377: {'lr': 0.00019940498742516312, 'samples': 1260064, 'steps': 2461, 'loss/train': 2.096729278564453} -09/20/2021 23:01:00 - INFO - __main__ - Step 39378: {'lr': 0.00019940498742516312, 'samples': 1260096, 'steps': 2461, 'loss/train': 2.3438634872436523} -09/20/2021 23:01:01 - INFO - __main__ - Step 39379: {'lr': 0.00019940498742516312, 'samples': 1260128, 'steps': 2461, 'loss/train': 2.6299431324005127} -09/20/2021 23:01:01 - INFO - __main__ - Step 39380: {'lr': 0.00019940498742516312, 'samples': 1260160, 'steps': 2461, 'loss/train': 2.29618239402771} -09/20/2021 23:01:02 - INFO - __main__ - Step 39381: {'lr': 0.00019940498742516312, 'samples': 1260192, 'steps': 2461, 'loss/train': 1.8309005498886108} -09/20/2021 23:01:03 - INFO - __main__ - Step 39382: {'lr': 0.00019940498742516312, 'samples': 1260224, 'steps': 2461, 'loss/train': 1.4416074752807617} -09/20/2021 23:01:04 - INFO - __main__ - Step 39383: {'lr': 0.00019940498742516312, 'samples': 1260256, 'steps': 2461, 'loss/train': 2.6743898391723633} -09/20/2021 23:01:04 - INFO - __main__ - Step 39384: {'lr': 0.00019940498742516312, 'samples': 1260288, 'steps': 2461, 'loss/train': 2.092905044555664} -09/20/2021 23:01:05 - INFO - __main__ - Step 39385: {'lr': 0.00019940498742516312, 'samples': 1260320, 'steps': 2461, 'loss/train': 1.4426770210266113} -09/20/2021 23:01:06 - INFO - __main__ - Step 39386: {'lr': 0.00019940498742516312, 'samples': 1260352, 'steps': 2461, 'loss/train': 1.8679741621017456} -09/20/2021 23:01:07 - INFO - __main__ - Step 39387: {'lr': 0.00019940498742516312, 'samples': 1260384, 'steps': 2461, 'loss/train': 2.132474422454834} -09/20/2021 23:01:07 - INFO - __main__ - Step 39388: {'lr': 0.00019940498742516312, 'samples': 1260416, 'steps': 2461, 'loss/train': 1.731458306312561} -09/20/2021 23:01:08 - INFO - __main__ - Step 39389: {'lr': 0.00019940498742516312, 'samples': 1260448, 'steps': 2461, 'loss/train': 2.068763494491577} -09/20/2021 23:01:10 - INFO - __main__ - Step 39390: {'lr': 0.00019940498742516312, 'samples': 1260480, 'steps': 2461, 'loss/train': 1.7441571950912476} -09/20/2021 23:01:10 - INFO - __main__ - Step 39391: {'lr': 0.00019940498742516312, 'samples': 1260512, 'steps': 2461, 'loss/train': 2.022782564163208} -09/20/2021 23:01:11 - INFO - __main__ - Step 39392: {'lr': 0.00019940498742516312, 'samples': 1260544, 'steps': 2461, 'loss/train': 1.809718370437622} -09/20/2021 23:01:12 - INFO - __main__ - Step 39393: {'lr': 0.00019940429239907298, 'samples': 1260576, 'steps': 2462, 'loss/train': 1.985358476638794} -09/20/2021 23:01:13 - INFO - __main__ - Step 39394: {'lr': 0.00019940429239907298, 'samples': 1260608, 'steps': 2462, 'loss/train': 1.8528786897659302} -09/20/2021 23:01:13 - INFO - __main__ - Step 39395: {'lr': 0.00019940429239907298, 'samples': 1260640, 'steps': 2462, 'loss/train': 0.2298344224691391} -09/20/2021 23:01:14 - INFO - __main__ - Step 39396: {'lr': 0.00019940429239907298, 'samples': 1260672, 'steps': 2462, 'loss/train': 0.1871269792318344} -09/20/2021 23:01:15 - INFO - __main__ - Step 39397: {'lr': 0.00019940429239907298, 'samples': 1260704, 'steps': 2462, 'loss/train': 0.2909148037433624} -09/20/2021 23:01:16 - INFO - __main__ - Step 39398: {'lr': 0.00019940429239907298, 'samples': 1260736, 'steps': 2462, 'loss/train': 2.6016976833343506} -09/20/2021 23:01:16 - INFO - __main__ - Step 39399: {'lr': 0.00019940429239907298, 'samples': 1260768, 'steps': 2462, 'loss/train': 2.237441301345825} -09/20/2021 23:01:17 - INFO - __main__ - Step 39400: {'lr': 0.00019940429239907298, 'samples': 1260800, 'steps': 2462, 'loss/train': 1.8136330842971802} -09/20/2021 23:01:18 - INFO - __main__ - Step 39401: {'lr': 0.00019940429239907298, 'samples': 1260832, 'steps': 2462, 'loss/train': 2.1914541721343994} -09/20/2021 23:01:19 - INFO - __main__ - Step 39402: {'lr': 0.00019940429239907298, 'samples': 1260864, 'steps': 2462, 'loss/train': 2.664818286895752} -09/20/2021 23:01:19 - INFO - __main__ - Step 39403: {'lr': 0.00019940429239907298, 'samples': 1260896, 'steps': 2462, 'loss/train': 1.6455472707748413} -09/20/2021 23:01:20 - INFO - __main__ - Step 39404: {'lr': 0.00019940429239907298, 'samples': 1260928, 'steps': 2462, 'loss/train': 1.8523170948028564} -09/20/2021 23:01:21 - INFO - __main__ - Step 39405: {'lr': 0.00019940429239907298, 'samples': 1260960, 'steps': 2462, 'loss/train': 2.2809176445007324} -09/20/2021 23:01:22 - INFO - __main__ - Step 39406: {'lr': 0.00019940429239907298, 'samples': 1260992, 'steps': 2462, 'loss/train': 2.2027511596679688} -09/20/2021 23:01:22 - INFO - __main__ - Step 39407: {'lr': 0.00019940429239907298, 'samples': 1261024, 'steps': 2462, 'loss/train': 1.9769299030303955} -09/20/2021 23:01:23 - INFO - __main__ - Step 39408: {'lr': 0.00019940429239907298, 'samples': 1261056, 'steps': 2462, 'loss/train': 2.7845728397369385} -09/20/2021 23:01:24 - INFO - __main__ - Step 39409: {'lr': 0.00019940359696850714, 'samples': 1261088, 'steps': 2463, 'loss/train': 1.5542762279510498} -09/20/2021 23:01:25 - INFO - __main__ - Step 39410: {'lr': 0.00019940359696850714, 'samples': 1261120, 'steps': 2463, 'loss/train': 2.4396591186523438} -09/20/2021 23:01:26 - INFO - __main__ - Step 39411: {'lr': 0.00019940359696850714, 'samples': 1261152, 'steps': 2463, 'loss/train': 1.828683614730835} -09/20/2021 23:01:26 - INFO - __main__ - Step 39412: {'lr': 0.00019940359696850714, 'samples': 1261184, 'steps': 2463, 'loss/train': 2.586299419403076} -09/20/2021 23:01:27 - INFO - __main__ - Step 39413: {'lr': 0.00019940359696850714, 'samples': 1261216, 'steps': 2463, 'loss/train': 3.1485936641693115} -09/20/2021 23:01:28 - INFO - __main__ - Step 39414: {'lr': 0.00019940359696850714, 'samples': 1261248, 'steps': 2463, 'loss/train': 0.39747175574302673} -09/20/2021 23:01:29 - INFO - __main__ - Step 39415: {'lr': 0.00019940359696850714, 'samples': 1261280, 'steps': 2463, 'loss/train': 0.39086440205574036} -09/20/2021 23:01:29 - INFO - __main__ - Step 39416: {'lr': 0.00019940359696850714, 'samples': 1261312, 'steps': 2463, 'loss/train': 0.26170778274536133} -09/20/2021 23:01:30 - INFO - __main__ - Step 39417: {'lr': 0.00019940359696850714, 'samples': 1261344, 'steps': 2463, 'loss/train': 0.06971865892410278} -09/20/2021 23:01:31 - INFO - __main__ - Step 39418: {'lr': 0.00019940359696850714, 'samples': 1261376, 'steps': 2463, 'loss/train': 1.4354774951934814} -09/20/2021 23:01:32 - INFO - __main__ - Step 39419: {'lr': 0.00019940359696850714, 'samples': 1261408, 'steps': 2463, 'loss/train': 0.7043482661247253} -09/20/2021 23:01:32 - INFO - __main__ - Step 39420: {'lr': 0.00019940359696850714, 'samples': 1261440, 'steps': 2463, 'loss/train': 1.8568061590194702} -09/20/2021 23:01:33 - INFO - __main__ - Step 39421: {'lr': 0.00019940359696850714, 'samples': 1261472, 'steps': 2463, 'loss/train': 2.443525552749634} -09/20/2021 23:01:35 - INFO - __main__ - Step 39422: {'lr': 0.00019940359696850714, 'samples': 1261504, 'steps': 2463, 'loss/train': 2.150534152984619} -09/20/2021 23:01:35 - INFO - __main__ - Step 39423: {'lr': 0.00019940359696850714, 'samples': 1261536, 'steps': 2463, 'loss/train': 1.9512237310409546} -09/20/2021 23:01:36 - INFO - __main__ - Step 39424: {'lr': 0.00019940359696850714, 'samples': 1261568, 'steps': 2463, 'loss/train': 2.68318510055542} -09/20/2021 23:01:37 - INFO - __main__ - Step 39425: {'lr': 0.00019940290113346846, 'samples': 1261600, 'steps': 2464, 'loss/train': 1.627021312713623} -09/20/2021 23:01:38 - INFO - __main__ - Step 39426: {'lr': 0.00019940290113346846, 'samples': 1261632, 'steps': 2464, 'loss/train': 2.675175905227661} -09/20/2021 23:01:39 - INFO - __main__ - Step 39427: {'lr': 0.00019940290113346846, 'samples': 1261664, 'steps': 2464, 'loss/train': 1.4992702007293701} -09/20/2021 23:01:39 - INFO - __main__ - Step 39428: {'lr': 0.00019940290113346846, 'samples': 1261696, 'steps': 2464, 'loss/train': 2.943179130554199} -09/20/2021 23:01:40 - INFO - __main__ - Step 39429: {'lr': 0.00019940290113346846, 'samples': 1261728, 'steps': 2464, 'loss/train': 2.7442667484283447} -09/20/2021 23:01:41 - INFO - __main__ - Step 39430: {'lr': 0.00019940290113346846, 'samples': 1261760, 'steps': 2464, 'loss/train': 1.5753064155578613} -09/20/2021 23:01:42 - INFO - __main__ - Step 39431: {'lr': 0.00019940290113346846, 'samples': 1261792, 'steps': 2464, 'loss/train': 1.6601598262786865} -09/20/2021 23:01:42 - INFO - __main__ - Step 39432: {'lr': 0.00019940290113346846, 'samples': 1261824, 'steps': 2464, 'loss/train': 2.0269699096679688} -09/20/2021 23:01:43 - INFO - __main__ - Step 39433: {'lr': 0.00019940290113346846, 'samples': 1261856, 'steps': 2464, 'loss/train': 3.0298595428466797} -09/20/2021 23:01:44 - INFO - __main__ - Step 39434: {'lr': 0.00019940290113346846, 'samples': 1261888, 'steps': 2464, 'loss/train': 2.264648199081421} -09/20/2021 23:01:45 - INFO - __main__ - Step 39435: {'lr': 0.00019940290113346846, 'samples': 1261920, 'steps': 2464, 'loss/train': 2.562901020050049} -09/20/2021 23:01:45 - INFO - __main__ - Step 39436: {'lr': 0.00019940290113346846, 'samples': 1261952, 'steps': 2464, 'loss/train': 2.516282081604004} -09/20/2021 23:01:46 - INFO - __main__ - Step 39437: {'lr': 0.00019940290113346846, 'samples': 1261984, 'steps': 2464, 'loss/train': 1.6447899341583252} -09/20/2021 23:01:47 - INFO - __main__ - Step 39438: {'lr': 0.00019940290113346846, 'samples': 1262016, 'steps': 2464, 'loss/train': 3.6293575763702393} -09/20/2021 23:01:48 - INFO - __main__ - Step 39439: {'lr': 0.00019940290113346846, 'samples': 1262048, 'steps': 2464, 'loss/train': 1.8245339393615723} -09/20/2021 23:01:48 - INFO - __main__ - Step 39440: {'lr': 0.00019940290113346846, 'samples': 1262080, 'steps': 2464, 'loss/train': 2.4617414474487305} -09/20/2021 23:01:49 - INFO - __main__ - Step 39441: {'lr': 0.0001994022048939598, 'samples': 1262112, 'steps': 2465, 'loss/train': 0.11573190242052078} -09/20/2021 23:01:50 - INFO - __main__ - Step 39442: {'lr': 0.0001994022048939598, 'samples': 1262144, 'steps': 2465, 'loss/train': 0.1670159101486206} -09/20/2021 23:01:51 - INFO - __main__ - Step 39443: {'lr': 0.0001994022048939598, 'samples': 1262176, 'steps': 2465, 'loss/train': 0.22695402801036835} -09/20/2021 23:01:51 - INFO - __main__ - Step 39444: {'lr': 0.0001994022048939598, 'samples': 1262208, 'steps': 2465, 'loss/train': 0.2945655882358551} -09/20/2021 23:01:52 - INFO - __main__ - Step 39445: {'lr': 0.0001994022048939598, 'samples': 1262240, 'steps': 2465, 'loss/train': 1.503069519996643} -09/20/2021 23:01:53 - INFO - __main__ - Step 39446: {'lr': 0.0001994022048939598, 'samples': 1262272, 'steps': 2465, 'loss/train': 1.2308412790298462} -09/20/2021 23:01:54 - INFO - __main__ - Step 39447: {'lr': 0.0001994022048939598, 'samples': 1262304, 'steps': 2465, 'loss/train': 2.708336353302002} -09/20/2021 23:01:54 - INFO - __main__ - Step 39448: {'lr': 0.0001994022048939598, 'samples': 1262336, 'steps': 2465, 'loss/train': 2.124767541885376} -09/20/2021 23:01:55 - INFO - __main__ - Step 39449: {'lr': 0.0001994022048939598, 'samples': 1262368, 'steps': 2465, 'loss/train': 1.6850653886795044} -09/20/2021 23:01:56 - INFO - __main__ - Step 39450: {'lr': 0.0001994022048939598, 'samples': 1262400, 'steps': 2465, 'loss/train': 1.8587117195129395} -09/20/2021 23:01:57 - INFO - __main__ - Step 39451: {'lr': 0.0001994022048939598, 'samples': 1262432, 'steps': 2465, 'loss/train': 1.71977961063385} -09/20/2021 23:01:57 - INFO - __main__ - Step 39452: {'lr': 0.0001994022048939598, 'samples': 1262464, 'steps': 2465, 'loss/train': 1.6656367778778076} -09/20/2021 23:01:58 - INFO - __main__ - Step 39453: {'lr': 0.0001994022048939598, 'samples': 1262496, 'steps': 2465, 'loss/train': 2.2143521308898926} -09/20/2021 23:01:59 - INFO - __main__ - Step 39454: {'lr': 0.0001994022048939598, 'samples': 1262528, 'steps': 2465, 'loss/train': 2.9191460609436035} -09/20/2021 23:02:00 - INFO - __main__ - Step 39455: {'lr': 0.0001994022048939598, 'samples': 1262560, 'steps': 2465, 'loss/train': 2.050379991531372} -09/20/2021 23:02:01 - INFO - __main__ - Step 39456: {'lr': 0.0001994022048939598, 'samples': 1262592, 'steps': 2465, 'loss/train': 0.27226296067237854} -09/20/2021 23:02:02 - INFO - __main__ - Step 39457: {'lr': 0.00019940150824998389, 'samples': 1262624, 'steps': 2466, 'loss/train': 1.6265678405761719} -09/20/2021 23:02:03 - INFO - __main__ - Step 39458: {'lr': 0.00019940150824998389, 'samples': 1262656, 'steps': 2466, 'loss/train': 1.624560832977295} -09/20/2021 23:02:04 - INFO - __main__ - Step 39459: {'lr': 0.00019940150824998389, 'samples': 1262688, 'steps': 2466, 'loss/train': 1.7678680419921875} -09/20/2021 23:02:04 - INFO - __main__ - Step 39460: {'lr': 0.00019940150824998389, 'samples': 1262720, 'steps': 2466, 'loss/train': 1.789650321006775} -09/20/2021 23:02:05 - INFO - __main__ - Step 39461: {'lr': 0.00019940150824998389, 'samples': 1262752, 'steps': 2466, 'loss/train': 2.266364574432373} -09/20/2021 23:02:06 - INFO - __main__ - Step 39462: {'lr': 0.00019940150824998389, 'samples': 1262784, 'steps': 2466, 'loss/train': 1.8731918334960938} -09/20/2021 23:02:07 - INFO - __main__ - Step 39463: {'lr': 0.00019940150824998389, 'samples': 1262816, 'steps': 2466, 'loss/train': 2.3167917728424072} -09/20/2021 23:02:07 - INFO - __main__ - Step 39464: {'lr': 0.00019940150824998389, 'samples': 1262848, 'steps': 2466, 'loss/train': 2.058504104614258} -09/20/2021 23:02:08 - INFO - __main__ - Step 39465: {'lr': 0.00019940150824998389, 'samples': 1262880, 'steps': 2466, 'loss/train': 1.7785627841949463} -09/20/2021 23:02:09 - INFO - __main__ - Step 39466: {'lr': 0.00019940150824998389, 'samples': 1262912, 'steps': 2466, 'loss/train': 2.3603768348693848} -09/20/2021 23:02:10 - INFO - __main__ - Step 39467: {'lr': 0.00019940150824998389, 'samples': 1262944, 'steps': 2466, 'loss/train': 2.9565751552581787} -09/20/2021 23:02:10 - INFO - __main__ - Step 39468: {'lr': 0.00019940150824998389, 'samples': 1262976, 'steps': 2466, 'loss/train': 1.4266704320907593} -09/20/2021 23:02:11 - INFO - __main__ - Step 39469: {'lr': 0.00019940150824998389, 'samples': 1263008, 'steps': 2466, 'loss/train': 1.2538588047027588} -09/20/2021 23:02:12 - INFO - __main__ - Step 39470: {'lr': 0.00019940150824998389, 'samples': 1263040, 'steps': 2466, 'loss/train': 0.5759544372558594} -09/20/2021 23:02:13 - INFO - __main__ - Step 39471: {'lr': 0.00019940150824998389, 'samples': 1263072, 'steps': 2466, 'loss/train': 2.098175525665283} -09/20/2021 23:02:13 - INFO - __main__ - Step 39472: {'lr': 0.00019940150824998389, 'samples': 1263104, 'steps': 2466, 'loss/train': 2.2242038249969482} -09/20/2021 23:02:14 - INFO - __main__ - Step 39473: {'lr': 0.00019940081120154365, 'samples': 1263136, 'steps': 2467, 'loss/train': 2.0420024394989014} -09/20/2021 23:02:15 - INFO - __main__ - Step 39474: {'lr': 0.00019940081120154365, 'samples': 1263168, 'steps': 2467, 'loss/train': 1.8120012283325195} -09/20/2021 23:02:16 - INFO - __main__ - Step 39475: {'lr': 0.00019940081120154365, 'samples': 1263200, 'steps': 2467, 'loss/train': 2.4721877574920654} -09/20/2021 23:02:17 - INFO - __main__ - Step 39476: {'lr': 0.00019940081120154365, 'samples': 1263232, 'steps': 2467, 'loss/train': 1.837823510169983} -09/20/2021 23:02:17 - INFO - __main__ - Step 39477: {'lr': 0.00019940081120154365, 'samples': 1263264, 'steps': 2467, 'loss/train': 1.7640910148620605} -09/20/2021 23:02:18 - INFO - __main__ - Step 39478: {'lr': 0.00019940081120154365, 'samples': 1263296, 'steps': 2467, 'loss/train': 1.7355196475982666} -09/20/2021 23:02:19 - INFO - __main__ - Step 39479: {'lr': 0.00019940081120154365, 'samples': 1263328, 'steps': 2467, 'loss/train': 1.9143006801605225} -09/20/2021 23:02:20 - INFO - __main__ - Step 39480: {'lr': 0.00019940081120154365, 'samples': 1263360, 'steps': 2467, 'loss/train': 2.260267972946167} -09/20/2021 23:02:20 - INFO - __main__ - Step 39481: {'lr': 0.00019940081120154365, 'samples': 1263392, 'steps': 2467, 'loss/train': 1.7043702602386475} -09/20/2021 23:02:21 - INFO - __main__ - Step 39482: {'lr': 0.00019940081120154365, 'samples': 1263424, 'steps': 2467, 'loss/train': 1.9853626489639282} -09/20/2021 23:02:22 - INFO - __main__ - Step 39483: {'lr': 0.00019940081120154365, 'samples': 1263456, 'steps': 2467, 'loss/train': 2.52134108543396} -09/20/2021 23:02:23 - INFO - __main__ - Step 39484: {'lr': 0.00019940081120154365, 'samples': 1263488, 'steps': 2467, 'loss/train': 1.8123626708984375} -09/20/2021 23:02:23 - INFO - __main__ - Step 39485: {'lr': 0.00019940081120154365, 'samples': 1263520, 'steps': 2467, 'loss/train': 2.002960205078125} -09/20/2021 23:02:25 - INFO - __main__ - Step 39486: {'lr': 0.00019940081120154365, 'samples': 1263552, 'steps': 2467, 'loss/train': 1.544482707977295} -09/20/2021 23:02:26 - INFO - __main__ - Step 39487: {'lr': 0.00019940081120154365, 'samples': 1263584, 'steps': 2467, 'loss/train': 2.6120777130126953} -09/20/2021 23:02:27 - INFO - __main__ - Step 39488: {'lr': 0.00019940081120154365, 'samples': 1263616, 'steps': 2467, 'loss/train': 2.4414334297180176} -09/20/2021 23:02:27 - INFO - __main__ - Step 39489: {'lr': 0.0001994001137486419, 'samples': 1263648, 'steps': 2468, 'loss/train': 2.0476667881011963} -09/20/2021 23:02:28 - INFO - __main__ - Step 39490: {'lr': 0.0001994001137486419, 'samples': 1263680, 'steps': 2468, 'loss/train': 1.9067375659942627} -09/20/2021 23:02:29 - INFO - __main__ - Step 39491: {'lr': 0.0001994001137486419, 'samples': 1263712, 'steps': 2468, 'loss/train': 1.8162424564361572} -09/20/2021 23:02:30 - INFO - __main__ - Step 39492: {'lr': 0.0001994001137486419, 'samples': 1263744, 'steps': 2468, 'loss/train': 2.043768882751465} -09/20/2021 23:02:30 - INFO - __main__ - Step 39493: {'lr': 0.0001994001137486419, 'samples': 1263776, 'steps': 2468, 'loss/train': 2.3655037879943848} -09/20/2021 23:02:31 - INFO - __main__ - Step 39494: {'lr': 0.0001994001137486419, 'samples': 1263808, 'steps': 2468, 'loss/train': 2.503790855407715} -09/20/2021 23:02:32 - INFO - __main__ - Step 39495: {'lr': 0.0001994001137486419, 'samples': 1263840, 'steps': 2468, 'loss/train': 0.1431078314781189} -09/20/2021 23:02:33 - INFO - __main__ - Step 39496: {'lr': 0.0001994001137486419, 'samples': 1263872, 'steps': 2468, 'loss/train': 0.15601846575737} -09/20/2021 23:02:33 - INFO - __main__ - Step 39497: {'lr': 0.0001994001137486419, 'samples': 1263904, 'steps': 2468, 'loss/train': 2.6521506309509277} -09/20/2021 23:02:34 - INFO - __main__ - Step 39498: {'lr': 0.0001994001137486419, 'samples': 1263936, 'steps': 2468, 'loss/train': 2.9726157188415527} -09/20/2021 23:02:35 - INFO - __main__ - Step 39499: {'lr': 0.0001994001137486419, 'samples': 1263968, 'steps': 2468, 'loss/train': 2.92443585395813} -09/20/2021 23:02:36 - INFO - __main__ - Step 39500: {'lr': 0.0001994001137486419, 'samples': 1264000, 'steps': 2468, 'loss/train': 2.2172627449035645} -09/20/2021 23:02:36 - INFO - __main__ - Step 39501: {'lr': 0.0001994001137486419, 'samples': 1264032, 'steps': 2468, 'loss/train': 2.393718957901001} -09/20/2021 23:02:37 - INFO - __main__ - Step 39502: {'lr': 0.0001994001137486419, 'samples': 1264064, 'steps': 2468, 'loss/train': 1.8453928232192993} -09/20/2021 23:02:38 - INFO - __main__ - Step 39503: {'lr': 0.0001994001137486419, 'samples': 1264096, 'steps': 2468, 'loss/train': 2.789238691329956} -09/20/2021 23:02:39 - INFO - __main__ - Step 39504: {'lr': 0.0001994001137486419, 'samples': 1264128, 'steps': 2468, 'loss/train': 1.9364700317382812} -09/20/2021 23:02:40 - INFO - __main__ - Step 39505: {'lr': 0.0001993994158912815, 'samples': 1264160, 'steps': 2469, 'loss/train': 2.821782350540161} -09/20/2021 23:02:40 - INFO - __main__ - Step 39506: {'lr': 0.0001993994158912815, 'samples': 1264192, 'steps': 2469, 'loss/train': 2.3387272357940674} -09/20/2021 23:02:41 - INFO - __main__ - Step 39507: {'lr': 0.0001993994158912815, 'samples': 1264224, 'steps': 2469, 'loss/train': 1.458086371421814} -09/20/2021 23:02:42 - INFO - __main__ - Step 39508: {'lr': 0.0001993994158912815, 'samples': 1264256, 'steps': 2469, 'loss/train': 2.6443727016448975} -09/20/2021 23:02:43 - INFO - __main__ - Step 39509: {'lr': 0.0001993994158912815, 'samples': 1264288, 'steps': 2469, 'loss/train': 2.6150662899017334} -09/20/2021 23:02:43 - INFO - __main__ - Step 39510: {'lr': 0.0001993994158912815, 'samples': 1264320, 'steps': 2469, 'loss/train': 3.396592140197754} -09/20/2021 23:02:44 - INFO - __main__ - Step 39511: {'lr': 0.0001993994158912815, 'samples': 1264352, 'steps': 2469, 'loss/train': 1.6893973350524902} -09/20/2021 23:02:45 - INFO - __main__ - Step 39512: {'lr': 0.0001993994158912815, 'samples': 1264384, 'steps': 2469, 'loss/train': 2.4304168224334717} -09/20/2021 23:02:46 - INFO - __main__ - Step 39513: {'lr': 0.0001993994158912815, 'samples': 1264416, 'steps': 2469, 'loss/train': 2.5099427700042725} -09/20/2021 23:02:46 - INFO - __main__ - Step 39514: {'lr': 0.0001993994158912815, 'samples': 1264448, 'steps': 2469, 'loss/train': 2.283304452896118} -09/20/2021 23:02:47 - INFO - __main__ - Step 39515: {'lr': 0.0001993994158912815, 'samples': 1264480, 'steps': 2469, 'loss/train': 2.359865188598633} -09/20/2021 23:02:48 - INFO - __main__ - Step 39516: {'lr': 0.0001993994158912815, 'samples': 1264512, 'steps': 2469, 'loss/train': 2.373802900314331} -09/20/2021 23:02:49 - INFO - __main__ - Step 39517: {'lr': 0.0001993994158912815, 'samples': 1264544, 'steps': 2469, 'loss/train': 2.7697744369506836} -09/20/2021 23:02:50 - INFO - __main__ - Step 39518: {'lr': 0.0001993994158912815, 'samples': 1264576, 'steps': 2469, 'loss/train': 0.8936000466346741} -09/20/2021 23:02:51 - INFO - __main__ - Step 39519: {'lr': 0.0001993994158912815, 'samples': 1264608, 'steps': 2469, 'loss/train': 1.6485893726348877} -09/20/2021 23:02:52 - INFO - __main__ - Step 39520: {'lr': 0.0001993994158912815, 'samples': 1264640, 'steps': 2469, 'loss/train': 1.8615983724594116} -09/20/2021 23:02:52 - INFO - __main__ - Step 39521: {'lr': 0.00019939871762946526, 'samples': 1264672, 'steps': 2470, 'loss/train': 2.1610538959503174} -09/20/2021 23:02:53 - INFO - __main__ - Step 39522: {'lr': 0.00019939871762946526, 'samples': 1264704, 'steps': 2470, 'loss/train': 2.511781930923462} -09/20/2021 23:02:54 - INFO - __main__ - Step 39523: {'lr': 0.00019939871762946526, 'samples': 1264736, 'steps': 2470, 'loss/train': 2.43152117729187} -09/20/2021 23:02:55 - INFO - __main__ - Step 39524: {'lr': 0.00019939871762946526, 'samples': 1264768, 'steps': 2470, 'loss/train': 2.641874313354492} -09/20/2021 23:02:55 - INFO - __main__ - Step 39525: {'lr': 0.00019939871762946526, 'samples': 1264800, 'steps': 2470, 'loss/train': 2.296403169631958} -09/20/2021 23:02:56 - INFO - __main__ - Step 39526: {'lr': 0.00019939871762946526, 'samples': 1264832, 'steps': 2470, 'loss/train': 2.1920218467712402} -09/20/2021 23:02:57 - INFO - __main__ - Step 39527: {'lr': 0.00019939871762946526, 'samples': 1264864, 'steps': 2470, 'loss/train': 1.614396572113037} -09/20/2021 23:02:58 - INFO - __main__ - Step 39528: {'lr': 0.00019939871762946526, 'samples': 1264896, 'steps': 2470, 'loss/train': 1.042703628540039} -09/20/2021 23:02:58 - INFO - __main__ - Step 39529: {'lr': 0.00019939871762946526, 'samples': 1264928, 'steps': 2470, 'loss/train': 2.501697063446045} -09/20/2021 23:02:59 - INFO - __main__ - Step 39530: {'lr': 0.00019939871762946526, 'samples': 1264960, 'steps': 2470, 'loss/train': 2.546084403991699} -09/20/2021 23:03:00 - INFO - __main__ - Step 39531: {'lr': 0.00019939871762946526, 'samples': 1264992, 'steps': 2470, 'loss/train': 1.8593931198120117} -09/20/2021 23:03:01 - INFO - __main__ - Step 39532: {'lr': 0.00019939871762946526, 'samples': 1265024, 'steps': 2470, 'loss/train': 1.2274813652038574} -09/20/2021 23:03:01 - INFO - __main__ - Step 39533: {'lr': 0.00019939871762946526, 'samples': 1265056, 'steps': 2470, 'loss/train': 0.42837098240852356} -09/20/2021 23:03:02 - INFO - __main__ - Step 39534: {'lr': 0.00019939871762946526, 'samples': 1265088, 'steps': 2470, 'loss/train': 2.4605960845947266} -09/20/2021 23:03:03 - INFO - __main__ - Step 39535: {'lr': 0.00019939871762946526, 'samples': 1265120, 'steps': 2470, 'loss/train': 1.9959224462509155} -09/20/2021 23:03:04 - INFO - __main__ - Step 39536: {'lr': 0.00019939871762946526, 'samples': 1265152, 'steps': 2470, 'loss/train': 1.7003495693206787} -09/20/2021 23:03:05 - INFO - __main__ - Step 39537: {'lr': 0.00019939801896319597, 'samples': 1265184, 'steps': 2471, 'loss/train': 1.1678533554077148} -09/20/2021 23:03:05 - INFO - __main__ - Step 39538: {'lr': 0.00019939801896319597, 'samples': 1265216, 'steps': 2471, 'loss/train': 1.2098854780197144} -09/20/2021 23:03:06 - INFO - __main__ - Step 39539: {'lr': 0.00019939801896319597, 'samples': 1265248, 'steps': 2471, 'loss/train': 1.2511379718780518} -09/20/2021 23:03:07 - INFO - __main__ - Step 39540: {'lr': 0.00019939801896319597, 'samples': 1265280, 'steps': 2471, 'loss/train': 1.2419346570968628} -09/20/2021 23:03:08 - INFO - __main__ - Step 39541: {'lr': 0.00019939801896319597, 'samples': 1265312, 'steps': 2471, 'loss/train': 1.8248294591903687} -09/20/2021 23:03:08 - INFO - __main__ - Step 39542: {'lr': 0.00019939801896319597, 'samples': 1265344, 'steps': 2471, 'loss/train': 2.36722469329834} -09/20/2021 23:03:09 - INFO - __main__ - Step 39543: {'lr': 0.00019939801896319597, 'samples': 1265376, 'steps': 2471, 'loss/train': 3.086841344833374} -09/20/2021 23:03:10 - INFO - __main__ - Step 39544: {'lr': 0.00019939801896319597, 'samples': 1265408, 'steps': 2471, 'loss/train': 2.194488048553467} -09/20/2021 23:03:11 - INFO - __main__ - Step 39545: {'lr': 0.00019939801896319597, 'samples': 1265440, 'steps': 2471, 'loss/train': 2.2892680168151855} -09/20/2021 23:03:11 - INFO - __main__ - Step 39546: {'lr': 0.00019939801896319597, 'samples': 1265472, 'steps': 2471, 'loss/train': 2.0074641704559326} -09/20/2021 23:03:12 - INFO - __main__ - Step 39547: {'lr': 0.00019939801896319597, 'samples': 1265504, 'steps': 2471, 'loss/train': 1.6725467443466187} -09/20/2021 23:03:13 - INFO - __main__ - Step 39548: {'lr': 0.00019939801896319597, 'samples': 1265536, 'steps': 2471, 'loss/train': 2.22037672996521} -09/20/2021 23:03:14 - INFO - __main__ - Step 39549: {'lr': 0.00019939801896319597, 'samples': 1265568, 'steps': 2471, 'loss/train': 1.5832693576812744} -09/20/2021 23:03:14 - INFO - __main__ - Step 39550: {'lr': 0.00019939801896319597, 'samples': 1265600, 'steps': 2471, 'loss/train': 1.812211036682129} -09/20/2021 23:03:15 - INFO - __main__ - Step 39551: {'lr': 0.00019939801896319597, 'samples': 1265632, 'steps': 2471, 'loss/train': 1.7277450561523438} -09/20/2021 23:03:16 - INFO - __main__ - Step 39552: {'lr': 0.00019939801896319597, 'samples': 1265664, 'steps': 2471, 'loss/train': 1.577204704284668} -09/20/2021 23:03:17 - INFO - __main__ - Step 39553: {'lr': 0.00019939731989247655, 'samples': 1265696, 'steps': 2472, 'loss/train': 2.1753692626953125} -09/20/2021 23:03:18 - INFO - __main__ - Step 39554: {'lr': 0.00019939731989247655, 'samples': 1265728, 'steps': 2472, 'loss/train': 1.8077152967453003} -09/20/2021 23:03:19 - INFO - __main__ - Step 39555: {'lr': 0.00019939731989247655, 'samples': 1265760, 'steps': 2472, 'loss/train': 1.7357778549194336} -09/20/2021 23:03:19 - INFO - __main__ - Step 39556: {'lr': 0.00019939731989247655, 'samples': 1265792, 'steps': 2472, 'loss/train': 1.86420738697052} -09/20/2021 23:03:20 - INFO - __main__ - Step 39557: {'lr': 0.00019939731989247655, 'samples': 1265824, 'steps': 2472, 'loss/train': 3.4332847595214844} -09/20/2021 23:03:21 - INFO - __main__ - Step 39558: {'lr': 0.00019939731989247655, 'samples': 1265856, 'steps': 2472, 'loss/train': 2.698429822921753} -09/20/2021 23:03:22 - INFO - __main__ - Step 39559: {'lr': 0.00019939731989247655, 'samples': 1265888, 'steps': 2472, 'loss/train': 2.7058017253875732} -09/20/2021 23:03:22 - INFO - __main__ - Step 39560: {'lr': 0.00019939731989247655, 'samples': 1265920, 'steps': 2472, 'loss/train': 1.6697498559951782} -09/20/2021 23:03:23 - INFO - __main__ - Step 39561: {'lr': 0.00019939731989247655, 'samples': 1265952, 'steps': 2472, 'loss/train': 2.0447428226470947} -09/20/2021 23:03:24 - INFO - __main__ - Step 39562: {'lr': 0.00019939731989247655, 'samples': 1265984, 'steps': 2472, 'loss/train': 3.02289080619812} -09/20/2021 23:03:25 - INFO - __main__ - Step 39563: {'lr': 0.00019939731989247655, 'samples': 1266016, 'steps': 2472, 'loss/train': 1.7833002805709839} -09/20/2021 23:03:25 - INFO - __main__ - Step 39564: {'lr': 0.00019939731989247655, 'samples': 1266048, 'steps': 2472, 'loss/train': 1.8276925086975098} -09/20/2021 23:03:26 - INFO - __main__ - Step 39565: {'lr': 0.00019939731989247655, 'samples': 1266080, 'steps': 2472, 'loss/train': 2.2947072982788086} -09/20/2021 23:03:27 - INFO - __main__ - Step 39566: {'lr': 0.00019939731989247655, 'samples': 1266112, 'steps': 2472, 'loss/train': 3.278455972671509} -09/20/2021 23:03:28 - INFO - __main__ - Step 39567: {'lr': 0.00019939731989247655, 'samples': 1266144, 'steps': 2472, 'loss/train': 2.283763885498047} -09/20/2021 23:03:28 - INFO - __main__ - Step 39568: {'lr': 0.00019939731989247655, 'samples': 1266176, 'steps': 2472, 'loss/train': 2.128741979598999} -09/20/2021 23:03:29 - INFO - __main__ - Step 39569: {'lr': 0.00019939662041730985, 'samples': 1266208, 'steps': 2473, 'loss/train': 2.361823558807373} -09/20/2021 23:03:30 - INFO - __main__ - Step 39570: {'lr': 0.00019939662041730985, 'samples': 1266240, 'steps': 2473, 'loss/train': 0.48715054988861084} -09/20/2021 23:03:31 - INFO - __main__ - Step 39571: {'lr': 0.00019939662041730985, 'samples': 1266272, 'steps': 2473, 'loss/train': 1.9945765733718872} -09/20/2021 23:03:32 - INFO - __main__ - Step 39572: {'lr': 0.00019939662041730985, 'samples': 1266304, 'steps': 2473, 'loss/train': 2.231112480163574} -09/20/2021 23:03:32 - INFO - __main__ - Step 39573: {'lr': 0.00019939662041730985, 'samples': 1266336, 'steps': 2473, 'loss/train': 1.2675701379776} -09/20/2021 23:03:33 - INFO - __main__ - Step 39574: {'lr': 0.00019939662041730985, 'samples': 1266368, 'steps': 2473, 'loss/train': 2.567711114883423} -09/20/2021 23:03:34 - INFO - __main__ - Step 39575: {'lr': 0.00019939662041730985, 'samples': 1266400, 'steps': 2473, 'loss/train': 0.7140372395515442} -09/20/2021 23:03:35 - INFO - __main__ - Step 39576: {'lr': 0.00019939662041730985, 'samples': 1266432, 'steps': 2473, 'loss/train': 2.9944114685058594} -09/20/2021 23:03:35 - INFO - __main__ - Step 39577: {'lr': 0.00019939662041730985, 'samples': 1266464, 'steps': 2473, 'loss/train': 1.9347014427185059} -09/20/2021 23:03:36 - INFO - __main__ - Step 39578: {'lr': 0.00019939662041730985, 'samples': 1266496, 'steps': 2473, 'loss/train': 1.8591971397399902} -09/20/2021 23:03:37 - INFO - __main__ - Step 39579: {'lr': 0.00019939662041730985, 'samples': 1266528, 'steps': 2473, 'loss/train': 2.0390055179595947} -09/20/2021 23:03:38 - INFO - __main__ - Step 39580: {'lr': 0.00019939662041730985, 'samples': 1266560, 'steps': 2473, 'loss/train': 1.5614824295043945} -09/20/2021 23:03:38 - INFO - __main__ - Step 39581: {'lr': 0.00019939662041730985, 'samples': 1266592, 'steps': 2473, 'loss/train': 2.9686758518218994} -09/20/2021 23:03:39 - INFO - __main__ - Step 39582: {'lr': 0.00019939662041730985, 'samples': 1266624, 'steps': 2473, 'loss/train': 2.942641496658325} -09/20/2021 23:03:40 - INFO - __main__ - Step 39583: {'lr': 0.00019939662041730985, 'samples': 1266656, 'steps': 2473, 'loss/train': 1.479238748550415} -09/20/2021 23:03:41 - INFO - __main__ - Step 39584: {'lr': 0.00019939662041730985, 'samples': 1266688, 'steps': 2473, 'loss/train': 1.9212350845336914} -09/20/2021 23:03:42 - INFO - __main__ - Step 39585: {'lr': 0.00019939592053769866, 'samples': 1266720, 'steps': 2474, 'loss/train': 2.935353994369507} -09/20/2021 23:03:43 - INFO - __main__ - Step 39586: {'lr': 0.00019939592053769866, 'samples': 1266752, 'steps': 2474, 'loss/train': 2.742926836013794} -09/20/2021 23:03:44 - INFO - __main__ - Step 39587: {'lr': 0.00019939592053769866, 'samples': 1266784, 'steps': 2474, 'loss/train': 1.4683501720428467} -09/20/2021 23:03:44 - INFO - __main__ - Step 39588: {'lr': 0.00019939592053769866, 'samples': 1266816, 'steps': 2474, 'loss/train': 2.580387592315674} -09/20/2021 23:03:45 - INFO - __main__ - Step 39589: {'lr': 0.00019939592053769866, 'samples': 1266848, 'steps': 2474, 'loss/train': 2.624119281768799} -09/20/2021 23:03:46 - INFO - __main__ - Step 39590: {'lr': 0.00019939592053769866, 'samples': 1266880, 'steps': 2474, 'loss/train': 2.1928975582122803} -09/20/2021 23:03:47 - INFO - __main__ - Step 39591: {'lr': 0.00019939592053769866, 'samples': 1266912, 'steps': 2474, 'loss/train': 1.3039171695709229} -09/20/2021 23:03:47 - INFO - __main__ - Step 39592: {'lr': 0.00019939592053769866, 'samples': 1266944, 'steps': 2474, 'loss/train': 2.570050001144409} -09/20/2021 23:03:48 - INFO - __main__ - Step 39593: {'lr': 0.00019939592053769866, 'samples': 1266976, 'steps': 2474, 'loss/train': 1.689961314201355} -09/20/2021 23:03:49 - INFO - __main__ - Step 39594: {'lr': 0.00019939592053769866, 'samples': 1267008, 'steps': 2474, 'loss/train': 3.0343523025512695} -09/20/2021 23:03:50 - INFO - __main__ - Step 39595: {'lr': 0.00019939592053769866, 'samples': 1267040, 'steps': 2474, 'loss/train': 0.37094566226005554} -09/20/2021 23:03:50 - INFO - __main__ - Step 39596: {'lr': 0.00019939592053769866, 'samples': 1267072, 'steps': 2474, 'loss/train': 1.5013172626495361} -09/20/2021 23:03:51 - INFO - __main__ - Step 39597: {'lr': 0.00019939592053769866, 'samples': 1267104, 'steps': 2474, 'loss/train': 0.24899709224700928} -09/20/2021 23:03:52 - INFO - __main__ - Step 39598: {'lr': 0.00019939592053769866, 'samples': 1267136, 'steps': 2474, 'loss/train': 1.9979151487350464} -09/20/2021 23:03:53 - INFO - __main__ - Step 39599: {'lr': 0.00019939592053769866, 'samples': 1267168, 'steps': 2474, 'loss/train': 1.0088480710983276} -09/20/2021 23:03:53 - INFO - __main__ - Step 39600: {'lr': 0.00019939592053769866, 'samples': 1267200, 'steps': 2474, 'loss/train': 2.1499507427215576} -09/20/2021 23:03:54 - INFO - __main__ - Step 39601: {'lr': 0.00019939522025364589, 'samples': 1267232, 'steps': 2475, 'loss/train': 3.229396104812622} -09/20/2021 23:03:55 - INFO - __main__ - Step 39602: {'lr': 0.00019939522025364589, 'samples': 1267264, 'steps': 2475, 'loss/train': 1.327633023262024} -09/20/2021 23:03:56 - INFO - __main__ - Step 39603: {'lr': 0.00019939522025364589, 'samples': 1267296, 'steps': 2475, 'loss/train': 1.8298767805099487} -09/20/2021 23:03:56 - INFO - __main__ - Step 39604: {'lr': 0.00019939522025364589, 'samples': 1267328, 'steps': 2475, 'loss/train': 1.8634837865829468} -09/20/2021 23:03:57 - INFO - __main__ - Step 39605: {'lr': 0.00019939522025364589, 'samples': 1267360, 'steps': 2475, 'loss/train': 1.6320300102233887} -09/20/2021 23:03:58 - INFO - __main__ - Step 39606: {'lr': 0.00019939522025364589, 'samples': 1267392, 'steps': 2475, 'loss/train': 2.967600107192993} -09/20/2021 23:03:59 - INFO - __main__ - Step 39607: {'lr': 0.00019939522025364589, 'samples': 1267424, 'steps': 2475, 'loss/train': 1.0955928564071655} -09/20/2021 23:03:59 - INFO - __main__ - Step 39608: {'lr': 0.00019939522025364589, 'samples': 1267456, 'steps': 2475, 'loss/train': 2.593123435974121} -09/20/2021 23:04:00 - INFO - __main__ - Step 39609: {'lr': 0.00019939522025364589, 'samples': 1267488, 'steps': 2475, 'loss/train': 1.8126789331436157} -09/20/2021 23:04:01 - INFO - __main__ - Step 39610: {'lr': 0.00019939522025364589, 'samples': 1267520, 'steps': 2475, 'loss/train': 1.3977915048599243} -09/20/2021 23:04:02 - INFO - __main__ - Step 39611: {'lr': 0.00019939522025364589, 'samples': 1267552, 'steps': 2475, 'loss/train': 1.1850279569625854} -09/20/2021 23:04:02 - INFO - __main__ - Step 39612: {'lr': 0.00019939522025364589, 'samples': 1267584, 'steps': 2475, 'loss/train': 0.44476062059402466} -09/20/2021 23:04:03 - INFO - __main__ - Step 39613: {'lr': 0.00019939522025364589, 'samples': 1267616, 'steps': 2475, 'loss/train': 2.5063352584838867} -09/20/2021 23:04:04 - INFO - __main__ - Step 39614: {'lr': 0.00019939522025364589, 'samples': 1267648, 'steps': 2475, 'loss/train': 1.4413442611694336} -09/20/2021 23:04:05 - INFO - __main__ - Step 39615: {'lr': 0.00019939522025364589, 'samples': 1267680, 'steps': 2475, 'loss/train': 1.0835845470428467} -09/20/2021 23:04:06 - INFO - __main__ - Step 39616: {'lr': 0.00019939522025364589, 'samples': 1267712, 'steps': 2475, 'loss/train': 2.8709919452667236} -09/20/2021 23:04:07 - INFO - __main__ - Step 39617: {'lr': 0.0001993945195651543, 'samples': 1267744, 'steps': 2476, 'loss/train': 1.8983863592147827} -09/20/2021 23:04:08 - INFO - __main__ - Step 39618: {'lr': 0.0001993945195651543, 'samples': 1267776, 'steps': 2476, 'loss/train': 2.5190701484680176} -09/20/2021 23:04:08 - INFO - __main__ - Step 39619: {'lr': 0.0001993945195651543, 'samples': 1267808, 'steps': 2476, 'loss/train': 2.5865633487701416} -09/20/2021 23:04:09 - INFO - __main__ - Step 39620: {'lr': 0.0001993945195651543, 'samples': 1267840, 'steps': 2476, 'loss/train': 2.652656078338623} -09/20/2021 23:04:10 - INFO - __main__ - Step 39621: {'lr': 0.0001993945195651543, 'samples': 1267872, 'steps': 2476, 'loss/train': 2.3372087478637695} -09/20/2021 23:04:11 - INFO - __main__ - Step 39622: {'lr': 0.0001993945195651543, 'samples': 1267904, 'steps': 2476, 'loss/train': 2.7943460941314697} -09/20/2021 23:04:11 - INFO - __main__ - Step 39623: {'lr': 0.0001993945195651543, 'samples': 1267936, 'steps': 2476, 'loss/train': 2.670560836791992} -09/20/2021 23:04:12 - INFO - __main__ - Step 39624: {'lr': 0.0001993945195651543, 'samples': 1267968, 'steps': 2476, 'loss/train': 1.981277346611023} -09/20/2021 23:04:13 - INFO - __main__ - Step 39625: {'lr': 0.0001993945195651543, 'samples': 1268000, 'steps': 2476, 'loss/train': 2.334684371948242} -09/20/2021 23:04:14 - INFO - __main__ - Step 39626: {'lr': 0.0001993945195651543, 'samples': 1268032, 'steps': 2476, 'loss/train': 1.367390751838684} -09/20/2021 23:04:14 - INFO - __main__ - Step 39627: {'lr': 0.0001993945195651543, 'samples': 1268064, 'steps': 2476, 'loss/train': 1.5131762027740479} -09/20/2021 23:04:15 - INFO - __main__ - Step 39628: {'lr': 0.0001993945195651543, 'samples': 1268096, 'steps': 2476, 'loss/train': 1.4104465246200562} -09/20/2021 23:04:16 - INFO - __main__ - Step 39629: {'lr': 0.0001993945195651543, 'samples': 1268128, 'steps': 2476, 'loss/train': 1.5504193305969238} -09/20/2021 23:04:17 - INFO - __main__ - Step 39630: {'lr': 0.0001993945195651543, 'samples': 1268160, 'steps': 2476, 'loss/train': 2.358840227127075} -09/20/2021 23:04:17 - INFO - __main__ - Step 39631: {'lr': 0.0001993945195651543, 'samples': 1268192, 'steps': 2476, 'loss/train': 2.234501600265503} -09/20/2021 23:04:18 - INFO - __main__ - Step 39632: {'lr': 0.0001993945195651543, 'samples': 1268224, 'steps': 2476, 'loss/train': 1.733410120010376} -09/20/2021 23:04:19 - INFO - __main__ - Step 39633: {'lr': 0.00019939381847222684, 'samples': 1268256, 'steps': 2477, 'loss/train': 2.7838261127471924} -09/20/2021 23:04:20 - INFO - __main__ - Step 39634: {'lr': 0.00019939381847222684, 'samples': 1268288, 'steps': 2477, 'loss/train': 1.8090054988861084} -09/20/2021 23:04:20 - INFO - __main__ - Step 39635: {'lr': 0.00019939381847222684, 'samples': 1268320, 'steps': 2477, 'loss/train': 3.1753499507904053} -09/20/2021 23:04:21 - INFO - __main__ - Step 39636: {'lr': 0.00019939381847222684, 'samples': 1268352, 'steps': 2477, 'loss/train': 2.315452814102173} -09/20/2021 23:04:22 - INFO - __main__ - Step 39637: {'lr': 0.00019939381847222684, 'samples': 1268384, 'steps': 2477, 'loss/train': 2.113771438598633} -09/20/2021 23:04:23 - INFO - __main__ - Step 39638: {'lr': 0.00019939381847222684, 'samples': 1268416, 'steps': 2477, 'loss/train': 1.7211326360702515} -09/20/2021 23:04:23 - INFO - __main__ - Step 39639: {'lr': 0.00019939381847222684, 'samples': 1268448, 'steps': 2477, 'loss/train': 2.761849880218506} -09/20/2021 23:04:24 - INFO - __main__ - Step 39640: {'lr': 0.00019939381847222684, 'samples': 1268480, 'steps': 2477, 'loss/train': 2.1648006439208984} -09/20/2021 23:04:25 - INFO - __main__ - Step 39641: {'lr': 0.00019939381847222684, 'samples': 1268512, 'steps': 2477, 'loss/train': 3.1215105056762695} -09/20/2021 23:04:26 - INFO - __main__ - Step 39642: {'lr': 0.00019939381847222684, 'samples': 1268544, 'steps': 2477, 'loss/train': 1.8003770112991333} -09/20/2021 23:04:26 - INFO - __main__ - Step 39643: {'lr': 0.00019939381847222684, 'samples': 1268576, 'steps': 2477, 'loss/train': 2.572354793548584} -09/20/2021 23:04:27 - INFO - __main__ - Step 39644: {'lr': 0.00019939381847222684, 'samples': 1268608, 'steps': 2477, 'loss/train': 2.441723108291626} -09/20/2021 23:04:28 - INFO - __main__ - Step 39645: {'lr': 0.00019939381847222684, 'samples': 1268640, 'steps': 2477, 'loss/train': 2.574918746948242} -09/20/2021 23:04:29 - INFO - __main__ - Step 39646: {'lr': 0.00019939381847222684, 'samples': 1268672, 'steps': 2477, 'loss/train': 1.4099018573760986} -09/20/2021 23:04:30 - INFO - __main__ - Step 39647: {'lr': 0.00019939381847222684, 'samples': 1268704, 'steps': 2477, 'loss/train': 1.4135138988494873} -09/20/2021 23:04:31 - INFO - __main__ - Step 39648: {'lr': 0.00019939381847222684, 'samples': 1268736, 'steps': 2477, 'loss/train': 2.0540645122528076} -09/20/2021 23:04:32 - INFO - __main__ - Step 39649: {'lr': 0.0001993931169748663, 'samples': 1268768, 'steps': 2478, 'loss/train': 1.7989985942840576} -09/20/2021 23:04:32 - INFO - __main__ - Step 39650: {'lr': 0.0001993931169748663, 'samples': 1268800, 'steps': 2478, 'loss/train': 2.1450517177581787} -09/20/2021 23:04:33 - INFO - __main__ - Step 39651: {'lr': 0.0001993931169748663, 'samples': 1268832, 'steps': 2478, 'loss/train': 2.6672778129577637} -09/20/2021 23:04:34 - INFO - __main__ - Step 39652: {'lr': 0.0001993931169748663, 'samples': 1268864, 'steps': 2478, 'loss/train': 1.0722767114639282} -09/20/2021 23:04:35 - INFO - __main__ - Step 39653: {'lr': 0.0001993931169748663, 'samples': 1268896, 'steps': 2478, 'loss/train': 2.0842370986938477} -09/20/2021 23:04:35 - INFO - __main__ - Step 39654: {'lr': 0.0001993931169748663, 'samples': 1268928, 'steps': 2478, 'loss/train': 2.545983076095581} -09/20/2021 23:04:36 - INFO - __main__ - Step 39655: {'lr': 0.0001993931169748663, 'samples': 1268960, 'steps': 2478, 'loss/train': 2.338080406188965} -09/20/2021 23:04:37 - INFO - __main__ - Step 39656: {'lr': 0.0001993931169748663, 'samples': 1268992, 'steps': 2478, 'loss/train': 1.898735761642456} -09/20/2021 23:04:38 - INFO - __main__ - Step 39657: {'lr': 0.0001993931169748663, 'samples': 1269024, 'steps': 2478, 'loss/train': 0.880508542060852} -09/20/2021 23:04:38 - INFO - __main__ - Step 39658: {'lr': 0.0001993931169748663, 'samples': 1269056, 'steps': 2478, 'loss/train': 2.262622594833374} -09/20/2021 23:04:39 - INFO - __main__ - Step 39659: {'lr': 0.0001993931169748663, 'samples': 1269088, 'steps': 2478, 'loss/train': 1.5452735424041748} -09/20/2021 23:04:40 - INFO - __main__ - Step 39660: {'lr': 0.0001993931169748663, 'samples': 1269120, 'steps': 2478, 'loss/train': 2.1574559211730957} -09/20/2021 23:04:41 - INFO - __main__ - Step 39661: {'lr': 0.0001993931169748663, 'samples': 1269152, 'steps': 2478, 'loss/train': 2.0082461833953857} -09/20/2021 23:04:41 - INFO - __main__ - Step 39662: {'lr': 0.0001993931169748663, 'samples': 1269184, 'steps': 2478, 'loss/train': 2.0184223651885986} -09/20/2021 23:04:42 - INFO - __main__ - Step 39663: {'lr': 0.0001993931169748663, 'samples': 1269216, 'steps': 2478, 'loss/train': 3.0458171367645264} -09/20/2021 23:04:43 - INFO - __main__ - Step 39664: {'lr': 0.0001993931169748663, 'samples': 1269248, 'steps': 2478, 'loss/train': 2.5718510150909424} -09/20/2021 23:04:44 - INFO - __main__ - Step 39665: {'lr': 0.00019939241507307555, 'samples': 1269280, 'steps': 2479, 'loss/train': 1.4902211427688599} -09/20/2021 23:04:44 - INFO - __main__ - Step 39666: {'lr': 0.00019939241507307555, 'samples': 1269312, 'steps': 2479, 'loss/train': 1.667655110359192} -09/20/2021 23:04:45 - INFO - __main__ - Step 39667: {'lr': 0.00019939241507307555, 'samples': 1269344, 'steps': 2479, 'loss/train': 2.5489003658294678} -09/20/2021 23:04:46 - INFO - __main__ - Step 39668: {'lr': 0.00019939241507307555, 'samples': 1269376, 'steps': 2479, 'loss/train': 0.6429253220558167} -09/20/2021 23:04:47 - INFO - __main__ - Step 39669: {'lr': 0.00019939241507307555, 'samples': 1269408, 'steps': 2479, 'loss/train': 2.133944511413574} -09/20/2021 23:04:47 - INFO - __main__ - Step 39670: {'lr': 0.00019939241507307555, 'samples': 1269440, 'steps': 2479, 'loss/train': 1.1116559505462646} -09/20/2021 23:04:48 - INFO - __main__ - Step 39671: {'lr': 0.00019939241507307555, 'samples': 1269472, 'steps': 2479, 'loss/train': 2.1284048557281494} -09/20/2021 23:04:49 - INFO - __main__ - Step 39672: {'lr': 0.00019939241507307555, 'samples': 1269504, 'steps': 2479, 'loss/train': 1.6617577075958252} -09/20/2021 23:04:50 - INFO - __main__ - Step 39673: {'lr': 0.00019939241507307555, 'samples': 1269536, 'steps': 2479, 'loss/train': 1.9009180068969727} -09/20/2021 23:04:50 - INFO - __main__ - Step 39674: {'lr': 0.00019939241507307555, 'samples': 1269568, 'steps': 2479, 'loss/train': 2.7682888507843018} -09/20/2021 23:04:51 - INFO - __main__ - Step 39675: {'lr': 0.00019939241507307555, 'samples': 1269600, 'steps': 2479, 'loss/train': 2.2696969509124756} -09/20/2021 23:04:52 - INFO - __main__ - Step 39676: {'lr': 0.00019939241507307555, 'samples': 1269632, 'steps': 2479, 'loss/train': 2.178654193878174} -09/20/2021 23:04:53 - INFO - __main__ - Step 39677: {'lr': 0.00019939241507307555, 'samples': 1269664, 'steps': 2479, 'loss/train': 2.7658743858337402} -09/20/2021 23:04:54 - INFO - __main__ - Step 39678: {'lr': 0.00019939241507307555, 'samples': 1269696, 'steps': 2479, 'loss/train': 2.3563990592956543} -09/20/2021 23:04:55 - INFO - __main__ - Step 39679: {'lr': 0.00019939241507307555, 'samples': 1269728, 'steps': 2479, 'loss/train': 2.961425542831421} -09/20/2021 23:04:56 - INFO - __main__ - Step 39680: {'lr': 0.00019939241507307555, 'samples': 1269760, 'steps': 2479, 'loss/train': 1.9820570945739746} -09/20/2021 23:04:57 - INFO - __main__ - Step 39681: {'lr': 0.00019939171276685746, 'samples': 1269792, 'steps': 2480, 'loss/train': 2.518479108810425} -09/20/2021 23:04:57 - INFO - __main__ - Step 39682: {'lr': 0.00019939171276685746, 'samples': 1269824, 'steps': 2480, 'loss/train': 1.6727855205535889} -09/20/2021 23:04:58 - INFO - __main__ - Step 39683: {'lr': 0.00019939171276685746, 'samples': 1269856, 'steps': 2480, 'loss/train': 1.4907987117767334} -09/20/2021 23:04:59 - INFO - __main__ - Step 39684: {'lr': 0.00019939171276685746, 'samples': 1269888, 'steps': 2480, 'loss/train': 1.8025528192520142} -09/20/2021 23:05:00 - INFO - __main__ - Step 39685: {'lr': 0.00019939171276685746, 'samples': 1269920, 'steps': 2480, 'loss/train': 1.823203444480896} -09/20/2021 23:05:00 - INFO - __main__ - Step 39686: {'lr': 0.00019939171276685746, 'samples': 1269952, 'steps': 2480, 'loss/train': 2.9639739990234375} -09/20/2021 23:05:01 - INFO - __main__ - Step 39687: {'lr': 0.00019939171276685746, 'samples': 1269984, 'steps': 2480, 'loss/train': 2.440181255340576} -09/20/2021 23:05:02 - INFO - __main__ - Step 39688: {'lr': 0.00019939171276685746, 'samples': 1270016, 'steps': 2480, 'loss/train': 1.762532353401184} -09/20/2021 23:05:03 - INFO - __main__ - Step 39689: {'lr': 0.00019939171276685746, 'samples': 1270048, 'steps': 2480, 'loss/train': 0.7103888392448425} -09/20/2021 23:05:03 - INFO - __main__ - Step 39690: {'lr': 0.00019939171276685746, 'samples': 1270080, 'steps': 2480, 'loss/train': 2.3314359188079834} -09/20/2021 23:05:04 - INFO - __main__ - Step 39691: {'lr': 0.00019939171276685746, 'samples': 1270112, 'steps': 2480, 'loss/train': 1.7306501865386963} -09/20/2021 23:05:05 - INFO - __main__ - Step 39692: {'lr': 0.00019939171276685746, 'samples': 1270144, 'steps': 2480, 'loss/train': 2.4574785232543945} -09/20/2021 23:05:06 - INFO - __main__ - Step 39693: {'lr': 0.00019939171276685746, 'samples': 1270176, 'steps': 2480, 'loss/train': 1.6205614805221558} -09/20/2021 23:05:06 - INFO - __main__ - Step 39694: {'lr': 0.00019939171276685746, 'samples': 1270208, 'steps': 2480, 'loss/train': 3.3380045890808105} -09/20/2021 23:05:07 - INFO - __main__ - Step 39695: {'lr': 0.00019939171276685746, 'samples': 1270240, 'steps': 2480, 'loss/train': 2.8764474391937256} -09/20/2021 23:05:08 - INFO - __main__ - Step 39696: {'lr': 0.00019939171276685746, 'samples': 1270272, 'steps': 2480, 'loss/train': 1.9956082105636597} -09/20/2021 23:05:09 - INFO - __main__ - Step 39697: {'lr': 0.00019939101005621488, 'samples': 1270304, 'steps': 2481, 'loss/train': 1.43455970287323} -09/20/2021 23:05:09 - INFO - __main__ - Step 39698: {'lr': 0.00019939101005621488, 'samples': 1270336, 'steps': 2481, 'loss/train': 1.430525541305542} -09/20/2021 23:05:10 - INFO - __main__ - Step 39699: {'lr': 0.00019939101005621488, 'samples': 1270368, 'steps': 2481, 'loss/train': 1.6869515180587769} -09/20/2021 23:05:11 - INFO - __main__ - Step 39700: {'lr': 0.00019939101005621488, 'samples': 1270400, 'steps': 2481, 'loss/train': 0.8973997831344604} -09/20/2021 23:05:12 - INFO - __main__ - Step 39701: {'lr': 0.00019939101005621488, 'samples': 1270432, 'steps': 2481, 'loss/train': 3.90307354927063} -09/20/2021 23:05:12 - INFO - __main__ - Step 39702: {'lr': 0.00019939101005621488, 'samples': 1270464, 'steps': 2481, 'loss/train': 2.2516815662384033} -09/20/2021 23:05:13 - INFO - __main__ - Step 39703: {'lr': 0.00019939101005621488, 'samples': 1270496, 'steps': 2481, 'loss/train': 2.1730520725250244} -09/20/2021 23:05:14 - INFO - __main__ - Step 39704: {'lr': 0.00019939101005621488, 'samples': 1270528, 'steps': 2481, 'loss/train': 1.0920838117599487} -09/20/2021 23:05:15 - INFO - __main__ - Step 39705: {'lr': 0.00019939101005621488, 'samples': 1270560, 'steps': 2481, 'loss/train': 3.640101432800293} -09/20/2021 23:05:15 - INFO - __main__ - Step 39706: {'lr': 0.00019939101005621488, 'samples': 1270592, 'steps': 2481, 'loss/train': 3.7701094150543213} -09/20/2021 23:05:16 - INFO - __main__ - Step 39707: {'lr': 0.00019939101005621488, 'samples': 1270624, 'steps': 2481, 'loss/train': 3.739887237548828} -09/20/2021 23:05:17 - INFO - __main__ - Step 39708: {'lr': 0.00019939101005621488, 'samples': 1270656, 'steps': 2481, 'loss/train': 3.757505178451538} -09/20/2021 23:05:18 - INFO - __main__ - Step 39709: {'lr': 0.00019939101005621488, 'samples': 1270688, 'steps': 2481, 'loss/train': 3.7572519779205322} -09/20/2021 23:05:18 - INFO - __main__ - Step 39710: {'lr': 0.00019939101005621488, 'samples': 1270720, 'steps': 2481, 'loss/train': 3.7825777530670166} -09/20/2021 23:05:19 - INFO - __main__ - Step 39711: {'lr': 0.00019939101005621488, 'samples': 1270752, 'steps': 2481, 'loss/train': 3.857591390609741} -09/20/2021 23:05:20 - INFO - __main__ - Step 39712: {'lr': 0.00019939101005621488, 'samples': 1270784, 'steps': 2481, 'loss/train': 3.7426109313964844} -09/20/2021 23:05:22 - INFO - __main__ - Step 39713: {'lr': 0.00019939030694115064, 'samples': 1270816, 'steps': 2482, 'loss/train': 2.1014585494995117} -09/20/2021 23:05:22 - INFO - __main__ - Step 39714: {'lr': 0.00019939030694115064, 'samples': 1270848, 'steps': 2482, 'loss/train': 2.416430950164795} -09/20/2021 23:05:23 - INFO - __main__ - Step 39715: {'lr': 0.00019939030694115064, 'samples': 1270880, 'steps': 2482, 'loss/train': 2.2377359867095947} -09/20/2021 23:05:24 - INFO - __main__ - Step 39716: {'lr': 0.00019939030694115064, 'samples': 1270912, 'steps': 2482, 'loss/train': 2.220606565475464} -09/20/2021 23:05:25 - INFO - __main__ - Step 39717: {'lr': 0.00019939030694115064, 'samples': 1270944, 'steps': 2482, 'loss/train': 1.6849933862686157} -09/20/2021 23:05:25 - INFO - __main__ - Step 39718: {'lr': 0.00019939030694115064, 'samples': 1270976, 'steps': 2482, 'loss/train': 2.1999447345733643} -09/20/2021 23:05:26 - INFO - __main__ - Step 39719: {'lr': 0.00019939030694115064, 'samples': 1271008, 'steps': 2482, 'loss/train': 2.432204008102417} -09/20/2021 23:05:27 - INFO - __main__ - Step 39720: {'lr': 0.00019939030694115064, 'samples': 1271040, 'steps': 2482, 'loss/train': 2.8447649478912354} -09/20/2021 23:05:28 - INFO - __main__ - Step 39721: {'lr': 0.00019939030694115064, 'samples': 1271072, 'steps': 2482, 'loss/train': 2.272181272506714} -09/20/2021 23:05:28 - INFO - __main__ - Step 39722: {'lr': 0.00019939030694115064, 'samples': 1271104, 'steps': 2482, 'loss/train': 2.032052516937256} -09/20/2021 23:05:29 - INFO - __main__ - Step 39723: {'lr': 0.00019939030694115064, 'samples': 1271136, 'steps': 2482, 'loss/train': 2.180227279663086} -09/20/2021 23:05:30 - INFO - __main__ - Step 39724: {'lr': 0.00019939030694115064, 'samples': 1271168, 'steps': 2482, 'loss/train': 2.0024118423461914} -09/20/2021 23:05:31 - INFO - __main__ - Step 39725: {'lr': 0.00019939030694115064, 'samples': 1271200, 'steps': 2482, 'loss/train': 2.109225273132324} -09/20/2021 23:05:31 - INFO - __main__ - Step 39726: {'lr': 0.00019939030694115064, 'samples': 1271232, 'steps': 2482, 'loss/train': 2.8353962898254395} -09/20/2021 23:05:32 - INFO - __main__ - Step 39727: {'lr': 0.00019939030694115064, 'samples': 1271264, 'steps': 2482, 'loss/train': 2.2667853832244873} -09/20/2021 23:05:33 - INFO - __main__ - Step 39728: {'lr': 0.00019939030694115064, 'samples': 1271296, 'steps': 2482, 'loss/train': 1.7491223812103271} -09/20/2021 23:05:34 - INFO - __main__ - Step 39729: {'lr': 0.00019938960342166765, 'samples': 1271328, 'steps': 2483, 'loss/train': 1.6561402082443237} -09/20/2021 23:05:35 - INFO - __main__ - Step 39730: {'lr': 0.00019938960342166765, 'samples': 1271360, 'steps': 2483, 'loss/train': 2.0159361362457275} -09/20/2021 23:05:35 - INFO - __main__ - Step 39731: {'lr': 0.00019938960342166765, 'samples': 1271392, 'steps': 2483, 'loss/train': 0.6057297587394714} -09/20/2021 23:05:36 - INFO - __main__ - Step 39732: {'lr': 0.00019938960342166765, 'samples': 1271424, 'steps': 2483, 'loss/train': 1.8165732622146606} -09/20/2021 23:05:37 - INFO - __main__ - Step 39733: {'lr': 0.00019938960342166765, 'samples': 1271456, 'steps': 2483, 'loss/train': 2.0879926681518555} -09/20/2021 23:05:38 - INFO - __main__ - Step 39734: {'lr': 0.00019938960342166765, 'samples': 1271488, 'steps': 2483, 'loss/train': 1.765915870666504} -09/20/2021 23:05:38 - INFO - __main__ - Step 39735: {'lr': 0.00019938960342166765, 'samples': 1271520, 'steps': 2483, 'loss/train': 1.4933910369873047} -09/20/2021 23:05:39 - INFO - __main__ - Step 39736: {'lr': 0.00019938960342166765, 'samples': 1271552, 'steps': 2483, 'loss/train': 0.8716175556182861} -09/20/2021 23:05:40 - INFO - __main__ - Step 39737: {'lr': 0.00019938960342166765, 'samples': 1271584, 'steps': 2483, 'loss/train': 2.422182321548462} -09/20/2021 23:05:41 - INFO - __main__ - Step 39738: {'lr': 0.00019938960342166765, 'samples': 1271616, 'steps': 2483, 'loss/train': 1.3791135549545288} -09/20/2021 23:05:41 - INFO - __main__ - Step 39739: {'lr': 0.00019938960342166765, 'samples': 1271648, 'steps': 2483, 'loss/train': 2.5970091819763184} -09/20/2021 23:05:42 - INFO - __main__ - Step 39740: {'lr': 0.00019938960342166765, 'samples': 1271680, 'steps': 2483, 'loss/train': 2.1459310054779053} -09/20/2021 23:05:43 - INFO - __main__ - Step 39741: {'lr': 0.00019938960342166765, 'samples': 1271712, 'steps': 2483, 'loss/train': 2.2201061248779297} -09/20/2021 23:05:44 - INFO - __main__ - Step 39742: {'lr': 0.00019938960342166765, 'samples': 1271744, 'steps': 2483, 'loss/train': 2.7449965476989746} -09/20/2021 23:05:44 - INFO - __main__ - Step 39743: {'lr': 0.00019938960342166765, 'samples': 1271776, 'steps': 2483, 'loss/train': 1.6630921363830566} -09/20/2021 23:05:46 - INFO - __main__ - Step 39744: {'lr': 0.00019938960342166765, 'samples': 1271808, 'steps': 2483, 'loss/train': 2.455165147781372} -09/20/2021 23:05:46 - INFO - __main__ - Step 39745: {'lr': 0.00019938889949776875, 'samples': 1271840, 'steps': 2484, 'loss/train': 2.6990866661071777} -09/20/2021 23:05:47 - INFO - __main__ - Step 39746: {'lr': 0.00019938889949776875, 'samples': 1271872, 'steps': 2484, 'loss/train': 2.16819167137146} -09/20/2021 23:05:48 - INFO - __main__ - Step 39747: {'lr': 0.00019938889949776875, 'samples': 1271904, 'steps': 2484, 'loss/train': 1.8117517232894897} -09/20/2021 23:05:49 - INFO - __main__ - Step 39748: {'lr': 0.00019938889949776875, 'samples': 1271936, 'steps': 2484, 'loss/train': 1.2388750314712524} -09/20/2021 23:05:49 - INFO - __main__ - Step 39749: {'lr': 0.00019938889949776875, 'samples': 1271968, 'steps': 2484, 'loss/train': 2.197523355484009} -09/20/2021 23:05:50 - INFO - __main__ - Step 39750: {'lr': 0.00019938889949776875, 'samples': 1272000, 'steps': 2484, 'loss/train': 2.256629705429077} -09/20/2021 23:05:51 - INFO - __main__ - Step 39751: {'lr': 0.00019938889949776875, 'samples': 1272032, 'steps': 2484, 'loss/train': 1.0577272176742554} -09/20/2021 23:05:52 - INFO - __main__ - Step 39752: {'lr': 0.00019938889949776875, 'samples': 1272064, 'steps': 2484, 'loss/train': 2.508293390274048} -09/20/2021 23:05:52 - INFO - __main__ - Step 39753: {'lr': 0.00019938889949776875, 'samples': 1272096, 'steps': 2484, 'loss/train': 2.199955940246582} -09/20/2021 23:05:53 - INFO - __main__ - Step 39754: {'lr': 0.00019938889949776875, 'samples': 1272128, 'steps': 2484, 'loss/train': 2.1884381771087646} -09/20/2021 23:05:54 - INFO - __main__ - Step 39755: {'lr': 0.00019938889949776875, 'samples': 1272160, 'steps': 2484, 'loss/train': 2.2756388187408447} -09/20/2021 23:05:55 - INFO - __main__ - Step 39756: {'lr': 0.00019938889949776875, 'samples': 1272192, 'steps': 2484, 'loss/train': 0.43745842576026917} -09/20/2021 23:05:55 - INFO - __main__ - Step 39757: {'lr': 0.00019938889949776875, 'samples': 1272224, 'steps': 2484, 'loss/train': 1.9067258834838867} -09/20/2021 23:05:56 - INFO - __main__ - Step 39758: {'lr': 0.00019938889949776875, 'samples': 1272256, 'steps': 2484, 'loss/train': 2.9398691654205322} -09/20/2021 23:05:57 - INFO - __main__ - Step 39759: {'lr': 0.00019938889949776875, 'samples': 1272288, 'steps': 2484, 'loss/train': 2.314354658126831} -09/20/2021 23:05:58 - INFO - __main__ - Step 39760: {'lr': 0.00019938889949776875, 'samples': 1272320, 'steps': 2484, 'loss/train': 2.4450199604034424} -09/20/2021 23:05:59 - INFO - __main__ - Step 39761: {'lr': 0.0001993881951694568, 'samples': 1272352, 'steps': 2485, 'loss/train': 1.981794834136963} -09/20/2021 23:05:59 - INFO - __main__ - Step 39762: {'lr': 0.0001993881951694568, 'samples': 1272384, 'steps': 2485, 'loss/train': 2.528193473815918} -09/20/2021 23:06:00 - INFO - __main__ - Step 39763: {'lr': 0.0001993881951694568, 'samples': 1272416, 'steps': 2485, 'loss/train': 0.9534387588500977} -09/20/2021 23:06:01 - INFO - __main__ - Step 39764: {'lr': 0.0001993881951694568, 'samples': 1272448, 'steps': 2485, 'loss/train': 1.0088846683502197} -09/20/2021 23:06:02 - INFO - __main__ - Step 39765: {'lr': 0.0001993881951694568, 'samples': 1272480, 'steps': 2485, 'loss/train': 2.2583343982696533} -09/20/2021 23:06:02 - INFO - __main__ - Step 39766: {'lr': 0.0001993881951694568, 'samples': 1272512, 'steps': 2485, 'loss/train': 2.216965675354004} -09/20/2021 23:06:03 - INFO - __main__ - Step 39767: {'lr': 0.0001993881951694568, 'samples': 1272544, 'steps': 2485, 'loss/train': 0.46926942467689514} -09/20/2021 23:06:04 - INFO - __main__ - Step 39768: {'lr': 0.0001993881951694568, 'samples': 1272576, 'steps': 2485, 'loss/train': 2.459202766418457} -09/20/2021 23:06:05 - INFO - __main__ - Step 39769: {'lr': 0.0001993881951694568, 'samples': 1272608, 'steps': 2485, 'loss/train': 1.778822660446167} -09/20/2021 23:06:05 - INFO - __main__ - Step 39770: {'lr': 0.0001993881951694568, 'samples': 1272640, 'steps': 2485, 'loss/train': 1.9055708646774292} -09/20/2021 23:06:06 - INFO - __main__ - Step 39771: {'lr': 0.0001993881951694568, 'samples': 1272672, 'steps': 2485, 'loss/train': 2.472318410873413} -09/20/2021 23:06:07 - INFO - __main__ - Step 39772: {'lr': 0.0001993881951694568, 'samples': 1272704, 'steps': 2485, 'loss/train': 2.291224718093872} -09/20/2021 23:06:08 - INFO - __main__ - Step 39773: {'lr': 0.0001993881951694568, 'samples': 1272736, 'steps': 2485, 'loss/train': 1.7329825162887573} -09/20/2021 23:06:09 - INFO - __main__ - Step 39774: {'lr': 0.0001993881951694568, 'samples': 1272768, 'steps': 2485, 'loss/train': 1.4262621402740479} -09/20/2021 23:06:10 - INFO - __main__ - Step 39775: {'lr': 0.0001993881951694568, 'samples': 1272800, 'steps': 2485, 'loss/train': 1.021541953086853} -09/20/2021 23:06:10 - INFO - __main__ - Step 39776: {'lr': 0.0001993881951694568, 'samples': 1272832, 'steps': 2485, 'loss/train': 1.9188125133514404} -09/20/2021 23:06:11 - INFO - __main__ - Step 39777: {'lr': 0.00019938749043673466, 'samples': 1272864, 'steps': 2486, 'loss/train': 2.4265754222869873} -09/20/2021 23:06:12 - INFO - __main__ - Step 39778: {'lr': 0.00019938749043673466, 'samples': 1272896, 'steps': 2486, 'loss/train': 1.332082986831665} -09/20/2021 23:06:13 - INFO - __main__ - Step 39779: {'lr': 0.00019938749043673466, 'samples': 1272928, 'steps': 2486, 'loss/train': 2.637876272201538} -09/20/2021 23:06:13 - INFO - __main__ - Step 39780: {'lr': 0.00019938749043673466, 'samples': 1272960, 'steps': 2486, 'loss/train': 2.287187337875366} -09/20/2021 23:06:14 - INFO - __main__ - Step 39781: {'lr': 0.00019938749043673466, 'samples': 1272992, 'steps': 2486, 'loss/train': 1.9475568532943726} -09/20/2021 23:06:15 - INFO - __main__ - Step 39782: {'lr': 0.00019938749043673466, 'samples': 1273024, 'steps': 2486, 'loss/train': 2.1111679077148438} -09/20/2021 23:06:16 - INFO - __main__ - Step 39783: {'lr': 0.00019938749043673466, 'samples': 1273056, 'steps': 2486, 'loss/train': 2.1717658042907715} -09/20/2021 23:06:16 - INFO - __main__ - Step 39784: {'lr': 0.00019938749043673466, 'samples': 1273088, 'steps': 2486, 'loss/train': 2.085736036300659} -09/20/2021 23:06:17 - INFO - __main__ - Step 39785: {'lr': 0.00019938749043673466, 'samples': 1273120, 'steps': 2486, 'loss/train': 2.3004677295684814} -09/20/2021 23:06:18 - INFO - __main__ - Step 39786: {'lr': 0.00019938749043673466, 'samples': 1273152, 'steps': 2486, 'loss/train': 2.0287716388702393} -09/20/2021 23:06:19 - INFO - __main__ - Step 39787: {'lr': 0.00019938749043673466, 'samples': 1273184, 'steps': 2486, 'loss/train': 2.294969081878662} -09/20/2021 23:06:19 - INFO - __main__ - Step 39788: {'lr': 0.00019938749043673466, 'samples': 1273216, 'steps': 2486, 'loss/train': 3.3275504112243652} -09/20/2021 23:06:20 - INFO - __main__ - Step 39789: {'lr': 0.00019938749043673466, 'samples': 1273248, 'steps': 2486, 'loss/train': 2.2539751529693604} -09/20/2021 23:06:21 - INFO - __main__ - Step 39790: {'lr': 0.00019938749043673466, 'samples': 1273280, 'steps': 2486, 'loss/train': 2.576380968093872} -09/20/2021 23:06:22 - INFO - __main__ - Step 39791: {'lr': 0.00019938749043673466, 'samples': 1273312, 'steps': 2486, 'loss/train': 1.2777130603790283} -09/20/2021 23:06:22 - INFO - __main__ - Step 39792: {'lr': 0.00019938749043673466, 'samples': 1273344, 'steps': 2486, 'loss/train': 2.754120111465454} -09/20/2021 23:06:23 - INFO - __main__ - Step 39793: {'lr': 0.00019938678529960523, 'samples': 1273376, 'steps': 2487, 'loss/train': 2.5865581035614014} -09/20/2021 23:06:24 - INFO - __main__ - Step 39794: {'lr': 0.00019938678529960523, 'samples': 1273408, 'steps': 2487, 'loss/train': 2.219665765762329} -09/20/2021 23:06:25 - INFO - __main__ - Step 39795: {'lr': 0.00019938678529960523, 'samples': 1273440, 'steps': 2487, 'loss/train': 2.622295379638672} -09/20/2021 23:06:26 - INFO - __main__ - Step 39796: {'lr': 0.00019938678529960523, 'samples': 1273472, 'steps': 2487, 'loss/train': 1.7234560251235962} -09/20/2021 23:06:26 - INFO - __main__ - Step 39797: {'lr': 0.00019938678529960523, 'samples': 1273504, 'steps': 2487, 'loss/train': 2.2737927436828613} -09/20/2021 23:06:27 - INFO - __main__ - Step 39798: {'lr': 0.00019938678529960523, 'samples': 1273536, 'steps': 2487, 'loss/train': 0.9667713046073914} -09/20/2021 23:06:28 - INFO - __main__ - Step 39799: {'lr': 0.00019938678529960523, 'samples': 1273568, 'steps': 2487, 'loss/train': 3.1724774837493896} -09/20/2021 23:06:29 - INFO - __main__ - Step 39800: {'lr': 0.00019938678529960523, 'samples': 1273600, 'steps': 2487, 'loss/train': 1.879919171333313} -09/20/2021 23:06:29 - INFO - __main__ - Step 39801: {'lr': 0.00019938678529960523, 'samples': 1273632, 'steps': 2487, 'loss/train': 2.6251492500305176} -09/20/2021 23:06:30 - INFO - __main__ - Step 39802: {'lr': 0.00019938678529960523, 'samples': 1273664, 'steps': 2487, 'loss/train': 1.8769391775131226} -09/20/2021 23:06:31 - INFO - __main__ - Step 39803: {'lr': 0.00019938678529960523, 'samples': 1273696, 'steps': 2487, 'loss/train': 1.8267295360565186} -09/20/2021 23:06:32 - INFO - __main__ - Step 39804: {'lr': 0.00019938678529960523, 'samples': 1273728, 'steps': 2487, 'loss/train': 2.6318764686584473} -09/20/2021 23:06:33 - INFO - __main__ - Step 39805: {'lr': 0.00019938678529960523, 'samples': 1273760, 'steps': 2487, 'loss/train': 2.3935089111328125} -09/20/2021 23:06:34 - INFO - __main__ - Step 39806: {'lr': 0.00019938678529960523, 'samples': 1273792, 'steps': 2487, 'loss/train': 2.3398244380950928} -09/20/2021 23:06:35 - INFO - __main__ - Step 39807: {'lr': 0.00019938678529960523, 'samples': 1273824, 'steps': 2487, 'loss/train': 2.6010708808898926} -09/20/2021 23:06:35 - INFO - __main__ - Step 39808: {'lr': 0.00019938678529960523, 'samples': 1273856, 'steps': 2487, 'loss/train': 2.58282470703125} -09/20/2021 23:06:36 - INFO - __main__ - Step 39809: {'lr': 0.00019938607975807134, 'samples': 1273888, 'steps': 2488, 'loss/train': 2.0091168880462646} -09/20/2021 23:06:37 - INFO - __main__ - Step 39810: {'lr': 0.00019938607975807134, 'samples': 1273920, 'steps': 2488, 'loss/train': 3.091298818588257} -09/20/2021 23:06:38 - INFO - __main__ - Step 39811: {'lr': 0.00019938607975807134, 'samples': 1273952, 'steps': 2488, 'loss/train': 3.6991517543792725} -09/20/2021 23:06:38 - INFO - __main__ - Step 39812: {'lr': 0.00019938607975807134, 'samples': 1273984, 'steps': 2488, 'loss/train': 2.0987260341644287} -09/20/2021 23:06:39 - INFO - __main__ - Step 39813: {'lr': 0.00019938607975807134, 'samples': 1274016, 'steps': 2488, 'loss/train': 2.9799792766571045} -09/20/2021 23:06:40 - INFO - __main__ - Step 39814: {'lr': 0.00019938607975807134, 'samples': 1274048, 'steps': 2488, 'loss/train': 2.4715113639831543} -09/20/2021 23:06:41 - INFO - __main__ - Step 39815: {'lr': 0.00019938607975807134, 'samples': 1274080, 'steps': 2488, 'loss/train': 1.922049880027771} -09/20/2021 23:06:41 - INFO - __main__ - Step 39816: {'lr': 0.00019938607975807134, 'samples': 1274112, 'steps': 2488, 'loss/train': 1.8028044700622559} -09/20/2021 23:06:42 - INFO - __main__ - Step 39817: {'lr': 0.00019938607975807134, 'samples': 1274144, 'steps': 2488, 'loss/train': 2.247389316558838} -09/20/2021 23:06:43 - INFO - __main__ - Step 39818: {'lr': 0.00019938607975807134, 'samples': 1274176, 'steps': 2488, 'loss/train': 2.7371718883514404} -09/20/2021 23:06:44 - INFO - __main__ - Step 39819: {'lr': 0.00019938607975807134, 'samples': 1274208, 'steps': 2488, 'loss/train': 1.5731345415115356} -09/20/2021 23:06:44 - INFO - __main__ - Step 39820: {'lr': 0.00019938607975807134, 'samples': 1274240, 'steps': 2488, 'loss/train': 0.14694972336292267} -09/20/2021 23:06:45 - INFO - __main__ - Step 39821: {'lr': 0.00019938607975807134, 'samples': 1274272, 'steps': 2488, 'loss/train': 0.32726648449897766} -09/20/2021 23:06:46 - INFO - __main__ - Step 39822: {'lr': 0.00019938607975807134, 'samples': 1274304, 'steps': 2488, 'loss/train': 0.4223954975605011} -09/20/2021 23:06:47 - INFO - __main__ - Step 39823: {'lr': 0.00019938607975807134, 'samples': 1274336, 'steps': 2488, 'loss/train': 0.13395285606384277} -09/20/2021 23:06:47 - INFO - __main__ - Step 39824: {'lr': 0.00019938607975807134, 'samples': 1274368, 'steps': 2488, 'loss/train': 2.127182722091675} -09/20/2021 23:06:48 - INFO - __main__ - Step 39825: {'lr': 0.00019938537381213587, 'samples': 1274400, 'steps': 2489, 'loss/train': 1.107175588607788} -09/20/2021 23:06:49 - INFO - __main__ - Step 39826: {'lr': 0.00019938537381213587, 'samples': 1274432, 'steps': 2489, 'loss/train': 1.1092182397842407} -09/20/2021 23:06:50 - INFO - __main__ - Step 39827: {'lr': 0.00019938537381213587, 'samples': 1274464, 'steps': 2489, 'loss/train': 1.093647837638855} -09/20/2021 23:06:51 - INFO - __main__ - Step 39828: {'lr': 0.00019938537381213587, 'samples': 1274496, 'steps': 2489, 'loss/train': 1.1210136413574219} -09/20/2021 23:06:51 - INFO - __main__ - Step 39829: {'lr': 0.00019938537381213587, 'samples': 1274528, 'steps': 2489, 'loss/train': 1.5562803745269775} -09/20/2021 23:06:52 - INFO - __main__ - Step 39830: {'lr': 0.00019938537381213587, 'samples': 1274560, 'steps': 2489, 'loss/train': 1.5543606281280518} -09/20/2021 23:06:53 - INFO - __main__ - Step 39831: {'lr': 0.00019938537381213587, 'samples': 1274592, 'steps': 2489, 'loss/train': 1.1339784860610962} -09/20/2021 23:06:54 - INFO - __main__ - Step 39832: {'lr': 0.00019938537381213587, 'samples': 1274624, 'steps': 2489, 'loss/train': 2.1838533878326416} -09/20/2021 23:06:54 - INFO - __main__ - Step 39833: {'lr': 0.00019938537381213587, 'samples': 1274656, 'steps': 2489, 'loss/train': 1.141800880432129} -09/20/2021 23:06:55 - INFO - __main__ - Step 39834: {'lr': 0.00019938537381213587, 'samples': 1274688, 'steps': 2489, 'loss/train': 2.4936249256134033} -09/20/2021 23:06:56 - INFO - __main__ - Step 39835: {'lr': 0.00019938537381213587, 'samples': 1274720, 'steps': 2489, 'loss/train': 1.7733272314071655} -09/20/2021 23:06:57 - INFO - __main__ - Step 39836: {'lr': 0.00019938537381213587, 'samples': 1274752, 'steps': 2489, 'loss/train': 1.524106740951538} -09/20/2021 23:06:57 - INFO - __main__ - Step 39837: {'lr': 0.00019938537381213587, 'samples': 1274784, 'steps': 2489, 'loss/train': 2.148780584335327} -09/20/2021 23:06:58 - INFO - __main__ - Step 39838: {'lr': 0.00019938537381213587, 'samples': 1274816, 'steps': 2489, 'loss/train': 0.17096614837646484} -09/20/2021 23:07:00 - INFO - __main__ - Step 39839: {'lr': 0.00019938537381213587, 'samples': 1274848, 'steps': 2489, 'loss/train': 1.1450064182281494} -09/20/2021 23:07:01 - INFO - __main__ - Step 39840: {'lr': 0.00019938537381213587, 'samples': 1274880, 'steps': 2489, 'loss/train': 1.438508152961731} -09/20/2021 23:07:01 - INFO - __main__ - Step 39841: {'lr': 0.00019938466746180172, 'samples': 1274912, 'steps': 2490, 'loss/train': 1.148956298828125} -09/20/2021 23:07:02 - INFO - __main__ - Step 39842: {'lr': 0.00019938466746180172, 'samples': 1274944, 'steps': 2490, 'loss/train': 3.102729082107544} -09/20/2021 23:07:03 - INFO - __main__ - Step 39843: {'lr': 0.00019938466746180172, 'samples': 1274976, 'steps': 2490, 'loss/train': 2.6658453941345215} -09/20/2021 23:07:04 - INFO - __main__ - Step 39844: {'lr': 0.00019938466746180172, 'samples': 1275008, 'steps': 2490, 'loss/train': 1.7461313009262085} -09/20/2021 23:07:04 - INFO - __main__ - Step 39845: {'lr': 0.00019938466746180172, 'samples': 1275040, 'steps': 2490, 'loss/train': 2.6149442195892334} -09/20/2021 23:07:05 - INFO - __main__ - Step 39846: {'lr': 0.00019938466746180172, 'samples': 1275072, 'steps': 2490, 'loss/train': 2.3321571350097656} -09/20/2021 23:07:06 - INFO - __main__ - Step 39847: {'lr': 0.00019938466746180172, 'samples': 1275104, 'steps': 2490, 'loss/train': 2.7145321369171143} -09/20/2021 23:07:07 - INFO - __main__ - Step 39848: {'lr': 0.00019938466746180172, 'samples': 1275136, 'steps': 2490, 'loss/train': 2.1332216262817383} -09/20/2021 23:07:07 - INFO - __main__ - Step 39849: {'lr': 0.00019938466746180172, 'samples': 1275168, 'steps': 2490, 'loss/train': 1.8311938047409058} -09/20/2021 23:07:08 - INFO - __main__ - Step 39850: {'lr': 0.00019938466746180172, 'samples': 1275200, 'steps': 2490, 'loss/train': 2.371483325958252} -09/20/2021 23:07:09 - INFO - __main__ - Step 39851: {'lr': 0.00019938466746180172, 'samples': 1275232, 'steps': 2490, 'loss/train': 1.0719479322433472} -09/20/2021 23:07:10 - INFO - __main__ - Step 39852: {'lr': 0.00019938466746180172, 'samples': 1275264, 'steps': 2490, 'loss/train': 1.85316801071167} -09/20/2021 23:07:10 - INFO - __main__ - Step 39853: {'lr': 0.00019938466746180172, 'samples': 1275296, 'steps': 2490, 'loss/train': 0.8104522824287415} -09/20/2021 23:07:11 - INFO - __main__ - Step 39854: {'lr': 0.00019938466746180172, 'samples': 1275328, 'steps': 2490, 'loss/train': 1.6681318283081055} -09/20/2021 23:07:12 - INFO - __main__ - Step 39855: {'lr': 0.00019938466746180172, 'samples': 1275360, 'steps': 2490, 'loss/train': 2.6985855102539062} -09/20/2021 23:07:13 - INFO - __main__ - Step 39856: {'lr': 0.00019938466746180172, 'samples': 1275392, 'steps': 2490, 'loss/train': 1.310779094696045} -09/20/2021 23:07:14 - INFO - __main__ - Step 39857: {'lr': 0.00019938396070707173, 'samples': 1275424, 'steps': 2491, 'loss/train': 2.121206283569336} -09/20/2021 23:07:14 - INFO - __main__ - Step 39858: {'lr': 0.00019938396070707173, 'samples': 1275456, 'steps': 2491, 'loss/train': 2.469295024871826} -09/20/2021 23:07:15 - INFO - __main__ - Step 39859: {'lr': 0.00019938396070707173, 'samples': 1275488, 'steps': 2491, 'loss/train': 2.2209174633026123} -09/20/2021 23:07:16 - INFO - __main__ - Step 39860: {'lr': 0.00019938396070707173, 'samples': 1275520, 'steps': 2491, 'loss/train': 2.6661813259124756} -09/20/2021 23:07:17 - INFO - __main__ - Step 39861: {'lr': 0.00019938396070707173, 'samples': 1275552, 'steps': 2491, 'loss/train': 1.2006888389587402} -09/20/2021 23:07:17 - INFO - __main__ - Step 39862: {'lr': 0.00019938396070707173, 'samples': 1275584, 'steps': 2491, 'loss/train': 1.7660115957260132} -09/20/2021 23:07:18 - INFO - __main__ - Step 39863: {'lr': 0.00019938396070707173, 'samples': 1275616, 'steps': 2491, 'loss/train': 2.4487533569335938} -09/20/2021 23:07:19 - INFO - __main__ - Step 39864: {'lr': 0.00019938396070707173, 'samples': 1275648, 'steps': 2491, 'loss/train': 2.1941535472869873} -09/20/2021 23:07:20 - INFO - __main__ - Step 39865: {'lr': 0.00019938396070707173, 'samples': 1275680, 'steps': 2491, 'loss/train': 2.6036369800567627} -09/20/2021 23:07:20 - INFO - __main__ - Step 39866: {'lr': 0.00019938396070707173, 'samples': 1275712, 'steps': 2491, 'loss/train': 2.141728401184082} -09/20/2021 23:07:21 - INFO - __main__ - Step 39867: {'lr': 0.00019938396070707173, 'samples': 1275744, 'steps': 2491, 'loss/train': 2.26155686378479} -09/20/2021 23:07:22 - INFO - __main__ - Step 39868: {'lr': 0.00019938396070707173, 'samples': 1275776, 'steps': 2491, 'loss/train': 1.8867820501327515} -09/20/2021 23:07:23 - INFO - __main__ - Step 39869: {'lr': 0.00019938396070707173, 'samples': 1275808, 'steps': 2491, 'loss/train': 1.292344570159912} -09/20/2021 23:07:24 - INFO - __main__ - Step 39870: {'lr': 0.00019938396070707173, 'samples': 1275840, 'steps': 2491, 'loss/train': 1.7973614931106567} -09/20/2021 23:07:25 - INFO - __main__ - Step 39871: {'lr': 0.00019938396070707173, 'samples': 1275872, 'steps': 2491, 'loss/train': 2.9092931747436523} -09/20/2021 23:07:25 - INFO - __main__ - Step 39872: {'lr': 0.00019938396070707173, 'samples': 1275904, 'steps': 2491, 'loss/train': 1.673323392868042} -09/20/2021 23:07:26 - INFO - __main__ - Step 39873: {'lr': 0.00019938325354794878, 'samples': 1275936, 'steps': 2492, 'loss/train': 1.5214307308197021} -09/20/2021 23:07:27 - INFO - __main__ - Step 39874: {'lr': 0.00019938325354794878, 'samples': 1275968, 'steps': 2492, 'loss/train': 1.5271871089935303} -09/20/2021 23:07:28 - INFO - __main__ - Step 39875: {'lr': 0.00019938325354794878, 'samples': 1276000, 'steps': 2492, 'loss/train': 2.0316855907440186} -09/20/2021 23:07:28 - INFO - __main__ - Step 39876: {'lr': 0.00019938325354794878, 'samples': 1276032, 'steps': 2492, 'loss/train': 2.4498708248138428} -09/20/2021 23:07:29 - INFO - __main__ - Step 39877: {'lr': 0.00019938325354794878, 'samples': 1276064, 'steps': 2492, 'loss/train': 2.083807945251465} -09/20/2021 23:07:30 - INFO - __main__ - Step 39878: {'lr': 0.00019938325354794878, 'samples': 1276096, 'steps': 2492, 'loss/train': 1.8531326055526733} -09/20/2021 23:07:31 - INFO - __main__ - Step 39879: {'lr': 0.00019938325354794878, 'samples': 1276128, 'steps': 2492, 'loss/train': 1.533196210861206} -09/20/2021 23:07:31 - INFO - __main__ - Step 39880: {'lr': 0.00019938325354794878, 'samples': 1276160, 'steps': 2492, 'loss/train': 1.6503949165344238} -09/20/2021 23:07:32 - INFO - __main__ - Step 39881: {'lr': 0.00019938325354794878, 'samples': 1276192, 'steps': 2492, 'loss/train': 0.5426570773124695} -09/20/2021 23:07:33 - INFO - __main__ - Step 39882: {'lr': 0.00019938325354794878, 'samples': 1276224, 'steps': 2492, 'loss/train': 2.4669761657714844} -09/20/2021 23:07:34 - INFO - __main__ - Step 39883: {'lr': 0.00019938325354794878, 'samples': 1276256, 'steps': 2492, 'loss/train': 2.028458833694458} -09/20/2021 23:07:34 - INFO - __main__ - Step 39884: {'lr': 0.00019938325354794878, 'samples': 1276288, 'steps': 2492, 'loss/train': 2.651736259460449} -09/20/2021 23:07:35 - INFO - __main__ - Step 39885: {'lr': 0.00019938325354794878, 'samples': 1276320, 'steps': 2492, 'loss/train': 2.477189064025879} -09/20/2021 23:07:36 - INFO - __main__ - Step 39886: {'lr': 0.00019938325354794878, 'samples': 1276352, 'steps': 2492, 'loss/train': 2.2157070636749268} -09/20/2021 23:07:37 - INFO - __main__ - Step 39887: {'lr': 0.00019938325354794878, 'samples': 1276384, 'steps': 2492, 'loss/train': 2.554361581802368} -09/20/2021 23:07:37 - INFO - __main__ - Step 39888: {'lr': 0.00019938325354794878, 'samples': 1276416, 'steps': 2492, 'loss/train': 2.157956600189209} -09/20/2021 23:07:38 - INFO - __main__ - Step 39889: {'lr': 0.00019938254598443576, 'samples': 1276448, 'steps': 2493, 'loss/train': 2.140197992324829} -09/20/2021 23:07:39 - INFO - __main__ - Step 39890: {'lr': 0.00019938254598443576, 'samples': 1276480, 'steps': 2493, 'loss/train': 2.3924455642700195} -09/20/2021 23:07:40 - INFO - __main__ - Step 39891: {'lr': 0.00019938254598443576, 'samples': 1276512, 'steps': 2493, 'loss/train': 0.9648749828338623} -09/20/2021 23:07:41 - INFO - __main__ - Step 39892: {'lr': 0.00019938254598443576, 'samples': 1276544, 'steps': 2493, 'loss/train': 1.0861612558364868} -09/20/2021 23:07:41 - INFO - __main__ - Step 39893: {'lr': 0.00019938254598443576, 'samples': 1276576, 'steps': 2493, 'loss/train': 1.892821192741394} -09/20/2021 23:07:42 - INFO - __main__ - Step 39894: {'lr': 0.00019938254598443576, 'samples': 1276608, 'steps': 2493, 'loss/train': 4.798769474029541} -09/20/2021 23:07:43 - INFO - __main__ - Step 39895: {'lr': 0.00019938254598443576, 'samples': 1276640, 'steps': 2493, 'loss/train': 2.305185317993164} -09/20/2021 23:07:44 - INFO - __main__ - Step 39896: {'lr': 0.00019938254598443576, 'samples': 1276672, 'steps': 2493, 'loss/train': 2.3051421642303467} -09/20/2021 23:07:44 - INFO - __main__ - Step 39897: {'lr': 0.00019938254598443576, 'samples': 1276704, 'steps': 2493, 'loss/train': 2.150209903717041} -09/20/2021 23:07:45 - INFO - __main__ - Step 39898: {'lr': 0.00019938254598443576, 'samples': 1276736, 'steps': 2493, 'loss/train': 1.9601994752883911} -09/20/2021 23:07:46 - INFO - __main__ - Step 39899: {'lr': 0.00019938254598443576, 'samples': 1276768, 'steps': 2493, 'loss/train': 1.7638944387435913} -09/20/2021 23:07:47 - INFO - __main__ - Step 39900: {'lr': 0.00019938254598443576, 'samples': 1276800, 'steps': 2493, 'loss/train': 1.708306074142456} -09/20/2021 23:07:48 - INFO - __main__ - Step 39901: {'lr': 0.00019938254598443576, 'samples': 1276832, 'steps': 2493, 'loss/train': 2.5665946006774902} -09/20/2021 23:07:49 - INFO - __main__ - Step 39902: {'lr': 0.00019938254598443576, 'samples': 1276864, 'steps': 2493, 'loss/train': 2.6103713512420654} -09/20/2021 23:07:50 - INFO - __main__ - Step 39903: {'lr': 0.00019938254598443576, 'samples': 1276896, 'steps': 2493, 'loss/train': 2.499943733215332} -09/20/2021 23:07:50 - INFO - __main__ - Step 39904: {'lr': 0.00019938254598443576, 'samples': 1276928, 'steps': 2493, 'loss/train': 1.5342357158660889} -09/20/2021 23:07:51 - INFO - __main__ - Step 39905: {'lr': 0.00019938183801653553, 'samples': 1276960, 'steps': 2494, 'loss/train': 1.1548124551773071} -09/20/2021 23:07:52 - INFO - __main__ - Step 39906: {'lr': 0.00019938183801653553, 'samples': 1276992, 'steps': 2494, 'loss/train': 1.7626210451126099} -09/20/2021 23:07:53 - INFO - __main__ - Step 39907: {'lr': 0.00019938183801653553, 'samples': 1277024, 'steps': 2494, 'loss/train': 3.939422369003296} -09/20/2021 23:07:53 - INFO - __main__ - Step 39908: {'lr': 0.00019938183801653553, 'samples': 1277056, 'steps': 2494, 'loss/train': 1.7556676864624023} -09/20/2021 23:07:54 - INFO - __main__ - Step 39909: {'lr': 0.00019938183801653553, 'samples': 1277088, 'steps': 2494, 'loss/train': 1.8132026195526123} -09/20/2021 23:07:55 - INFO - __main__ - Step 39910: {'lr': 0.00019938183801653553, 'samples': 1277120, 'steps': 2494, 'loss/train': 1.3790749311447144} -09/20/2021 23:07:56 - INFO - __main__ - Step 39911: {'lr': 0.00019938183801653553, 'samples': 1277152, 'steps': 2494, 'loss/train': 2.049253463745117} -09/20/2021 23:07:56 - INFO - __main__ - Step 39912: {'lr': 0.00019938183801653553, 'samples': 1277184, 'steps': 2494, 'loss/train': 1.8011550903320312} -09/20/2021 23:07:57 - INFO - __main__ - Step 39913: {'lr': 0.00019938183801653553, 'samples': 1277216, 'steps': 2494, 'loss/train': 1.7970595359802246} -09/20/2021 23:07:58 - INFO - __main__ - Step 39914: {'lr': 0.00019938183801653553, 'samples': 1277248, 'steps': 2494, 'loss/train': 2.0014536380767822} -09/20/2021 23:07:59 - INFO - __main__ - Step 39915: {'lr': 0.00019938183801653553, 'samples': 1277280, 'steps': 2494, 'loss/train': 2.1890830993652344} -09/20/2021 23:07:59 - INFO - __main__ - Step 39916: {'lr': 0.00019938183801653553, 'samples': 1277312, 'steps': 2494, 'loss/train': 2.142937183380127} -09/20/2021 23:08:00 - INFO - __main__ - Step 39917: {'lr': 0.00019938183801653553, 'samples': 1277344, 'steps': 2494, 'loss/train': 2.578706979751587} -09/20/2021 23:08:01 - INFO - __main__ - Step 39918: {'lr': 0.00019938183801653553, 'samples': 1277376, 'steps': 2494, 'loss/train': 2.3127846717834473} -09/20/2021 23:08:02 - INFO - __main__ - Step 39919: {'lr': 0.00019938183801653553, 'samples': 1277408, 'steps': 2494, 'loss/train': 1.6101881265640259} -09/20/2021 23:08:02 - INFO - __main__ - Step 39920: {'lr': 0.00019938183801653553, 'samples': 1277440, 'steps': 2494, 'loss/train': 2.1013736724853516} -09/20/2021 23:08:03 - INFO - __main__ - Step 39921: {'lr': 0.00019938112964425103, 'samples': 1277472, 'steps': 2495, 'loss/train': 1.5990769863128662} -09/20/2021 23:08:04 - INFO - __main__ - Step 39922: {'lr': 0.00019938112964425103, 'samples': 1277504, 'steps': 2495, 'loss/train': 1.2624945640563965} -09/20/2021 23:08:05 - INFO - __main__ - Step 39923: {'lr': 0.00019938112964425103, 'samples': 1277536, 'steps': 2495, 'loss/train': 1.6985931396484375} -09/20/2021 23:08:06 - INFO - __main__ - Step 39924: {'lr': 0.00019938112964425103, 'samples': 1277568, 'steps': 2495, 'loss/train': 2.3967740535736084} -09/20/2021 23:08:06 - INFO - __main__ - Step 39925: {'lr': 0.00019938112964425103, 'samples': 1277600, 'steps': 2495, 'loss/train': 3.289109706878662} -09/20/2021 23:08:07 - INFO - __main__ - Step 39926: {'lr': 0.00019938112964425103, 'samples': 1277632, 'steps': 2495, 'loss/train': 2.581519842147827} -09/20/2021 23:08:08 - INFO - __main__ - Step 39927: {'lr': 0.00019938112964425103, 'samples': 1277664, 'steps': 2495, 'loss/train': 1.5953938961029053} -09/20/2021 23:08:09 - INFO - __main__ - Step 39928: {'lr': 0.00019938112964425103, 'samples': 1277696, 'steps': 2495, 'loss/train': 2.654222011566162} -09/20/2021 23:08:09 - INFO - __main__ - Step 39929: {'lr': 0.00019938112964425103, 'samples': 1277728, 'steps': 2495, 'loss/train': 1.8295648097991943} -09/20/2021 23:08:10 - INFO - __main__ - Step 39930: {'lr': 0.00019938112964425103, 'samples': 1277760, 'steps': 2495, 'loss/train': 0.6683254837989807} -09/20/2021 23:08:11 - INFO - __main__ - Step 39931: {'lr': 0.00019938112964425103, 'samples': 1277792, 'steps': 2495, 'loss/train': 0.6863189935684204} -09/20/2021 23:08:12 - INFO - __main__ - Step 39932: {'lr': 0.00019938112964425103, 'samples': 1277824, 'steps': 2495, 'loss/train': 1.1768494844436646} -09/20/2021 23:08:13 - INFO - __main__ - Step 39933: {'lr': 0.00019938112964425103, 'samples': 1277856, 'steps': 2495, 'loss/train': 1.1987751722335815} -09/20/2021 23:08:14 - INFO - __main__ - Step 39934: {'lr': 0.00019938112964425103, 'samples': 1277888, 'steps': 2495, 'loss/train': 2.180779218673706} -09/20/2021 23:08:14 - INFO - __main__ - Step 39935: {'lr': 0.00019938112964425103, 'samples': 1277920, 'steps': 2495, 'loss/train': 2.5196950435638428} -09/20/2021 23:08:15 - INFO - __main__ - Step 39936: {'lr': 0.00019938112964425103, 'samples': 1277952, 'steps': 2495, 'loss/train': 3.4807040691375732} -09/20/2021 23:08:16 - INFO - __main__ - Step 39937: {'lr': 0.0001993804208675851, 'samples': 1277984, 'steps': 2496, 'loss/train': 2.437088966369629} -09/20/2021 23:08:17 - INFO - __main__ - Step 39938: {'lr': 0.0001993804208675851, 'samples': 1278016, 'steps': 2496, 'loss/train': 2.1889240741729736} -09/20/2021 23:08:17 - INFO - __main__ - Step 39939: {'lr': 0.0001993804208675851, 'samples': 1278048, 'steps': 2496, 'loss/train': 2.2905967235565186} -09/20/2021 23:08:18 - INFO - __main__ - Step 39940: {'lr': 0.0001993804208675851, 'samples': 1278080, 'steps': 2496, 'loss/train': 2.771413564682007} -09/20/2021 23:08:19 - INFO - __main__ - Step 39941: {'lr': 0.0001993804208675851, 'samples': 1278112, 'steps': 2496, 'loss/train': 0.6926093101501465} -09/20/2021 23:08:20 - INFO - __main__ - Step 39942: {'lr': 0.0001993804208675851, 'samples': 1278144, 'steps': 2496, 'loss/train': 1.8852856159210205} -09/20/2021 23:08:20 - INFO - __main__ - Step 39943: {'lr': 0.0001993804208675851, 'samples': 1278176, 'steps': 2496, 'loss/train': 1.885626196861267} -09/20/2021 23:08:21 - INFO - __main__ - Step 39944: {'lr': 0.0001993804208675851, 'samples': 1278208, 'steps': 2496, 'loss/train': 2.2979328632354736} -09/20/2021 23:08:22 - INFO - __main__ - Step 39945: {'lr': 0.0001993804208675851, 'samples': 1278240, 'steps': 2496, 'loss/train': 2.5994491577148438} -09/20/2021 23:08:23 - INFO - __main__ - Step 39946: {'lr': 0.0001993804208675851, 'samples': 1278272, 'steps': 2496, 'loss/train': 1.7225943803787231} -09/20/2021 23:08:23 - INFO - __main__ - Step 39947: {'lr': 0.0001993804208675851, 'samples': 1278304, 'steps': 2496, 'loss/train': 1.5111074447631836} -09/20/2021 23:08:24 - INFO - __main__ - Step 39948: {'lr': 0.0001993804208675851, 'samples': 1278336, 'steps': 2496, 'loss/train': 2.3083009719848633} -09/20/2021 23:08:25 - INFO - __main__ - Step 39949: {'lr': 0.0001993804208675851, 'samples': 1278368, 'steps': 2496, 'loss/train': 3.1088500022888184} -09/20/2021 23:08:26 - INFO - __main__ - Step 39950: {'lr': 0.0001993804208675851, 'samples': 1278400, 'steps': 2496, 'loss/train': 2.1433780193328857} -09/20/2021 23:08:26 - INFO - __main__ - Step 39951: {'lr': 0.0001993804208675851, 'samples': 1278432, 'steps': 2496, 'loss/train': 2.871584892272949} -09/20/2021 23:08:27 - INFO - __main__ - Step 39952: {'lr': 0.0001993804208675851, 'samples': 1278464, 'steps': 2496, 'loss/train': 2.316348075866699} -09/20/2021 23:08:28 - INFO - __main__ - Step 39953: {'lr': 0.00019937971168654058, 'samples': 1278496, 'steps': 2497, 'loss/train': 1.3976713418960571} -09/20/2021 23:08:29 - INFO - __main__ - Step 39954: {'lr': 0.00019937971168654058, 'samples': 1278528, 'steps': 2497, 'loss/train': 2.197070837020874} -09/20/2021 23:08:30 - INFO - __main__ - Step 39955: {'lr': 0.00019937971168654058, 'samples': 1278560, 'steps': 2497, 'loss/train': 2.1540451049804688} -09/20/2021 23:08:30 - INFO - __main__ - Step 39956: {'lr': 0.00019937971168654058, 'samples': 1278592, 'steps': 2497, 'loss/train': 2.5232508182525635} -09/20/2021 23:08:31 - INFO - __main__ - Step 39957: {'lr': 0.00019937971168654058, 'samples': 1278624, 'steps': 2497, 'loss/train': 1.944364070892334} -09/20/2021 23:08:32 - INFO - __main__ - Step 39958: {'lr': 0.00019937971168654058, 'samples': 1278656, 'steps': 2497, 'loss/train': 2.5599160194396973} -09/20/2021 23:08:33 - INFO - __main__ - Step 39959: {'lr': 0.00019937971168654058, 'samples': 1278688, 'steps': 2497, 'loss/train': 2.4593348503112793} -09/20/2021 23:08:33 - INFO - __main__ - Step 39960: {'lr': 0.00019937971168654058, 'samples': 1278720, 'steps': 2497, 'loss/train': 2.477011203765869} -09/20/2021 23:08:34 - INFO - __main__ - Step 39961: {'lr': 0.00019937971168654058, 'samples': 1278752, 'steps': 2497, 'loss/train': 2.4096310138702393} -09/20/2021 23:08:35 - INFO - __main__ - Step 39962: {'lr': 0.00019937971168654058, 'samples': 1278784, 'steps': 2497, 'loss/train': 2.324444055557251} -09/20/2021 23:08:36 - INFO - __main__ - Step 39963: {'lr': 0.00019937971168654058, 'samples': 1278816, 'steps': 2497, 'loss/train': 1.7495967149734497} -09/20/2021 23:08:37 - INFO - __main__ - Step 39964: {'lr': 0.00019937971168654058, 'samples': 1278848, 'steps': 2497, 'loss/train': 2.3781633377075195} -09/20/2021 23:08:38 - INFO - __main__ - Step 39965: {'lr': 0.00019937971168654058, 'samples': 1278880, 'steps': 2497, 'loss/train': 1.714851975440979} -09/20/2021 23:08:38 - INFO - __main__ - Step 39966: {'lr': 0.00019937971168654058, 'samples': 1278912, 'steps': 2497, 'loss/train': 2.862948417663574} -09/20/2021 23:08:39 - INFO - __main__ - Step 39967: {'lr': 0.00019937971168654058, 'samples': 1278944, 'steps': 2497, 'loss/train': 2.2830727100372314} -09/20/2021 23:08:40 - INFO - __main__ - Step 39968: {'lr': 0.00019937971168654058, 'samples': 1278976, 'steps': 2497, 'loss/train': 1.9559611082077026} -09/20/2021 23:08:41 - INFO - __main__ - Step 39969: {'lr': 0.00019937900210112043, 'samples': 1279008, 'steps': 2498, 'loss/train': 2.4009933471679688} -09/20/2021 23:08:42 - INFO - __main__ - Step 39970: {'lr': 0.00019937900210112043, 'samples': 1279040, 'steps': 2498, 'loss/train': 2.2416131496429443} -09/20/2021 23:08:42 - INFO - __main__ - Step 39971: {'lr': 0.00019937900210112043, 'samples': 1279072, 'steps': 2498, 'loss/train': 1.727095365524292} -09/20/2021 23:08:43 - INFO - __main__ - Step 39972: {'lr': 0.00019937900210112043, 'samples': 1279104, 'steps': 2498, 'loss/train': 1.881291151046753} -09/20/2021 23:08:44 - INFO - __main__ - Step 39973: {'lr': 0.00019937900210112043, 'samples': 1279136, 'steps': 2498, 'loss/train': 1.6376526355743408} -09/20/2021 23:08:45 - INFO - __main__ - Step 39974: {'lr': 0.00019937900210112043, 'samples': 1279168, 'steps': 2498, 'loss/train': 2.029505491256714} -09/20/2021 23:08:45 - INFO - __main__ - Step 39975: {'lr': 0.00019937900210112043, 'samples': 1279200, 'steps': 2498, 'loss/train': 1.8368600606918335} -09/20/2021 23:08:46 - INFO - __main__ - Step 39976: {'lr': 0.00019937900210112043, 'samples': 1279232, 'steps': 2498, 'loss/train': 2.471083879470825} -09/20/2021 23:08:47 - INFO - __main__ - Step 39977: {'lr': 0.00019937900210112043, 'samples': 1279264, 'steps': 2498, 'loss/train': 2.4511497020721436} -09/20/2021 23:08:48 - INFO - __main__ - Step 39978: {'lr': 0.00019937900210112043, 'samples': 1279296, 'steps': 2498, 'loss/train': 1.853628396987915} -09/20/2021 23:08:48 - INFO - __main__ - Step 39979: {'lr': 0.00019937900210112043, 'samples': 1279328, 'steps': 2498, 'loss/train': 2.3574140071868896} -09/20/2021 23:08:49 - INFO - __main__ - Step 39980: {'lr': 0.00019937900210112043, 'samples': 1279360, 'steps': 2498, 'loss/train': 2.5081980228424072} -09/20/2021 23:08:50 - INFO - __main__ - Step 39981: {'lr': 0.00019937900210112043, 'samples': 1279392, 'steps': 2498, 'loss/train': 2.641465663909912} -09/20/2021 23:08:51 - INFO - __main__ - Step 39982: {'lr': 0.00019937900210112043, 'samples': 1279424, 'steps': 2498, 'loss/train': 2.0111501216888428} -09/20/2021 23:08:51 - INFO - __main__ - Step 39983: {'lr': 0.00019937900210112043, 'samples': 1279456, 'steps': 2498, 'loss/train': 2.0884909629821777} -09/20/2021 23:08:52 - INFO - __main__ - Step 39984: {'lr': 0.00019937900210112043, 'samples': 1279488, 'steps': 2498, 'loss/train': 2.025503635406494} -09/20/2021 23:08:53 - INFO - __main__ - Step 39985: {'lr': 0.0001993782921113275, 'samples': 1279520, 'steps': 2499, 'loss/train': 2.0726847648620605} -09/20/2021 23:08:54 - INFO - __main__ - Step 39986: {'lr': 0.0001993782921113275, 'samples': 1279552, 'steps': 2499, 'loss/train': 1.12956702709198} -09/20/2021 23:08:54 - INFO - __main__ - Step 39987: {'lr': 0.0001993782921113275, 'samples': 1279584, 'steps': 2499, 'loss/train': 2.1474997997283936} -09/20/2021 23:08:55 - INFO - __main__ - Step 39988: {'lr': 0.0001993782921113275, 'samples': 1279616, 'steps': 2499, 'loss/train': 0.4367499351501465} -09/20/2021 23:08:56 - INFO - __main__ - Step 39989: {'lr': 0.0001993782921113275, 'samples': 1279648, 'steps': 2499, 'loss/train': 2.8915066719055176} -09/20/2021 23:08:57 - INFO - __main__ - Step 39990: {'lr': 0.0001993782921113275, 'samples': 1279680, 'steps': 2499, 'loss/train': 1.571376919746399} -09/20/2021 23:08:57 - INFO - __main__ - Step 39991: {'lr': 0.0001993782921113275, 'samples': 1279712, 'steps': 2499, 'loss/train': 2.288905382156372} -09/20/2021 23:08:58 - INFO - __main__ - Step 39992: {'lr': 0.0001993782921113275, 'samples': 1279744, 'steps': 2499, 'loss/train': 1.6308965682983398} -09/20/2021 23:09:00 - INFO - __main__ - Step 39993: {'lr': 0.0001993782921113275, 'samples': 1279776, 'steps': 2499, 'loss/train': 2.79911732673645} -09/20/2021 23:09:00 - INFO - __main__ - Step 39994: {'lr': 0.0001993782921113275, 'samples': 1279808, 'steps': 2499, 'loss/train': 1.5622493028640747} -09/20/2021 23:09:01 - INFO - __main__ - Step 39995: {'lr': 0.0001993782921113275, 'samples': 1279840, 'steps': 2499, 'loss/train': 2.09616756439209} -09/20/2021 23:09:02 - INFO - __main__ - Step 39996: {'lr': 0.0001993782921113275, 'samples': 1279872, 'steps': 2499, 'loss/train': 2.658254623413086} -09/20/2021 23:09:03 - INFO - __main__ - Step 39997: {'lr': 0.0001993782921113275, 'samples': 1279904, 'steps': 2499, 'loss/train': 2.3399181365966797} -09/20/2021 23:09:03 - INFO - __main__ - Step 39998: {'lr': 0.0001993782921113275, 'samples': 1279936, 'steps': 2499, 'loss/train': 2.8715569972991943} -09/20/2021 23:09:04 - INFO - __main__ - Step 39999: {'lr': 0.0001993782921113275, 'samples': 1279968, 'steps': 2499, 'loss/train': 2.464667558670044} -09/20/2021 23:09:05 - INFO - __main__ - Step 40000: {'lr': 0.0001993782921113275, 'samples': 1280000, 'steps': 2499, 'loss/train': 2.133725881576538} -09/20/2021 23:09:06 - INFO - __main__ - Step 40001: {'lr': 0.00019937758171716468, 'samples': 1280032, 'steps': 2500, 'loss/train': 2.255249500274658} -09/20/2021 23:09:06 - INFO - __main__ - Step 40002: {'lr': 0.00019937758171716468, 'samples': 1280064, 'steps': 2500, 'loss/train': 2.1448304653167725} -09/20/2021 23:09:07 - INFO - __main__ - Step 40003: {'lr': 0.00019937758171716468, 'samples': 1280096, 'steps': 2500, 'loss/train': 2.4538116455078125} -09/20/2021 23:09:08 - INFO - __main__ - Step 40004: {'lr': 0.00019937758171716468, 'samples': 1280128, 'steps': 2500, 'loss/train': 2.028794765472412} -09/20/2021 23:09:09 - INFO - __main__ - Step 40005: {'lr': 0.00019937758171716468, 'samples': 1280160, 'steps': 2500, 'loss/train': 1.8255871534347534} -09/20/2021 23:09:09 - INFO - __main__ - Step 40006: {'lr': 0.00019937758171716468, 'samples': 1280192, 'steps': 2500, 'loss/train': 2.063112258911133} -09/20/2021 23:09:10 - INFO - __main__ - Step 40007: {'lr': 0.00019937758171716468, 'samples': 1280224, 'steps': 2500, 'loss/train': 1.9640063047409058} -09/20/2021 23:09:11 - INFO - __main__ - Step 40008: {'lr': 0.00019937758171716468, 'samples': 1280256, 'steps': 2500, 'loss/train': 2.6028454303741455} -09/20/2021 23:09:12 - INFO - __main__ - Step 40009: {'lr': 0.00019937758171716468, 'samples': 1280288, 'steps': 2500, 'loss/train': 1.599263310432434} -09/20/2021 23:09:13 - INFO - __main__ - Step 40010: {'lr': 0.00019937758171716468, 'samples': 1280320, 'steps': 2500, 'loss/train': 2.847653388977051} -09/20/2021 23:09:13 - INFO - __main__ - Step 40011: {'lr': 0.00019937758171716468, 'samples': 1280352, 'steps': 2500, 'loss/train': 4.23819637298584} -09/20/2021 23:09:14 - INFO - __main__ - Step 40012: {'lr': 0.00019937758171716468, 'samples': 1280384, 'steps': 2500, 'loss/train': 3.4063520431518555} -09/20/2021 23:09:15 - INFO - __main__ - Step 40013: {'lr': 0.00019937758171716468, 'samples': 1280416, 'steps': 2500, 'loss/train': 4.830731391906738} -09/20/2021 23:09:16 - INFO - __main__ - Step 40014: {'lr': 0.00019937758171716468, 'samples': 1280448, 'steps': 2500, 'loss/train': 2.630781412124634} -09/20/2021 23:09:16 - INFO - __main__ - Step 40015: {'lr': 0.00019937758171716468, 'samples': 1280480, 'steps': 2500, 'loss/train': 1.6324611902236938} -09/20/2021 23:09:17 - INFO - __main__ - Step 40016: {'lr': 0.00019937758171716468, 'samples': 1280512, 'steps': 2500, 'loss/train': 2.3261868953704834} -09/20/2021 23:09:18 - INFO - __main__ - Step 40017: {'lr': 0.00019937687091863487, 'samples': 1280544, 'steps': 2501, 'loss/train': 0.997597873210907} -09/20/2021 23:09:19 - INFO - __main__ - Step 40018: {'lr': 0.00019937687091863487, 'samples': 1280576, 'steps': 2501, 'loss/train': 2.297264575958252} -09/20/2021 23:09:19 - INFO - __main__ - Step 40019: {'lr': 0.00019937687091863487, 'samples': 1280608, 'steps': 2501, 'loss/train': 2.2152037620544434} -09/20/2021 23:09:20 - INFO - __main__ - Step 40020: {'lr': 0.00019937687091863487, 'samples': 1280640, 'steps': 2501, 'loss/train': 2.846628189086914} -09/20/2021 23:09:21 - INFO - __main__ - Step 40021: {'lr': 0.00019937687091863487, 'samples': 1280672, 'steps': 2501, 'loss/train': 0.7031786441802979} -09/20/2021 23:09:22 - INFO - __main__ - Step 40022: {'lr': 0.00019937687091863487, 'samples': 1280704, 'steps': 2501, 'loss/train': 1.9131813049316406} -09/20/2021 23:09:22 - INFO - __main__ - Step 40023: {'lr': 0.00019937687091863487, 'samples': 1280736, 'steps': 2501, 'loss/train': 1.878261923789978} -09/20/2021 23:09:24 - INFO - __main__ - Step 40024: {'lr': 0.00019937687091863487, 'samples': 1280768, 'steps': 2501, 'loss/train': 2.0366666316986084} -09/20/2021 23:09:24 - INFO - __main__ - Step 40025: {'lr': 0.00019937687091863487, 'samples': 1280800, 'steps': 2501, 'loss/train': 3.2050225734710693} -09/20/2021 23:09:25 - INFO - __main__ - Step 40026: {'lr': 0.00019937687091863487, 'samples': 1280832, 'steps': 2501, 'loss/train': 2.136902093887329} -09/20/2021 23:09:26 - INFO - __main__ - Step 40027: {'lr': 0.00019937687091863487, 'samples': 1280864, 'steps': 2501, 'loss/train': 2.308227777481079} -09/20/2021 23:09:27 - INFO - __main__ - Step 40028: {'lr': 0.00019937687091863487, 'samples': 1280896, 'steps': 2501, 'loss/train': 1.046358585357666} -09/20/2021 23:09:27 - INFO - __main__ - Step 40029: {'lr': 0.00019937687091863487, 'samples': 1280928, 'steps': 2501, 'loss/train': 1.975334644317627} -09/20/2021 23:09:28 - INFO - __main__ - Step 40030: {'lr': 0.00019937687091863487, 'samples': 1280960, 'steps': 2501, 'loss/train': 3.2922613620758057} -09/20/2021 23:09:29 - INFO - __main__ - Step 40031: {'lr': 0.00019937687091863487, 'samples': 1280992, 'steps': 2501, 'loss/train': 0.5230856537818909} -09/20/2021 23:09:30 - INFO - __main__ - Step 40032: {'lr': 0.00019937687091863487, 'samples': 1281024, 'steps': 2501, 'loss/train': 1.9560246467590332} -09/20/2021 23:09:31 - INFO - __main__ - Step 40033: {'lr': 0.00019937615971574095, 'samples': 1281056, 'steps': 2502, 'loss/train': 1.7662545442581177} -09/20/2021 23:09:31 - INFO - __main__ - Step 40034: {'lr': 0.00019937615971574095, 'samples': 1281088, 'steps': 2502, 'loss/train': 2.354123592376709} -09/20/2021 23:09:32 - INFO - __main__ - Step 40035: {'lr': 0.00019937615971574095, 'samples': 1281120, 'steps': 2502, 'loss/train': 1.116952657699585} -09/20/2021 23:09:33 - INFO - __main__ - Step 40036: {'lr': 0.00019937615971574095, 'samples': 1281152, 'steps': 2502, 'loss/train': 2.961538791656494} -09/20/2021 23:09:34 - INFO - __main__ - Step 40037: {'lr': 0.00019937615971574095, 'samples': 1281184, 'steps': 2502, 'loss/train': 2.6757631301879883} -09/20/2021 23:09:34 - INFO - __main__ - Step 40038: {'lr': 0.00019937615971574095, 'samples': 1281216, 'steps': 2502, 'loss/train': 2.203500509262085} -09/20/2021 23:09:35 - INFO - __main__ - Step 40039: {'lr': 0.00019937615971574095, 'samples': 1281248, 'steps': 2502, 'loss/train': 1.6906853914260864} -09/20/2021 23:09:36 - INFO - __main__ - Step 40040: {'lr': 0.00019937615971574095, 'samples': 1281280, 'steps': 2502, 'loss/train': 1.8579024076461792} -09/20/2021 23:09:37 - INFO - __main__ - Step 40041: {'lr': 0.00019937615971574095, 'samples': 1281312, 'steps': 2502, 'loss/train': 2.0549821853637695} -09/20/2021 23:09:37 - INFO - __main__ - Step 40042: {'lr': 0.00019937615971574095, 'samples': 1281344, 'steps': 2502, 'loss/train': 0.43317052721977234} -09/20/2021 23:09:38 - INFO - __main__ - Step 40043: {'lr': 0.00019937615971574095, 'samples': 1281376, 'steps': 2502, 'loss/train': 2.5426647663116455} -09/20/2021 23:09:39 - INFO - __main__ - Step 40044: {'lr': 0.00019937615971574095, 'samples': 1281408, 'steps': 2502, 'loss/train': 2.113816738128662} -09/20/2021 23:09:40 - INFO - __main__ - Step 40045: {'lr': 0.00019937615971574095, 'samples': 1281440, 'steps': 2502, 'loss/train': 1.365520715713501} -09/20/2021 23:09:40 - INFO - __main__ - Step 40046: {'lr': 0.00019937615971574095, 'samples': 1281472, 'steps': 2502, 'loss/train': 1.245923399925232} -09/20/2021 23:09:41 - INFO - __main__ - Step 40047: {'lr': 0.00019937615971574095, 'samples': 1281504, 'steps': 2502, 'loss/train': 2.322845458984375} -09/20/2021 23:09:42 - INFO - __main__ - Step 40048: {'lr': 0.00019937615971574095, 'samples': 1281536, 'steps': 2502, 'loss/train': 1.7972142696380615} -09/20/2021 23:09:43 - INFO - __main__ - Step 40049: {'lr': 0.00019937544810848582, 'samples': 1281568, 'steps': 2503, 'loss/train': 1.0015108585357666} -09/20/2021 23:09:43 - INFO - __main__ - Step 40050: {'lr': 0.00019937544810848582, 'samples': 1281600, 'steps': 2503, 'loss/train': 1.9408031702041626} -09/20/2021 23:09:44 - INFO - __main__ - Step 40051: {'lr': 0.00019937544810848582, 'samples': 1281632, 'steps': 2503, 'loss/train': 2.3739428520202637} -09/20/2021 23:09:45 - INFO - __main__ - Step 40052: {'lr': 0.00019937544810848582, 'samples': 1281664, 'steps': 2503, 'loss/train': 1.5606441497802734} -09/20/2021 23:09:46 - INFO - __main__ - Step 40053: {'lr': 0.00019937544810848582, 'samples': 1281696, 'steps': 2503, 'loss/train': 0.26029422879219055} -09/20/2021 23:09:46 - INFO - __main__ - Step 40054: {'lr': 0.00019937544810848582, 'samples': 1281728, 'steps': 2503, 'loss/train': 2.122877597808838} -09/20/2021 23:09:48 - INFO - __main__ - Step 40055: {'lr': 0.00019937544810848582, 'samples': 1281760, 'steps': 2503, 'loss/train': 2.579770565032959} -09/20/2021 23:09:49 - INFO - __main__ - Step 40056: {'lr': 0.00019937544810848582, 'samples': 1281792, 'steps': 2503, 'loss/train': 2.2029905319213867} -09/20/2021 23:09:49 - INFO - __main__ - Step 40057: {'lr': 0.00019937544810848582, 'samples': 1281824, 'steps': 2503, 'loss/train': 1.7053766250610352} -09/20/2021 23:09:50 - INFO - __main__ - Step 40058: {'lr': 0.00019937544810848582, 'samples': 1281856, 'steps': 2503, 'loss/train': 2.48905086517334} -09/20/2021 23:09:51 - INFO - __main__ - Step 40059: {'lr': 0.00019937544810848582, 'samples': 1281888, 'steps': 2503, 'loss/train': 2.2973220348358154} -09/20/2021 23:09:52 - INFO - __main__ - Step 40060: {'lr': 0.00019937544810848582, 'samples': 1281920, 'steps': 2503, 'loss/train': 2.318103551864624} -09/20/2021 23:09:52 - INFO - __main__ - Step 40061: {'lr': 0.00019937544810848582, 'samples': 1281952, 'steps': 2503, 'loss/train': 2.068430185317993} -09/20/2021 23:09:53 - INFO - __main__ - Step 40062: {'lr': 0.00019937544810848582, 'samples': 1281984, 'steps': 2503, 'loss/train': 2.1307857036590576} -09/20/2021 23:09:54 - INFO - __main__ - Step 40063: {'lr': 0.00019937544810848582, 'samples': 1282016, 'steps': 2503, 'loss/train': 1.0567049980163574} -09/20/2021 23:09:55 - INFO - __main__ - Step 40064: {'lr': 0.00019937544810848582, 'samples': 1282048, 'steps': 2503, 'loss/train': 1.9983623027801514} -09/20/2021 23:09:55 - INFO - __main__ - Step 40065: {'lr': 0.0001993747360968724, 'samples': 1282080, 'steps': 2504, 'loss/train': 2.759326696395874} -09/20/2021 23:09:56 - INFO - __main__ - Step 40066: {'lr': 0.0001993747360968724, 'samples': 1282112, 'steps': 2504, 'loss/train': 2.687082290649414} -09/20/2021 23:09:57 - INFO - __main__ - Step 40067: {'lr': 0.0001993747360968724, 'samples': 1282144, 'steps': 2504, 'loss/train': 1.2056946754455566} -09/20/2021 23:09:58 - INFO - __main__ - Step 40068: {'lr': 0.0001993747360968724, 'samples': 1282176, 'steps': 2504, 'loss/train': 0.9816656708717346} -09/20/2021 23:09:58 - INFO - __main__ - Step 40069: {'lr': 0.0001993747360968724, 'samples': 1282208, 'steps': 2504, 'loss/train': 2.5147783756256104} -09/20/2021 23:09:59 - INFO - __main__ - Step 40070: {'lr': 0.0001993747360968724, 'samples': 1282240, 'steps': 2504, 'loss/train': 2.5617921352386475} -09/20/2021 23:10:00 - INFO - __main__ - Step 40071: {'lr': 0.0001993747360968724, 'samples': 1282272, 'steps': 2504, 'loss/train': 2.377277135848999} -09/20/2021 23:10:01 - INFO - __main__ - Step 40072: {'lr': 0.0001993747360968724, 'samples': 1282304, 'steps': 2504, 'loss/train': 2.2949328422546387} -09/20/2021 23:10:01 - INFO - __main__ - Step 40073: {'lr': 0.0001993747360968724, 'samples': 1282336, 'steps': 2504, 'loss/train': 1.4183331727981567} -09/20/2021 23:10:02 - INFO - __main__ - Step 40074: {'lr': 0.0001993747360968724, 'samples': 1282368, 'steps': 2504, 'loss/train': 1.742848515510559} -09/20/2021 23:10:03 - INFO - __main__ - Step 40075: {'lr': 0.0001993747360968724, 'samples': 1282400, 'steps': 2504, 'loss/train': 1.3374019861221313} -09/20/2021 23:10:04 - INFO - __main__ - Step 40076: {'lr': 0.0001993747360968724, 'samples': 1282432, 'steps': 2504, 'loss/train': 1.6796778440475464} -09/20/2021 23:10:04 - INFO - __main__ - Step 40077: {'lr': 0.0001993747360968724, 'samples': 1282464, 'steps': 2504, 'loss/train': 1.2742350101470947} -09/20/2021 23:10:05 - INFO - __main__ - Step 40078: {'lr': 0.0001993747360968724, 'samples': 1282496, 'steps': 2504, 'loss/train': 2.3159022331237793} -09/20/2021 23:10:06 - INFO - __main__ - Step 40079: {'lr': 0.0001993747360968724, 'samples': 1282528, 'steps': 2504, 'loss/train': 1.6917271614074707} -09/20/2021 23:10:07 - INFO - __main__ - Step 40080: {'lr': 0.0001993747360968724, 'samples': 1282560, 'steps': 2504, 'loss/train': 1.3783396482467651} -09/20/2021 23:10:08 - INFO - __main__ - Step 40081: {'lr': 0.00019937402368090353, 'samples': 1282592, 'steps': 2505, 'loss/train': 2.3483550548553467} -09/20/2021 23:10:08 - INFO - __main__ - Step 40082: {'lr': 0.00019937402368090353, 'samples': 1282624, 'steps': 2505, 'loss/train': 2.7772696018218994} -09/20/2021 23:10:09 - INFO - __main__ - Step 40083: {'lr': 0.00019937402368090353, 'samples': 1282656, 'steps': 2505, 'loss/train': 2.3239331245422363} -09/20/2021 23:10:10 - INFO - __main__ - Step 40084: {'lr': 0.00019937402368090353, 'samples': 1282688, 'steps': 2505, 'loss/train': 1.0112274885177612} -09/20/2021 23:10:11 - INFO - __main__ - Step 40085: {'lr': 0.00019937402368090353, 'samples': 1282720, 'steps': 2505, 'loss/train': 2.5795230865478516} -09/20/2021 23:10:11 - INFO - __main__ - Step 40086: {'lr': 0.00019937402368090353, 'samples': 1282752, 'steps': 2505, 'loss/train': 2.814929723739624} -09/20/2021 23:10:13 - INFO - __main__ - Step 40087: {'lr': 0.00019937402368090353, 'samples': 1282784, 'steps': 2505, 'loss/train': 1.4086930751800537} -09/20/2021 23:10:13 - INFO - __main__ - Step 40088: {'lr': 0.00019937402368090353, 'samples': 1282816, 'steps': 2505, 'loss/train': 1.7037742137908936} -09/20/2021 23:10:14 - INFO - __main__ - Step 40089: {'lr': 0.00019937402368090353, 'samples': 1282848, 'steps': 2505, 'loss/train': 1.9784291982650757} -09/20/2021 23:10:15 - INFO - __main__ - Step 40090: {'lr': 0.00019937402368090353, 'samples': 1282880, 'steps': 2505, 'loss/train': 1.4533073902130127} -09/20/2021 23:10:16 - INFO - __main__ - Step 40091: {'lr': 0.00019937402368090353, 'samples': 1282912, 'steps': 2505, 'loss/train': 2.146369457244873} -09/20/2021 23:10:16 - INFO - __main__ - Step 40092: {'lr': 0.00019937402368090353, 'samples': 1282944, 'steps': 2505, 'loss/train': 2.76759934425354} -09/20/2021 23:10:17 - INFO - __main__ - Step 40093: {'lr': 0.00019937402368090353, 'samples': 1282976, 'steps': 2505, 'loss/train': 2.300318956375122} -09/20/2021 23:10:18 - INFO - __main__ - Step 40094: {'lr': 0.00019937402368090353, 'samples': 1283008, 'steps': 2505, 'loss/train': 2.1312670707702637} -09/20/2021 23:10:19 - INFO - __main__ - Step 40095: {'lr': 0.00019937402368090353, 'samples': 1283040, 'steps': 2505, 'loss/train': 2.033639430999756} -09/20/2021 23:10:19 - INFO - __main__ - Step 40096: {'lr': 0.00019937402368090353, 'samples': 1283072, 'steps': 2505, 'loss/train': 2.0622801780700684} -09/20/2021 23:10:20 - INFO - __main__ - Step 40097: {'lr': 0.0001993733108605822, 'samples': 1283104, 'steps': 2506, 'loss/train': 4.327191352844238} -09/20/2021 23:10:21 - INFO - __main__ - Step 40098: {'lr': 0.0001993733108605822, 'samples': 1283136, 'steps': 2506, 'loss/train': 1.6018176078796387} -09/20/2021 23:10:22 - INFO - __main__ - Step 40099: {'lr': 0.0001993733108605822, 'samples': 1283168, 'steps': 2506, 'loss/train': 1.8282040357589722} -09/20/2021 23:10:23 - INFO - __main__ - Step 40100: {'lr': 0.0001993733108605822, 'samples': 1283200, 'steps': 2506, 'loss/train': 2.35817813873291} -09/20/2021 23:10:23 - INFO - __main__ - Step 40101: {'lr': 0.0001993733108605822, 'samples': 1283232, 'steps': 2506, 'loss/train': 2.0379743576049805} -09/20/2021 23:10:24 - INFO - __main__ - Step 40102: {'lr': 0.0001993733108605822, 'samples': 1283264, 'steps': 2506, 'loss/train': 3.5473666191101074} -09/20/2021 23:10:25 - INFO - __main__ - Step 40103: {'lr': 0.0001993733108605822, 'samples': 1283296, 'steps': 2506, 'loss/train': 1.9446231126785278} -09/20/2021 23:10:26 - INFO - __main__ - Step 40104: {'lr': 0.0001993733108605822, 'samples': 1283328, 'steps': 2506, 'loss/train': 0.23968635499477386} -09/20/2021 23:10:26 - INFO - __main__ - Step 40105: {'lr': 0.0001993733108605822, 'samples': 1283360, 'steps': 2506, 'loss/train': 2.0760812759399414} -09/20/2021 23:10:27 - INFO - __main__ - Step 40106: {'lr': 0.0001993733108605822, 'samples': 1283392, 'steps': 2506, 'loss/train': 1.7717514038085938} -09/20/2021 23:10:28 - INFO - __main__ - Step 40107: {'lr': 0.0001993733108605822, 'samples': 1283424, 'steps': 2506, 'loss/train': 2.217914581298828} -09/20/2021 23:10:29 - INFO - __main__ - Step 40108: {'lr': 0.0001993733108605822, 'samples': 1283456, 'steps': 2506, 'loss/train': 0.2194453626871109} -09/20/2021 23:10:29 - INFO - __main__ - Step 40109: {'lr': 0.0001993733108605822, 'samples': 1283488, 'steps': 2506, 'loss/train': 2.254303216934204} -09/20/2021 23:10:30 - INFO - __main__ - Step 40110: {'lr': 0.0001993733108605822, 'samples': 1283520, 'steps': 2506, 'loss/train': 2.380462408065796} -09/20/2021 23:10:31 - INFO - __main__ - Step 40111: {'lr': 0.0001993733108605822, 'samples': 1283552, 'steps': 2506, 'loss/train': 1.7111910581588745} -09/20/2021 23:10:32 - INFO - __main__ - Step 40112: {'lr': 0.0001993733108605822, 'samples': 1283584, 'steps': 2506, 'loss/train': 1.4281560182571411} -09/20/2021 23:10:32 - INFO - __main__ - Step 40113: {'lr': 0.0001993725976359112, 'samples': 1283616, 'steps': 2507, 'loss/train': 2.5490403175354004} -09/20/2021 23:10:33 - INFO - __main__ - Step 40114: {'lr': 0.0001993725976359112, 'samples': 1283648, 'steps': 2507, 'loss/train': 2.5461618900299072} -09/20/2021 23:10:34 - INFO - __main__ - Step 40115: {'lr': 0.0001993725976359112, 'samples': 1283680, 'steps': 2507, 'loss/train': 1.0777761936187744} -09/20/2021 23:10:35 - INFO - __main__ - Step 40116: {'lr': 0.0001993725976359112, 'samples': 1283712, 'steps': 2507, 'loss/train': 0.16319285333156586} -09/20/2021 23:10:35 - INFO - __main__ - Step 40117: {'lr': 0.0001993725976359112, 'samples': 1283744, 'steps': 2507, 'loss/train': 0.19806382060050964} -09/20/2021 23:10:37 - INFO - __main__ - Step 40118: {'lr': 0.0001993725976359112, 'samples': 1283776, 'steps': 2507, 'loss/train': 0.42593783140182495} -09/20/2021 23:10:37 - INFO - __main__ - Step 40119: {'lr': 0.0001993725976359112, 'samples': 1283808, 'steps': 2507, 'loss/train': 1.9734623432159424} -09/20/2021 23:10:38 - INFO - __main__ - Step 40120: {'lr': 0.0001993725976359112, 'samples': 1283840, 'steps': 2507, 'loss/train': 1.7802335023880005} -09/20/2021 23:10:39 - INFO - __main__ - Step 40121: {'lr': 0.0001993725976359112, 'samples': 1283872, 'steps': 2507, 'loss/train': 2.2155416011810303} -09/20/2021 23:10:40 - INFO - __main__ - Step 40122: {'lr': 0.0001993725976359112, 'samples': 1283904, 'steps': 2507, 'loss/train': 1.0194146633148193} -09/20/2021 23:10:40 - INFO - __main__ - Step 40123: {'lr': 0.0001993725976359112, 'samples': 1283936, 'steps': 2507, 'loss/train': 2.1410961151123047} -09/20/2021 23:10:41 - INFO - __main__ - Step 40124: {'lr': 0.0001993725976359112, 'samples': 1283968, 'steps': 2507, 'loss/train': 2.5084280967712402} -09/20/2021 23:10:42 - INFO - __main__ - Step 40125: {'lr': 0.0001993725976359112, 'samples': 1284000, 'steps': 2507, 'loss/train': 2.805968999862671} -09/20/2021 23:10:43 - INFO - __main__ - Step 40126: {'lr': 0.0001993725976359112, 'samples': 1284032, 'steps': 2507, 'loss/train': 2.5854763984680176} -09/20/2021 23:10:43 - INFO - __main__ - Step 40127: {'lr': 0.0001993725976359112, 'samples': 1284064, 'steps': 2507, 'loss/train': 2.3137316703796387} -09/20/2021 23:10:44 - INFO - __main__ - Step 40128: {'lr': 0.0001993725976359112, 'samples': 1284096, 'steps': 2507, 'loss/train': 2.6793031692504883} -09/20/2021 23:10:45 - INFO - __main__ - Step 40129: {'lr': 0.0001993718840068935, 'samples': 1284128, 'steps': 2508, 'loss/train': 2.467000722885132} -09/20/2021 23:10:46 - INFO - __main__ - Step 40130: {'lr': 0.0001993718840068935, 'samples': 1284160, 'steps': 2508, 'loss/train': 2.264549970626831} -09/20/2021 23:10:47 - INFO - __main__ - Step 40131: {'lr': 0.0001993718840068935, 'samples': 1284192, 'steps': 2508, 'loss/train': 2.1811270713806152} -09/20/2021 23:10:47 - INFO - __main__ - Step 40132: {'lr': 0.0001993718840068935, 'samples': 1284224, 'steps': 2508, 'loss/train': 1.537100076675415} -09/20/2021 23:10:48 - INFO - __main__ - Step 40133: {'lr': 0.0001993718840068935, 'samples': 1284256, 'steps': 2508, 'loss/train': 0.5650275349617004} -09/20/2021 23:10:49 - INFO - __main__ - Step 40134: {'lr': 0.0001993718840068935, 'samples': 1284288, 'steps': 2508, 'loss/train': 1.836038589477539} -09/20/2021 23:10:50 - INFO - __main__ - Step 40135: {'lr': 0.0001993718840068935, 'samples': 1284320, 'steps': 2508, 'loss/train': 1.8146437406539917} -09/20/2021 23:10:50 - INFO - __main__ - Step 40136: {'lr': 0.0001993718840068935, 'samples': 1284352, 'steps': 2508, 'loss/train': 2.094040632247925} -09/20/2021 23:10:51 - INFO - __main__ - Step 40137: {'lr': 0.0001993718840068935, 'samples': 1284384, 'steps': 2508, 'loss/train': 3.1671931743621826} -09/20/2021 23:10:52 - INFO - __main__ - Step 40138: {'lr': 0.0001993718840068935, 'samples': 1284416, 'steps': 2508, 'loss/train': 1.9633467197418213} -09/20/2021 23:10:53 - INFO - __main__ - Step 40139: {'lr': 0.0001993718840068935, 'samples': 1284448, 'steps': 2508, 'loss/train': 2.727698564529419} -09/20/2021 23:10:53 - INFO - __main__ - Step 40140: {'lr': 0.0001993718840068935, 'samples': 1284480, 'steps': 2508, 'loss/train': 1.9935256242752075} -09/20/2021 23:10:54 - INFO - __main__ - Step 40141: {'lr': 0.0001993718840068935, 'samples': 1284512, 'steps': 2508, 'loss/train': 2.120349407196045} -09/20/2021 23:10:55 - INFO - __main__ - Step 40142: {'lr': 0.0001993718840068935, 'samples': 1284544, 'steps': 2508, 'loss/train': 2.428126573562622} -09/20/2021 23:10:56 - INFO - __main__ - Step 40143: {'lr': 0.0001993718840068935, 'samples': 1284576, 'steps': 2508, 'loss/train': 2.080317497253418} -09/20/2021 23:10:56 - INFO - __main__ - Step 40144: {'lr': 0.0001993718840068935, 'samples': 1284608, 'steps': 2508, 'loss/train': 2.1277804374694824} -09/20/2021 23:10:57 - INFO - __main__ - Step 40145: {'lr': 0.000199371169973532, 'samples': 1284640, 'steps': 2509, 'loss/train': 2.7093753814697266} -09/20/2021 23:10:58 - INFO - __main__ - Step 40146: {'lr': 0.000199371169973532, 'samples': 1284672, 'steps': 2509, 'loss/train': 1.9858371019363403} -09/20/2021 23:10:59 - INFO - __main__ - Step 40147: {'lr': 0.000199371169973532, 'samples': 1284704, 'steps': 2509, 'loss/train': 1.9995962381362915} -09/20/2021 23:10:59 - INFO - __main__ - Step 40148: {'lr': 0.000199371169973532, 'samples': 1284736, 'steps': 2509, 'loss/train': 2.3094699382781982} -09/20/2021 23:11:01 - INFO - __main__ - Step 40149: {'lr': 0.000199371169973532, 'samples': 1284768, 'steps': 2509, 'loss/train': 5.855759143829346} -09/20/2021 23:11:02 - INFO - __main__ - Step 40150: {'lr': 0.000199371169973532, 'samples': 1284800, 'steps': 2509, 'loss/train': 1.9891119003295898} -09/20/2021 23:11:03 - INFO - __main__ - Step 40151: {'lr': 0.000199371169973532, 'samples': 1284832, 'steps': 2509, 'loss/train': 2.3876171112060547} -09/20/2021 23:11:04 - INFO - __main__ - Step 40152: {'lr': 0.000199371169973532, 'samples': 1284864, 'steps': 2509, 'loss/train': 2.295644998550415} -09/20/2021 23:11:04 - INFO - __main__ - Step 40153: {'lr': 0.000199371169973532, 'samples': 1284896, 'steps': 2509, 'loss/train': 2.751370429992676} -09/20/2021 23:11:05 - INFO - __main__ - Step 40154: {'lr': 0.000199371169973532, 'samples': 1284928, 'steps': 2509, 'loss/train': 2.0825159549713135} -09/20/2021 23:11:06 - INFO - __main__ - Step 40155: {'lr': 0.000199371169973532, 'samples': 1284960, 'steps': 2509, 'loss/train': 1.063521385192871} -09/20/2021 23:11:07 - INFO - __main__ - Step 40156: {'lr': 0.000199371169973532, 'samples': 1284992, 'steps': 2509, 'loss/train': 2.310999870300293} -09/20/2021 23:11:07 - INFO - __main__ - Step 40157: {'lr': 0.000199371169973532, 'samples': 1285024, 'steps': 2509, 'loss/train': 1.8876228332519531} -09/20/2021 23:11:08 - INFO - __main__ - Step 40158: {'lr': 0.000199371169973532, 'samples': 1285056, 'steps': 2509, 'loss/train': 1.8481194972991943} -09/20/2021 23:11:09 - INFO - __main__ - Step 40159: {'lr': 0.000199371169973532, 'samples': 1285088, 'steps': 2509, 'loss/train': 2.016657590866089} -09/20/2021 23:11:10 - INFO - __main__ - Step 40160: {'lr': 0.000199371169973532, 'samples': 1285120, 'steps': 2509, 'loss/train': 1.3028868436813354} -09/20/2021 23:11:10 - INFO - __main__ - Step 40161: {'lr': 0.0001993704555358296, 'samples': 1285152, 'steps': 2510, 'loss/train': 1.7111358642578125} -09/20/2021 23:11:11 - INFO - __main__ - Step 40162: {'lr': 0.0001993704555358296, 'samples': 1285184, 'steps': 2510, 'loss/train': 2.3867886066436768} -09/20/2021 23:11:12 - INFO - __main__ - Step 40163: {'lr': 0.0001993704555358296, 'samples': 1285216, 'steps': 2510, 'loss/train': 1.5125280618667603} -09/20/2021 23:11:13 - INFO - __main__ - Step 40164: {'lr': 0.0001993704555358296, 'samples': 1285248, 'steps': 2510, 'loss/train': 2.346768856048584} -09/20/2021 23:11:13 - INFO - __main__ - Step 40165: {'lr': 0.0001993704555358296, 'samples': 1285280, 'steps': 2510, 'loss/train': 2.039762258529663} -09/20/2021 23:11:14 - INFO - __main__ - Step 40166: {'lr': 0.0001993704555358296, 'samples': 1285312, 'steps': 2510, 'loss/train': 2.5047056674957275} -09/20/2021 23:11:15 - INFO - __main__ - Step 40167: {'lr': 0.0001993704555358296, 'samples': 1285344, 'steps': 2510, 'loss/train': 2.428992748260498} -09/20/2021 23:11:16 - INFO - __main__ - Step 40168: {'lr': 0.0001993704555358296, 'samples': 1285376, 'steps': 2510, 'loss/train': 2.296881914138794} -09/20/2021 23:11:16 - INFO - __main__ - Step 40169: {'lr': 0.0001993704555358296, 'samples': 1285408, 'steps': 2510, 'loss/train': 2.8847744464874268} -09/20/2021 23:11:17 - INFO - __main__ - Step 40170: {'lr': 0.0001993704555358296, 'samples': 1285440, 'steps': 2510, 'loss/train': 1.6231086254119873} -09/20/2021 23:11:18 - INFO - __main__ - Step 40171: {'lr': 0.0001993704555358296, 'samples': 1285472, 'steps': 2510, 'loss/train': 2.3001959323883057} -09/20/2021 23:11:19 - INFO - __main__ - Step 40172: {'lr': 0.0001993704555358296, 'samples': 1285504, 'steps': 2510, 'loss/train': 2.975132942199707} -09/20/2021 23:11:19 - INFO - __main__ - Step 40173: {'lr': 0.0001993704555358296, 'samples': 1285536, 'steps': 2510, 'loss/train': 2.623448610305786} -09/20/2021 23:11:20 - INFO - __main__ - Step 40174: {'lr': 0.0001993704555358296, 'samples': 1285568, 'steps': 2510, 'loss/train': 1.1152722835540771} -09/20/2021 23:11:21 - INFO - __main__ - Step 40175: {'lr': 0.0001993704555358296, 'samples': 1285600, 'steps': 2510, 'loss/train': 0.8435882925987244} -09/20/2021 23:11:22 - INFO - __main__ - Step 40176: {'lr': 0.0001993704555358296, 'samples': 1285632, 'steps': 2510, 'loss/train': 0.7912894487380981} -09/20/2021 23:11:23 - INFO - __main__ - Step 40177: {'lr': 0.0001993697406937892, 'samples': 1285664, 'steps': 2511, 'loss/train': 3.076375961303711} -09/20/2021 23:11:23 - INFO - __main__ - Step 40178: {'lr': 0.0001993697406937892, 'samples': 1285696, 'steps': 2511, 'loss/train': 2.3626224994659424} -09/20/2021 23:11:24 - INFO - __main__ - Step 40179: {'lr': 0.0001993697406937892, 'samples': 1285728, 'steps': 2511, 'loss/train': 2.107391834259033} -09/20/2021 23:11:26 - INFO - __main__ - Step 40180: {'lr': 0.0001993697406937892, 'samples': 1285760, 'steps': 2511, 'loss/train': 1.8726578950881958} -09/20/2021 23:11:27 - INFO - __main__ - Step 40181: {'lr': 0.0001993697406937892, 'samples': 1285792, 'steps': 2511, 'loss/train': 0.539743185043335} -09/20/2021 23:11:27 - INFO - __main__ - Step 40182: {'lr': 0.0001993697406937892, 'samples': 1285824, 'steps': 2511, 'loss/train': 1.7516690492630005} -09/20/2021 23:11:28 - INFO - __main__ - Step 40183: {'lr': 0.0001993697406937892, 'samples': 1285856, 'steps': 2511, 'loss/train': 2.373018503189087} -09/20/2021 23:11:29 - INFO - __main__ - Step 40184: {'lr': 0.0001993697406937892, 'samples': 1285888, 'steps': 2511, 'loss/train': 2.351562023162842} -09/20/2021 23:11:30 - INFO - __main__ - Step 40185: {'lr': 0.0001993697406937892, 'samples': 1285920, 'steps': 2511, 'loss/train': 2.2471065521240234} -09/20/2021 23:11:30 - INFO - __main__ - Step 40186: {'lr': 0.0001993697406937892, 'samples': 1285952, 'steps': 2511, 'loss/train': 1.9992344379425049} -09/20/2021 23:11:31 - INFO - __main__ - Step 40187: {'lr': 0.0001993697406937892, 'samples': 1285984, 'steps': 2511, 'loss/train': 2.9032578468322754} -09/20/2021 23:11:32 - INFO - __main__ - Step 40188: {'lr': 0.0001993697406937892, 'samples': 1286016, 'steps': 2511, 'loss/train': 2.4704322814941406} -09/20/2021 23:11:33 - INFO - __main__ - Step 40189: {'lr': 0.0001993697406937892, 'samples': 1286048, 'steps': 2511, 'loss/train': 0.5926526784896851} -09/20/2021 23:11:33 - INFO - __main__ - Step 40190: {'lr': 0.0001993697406937892, 'samples': 1286080, 'steps': 2511, 'loss/train': 0.3616897761821747} -09/20/2021 23:11:34 - INFO - __main__ - Step 40191: {'lr': 0.0001993697406937892, 'samples': 1286112, 'steps': 2511, 'loss/train': 0.16167135536670685} -09/20/2021 23:11:35 - INFO - __main__ - Step 40192: {'lr': 0.0001993697406937892, 'samples': 1286144, 'steps': 2511, 'loss/train': 0.47260311245918274} -09/20/2021 23:11:36 - INFO - __main__ - Step 40193: {'lr': 0.0001993690254474137, 'samples': 1286176, 'steps': 2512, 'loss/train': 0.2699308693408966} -09/20/2021 23:11:36 - INFO - __main__ - Step 40194: {'lr': 0.0001993690254474137, 'samples': 1286208, 'steps': 2512, 'loss/train': 0.3426731526851654} -09/20/2021 23:11:37 - INFO - __main__ - Step 40195: {'lr': 0.0001993690254474137, 'samples': 1286240, 'steps': 2512, 'loss/train': 2.3693461418151855} -09/20/2021 23:11:38 - INFO - __main__ - Step 40196: {'lr': 0.0001993690254474137, 'samples': 1286272, 'steps': 2512, 'loss/train': 2.5951685905456543} -09/20/2021 23:11:39 - INFO - __main__ - Step 40197: {'lr': 0.0001993690254474137, 'samples': 1286304, 'steps': 2512, 'loss/train': 2.444307327270508} -09/20/2021 23:11:39 - INFO - __main__ - Step 40198: {'lr': 0.0001993690254474137, 'samples': 1286336, 'steps': 2512, 'loss/train': 1.8115801811218262} -09/20/2021 23:11:40 - INFO - __main__ - Step 40199: {'lr': 0.0001993690254474137, 'samples': 1286368, 'steps': 2512, 'loss/train': 0.7965479493141174} -09/20/2021 23:11:41 - INFO - __main__ - Step 40200: {'lr': 0.0001993690254474137, 'samples': 1286400, 'steps': 2512, 'loss/train': 2.935246467590332} -09/20/2021 23:11:42 - INFO - __main__ - Step 40201: {'lr': 0.0001993690254474137, 'samples': 1286432, 'steps': 2512, 'loss/train': 0.781157374382019} -09/20/2021 23:11:42 - INFO - __main__ - Step 40202: {'lr': 0.0001993690254474137, 'samples': 1286464, 'steps': 2512, 'loss/train': 1.5914945602416992} -09/20/2021 23:11:43 - INFO - __main__ - Step 40203: {'lr': 0.0001993690254474137, 'samples': 1286496, 'steps': 2512, 'loss/train': 2.0713040828704834} -09/20/2021 23:11:44 - INFO - __main__ - Step 40204: {'lr': 0.0001993690254474137, 'samples': 1286528, 'steps': 2512, 'loss/train': 1.9380165338516235} -09/20/2021 23:11:45 - INFO - __main__ - Step 40205: {'lr': 0.0001993690254474137, 'samples': 1286560, 'steps': 2512, 'loss/train': 2.977811813354492} -09/20/2021 23:11:45 - INFO - __main__ - Step 40206: {'lr': 0.0001993690254474137, 'samples': 1286592, 'steps': 2512, 'loss/train': 2.144639015197754} -09/20/2021 23:11:46 - INFO - __main__ - Step 40207: {'lr': 0.0001993690254474137, 'samples': 1286624, 'steps': 2512, 'loss/train': 0.7925243377685547} -09/20/2021 23:11:47 - INFO - __main__ - Step 40208: {'lr': 0.0001993690254474137, 'samples': 1286656, 'steps': 2512, 'loss/train': 0.9219818711280823} -09/20/2021 23:11:48 - INFO - __main__ - Step 40209: {'lr': 0.000199368309796706, 'samples': 1286688, 'steps': 2513, 'loss/train': 1.9120556116104126} -09/20/2021 23:11:49 - INFO - __main__ - Step 40210: {'lr': 0.000199368309796706, 'samples': 1286720, 'steps': 2513, 'loss/train': 2.56998610496521} -09/20/2021 23:11:49 - INFO - __main__ - Step 40211: {'lr': 0.000199368309796706, 'samples': 1286752, 'steps': 2513, 'loss/train': 3.2339494228363037} -09/20/2021 23:11:51 - INFO - __main__ - Step 40212: {'lr': 0.000199368309796706, 'samples': 1286784, 'steps': 2513, 'loss/train': 1.3383411169052124} -09/20/2021 23:11:51 - INFO - __main__ - Step 40213: {'lr': 0.000199368309796706, 'samples': 1286816, 'steps': 2513, 'loss/train': 2.26493501663208} -09/20/2021 23:11:52 - INFO - __main__ - Step 40214: {'lr': 0.000199368309796706, 'samples': 1286848, 'steps': 2513, 'loss/train': 2.3878815174102783} -09/20/2021 23:11:53 - INFO - __main__ - Step 40215: {'lr': 0.000199368309796706, 'samples': 1286880, 'steps': 2513, 'loss/train': 1.9061917066574097} -09/20/2021 23:11:54 - INFO - __main__ - Step 40216: {'lr': 0.000199368309796706, 'samples': 1286912, 'steps': 2513, 'loss/train': 2.0510551929473877} -09/20/2021 23:11:54 - INFO - __main__ - Step 40217: {'lr': 0.000199368309796706, 'samples': 1286944, 'steps': 2513, 'loss/train': 3.0678746700286865} -09/20/2021 23:11:55 - INFO - __main__ - Step 40218: {'lr': 0.000199368309796706, 'samples': 1286976, 'steps': 2513, 'loss/train': 2.168760299682617} -09/20/2021 23:11:56 - INFO - __main__ - Step 40219: {'lr': 0.000199368309796706, 'samples': 1287008, 'steps': 2513, 'loss/train': 2.428586006164551} -09/20/2021 23:11:57 - INFO - __main__ - Step 40220: {'lr': 0.000199368309796706, 'samples': 1287040, 'steps': 2513, 'loss/train': 2.7091331481933594} -09/20/2021 23:11:57 - INFO - __main__ - Step 40221: {'lr': 0.000199368309796706, 'samples': 1287072, 'steps': 2513, 'loss/train': 1.9305721521377563} -09/20/2021 23:11:58 - INFO - __main__ - Step 40222: {'lr': 0.000199368309796706, 'samples': 1287104, 'steps': 2513, 'loss/train': 2.5838847160339355} -09/20/2021 23:11:59 - INFO - __main__ - Step 40223: {'lr': 0.000199368309796706, 'samples': 1287136, 'steps': 2513, 'loss/train': 1.9270102977752686} -09/20/2021 23:12:00 - INFO - __main__ - Step 40224: {'lr': 0.000199368309796706, 'samples': 1287168, 'steps': 2513, 'loss/train': 2.7414021492004395} -09/20/2021 23:12:01 - INFO - __main__ - Step 40225: {'lr': 0.00019936759374166907, 'samples': 1287200, 'steps': 2514, 'loss/train': 2.9736294746398926} -09/20/2021 23:12:01 - INFO - __main__ - Step 40226: {'lr': 0.00019936759374166907, 'samples': 1287232, 'steps': 2514, 'loss/train': 2.054863691329956} -09/20/2021 23:12:02 - INFO - __main__ - Step 40227: {'lr': 0.00019936759374166907, 'samples': 1287264, 'steps': 2514, 'loss/train': 3.0060441493988037} -09/20/2021 23:12:03 - INFO - __main__ - Step 40228: {'lr': 0.00019936759374166907, 'samples': 1287296, 'steps': 2514, 'loss/train': 2.9910025596618652} -09/20/2021 23:12:04 - INFO - __main__ - Step 40229: {'lr': 0.00019936759374166907, 'samples': 1287328, 'steps': 2514, 'loss/train': 2.553546905517578} -09/20/2021 23:12:04 - INFO - __main__ - Step 40230: {'lr': 0.00019936759374166907, 'samples': 1287360, 'steps': 2514, 'loss/train': 2.4880118370056152} -09/20/2021 23:12:05 - INFO - __main__ - Step 40231: {'lr': 0.00019936759374166907, 'samples': 1287392, 'steps': 2514, 'loss/train': 2.9809048175811768} -09/20/2021 23:12:06 - INFO - __main__ - Step 40232: {'lr': 0.00019936759374166907, 'samples': 1287424, 'steps': 2514, 'loss/train': 2.6451570987701416} -09/20/2021 23:12:07 - INFO - __main__ - Step 40233: {'lr': 0.00019936759374166907, 'samples': 1287456, 'steps': 2514, 'loss/train': 0.9122125506401062} -09/20/2021 23:12:07 - INFO - __main__ - Step 40234: {'lr': 0.00019936759374166907, 'samples': 1287488, 'steps': 2514, 'loss/train': 1.8990607261657715} -09/20/2021 23:12:08 - INFO - __main__ - Step 40235: {'lr': 0.00019936759374166907, 'samples': 1287520, 'steps': 2514, 'loss/train': 2.582237958908081} -09/20/2021 23:12:09 - INFO - __main__ - Step 40236: {'lr': 0.00019936759374166907, 'samples': 1287552, 'steps': 2514, 'loss/train': 2.358057737350464} -09/20/2021 23:12:10 - INFO - __main__ - Step 40237: {'lr': 0.00019936759374166907, 'samples': 1287584, 'steps': 2514, 'loss/train': 1.8052809238433838} -09/20/2021 23:12:10 - INFO - __main__ - Step 40238: {'lr': 0.00019936759374166907, 'samples': 1287616, 'steps': 2514, 'loss/train': 2.611471176147461} -09/20/2021 23:12:11 - INFO - __main__ - Step 40239: {'lr': 0.00019936759374166907, 'samples': 1287648, 'steps': 2514, 'loss/train': 2.0554001331329346} -09/20/2021 23:12:12 - INFO - __main__ - Step 40240: {'lr': 0.00019936759374166907, 'samples': 1287680, 'steps': 2514, 'loss/train': 2.2386391162872314} -09/20/2021 23:12:13 - INFO - __main__ - Step 40241: {'lr': 0.00019936687728230578, 'samples': 1287712, 'steps': 2515, 'loss/train': 2.253868579864502} -09/20/2021 23:12:13 - INFO - __main__ - Step 40242: {'lr': 0.00019936687728230578, 'samples': 1287744, 'steps': 2515, 'loss/train': 2.230914831161499} -09/20/2021 23:12:14 - INFO - __main__ - Step 40243: {'lr': 0.00019936687728230578, 'samples': 1287776, 'steps': 2515, 'loss/train': 1.9560335874557495} -09/20/2021 23:12:16 - INFO - __main__ - Step 40244: {'lr': 0.00019936687728230578, 'samples': 1287808, 'steps': 2515, 'loss/train': 1.1336582899093628} -09/20/2021 23:12:17 - INFO - __main__ - Step 40245: {'lr': 0.00019936687728230578, 'samples': 1287840, 'steps': 2515, 'loss/train': 2.302863359451294} -09/20/2021 23:12:17 - INFO - __main__ - Step 40246: {'lr': 0.00019936687728230578, 'samples': 1287872, 'steps': 2515, 'loss/train': 1.672706961631775} -09/20/2021 23:12:18 - INFO - __main__ - Step 40247: {'lr': 0.00019936687728230578, 'samples': 1287904, 'steps': 2515, 'loss/train': 2.0088846683502197} -09/20/2021 23:12:19 - INFO - __main__ - Step 40248: {'lr': 0.00019936687728230578, 'samples': 1287936, 'steps': 2515, 'loss/train': 1.8249273300170898} -09/20/2021 23:12:20 - INFO - __main__ - Step 40249: {'lr': 0.00019936687728230578, 'samples': 1287968, 'steps': 2515, 'loss/train': 2.051914691925049} -09/20/2021 23:12:20 - INFO - __main__ - Step 40250: {'lr': 0.00019936687728230578, 'samples': 1288000, 'steps': 2515, 'loss/train': 2.233691930770874} -09/20/2021 23:12:21 - INFO - __main__ - Step 40251: {'lr': 0.00019936687728230578, 'samples': 1288032, 'steps': 2515, 'loss/train': 2.727823257446289} -09/20/2021 23:12:22 - INFO - __main__ - Step 40252: {'lr': 0.00019936687728230578, 'samples': 1288064, 'steps': 2515, 'loss/train': 2.5593206882476807} -09/20/2021 23:12:23 - INFO - __main__ - Step 40253: {'lr': 0.00019936687728230578, 'samples': 1288096, 'steps': 2515, 'loss/train': 2.6567814350128174} -09/20/2021 23:12:23 - INFO - __main__ - Step 40254: {'lr': 0.00019936687728230578, 'samples': 1288128, 'steps': 2515, 'loss/train': 2.125974655151367} -09/20/2021 23:12:24 - INFO - __main__ - Step 40255: {'lr': 0.00019936687728230578, 'samples': 1288160, 'steps': 2515, 'loss/train': 1.8720120191574097} -09/20/2021 23:12:25 - INFO - __main__ - Step 40256: {'lr': 0.00019936687728230578, 'samples': 1288192, 'steps': 2515, 'loss/train': 1.5774224996566772} -09/20/2021 23:12:26 - INFO - __main__ - Step 40257: {'lr': 0.00019936616041861904, 'samples': 1288224, 'steps': 2516, 'loss/train': 0.9583405256271362} -09/20/2021 23:12:26 - INFO - __main__ - Step 40258: {'lr': 0.00019936616041861904, 'samples': 1288256, 'steps': 2516, 'loss/train': 2.122725248336792} -09/20/2021 23:12:27 - INFO - __main__ - Step 40259: {'lr': 0.00019936616041861904, 'samples': 1288288, 'steps': 2516, 'loss/train': 1.6828653812408447} -09/20/2021 23:12:28 - INFO - __main__ - Step 40260: {'lr': 0.00019936616041861904, 'samples': 1288320, 'steps': 2516, 'loss/train': 2.7467944622039795} -09/20/2021 23:12:29 - INFO - __main__ - Step 40261: {'lr': 0.00019936616041861904, 'samples': 1288352, 'steps': 2516, 'loss/train': 2.171430826187134} -09/20/2021 23:12:29 - INFO - __main__ - Step 40262: {'lr': 0.00019936616041861904, 'samples': 1288384, 'steps': 2516, 'loss/train': 2.278984785079956} -09/20/2021 23:12:30 - INFO - __main__ - Step 40263: {'lr': 0.00019936616041861904, 'samples': 1288416, 'steps': 2516, 'loss/train': 2.4091384410858154} -09/20/2021 23:12:31 - INFO - __main__ - Step 40264: {'lr': 0.00019936616041861904, 'samples': 1288448, 'steps': 2516, 'loss/train': 1.922458291053772} -09/20/2021 23:12:32 - INFO - __main__ - Step 40265: {'lr': 0.00019936616041861904, 'samples': 1288480, 'steps': 2516, 'loss/train': 2.2422802448272705} -09/20/2021 23:12:32 - INFO - __main__ - Step 40266: {'lr': 0.00019936616041861904, 'samples': 1288512, 'steps': 2516, 'loss/train': 1.8467121124267578} -09/20/2021 23:12:33 - INFO - __main__ - Step 40267: {'lr': 0.00019936616041861904, 'samples': 1288544, 'steps': 2516, 'loss/train': 1.7184382677078247} -09/20/2021 23:12:34 - INFO - __main__ - Step 40268: {'lr': 0.00019936616041861904, 'samples': 1288576, 'steps': 2516, 'loss/train': 0.4986928403377533} -09/20/2021 23:12:35 - INFO - __main__ - Step 40269: {'lr': 0.00019936616041861904, 'samples': 1288608, 'steps': 2516, 'loss/train': 0.72248375415802} -09/20/2021 23:12:35 - INFO - __main__ - Step 40270: {'lr': 0.00019936616041861904, 'samples': 1288640, 'steps': 2516, 'loss/train': 0.5603852868080139} -09/20/2021 23:12:36 - INFO - __main__ - Step 40271: {'lr': 0.00019936616041861904, 'samples': 1288672, 'steps': 2516, 'loss/train': 0.5431106090545654} -09/20/2021 23:12:37 - INFO - __main__ - Step 40272: {'lr': 0.00019936616041861904, 'samples': 1288704, 'steps': 2516, 'loss/train': 0.4896709620952606} -09/20/2021 23:12:38 - INFO - __main__ - Step 40273: {'lr': 0.0001993654431506118, 'samples': 1288736, 'steps': 2517, 'loss/train': 0.5365344882011414} -09/20/2021 23:12:39 - INFO - __main__ - Step 40274: {'lr': 0.0001993654431506118, 'samples': 1288768, 'steps': 2517, 'loss/train': 0.44987553358078003} -09/20/2021 23:12:39 - INFO - __main__ - Step 40275: {'lr': 0.0001993654431506118, 'samples': 1288800, 'steps': 2517, 'loss/train': 0.6810130476951599} -09/20/2021 23:12:40 - INFO - __main__ - Step 40276: {'lr': 0.0001993654431506118, 'samples': 1288832, 'steps': 2517, 'loss/train': 0.45175930857658386} -09/20/2021 23:12:41 - INFO - __main__ - Step 40277: {'lr': 0.0001993654431506118, 'samples': 1288864, 'steps': 2517, 'loss/train': 2.0512921810150146} -09/20/2021 23:12:42 - INFO - __main__ - Step 40278: {'lr': 0.0001993654431506118, 'samples': 1288896, 'steps': 2517, 'loss/train': 2.6244845390319824} -09/20/2021 23:12:42 - INFO - __main__ - Step 40279: {'lr': 0.0001993654431506118, 'samples': 1288928, 'steps': 2517, 'loss/train': 2.1617870330810547} -09/20/2021 23:12:44 - INFO - __main__ - Step 40280: {'lr': 0.0001993654431506118, 'samples': 1288960, 'steps': 2517, 'loss/train': 2.5460872650146484} -09/20/2021 23:12:44 - INFO - __main__ - Step 40281: {'lr': 0.0001993654431506118, 'samples': 1288992, 'steps': 2517, 'loss/train': 2.178020715713501} -09/20/2021 23:12:45 - INFO - __main__ - Step 40282: {'lr': 0.0001993654431506118, 'samples': 1289024, 'steps': 2517, 'loss/train': 2.300452470779419} -09/20/2021 23:12:46 - INFO - __main__ - Step 40283: {'lr': 0.0001993654431506118, 'samples': 1289056, 'steps': 2517, 'loss/train': 2.695996046066284} -09/20/2021 23:12:47 - INFO - __main__ - Step 40284: {'lr': 0.0001993654431506118, 'samples': 1289088, 'steps': 2517, 'loss/train': 2.0565454959869385} -09/20/2021 23:12:47 - INFO - __main__ - Step 40285: {'lr': 0.0001993654431506118, 'samples': 1289120, 'steps': 2517, 'loss/train': 2.204453945159912} -09/20/2021 23:12:48 - INFO - __main__ - Step 40286: {'lr': 0.0001993654431506118, 'samples': 1289152, 'steps': 2517, 'loss/train': 1.1332862377166748} -09/20/2021 23:12:49 - INFO - __main__ - Step 40287: {'lr': 0.0001993654431506118, 'samples': 1289184, 'steps': 2517, 'loss/train': 2.397602081298828} -09/20/2021 23:12:50 - INFO - __main__ - Step 40288: {'lr': 0.0001993654431506118, 'samples': 1289216, 'steps': 2517, 'loss/train': 1.5258641242980957} -09/20/2021 23:12:50 - INFO - __main__ - Step 40289: {'lr': 0.00019936472547828693, 'samples': 1289248, 'steps': 2518, 'loss/train': 2.7019309997558594} -09/20/2021 23:12:51 - INFO - __main__ - Step 40290: {'lr': 0.00019936472547828693, 'samples': 1289280, 'steps': 2518, 'loss/train': 2.139954090118408} -09/20/2021 23:12:52 - INFO - __main__ - Step 40291: {'lr': 0.00019936472547828693, 'samples': 1289312, 'steps': 2518, 'loss/train': 2.5714638233184814} -09/20/2021 23:12:53 - INFO - __main__ - Step 40292: {'lr': 0.00019936472547828693, 'samples': 1289344, 'steps': 2518, 'loss/train': 2.242111921310425} -09/20/2021 23:12:53 - INFO - __main__ - Step 40293: {'lr': 0.00019936472547828693, 'samples': 1289376, 'steps': 2518, 'loss/train': 2.8474724292755127} -09/20/2021 23:12:54 - INFO - __main__ - Step 40294: {'lr': 0.00019936472547828693, 'samples': 1289408, 'steps': 2518, 'loss/train': 2.1288440227508545} -09/20/2021 23:12:55 - INFO - __main__ - Step 40295: {'lr': 0.00019936472547828693, 'samples': 1289440, 'steps': 2518, 'loss/train': 2.1817398071289062} -09/20/2021 23:12:56 - INFO - __main__ - Step 40296: {'lr': 0.00019936472547828693, 'samples': 1289472, 'steps': 2518, 'loss/train': 3.063816785812378} -09/20/2021 23:12:56 - INFO - __main__ - Step 40297: {'lr': 0.00019936472547828693, 'samples': 1289504, 'steps': 2518, 'loss/train': 1.568411111831665} -09/20/2021 23:12:57 - INFO - __main__ - Step 40298: {'lr': 0.00019936472547828693, 'samples': 1289536, 'steps': 2518, 'loss/train': 1.2351933717727661} -09/20/2021 23:12:58 - INFO - __main__ - Step 40299: {'lr': 0.00019936472547828693, 'samples': 1289568, 'steps': 2518, 'loss/train': 1.8840506076812744} -09/20/2021 23:12:59 - INFO - __main__ - Step 40300: {'lr': 0.00019936472547828693, 'samples': 1289600, 'steps': 2518, 'loss/train': 2.094423770904541} -09/20/2021 23:12:59 - INFO - __main__ - Step 40301: {'lr': 0.00019936472547828693, 'samples': 1289632, 'steps': 2518, 'loss/train': 2.2713260650634766} -09/20/2021 23:13:00 - INFO - __main__ - Step 40302: {'lr': 0.00019936472547828693, 'samples': 1289664, 'steps': 2518, 'loss/train': 2.719740629196167} -09/20/2021 23:13:01 - INFO - __main__ - Step 40303: {'lr': 0.00019936472547828693, 'samples': 1289696, 'steps': 2518, 'loss/train': 1.7431373596191406} -09/20/2021 23:13:02 - INFO - __main__ - Step 40304: {'lr': 0.00019936472547828693, 'samples': 1289728, 'steps': 2518, 'loss/train': 2.2477991580963135} -09/20/2021 23:13:03 - INFO - __main__ - Step 40305: {'lr': 0.00019936400740164738, 'samples': 1289760, 'steps': 2519, 'loss/train': 2.875682830810547} -09/20/2021 23:13:03 - INFO - __main__ - Step 40306: {'lr': 0.00019936400740164738, 'samples': 1289792, 'steps': 2519, 'loss/train': 2.0560567378997803} -09/20/2021 23:13:04 - INFO - __main__ - Step 40307: {'lr': 0.00019936400740164738, 'samples': 1289824, 'steps': 2519, 'loss/train': 2.8382699489593506} -09/20/2021 23:13:05 - INFO - __main__ - Step 40308: {'lr': 0.00019936400740164738, 'samples': 1289856, 'steps': 2519, 'loss/train': 1.7099626064300537} -09/20/2021 23:13:06 - INFO - __main__ - Step 40309: {'lr': 0.00019936400740164738, 'samples': 1289888, 'steps': 2519, 'loss/train': 1.7687427997589111} -09/20/2021 23:13:06 - INFO - __main__ - Step 40310: {'lr': 0.00019936400740164738, 'samples': 1289920, 'steps': 2519, 'loss/train': 1.385318636894226} -09/20/2021 23:13:08 - INFO - __main__ - Step 40311: {'lr': 0.00019936400740164738, 'samples': 1289952, 'steps': 2519, 'loss/train': 2.1075453758239746} -09/20/2021 23:13:09 - INFO - __main__ - Step 40312: {'lr': 0.00019936400740164738, 'samples': 1289984, 'steps': 2519, 'loss/train': 2.433353900909424} -09/20/2021 23:13:09 - INFO - __main__ - Step 40313: {'lr': 0.00019936400740164738, 'samples': 1290016, 'steps': 2519, 'loss/train': 2.5089786052703857} -09/20/2021 23:13:10 - INFO - __main__ - Step 40314: {'lr': 0.00019936400740164738, 'samples': 1290048, 'steps': 2519, 'loss/train': 2.4931271076202393} -09/20/2021 23:13:11 - INFO - __main__ - Step 40315: {'lr': 0.00019936400740164738, 'samples': 1290080, 'steps': 2519, 'loss/train': 2.13720440864563} -09/20/2021 23:13:12 - INFO - __main__ - Step 40316: {'lr': 0.00019936400740164738, 'samples': 1290112, 'steps': 2519, 'loss/train': 2.1424014568328857} -09/20/2021 23:13:12 - INFO - __main__ - Step 40317: {'lr': 0.00019936400740164738, 'samples': 1290144, 'steps': 2519, 'loss/train': 1.877740502357483} -09/20/2021 23:13:13 - INFO - __main__ - Step 40318: {'lr': 0.00019936400740164738, 'samples': 1290176, 'steps': 2519, 'loss/train': 2.259974479675293} -09/20/2021 23:13:14 - INFO - __main__ - Step 40319: {'lr': 0.00019936400740164738, 'samples': 1290208, 'steps': 2519, 'loss/train': 2.1831042766571045} -09/20/2021 23:13:15 - INFO - __main__ - Step 40320: {'lr': 0.00019936400740164738, 'samples': 1290240, 'steps': 2519, 'loss/train': 2.019021987915039} -09/20/2021 23:13:16 - INFO - __main__ - Step 40321: {'lr': 0.00019936328892069608, 'samples': 1290272, 'steps': 2520, 'loss/train': 1.1256039142608643} -09/20/2021 23:13:16 - INFO - __main__ - Step 40322: {'lr': 0.00019936328892069608, 'samples': 1290304, 'steps': 2520, 'loss/train': 1.7587242126464844} -09/20/2021 23:13:17 - INFO - __main__ - Step 40323: {'lr': 0.00019936328892069608, 'samples': 1290336, 'steps': 2520, 'loss/train': 1.8830363750457764} -09/20/2021 23:13:18 - INFO - __main__ - Step 40324: {'lr': 0.00019936328892069608, 'samples': 1290368, 'steps': 2520, 'loss/train': 1.1446679830551147} -09/20/2021 23:13:19 - INFO - __main__ - Step 40325: {'lr': 0.00019936328892069608, 'samples': 1290400, 'steps': 2520, 'loss/train': 2.027078628540039} -09/20/2021 23:13:19 - INFO - __main__ - Step 40326: {'lr': 0.00019936328892069608, 'samples': 1290432, 'steps': 2520, 'loss/train': 2.2560782432556152} -09/20/2021 23:13:20 - INFO - __main__ - Step 40327: {'lr': 0.00019936328892069608, 'samples': 1290464, 'steps': 2520, 'loss/train': 2.818512201309204} -09/20/2021 23:13:21 - INFO - __main__ - Step 40328: {'lr': 0.00019936328892069608, 'samples': 1290496, 'steps': 2520, 'loss/train': 2.0964043140411377} -09/20/2021 23:13:22 - INFO - __main__ - Step 40329: {'lr': 0.00019936328892069608, 'samples': 1290528, 'steps': 2520, 'loss/train': 2.6077327728271484} -09/20/2021 23:13:22 - INFO - __main__ - Step 40330: {'lr': 0.00019936328892069608, 'samples': 1290560, 'steps': 2520, 'loss/train': 2.1740288734436035} -09/20/2021 23:13:23 - INFO - __main__ - Step 40331: {'lr': 0.00019936328892069608, 'samples': 1290592, 'steps': 2520, 'loss/train': 1.4382015466690063} -09/20/2021 23:13:24 - INFO - __main__ - Step 40332: {'lr': 0.00019936328892069608, 'samples': 1290624, 'steps': 2520, 'loss/train': 1.4642683267593384} -09/20/2021 23:13:25 - INFO - __main__ - Step 40333: {'lr': 0.00019936328892069608, 'samples': 1290656, 'steps': 2520, 'loss/train': 1.732600212097168} -09/20/2021 23:13:25 - INFO - __main__ - Step 40334: {'lr': 0.00019936328892069608, 'samples': 1290688, 'steps': 2520, 'loss/train': 2.1422152519226074} -09/20/2021 23:13:26 - INFO - __main__ - Step 40335: {'lr': 0.00019936328892069608, 'samples': 1290720, 'steps': 2520, 'loss/train': 2.307737350463867} -09/20/2021 23:13:27 - INFO - __main__ - Step 40336: {'lr': 0.00019936328892069608, 'samples': 1290752, 'steps': 2520, 'loss/train': 0.27268266677856445} -09/20/2021 23:13:28 - INFO - __main__ - Step 40337: {'lr': 0.00019936257003543592, 'samples': 1290784, 'steps': 2521, 'loss/train': 0.14943282306194305} -09/20/2021 23:13:28 - INFO - __main__ - Step 40338: {'lr': 0.00019936257003543592, 'samples': 1290816, 'steps': 2521, 'loss/train': 0.2824309468269348} -09/20/2021 23:13:29 - INFO - __main__ - Step 40339: {'lr': 0.00019936257003543592, 'samples': 1290848, 'steps': 2521, 'loss/train': 0.2762765884399414} -09/20/2021 23:13:30 - INFO - __main__ - Step 40340: {'lr': 0.00019936257003543592, 'samples': 1290880, 'steps': 2521, 'loss/train': 2.267582893371582} -09/20/2021 23:13:31 - INFO - __main__ - Step 40341: {'lr': 0.00019936257003543592, 'samples': 1290912, 'steps': 2521, 'loss/train': 3.1395576000213623} -09/20/2021 23:13:32 - INFO - __main__ - Step 40342: {'lr': 0.00019936257003543592, 'samples': 1290944, 'steps': 2521, 'loss/train': 1.716917634010315} -09/20/2021 23:13:33 - INFO - __main__ - Step 40343: {'lr': 0.00019936257003543592, 'samples': 1290976, 'steps': 2521, 'loss/train': 1.4346911907196045} -09/20/2021 23:13:33 - INFO - __main__ - Step 40344: {'lr': 0.00019936257003543592, 'samples': 1291008, 'steps': 2521, 'loss/train': 2.4212207794189453} -09/20/2021 23:13:34 - INFO - __main__ - Step 40345: {'lr': 0.00019936257003543592, 'samples': 1291040, 'steps': 2521, 'loss/train': 1.9989924430847168} -09/20/2021 23:13:35 - INFO - __main__ - Step 40346: {'lr': 0.00019936257003543592, 'samples': 1291072, 'steps': 2521, 'loss/train': 2.4752585887908936} -09/20/2021 23:13:36 - INFO - __main__ - Step 40347: {'lr': 0.00019936257003543592, 'samples': 1291104, 'steps': 2521, 'loss/train': 2.145380973815918} -09/20/2021 23:13:36 - INFO - __main__ - Step 40348: {'lr': 0.00019936257003543592, 'samples': 1291136, 'steps': 2521, 'loss/train': 1.9691452980041504} -09/20/2021 23:13:37 - INFO - __main__ - Step 40349: {'lr': 0.00019936257003543592, 'samples': 1291168, 'steps': 2521, 'loss/train': 1.8211933374404907} -09/20/2021 23:13:38 - INFO - __main__ - Step 40350: {'lr': 0.00019936257003543592, 'samples': 1291200, 'steps': 2521, 'loss/train': 2.092684268951416} -09/20/2021 23:13:39 - INFO - __main__ - Step 40351: {'lr': 0.00019936257003543592, 'samples': 1291232, 'steps': 2521, 'loss/train': 2.139726161956787} -09/20/2021 23:13:39 - INFO - __main__ - Step 40352: {'lr': 0.00019936257003543592, 'samples': 1291264, 'steps': 2521, 'loss/train': 2.2871339321136475} -09/20/2021 23:13:40 - INFO - __main__ - Step 40353: {'lr': 0.0001993618507458699, 'samples': 1291296, 'steps': 2522, 'loss/train': 1.9433951377868652} -09/20/2021 23:13:41 - INFO - __main__ - Step 40354: {'lr': 0.0001993618507458699, 'samples': 1291328, 'steps': 2522, 'loss/train': 5.0482683181762695} -09/20/2021 23:13:42 - INFO - __main__ - Step 40355: {'lr': 0.0001993618507458699, 'samples': 1291360, 'steps': 2522, 'loss/train': 1.9071784019470215} -09/20/2021 23:13:43 - INFO - __main__ - Step 40356: {'lr': 0.0001993618507458699, 'samples': 1291392, 'steps': 2522, 'loss/train': 2.5387861728668213} -09/20/2021 23:13:43 - INFO - __main__ - Step 40357: {'lr': 0.0001993618507458699, 'samples': 1291424, 'steps': 2522, 'loss/train': 1.9339085817337036} -09/20/2021 23:13:44 - INFO - __main__ - Step 40358: {'lr': 0.0001993618507458699, 'samples': 1291456, 'steps': 2522, 'loss/train': 1.398370385169983} -09/20/2021 23:13:45 - INFO - __main__ - Step 40359: {'lr': 0.0001993618507458699, 'samples': 1291488, 'steps': 2522, 'loss/train': 2.2061634063720703} -09/20/2021 23:13:46 - INFO - __main__ - Step 40360: {'lr': 0.0001993618507458699, 'samples': 1291520, 'steps': 2522, 'loss/train': 0.24803206324577332} -09/20/2021 23:13:46 - INFO - __main__ - Step 40361: {'lr': 0.0001993618507458699, 'samples': 1291552, 'steps': 2522, 'loss/train': 1.608567714691162} -09/20/2021 23:13:47 - INFO - __main__ - Step 40362: {'lr': 0.0001993618507458699, 'samples': 1291584, 'steps': 2522, 'loss/train': 0.1169474795460701} -09/20/2021 23:13:48 - INFO - __main__ - Step 40363: {'lr': 0.0001993618507458699, 'samples': 1291616, 'steps': 2522, 'loss/train': 2.162060260772705} -09/20/2021 23:13:49 - INFO - __main__ - Step 40364: {'lr': 0.0001993618507458699, 'samples': 1291648, 'steps': 2522, 'loss/train': 1.409583330154419} -09/20/2021 23:13:49 - INFO - __main__ - Step 40365: {'lr': 0.0001993618507458699, 'samples': 1291680, 'steps': 2522, 'loss/train': 2.309929370880127} -09/20/2021 23:13:50 - INFO - __main__ - Step 40366: {'lr': 0.0001993618507458699, 'samples': 1291712, 'steps': 2522, 'loss/train': 0.26022934913635254} -09/20/2021 23:13:51 - INFO - __main__ - Step 40367: {'lr': 0.0001993618507458699, 'samples': 1291744, 'steps': 2522, 'loss/train': 1.4659271240234375} -09/20/2021 23:13:52 - INFO - __main__ - Step 40368: {'lr': 0.0001993618507458699, 'samples': 1291776, 'steps': 2522, 'loss/train': 2.503483533859253} -09/20/2021 23:13:52 - INFO - __main__ - Step 40369: {'lr': 0.00019936113105200085, 'samples': 1291808, 'steps': 2523, 'loss/train': 1.5833357572555542} -09/20/2021 23:13:53 - INFO - __main__ - Step 40370: {'lr': 0.00019936113105200085, 'samples': 1291840, 'steps': 2523, 'loss/train': 1.1121087074279785} -09/20/2021 23:13:55 - INFO - __main__ - Step 40371: {'lr': 0.00019936113105200085, 'samples': 1291872, 'steps': 2523, 'loss/train': 1.5003867149353027} -09/20/2021 23:13:55 - INFO - __main__ - Step 40372: {'lr': 0.00019936113105200085, 'samples': 1291904, 'steps': 2523, 'loss/train': 1.6587464809417725} -09/20/2021 23:13:56 - INFO - __main__ - Step 40373: {'lr': 0.00019936113105200085, 'samples': 1291936, 'steps': 2523, 'loss/train': 2.558023691177368} -09/20/2021 23:13:57 - INFO - __main__ - Step 40374: {'lr': 0.00019936113105200085, 'samples': 1291968, 'steps': 2523, 'loss/train': 1.8714632987976074} -09/20/2021 23:13:58 - INFO - __main__ - Step 40375: {'lr': 0.00019936113105200085, 'samples': 1292000, 'steps': 2523, 'loss/train': 2.131185293197632} -09/20/2021 23:13:58 - INFO - __main__ - Step 40376: {'lr': 0.00019936113105200085, 'samples': 1292032, 'steps': 2523, 'loss/train': 2.40354585647583} -09/20/2021 23:13:59 - INFO - __main__ - Step 40377: {'lr': 0.00019936113105200085, 'samples': 1292064, 'steps': 2523, 'loss/train': 2.3275086879730225} -09/20/2021 23:14:00 - INFO - __main__ - Step 40378: {'lr': 0.00019936113105200085, 'samples': 1292096, 'steps': 2523, 'loss/train': 2.539379596710205} -09/20/2021 23:14:01 - INFO - __main__ - Step 40379: {'lr': 0.00019936113105200085, 'samples': 1292128, 'steps': 2523, 'loss/train': 2.382249593734741} -09/20/2021 23:14:01 - INFO - __main__ - Step 40380: {'lr': 0.00019936113105200085, 'samples': 1292160, 'steps': 2523, 'loss/train': 1.9396109580993652} -09/20/2021 23:14:02 - INFO - __main__ - Step 40381: {'lr': 0.00019936113105200085, 'samples': 1292192, 'steps': 2523, 'loss/train': 3.1061079502105713} -09/20/2021 23:14:03 - INFO - __main__ - Step 40382: {'lr': 0.00019936113105200085, 'samples': 1292224, 'steps': 2523, 'loss/train': 1.635292887687683} -09/20/2021 23:14:04 - INFO - __main__ - Step 40383: {'lr': 0.00019936113105200085, 'samples': 1292256, 'steps': 2523, 'loss/train': 1.6014553308486938} -09/20/2021 23:14:04 - INFO - __main__ - Step 40384: {'lr': 0.00019936113105200085, 'samples': 1292288, 'steps': 2523, 'loss/train': 2.6258623600006104} -09/20/2021 23:14:05 - INFO - __main__ - Step 40385: {'lr': 0.00019936041095383174, 'samples': 1292320, 'steps': 2524, 'loss/train': 1.672324299812317} -09/20/2021 23:14:06 - INFO - __main__ - Step 40386: {'lr': 0.00019936041095383174, 'samples': 1292352, 'steps': 2524, 'loss/train': 1.7736899852752686} -09/20/2021 23:14:07 - INFO - __main__ - Step 40387: {'lr': 0.00019936041095383174, 'samples': 1292384, 'steps': 2524, 'loss/train': 2.0206470489501953} -09/20/2021 23:14:07 - INFO - __main__ - Step 40388: {'lr': 0.00019936041095383174, 'samples': 1292416, 'steps': 2524, 'loss/train': 2.0454161167144775} -09/20/2021 23:14:08 - INFO - __main__ - Step 40389: {'lr': 0.00019936041095383174, 'samples': 1292448, 'steps': 2524, 'loss/train': 1.9927787780761719} -09/20/2021 23:14:09 - INFO - __main__ - Step 40390: {'lr': 0.00019936041095383174, 'samples': 1292480, 'steps': 2524, 'loss/train': 1.8184341192245483} -09/20/2021 23:14:10 - INFO - __main__ - Step 40391: {'lr': 0.00019936041095383174, 'samples': 1292512, 'steps': 2524, 'loss/train': 2.076730966567993} -09/20/2021 23:14:10 - INFO - __main__ - Step 40392: {'lr': 0.00019936041095383174, 'samples': 1292544, 'steps': 2524, 'loss/train': 1.9876515865325928} -09/20/2021 23:14:11 - INFO - __main__ - Step 40393: {'lr': 0.00019936041095383174, 'samples': 1292576, 'steps': 2524, 'loss/train': 2.961042881011963} -09/20/2021 23:14:12 - INFO - __main__ - Step 40394: {'lr': 0.00019936041095383174, 'samples': 1292608, 'steps': 2524, 'loss/train': 2.305800437927246} -09/20/2021 23:14:13 - INFO - __main__ - Step 40395: {'lr': 0.00019936041095383174, 'samples': 1292640, 'steps': 2524, 'loss/train': 1.9178342819213867} -09/20/2021 23:14:13 - INFO - __main__ - Step 40396: {'lr': 0.00019936041095383174, 'samples': 1292672, 'steps': 2524, 'loss/train': 2.250927686691284} -09/20/2021 23:14:14 - INFO - __main__ - Step 40397: {'lr': 0.00019936041095383174, 'samples': 1292704, 'steps': 2524, 'loss/train': 2.0377063751220703} -09/20/2021 23:14:15 - INFO - __main__ - Step 40398: {'lr': 0.00019936041095383174, 'samples': 1292736, 'steps': 2524, 'loss/train': 2.1465814113616943} -09/20/2021 23:14:16 - INFO - __main__ - Step 40399: {'lr': 0.00019936041095383174, 'samples': 1292768, 'steps': 2524, 'loss/train': 2.5172781944274902} -09/20/2021 23:14:16 - INFO - __main__ - Step 40400: {'lr': 0.00019936041095383174, 'samples': 1292800, 'steps': 2524, 'loss/train': 1.4925614595413208} -09/20/2021 23:14:17 - INFO - __main__ - Step 40401: {'lr': 0.00019935969045136554, 'samples': 1292832, 'steps': 2525, 'loss/train': 2.1364243030548096} -09/20/2021 23:14:19 - INFO - __main__ - Step 40402: {'lr': 0.00019935969045136554, 'samples': 1292864, 'steps': 2525, 'loss/train': 1.6827192306518555} -09/20/2021 23:14:19 - INFO - __main__ - Step 40403: {'lr': 0.00019935969045136554, 'samples': 1292896, 'steps': 2525, 'loss/train': 1.9967349767684937} -09/20/2021 23:14:20 - INFO - __main__ - Step 40404: {'lr': 0.00019935969045136554, 'samples': 1292928, 'steps': 2525, 'loss/train': 1.9502336978912354} -09/20/2021 23:14:21 - INFO - __main__ - Step 40405: {'lr': 0.00019935969045136554, 'samples': 1292960, 'steps': 2525, 'loss/train': 2.4523890018463135} -09/20/2021 23:14:22 - INFO - __main__ - Step 40406: {'lr': 0.00019935969045136554, 'samples': 1292992, 'steps': 2525, 'loss/train': 1.1453914642333984} -09/20/2021 23:14:22 - INFO - __main__ - Step 40407: {'lr': 0.00019935969045136554, 'samples': 1293024, 'steps': 2525, 'loss/train': 1.7485294342041016} -09/20/2021 23:14:23 - INFO - __main__ - Step 40408: {'lr': 0.00019935969045136554, 'samples': 1293056, 'steps': 2525, 'loss/train': 3.674640417098999} -09/20/2021 23:14:24 - INFO - __main__ - Step 40409: {'lr': 0.00019935969045136554, 'samples': 1293088, 'steps': 2525, 'loss/train': 2.5500950813293457} -09/20/2021 23:14:25 - INFO - __main__ - Step 40410: {'lr': 0.00019935969045136554, 'samples': 1293120, 'steps': 2525, 'loss/train': 2.4298479557037354} -09/20/2021 23:14:25 - INFO - __main__ - Step 40411: {'lr': 0.00019935969045136554, 'samples': 1293152, 'steps': 2525, 'loss/train': 2.789224147796631} -09/20/2021 23:14:26 - INFO - __main__ - Step 40412: {'lr': 0.00019935969045136554, 'samples': 1293184, 'steps': 2525, 'loss/train': 2.988938331604004} -09/20/2021 23:14:27 - INFO - __main__ - Step 40413: {'lr': 0.00019935969045136554, 'samples': 1293216, 'steps': 2525, 'loss/train': 1.0196983814239502} -09/20/2021 23:14:28 - INFO - __main__ - Step 40414: {'lr': 0.00019935969045136554, 'samples': 1293248, 'steps': 2525, 'loss/train': 1.8833914995193481} -09/20/2021 23:14:28 - INFO - __main__ - Step 40415: {'lr': 0.00019935969045136554, 'samples': 1293280, 'steps': 2525, 'loss/train': 2.35640811920166} -09/20/2021 23:14:29 - INFO - __main__ - Step 40416: {'lr': 0.00019935969045136554, 'samples': 1293312, 'steps': 2525, 'loss/train': 2.173719644546509} -09/20/2021 23:14:30 - INFO - __main__ - Step 40417: {'lr': 0.00019935896954460512, 'samples': 1293344, 'steps': 2526, 'loss/train': 1.0737435817718506} -09/20/2021 23:14:31 - INFO - __main__ - Step 40418: {'lr': 0.00019935896954460512, 'samples': 1293376, 'steps': 2526, 'loss/train': 2.3633360862731934} -09/20/2021 23:14:31 - INFO - __main__ - Step 40419: {'lr': 0.00019935896954460512, 'samples': 1293408, 'steps': 2526, 'loss/train': 3.5532753467559814} -09/20/2021 23:14:32 - INFO - __main__ - Step 40420: {'lr': 0.00019935896954460512, 'samples': 1293440, 'steps': 2526, 'loss/train': 2.51151180267334} -09/20/2021 23:14:33 - INFO - __main__ - Step 40421: {'lr': 0.00019935896954460512, 'samples': 1293472, 'steps': 2526, 'loss/train': 2.441237688064575} -09/20/2021 23:14:34 - INFO - __main__ - Step 40422: {'lr': 0.00019935896954460512, 'samples': 1293504, 'steps': 2526, 'loss/train': 2.014918565750122} -09/20/2021 23:14:34 - INFO - __main__ - Step 40423: {'lr': 0.00019935896954460512, 'samples': 1293536, 'steps': 2526, 'loss/train': 2.417637825012207} -09/20/2021 23:14:35 - INFO - __main__ - Step 40424: {'lr': 0.00019935896954460512, 'samples': 1293568, 'steps': 2526, 'loss/train': 1.4925131797790527} -09/20/2021 23:14:36 - INFO - __main__ - Step 40425: {'lr': 0.00019935896954460512, 'samples': 1293600, 'steps': 2526, 'loss/train': 2.914440155029297} -09/20/2021 23:14:37 - INFO - __main__ - Step 40426: {'lr': 0.00019935896954460512, 'samples': 1293632, 'steps': 2526, 'loss/train': 2.806565284729004} -09/20/2021 23:14:37 - INFO - __main__ - Step 40427: {'lr': 0.00019935896954460512, 'samples': 1293664, 'steps': 2526, 'loss/train': 2.190067768096924} -09/20/2021 23:14:38 - INFO - __main__ - Step 40428: {'lr': 0.00019935896954460512, 'samples': 1293696, 'steps': 2526, 'loss/train': 2.7287023067474365} -09/20/2021 23:14:39 - INFO - __main__ - Step 40429: {'lr': 0.00019935896954460512, 'samples': 1293728, 'steps': 2526, 'loss/train': 1.4471852779388428} -09/20/2021 23:14:40 - INFO - __main__ - Step 40430: {'lr': 0.00019935896954460512, 'samples': 1293760, 'steps': 2526, 'loss/train': 2.08553409576416} -09/20/2021 23:14:40 - INFO - __main__ - Step 40431: {'lr': 0.00019935896954460512, 'samples': 1293792, 'steps': 2526, 'loss/train': 2.0393176078796387} -09/20/2021 23:14:41 - INFO - __main__ - Step 40432: {'lr': 0.00019935896954460512, 'samples': 1293824, 'steps': 2526, 'loss/train': 2.3370044231414795} -09/20/2021 23:14:42 - INFO - __main__ - Step 40433: {'lr': 0.00019935824823355346, 'samples': 1293856, 'steps': 2527, 'loss/train': 1.309511661529541} -09/20/2021 23:14:43 - INFO - __main__ - Step 40434: {'lr': 0.00019935824823355346, 'samples': 1293888, 'steps': 2527, 'loss/train': 2.3956665992736816} -09/20/2021 23:14:44 - INFO - __main__ - Step 40435: {'lr': 0.00019935824823355346, 'samples': 1293920, 'steps': 2527, 'loss/train': 1.8999474048614502} -09/20/2021 23:14:45 - INFO - __main__ - Step 40436: {'lr': 0.00019935824823355346, 'samples': 1293952, 'steps': 2527, 'loss/train': 2.071354389190674} -09/20/2021 23:14:46 - INFO - __main__ - Step 40437: {'lr': 0.00019935824823355346, 'samples': 1293984, 'steps': 2527, 'loss/train': 1.8929063081741333} -09/20/2021 23:14:46 - INFO - __main__ - Step 40438: {'lr': 0.00019935824823355346, 'samples': 1294016, 'steps': 2527, 'loss/train': 1.8832168579101562} -09/20/2021 23:14:47 - INFO - __main__ - Step 40439: {'lr': 0.00019935824823355346, 'samples': 1294048, 'steps': 2527, 'loss/train': 2.2407028675079346} -09/20/2021 23:14:48 - INFO - __main__ - Step 40440: {'lr': 0.00019935824823355346, 'samples': 1294080, 'steps': 2527, 'loss/train': 2.816694498062134} -09/20/2021 23:14:49 - INFO - __main__ - Step 40441: {'lr': 0.00019935824823355346, 'samples': 1294112, 'steps': 2527, 'loss/train': 3.706698179244995} -09/20/2021 23:14:49 - INFO - __main__ - Step 40442: {'lr': 0.00019935824823355346, 'samples': 1294144, 'steps': 2527, 'loss/train': 2.648671865463257} -09/20/2021 23:14:50 - INFO - __main__ - Step 40443: {'lr': 0.00019935824823355346, 'samples': 1294176, 'steps': 2527, 'loss/train': 1.9978272914886475} -09/20/2021 23:14:51 - INFO - __main__ - Step 40444: {'lr': 0.00019935824823355346, 'samples': 1294208, 'steps': 2527, 'loss/train': 2.78818941116333} -09/20/2021 23:14:52 - INFO - __main__ - Step 40445: {'lr': 0.00019935824823355346, 'samples': 1294240, 'steps': 2527, 'loss/train': 2.6739397048950195} -09/20/2021 23:14:52 - INFO - __main__ - Step 40446: {'lr': 0.00019935824823355346, 'samples': 1294272, 'steps': 2527, 'loss/train': 2.7677433490753174} -09/20/2021 23:14:53 - INFO - __main__ - Step 40447: {'lr': 0.00019935824823355346, 'samples': 1294304, 'steps': 2527, 'loss/train': 2.1509833335876465} -09/20/2021 23:14:54 - INFO - __main__ - Step 40448: {'lr': 0.00019935824823355346, 'samples': 1294336, 'steps': 2527, 'loss/train': 0.5557942390441895} -09/20/2021 23:14:55 - INFO - __main__ - Step 40449: {'lr': 0.00019935752651821344, 'samples': 1294368, 'steps': 2528, 'loss/train': 2.367337226867676} -09/20/2021 23:14:56 - INFO - __main__ - Step 40450: {'lr': 0.00019935752651821344, 'samples': 1294400, 'steps': 2528, 'loss/train': 1.7755659818649292} -09/20/2021 23:14:56 - INFO - __main__ - Step 40451: {'lr': 0.00019935752651821344, 'samples': 1294432, 'steps': 2528, 'loss/train': 2.1856815814971924} -09/20/2021 23:14:57 - INFO - __main__ - Step 40452: {'lr': 0.00019935752651821344, 'samples': 1294464, 'steps': 2528, 'loss/train': 2.263334274291992} -09/20/2021 23:14:58 - INFO - __main__ - Step 40453: {'lr': 0.00019935752651821344, 'samples': 1294496, 'steps': 2528, 'loss/train': 1.8914873600006104} -09/20/2021 23:14:59 - INFO - __main__ - Step 40454: {'lr': 0.00019935752651821344, 'samples': 1294528, 'steps': 2528, 'loss/train': 1.730871558189392} -09/20/2021 23:14:59 - INFO - __main__ - Step 40455: {'lr': 0.00019935752651821344, 'samples': 1294560, 'steps': 2528, 'loss/train': 2.7383620738983154} -09/20/2021 23:15:00 - INFO - __main__ - Step 40456: {'lr': 0.00019935752651821344, 'samples': 1294592, 'steps': 2528, 'loss/train': 1.9431661367416382} -09/20/2021 23:15:01 - INFO - __main__ - Step 40457: {'lr': 0.00019935752651821344, 'samples': 1294624, 'steps': 2528, 'loss/train': 2.4127562046051025} -09/20/2021 23:15:02 - INFO - __main__ - Step 40458: {'lr': 0.00019935752651821344, 'samples': 1294656, 'steps': 2528, 'loss/train': 2.189603805541992} -09/20/2021 23:15:02 - INFO - __main__ - Step 40459: {'lr': 0.00019935752651821344, 'samples': 1294688, 'steps': 2528, 'loss/train': 3.2480835914611816} -09/20/2021 23:15:03 - INFO - __main__ - Step 40460: {'lr': 0.00019935752651821344, 'samples': 1294720, 'steps': 2528, 'loss/train': 1.8990261554718018} -09/20/2021 23:15:04 - INFO - __main__ - Step 40461: {'lr': 0.00019935752651821344, 'samples': 1294752, 'steps': 2528, 'loss/train': 1.1370723247528076} -09/20/2021 23:15:05 - INFO - __main__ - Step 40462: {'lr': 0.00019935752651821344, 'samples': 1294784, 'steps': 2528, 'loss/train': 2.0015311241149902} -09/20/2021 23:15:05 - INFO - __main__ - Step 40463: {'lr': 0.00019935752651821344, 'samples': 1294816, 'steps': 2528, 'loss/train': 2.246957302093506} -09/20/2021 23:15:06 - INFO - __main__ - Step 40464: {'lr': 0.00019935752651821344, 'samples': 1294848, 'steps': 2528, 'loss/train': 2.891997814178467} -09/20/2021 23:15:08 - INFO - __main__ - Step 40465: {'lr': 0.00019935680439858806, 'samples': 1294880, 'steps': 2529, 'loss/train': 2.3800430297851562} -09/20/2021 23:15:08 - INFO - __main__ - Step 40466: {'lr': 0.00019935680439858806, 'samples': 1294912, 'steps': 2529, 'loss/train': 2.44518780708313} -09/20/2021 23:15:09 - INFO - __main__ - Step 40467: {'lr': 0.00019935680439858806, 'samples': 1294944, 'steps': 2529, 'loss/train': 2.3329288959503174} -09/20/2021 23:15:10 - INFO - __main__ - Step 40468: {'lr': 0.00019935680439858806, 'samples': 1294976, 'steps': 2529, 'loss/train': 1.3458129167556763} -09/20/2021 23:15:11 - INFO - __main__ - Step 40469: {'lr': 0.00019935680439858806, 'samples': 1295008, 'steps': 2529, 'loss/train': 1.5722250938415527} -09/20/2021 23:15:11 - INFO - __main__ - Step 40470: {'lr': 0.00019935680439858806, 'samples': 1295040, 'steps': 2529, 'loss/train': 1.572003960609436} -09/20/2021 23:15:12 - INFO - __main__ - Step 40471: {'lr': 0.00019935680439858806, 'samples': 1295072, 'steps': 2529, 'loss/train': 1.6379549503326416} -09/20/2021 23:15:13 - INFO - __main__ - Step 40472: {'lr': 0.00019935680439858806, 'samples': 1295104, 'steps': 2529, 'loss/train': 1.8599807024002075} -09/20/2021 23:15:14 - INFO - __main__ - Step 40473: {'lr': 0.00019935680439858806, 'samples': 1295136, 'steps': 2529, 'loss/train': 0.703097939491272} -09/20/2021 23:15:14 - INFO - __main__ - Step 40474: {'lr': 0.00019935680439858806, 'samples': 1295168, 'steps': 2529, 'loss/train': 2.1119699478149414} -09/20/2021 23:15:15 - INFO - __main__ - Step 40475: {'lr': 0.00019935680439858806, 'samples': 1295200, 'steps': 2529, 'loss/train': 2.0811591148376465} -09/20/2021 23:15:16 - INFO - __main__ - Step 40476: {'lr': 0.00019935680439858806, 'samples': 1295232, 'steps': 2529, 'loss/train': 2.5007426738739014} -09/20/2021 23:15:17 - INFO - __main__ - Step 40477: {'lr': 0.00019935680439858806, 'samples': 1295264, 'steps': 2529, 'loss/train': 1.7988389730453491} -09/20/2021 23:15:17 - INFO - __main__ - Step 40478: {'lr': 0.00019935680439858806, 'samples': 1295296, 'steps': 2529, 'loss/train': 2.7674102783203125} -09/20/2021 23:15:18 - INFO - __main__ - Step 40479: {'lr': 0.00019935680439858806, 'samples': 1295328, 'steps': 2529, 'loss/train': 2.81390643119812} -09/20/2021 23:15:19 - INFO - __main__ - Step 40480: {'lr': 0.00019935680439858806, 'samples': 1295360, 'steps': 2529, 'loss/train': 1.2427473068237305} -09/20/2021 23:15:20 - INFO - __main__ - Step 40481: {'lr': 0.00019935608187468022, 'samples': 1295392, 'steps': 2530, 'loss/train': 2.8743481636047363} -09/20/2021 23:15:21 - INFO - __main__ - Step 40482: {'lr': 0.00019935608187468022, 'samples': 1295424, 'steps': 2530, 'loss/train': 3.3778083324432373} -09/20/2021 23:15:21 - INFO - __main__ - Step 40483: {'lr': 0.00019935608187468022, 'samples': 1295456, 'steps': 2530, 'loss/train': 1.958437204360962} -09/20/2021 23:15:22 - INFO - __main__ - Step 40484: {'lr': 0.00019935608187468022, 'samples': 1295488, 'steps': 2530, 'loss/train': 2.0052549839019775} -09/20/2021 23:15:23 - INFO - __main__ - Step 40485: {'lr': 0.00019935608187468022, 'samples': 1295520, 'steps': 2530, 'loss/train': 1.458578109741211} -09/20/2021 23:15:24 - INFO - __main__ - Step 40486: {'lr': 0.00019935608187468022, 'samples': 1295552, 'steps': 2530, 'loss/train': 1.9303137063980103} -09/20/2021 23:15:24 - INFO - __main__ - Step 40487: {'lr': 0.00019935608187468022, 'samples': 1295584, 'steps': 2530, 'loss/train': 0.9580512046813965} -09/20/2021 23:15:25 - INFO - __main__ - Step 40488: {'lr': 0.00019935608187468022, 'samples': 1295616, 'steps': 2530, 'loss/train': 1.892461895942688} -09/20/2021 23:15:26 - INFO - __main__ - Step 40489: {'lr': 0.00019935608187468022, 'samples': 1295648, 'steps': 2530, 'loss/train': 2.451894521713257} -09/20/2021 23:15:27 - INFO - __main__ - Step 40490: {'lr': 0.00019935608187468022, 'samples': 1295680, 'steps': 2530, 'loss/train': 2.725520610809326} -09/20/2021 23:15:27 - INFO - __main__ - Step 40491: {'lr': 0.00019935608187468022, 'samples': 1295712, 'steps': 2530, 'loss/train': 2.1745314598083496} -09/20/2021 23:15:28 - INFO - __main__ - Step 40492: {'lr': 0.00019935608187468022, 'samples': 1295744, 'steps': 2530, 'loss/train': 2.375246286392212} -09/20/2021 23:15:29 - INFO - __main__ - Step 40493: {'lr': 0.00019935608187468022, 'samples': 1295776, 'steps': 2530, 'loss/train': 2.0948522090911865} -09/20/2021 23:15:30 - INFO - __main__ - Step 40494: {'lr': 0.00019935608187468022, 'samples': 1295808, 'steps': 2530, 'loss/train': 1.9225367307662964} -09/20/2021 23:15:30 - INFO - __main__ - Step 40495: {'lr': 0.00019935608187468022, 'samples': 1295840, 'steps': 2530, 'loss/train': 2.7424845695495605} -09/20/2021 23:15:31 - INFO - __main__ - Step 40496: {'lr': 0.00019935608187468022, 'samples': 1295872, 'steps': 2530, 'loss/train': 2.6127281188964844} -09/20/2021 23:15:33 - INFO - __main__ - Step 40497: {'lr': 0.00019935535894649285, 'samples': 1295904, 'steps': 2531, 'loss/train': 1.8725115060806274} -09/20/2021 23:15:34 - INFO - __main__ - Step 40498: {'lr': 0.00019935535894649285, 'samples': 1295936, 'steps': 2531, 'loss/train': 1.1937943696975708} -09/20/2021 23:15:35 - INFO - __main__ - Step 40499: {'lr': 0.00019935535894649285, 'samples': 1295968, 'steps': 2531, 'loss/train': 1.5108314752578735} -09/20/2021 23:15:35 - INFO - __main__ - Step 40500: {'lr': 0.00019935535894649285, 'samples': 1296000, 'steps': 2531, 'loss/train': 2.0450878143310547} -09/20/2021 23:15:36 - INFO - __main__ - Step 40501: {'lr': 0.00019935535894649285, 'samples': 1296032, 'steps': 2531, 'loss/train': 1.7500361204147339} -09/20/2021 23:15:37 - INFO - __main__ - Step 40502: {'lr': 0.00019935535894649285, 'samples': 1296064, 'steps': 2531, 'loss/train': 1.2958711385726929} -09/20/2021 23:15:38 - INFO - __main__ - Step 40503: {'lr': 0.00019935535894649285, 'samples': 1296096, 'steps': 2531, 'loss/train': 1.382266640663147} -09/20/2021 23:15:38 - INFO - __main__ - Step 40504: {'lr': 0.00019935535894649285, 'samples': 1296128, 'steps': 2531, 'loss/train': 1.771349310874939} -09/20/2021 23:15:39 - INFO - __main__ - Step 40505: {'lr': 0.00019935535894649285, 'samples': 1296160, 'steps': 2531, 'loss/train': 1.33273184299469} -09/20/2021 23:15:40 - INFO - __main__ - Step 40506: {'lr': 0.00019935535894649285, 'samples': 1296192, 'steps': 2531, 'loss/train': 2.1815285682678223} -09/20/2021 23:15:41 - INFO - __main__ - Step 40507: {'lr': 0.00019935535894649285, 'samples': 1296224, 'steps': 2531, 'loss/train': 2.4736440181732178} -09/20/2021 23:15:41 - INFO - __main__ - Step 40508: {'lr': 0.00019935535894649285, 'samples': 1296256, 'steps': 2531, 'loss/train': 2.2374930381774902} -09/20/2021 23:15:42 - INFO - __main__ - Step 40509: {'lr': 0.00019935535894649285, 'samples': 1296288, 'steps': 2531, 'loss/train': 2.699070692062378} -09/20/2021 23:15:43 - INFO - __main__ - Step 40510: {'lr': 0.00019935535894649285, 'samples': 1296320, 'steps': 2531, 'loss/train': 1.2785907983779907} -09/20/2021 23:15:44 - INFO - __main__ - Step 40511: {'lr': 0.00019935535894649285, 'samples': 1296352, 'steps': 2531, 'loss/train': 1.8310632705688477} -09/20/2021 23:15:44 - INFO - __main__ - Step 40512: {'lr': 0.00019935535894649285, 'samples': 1296384, 'steps': 2531, 'loss/train': 2.894641876220703} -09/20/2021 23:15:45 - INFO - __main__ - Step 40513: {'lr': 0.00019935463561402894, 'samples': 1296416, 'steps': 2532, 'loss/train': 2.150381088256836} -09/20/2021 23:15:46 - INFO - __main__ - Step 40514: {'lr': 0.00019935463561402894, 'samples': 1296448, 'steps': 2532, 'loss/train': 2.9760549068450928} -09/20/2021 23:15:47 - INFO - __main__ - Step 40515: {'lr': 0.00019935463561402894, 'samples': 1296480, 'steps': 2532, 'loss/train': 2.0216012001037598} -09/20/2021 23:15:47 - INFO - __main__ - Step 40516: {'lr': 0.00019935463561402894, 'samples': 1296512, 'steps': 2532, 'loss/train': 2.227088212966919} -09/20/2021 23:15:48 - INFO - __main__ - Step 40517: {'lr': 0.00019935463561402894, 'samples': 1296544, 'steps': 2532, 'loss/train': 3.084315776824951} -09/20/2021 23:15:49 - INFO - __main__ - Step 40518: {'lr': 0.00019935463561402894, 'samples': 1296576, 'steps': 2532, 'loss/train': 1.6986334323883057} -09/20/2021 23:15:50 - INFO - __main__ - Step 40519: {'lr': 0.00019935463561402894, 'samples': 1296608, 'steps': 2532, 'loss/train': 2.329197883605957} -09/20/2021 23:15:50 - INFO - __main__ - Step 40520: {'lr': 0.00019935463561402894, 'samples': 1296640, 'steps': 2532, 'loss/train': 2.3570914268493652} -09/20/2021 23:15:51 - INFO - __main__ - Step 40521: {'lr': 0.00019935463561402894, 'samples': 1296672, 'steps': 2532, 'loss/train': 6.06781530380249} -09/20/2021 23:15:52 - INFO - __main__ - Step 40522: {'lr': 0.00019935463561402894, 'samples': 1296704, 'steps': 2532, 'loss/train': 5.511902332305908} -09/20/2021 23:15:53 - INFO - __main__ - Step 40523: {'lr': 0.00019935463561402894, 'samples': 1296736, 'steps': 2532, 'loss/train': 2.403250217437744} -09/20/2021 23:15:53 - INFO - __main__ - Step 40524: {'lr': 0.00019935463561402894, 'samples': 1296768, 'steps': 2532, 'loss/train': 2.9534671306610107} -09/20/2021 23:15:54 - INFO - __main__ - Step 40525: {'lr': 0.00019935463561402894, 'samples': 1296800, 'steps': 2532, 'loss/train': 1.4856289625167847} -09/20/2021 23:15:55 - INFO - __main__ - Step 40526: {'lr': 0.00019935463561402894, 'samples': 1296832, 'steps': 2532, 'loss/train': 2.4611945152282715} -09/20/2021 23:15:56 - INFO - __main__ - Step 40527: {'lr': 0.00019935463561402894, 'samples': 1296864, 'steps': 2532, 'loss/train': 2.1398589611053467} -09/20/2021 23:15:56 - INFO - __main__ - Step 40528: {'lr': 0.00019935463561402894, 'samples': 1296896, 'steps': 2532, 'loss/train': 2.704313039779663} -09/20/2021 23:15:58 - INFO - __main__ - Step 40529: {'lr': 0.0001993539118772914, 'samples': 1296928, 'steps': 2533, 'loss/train': 1.444146990776062} -09/20/2021 23:15:59 - INFO - __main__ - Step 40530: {'lr': 0.0001993539118772914, 'samples': 1296960, 'steps': 2533, 'loss/train': 2.2383337020874023} -09/20/2021 23:16:00 - INFO - __main__ - Step 40531: {'lr': 0.0001993539118772914, 'samples': 1296992, 'steps': 2533, 'loss/train': 2.5190658569335938} -09/20/2021 23:16:00 - INFO - __main__ - Step 40532: {'lr': 0.0001993539118772914, 'samples': 1297024, 'steps': 2533, 'loss/train': 0.12799102067947388} -09/20/2021 23:16:01 - INFO - __main__ - Step 40533: {'lr': 0.0001993539118772914, 'samples': 1297056, 'steps': 2533, 'loss/train': 0.16657710075378418} -09/20/2021 23:16:02 - INFO - __main__ - Step 40534: {'lr': 0.0001993539118772914, 'samples': 1297088, 'steps': 2533, 'loss/train': 0.42822062969207764} -09/20/2021 23:16:03 - INFO - __main__ - Step 40535: {'lr': 0.0001993539118772914, 'samples': 1297120, 'steps': 2533, 'loss/train': 1.7865869998931885} -09/20/2021 23:16:03 - INFO - __main__ - Step 40536: {'lr': 0.0001993539118772914, 'samples': 1297152, 'steps': 2533, 'loss/train': 1.958211898803711} -09/20/2021 23:16:04 - INFO - __main__ - Step 40537: {'lr': 0.0001993539118772914, 'samples': 1297184, 'steps': 2533, 'loss/train': 1.5525273084640503} -09/20/2021 23:16:05 - INFO - __main__ - Step 40538: {'lr': 0.0001993539118772914, 'samples': 1297216, 'steps': 2533, 'loss/train': 1.459828495979309} -09/20/2021 23:16:06 - INFO - __main__ - Step 40539: {'lr': 0.0001993539118772914, 'samples': 1297248, 'steps': 2533, 'loss/train': 1.326108455657959} -09/20/2021 23:16:06 - INFO - __main__ - Step 40540: {'lr': 0.0001993539118772914, 'samples': 1297280, 'steps': 2533, 'loss/train': 1.7282334566116333} -09/20/2021 23:16:07 - INFO - __main__ - Step 40541: {'lr': 0.0001993539118772914, 'samples': 1297312, 'steps': 2533, 'loss/train': 1.1532773971557617} -09/20/2021 23:16:08 - INFO - __main__ - Step 40542: {'lr': 0.0001993539118772914, 'samples': 1297344, 'steps': 2533, 'loss/train': 1.754646897315979} -09/20/2021 23:16:09 - INFO - __main__ - Step 40543: {'lr': 0.0001993539118772914, 'samples': 1297376, 'steps': 2533, 'loss/train': 2.610884428024292} -09/20/2021 23:16:09 - INFO - __main__ - Step 40544: {'lr': 0.0001993539118772914, 'samples': 1297408, 'steps': 2533, 'loss/train': 2.6771488189697266} -09/20/2021 23:16:10 - INFO - __main__ - Step 40545: {'lr': 0.00019935318773628318, 'samples': 1297440, 'steps': 2534, 'loss/train': 2.701246738433838} -09/20/2021 23:16:11 - INFO - __main__ - Step 40546: {'lr': 0.00019935318773628318, 'samples': 1297472, 'steps': 2534, 'loss/train': 2.890490770339966} -09/20/2021 23:16:12 - INFO - __main__ - Step 40547: {'lr': 0.00019935318773628318, 'samples': 1297504, 'steps': 2534, 'loss/train': 2.8612470626831055} -09/20/2021 23:16:12 - INFO - __main__ - Step 40548: {'lr': 0.00019935318773628318, 'samples': 1297536, 'steps': 2534, 'loss/train': 2.3949668407440186} -09/20/2021 23:16:13 - INFO - __main__ - Step 40549: {'lr': 0.00019935318773628318, 'samples': 1297568, 'steps': 2534, 'loss/train': 2.3506252765655518} -09/20/2021 23:16:14 - INFO - __main__ - Step 40550: {'lr': 0.00019935318773628318, 'samples': 1297600, 'steps': 2534, 'loss/train': 1.9422625303268433} -09/20/2021 23:16:15 - INFO - __main__ - Step 40551: {'lr': 0.00019935318773628318, 'samples': 1297632, 'steps': 2534, 'loss/train': 2.1793668270111084} -09/20/2021 23:16:15 - INFO - __main__ - Step 40552: {'lr': 0.00019935318773628318, 'samples': 1297664, 'steps': 2534, 'loss/train': 2.169558048248291} -09/20/2021 23:16:16 - INFO - __main__ - Step 40553: {'lr': 0.00019935318773628318, 'samples': 1297696, 'steps': 2534, 'loss/train': 2.1406915187835693} -09/20/2021 23:16:17 - INFO - __main__ - Step 40554: {'lr': 0.00019935318773628318, 'samples': 1297728, 'steps': 2534, 'loss/train': 0.9213430881500244} -09/20/2021 23:16:18 - INFO - __main__ - Step 40555: {'lr': 0.00019935318773628318, 'samples': 1297760, 'steps': 2534, 'loss/train': 2.267043113708496} -09/20/2021 23:16:18 - INFO - __main__ - Step 40556: {'lr': 0.00019935318773628318, 'samples': 1297792, 'steps': 2534, 'loss/train': 2.5472092628479004} -09/20/2021 23:16:19 - INFO - __main__ - Step 40557: {'lr': 0.00019935318773628318, 'samples': 1297824, 'steps': 2534, 'loss/train': 2.397768020629883} -09/20/2021 23:16:20 - INFO - __main__ - Step 40558: {'lr': 0.00019935318773628318, 'samples': 1297856, 'steps': 2534, 'loss/train': 2.913367986679077} -09/20/2021 23:16:21 - INFO - __main__ - Step 40559: {'lr': 0.00019935318773628318, 'samples': 1297888, 'steps': 2534, 'loss/train': 1.9814534187316895} -09/20/2021 23:16:21 - INFO - __main__ - Step 40560: {'lr': 0.00019935318773628318, 'samples': 1297920, 'steps': 2534, 'loss/train': 2.1551105976104736} -09/20/2021 23:16:22 - INFO - __main__ - Step 40561: {'lr': 0.00019935246319100717, 'samples': 1297952, 'steps': 2535, 'loss/train': 2.122223377227783} -09/20/2021 23:16:23 - INFO - __main__ - Step 40562: {'lr': 0.00019935246319100717, 'samples': 1297984, 'steps': 2535, 'loss/train': 2.5219035148620605} -09/20/2021 23:16:25 - INFO - __main__ - Step 40563: {'lr': 0.00019935246319100717, 'samples': 1298016, 'steps': 2535, 'loss/train': 2.935807466506958} -09/20/2021 23:16:25 - INFO - __main__ - Step 40564: {'lr': 0.00019935246319100717, 'samples': 1298048, 'steps': 2535, 'loss/train': 1.9622756242752075} -09/20/2021 23:16:26 - INFO - __main__ - Step 40565: {'lr': 0.00019935246319100717, 'samples': 1298080, 'steps': 2535, 'loss/train': 2.684980630874634} -09/20/2021 23:16:27 - INFO - __main__ - Step 40566: {'lr': 0.00019935246319100717, 'samples': 1298112, 'steps': 2535, 'loss/train': 2.115208148956299} -09/20/2021 23:16:28 - INFO - __main__ - Step 40567: {'lr': 0.00019935246319100717, 'samples': 1298144, 'steps': 2535, 'loss/train': 2.263758420944214} -09/20/2021 23:16:28 - INFO - __main__ - Step 40568: {'lr': 0.00019935246319100717, 'samples': 1298176, 'steps': 2535, 'loss/train': 1.3258222341537476} -09/20/2021 23:16:29 - INFO - __main__ - Step 40569: {'lr': 0.00019935246319100717, 'samples': 1298208, 'steps': 2535, 'loss/train': 0.8555242419242859} -09/20/2021 23:16:30 - INFO - __main__ - Step 40570: {'lr': 0.00019935246319100717, 'samples': 1298240, 'steps': 2535, 'loss/train': 2.451361656188965} -09/20/2021 23:16:31 - INFO - __main__ - Step 40571: {'lr': 0.00019935246319100717, 'samples': 1298272, 'steps': 2535, 'loss/train': 1.4074313640594482} -09/20/2021 23:16:31 - INFO - __main__ - Step 40572: {'lr': 0.00019935246319100717, 'samples': 1298304, 'steps': 2535, 'loss/train': 2.0811314582824707} -09/20/2021 23:16:32 - INFO - __main__ - Step 40573: {'lr': 0.00019935246319100717, 'samples': 1298336, 'steps': 2535, 'loss/train': 0.34509432315826416} -09/20/2021 23:16:33 - INFO - __main__ - Step 40574: {'lr': 0.00019935246319100717, 'samples': 1298368, 'steps': 2535, 'loss/train': 1.8423861265182495} -09/20/2021 23:16:34 - INFO - __main__ - Step 40575: {'lr': 0.00019935246319100717, 'samples': 1298400, 'steps': 2535, 'loss/train': 1.6745110750198364} -09/20/2021 23:16:34 - INFO - __main__ - Step 40576: {'lr': 0.00019935246319100717, 'samples': 1298432, 'steps': 2535, 'loss/train': 0.9133881330490112} -09/20/2021 23:16:35 - INFO - __main__ - Step 40577: {'lr': 0.00019935173824146642, 'samples': 1298464, 'steps': 2536, 'loss/train': 2.7834770679473877} -09/20/2021 23:16:36 - INFO - __main__ - Step 40578: {'lr': 0.00019935173824146642, 'samples': 1298496, 'steps': 2536, 'loss/train': 1.7935022115707397} -09/20/2021 23:16:37 - INFO - __main__ - Step 40579: {'lr': 0.00019935173824146642, 'samples': 1298528, 'steps': 2536, 'loss/train': 1.9156899452209473} -09/20/2021 23:16:38 - INFO - __main__ - Step 40580: {'lr': 0.00019935173824146642, 'samples': 1298560, 'steps': 2536, 'loss/train': 2.7363662719726562} -09/20/2021 23:16:38 - INFO - __main__ - Step 40581: {'lr': 0.00019935173824146642, 'samples': 1298592, 'steps': 2536, 'loss/train': 2.5819523334503174} -09/20/2021 23:16:39 - INFO - __main__ - Step 40582: {'lr': 0.00019935173824146642, 'samples': 1298624, 'steps': 2536, 'loss/train': 1.289533019065857} -09/20/2021 23:16:40 - INFO - __main__ - Step 40583: {'lr': 0.00019935173824146642, 'samples': 1298656, 'steps': 2536, 'loss/train': 1.3464423418045044} -09/20/2021 23:16:41 - INFO - __main__ - Step 40584: {'lr': 0.00019935173824146642, 'samples': 1298688, 'steps': 2536, 'loss/train': 1.843331217765808} -09/20/2021 23:16:41 - INFO - __main__ - Step 40585: {'lr': 0.00019935173824146642, 'samples': 1298720, 'steps': 2536, 'loss/train': 2.2843968868255615} -09/20/2021 23:16:42 - INFO - __main__ - Step 40586: {'lr': 0.00019935173824146642, 'samples': 1298752, 'steps': 2536, 'loss/train': 2.085759162902832} -09/20/2021 23:16:43 - INFO - __main__ - Step 40587: {'lr': 0.00019935173824146642, 'samples': 1298784, 'steps': 2536, 'loss/train': 2.4684929847717285} -09/20/2021 23:16:44 - INFO - __main__ - Step 40588: {'lr': 0.00019935173824146642, 'samples': 1298816, 'steps': 2536, 'loss/train': 1.671120285987854} -09/20/2021 23:16:44 - INFO - __main__ - Step 40589: {'lr': 0.00019935173824146642, 'samples': 1298848, 'steps': 2536, 'loss/train': 2.093130588531494} -09/20/2021 23:16:45 - INFO - __main__ - Step 40590: {'lr': 0.00019935173824146642, 'samples': 1298880, 'steps': 2536, 'loss/train': 1.5068678855895996} -09/20/2021 23:16:46 - INFO - __main__ - Step 40591: {'lr': 0.00019935173824146642, 'samples': 1298912, 'steps': 2536, 'loss/train': 1.8445724248886108} -09/20/2021 23:16:47 - INFO - __main__ - Step 40592: {'lr': 0.00019935173824146642, 'samples': 1298944, 'steps': 2536, 'loss/train': 0.25845709443092346} -09/20/2021 23:16:47 - INFO - __main__ - Step 40593: {'lr': 0.00019935101288766385, 'samples': 1298976, 'steps': 2537, 'loss/train': 0.2285493016242981} -09/20/2021 23:16:48 - INFO - __main__ - Step 40594: {'lr': 0.00019935101288766385, 'samples': 1299008, 'steps': 2537, 'loss/train': 0.24069379270076752} -09/20/2021 23:16:49 - INFO - __main__ - Step 40595: {'lr': 0.00019935101288766385, 'samples': 1299040, 'steps': 2537, 'loss/train': 0.1939995288848877} -09/20/2021 23:16:51 - INFO - __main__ - Step 40596: {'lr': 0.00019935101288766385, 'samples': 1299072, 'steps': 2537, 'loss/train': 0.11562388390302658} -09/20/2021 23:16:51 - INFO - __main__ - Step 40597: {'lr': 0.00019935101288766385, 'samples': 1299104, 'steps': 2537, 'loss/train': 1.8283393383026123} -09/20/2021 23:16:52 - INFO - __main__ - Step 40598: {'lr': 0.00019935101288766385, 'samples': 1299136, 'steps': 2537, 'loss/train': 2.7504806518554688} -09/20/2021 23:16:53 - INFO - __main__ - Step 40599: {'lr': 0.00019935101288766385, 'samples': 1299168, 'steps': 2537, 'loss/train': 0.6748654842376709} -09/20/2021 23:16:54 - INFO - __main__ - Step 40600: {'lr': 0.00019935101288766385, 'samples': 1299200, 'steps': 2537, 'loss/train': 0.5871359705924988} -09/20/2021 23:16:54 - INFO - __main__ - Step 40601: {'lr': 0.00019935101288766385, 'samples': 1299232, 'steps': 2537, 'loss/train': 0.49331775307655334} -09/20/2021 23:16:55 - INFO - __main__ - Step 40602: {'lr': 0.00019935101288766385, 'samples': 1299264, 'steps': 2537, 'loss/train': 0.6478534936904907} -09/20/2021 23:16:56 - INFO - __main__ - Step 40603: {'lr': 0.00019935101288766385, 'samples': 1299296, 'steps': 2537, 'loss/train': 0.5326962471008301} -09/20/2021 23:16:57 - INFO - __main__ - Step 40604: {'lr': 0.00019935101288766385, 'samples': 1299328, 'steps': 2537, 'loss/train': 0.5668935775756836} -09/20/2021 23:16:57 - INFO - __main__ - Step 40605: {'lr': 0.00019935101288766385, 'samples': 1299360, 'steps': 2537, 'loss/train': 0.4977762997150421} -09/20/2021 23:16:58 - INFO - __main__ - Step 40606: {'lr': 0.00019935101288766385, 'samples': 1299392, 'steps': 2537, 'loss/train': 0.7780494689941406} -09/20/2021 23:16:59 - INFO - __main__ - Step 40607: {'lr': 0.00019935101288766385, 'samples': 1299424, 'steps': 2537, 'loss/train': 0.5850085020065308} -09/20/2021 23:17:00 - INFO - __main__ - Step 40608: {'lr': 0.00019935101288766385, 'samples': 1299456, 'steps': 2537, 'loss/train': 2.205289602279663} -09/20/2021 23:17:01 - INFO - __main__ - Step 40609: {'lr': 0.00019935028712960237, 'samples': 1299488, 'steps': 2538, 'loss/train': 0.4906250536441803} -09/20/2021 23:17:01 - INFO - __main__ - Step 40610: {'lr': 0.00019935028712960237, 'samples': 1299520, 'steps': 2538, 'loss/train': 2.144914150238037} -09/20/2021 23:17:02 - INFO - __main__ - Step 40611: {'lr': 0.00019935028712960237, 'samples': 1299552, 'steps': 2538, 'loss/train': 2.197445869445801} -09/20/2021 23:17:03 - INFO - __main__ - Step 40612: {'lr': 0.00019935028712960237, 'samples': 1299584, 'steps': 2538, 'loss/train': 1.8053678274154663} -09/20/2021 23:17:04 - INFO - __main__ - Step 40613: {'lr': 0.00019935028712960237, 'samples': 1299616, 'steps': 2538, 'loss/train': 0.6458016633987427} -09/20/2021 23:17:04 - INFO - __main__ - Step 40614: {'lr': 0.00019935028712960237, 'samples': 1299648, 'steps': 2538, 'loss/train': 5.425466537475586} -09/20/2021 23:17:05 - INFO - __main__ - Step 40615: {'lr': 0.00019935028712960237, 'samples': 1299680, 'steps': 2538, 'loss/train': 2.1590802669525146} -09/20/2021 23:17:06 - INFO - __main__ - Step 40616: {'lr': 0.00019935028712960237, 'samples': 1299712, 'steps': 2538, 'loss/train': 2.227604627609253} -09/20/2021 23:17:07 - INFO - __main__ - Step 40617: {'lr': 0.00019935028712960237, 'samples': 1299744, 'steps': 2538, 'loss/train': 2.6630144119262695} -09/20/2021 23:17:07 - INFO - __main__ - Step 40618: {'lr': 0.00019935028712960237, 'samples': 1299776, 'steps': 2538, 'loss/train': 2.645970344543457} -09/20/2021 23:17:08 - INFO - __main__ - Step 40619: {'lr': 0.00019935028712960237, 'samples': 1299808, 'steps': 2538, 'loss/train': 2.1134161949157715} -09/20/2021 23:17:09 - INFO - __main__ - Step 40620: {'lr': 0.00019935028712960237, 'samples': 1299840, 'steps': 2538, 'loss/train': 2.903933525085449} -09/20/2021 23:17:10 - INFO - __main__ - Step 40621: {'lr': 0.00019935028712960237, 'samples': 1299872, 'steps': 2538, 'loss/train': 2.2192306518554688} -09/20/2021 23:17:10 - INFO - __main__ - Step 40622: {'lr': 0.00019935028712960237, 'samples': 1299904, 'steps': 2538, 'loss/train': 1.1711490154266357} -09/20/2021 23:17:11 - INFO - __main__ - Step 40623: {'lr': 0.00019935028712960237, 'samples': 1299936, 'steps': 2538, 'loss/train': 1.7192891836166382} -09/20/2021 23:17:12 - INFO - __main__ - Step 40624: {'lr': 0.00019935028712960237, 'samples': 1299968, 'steps': 2538, 'loss/train': 2.0869193077087402} -09/20/2021 23:17:13 - INFO - __main__ - Step 40625: {'lr': 0.00019934956096728494, 'samples': 1300000, 'steps': 2539, 'loss/train': 2.1736364364624023} -09/20/2021 23:17:13 - INFO - __main__ - Step 40626: {'lr': 0.00019934956096728494, 'samples': 1300032, 'steps': 2539, 'loss/train': 1.7273310422897339} -09/20/2021 23:17:14 - INFO - __main__ - Step 40627: {'lr': 0.00019934956096728494, 'samples': 1300064, 'steps': 2539, 'loss/train': 2.0509190559387207} -09/20/2021 23:17:15 - INFO - __main__ - Step 40628: {'lr': 0.00019934956096728494, 'samples': 1300096, 'steps': 2539, 'loss/train': 1.6711212396621704} -09/20/2021 23:17:16 - INFO - __main__ - Step 40629: {'lr': 0.00019934956096728494, 'samples': 1300128, 'steps': 2539, 'loss/train': 1.9487314224243164} -09/20/2021 23:17:16 - INFO - __main__ - Step 40630: {'lr': 0.00019934956096728494, 'samples': 1300160, 'steps': 2539, 'loss/train': 1.9773226976394653} -09/20/2021 23:17:18 - INFO - __main__ - Step 40631: {'lr': 0.00019934956096728494, 'samples': 1300192, 'steps': 2539, 'loss/train': 3.6999166011810303} -09/20/2021 23:17:19 - INFO - __main__ - Step 40632: {'lr': 0.00019934956096728494, 'samples': 1300224, 'steps': 2539, 'loss/train': 2.5355584621429443} -09/20/2021 23:17:19 - INFO - __main__ - Step 40633: {'lr': 0.00019934956096728494, 'samples': 1300256, 'steps': 2539, 'loss/train': 2.5341238975524902} -09/20/2021 23:17:20 - INFO - __main__ - Step 40634: {'lr': 0.00019934956096728494, 'samples': 1300288, 'steps': 2539, 'loss/train': 2.807859182357788} -09/20/2021 23:17:21 - INFO - __main__ - Step 40635: {'lr': 0.00019934956096728494, 'samples': 1300320, 'steps': 2539, 'loss/train': 1.8388274908065796} -09/20/2021 23:17:22 - INFO - __main__ - Step 40636: {'lr': 0.00019934956096728494, 'samples': 1300352, 'steps': 2539, 'loss/train': 0.24691209197044373} -09/20/2021 23:17:22 - INFO - __main__ - Step 40637: {'lr': 0.00019934956096728494, 'samples': 1300384, 'steps': 2539, 'loss/train': 1.9551247358322144} -09/20/2021 23:17:23 - INFO - __main__ - Step 40638: {'lr': 0.00019934956096728494, 'samples': 1300416, 'steps': 2539, 'loss/train': 2.2293035984039307} -09/20/2021 23:17:24 - INFO - __main__ - Step 40639: {'lr': 0.00019934956096728494, 'samples': 1300448, 'steps': 2539, 'loss/train': 2.8410489559173584} -09/20/2021 23:17:25 - INFO - __main__ - Step 40640: {'lr': 0.00019934956096728494, 'samples': 1300480, 'steps': 2539, 'loss/train': 1.8433865308761597} -09/20/2021 23:17:26 - INFO - __main__ - Step 40641: {'lr': 0.00019934883440071458, 'samples': 1300512, 'steps': 2540, 'loss/train': 1.3116298913955688} -09/20/2021 23:17:26 - INFO - __main__ - Step 40642: {'lr': 0.00019934883440071458, 'samples': 1300544, 'steps': 2540, 'loss/train': 1.941368818283081} -09/20/2021 23:17:27 - INFO - __main__ - Step 40643: {'lr': 0.00019934883440071458, 'samples': 1300576, 'steps': 2540, 'loss/train': 2.3715713024139404} -09/20/2021 23:17:28 - INFO - __main__ - Step 40644: {'lr': 0.00019934883440071458, 'samples': 1300608, 'steps': 2540, 'loss/train': 1.2318100929260254} -09/20/2021 23:17:29 - INFO - __main__ - Step 40645: {'lr': 0.00019934883440071458, 'samples': 1300640, 'steps': 2540, 'loss/train': 2.0234274864196777} -09/20/2021 23:17:29 - INFO - __main__ - Step 40646: {'lr': 0.00019934883440071458, 'samples': 1300672, 'steps': 2540, 'loss/train': 0.6786229610443115} -09/20/2021 23:17:30 - INFO - __main__ - Step 40647: {'lr': 0.00019934883440071458, 'samples': 1300704, 'steps': 2540, 'loss/train': 1.9596432447433472} -09/20/2021 23:17:31 - INFO - __main__ - Step 40648: {'lr': 0.00019934883440071458, 'samples': 1300736, 'steps': 2540, 'loss/train': 2.986694097518921} -09/20/2021 23:17:32 - INFO - __main__ - Step 40649: {'lr': 0.00019934883440071458, 'samples': 1300768, 'steps': 2540, 'loss/train': 2.4738752841949463} -09/20/2021 23:17:32 - INFO - __main__ - Step 40650: {'lr': 0.00019934883440071458, 'samples': 1300800, 'steps': 2540, 'loss/train': 2.4257428646087646} -09/20/2021 23:17:33 - INFO - __main__ - Step 40651: {'lr': 0.00019934883440071458, 'samples': 1300832, 'steps': 2540, 'loss/train': 0.7167021632194519} -09/20/2021 23:17:34 - INFO - __main__ - Step 40652: {'lr': 0.00019934883440071458, 'samples': 1300864, 'steps': 2540, 'loss/train': 0.1647786796092987} -09/20/2021 23:17:35 - INFO - __main__ - Step 40653: {'lr': 0.00019934883440071458, 'samples': 1300896, 'steps': 2540, 'loss/train': 0.375916987657547} -09/20/2021 23:17:35 - INFO - __main__ - Step 40654: {'lr': 0.00019934883440071458, 'samples': 1300928, 'steps': 2540, 'loss/train': 0.2518253028392792} -09/20/2021 23:17:36 - INFO - __main__ - Step 40655: {'lr': 0.00019934883440071458, 'samples': 1300960, 'steps': 2540, 'loss/train': 0.2339404970407486} -09/20/2021 23:17:37 - INFO - __main__ - Step 40656: {'lr': 0.00019934883440071458, 'samples': 1300992, 'steps': 2540, 'loss/train': 0.08470941334962845} -09/20/2021 23:17:38 - INFO - __main__ - Step 40657: {'lr': 0.00019934810742989415, 'samples': 1301024, 'steps': 2541, 'loss/train': 0.8177058696746826} -09/20/2021 23:17:38 - INFO - __main__ - Step 40658: {'lr': 0.00019934810742989415, 'samples': 1301056, 'steps': 2541, 'loss/train': 2.959095001220703} -09/20/2021 23:17:39 - INFO - __main__ - Step 40659: {'lr': 0.00019934810742989415, 'samples': 1301088, 'steps': 2541, 'loss/train': 1.590476393699646} -09/20/2021 23:17:40 - INFO - __main__ - Step 40660: {'lr': 0.00019934810742989415, 'samples': 1301120, 'steps': 2541, 'loss/train': 1.785179853439331} -09/20/2021 23:17:41 - INFO - __main__ - Step 40661: {'lr': 0.00019934810742989415, 'samples': 1301152, 'steps': 2541, 'loss/train': 1.8727885484695435} -09/20/2021 23:17:42 - INFO - __main__ - Step 40662: {'lr': 0.00019934810742989415, 'samples': 1301184, 'steps': 2541, 'loss/train': 2.3575217723846436} -09/20/2021 23:17:43 - INFO - __main__ - Step 40663: {'lr': 0.00019934810742989415, 'samples': 1301216, 'steps': 2541, 'loss/train': 2.03661847114563} -09/20/2021 23:17:44 - INFO - __main__ - Step 40664: {'lr': 0.00019934810742989415, 'samples': 1301248, 'steps': 2541, 'loss/train': 1.3882713317871094} -09/20/2021 23:17:44 - INFO - __main__ - Step 40665: {'lr': 0.00019934810742989415, 'samples': 1301280, 'steps': 2541, 'loss/train': 2.230818748474121} -09/20/2021 23:17:45 - INFO - __main__ - Step 40666: {'lr': 0.00019934810742989415, 'samples': 1301312, 'steps': 2541, 'loss/train': 2.292152166366577} -09/20/2021 23:17:46 - INFO - __main__ - Step 40667: {'lr': 0.00019934810742989415, 'samples': 1301344, 'steps': 2541, 'loss/train': 1.4633333683013916} -09/20/2021 23:17:47 - INFO - __main__ - Step 40668: {'lr': 0.00019934810742989415, 'samples': 1301376, 'steps': 2541, 'loss/train': 2.201012372970581} -09/20/2021 23:17:47 - INFO - __main__ - Step 40669: {'lr': 0.00019934810742989415, 'samples': 1301408, 'steps': 2541, 'loss/train': 1.8474528789520264} -09/20/2021 23:17:48 - INFO - __main__ - Step 40670: {'lr': 0.00019934810742989415, 'samples': 1301440, 'steps': 2541, 'loss/train': 2.2168712615966797} -09/20/2021 23:17:49 - INFO - __main__ - Step 40671: {'lr': 0.00019934810742989415, 'samples': 1301472, 'steps': 2541, 'loss/train': 1.8982467651367188} -09/20/2021 23:17:50 - INFO - __main__ - Step 40672: {'lr': 0.00019934810742989415, 'samples': 1301504, 'steps': 2541, 'loss/train': 1.7977927923202515} -09/20/2021 23:17:50 - INFO - __main__ - Step 40673: {'lr': 0.00019934738005482667, 'samples': 1301536, 'steps': 2542, 'loss/train': 1.2705185413360596} -09/20/2021 23:17:51 - INFO - __main__ - Step 40674: {'lr': 0.00019934738005482667, 'samples': 1301568, 'steps': 2542, 'loss/train': 1.9727836847305298} -09/20/2021 23:17:52 - INFO - __main__ - Step 40675: {'lr': 0.00019934738005482667, 'samples': 1301600, 'steps': 2542, 'loss/train': 2.543210506439209} -09/20/2021 23:17:53 - INFO - __main__ - Step 40676: {'lr': 0.00019934738005482667, 'samples': 1301632, 'steps': 2542, 'loss/train': 2.38732647895813} -09/20/2021 23:17:53 - INFO - __main__ - Step 40677: {'lr': 0.00019934738005482667, 'samples': 1301664, 'steps': 2542, 'loss/train': 2.767002582550049} -09/20/2021 23:17:54 - INFO - __main__ - Step 40678: {'lr': 0.00019934738005482667, 'samples': 1301696, 'steps': 2542, 'loss/train': 2.4378483295440674} -09/20/2021 23:17:55 - INFO - __main__ - Step 40679: {'lr': 0.00019934738005482667, 'samples': 1301728, 'steps': 2542, 'loss/train': 2.2272074222564697} -09/20/2021 23:17:56 - INFO - __main__ - Step 40680: {'lr': 0.00019934738005482667, 'samples': 1301760, 'steps': 2542, 'loss/train': 2.7741341590881348} -09/20/2021 23:17:56 - INFO - __main__ - Step 40681: {'lr': 0.00019934738005482667, 'samples': 1301792, 'steps': 2542, 'loss/train': 2.5274417400360107} -09/20/2021 23:17:57 - INFO - __main__ - Step 40682: {'lr': 0.00019934738005482667, 'samples': 1301824, 'steps': 2542, 'loss/train': 2.516268491744995} -09/20/2021 23:17:58 - INFO - __main__ - Step 40683: {'lr': 0.00019934738005482667, 'samples': 1301856, 'steps': 2542, 'loss/train': 0.7572319507598877} -09/20/2021 23:17:59 - INFO - __main__ - Step 40684: {'lr': 0.00019934738005482667, 'samples': 1301888, 'steps': 2542, 'loss/train': 2.150409460067749} -09/20/2021 23:17:59 - INFO - __main__ - Step 40685: {'lr': 0.00019934738005482667, 'samples': 1301920, 'steps': 2542, 'loss/train': 3.1709065437316895} -09/20/2021 23:18:00 - INFO - __main__ - Step 40686: {'lr': 0.00019934738005482667, 'samples': 1301952, 'steps': 2542, 'loss/train': 0.8652782440185547} -09/20/2021 23:18:01 - INFO - __main__ - Step 40687: {'lr': 0.00019934738005482667, 'samples': 1301984, 'steps': 2542, 'loss/train': 3.1390249729156494} -09/20/2021 23:18:02 - INFO - __main__ - Step 40688: {'lr': 0.00019934738005482667, 'samples': 1302016, 'steps': 2542, 'loss/train': 1.9865469932556152} -09/20/2021 23:18:03 - INFO - __main__ - Step 40689: {'lr': 0.0001993466522755151, 'samples': 1302048, 'steps': 2543, 'loss/train': 1.9840586185455322} -09/20/2021 23:18:03 - INFO - __main__ - Step 40690: {'lr': 0.0001993466522755151, 'samples': 1302080, 'steps': 2543, 'loss/train': 1.6570947170257568} -09/20/2021 23:18:04 - INFO - __main__ - Step 40691: {'lr': 0.0001993466522755151, 'samples': 1302112, 'steps': 2543, 'loss/train': 2.6347239017486572} -09/20/2021 23:18:05 - INFO - __main__ - Step 40692: {'lr': 0.0001993466522755151, 'samples': 1302144, 'steps': 2543, 'loss/train': 1.6181670427322388} -09/20/2021 23:18:06 - INFO - __main__ - Step 40693: {'lr': 0.0001993466522755151, 'samples': 1302176, 'steps': 2543, 'loss/train': 1.80036461353302} -09/20/2021 23:18:07 - INFO - __main__ - Step 40694: {'lr': 0.0001993466522755151, 'samples': 1302208, 'steps': 2543, 'loss/train': 1.916755199432373} -09/20/2021 23:18:08 - INFO - __main__ - Step 40695: {'lr': 0.0001993466522755151, 'samples': 1302240, 'steps': 2543, 'loss/train': 2.1156833171844482} -09/20/2021 23:18:08 - INFO - __main__ - Step 40696: {'lr': 0.0001993466522755151, 'samples': 1302272, 'steps': 2543, 'loss/train': 2.499427318572998} -09/20/2021 23:18:09 - INFO - __main__ - Step 40697: {'lr': 0.0001993466522755151, 'samples': 1302304, 'steps': 2543, 'loss/train': 2.8027708530426025} -09/20/2021 23:18:10 - INFO - __main__ - Step 40698: {'lr': 0.0001993466522755151, 'samples': 1302336, 'steps': 2543, 'loss/train': 1.5516372919082642} -09/20/2021 23:18:11 - INFO - __main__ - Step 40699: {'lr': 0.0001993466522755151, 'samples': 1302368, 'steps': 2543, 'loss/train': 0.9799961447715759} -09/20/2021 23:18:11 - INFO - __main__ - Step 40700: {'lr': 0.0001993466522755151, 'samples': 1302400, 'steps': 2543, 'loss/train': 1.8390475511550903} -09/20/2021 23:18:12 - INFO - __main__ - Step 40701: {'lr': 0.0001993466522755151, 'samples': 1302432, 'steps': 2543, 'loss/train': 2.254375696182251} -09/20/2021 23:18:13 - INFO - __main__ - Step 40702: {'lr': 0.0001993466522755151, 'samples': 1302464, 'steps': 2543, 'loss/train': 2.0576987266540527} -09/20/2021 23:18:14 - INFO - __main__ - Step 40703: {'lr': 0.0001993466522755151, 'samples': 1302496, 'steps': 2543, 'loss/train': 1.6988427639007568} -09/20/2021 23:18:14 - INFO - __main__ - Step 40704: {'lr': 0.0001993466522755151, 'samples': 1302528, 'steps': 2543, 'loss/train': 1.993974208831787} -09/20/2021 23:18:15 - INFO - __main__ - Step 40705: {'lr': 0.0001993459240919624, 'samples': 1302560, 'steps': 2544, 'loss/train': 1.5961617231369019} -09/20/2021 23:18:16 - INFO - __main__ - Step 40706: {'lr': 0.0001993459240919624, 'samples': 1302592, 'steps': 2544, 'loss/train': 1.818968653678894} -09/20/2021 23:18:17 - INFO - __main__ - Step 40707: {'lr': 0.0001993459240919624, 'samples': 1302624, 'steps': 2544, 'loss/train': 1.8627668619155884} -09/20/2021 23:18:18 - INFO - __main__ - Step 40708: {'lr': 0.0001993459240919624, 'samples': 1302656, 'steps': 2544, 'loss/train': 2.4103879928588867} -09/20/2021 23:18:18 - INFO - __main__ - Step 40709: {'lr': 0.0001993459240919624, 'samples': 1302688, 'steps': 2544, 'loss/train': 1.2262758016586304} -09/20/2021 23:18:19 - INFO - __main__ - Step 40710: {'lr': 0.0001993459240919624, 'samples': 1302720, 'steps': 2544, 'loss/train': 2.2403876781463623} -09/20/2021 23:18:20 - INFO - __main__ - Step 40711: {'lr': 0.0001993459240919624, 'samples': 1302752, 'steps': 2544, 'loss/train': 0.5570703744888306} -09/20/2021 23:18:21 - INFO - __main__ - Step 40712: {'lr': 0.0001993459240919624, 'samples': 1302784, 'steps': 2544, 'loss/train': 0.08310168981552124} -09/20/2021 23:18:21 - INFO - __main__ - Step 40713: {'lr': 0.0001993459240919624, 'samples': 1302816, 'steps': 2544, 'loss/train': 2.3776028156280518} -09/20/2021 23:18:22 - INFO - __main__ - Step 40714: {'lr': 0.0001993459240919624, 'samples': 1302848, 'steps': 2544, 'loss/train': 1.1681492328643799} -09/20/2021 23:18:23 - INFO - __main__ - Step 40715: {'lr': 0.0001993459240919624, 'samples': 1302880, 'steps': 2544, 'loss/train': 1.2772457599639893} -09/20/2021 23:18:24 - INFO - __main__ - Step 40716: {'lr': 0.0001993459240919624, 'samples': 1302912, 'steps': 2544, 'loss/train': 2.239363193511963} -09/20/2021 23:18:24 - INFO - __main__ - Step 40717: {'lr': 0.0001993459240919624, 'samples': 1302944, 'steps': 2544, 'loss/train': 1.0403691530227661} -09/20/2021 23:18:25 - INFO - __main__ - Step 40718: {'lr': 0.0001993459240919624, 'samples': 1302976, 'steps': 2544, 'loss/train': 2.022329568862915} -09/20/2021 23:18:26 - INFO - __main__ - Step 40719: {'lr': 0.0001993459240919624, 'samples': 1303008, 'steps': 2544, 'loss/train': 0.764182984828949} -09/20/2021 23:18:27 - INFO - __main__ - Step 40720: {'lr': 0.0001993459240919624, 'samples': 1303040, 'steps': 2544, 'loss/train': 2.2102458477020264} -09/20/2021 23:18:27 - INFO - __main__ - Step 40721: {'lr': 0.0001993451955041715, 'samples': 1303072, 'steps': 2545, 'loss/train': 2.2238588333129883} -09/20/2021 23:18:28 - INFO - __main__ - Step 40722: {'lr': 0.0001993451955041715, 'samples': 1303104, 'steps': 2545, 'loss/train': 2.661487579345703} -09/20/2021 23:18:29 - INFO - __main__ - Step 40723: {'lr': 0.0001993451955041715, 'samples': 1303136, 'steps': 2545, 'loss/train': 3.0726089477539062} -09/20/2021 23:18:30 - INFO - __main__ - Step 40724: {'lr': 0.0001993451955041715, 'samples': 1303168, 'steps': 2545, 'loss/train': 3.331930637359619} -09/20/2021 23:18:31 - INFO - __main__ - Step 40725: {'lr': 0.0001993451955041715, 'samples': 1303200, 'steps': 2545, 'loss/train': 2.1669886112213135} -09/20/2021 23:18:32 - INFO - __main__ - Step 40726: {'lr': 0.0001993451955041715, 'samples': 1303232, 'steps': 2545, 'loss/train': 2.1661014556884766} -09/20/2021 23:18:33 - INFO - __main__ - Step 40727: {'lr': 0.0001993451955041715, 'samples': 1303264, 'steps': 2545, 'loss/train': 1.7044998407363892} -09/20/2021 23:18:33 - INFO - __main__ - Step 40728: {'lr': 0.0001993451955041715, 'samples': 1303296, 'steps': 2545, 'loss/train': 1.2699322700500488} -09/20/2021 23:18:34 - INFO - __main__ - Step 40729: {'lr': 0.0001993451955041715, 'samples': 1303328, 'steps': 2545, 'loss/train': 2.1349141597747803} -09/20/2021 23:18:35 - INFO - __main__ - Step 40730: {'lr': 0.0001993451955041715, 'samples': 1303360, 'steps': 2545, 'loss/train': 2.2914366722106934} -09/20/2021 23:18:36 - INFO - __main__ - Step 40731: {'lr': 0.0001993451955041715, 'samples': 1303392, 'steps': 2545, 'loss/train': 1.666995882987976} -09/20/2021 23:18:36 - INFO - __main__ - Step 40732: {'lr': 0.0001993451955041715, 'samples': 1303424, 'steps': 2545, 'loss/train': 1.5262631177902222} -09/20/2021 23:18:37 - INFO - __main__ - Step 40733: {'lr': 0.0001993451955041715, 'samples': 1303456, 'steps': 2545, 'loss/train': 1.7189658880233765} -09/20/2021 23:18:38 - INFO - __main__ - Step 40734: {'lr': 0.0001993451955041715, 'samples': 1303488, 'steps': 2545, 'loss/train': 2.5181632041931152} -09/20/2021 23:18:39 - INFO - __main__ - Step 40735: {'lr': 0.0001993451955041715, 'samples': 1303520, 'steps': 2545, 'loss/train': 1.4679089784622192} -09/20/2021 23:18:39 - INFO - __main__ - Step 40736: {'lr': 0.0001993451955041715, 'samples': 1303552, 'steps': 2545, 'loss/train': 1.5488197803497314} -09/20/2021 23:18:40 - INFO - __main__ - Step 40737: {'lr': 0.00019934446651214538, 'samples': 1303584, 'steps': 2546, 'loss/train': 1.102042555809021} -09/20/2021 23:18:41 - INFO - __main__ - Step 40738: {'lr': 0.00019934446651214538, 'samples': 1303616, 'steps': 2546, 'loss/train': 1.0053696632385254} -09/20/2021 23:18:42 - INFO - __main__ - Step 40739: {'lr': 0.00019934446651214538, 'samples': 1303648, 'steps': 2546, 'loss/train': 2.0212953090667725} -09/20/2021 23:18:42 - INFO - __main__ - Step 40740: {'lr': 0.00019934446651214538, 'samples': 1303680, 'steps': 2546, 'loss/train': 1.733719825744629} -09/20/2021 23:18:43 - INFO - __main__ - Step 40741: {'lr': 0.00019934446651214538, 'samples': 1303712, 'steps': 2546, 'loss/train': 2.5358166694641113} -09/20/2021 23:18:44 - INFO - __main__ - Step 40742: {'lr': 0.00019934446651214538, 'samples': 1303744, 'steps': 2546, 'loss/train': 1.8168666362762451} -09/20/2021 23:18:45 - INFO - __main__ - Step 40743: {'lr': 0.00019934446651214538, 'samples': 1303776, 'steps': 2546, 'loss/train': 1.7821755409240723} -09/20/2021 23:18:45 - INFO - __main__ - Step 40744: {'lr': 0.00019934446651214538, 'samples': 1303808, 'steps': 2546, 'loss/train': 3.0146148204803467} -09/20/2021 23:18:46 - INFO - __main__ - Step 40745: {'lr': 0.00019934446651214538, 'samples': 1303840, 'steps': 2546, 'loss/train': 1.9866063594818115} -09/20/2021 23:18:47 - INFO - __main__ - Step 40746: {'lr': 0.00019934446651214538, 'samples': 1303872, 'steps': 2546, 'loss/train': 2.6951606273651123} -09/20/2021 23:18:48 - INFO - __main__ - Step 40747: {'lr': 0.00019934446651214538, 'samples': 1303904, 'steps': 2546, 'loss/train': 1.1018471717834473} -09/20/2021 23:18:48 - INFO - __main__ - Step 40748: {'lr': 0.00019934446651214538, 'samples': 1303936, 'steps': 2546, 'loss/train': 2.1573126316070557} -09/20/2021 23:18:49 - INFO - __main__ - Step 40749: {'lr': 0.00019934446651214538, 'samples': 1303968, 'steps': 2546, 'loss/train': 2.201946973800659} -09/20/2021 23:18:50 - INFO - __main__ - Step 40750: {'lr': 0.00019934446651214538, 'samples': 1304000, 'steps': 2546, 'loss/train': 1.8809095621109009} -09/20/2021 23:18:51 - INFO - __main__ - Step 40751: {'lr': 0.00019934446651214538, 'samples': 1304032, 'steps': 2546, 'loss/train': 2.0034711360931396} -09/20/2021 23:18:51 - INFO - __main__ - Step 40752: {'lr': 0.00019934446651214538, 'samples': 1304064, 'steps': 2546, 'loss/train': 2.0770039558410645} -09/20/2021 23:18:52 - INFO - __main__ - Step 40753: {'lr': 0.000199343737115887, 'samples': 1304096, 'steps': 2547, 'loss/train': 2.694845676422119} -09/20/2021 23:18:53 - INFO - __main__ - Step 40754: {'lr': 0.000199343737115887, 'samples': 1304128, 'steps': 2547, 'loss/train': 2.283383369445801} -09/20/2021 23:18:55 - INFO - __main__ - Step 40755: {'lr': 0.000199343737115887, 'samples': 1304160, 'steps': 2547, 'loss/train': 1.5633134841918945} -09/20/2021 23:18:56 - INFO - __main__ - Step 40756: {'lr': 0.000199343737115887, 'samples': 1304192, 'steps': 2547, 'loss/train': 3.4760241508483887} -09/20/2021 23:18:56 - INFO - __main__ - Step 40757: {'lr': 0.000199343737115887, 'samples': 1304224, 'steps': 2547, 'loss/train': 1.6232753992080688} -09/20/2021 23:18:57 - INFO - __main__ - Step 40758: {'lr': 0.000199343737115887, 'samples': 1304256, 'steps': 2547, 'loss/train': 1.7415531873703003} -09/20/2021 23:18:58 - INFO - __main__ - Step 40759: {'lr': 0.000199343737115887, 'samples': 1304288, 'steps': 2547, 'loss/train': 2.255276679992676} -09/20/2021 23:18:59 - INFO - __main__ - Step 40760: {'lr': 0.000199343737115887, 'samples': 1304320, 'steps': 2547, 'loss/train': 2.2071328163146973} -09/20/2021 23:18:59 - INFO - __main__ - Step 40761: {'lr': 0.000199343737115887, 'samples': 1304352, 'steps': 2547, 'loss/train': 1.8238835334777832} -09/20/2021 23:19:00 - INFO - __main__ - Step 40762: {'lr': 0.000199343737115887, 'samples': 1304384, 'steps': 2547, 'loss/train': 2.0104849338531494} -09/20/2021 23:19:01 - INFO - __main__ - Step 40763: {'lr': 0.000199343737115887, 'samples': 1304416, 'steps': 2547, 'loss/train': 1.4953422546386719} -09/20/2021 23:19:02 - INFO - __main__ - Step 40764: {'lr': 0.000199343737115887, 'samples': 1304448, 'steps': 2547, 'loss/train': 1.8181525468826294} -09/20/2021 23:19:02 - INFO - __main__ - Step 40765: {'lr': 0.000199343737115887, 'samples': 1304480, 'steps': 2547, 'loss/train': 2.0501763820648193} -09/20/2021 23:19:03 - INFO - __main__ - Step 40766: {'lr': 0.000199343737115887, 'samples': 1304512, 'steps': 2547, 'loss/train': 2.890198230743408} -09/20/2021 23:19:04 - INFO - __main__ - Step 40767: {'lr': 0.000199343737115887, 'samples': 1304544, 'steps': 2547, 'loss/train': 1.9909933805465698} -09/20/2021 23:19:05 - INFO - __main__ - Step 40768: {'lr': 0.000199343737115887, 'samples': 1304576, 'steps': 2547, 'loss/train': 1.5828624963760376} -09/20/2021 23:19:05 - INFO - __main__ - Step 40769: {'lr': 0.00019934300731539936, 'samples': 1304608, 'steps': 2548, 'loss/train': 2.3450963497161865} -09/20/2021 23:19:06 - INFO - __main__ - Step 40770: {'lr': 0.00019934300731539936, 'samples': 1304640, 'steps': 2548, 'loss/train': 1.5528486967086792} -09/20/2021 23:19:07 - INFO - __main__ - Step 40771: {'lr': 0.00019934300731539936, 'samples': 1304672, 'steps': 2548, 'loss/train': 2.98587703704834} -09/20/2021 23:19:08 - INFO - __main__ - Step 40772: {'lr': 0.00019934300731539936, 'samples': 1304704, 'steps': 2548, 'loss/train': 1.1463485956192017} -09/20/2021 23:19:08 - INFO - __main__ - Step 40773: {'lr': 0.00019934300731539936, 'samples': 1304736, 'steps': 2548, 'loss/train': 2.5233874320983887} -09/20/2021 23:19:09 - INFO - __main__ - Step 40774: {'lr': 0.00019934300731539936, 'samples': 1304768, 'steps': 2548, 'loss/train': 1.8344035148620605} -09/20/2021 23:19:10 - INFO - __main__ - Step 40775: {'lr': 0.00019934300731539936, 'samples': 1304800, 'steps': 2548, 'loss/train': 2.0649514198303223} -09/20/2021 23:19:11 - INFO - __main__ - Step 40776: {'lr': 0.00019934300731539936, 'samples': 1304832, 'steps': 2548, 'loss/train': 2.0111989974975586} -09/20/2021 23:19:11 - INFO - __main__ - Step 40777: {'lr': 0.00019934300731539936, 'samples': 1304864, 'steps': 2548, 'loss/train': 2.1357100009918213} -09/20/2021 23:19:12 - INFO - __main__ - Step 40778: {'lr': 0.00019934300731539936, 'samples': 1304896, 'steps': 2548, 'loss/train': 2.065595865249634} -09/20/2021 23:19:13 - INFO - __main__ - Step 40779: {'lr': 0.00019934300731539936, 'samples': 1304928, 'steps': 2548, 'loss/train': 3.060163974761963} -09/20/2021 23:19:14 - INFO - __main__ - Step 40780: {'lr': 0.00019934300731539936, 'samples': 1304960, 'steps': 2548, 'loss/train': 2.2711071968078613} -09/20/2021 23:19:14 - INFO - __main__ - Step 40781: {'lr': 0.00019934300731539936, 'samples': 1304992, 'steps': 2548, 'loss/train': 1.6455150842666626} -09/20/2021 23:19:15 - INFO - __main__ - Step 40782: {'lr': 0.00019934300731539936, 'samples': 1305024, 'steps': 2548, 'loss/train': 2.4986729621887207} -09/20/2021 23:19:16 - INFO - __main__ - Step 40783: {'lr': 0.00019934300731539936, 'samples': 1305056, 'steps': 2548, 'loss/train': 2.621791362762451} -09/20/2021 23:19:17 - INFO - __main__ - Step 40784: {'lr': 0.00019934300731539936, 'samples': 1305088, 'steps': 2548, 'loss/train': 2.655651330947876} -09/20/2021 23:19:18 - INFO - __main__ - Step 40785: {'lr': 0.00019934227711068542, 'samples': 1305120, 'steps': 2549, 'loss/train': 2.0616824626922607} -09/20/2021 23:19:18 - INFO - __main__ - Step 40786: {'lr': 0.00019934227711068542, 'samples': 1305152, 'steps': 2549, 'loss/train': 2.1142830848693848} -09/20/2021 23:19:20 - INFO - __main__ - Step 40787: {'lr': 0.00019934227711068542, 'samples': 1305184, 'steps': 2549, 'loss/train': 1.4910811185836792} -09/20/2021 23:19:21 - INFO - __main__ - Step 40788: {'lr': 0.00019934227711068542, 'samples': 1305216, 'steps': 2549, 'loss/train': 2.4734768867492676} -09/20/2021 23:19:22 - INFO - __main__ - Step 40789: {'lr': 0.00019934227711068542, 'samples': 1305248, 'steps': 2549, 'loss/train': 2.892428398132324} -09/20/2021 23:19:22 - INFO - __main__ - Step 40790: {'lr': 0.00019934227711068542, 'samples': 1305280, 'steps': 2549, 'loss/train': 1.491919994354248} -09/20/2021 23:19:23 - INFO - __main__ - Step 40791: {'lr': 0.00019934227711068542, 'samples': 1305312, 'steps': 2549, 'loss/train': 2.108309268951416} -09/20/2021 23:19:24 - INFO - __main__ - Step 40792: {'lr': 0.00019934227711068542, 'samples': 1305344, 'steps': 2549, 'loss/train': 1.9316189289093018} -09/20/2021 23:19:25 - INFO - __main__ - Step 40793: {'lr': 0.00019934227711068542, 'samples': 1305376, 'steps': 2549, 'loss/train': 1.5706981420516968} -09/20/2021 23:19:25 - INFO - __main__ - Step 40794: {'lr': 0.00019934227711068542, 'samples': 1305408, 'steps': 2549, 'loss/train': 0.942367672920227} -09/20/2021 23:19:26 - INFO - __main__ - Step 40795: {'lr': 0.00019934227711068542, 'samples': 1305440, 'steps': 2549, 'loss/train': 1.0275264978408813} -09/20/2021 23:19:27 - INFO - __main__ - Step 40796: {'lr': 0.00019934227711068542, 'samples': 1305472, 'steps': 2549, 'loss/train': 1.2348289489746094} -09/20/2021 23:19:28 - INFO - __main__ - Step 40797: {'lr': 0.00019934227711068542, 'samples': 1305504, 'steps': 2549, 'loss/train': 2.551600933074951} -09/20/2021 23:19:28 - INFO - __main__ - Step 40798: {'lr': 0.00019934227711068542, 'samples': 1305536, 'steps': 2549, 'loss/train': 2.5807576179504395} -09/20/2021 23:19:29 - INFO - __main__ - Step 40799: {'lr': 0.00019934227711068542, 'samples': 1305568, 'steps': 2549, 'loss/train': 2.9876511096954346} -09/20/2021 23:19:30 - INFO - __main__ - Step 40800: {'lr': 0.00019934227711068542, 'samples': 1305600, 'steps': 2549, 'loss/train': 2.0929884910583496} -09/20/2021 23:19:31 - INFO - __main__ - Step 40801: {'lr': 0.0001993415465017481, 'samples': 1305632, 'steps': 2550, 'loss/train': 2.002051830291748} -09/20/2021 23:19:32 - INFO - __main__ - Step 40802: {'lr': 0.0001993415465017481, 'samples': 1305664, 'steps': 2550, 'loss/train': 1.4135533571243286} -09/20/2021 23:19:32 - INFO - __main__ - Step 40803: {'lr': 0.0001993415465017481, 'samples': 1305696, 'steps': 2550, 'loss/train': 2.15899920463562} -09/20/2021 23:19:33 - INFO - __main__ - Step 40804: {'lr': 0.0001993415465017481, 'samples': 1305728, 'steps': 2550, 'loss/train': 1.9354491233825684} -09/20/2021 23:19:34 - INFO - __main__ - Step 40805: {'lr': 0.0001993415465017481, 'samples': 1305760, 'steps': 2550, 'loss/train': 2.214205026626587} -09/20/2021 23:19:35 - INFO - __main__ - Step 40806: {'lr': 0.0001993415465017481, 'samples': 1305792, 'steps': 2550, 'loss/train': 1.7257956266403198} -09/20/2021 23:19:35 - INFO - __main__ - Step 40807: {'lr': 0.0001993415465017481, 'samples': 1305824, 'steps': 2550, 'loss/train': 2.4692869186401367} -09/20/2021 23:19:36 - INFO - __main__ - Step 40808: {'lr': 0.0001993415465017481, 'samples': 1305856, 'steps': 2550, 'loss/train': 2.459620952606201} -09/20/2021 23:19:37 - INFO - __main__ - Step 40809: {'lr': 0.0001993415465017481, 'samples': 1305888, 'steps': 2550, 'loss/train': 2.7200090885162354} -09/20/2021 23:19:38 - INFO - __main__ - Step 40810: {'lr': 0.0001993415465017481, 'samples': 1305920, 'steps': 2550, 'loss/train': 1.5200554132461548} -09/20/2021 23:19:38 - INFO - __main__ - Step 40811: {'lr': 0.0001993415465017481, 'samples': 1305952, 'steps': 2550, 'loss/train': 0.6688580513000488} -09/20/2021 23:19:39 - INFO - __main__ - Step 40812: {'lr': 0.0001993415465017481, 'samples': 1305984, 'steps': 2550, 'loss/train': 0.20816035568714142} -09/20/2021 23:19:40 - INFO - __main__ - Step 40813: {'lr': 0.0001993415465017481, 'samples': 1306016, 'steps': 2550, 'loss/train': 0.2467053085565567} -09/20/2021 23:19:41 - INFO - __main__ - Step 40814: {'lr': 0.0001993415465017481, 'samples': 1306048, 'steps': 2550, 'loss/train': 0.5628154277801514} -09/20/2021 23:19:41 - INFO - __main__ - Step 40815: {'lr': 0.0001993415465017481, 'samples': 1306080, 'steps': 2550, 'loss/train': 0.26276078820228577} -09/20/2021 23:19:42 - INFO - __main__ - Step 40816: {'lr': 0.0001993415465017481, 'samples': 1306112, 'steps': 2550, 'loss/train': 0.284706175327301} -09/20/2021 23:19:43 - INFO - __main__ - Step 40817: {'lr': 0.00019934081548859047, 'samples': 1306144, 'steps': 2551, 'loss/train': 0.3935849070549011} -09/20/2021 23:19:45 - INFO - __main__ - Step 40818: {'lr': 0.00019934081548859047, 'samples': 1306176, 'steps': 2551, 'loss/train': 0.6025859117507935} -09/20/2021 23:19:46 - INFO - __main__ - Step 40819: {'lr': 0.00019934081548859047, 'samples': 1306208, 'steps': 2551, 'loss/train': 1.8370680809020996} -09/20/2021 23:19:46 - INFO - __main__ - Step 40820: {'lr': 0.00019934081548859047, 'samples': 1306240, 'steps': 2551, 'loss/train': 0.7750426530838013} -09/20/2021 23:19:47 - INFO - __main__ - Step 40821: {'lr': 0.00019934081548859047, 'samples': 1306272, 'steps': 2551, 'loss/train': 1.5938148498535156} -09/20/2021 23:19:48 - INFO - __main__ - Step 40822: {'lr': 0.00019934081548859047, 'samples': 1306304, 'steps': 2551, 'loss/train': 2.2435171604156494} -09/20/2021 23:19:49 - INFO - __main__ - Step 40823: {'lr': 0.00019934081548859047, 'samples': 1306336, 'steps': 2551, 'loss/train': 1.2730952501296997} -09/20/2021 23:19:49 - INFO - __main__ - Step 40824: {'lr': 0.00019934081548859047, 'samples': 1306368, 'steps': 2551, 'loss/train': 2.755648136138916} -09/20/2021 23:19:50 - INFO - __main__ - Step 40825: {'lr': 0.00019934081548859047, 'samples': 1306400, 'steps': 2551, 'loss/train': 1.9349873065948486} -09/20/2021 23:19:51 - INFO - __main__ - Step 40826: {'lr': 0.00019934081548859047, 'samples': 1306432, 'steps': 2551, 'loss/train': 1.9028841257095337} -09/20/2021 23:19:52 - INFO - __main__ - Step 40827: {'lr': 0.00019934081548859047, 'samples': 1306464, 'steps': 2551, 'loss/train': 1.4550669193267822} -09/20/2021 23:19:52 - INFO - __main__ - Step 40828: {'lr': 0.00019934081548859047, 'samples': 1306496, 'steps': 2551, 'loss/train': 1.5886030197143555} -09/20/2021 23:19:53 - INFO - __main__ - Step 40829: {'lr': 0.00019934081548859047, 'samples': 1306528, 'steps': 2551, 'loss/train': 3.2359490394592285} -09/20/2021 23:19:54 - INFO - __main__ - Step 40830: {'lr': 0.00019934081548859047, 'samples': 1306560, 'steps': 2551, 'loss/train': 2.626591444015503} -09/20/2021 23:19:55 - INFO - __main__ - Step 40831: {'lr': 0.00019934081548859047, 'samples': 1306592, 'steps': 2551, 'loss/train': 1.9949885606765747} -09/20/2021 23:19:55 - INFO - __main__ - Step 40832: {'lr': 0.00019934081548859047, 'samples': 1306624, 'steps': 2551, 'loss/train': 2.070319175720215} -09/20/2021 23:19:56 - INFO - __main__ - Step 40833: {'lr': 0.0001993400840712154, 'samples': 1306656, 'steps': 2552, 'loss/train': 1.6721326112747192} -09/20/2021 23:19:57 - INFO - __main__ - Step 40834: {'lr': 0.0001993400840712154, 'samples': 1306688, 'steps': 2552, 'loss/train': 2.0170607566833496} -09/20/2021 23:19:58 - INFO - __main__ - Step 40835: {'lr': 0.0001993400840712154, 'samples': 1306720, 'steps': 2552, 'loss/train': 2.256847381591797} -09/20/2021 23:19:58 - INFO - __main__ - Step 40836: {'lr': 0.0001993400840712154, 'samples': 1306752, 'steps': 2552, 'loss/train': 1.4619652032852173} -09/20/2021 23:19:59 - INFO - __main__ - Step 40837: {'lr': 0.0001993400840712154, 'samples': 1306784, 'steps': 2552, 'loss/train': 1.6518020629882812} -09/20/2021 23:20:00 - INFO - __main__ - Step 40838: {'lr': 0.0001993400840712154, 'samples': 1306816, 'steps': 2552, 'loss/train': 2.8625776767730713} -09/20/2021 23:20:01 - INFO - __main__ - Step 40839: {'lr': 0.0001993400840712154, 'samples': 1306848, 'steps': 2552, 'loss/train': 2.1387996673583984} -09/20/2021 23:20:01 - INFO - __main__ - Step 40840: {'lr': 0.0001993400840712154, 'samples': 1306880, 'steps': 2552, 'loss/train': 2.4322547912597656} -09/20/2021 23:20:02 - INFO - __main__ - Step 40841: {'lr': 0.0001993400840712154, 'samples': 1306912, 'steps': 2552, 'loss/train': 2.657067060470581} -09/20/2021 23:20:03 - INFO - __main__ - Step 40842: {'lr': 0.0001993400840712154, 'samples': 1306944, 'steps': 2552, 'loss/train': 1.5778799057006836} -09/20/2021 23:20:04 - INFO - __main__ - Step 40843: {'lr': 0.0001993400840712154, 'samples': 1306976, 'steps': 2552, 'loss/train': 2.1779000759124756} -09/20/2021 23:20:04 - INFO - __main__ - Step 40844: {'lr': 0.0001993400840712154, 'samples': 1307008, 'steps': 2552, 'loss/train': 2.248187303543091} -09/20/2021 23:20:05 - INFO - __main__ - Step 40845: {'lr': 0.0001993400840712154, 'samples': 1307040, 'steps': 2552, 'loss/train': 3.161256790161133} -09/20/2021 23:20:06 - INFO - __main__ - Step 40846: {'lr': 0.0001993400840712154, 'samples': 1307072, 'steps': 2552, 'loss/train': 2.656406879425049} -09/20/2021 23:20:07 - INFO - __main__ - Step 40847: {'lr': 0.0001993400840712154, 'samples': 1307104, 'steps': 2552, 'loss/train': 2.513437509536743} -09/20/2021 23:20:07 - INFO - __main__ - Step 40848: {'lr': 0.0001993400840712154, 'samples': 1307136, 'steps': 2552, 'loss/train': 0.7537641525268555} -09/20/2021 23:20:08 - INFO - __main__ - Step 40849: {'lr': 0.00019933935224962594, 'samples': 1307168, 'steps': 2553, 'loss/train': 2.307044744491577} -09/20/2021 23:20:09 - INFO - __main__ - Step 40850: {'lr': 0.00019933935224962594, 'samples': 1307200, 'steps': 2553, 'loss/train': 2.607198476791382} -09/20/2021 23:20:10 - INFO - __main__ - Step 40851: {'lr': 0.00019933935224962594, 'samples': 1307232, 'steps': 2553, 'loss/train': 2.618875741958618} -09/20/2021 23:20:11 - INFO - __main__ - Step 40852: {'lr': 0.00019933935224962594, 'samples': 1307264, 'steps': 2553, 'loss/train': 1.5944969654083252} -09/20/2021 23:20:12 - INFO - __main__ - Step 40853: {'lr': 0.00019933935224962594, 'samples': 1307296, 'steps': 2553, 'loss/train': 1.287535309791565} -09/20/2021 23:20:13 - INFO - __main__ - Step 40854: {'lr': 0.00019933935224962594, 'samples': 1307328, 'steps': 2553, 'loss/train': 2.2605671882629395} -09/20/2021 23:20:13 - INFO - __main__ - Step 40855: {'lr': 0.00019933935224962594, 'samples': 1307360, 'steps': 2553, 'loss/train': 2.681777000427246} -09/20/2021 23:20:14 - INFO - __main__ - Step 40856: {'lr': 0.00019933935224962594, 'samples': 1307392, 'steps': 2553, 'loss/train': 1.3490089178085327} -09/20/2021 23:20:15 - INFO - __main__ - Step 40857: {'lr': 0.00019933935224962594, 'samples': 1307424, 'steps': 2553, 'loss/train': 2.7039294242858887} -09/20/2021 23:20:16 - INFO - __main__ - Step 40858: {'lr': 0.00019933935224962594, 'samples': 1307456, 'steps': 2553, 'loss/train': 2.7331135272979736} -09/20/2021 23:20:16 - INFO - __main__ - Step 40859: {'lr': 0.00019933935224962594, 'samples': 1307488, 'steps': 2553, 'loss/train': 2.2893643379211426} -09/20/2021 23:20:17 - INFO - __main__ - Step 40860: {'lr': 0.00019933935224962594, 'samples': 1307520, 'steps': 2553, 'loss/train': 2.22788143157959} -09/20/2021 23:20:18 - INFO - __main__ - Step 40861: {'lr': 0.00019933935224962594, 'samples': 1307552, 'steps': 2553, 'loss/train': 2.9623773097991943} -09/20/2021 23:20:19 - INFO - __main__ - Step 40862: {'lr': 0.00019933935224962594, 'samples': 1307584, 'steps': 2553, 'loss/train': 1.2822301387786865} -09/20/2021 23:20:19 - INFO - __main__ - Step 40863: {'lr': 0.00019933935224962594, 'samples': 1307616, 'steps': 2553, 'loss/train': 1.1082926988601685} -09/20/2021 23:20:20 - INFO - __main__ - Step 40864: {'lr': 0.00019933935224962594, 'samples': 1307648, 'steps': 2553, 'loss/train': 2.449289321899414} -09/20/2021 23:20:21 - INFO - __main__ - Step 40865: {'lr': 0.00019933862002382503, 'samples': 1307680, 'steps': 2554, 'loss/train': 1.5815175771713257} -09/20/2021 23:20:22 - INFO - __main__ - Step 40866: {'lr': 0.00019933862002382503, 'samples': 1307712, 'steps': 2554, 'loss/train': 2.0970516204833984} -09/20/2021 23:20:22 - INFO - __main__ - Step 40867: {'lr': 0.00019933862002382503, 'samples': 1307744, 'steps': 2554, 'loss/train': 1.2546107769012451} -09/20/2021 23:20:23 - INFO - __main__ - Step 40868: {'lr': 0.00019933862002382503, 'samples': 1307776, 'steps': 2554, 'loss/train': 1.0550638437271118} -09/20/2021 23:20:24 - INFO - __main__ - Step 40869: {'lr': 0.00019933862002382503, 'samples': 1307808, 'steps': 2554, 'loss/train': 1.3556320667266846} -09/20/2021 23:20:25 - INFO - __main__ - Step 40870: {'lr': 0.00019933862002382503, 'samples': 1307840, 'steps': 2554, 'loss/train': 2.5030710697174072} -09/20/2021 23:20:25 - INFO - __main__ - Step 40871: {'lr': 0.00019933862002382503, 'samples': 1307872, 'steps': 2554, 'loss/train': 2.098660707473755} -09/20/2021 23:20:26 - INFO - __main__ - Step 40872: {'lr': 0.00019933862002382503, 'samples': 1307904, 'steps': 2554, 'loss/train': 1.7583847045898438} -09/20/2021 23:20:27 - INFO - __main__ - Step 40873: {'lr': 0.00019933862002382503, 'samples': 1307936, 'steps': 2554, 'loss/train': 2.6007473468780518} -09/20/2021 23:20:28 - INFO - __main__ - Step 40874: {'lr': 0.00019933862002382503, 'samples': 1307968, 'steps': 2554, 'loss/train': 1.2421579360961914} -09/20/2021 23:20:28 - INFO - __main__ - Step 40875: {'lr': 0.00019933862002382503, 'samples': 1308000, 'steps': 2554, 'loss/train': 2.2452454566955566} -09/20/2021 23:20:29 - INFO - __main__ - Step 40876: {'lr': 0.00019933862002382503, 'samples': 1308032, 'steps': 2554, 'loss/train': 3.2063467502593994} -09/20/2021 23:20:30 - INFO - __main__ - Step 40877: {'lr': 0.00019933862002382503, 'samples': 1308064, 'steps': 2554, 'loss/train': 1.3565094470977783} -09/20/2021 23:20:31 - INFO - __main__ - Step 40878: {'lr': 0.00019933862002382503, 'samples': 1308096, 'steps': 2554, 'loss/train': 2.070246696472168} -09/20/2021 23:20:31 - INFO - __main__ - Step 40879: {'lr': 0.00019933862002382503, 'samples': 1308128, 'steps': 2554, 'loss/train': 2.4024343490600586} -09/20/2021 23:20:32 - INFO - __main__ - Step 40880: {'lr': 0.00019933862002382503, 'samples': 1308160, 'steps': 2554, 'loss/train': 3.0308072566986084} -09/20/2021 23:20:33 - INFO - __main__ - Step 40881: {'lr': 0.00019933788739381563, 'samples': 1308192, 'steps': 2555, 'loss/train': 1.844124436378479} -09/20/2021 23:20:34 - INFO - __main__ - Step 40882: {'lr': 0.00019933788739381563, 'samples': 1308224, 'steps': 2555, 'loss/train': 2.9914729595184326} -09/20/2021 23:20:35 - INFO - __main__ - Step 40883: {'lr': 0.00019933788739381563, 'samples': 1308256, 'steps': 2555, 'loss/train': 2.020901918411255} -09/20/2021 23:20:36 - INFO - __main__ - Step 40884: {'lr': 0.00019933788739381563, 'samples': 1308288, 'steps': 2555, 'loss/train': 2.5246200561523438} -09/20/2021 23:20:37 - INFO - __main__ - Step 40885: {'lr': 0.00019933788739381563, 'samples': 1308320, 'steps': 2555, 'loss/train': 2.0364599227905273} -09/20/2021 23:20:37 - INFO - __main__ - Step 40886: {'lr': 0.00019933788739381563, 'samples': 1308352, 'steps': 2555, 'loss/train': 2.115177631378174} -09/20/2021 23:20:38 - INFO - __main__ - Step 40887: {'lr': 0.00019933788739381563, 'samples': 1308384, 'steps': 2555, 'loss/train': 3.1743671894073486} -09/20/2021 23:20:39 - INFO - __main__ - Step 40888: {'lr': 0.00019933788739381563, 'samples': 1308416, 'steps': 2555, 'loss/train': 1.7000938653945923} -09/20/2021 23:20:40 - INFO - __main__ - Step 40889: {'lr': 0.00019933788739381563, 'samples': 1308448, 'steps': 2555, 'loss/train': 2.0361416339874268} -09/20/2021 23:20:40 - INFO - __main__ - Step 40890: {'lr': 0.00019933788739381563, 'samples': 1308480, 'steps': 2555, 'loss/train': 2.4771595001220703} -09/20/2021 23:20:41 - INFO - __main__ - Step 40891: {'lr': 0.00019933788739381563, 'samples': 1308512, 'steps': 2555, 'loss/train': 2.1008918285369873} -09/20/2021 23:20:42 - INFO - __main__ - Step 40892: {'lr': 0.00019933788739381563, 'samples': 1308544, 'steps': 2555, 'loss/train': 2.031606674194336} -09/20/2021 23:20:43 - INFO - __main__ - Step 40893: {'lr': 0.00019933788739381563, 'samples': 1308576, 'steps': 2555, 'loss/train': 1.9413762092590332} -09/20/2021 23:20:43 - INFO - __main__ - Step 40894: {'lr': 0.00019933788739381563, 'samples': 1308608, 'steps': 2555, 'loss/train': 2.1491665840148926} -09/20/2021 23:20:44 - INFO - __main__ - Step 40895: {'lr': 0.00019933788739381563, 'samples': 1308640, 'steps': 2555, 'loss/train': 1.909485936164856} -09/20/2021 23:20:45 - INFO - __main__ - Step 40896: {'lr': 0.00019933788739381563, 'samples': 1308672, 'steps': 2555, 'loss/train': 1.3245577812194824} -09/20/2021 23:20:46 - INFO - __main__ - Step 40897: {'lr': 0.00019933715435960082, 'samples': 1308704, 'steps': 2556, 'loss/train': 2.069897413253784} -09/20/2021 23:20:47 - INFO - __main__ - Step 40898: {'lr': 0.00019933715435960082, 'samples': 1308736, 'steps': 2556, 'loss/train': 2.3250932693481445} -09/20/2021 23:20:47 - INFO - __main__ - Step 40899: {'lr': 0.00019933715435960082, 'samples': 1308768, 'steps': 2556, 'loss/train': 1.178154468536377} -09/20/2021 23:20:48 - INFO - __main__ - Step 40900: {'lr': 0.00019933715435960082, 'samples': 1308800, 'steps': 2556, 'loss/train': 1.8186448812484741} -09/20/2021 23:20:49 - INFO - __main__ - Step 40901: {'lr': 0.00019933715435960082, 'samples': 1308832, 'steps': 2556, 'loss/train': 1.418935775756836} -09/20/2021 23:20:50 - INFO - __main__ - Step 40902: {'lr': 0.00019933715435960082, 'samples': 1308864, 'steps': 2556, 'loss/train': 1.5460259914398193} -09/20/2021 23:20:50 - INFO - __main__ - Step 40903: {'lr': 0.00019933715435960082, 'samples': 1308896, 'steps': 2556, 'loss/train': 2.6196775436401367} -09/20/2021 23:20:51 - INFO - __main__ - Step 40904: {'lr': 0.00019933715435960082, 'samples': 1308928, 'steps': 2556, 'loss/train': 2.0526278018951416} -09/20/2021 23:20:52 - INFO - __main__ - Step 40905: {'lr': 0.00019933715435960082, 'samples': 1308960, 'steps': 2556, 'loss/train': 1.7146766185760498} -09/20/2021 23:20:53 - INFO - __main__ - Step 40906: {'lr': 0.00019933715435960082, 'samples': 1308992, 'steps': 2556, 'loss/train': 3.9439289569854736} -09/20/2021 23:20:53 - INFO - __main__ - Step 40907: {'lr': 0.00019933715435960082, 'samples': 1309024, 'steps': 2556, 'loss/train': 2.4937760829925537} -09/20/2021 23:20:54 - INFO - __main__ - Step 40908: {'lr': 0.00019933715435960082, 'samples': 1309056, 'steps': 2556, 'loss/train': 1.801793098449707} -09/20/2021 23:20:55 - INFO - __main__ - Step 40909: {'lr': 0.00019933715435960082, 'samples': 1309088, 'steps': 2556, 'loss/train': 1.549839735031128} -09/20/2021 23:20:56 - INFO - __main__ - Step 40910: {'lr': 0.00019933715435960082, 'samples': 1309120, 'steps': 2556, 'loss/train': 2.497025966644287} -09/20/2021 23:20:56 - INFO - __main__ - Step 40911: {'lr': 0.00019933715435960082, 'samples': 1309152, 'steps': 2556, 'loss/train': 2.12648868560791} -09/20/2021 23:20:57 - INFO - __main__ - Step 40912: {'lr': 0.00019933715435960082, 'samples': 1309184, 'steps': 2556, 'loss/train': 3.295138120651245} -09/20/2021 23:20:59 - INFO - __main__ - Step 40913: {'lr': 0.00019933642092118348, 'samples': 1309216, 'steps': 2557, 'loss/train': 1.3506823778152466} -09/20/2021 23:20:59 - INFO - __main__ - Step 40914: {'lr': 0.00019933642092118348, 'samples': 1309248, 'steps': 2557, 'loss/train': 1.8564321994781494} -09/20/2021 23:21:00 - INFO - __main__ - Step 40915: {'lr': 0.00019933642092118348, 'samples': 1309280, 'steps': 2557, 'loss/train': 2.2678020000457764} -09/20/2021 23:21:01 - INFO - __main__ - Step 40916: {'lr': 0.00019933642092118348, 'samples': 1309312, 'steps': 2557, 'loss/train': 2.568371057510376} -09/20/2021 23:21:02 - INFO - __main__ - Step 40917: {'lr': 0.00019933642092118348, 'samples': 1309344, 'steps': 2557, 'loss/train': 2.4051265716552734} -09/20/2021 23:21:02 - INFO - __main__ - Step 40918: {'lr': 0.00019933642092118348, 'samples': 1309376, 'steps': 2557, 'loss/train': 2.1974565982818604} -09/20/2021 23:21:03 - INFO - __main__ - Step 40919: {'lr': 0.00019933642092118348, 'samples': 1309408, 'steps': 2557, 'loss/train': 1.651500940322876} -09/20/2021 23:21:04 - INFO - __main__ - Step 40920: {'lr': 0.00019933642092118348, 'samples': 1309440, 'steps': 2557, 'loss/train': 1.8884551525115967} -09/20/2021 23:21:05 - INFO - __main__ - Step 40921: {'lr': 0.00019933642092118348, 'samples': 1309472, 'steps': 2557, 'loss/train': 2.0990850925445557} -09/20/2021 23:21:05 - INFO - __main__ - Step 40922: {'lr': 0.00019933642092118348, 'samples': 1309504, 'steps': 2557, 'loss/train': 2.0044209957122803} -09/20/2021 23:21:06 - INFO - __main__ - Step 40923: {'lr': 0.00019933642092118348, 'samples': 1309536, 'steps': 2557, 'loss/train': 1.5899810791015625} -09/20/2021 23:21:07 - INFO - __main__ - Step 40924: {'lr': 0.00019933642092118348, 'samples': 1309568, 'steps': 2557, 'loss/train': 1.462860107421875} -09/20/2021 23:21:08 - INFO - __main__ - Step 40925: {'lr': 0.00019933642092118348, 'samples': 1309600, 'steps': 2557, 'loss/train': 1.5255402326583862} -09/20/2021 23:21:08 - INFO - __main__ - Step 40926: {'lr': 0.00019933642092118348, 'samples': 1309632, 'steps': 2557, 'loss/train': 1.3150888681411743} -09/20/2021 23:21:09 - INFO - __main__ - Step 40927: {'lr': 0.00019933642092118348, 'samples': 1309664, 'steps': 2557, 'loss/train': 2.3255996704101562} -09/20/2021 23:21:10 - INFO - __main__ - Step 40928: {'lr': 0.00019933642092118348, 'samples': 1309696, 'steps': 2557, 'loss/train': 1.9478352069854736} -09/20/2021 23:21:11 - INFO - __main__ - Step 40929: {'lr': 0.00019933568707856662, 'samples': 1309728, 'steps': 2558, 'loss/train': 1.8652533292770386} -09/20/2021 23:21:11 - INFO - __main__ - Step 40930: {'lr': 0.00019933568707856662, 'samples': 1309760, 'steps': 2558, 'loss/train': 2.2207372188568115} -09/20/2021 23:21:12 - INFO - __main__ - Step 40931: {'lr': 0.00019933568707856662, 'samples': 1309792, 'steps': 2558, 'loss/train': 2.4175357818603516} -09/20/2021 23:21:13 - INFO - __main__ - Step 40932: {'lr': 0.00019933568707856662, 'samples': 1309824, 'steps': 2558, 'loss/train': 2.275928258895874} -09/20/2021 23:21:14 - INFO - __main__ - Step 40933: {'lr': 0.00019933568707856662, 'samples': 1309856, 'steps': 2558, 'loss/train': 2.185638904571533} -09/20/2021 23:21:14 - INFO - __main__ - Step 40934: {'lr': 0.00019933568707856662, 'samples': 1309888, 'steps': 2558, 'loss/train': 1.575476050376892} -09/20/2021 23:21:15 - INFO - __main__ - Step 40935: {'lr': 0.00019933568707856662, 'samples': 1309920, 'steps': 2558, 'loss/train': 2.836583137512207} -09/20/2021 23:21:16 - INFO - __main__ - Step 40936: {'lr': 0.00019933568707856662, 'samples': 1309952, 'steps': 2558, 'loss/train': 2.5714120864868164} -09/20/2021 23:21:17 - INFO - __main__ - Step 40937: {'lr': 0.00019933568707856662, 'samples': 1309984, 'steps': 2558, 'loss/train': 2.146601438522339} -09/20/2021 23:21:17 - INFO - __main__ - Step 40938: {'lr': 0.00019933568707856662, 'samples': 1310016, 'steps': 2558, 'loss/train': 2.4646530151367188} -09/20/2021 23:21:18 - INFO - __main__ - Step 40939: {'lr': 0.00019933568707856662, 'samples': 1310048, 'steps': 2558, 'loss/train': 2.4126994609832764} -09/20/2021 23:21:19 - INFO - __main__ - Step 40940: {'lr': 0.00019933568707856662, 'samples': 1310080, 'steps': 2558, 'loss/train': 2.9863786697387695} -09/20/2021 23:21:20 - INFO - __main__ - Step 40941: {'lr': 0.00019933568707856662, 'samples': 1310112, 'steps': 2558, 'loss/train': 2.144482135772705} -09/20/2021 23:21:20 - INFO - __main__ - Step 40942: {'lr': 0.00019933568707856662, 'samples': 1310144, 'steps': 2558, 'loss/train': 2.0000998973846436} -09/20/2021 23:21:21 - INFO - __main__ - Step 40943: {'lr': 0.00019933568707856662, 'samples': 1310176, 'steps': 2558, 'loss/train': 3.1241884231567383} -09/20/2021 23:21:23 - INFO - __main__ - Step 40944: {'lr': 0.00019933568707856662, 'samples': 1310208, 'steps': 2558, 'loss/train': 1.3895370960235596} -09/20/2021 23:21:24 - INFO - __main__ - Step 40945: {'lr': 0.00019933495283175324, 'samples': 1310240, 'steps': 2559, 'loss/train': 1.876280665397644} -09/20/2021 23:21:24 - INFO - __main__ - Step 40946: {'lr': 0.00019933495283175324, 'samples': 1310272, 'steps': 2559, 'loss/train': 3.0462746620178223} -09/20/2021 23:21:25 - INFO - __main__ - Step 40947: {'lr': 0.00019933495283175324, 'samples': 1310304, 'steps': 2559, 'loss/train': 2.8225255012512207} -09/20/2021 23:21:26 - INFO - __main__ - Step 40948: {'lr': 0.00019933495283175324, 'samples': 1310336, 'steps': 2559, 'loss/train': 0.7174099683761597} -09/20/2021 23:21:27 - INFO - __main__ - Step 40949: {'lr': 0.00019933495283175324, 'samples': 1310368, 'steps': 2559, 'loss/train': 1.7571457624435425} -09/20/2021 23:21:27 - INFO - __main__ - Step 40950: {'lr': 0.00019933495283175324, 'samples': 1310400, 'steps': 2559, 'loss/train': 1.1817022562026978} -09/20/2021 23:21:28 - INFO - __main__ - Step 40951: {'lr': 0.00019933495283175324, 'samples': 1310432, 'steps': 2559, 'loss/train': 2.5475053787231445} -09/20/2021 23:21:29 - INFO - __main__ - Step 40952: {'lr': 0.00019933495283175324, 'samples': 1310464, 'steps': 2559, 'loss/train': 2.289307117462158} -09/20/2021 23:21:30 - INFO - __main__ - Step 40953: {'lr': 0.00019933495283175324, 'samples': 1310496, 'steps': 2559, 'loss/train': 2.2332265377044678} -09/20/2021 23:21:30 - INFO - __main__ - Step 40954: {'lr': 0.00019933495283175324, 'samples': 1310528, 'steps': 2559, 'loss/train': 2.0532455444335938} -09/20/2021 23:21:31 - INFO - __main__ - Step 40955: {'lr': 0.00019933495283175324, 'samples': 1310560, 'steps': 2559, 'loss/train': 2.4458580017089844} -09/20/2021 23:21:32 - INFO - __main__ - Step 40956: {'lr': 0.00019933495283175324, 'samples': 1310592, 'steps': 2559, 'loss/train': 1.923616647720337} -09/20/2021 23:21:33 - INFO - __main__ - Step 40957: {'lr': 0.00019933495283175324, 'samples': 1310624, 'steps': 2559, 'loss/train': 2.0378735065460205} -09/20/2021 23:21:33 - INFO - __main__ - Step 40958: {'lr': 0.00019933495283175324, 'samples': 1310656, 'steps': 2559, 'loss/train': 1.8780182600021362} -09/20/2021 23:21:34 - INFO - __main__ - Step 40959: {'lr': 0.00019933495283175324, 'samples': 1310688, 'steps': 2559, 'loss/train': 1.2750078439712524} -09/20/2021 23:21:35 - INFO - __main__ - Step 40960: {'lr': 0.00019933495283175324, 'samples': 1310720, 'steps': 2559, 'loss/train': 2.718430519104004} -09/20/2021 23:21:36 - INFO - __main__ - Step 40961: {'lr': 0.00019933421818074632, 'samples': 1310752, 'steps': 2560, 'loss/train': 2.6174168586730957} -09/20/2021 23:21:36 - INFO - __main__ - Step 40962: {'lr': 0.00019933421818074632, 'samples': 1310784, 'steps': 2560, 'loss/train': 2.153811454772949} -09/20/2021 23:21:37 - INFO - __main__ - Step 40963: {'lr': 0.00019933421818074632, 'samples': 1310816, 'steps': 2560, 'loss/train': 1.4657708406448364} -09/20/2021 23:21:38 - INFO - __main__ - Step 40964: {'lr': 0.00019933421818074632, 'samples': 1310848, 'steps': 2560, 'loss/train': 1.4498260021209717} -09/20/2021 23:21:39 - INFO - __main__ - Step 40965: {'lr': 0.00019933421818074632, 'samples': 1310880, 'steps': 2560, 'loss/train': 1.350411057472229} -09/20/2021 23:21:39 - INFO - __main__ - Step 40966: {'lr': 0.00019933421818074632, 'samples': 1310912, 'steps': 2560, 'loss/train': 0.7501848340034485} -09/20/2021 23:21:40 - INFO - __main__ - Step 40967: {'lr': 0.00019933421818074632, 'samples': 1310944, 'steps': 2560, 'loss/train': 1.9635298252105713} -09/20/2021 23:21:41 - INFO - __main__ - Step 40968: {'lr': 0.00019933421818074632, 'samples': 1310976, 'steps': 2560, 'loss/train': 2.94252872467041} -09/20/2021 23:21:42 - INFO - __main__ - Step 40969: {'lr': 0.00019933421818074632, 'samples': 1311008, 'steps': 2560, 'loss/train': 1.9016737937927246} -09/20/2021 23:21:42 - INFO - __main__ - Step 40970: {'lr': 0.00019933421818074632, 'samples': 1311040, 'steps': 2560, 'loss/train': 2.9384443759918213} -09/20/2021 23:21:43 - INFO - __main__ - Step 40971: {'lr': 0.00019933421818074632, 'samples': 1311072, 'steps': 2560, 'loss/train': 2.0476467609405518} -09/20/2021 23:21:44 - INFO - __main__ - Step 40972: {'lr': 0.00019933421818074632, 'samples': 1311104, 'steps': 2560, 'loss/train': 1.3198870420455933} -09/20/2021 23:21:45 - INFO - __main__ - Step 40973: {'lr': 0.00019933421818074632, 'samples': 1311136, 'steps': 2560, 'loss/train': 1.2321646213531494} -09/20/2021 23:21:45 - INFO - __main__ - Step 40974: {'lr': 0.00019933421818074632, 'samples': 1311168, 'steps': 2560, 'loss/train': 1.3720425367355347} -09/20/2021 23:21:47 - INFO - __main__ - Step 40975: {'lr': 0.00019933421818074632, 'samples': 1311200, 'steps': 2560, 'loss/train': 1.2677680253982544} -09/20/2021 23:21:47 - INFO - __main__ - Step 40976: {'lr': 0.00019933421818074632, 'samples': 1311232, 'steps': 2560, 'loss/train': 1.9156848192214966} -09/20/2021 23:21:48 - INFO - __main__ - Step 40977: {'lr': 0.00019933348312554884, 'samples': 1311264, 'steps': 2561, 'loss/train': 1.7386828660964966} -09/20/2021 23:21:49 - INFO - __main__ - Step 40978: {'lr': 0.00019933348312554884, 'samples': 1311296, 'steps': 2561, 'loss/train': 1.7876826524734497} -09/20/2021 23:21:50 - INFO - __main__ - Step 40979: {'lr': 0.00019933348312554884, 'samples': 1311328, 'steps': 2561, 'loss/train': 2.4533441066741943} -09/20/2021 23:21:51 - INFO - __main__ - Step 40980: {'lr': 0.00019933348312554884, 'samples': 1311360, 'steps': 2561, 'loss/train': 0.8317967057228088} -09/20/2021 23:21:51 - INFO - __main__ - Step 40981: {'lr': 0.00019933348312554884, 'samples': 1311392, 'steps': 2561, 'loss/train': 1.9079643487930298} -09/20/2021 23:21:52 - INFO - __main__ - Step 40982: {'lr': 0.00019933348312554884, 'samples': 1311424, 'steps': 2561, 'loss/train': 2.8624253273010254} -09/20/2021 23:21:53 - INFO - __main__ - Step 40983: {'lr': 0.00019933348312554884, 'samples': 1311456, 'steps': 2561, 'loss/train': 2.142580509185791} -09/20/2021 23:21:54 - INFO - __main__ - Step 40984: {'lr': 0.00019933348312554884, 'samples': 1311488, 'steps': 2561, 'loss/train': 2.0766875743865967} -09/20/2021 23:21:54 - INFO - __main__ - Step 40985: {'lr': 0.00019933348312554884, 'samples': 1311520, 'steps': 2561, 'loss/train': 2.7073397636413574} -09/20/2021 23:21:55 - INFO - __main__ - Step 40986: {'lr': 0.00019933348312554884, 'samples': 1311552, 'steps': 2561, 'loss/train': 2.7713139057159424} -09/20/2021 23:21:56 - INFO - __main__ - Step 40987: {'lr': 0.00019933348312554884, 'samples': 1311584, 'steps': 2561, 'loss/train': 1.140039086341858} -09/20/2021 23:21:57 - INFO - __main__ - Step 40988: {'lr': 0.00019933348312554884, 'samples': 1311616, 'steps': 2561, 'loss/train': 1.9511785507202148} -09/20/2021 23:21:57 - INFO - __main__ - Step 40989: {'lr': 0.00019933348312554884, 'samples': 1311648, 'steps': 2561, 'loss/train': 2.1000099182128906} -09/20/2021 23:21:58 - INFO - __main__ - Step 40990: {'lr': 0.00019933348312554884, 'samples': 1311680, 'steps': 2561, 'loss/train': 2.9196505546569824} -09/20/2021 23:21:59 - INFO - __main__ - Step 40991: {'lr': 0.00019933348312554884, 'samples': 1311712, 'steps': 2561, 'loss/train': 2.304859161376953} -09/20/2021 23:22:00 - INFO - __main__ - Step 40992: {'lr': 0.00019933348312554884, 'samples': 1311744, 'steps': 2561, 'loss/train': 2.9276907444000244} -09/20/2021 23:22:00 - INFO - __main__ - Step 40993: {'lr': 0.00019933274766616383, 'samples': 1311776, 'steps': 2562, 'loss/train': 3.190531015396118} -09/20/2021 23:22:01 - INFO - __main__ - Step 40994: {'lr': 0.00019933274766616383, 'samples': 1311808, 'steps': 2562, 'loss/train': 0.6280367970466614} -09/20/2021 23:22:02 - INFO - __main__ - Step 40995: {'lr': 0.00019933274766616383, 'samples': 1311840, 'steps': 2562, 'loss/train': 2.6302475929260254} -09/20/2021 23:22:03 - INFO - __main__ - Step 40996: {'lr': 0.00019933274766616383, 'samples': 1311872, 'steps': 2562, 'loss/train': 2.4299018383026123} -09/20/2021 23:22:03 - INFO - __main__ - Step 40997: {'lr': 0.00019933274766616383, 'samples': 1311904, 'steps': 2562, 'loss/train': 0.44186103343963623} -09/20/2021 23:22:04 - INFO - __main__ - Step 40998: {'lr': 0.00019933274766616383, 'samples': 1311936, 'steps': 2562, 'loss/train': 2.0604209899902344} -09/20/2021 23:22:05 - INFO - __main__ - Step 40999: {'lr': 0.00019933274766616383, 'samples': 1311968, 'steps': 2562, 'loss/train': 2.5072782039642334} -09/20/2021 23:22:06 - INFO - __main__ - Step 41000: {'lr': 0.00019933274766616383, 'samples': 1312000, 'steps': 2562, 'loss/train': 1.7771883010864258} -09/20/2021 23:22:06 - INFO - __main__ - Step 41001: {'lr': 0.00019933274766616383, 'samples': 1312032, 'steps': 2562, 'loss/train': 2.062525510787964} -09/20/2021 23:22:07 - INFO - __main__ - Step 41002: {'lr': 0.00019933274766616383, 'samples': 1312064, 'steps': 2562, 'loss/train': 1.375908374786377} -09/20/2021 23:22:08 - INFO - __main__ - Step 41003: {'lr': 0.00019933274766616383, 'samples': 1312096, 'steps': 2562, 'loss/train': 1.765068531036377} -09/20/2021 23:22:09 - INFO - __main__ - Step 41004: {'lr': 0.00019933274766616383, 'samples': 1312128, 'steps': 2562, 'loss/train': 1.9729403257369995} -09/20/2021 23:22:09 - INFO - __main__ - Step 41005: {'lr': 0.00019933274766616383, 'samples': 1312160, 'steps': 2562, 'loss/train': 0.5751407742500305} -09/20/2021 23:22:10 - INFO - __main__ - Step 41006: {'lr': 0.00019933274766616383, 'samples': 1312192, 'steps': 2562, 'loss/train': 2.6220924854278564} -09/20/2021 23:22:12 - INFO - __main__ - Step 41007: {'lr': 0.00019933274766616383, 'samples': 1312224, 'steps': 2562, 'loss/train': 2.282238483428955} -09/20/2021 23:22:12 - INFO - __main__ - Step 41008: {'lr': 0.00019933274766616383, 'samples': 1312256, 'steps': 2562, 'loss/train': 0.20402409136295319} -09/20/2021 23:22:13 - INFO - __main__ - Step 41009: {'lr': 0.00019933201180259426, 'samples': 1312288, 'steps': 2563, 'loss/train': 0.19598044455051422} -09/20/2021 23:22:14 - INFO - __main__ - Step 41010: {'lr': 0.00019933201180259426, 'samples': 1312320, 'steps': 2563, 'loss/train': 2.088198184967041} -09/20/2021 23:22:15 - INFO - __main__ - Step 41011: {'lr': 0.00019933201180259426, 'samples': 1312352, 'steps': 2563, 'loss/train': 1.202132225036621} -09/20/2021 23:22:15 - INFO - __main__ - Step 41012: {'lr': 0.00019933201180259426, 'samples': 1312384, 'steps': 2563, 'loss/train': 2.433622360229492} -09/20/2021 23:22:16 - INFO - __main__ - Step 41013: {'lr': 0.00019933201180259426, 'samples': 1312416, 'steps': 2563, 'loss/train': 2.1251611709594727} -09/20/2021 23:22:17 - INFO - __main__ - Step 41014: {'lr': 0.00019933201180259426, 'samples': 1312448, 'steps': 2563, 'loss/train': 0.6487112045288086} -09/20/2021 23:22:18 - INFO - __main__ - Step 41015: {'lr': 0.00019933201180259426, 'samples': 1312480, 'steps': 2563, 'loss/train': 2.1744272708892822} -09/20/2021 23:22:18 - INFO - __main__ - Step 41016: {'lr': 0.00019933201180259426, 'samples': 1312512, 'steps': 2563, 'loss/train': 1.6033726930618286} -09/20/2021 23:22:19 - INFO - __main__ - Step 41017: {'lr': 0.00019933201180259426, 'samples': 1312544, 'steps': 2563, 'loss/train': 1.6271706819534302} -09/20/2021 23:22:20 - INFO - __main__ - Step 41018: {'lr': 0.00019933201180259426, 'samples': 1312576, 'steps': 2563, 'loss/train': 1.867480754852295} -09/20/2021 23:22:21 - INFO - __main__ - Step 41019: {'lr': 0.00019933201180259426, 'samples': 1312608, 'steps': 2563, 'loss/train': 1.2063570022583008} -09/20/2021 23:22:21 - INFO - __main__ - Step 41020: {'lr': 0.00019933201180259426, 'samples': 1312640, 'steps': 2563, 'loss/train': 2.521421194076538} -09/20/2021 23:22:22 - INFO - __main__ - Step 41021: {'lr': 0.00019933201180259426, 'samples': 1312672, 'steps': 2563, 'loss/train': 0.7014084458351135} -09/20/2021 23:22:23 - INFO - __main__ - Step 41022: {'lr': 0.00019933201180259426, 'samples': 1312704, 'steps': 2563, 'loss/train': 1.962242841720581} -09/20/2021 23:22:24 - INFO - __main__ - Step 41023: {'lr': 0.00019933201180259426, 'samples': 1312736, 'steps': 2563, 'loss/train': 1.7251174449920654} -09/20/2021 23:22:24 - INFO - __main__ - Step 41024: {'lr': 0.00019933201180259426, 'samples': 1312768, 'steps': 2563, 'loss/train': 2.0640268325805664} -09/20/2021 23:22:25 - INFO - __main__ - Step 41025: {'lr': 0.0001993312755348431, 'samples': 1312800, 'steps': 2564, 'loss/train': 2.0908169746398926} -09/20/2021 23:22:26 - INFO - __main__ - Step 41026: {'lr': 0.0001993312755348431, 'samples': 1312832, 'steps': 2564, 'loss/train': 2.6972532272338867} -09/20/2021 23:22:27 - INFO - __main__ - Step 41027: {'lr': 0.0001993312755348431, 'samples': 1312864, 'steps': 2564, 'loss/train': 1.9056891202926636} -09/20/2021 23:22:28 - INFO - __main__ - Step 41028: {'lr': 0.0001993312755348431, 'samples': 1312896, 'steps': 2564, 'loss/train': 1.5529963970184326} -09/20/2021 23:22:28 - INFO - __main__ - Step 41029: {'lr': 0.0001993312755348431, 'samples': 1312928, 'steps': 2564, 'loss/train': 1.8068678379058838} -09/20/2021 23:22:29 - INFO - __main__ - Step 41030: {'lr': 0.0001993312755348431, 'samples': 1312960, 'steps': 2564, 'loss/train': 2.3497984409332275} -09/20/2021 23:22:30 - INFO - __main__ - Step 41031: {'lr': 0.0001993312755348431, 'samples': 1312992, 'steps': 2564, 'loss/train': 0.8440003991127014} -09/20/2021 23:22:31 - INFO - __main__ - Step 41032: {'lr': 0.0001993312755348431, 'samples': 1313024, 'steps': 2564, 'loss/train': 1.4100350141525269} -09/20/2021 23:22:31 - INFO - __main__ - Step 41033: {'lr': 0.0001993312755348431, 'samples': 1313056, 'steps': 2564, 'loss/train': 2.367823600769043} -09/20/2021 23:22:32 - INFO - __main__ - Step 41034: {'lr': 0.0001993312755348431, 'samples': 1313088, 'steps': 2564, 'loss/train': 3.0593934059143066} -09/20/2021 23:22:33 - INFO - __main__ - Step 41035: {'lr': 0.0001993312755348431, 'samples': 1313120, 'steps': 2564, 'loss/train': 2.571453809738159} -09/20/2021 23:22:34 - INFO - __main__ - Step 41036: {'lr': 0.0001993312755348431, 'samples': 1313152, 'steps': 2564, 'loss/train': 2.2618024349212646} -09/20/2021 23:22:34 - INFO - __main__ - Step 41037: {'lr': 0.0001993312755348431, 'samples': 1313184, 'steps': 2564, 'loss/train': 2.4268434047698975} -09/20/2021 23:22:36 - INFO - __main__ - Step 41038: {'lr': 0.0001993312755348431, 'samples': 1313216, 'steps': 2564, 'loss/train': 2.1561341285705566} -09/20/2021 23:22:37 - INFO - __main__ - Step 41039: {'lr': 0.0001993312755348431, 'samples': 1313248, 'steps': 2564, 'loss/train': 2.046999216079712} -09/20/2021 23:22:37 - INFO - __main__ - Step 41040: {'lr': 0.0001993312755348431, 'samples': 1313280, 'steps': 2564, 'loss/train': 1.9486281871795654} -09/20/2021 23:22:38 - INFO - __main__ - Step 41041: {'lr': 0.00019933053886291336, 'samples': 1313312, 'steps': 2565, 'loss/train': 2.4529576301574707} -09/20/2021 23:22:39 - INFO - __main__ - Step 41042: {'lr': 0.00019933053886291336, 'samples': 1313344, 'steps': 2565, 'loss/train': 1.9527689218521118} -09/20/2021 23:22:40 - INFO - __main__ - Step 41043: {'lr': 0.00019933053886291336, 'samples': 1313376, 'steps': 2565, 'loss/train': 1.9999053478240967} -09/20/2021 23:22:41 - INFO - __main__ - Step 41044: {'lr': 0.00019933053886291336, 'samples': 1313408, 'steps': 2565, 'loss/train': 1.7304725646972656} -09/20/2021 23:22:41 - INFO - __main__ - Step 41045: {'lr': 0.00019933053886291336, 'samples': 1313440, 'steps': 2565, 'loss/train': 2.6145522594451904} -09/20/2021 23:22:42 - INFO - __main__ - Step 41046: {'lr': 0.00019933053886291336, 'samples': 1313472, 'steps': 2565, 'loss/train': 3.4591352939605713} -09/20/2021 23:22:43 - INFO - __main__ - Step 41047: {'lr': 0.00019933053886291336, 'samples': 1313504, 'steps': 2565, 'loss/train': 2.21061110496521} -09/20/2021 23:22:44 - INFO - __main__ - Step 41048: {'lr': 0.00019933053886291336, 'samples': 1313536, 'steps': 2565, 'loss/train': 1.700112223625183} -09/20/2021 23:22:44 - INFO - __main__ - Step 41049: {'lr': 0.00019933053886291336, 'samples': 1313568, 'steps': 2565, 'loss/train': 2.626030206680298} -09/20/2021 23:22:45 - INFO - __main__ - Step 41050: {'lr': 0.00019933053886291336, 'samples': 1313600, 'steps': 2565, 'loss/train': 1.6071522235870361} -09/20/2021 23:22:46 - INFO - __main__ - Step 41051: {'lr': 0.00019933053886291336, 'samples': 1313632, 'steps': 2565, 'loss/train': 1.5497835874557495} -09/20/2021 23:22:47 - INFO - __main__ - Step 41052: {'lr': 0.00019933053886291336, 'samples': 1313664, 'steps': 2565, 'loss/train': 1.7516095638275146} -09/20/2021 23:22:47 - INFO - __main__ - Step 41053: {'lr': 0.00019933053886291336, 'samples': 1313696, 'steps': 2565, 'loss/train': 1.0882669687271118} -09/20/2021 23:22:48 - INFO - __main__ - Step 41054: {'lr': 0.00019933053886291336, 'samples': 1313728, 'steps': 2565, 'loss/train': 2.1334726810455322} -09/20/2021 23:22:49 - INFO - __main__ - Step 41055: {'lr': 0.00019933053886291336, 'samples': 1313760, 'steps': 2565, 'loss/train': 2.346353054046631} -09/20/2021 23:22:50 - INFO - __main__ - Step 41056: {'lr': 0.00019933053886291336, 'samples': 1313792, 'steps': 2565, 'loss/train': 1.748793363571167} -09/20/2021 23:22:51 - INFO - __main__ - Step 41057: {'lr': 0.00019932980178680808, 'samples': 1313824, 'steps': 2566, 'loss/train': 2.168290853500366} -09/20/2021 23:22:51 - INFO - __main__ - Step 41058: {'lr': 0.00019932980178680808, 'samples': 1313856, 'steps': 2566, 'loss/train': 1.7415999174118042} -09/20/2021 23:22:52 - INFO - __main__ - Step 41059: {'lr': 0.00019932980178680808, 'samples': 1313888, 'steps': 2566, 'loss/train': 1.902869462966919} -09/20/2021 23:22:53 - INFO - __main__ - Step 41060: {'lr': 0.00019932980178680808, 'samples': 1313920, 'steps': 2566, 'loss/train': 2.008955478668213} -09/20/2021 23:22:53 - INFO - __main__ - Step 41061: {'lr': 0.00019932980178680808, 'samples': 1313952, 'steps': 2566, 'loss/train': 2.271286964416504} -09/20/2021 23:22:54 - INFO - __main__ - Step 41062: {'lr': 0.00019932980178680808, 'samples': 1313984, 'steps': 2566, 'loss/train': 2.3264644145965576} -09/20/2021 23:22:55 - INFO - __main__ - Step 41063: {'lr': 0.00019932980178680808, 'samples': 1314016, 'steps': 2566, 'loss/train': 1.0046379566192627} -09/20/2021 23:22:56 - INFO - __main__ - Step 41064: {'lr': 0.00019932980178680808, 'samples': 1314048, 'steps': 2566, 'loss/train': 2.5956993103027344} -09/20/2021 23:22:56 - INFO - __main__ - Step 41065: {'lr': 0.00019932980178680808, 'samples': 1314080, 'steps': 2566, 'loss/train': 2.453012466430664} -09/20/2021 23:22:57 - INFO - __main__ - Step 41066: {'lr': 0.00019932980178680808, 'samples': 1314112, 'steps': 2566, 'loss/train': 2.2045481204986572} -09/20/2021 23:22:58 - INFO - __main__ - Step 41067: {'lr': 0.00019932980178680808, 'samples': 1314144, 'steps': 2566, 'loss/train': 1.4562456607818604} -09/20/2021 23:22:59 - INFO - __main__ - Step 41068: {'lr': 0.00019932980178680808, 'samples': 1314176, 'steps': 2566, 'loss/train': 0.38212743401527405} -09/20/2021 23:22:59 - INFO - __main__ - Step 41069: {'lr': 0.00019932980178680808, 'samples': 1314208, 'steps': 2566, 'loss/train': 2.1526670455932617} -09/20/2021 23:23:00 - INFO - __main__ - Step 41070: {'lr': 0.00019932980178680808, 'samples': 1314240, 'steps': 2566, 'loss/train': 2.185708522796631} -09/20/2021 23:23:02 - INFO - __main__ - Step 41071: {'lr': 0.00019932980178680808, 'samples': 1314272, 'steps': 2566, 'loss/train': 1.916236162185669} -09/20/2021 23:23:02 - INFO - __main__ - Step 41072: {'lr': 0.00019932980178680808, 'samples': 1314304, 'steps': 2566, 'loss/train': 0.3995455503463745} -09/20/2021 23:23:03 - INFO - __main__ - Step 41073: {'lr': 0.00019932906430653017, 'samples': 1314336, 'steps': 2567, 'loss/train': 2.9894092082977295} -09/20/2021 23:23:04 - INFO - __main__ - Step 41074: {'lr': 0.00019932906430653017, 'samples': 1314368, 'steps': 2567, 'loss/train': 2.1525065898895264} -09/20/2021 23:23:05 - INFO - __main__ - Step 41075: {'lr': 0.00019932906430653017, 'samples': 1314400, 'steps': 2567, 'loss/train': 2.313100814819336} -09/20/2021 23:23:05 - INFO - __main__ - Step 41076: {'lr': 0.00019932906430653017, 'samples': 1314432, 'steps': 2567, 'loss/train': 2.3177292346954346} -09/20/2021 23:23:06 - INFO - __main__ - Step 41077: {'lr': 0.00019932906430653017, 'samples': 1314464, 'steps': 2567, 'loss/train': 1.576464295387268} -09/20/2021 23:23:07 - INFO - __main__ - Step 41078: {'lr': 0.00019932906430653017, 'samples': 1314496, 'steps': 2567, 'loss/train': 2.600532054901123} -09/20/2021 23:23:08 - INFO - __main__ - Step 41079: {'lr': 0.00019932906430653017, 'samples': 1314528, 'steps': 2567, 'loss/train': 1.9584987163543701} -09/20/2021 23:23:08 - INFO - __main__ - Step 41080: {'lr': 0.00019932906430653017, 'samples': 1314560, 'steps': 2567, 'loss/train': 5.642662048339844} -09/20/2021 23:23:09 - INFO - __main__ - Step 41081: {'lr': 0.00019932906430653017, 'samples': 1314592, 'steps': 2567, 'loss/train': 1.8246127367019653} -09/20/2021 23:23:10 - INFO - __main__ - Step 41082: {'lr': 0.00019932906430653017, 'samples': 1314624, 'steps': 2567, 'loss/train': 1.363207459449768} -09/20/2021 23:23:11 - INFO - __main__ - Step 41083: {'lr': 0.00019932906430653017, 'samples': 1314656, 'steps': 2567, 'loss/train': 1.6814846992492676} -09/20/2021 23:23:11 - INFO - __main__ - Step 41084: {'lr': 0.00019932906430653017, 'samples': 1314688, 'steps': 2567, 'loss/train': 1.683513879776001} -09/20/2021 23:23:12 - INFO - __main__ - Step 41085: {'lr': 0.00019932906430653017, 'samples': 1314720, 'steps': 2567, 'loss/train': 2.9246139526367188} -09/20/2021 23:23:13 - INFO - __main__ - Step 41086: {'lr': 0.00019932906430653017, 'samples': 1314752, 'steps': 2567, 'loss/train': 2.4521164894104004} -09/20/2021 23:23:14 - INFO - __main__ - Step 41087: {'lr': 0.00019932906430653017, 'samples': 1314784, 'steps': 2567, 'loss/train': 2.239534378051758} -09/20/2021 23:23:14 - INFO - __main__ - Step 41088: {'lr': 0.00019932906430653017, 'samples': 1314816, 'steps': 2567, 'loss/train': 1.720396637916565} -09/20/2021 23:23:15 - INFO - __main__ - Step 41089: {'lr': 0.0001993283264220827, 'samples': 1314848, 'steps': 2568, 'loss/train': 1.9202343225479126} -09/20/2021 23:23:16 - INFO - __main__ - Step 41090: {'lr': 0.0001993283264220827, 'samples': 1314880, 'steps': 2568, 'loss/train': 1.6102808713912964} -09/20/2021 23:23:17 - INFO - __main__ - Step 41091: {'lr': 0.0001993283264220827, 'samples': 1314912, 'steps': 2568, 'loss/train': 2.2952826023101807} -09/20/2021 23:23:18 - INFO - __main__ - Step 41092: {'lr': 0.0001993283264220827, 'samples': 1314944, 'steps': 2568, 'loss/train': 1.7447235584259033} -09/20/2021 23:23:18 - INFO - __main__ - Step 41093: {'lr': 0.0001993283264220827, 'samples': 1314976, 'steps': 2568, 'loss/train': 3.4256629943847656} -09/20/2021 23:23:19 - INFO - __main__ - Step 41094: {'lr': 0.0001993283264220827, 'samples': 1315008, 'steps': 2568, 'loss/train': 1.9197232723236084} -09/20/2021 23:23:20 - INFO - __main__ - Step 41095: {'lr': 0.0001993283264220827, 'samples': 1315040, 'steps': 2568, 'loss/train': 2.5468268394470215} -09/20/2021 23:23:21 - INFO - __main__ - Step 41096: {'lr': 0.0001993283264220827, 'samples': 1315072, 'steps': 2568, 'loss/train': 2.1792588233947754} -09/20/2021 23:23:21 - INFO - __main__ - Step 41097: {'lr': 0.0001993283264220827, 'samples': 1315104, 'steps': 2568, 'loss/train': 1.4970179796218872} -09/20/2021 23:23:22 - INFO - __main__ - Step 41098: {'lr': 0.0001993283264220827, 'samples': 1315136, 'steps': 2568, 'loss/train': 1.4898321628570557} -09/20/2021 23:23:23 - INFO - __main__ - Step 41099: {'lr': 0.0001993283264220827, 'samples': 1315168, 'steps': 2568, 'loss/train': 1.9538055658340454} -09/20/2021 23:23:24 - INFO - __main__ - Step 41100: {'lr': 0.0001993283264220827, 'samples': 1315200, 'steps': 2568, 'loss/train': 0.8080394864082336} -09/20/2021 23:23:24 - INFO - __main__ - Step 41101: {'lr': 0.0001993283264220827, 'samples': 1315232, 'steps': 2568, 'loss/train': 2.8283345699310303} -09/20/2021 23:23:26 - INFO - __main__ - Step 41102: {'lr': 0.0001993283264220827, 'samples': 1315264, 'steps': 2568, 'loss/train': 1.4494503736495972} -09/20/2021 23:23:27 - INFO - __main__ - Step 41103: {'lr': 0.0001993283264220827, 'samples': 1315296, 'steps': 2568, 'loss/train': 2.5440802574157715} -09/20/2021 23:23:27 - INFO - __main__ - Step 41104: {'lr': 0.0001993283264220827, 'samples': 1315328, 'steps': 2568, 'loss/train': 2.0651464462280273} -09/20/2021 23:23:28 - INFO - __main__ - Step 41105: {'lr': 0.00019932758813346867, 'samples': 1315360, 'steps': 2569, 'loss/train': 2.355163812637329} -09/20/2021 23:23:29 - INFO - __main__ - Step 41106: {'lr': 0.00019932758813346867, 'samples': 1315392, 'steps': 2569, 'loss/train': 1.665268063545227} -09/20/2021 23:23:30 - INFO - __main__ - Step 41107: {'lr': 0.00019932758813346867, 'samples': 1315424, 'steps': 2569, 'loss/train': 1.1311120986938477} -09/20/2021 23:23:31 - INFO - __main__ - Step 41108: {'lr': 0.00019932758813346867, 'samples': 1315456, 'steps': 2569, 'loss/train': 0.6715006828308105} -09/20/2021 23:23:31 - INFO - __main__ - Step 41109: {'lr': 0.00019932758813346867, 'samples': 1315488, 'steps': 2569, 'loss/train': 1.196489930152893} -09/20/2021 23:23:32 - INFO - __main__ - Step 41110: {'lr': 0.00019932758813346867, 'samples': 1315520, 'steps': 2569, 'loss/train': 0.7129443287849426} -09/20/2021 23:23:33 - INFO - __main__ - Step 41111: {'lr': 0.00019932758813346867, 'samples': 1315552, 'steps': 2569, 'loss/train': 0.8324160575866699} -09/20/2021 23:23:34 - INFO - __main__ - Step 41112: {'lr': 0.00019932758813346867, 'samples': 1315584, 'steps': 2569, 'loss/train': 1.0050684213638306} -09/20/2021 23:23:34 - INFO - __main__ - Step 41113: {'lr': 0.00019932758813346867, 'samples': 1315616, 'steps': 2569, 'loss/train': 0.6273438334465027} -09/20/2021 23:23:35 - INFO - __main__ - Step 41114: {'lr': 0.00019932758813346867, 'samples': 1315648, 'steps': 2569, 'loss/train': 0.7148259878158569} -09/20/2021 23:23:36 - INFO - __main__ - Step 41115: {'lr': 0.00019932758813346867, 'samples': 1315680, 'steps': 2569, 'loss/train': 1.8895138502120972} -09/20/2021 23:23:37 - INFO - __main__ - Step 41116: {'lr': 0.00019932758813346867, 'samples': 1315712, 'steps': 2569, 'loss/train': 2.0517475605010986} -09/20/2021 23:23:37 - INFO - __main__ - Step 41117: {'lr': 0.00019932758813346867, 'samples': 1315744, 'steps': 2569, 'loss/train': 2.3172049522399902} -09/20/2021 23:23:38 - INFO - __main__ - Step 41118: {'lr': 0.00019932758813346867, 'samples': 1315776, 'steps': 2569, 'loss/train': 1.4442366361618042} -09/20/2021 23:23:39 - INFO - __main__ - Step 41119: {'lr': 0.00019932758813346867, 'samples': 1315808, 'steps': 2569, 'loss/train': 1.9554154872894287} -09/20/2021 23:23:40 - INFO - __main__ - Step 41120: {'lr': 0.00019932758813346867, 'samples': 1315840, 'steps': 2569, 'loss/train': 2.015101194381714} -09/20/2021 23:23:40 - INFO - __main__ - Step 41121: {'lr': 0.00019932684944069107, 'samples': 1315872, 'steps': 2570, 'loss/train': 2.262070894241333} -09/20/2021 23:23:41 - INFO - __main__ - Step 41122: {'lr': 0.00019932684944069107, 'samples': 1315904, 'steps': 2570, 'loss/train': 2.246072769165039} -09/20/2021 23:23:42 - INFO - __main__ - Step 41123: {'lr': 0.00019932684944069107, 'samples': 1315936, 'steps': 2570, 'loss/train': 1.6231950521469116} -09/20/2021 23:23:43 - INFO - __main__ - Step 41124: {'lr': 0.00019932684944069107, 'samples': 1315968, 'steps': 2570, 'loss/train': 0.3370901346206665} -09/20/2021 23:23:43 - INFO - __main__ - Step 41125: {'lr': 0.00019932684944069107, 'samples': 1316000, 'steps': 2570, 'loss/train': 2.113002300262451} -09/20/2021 23:23:44 - INFO - __main__ - Step 41126: {'lr': 0.00019932684944069107, 'samples': 1316032, 'steps': 2570, 'loss/train': 2.875264883041382} -09/20/2021 23:23:45 - INFO - __main__ - Step 41127: {'lr': 0.00019932684944069107, 'samples': 1316064, 'steps': 2570, 'loss/train': 1.8535624742507935} -09/20/2021 23:23:46 - INFO - __main__ - Step 41128: {'lr': 0.00019932684944069107, 'samples': 1316096, 'steps': 2570, 'loss/train': 1.6128222942352295} -09/20/2021 23:23:46 - INFO - __main__ - Step 41129: {'lr': 0.00019932684944069107, 'samples': 1316128, 'steps': 2570, 'loss/train': 2.290717601776123} -09/20/2021 23:23:47 - INFO - __main__ - Step 41130: {'lr': 0.00019932684944069107, 'samples': 1316160, 'steps': 2570, 'loss/train': 1.8733628988265991} -09/20/2021 23:23:48 - INFO - __main__ - Step 41131: {'lr': 0.00019932684944069107, 'samples': 1316192, 'steps': 2570, 'loss/train': 1.7327927350997925} -09/20/2021 23:23:49 - INFO - __main__ - Step 41132: {'lr': 0.00019932684944069107, 'samples': 1316224, 'steps': 2570, 'loss/train': 1.817286491394043} -09/20/2021 23:23:49 - INFO - __main__ - Step 41133: {'lr': 0.00019932684944069107, 'samples': 1316256, 'steps': 2570, 'loss/train': 1.8604336977005005} -09/20/2021 23:23:50 - INFO - __main__ - Step 41134: {'lr': 0.00019932684944069107, 'samples': 1316288, 'steps': 2570, 'loss/train': 2.2412374019622803} -09/20/2021 23:23:51 - INFO - __main__ - Step 41135: {'lr': 0.00019932684944069107, 'samples': 1316320, 'steps': 2570, 'loss/train': 2.794614553451538} -09/20/2021 23:23:52 - INFO - __main__ - Step 41136: {'lr': 0.00019932684944069107, 'samples': 1316352, 'steps': 2570, 'loss/train': 2.598905563354492} -09/20/2021 23:23:53 - INFO - __main__ - Step 41137: {'lr': 0.00019932611034375287, 'samples': 1316384, 'steps': 2571, 'loss/train': 1.3259437084197998} -09/20/2021 23:23:54 - INFO - __main__ - Step 41138: {'lr': 0.00019932611034375287, 'samples': 1316416, 'steps': 2571, 'loss/train': 1.413962721824646} -09/20/2021 23:23:55 - INFO - __main__ - Step 41139: {'lr': 0.00019932611034375287, 'samples': 1316448, 'steps': 2571, 'loss/train': 2.655200958251953} -09/20/2021 23:23:56 - INFO - __main__ - Step 41140: {'lr': 0.00019932611034375287, 'samples': 1316480, 'steps': 2571, 'loss/train': 1.8092107772827148} -09/20/2021 23:23:57 - INFO - __main__ - Step 41141: {'lr': 0.00019932611034375287, 'samples': 1316512, 'steps': 2571, 'loss/train': 1.7525758743286133} -09/20/2021 23:23:57 - INFO - __main__ - Step 41142: {'lr': 0.00019932611034375287, 'samples': 1316544, 'steps': 2571, 'loss/train': 1.3948867321014404} -09/20/2021 23:23:58 - INFO - __main__ - Step 41143: {'lr': 0.00019932611034375287, 'samples': 1316576, 'steps': 2571, 'loss/train': 3.189724922180176} -09/20/2021 23:23:59 - INFO - __main__ - Step 41144: {'lr': 0.00019932611034375287, 'samples': 1316608, 'steps': 2571, 'loss/train': 1.683995246887207} -09/20/2021 23:24:00 - INFO - __main__ - Step 41145: {'lr': 0.00019932611034375287, 'samples': 1316640, 'steps': 2571, 'loss/train': 2.0800628662109375} -09/20/2021 23:24:00 - INFO - __main__ - Step 41146: {'lr': 0.00019932611034375287, 'samples': 1316672, 'steps': 2571, 'loss/train': 0.8531234264373779} -09/20/2021 23:24:01 - INFO - __main__ - Step 41147: {'lr': 0.00019932611034375287, 'samples': 1316704, 'steps': 2571, 'loss/train': 1.9287036657333374} -09/20/2021 23:24:02 - INFO - __main__ - Step 41148: {'lr': 0.00019932611034375287, 'samples': 1316736, 'steps': 2571, 'loss/train': 2.1073520183563232} -09/20/2021 23:24:03 - INFO - __main__ - Step 41149: {'lr': 0.00019932611034375287, 'samples': 1316768, 'steps': 2571, 'loss/train': 1.9309207201004028} -09/20/2021 23:24:03 - INFO - __main__ - Step 41150: {'lr': 0.00019932611034375287, 'samples': 1316800, 'steps': 2571, 'loss/train': 2.7292861938476562} -09/20/2021 23:24:04 - INFO - __main__ - Step 41151: {'lr': 0.00019932611034375287, 'samples': 1316832, 'steps': 2571, 'loss/train': 0.3237740397453308} -09/20/2021 23:24:05 - INFO - __main__ - Step 41152: {'lr': 0.00019932611034375287, 'samples': 1316864, 'steps': 2571, 'loss/train': 2.6422739028930664} -09/20/2021 23:24:06 - INFO - __main__ - Step 41153: {'lr': 0.00019932537084265715, 'samples': 1316896, 'steps': 2572, 'loss/train': 1.9629987478256226} -09/20/2021 23:24:06 - INFO - __main__ - Step 41154: {'lr': 0.00019932537084265715, 'samples': 1316928, 'steps': 2572, 'loss/train': 2.2007057666778564} -09/20/2021 23:24:07 - INFO - __main__ - Step 41155: {'lr': 0.00019932537084265715, 'samples': 1316960, 'steps': 2572, 'loss/train': 1.3881926536560059} -09/20/2021 23:24:08 - INFO - __main__ - Step 41156: {'lr': 0.00019932537084265715, 'samples': 1316992, 'steps': 2572, 'loss/train': 1.5833114385604858} -09/20/2021 23:24:09 - INFO - __main__ - Step 41157: {'lr': 0.00019932537084265715, 'samples': 1317024, 'steps': 2572, 'loss/train': 1.7183361053466797} -09/20/2021 23:24:09 - INFO - __main__ - Step 41158: {'lr': 0.00019932537084265715, 'samples': 1317056, 'steps': 2572, 'loss/train': 2.41605806350708} -09/20/2021 23:24:10 - INFO - __main__ - Step 41159: {'lr': 0.00019932537084265715, 'samples': 1317088, 'steps': 2572, 'loss/train': 1.4161962270736694} -09/20/2021 23:24:11 - INFO - __main__ - Step 41160: {'lr': 0.00019932537084265715, 'samples': 1317120, 'steps': 2572, 'loss/train': 2.4875147342681885} -09/20/2021 23:24:12 - INFO - __main__ - Step 41161: {'lr': 0.00019932537084265715, 'samples': 1317152, 'steps': 2572, 'loss/train': 1.6268553733825684} -09/20/2021 23:24:12 - INFO - __main__ - Step 41162: {'lr': 0.00019932537084265715, 'samples': 1317184, 'steps': 2572, 'loss/train': 1.356604814529419} -09/20/2021 23:24:13 - INFO - __main__ - Step 41163: {'lr': 0.00019932537084265715, 'samples': 1317216, 'steps': 2572, 'loss/train': 2.34289813041687} -09/20/2021 23:24:14 - INFO - __main__ - Step 41164: {'lr': 0.00019932537084265715, 'samples': 1317248, 'steps': 2572, 'loss/train': 2.1679205894470215} -09/20/2021 23:24:15 - INFO - __main__ - Step 41165: {'lr': 0.00019932537084265715, 'samples': 1317280, 'steps': 2572, 'loss/train': 1.941328763961792} -09/20/2021 23:24:15 - INFO - __main__ - Step 41166: {'lr': 0.00019932537084265715, 'samples': 1317312, 'steps': 2572, 'loss/train': 2.456913948059082} -09/20/2021 23:24:16 - INFO - __main__ - Step 41167: {'lr': 0.00019932537084265715, 'samples': 1317344, 'steps': 2572, 'loss/train': 2.1029810905456543} -09/20/2021 23:24:17 - INFO - __main__ - Step 41168: {'lr': 0.00019932537084265715, 'samples': 1317376, 'steps': 2572, 'loss/train': 2.2076642513275146} -09/20/2021 23:24:19 - INFO - __main__ - Step 41169: {'lr': 0.00019932463093740688, 'samples': 1317408, 'steps': 2573, 'loss/train': 2.5577011108398438} -09/20/2021 23:24:19 - INFO - __main__ - Step 41170: {'lr': 0.00019932463093740688, 'samples': 1317440, 'steps': 2573, 'loss/train': 2.4621477127075195} -09/20/2021 23:24:20 - INFO - __main__ - Step 41171: {'lr': 0.00019932463093740688, 'samples': 1317472, 'steps': 2573, 'loss/train': 2.126079559326172} -09/20/2021 23:24:21 - INFO - __main__ - Step 41172: {'lr': 0.00019932463093740688, 'samples': 1317504, 'steps': 2573, 'loss/train': 2.308915853500366} -09/20/2021 23:24:22 - INFO - __main__ - Step 41173: {'lr': 0.00019932463093740688, 'samples': 1317536, 'steps': 2573, 'loss/train': 2.479127883911133} -09/20/2021 23:24:22 - INFO - __main__ - Step 41174: {'lr': 0.00019932463093740688, 'samples': 1317568, 'steps': 2573, 'loss/train': 2.748331308364868} -09/20/2021 23:24:23 - INFO - __main__ - Step 41175: {'lr': 0.00019932463093740688, 'samples': 1317600, 'steps': 2573, 'loss/train': 2.478454828262329} -09/20/2021 23:24:24 - INFO - __main__ - Step 41176: {'lr': 0.00019932463093740688, 'samples': 1317632, 'steps': 2573, 'loss/train': 2.4869818687438965} -09/20/2021 23:24:25 - INFO - __main__ - Step 41177: {'lr': 0.00019932463093740688, 'samples': 1317664, 'steps': 2573, 'loss/train': 1.9071342945098877} -09/20/2021 23:24:25 - INFO - __main__ - Step 41178: {'lr': 0.00019932463093740688, 'samples': 1317696, 'steps': 2573, 'loss/train': 1.6088483333587646} -09/20/2021 23:24:26 - INFO - __main__ - Step 41179: {'lr': 0.00019932463093740688, 'samples': 1317728, 'steps': 2573, 'loss/train': 1.5948563814163208} -09/20/2021 23:24:27 - INFO - __main__ - Step 41180: {'lr': 0.00019932463093740688, 'samples': 1317760, 'steps': 2573, 'loss/train': 1.636343002319336} -09/20/2021 23:24:28 - INFO - __main__ - Step 41181: {'lr': 0.00019932463093740688, 'samples': 1317792, 'steps': 2573, 'loss/train': 2.6972060203552246} -09/20/2021 23:24:28 - INFO - __main__ - Step 41182: {'lr': 0.00019932463093740688, 'samples': 1317824, 'steps': 2573, 'loss/train': 1.9818428754806519} -09/20/2021 23:24:29 - INFO - __main__ - Step 41183: {'lr': 0.00019932463093740688, 'samples': 1317856, 'steps': 2573, 'loss/train': 1.6565195322036743} -09/20/2021 23:24:30 - INFO - __main__ - Step 41184: {'lr': 0.00019932463093740688, 'samples': 1317888, 'steps': 2573, 'loss/train': 1.3378760814666748} -09/20/2021 23:24:31 - INFO - __main__ - Step 41185: {'lr': 0.00019932389062800505, 'samples': 1317920, 'steps': 2574, 'loss/train': 2.1976935863494873} -09/20/2021 23:24:31 - INFO - __main__ - Step 41186: {'lr': 0.00019932389062800505, 'samples': 1317952, 'steps': 2574, 'loss/train': 2.104618549346924} -09/20/2021 23:24:32 - INFO - __main__ - Step 41187: {'lr': 0.00019932389062800505, 'samples': 1317984, 'steps': 2574, 'loss/train': 2.1650197505950928} -09/20/2021 23:24:33 - INFO - __main__ - Step 41188: {'lr': 0.00019932389062800505, 'samples': 1318016, 'steps': 2574, 'loss/train': 2.1923611164093018} -09/20/2021 23:24:34 - INFO - __main__ - Step 41189: {'lr': 0.00019932389062800505, 'samples': 1318048, 'steps': 2574, 'loss/train': 1.5699721574783325} -09/20/2021 23:24:34 - INFO - __main__ - Step 41190: {'lr': 0.00019932389062800505, 'samples': 1318080, 'steps': 2574, 'loss/train': 2.409942388534546} -09/20/2021 23:24:35 - INFO - __main__ - Step 41191: {'lr': 0.00019932389062800505, 'samples': 1318112, 'steps': 2574, 'loss/train': 2.1725666522979736} -09/20/2021 23:24:36 - INFO - __main__ - Step 41192: {'lr': 0.00019932389062800505, 'samples': 1318144, 'steps': 2574, 'loss/train': 2.0819971561431885} -09/20/2021 23:24:37 - INFO - __main__ - Step 41193: {'lr': 0.00019932389062800505, 'samples': 1318176, 'steps': 2574, 'loss/train': 1.7549220323562622} -09/20/2021 23:24:37 - INFO - __main__ - Step 41194: {'lr': 0.00019932389062800505, 'samples': 1318208, 'steps': 2574, 'loss/train': 4.181841850280762} -09/20/2021 23:24:38 - INFO - __main__ - Step 41195: {'lr': 0.00019932389062800505, 'samples': 1318240, 'steps': 2574, 'loss/train': 2.0600156784057617} -09/20/2021 23:24:39 - INFO - __main__ - Step 41196: {'lr': 0.00019932389062800505, 'samples': 1318272, 'steps': 2574, 'loss/train': 1.5275790691375732} -09/20/2021 23:24:40 - INFO - __main__ - Step 41197: {'lr': 0.00019932389062800505, 'samples': 1318304, 'steps': 2574, 'loss/train': 2.111576795578003} -09/20/2021 23:24:40 - INFO - __main__ - Step 41198: {'lr': 0.00019932389062800505, 'samples': 1318336, 'steps': 2574, 'loss/train': 2.3268489837646484} -09/20/2021 23:24:42 - INFO - __main__ - Step 41199: {'lr': 0.00019932389062800505, 'samples': 1318368, 'steps': 2574, 'loss/train': 2.7036454677581787} -09/20/2021 23:24:43 - INFO - __main__ - Step 41200: {'lr': 0.00019932389062800505, 'samples': 1318400, 'steps': 2574, 'loss/train': 2.8848204612731934} -09/20/2021 23:24:43 - INFO - __main__ - Step 41201: {'lr': 0.0001993231499144547, 'samples': 1318432, 'steps': 2575, 'loss/train': 1.2743144035339355} -09/20/2021 23:24:44 - INFO - __main__ - Step 41202: {'lr': 0.0001993231499144547, 'samples': 1318464, 'steps': 2575, 'loss/train': 1.8181633949279785} -09/20/2021 23:24:45 - INFO - __main__ - Step 41203: {'lr': 0.0001993231499144547, 'samples': 1318496, 'steps': 2575, 'loss/train': 2.178807497024536} -09/20/2021 23:24:46 - INFO - __main__ - Step 41204: {'lr': 0.0001993231499144547, 'samples': 1318528, 'steps': 2575, 'loss/train': 1.2865147590637207} -09/20/2021 23:24:46 - INFO - __main__ - Step 41205: {'lr': 0.0001993231499144547, 'samples': 1318560, 'steps': 2575, 'loss/train': 2.301386594772339} -09/20/2021 23:24:47 - INFO - __main__ - Step 41206: {'lr': 0.0001993231499144547, 'samples': 1318592, 'steps': 2575, 'loss/train': 2.1842005252838135} -09/20/2021 23:24:48 - INFO - __main__ - Step 41207: {'lr': 0.0001993231499144547, 'samples': 1318624, 'steps': 2575, 'loss/train': 1.955274224281311} -09/20/2021 23:24:49 - INFO - __main__ - Step 41208: {'lr': 0.0001993231499144547, 'samples': 1318656, 'steps': 2575, 'loss/train': 2.9571566581726074} -09/20/2021 23:24:49 - INFO - __main__ - Step 41209: {'lr': 0.0001993231499144547, 'samples': 1318688, 'steps': 2575, 'loss/train': 1.888965368270874} -09/20/2021 23:24:50 - INFO - __main__ - Step 41210: {'lr': 0.0001993231499144547, 'samples': 1318720, 'steps': 2575, 'loss/train': 2.3662161827087402} -09/20/2021 23:24:51 - INFO - __main__ - Step 41211: {'lr': 0.0001993231499144547, 'samples': 1318752, 'steps': 2575, 'loss/train': 1.367557406425476} -09/20/2021 23:24:52 - INFO - __main__ - Step 41212: {'lr': 0.0001993231499144547, 'samples': 1318784, 'steps': 2575, 'loss/train': 2.1489689350128174} -09/20/2021 23:24:52 - INFO - __main__ - Step 41213: {'lr': 0.0001993231499144547, 'samples': 1318816, 'steps': 2575, 'loss/train': 2.651772975921631} -09/20/2021 23:24:53 - INFO - __main__ - Step 41214: {'lr': 0.0001993231499144547, 'samples': 1318848, 'steps': 2575, 'loss/train': 2.3211865425109863} -09/20/2021 23:24:54 - INFO - __main__ - Step 41215: {'lr': 0.0001993231499144547, 'samples': 1318880, 'steps': 2575, 'loss/train': 2.2635157108306885} -09/20/2021 23:24:55 - INFO - __main__ - Step 41216: {'lr': 0.0001993231499144547, 'samples': 1318912, 'steps': 2575, 'loss/train': 1.6511458158493042} -09/20/2021 23:24:56 - INFO - __main__ - Step 41217: {'lr': 0.00019932240879675885, 'samples': 1318944, 'steps': 2576, 'loss/train': 2.0155258178710938} -09/20/2021 23:24:56 - INFO - __main__ - Step 41218: {'lr': 0.00019932240879675885, 'samples': 1318976, 'steps': 2576, 'loss/train': 1.8100388050079346} -09/20/2021 23:24:57 - INFO - __main__ - Step 41219: {'lr': 0.00019932240879675885, 'samples': 1319008, 'steps': 2576, 'loss/train': 1.092813491821289} -09/20/2021 23:24:58 - INFO - __main__ - Step 41220: {'lr': 0.00019932240879675885, 'samples': 1319040, 'steps': 2576, 'loss/train': 2.5323848724365234} -09/20/2021 23:24:59 - INFO - __main__ - Step 41221: {'lr': 0.00019932240879675885, 'samples': 1319072, 'steps': 2576, 'loss/train': 1.5978124141693115} -09/20/2021 23:24:59 - INFO - __main__ - Step 41222: {'lr': 0.00019932240879675885, 'samples': 1319104, 'steps': 2576, 'loss/train': 1.6704275608062744} -09/20/2021 23:25:00 - INFO - __main__ - Step 41223: {'lr': 0.00019932240879675885, 'samples': 1319136, 'steps': 2576, 'loss/train': 1.540116548538208} -09/20/2021 23:25:01 - INFO - __main__ - Step 41224: {'lr': 0.00019932240879675885, 'samples': 1319168, 'steps': 2576, 'loss/train': 1.6956076622009277} -09/20/2021 23:25:02 - INFO - __main__ - Step 41225: {'lr': 0.00019932240879675885, 'samples': 1319200, 'steps': 2576, 'loss/train': 3.0974948406219482} -09/20/2021 23:25:02 - INFO - __main__ - Step 41226: {'lr': 0.00019932240879675885, 'samples': 1319232, 'steps': 2576, 'loss/train': 1.3302319049835205} -09/20/2021 23:25:03 - INFO - __main__ - Step 41227: {'lr': 0.00019932240879675885, 'samples': 1319264, 'steps': 2576, 'loss/train': 2.3611443042755127} -09/20/2021 23:25:04 - INFO - __main__ - Step 41228: {'lr': 0.00019932240879675885, 'samples': 1319296, 'steps': 2576, 'loss/train': 2.418962001800537} -09/20/2021 23:25:06 - INFO - __main__ - Step 41229: {'lr': 0.00019932240879675885, 'samples': 1319328, 'steps': 2576, 'loss/train': 2.330111503601074} -09/20/2021 23:25:07 - INFO - __main__ - Step 41230: {'lr': 0.00019932240879675885, 'samples': 1319360, 'steps': 2576, 'loss/train': 2.9110422134399414} -09/20/2021 23:25:08 - INFO - __main__ - Step 41231: {'lr': 0.00019932240879675885, 'samples': 1319392, 'steps': 2576, 'loss/train': 1.74263596534729} -09/20/2021 23:25:08 - INFO - __main__ - Step 41232: {'lr': 0.00019932240879675885, 'samples': 1319424, 'steps': 2576, 'loss/train': 2.0720181465148926} -09/20/2021 23:25:09 - INFO - __main__ - Step 41233: {'lr': 0.0001993216672749205, 'samples': 1319456, 'steps': 2577, 'loss/train': 2.9519145488739014} -09/20/2021 23:25:10 - INFO - __main__ - Step 41234: {'lr': 0.0001993216672749205, 'samples': 1319488, 'steps': 2577, 'loss/train': 2.278225898742676} -09/20/2021 23:25:11 - INFO - __main__ - Step 41235: {'lr': 0.0001993216672749205, 'samples': 1319520, 'steps': 2577, 'loss/train': 1.3714674711227417} -09/20/2021 23:25:12 - INFO - __main__ - Step 41236: {'lr': 0.0001993216672749205, 'samples': 1319552, 'steps': 2577, 'loss/train': 2.6348965167999268} -09/20/2021 23:25:12 - INFO - __main__ - Step 41237: {'lr': 0.0001993216672749205, 'samples': 1319584, 'steps': 2577, 'loss/train': 1.984168529510498} -09/20/2021 23:25:13 - INFO - __main__ - Step 41238: {'lr': 0.0001993216672749205, 'samples': 1319616, 'steps': 2577, 'loss/train': 2.8937907218933105} -09/20/2021 23:25:14 - INFO - __main__ - Step 41239: {'lr': 0.0001993216672749205, 'samples': 1319648, 'steps': 2577, 'loss/train': 3.362049102783203} -09/20/2021 23:25:15 - INFO - __main__ - Step 41240: {'lr': 0.0001993216672749205, 'samples': 1319680, 'steps': 2577, 'loss/train': 1.8481935262680054} -09/20/2021 23:25:15 - INFO - __main__ - Step 41241: {'lr': 0.0001993216672749205, 'samples': 1319712, 'steps': 2577, 'loss/train': 1.2742834091186523} -09/20/2021 23:25:16 - INFO - __main__ - Step 41242: {'lr': 0.0001993216672749205, 'samples': 1319744, 'steps': 2577, 'loss/train': 1.5659396648406982} -09/20/2021 23:25:17 - INFO - __main__ - Step 41243: {'lr': 0.0001993216672749205, 'samples': 1319776, 'steps': 2577, 'loss/train': 1.2834690809249878} -09/20/2021 23:25:18 - INFO - __main__ - Step 41244: {'lr': 0.0001993216672749205, 'samples': 1319808, 'steps': 2577, 'loss/train': 2.869168519973755} -09/20/2021 23:25:18 - INFO - __main__ - Step 41245: {'lr': 0.0001993216672749205, 'samples': 1319840, 'steps': 2577, 'loss/train': 1.8915091753005981} -09/20/2021 23:25:19 - INFO - __main__ - Step 41246: {'lr': 0.0001993216672749205, 'samples': 1319872, 'steps': 2577, 'loss/train': 2.7321929931640625} -09/20/2021 23:25:20 - INFO - __main__ - Step 41247: {'lr': 0.0001993216672749205, 'samples': 1319904, 'steps': 2577, 'loss/train': 2.564134120941162} -09/20/2021 23:25:21 - INFO - __main__ - Step 41248: {'lr': 0.0001993216672749205, 'samples': 1319936, 'steps': 2577, 'loss/train': 1.9716224670410156} -09/20/2021 23:25:21 - INFO - __main__ - Step 41249: {'lr': 0.00019932092534894266, 'samples': 1319968, 'steps': 2578, 'loss/train': 1.989990234375} -09/20/2021 23:25:22 - INFO - __main__ - Step 41250: {'lr': 0.00019932092534894266, 'samples': 1320000, 'steps': 2578, 'loss/train': 2.1130807399749756} -09/20/2021 23:25:23 - INFO - __main__ - Step 41251: {'lr': 0.00019932092534894266, 'samples': 1320032, 'steps': 2578, 'loss/train': 3.919609308242798} -09/20/2021 23:25:24 - INFO - __main__ - Step 41252: {'lr': 0.00019932092534894266, 'samples': 1320064, 'steps': 2578, 'loss/train': 2.761852502822876} -09/20/2021 23:25:24 - INFO - __main__ - Step 41253: {'lr': 0.00019932092534894266, 'samples': 1320096, 'steps': 2578, 'loss/train': 3.4926698207855225} -09/20/2021 23:25:25 - INFO - __main__ - Step 41254: {'lr': 0.00019932092534894266, 'samples': 1320128, 'steps': 2578, 'loss/train': 5.3609795570373535} -09/20/2021 23:25:26 - INFO - __main__ - Step 41255: {'lr': 0.00019932092534894266, 'samples': 1320160, 'steps': 2578, 'loss/train': 5.025317192077637} -09/20/2021 23:25:27 - INFO - __main__ - Step 41256: {'lr': 0.00019932092534894266, 'samples': 1320192, 'steps': 2578, 'loss/train': 5.1946611404418945} -09/20/2021 23:25:27 - INFO - __main__ - Step 41257: {'lr': 0.00019932092534894266, 'samples': 1320224, 'steps': 2578, 'loss/train': 5.313138008117676} -09/20/2021 23:25:28 - INFO - __main__ - Step 41258: {'lr': 0.00019932092534894266, 'samples': 1320256, 'steps': 2578, 'loss/train': 5.059414863586426} -09/20/2021 23:25:29 - INFO - __main__ - Step 41259: {'lr': 0.00019932092534894266, 'samples': 1320288, 'steps': 2578, 'loss/train': 4.901602268218994} -09/20/2021 23:25:30 - INFO - __main__ - Step 41260: {'lr': 0.00019932092534894266, 'samples': 1320320, 'steps': 2578, 'loss/train': 5.023196697235107} -09/20/2021 23:25:30 - INFO - __main__ - Step 41261: {'lr': 0.00019932092534894266, 'samples': 1320352, 'steps': 2578, 'loss/train': 4.746205806732178} -09/20/2021 23:25:31 - INFO - __main__ - Step 41262: {'lr': 0.00019932092534894266, 'samples': 1320384, 'steps': 2578, 'loss/train': 5.15053653717041} -09/20/2021 23:25:32 - INFO - __main__ - Step 41263: {'lr': 0.00019932092534894266, 'samples': 1320416, 'steps': 2578, 'loss/train': 4.492410659790039} -09/20/2021 23:25:33 - INFO - __main__ - Step 41264: {'lr': 0.00019932092534894266, 'samples': 1320448, 'steps': 2578, 'loss/train': 5.189090251922607} -09/20/2021 23:25:34 - INFO - __main__ - Step 41265: {'lr': 0.0001993201830188284, 'samples': 1320480, 'steps': 2579, 'loss/train': 2.7207088470458984} -09/20/2021 23:25:34 - INFO - __main__ - Step 41266: {'lr': 0.0001993201830188284, 'samples': 1320512, 'steps': 2579, 'loss/train': 2.602522850036621} -09/20/2021 23:25:35 - INFO - __main__ - Step 41267: {'lr': 0.0001993201830188284, 'samples': 1320544, 'steps': 2579, 'loss/train': 2.5354652404785156} -09/20/2021 23:25:36 - INFO - __main__ - Step 41268: {'lr': 0.0001993201830188284, 'samples': 1320576, 'steps': 2579, 'loss/train': 2.747814655303955} -09/20/2021 23:25:37 - INFO - __main__ - Step 41269: {'lr': 0.0001993201830188284, 'samples': 1320608, 'steps': 2579, 'loss/train': 2.8371362686157227} -09/20/2021 23:25:38 - INFO - __main__ - Step 41270: {'lr': 0.0001993201830188284, 'samples': 1320640, 'steps': 2579, 'loss/train': 2.0604984760284424} -09/20/2021 23:25:39 - INFO - __main__ - Step 41271: {'lr': 0.0001993201830188284, 'samples': 1320672, 'steps': 2579, 'loss/train': 2.2379064559936523} -09/20/2021 23:25:39 - INFO - __main__ - Step 41272: {'lr': 0.0001993201830188284, 'samples': 1320704, 'steps': 2579, 'loss/train': 1.963719367980957} -09/20/2021 23:25:40 - INFO - __main__ - Step 41273: {'lr': 0.0001993201830188284, 'samples': 1320736, 'steps': 2579, 'loss/train': 1.6837165355682373} -09/20/2021 23:25:41 - INFO - __main__ - Step 41274: {'lr': 0.0001993201830188284, 'samples': 1320768, 'steps': 2579, 'loss/train': 2.241405487060547} -09/20/2021 23:25:42 - INFO - __main__ - Step 41275: {'lr': 0.0001993201830188284, 'samples': 1320800, 'steps': 2579, 'loss/train': 2.0556399822235107} -09/20/2021 23:25:42 - INFO - __main__ - Step 41276: {'lr': 0.0001993201830188284, 'samples': 1320832, 'steps': 2579, 'loss/train': 1.4381568431854248} -09/20/2021 23:25:43 - INFO - __main__ - Step 41277: {'lr': 0.0001993201830188284, 'samples': 1320864, 'steps': 2579, 'loss/train': 1.947818636894226} -09/20/2021 23:25:44 - INFO - __main__ - Step 41278: {'lr': 0.0001993201830188284, 'samples': 1320896, 'steps': 2579, 'loss/train': 1.9863229990005493} -09/20/2021 23:25:45 - INFO - __main__ - Step 41279: {'lr': 0.0001993201830188284, 'samples': 1320928, 'steps': 2579, 'loss/train': 2.21995210647583} -09/20/2021 23:25:45 - INFO - __main__ - Step 41280: {'lr': 0.0001993201830188284, 'samples': 1320960, 'steps': 2579, 'loss/train': 1.9232163429260254} -09/20/2021 23:25:46 - INFO - __main__ - Step 41281: {'lr': 0.00019931944028458065, 'samples': 1320992, 'steps': 2580, 'loss/train': 1.7063275575637817} -09/20/2021 23:25:47 - INFO - __main__ - Step 41282: {'lr': 0.00019931944028458065, 'samples': 1321024, 'steps': 2580, 'loss/train': 2.4189870357513428} -09/20/2021 23:25:48 - INFO - __main__ - Step 41283: {'lr': 0.00019931944028458065, 'samples': 1321056, 'steps': 2580, 'loss/train': 2.649721384048462} -09/20/2021 23:25:48 - INFO - __main__ - Step 41284: {'lr': 0.00019931944028458065, 'samples': 1321088, 'steps': 2580, 'loss/train': 2.5978336334228516} -09/20/2021 23:25:49 - INFO - __main__ - Step 41285: {'lr': 0.00019931944028458065, 'samples': 1321120, 'steps': 2580, 'loss/train': 2.3584213256835938} -09/20/2021 23:25:50 - INFO - __main__ - Step 41286: {'lr': 0.00019931944028458065, 'samples': 1321152, 'steps': 2580, 'loss/train': 2.147116184234619} -09/20/2021 23:25:51 - INFO - __main__ - Step 41287: {'lr': 0.00019931944028458065, 'samples': 1321184, 'steps': 2580, 'loss/train': 1.5099644660949707} -09/20/2021 23:25:51 - INFO - __main__ - Step 41288: {'lr': 0.00019931944028458065, 'samples': 1321216, 'steps': 2580, 'loss/train': 2.5204174518585205} -09/20/2021 23:25:52 - INFO - __main__ - Step 41289: {'lr': 0.00019931944028458065, 'samples': 1321248, 'steps': 2580, 'loss/train': 0.746563196182251} -09/20/2021 23:25:53 - INFO - __main__ - Step 41290: {'lr': 0.00019931944028458065, 'samples': 1321280, 'steps': 2580, 'loss/train': 0.16977956891059875} -09/20/2021 23:25:54 - INFO - __main__ - Step 41291: {'lr': 0.00019931944028458065, 'samples': 1321312, 'steps': 2580, 'loss/train': 0.2757669985294342} -09/20/2021 23:25:54 - INFO - __main__ - Step 41292: {'lr': 0.00019931944028458065, 'samples': 1321344, 'steps': 2580, 'loss/train': 2.52419114112854} -09/20/2021 23:25:55 - INFO - __main__ - Step 41293: {'lr': 0.00019931944028458065, 'samples': 1321376, 'steps': 2580, 'loss/train': 2.5326380729675293} -09/20/2021 23:25:56 - INFO - __main__ - Step 41294: {'lr': 0.00019931944028458065, 'samples': 1321408, 'steps': 2580, 'loss/train': 1.5845842361450195} -09/20/2021 23:25:57 - INFO - __main__ - Step 41295: {'lr': 0.00019931944028458065, 'samples': 1321440, 'steps': 2580, 'loss/train': 1.542237639427185} -09/20/2021 23:25:57 - INFO - __main__ - Step 41296: {'lr': 0.00019931944028458065, 'samples': 1321472, 'steps': 2580, 'loss/train': 1.6060097217559814} -09/20/2021 23:25:58 - INFO - __main__ - Step 41297: {'lr': 0.00019931869714620253, 'samples': 1321504, 'steps': 2581, 'loss/train': 1.2377781867980957} -09/20/2021 23:25:59 - INFO - __main__ - Step 41298: {'lr': 0.00019931869714620253, 'samples': 1321536, 'steps': 2581, 'loss/train': 2.043109893798828} -09/20/2021 23:26:00 - INFO - __main__ - Step 41299: {'lr': 0.00019931869714620253, 'samples': 1321568, 'steps': 2581, 'loss/train': 2.554110050201416} -09/20/2021 23:26:01 - INFO - __main__ - Step 41300: {'lr': 0.00019931869714620253, 'samples': 1321600, 'steps': 2581, 'loss/train': 1.532070279121399} -09/20/2021 23:26:02 - INFO - __main__ - Step 41301: {'lr': 0.00019931869714620253, 'samples': 1321632, 'steps': 2581, 'loss/train': 1.9904574155807495} -09/20/2021 23:26:03 - INFO - __main__ - Step 41302: {'lr': 0.00019931869714620253, 'samples': 1321664, 'steps': 2581, 'loss/train': 1.2903269529342651} -09/20/2021 23:26:03 - INFO - __main__ - Step 41303: {'lr': 0.00019931869714620253, 'samples': 1321696, 'steps': 2581, 'loss/train': 1.6817436218261719} -09/20/2021 23:26:04 - INFO - __main__ - Step 41304: {'lr': 0.00019931869714620253, 'samples': 1321728, 'steps': 2581, 'loss/train': 2.4156904220581055} -09/20/2021 23:26:05 - INFO - __main__ - Step 41305: {'lr': 0.00019931869714620253, 'samples': 1321760, 'steps': 2581, 'loss/train': 1.6715654134750366} -09/20/2021 23:26:06 - INFO - __main__ - Step 41306: {'lr': 0.00019931869714620253, 'samples': 1321792, 'steps': 2581, 'loss/train': 1.6743918657302856} -09/20/2021 23:26:06 - INFO - __main__ - Step 41307: {'lr': 0.00019931869714620253, 'samples': 1321824, 'steps': 2581, 'loss/train': 2.121279239654541} -09/20/2021 23:26:07 - INFO - __main__ - Step 41308: {'lr': 0.00019931869714620253, 'samples': 1321856, 'steps': 2581, 'loss/train': 0.2792645990848541} -09/20/2021 23:26:08 - INFO - __main__ - Step 41309: {'lr': 0.00019931869714620253, 'samples': 1321888, 'steps': 2581, 'loss/train': 2.426050901412964} -09/20/2021 23:26:09 - INFO - __main__ - Step 41310: {'lr': 0.00019931869714620253, 'samples': 1321920, 'steps': 2581, 'loss/train': 1.8264760971069336} -09/20/2021 23:26:09 - INFO - __main__ - Step 41311: {'lr': 0.00019931869714620253, 'samples': 1321952, 'steps': 2581, 'loss/train': 2.075005292892456} -09/20/2021 23:26:10 - INFO - __main__ - Step 41312: {'lr': 0.00019931869714620253, 'samples': 1321984, 'steps': 2581, 'loss/train': 1.6575969457626343} -09/20/2021 23:26:11 - INFO - __main__ - Step 41313: {'lr': 0.00019931795360369697, 'samples': 1322016, 'steps': 2582, 'loss/train': 2.818211317062378} -09/20/2021 23:26:12 - INFO - __main__ - Step 41314: {'lr': 0.00019931795360369697, 'samples': 1322048, 'steps': 2582, 'loss/train': 2.004304885864258} -09/20/2021 23:26:13 - INFO - __main__ - Step 41315: {'lr': 0.00019931795360369697, 'samples': 1322080, 'steps': 2582, 'loss/train': 3.0727086067199707} -09/20/2021 23:26:13 - INFO - __main__ - Step 41316: {'lr': 0.00019931795360369697, 'samples': 1322112, 'steps': 2582, 'loss/train': 1.5833674669265747} -09/20/2021 23:26:14 - INFO - __main__ - Step 41317: {'lr': 0.00019931795360369697, 'samples': 1322144, 'steps': 2582, 'loss/train': 1.7565393447875977} -09/20/2021 23:26:15 - INFO - __main__ - Step 41318: {'lr': 0.00019931795360369697, 'samples': 1322176, 'steps': 2582, 'loss/train': 2.064060926437378} -09/20/2021 23:26:16 - INFO - __main__ - Step 41319: {'lr': 0.00019931795360369697, 'samples': 1322208, 'steps': 2582, 'loss/train': 2.264647960662842} -09/20/2021 23:26:16 - INFO - __main__ - Step 41320: {'lr': 0.00019931795360369697, 'samples': 1322240, 'steps': 2582, 'loss/train': 2.49228572845459} -09/20/2021 23:26:17 - INFO - __main__ - Step 41321: {'lr': 0.00019931795360369697, 'samples': 1322272, 'steps': 2582, 'loss/train': 1.5402504205703735} -09/20/2021 23:26:18 - INFO - __main__ - Step 41322: {'lr': 0.00019931795360369697, 'samples': 1322304, 'steps': 2582, 'loss/train': 1.8969359397888184} -09/20/2021 23:26:19 - INFO - __main__ - Step 41323: {'lr': 0.00019931795360369697, 'samples': 1322336, 'steps': 2582, 'loss/train': 2.5857019424438477} -09/20/2021 23:26:19 - INFO - __main__ - Step 41324: {'lr': 0.00019931795360369697, 'samples': 1322368, 'steps': 2582, 'loss/train': 1.9991910457611084} -09/20/2021 23:26:20 - INFO - __main__ - Step 41325: {'lr': 0.00019931795360369697, 'samples': 1322400, 'steps': 2582, 'loss/train': 1.7396713495254517} -09/20/2021 23:26:21 - INFO - __main__ - Step 41326: {'lr': 0.00019931795360369697, 'samples': 1322432, 'steps': 2582, 'loss/train': 2.6918814182281494} -09/20/2021 23:26:22 - INFO - __main__ - Step 41327: {'lr': 0.00019931795360369697, 'samples': 1322464, 'steps': 2582, 'loss/train': 1.7715764045715332} -09/20/2021 23:26:22 - INFO - __main__ - Step 41328: {'lr': 0.00019931795360369697, 'samples': 1322496, 'steps': 2582, 'loss/train': 2.3715038299560547} -09/20/2021 23:26:23 - INFO - __main__ - Step 41329: {'lr': 0.00019931720965706706, 'samples': 1322528, 'steps': 2583, 'loss/train': 1.0668703317642212} -09/20/2021 23:26:24 - INFO - __main__ - Step 41330: {'lr': 0.00019931720965706706, 'samples': 1322560, 'steps': 2583, 'loss/train': 0.5997666716575623} -09/20/2021 23:26:25 - INFO - __main__ - Step 41331: {'lr': 0.00019931720965706706, 'samples': 1322592, 'steps': 2583, 'loss/train': 2.961430311203003} -09/20/2021 23:26:26 - INFO - __main__ - Step 41332: {'lr': 0.00019931720965706706, 'samples': 1322624, 'steps': 2583, 'loss/train': 2.110025644302368} -09/20/2021 23:26:27 - INFO - __main__ - Step 41333: {'lr': 0.00019931720965706706, 'samples': 1322656, 'steps': 2583, 'loss/train': 2.261030435562134} -09/20/2021 23:26:27 - INFO - __main__ - Step 41334: {'lr': 0.00019931720965706706, 'samples': 1322688, 'steps': 2583, 'loss/train': 1.4026073217391968} -09/20/2021 23:26:28 - INFO - __main__ - Step 41335: {'lr': 0.00019931720965706706, 'samples': 1322720, 'steps': 2583, 'loss/train': 1.987891435623169} -09/20/2021 23:26:29 - INFO - __main__ - Step 41336: {'lr': 0.00019931720965706706, 'samples': 1322752, 'steps': 2583, 'loss/train': 1.6672896146774292} -09/20/2021 23:26:30 - INFO - __main__ - Step 41337: {'lr': 0.00019931720965706706, 'samples': 1322784, 'steps': 2583, 'loss/train': 3.1179022789001465} -09/20/2021 23:26:30 - INFO - __main__ - Step 41338: {'lr': 0.00019931720965706706, 'samples': 1322816, 'steps': 2583, 'loss/train': 2.265963554382324} -09/20/2021 23:26:31 - INFO - __main__ - Step 41339: {'lr': 0.00019931720965706706, 'samples': 1322848, 'steps': 2583, 'loss/train': 2.3429088592529297} -09/20/2021 23:26:32 - INFO - __main__ - Step 41340: {'lr': 0.00019931720965706706, 'samples': 1322880, 'steps': 2583, 'loss/train': 3.236811399459839} -09/20/2021 23:26:33 - INFO - __main__ - Step 41341: {'lr': 0.00019931720965706706, 'samples': 1322912, 'steps': 2583, 'loss/train': 3.093435764312744} -09/20/2021 23:26:33 - INFO - __main__ - Step 41342: {'lr': 0.00019931720965706706, 'samples': 1322944, 'steps': 2583, 'loss/train': 1.5498391389846802} -09/20/2021 23:26:34 - INFO - __main__ - Step 41343: {'lr': 0.00019931720965706706, 'samples': 1322976, 'steps': 2583, 'loss/train': 0.5953881144523621} -09/20/2021 23:26:35 - INFO - __main__ - Step 41344: {'lr': 0.00019931720965706706, 'samples': 1323008, 'steps': 2583, 'loss/train': 1.8108537197113037} -09/20/2021 23:26:36 - INFO - __main__ - Step 41345: {'lr': 0.00019931646530631583, 'samples': 1323040, 'steps': 2584, 'loss/train': 2.1957383155822754} -09/20/2021 23:26:37 - INFO - __main__ - Step 41346: {'lr': 0.00019931646530631583, 'samples': 1323072, 'steps': 2584, 'loss/train': 2.6987111568450928} -09/20/2021 23:26:37 - INFO - __main__ - Step 41347: {'lr': 0.00019931646530631583, 'samples': 1323104, 'steps': 2584, 'loss/train': 1.86279296875} -09/20/2021 23:26:38 - INFO - __main__ - Step 41348: {'lr': 0.00019931646530631583, 'samples': 1323136, 'steps': 2584, 'loss/train': 2.660543918609619} -09/20/2021 23:26:39 - INFO - __main__ - Step 41349: {'lr': 0.00019931646530631583, 'samples': 1323168, 'steps': 2584, 'loss/train': 1.822139024734497} -09/20/2021 23:26:40 - INFO - __main__ - Step 41350: {'lr': 0.00019931646530631583, 'samples': 1323200, 'steps': 2584, 'loss/train': 1.5422478914260864} -09/20/2021 23:26:40 - INFO - __main__ - Step 41351: {'lr': 0.00019931646530631583, 'samples': 1323232, 'steps': 2584, 'loss/train': 2.3057467937469482} -09/20/2021 23:26:41 - INFO - __main__ - Step 41352: {'lr': 0.00019931646530631583, 'samples': 1323264, 'steps': 2584, 'loss/train': 2.4228127002716064} -09/20/2021 23:26:42 - INFO - __main__ - Step 41353: {'lr': 0.00019931646530631583, 'samples': 1323296, 'steps': 2584, 'loss/train': 1.8558807373046875} -09/20/2021 23:26:43 - INFO - __main__ - Step 41354: {'lr': 0.00019931646530631583, 'samples': 1323328, 'steps': 2584, 'loss/train': 2.199796199798584} -09/20/2021 23:26:43 - INFO - __main__ - Step 41355: {'lr': 0.00019931646530631583, 'samples': 1323360, 'steps': 2584, 'loss/train': 2.115100622177124} -09/20/2021 23:26:44 - INFO - __main__ - Step 41356: {'lr': 0.00019931646530631583, 'samples': 1323392, 'steps': 2584, 'loss/train': 2.234631061553955} -09/20/2021 23:26:45 - INFO - __main__ - Step 41357: {'lr': 0.00019931646530631583, 'samples': 1323424, 'steps': 2584, 'loss/train': 2.033984661102295} -09/20/2021 23:26:46 - INFO - __main__ - Step 41358: {'lr': 0.00019931646530631583, 'samples': 1323456, 'steps': 2584, 'loss/train': 2.074678897857666} -09/20/2021 23:26:46 - INFO - __main__ - Step 41359: {'lr': 0.00019931646530631583, 'samples': 1323488, 'steps': 2584, 'loss/train': 2.5053956508636475} -09/20/2021 23:26:47 - INFO - __main__ - Step 41360: {'lr': 0.00019931646530631583, 'samples': 1323520, 'steps': 2584, 'loss/train': 2.6795239448547363} -09/20/2021 23:26:48 - INFO - __main__ - Step 41361: {'lr': 0.00019931572055144627, 'samples': 1323552, 'steps': 2585, 'loss/train': 1.613806962966919} -09/20/2021 23:26:49 - INFO - __main__ - Step 41362: {'lr': 0.00019931572055144627, 'samples': 1323584, 'steps': 2585, 'loss/train': 1.668062448501587} -09/20/2021 23:26:50 - INFO - __main__ - Step 41363: {'lr': 0.00019931572055144627, 'samples': 1323616, 'steps': 2585, 'loss/train': 1.6867146492004395} -09/20/2021 23:26:51 - INFO - __main__ - Step 41364: {'lr': 0.00019931572055144627, 'samples': 1323648, 'steps': 2585, 'loss/train': 2.117922782897949} -09/20/2021 23:26:52 - INFO - __main__ - Step 41365: {'lr': 0.00019931572055144627, 'samples': 1323680, 'steps': 2585, 'loss/train': 1.9890941381454468} -09/20/2021 23:26:52 - INFO - __main__ - Step 41366: {'lr': 0.00019931572055144627, 'samples': 1323712, 'steps': 2585, 'loss/train': 1.3563562631607056} -09/20/2021 23:26:53 - INFO - __main__ - Step 41367: {'lr': 0.00019931572055144627, 'samples': 1323744, 'steps': 2585, 'loss/train': 1.9799530506134033} -09/20/2021 23:26:54 - INFO - __main__ - Step 41368: {'lr': 0.00019931572055144627, 'samples': 1323776, 'steps': 2585, 'loss/train': 1.9760109186172485} -09/20/2021 23:26:55 - INFO - __main__ - Step 41369: {'lr': 0.00019931572055144627, 'samples': 1323808, 'steps': 2585, 'loss/train': 2.027036428451538} -09/20/2021 23:26:55 - INFO - __main__ - Step 41370: {'lr': 0.00019931572055144627, 'samples': 1323840, 'steps': 2585, 'loss/train': 1.8457483053207397} -09/20/2021 23:26:56 - INFO - __main__ - Step 41371: {'lr': 0.00019931572055144627, 'samples': 1323872, 'steps': 2585, 'loss/train': 2.333631753921509} -09/20/2021 23:26:57 - INFO - __main__ - Step 41372: {'lr': 0.00019931572055144627, 'samples': 1323904, 'steps': 2585, 'loss/train': 2.526872396469116} -09/20/2021 23:26:58 - INFO - __main__ - Step 41373: {'lr': 0.00019931572055144627, 'samples': 1323936, 'steps': 2585, 'loss/train': 1.7197608947753906} -09/20/2021 23:26:58 - INFO - __main__ - Step 41374: {'lr': 0.00019931572055144627, 'samples': 1323968, 'steps': 2585, 'loss/train': 1.9412556886672974} -09/20/2021 23:26:59 - INFO - __main__ - Step 41375: {'lr': 0.00019931572055144627, 'samples': 1324000, 'steps': 2585, 'loss/train': 2.052102565765381} -09/20/2021 23:27:00 - INFO - __main__ - Step 41376: {'lr': 0.00019931572055144627, 'samples': 1324032, 'steps': 2585, 'loss/train': 1.7101523876190186} -09/20/2021 23:27:01 - INFO - __main__ - Step 41377: {'lr': 0.00019931497539246143, 'samples': 1324064, 'steps': 2586, 'loss/train': 2.8882384300231934} -09/20/2021 23:27:01 - INFO - __main__ - Step 41378: {'lr': 0.00019931497539246143, 'samples': 1324096, 'steps': 2586, 'loss/train': 2.22371506690979} -09/20/2021 23:27:02 - INFO - __main__ - Step 41379: {'lr': 0.00019931497539246143, 'samples': 1324128, 'steps': 2586, 'loss/train': 1.8869513273239136} -09/20/2021 23:27:03 - INFO - __main__ - Step 41380: {'lr': 0.00019931497539246143, 'samples': 1324160, 'steps': 2586, 'loss/train': 1.8725602626800537} -09/20/2021 23:27:04 - INFO - __main__ - Step 41381: {'lr': 0.00019931497539246143, 'samples': 1324192, 'steps': 2586, 'loss/train': 1.9732017517089844} -09/20/2021 23:27:04 - INFO - __main__ - Step 41382: {'lr': 0.00019931497539246143, 'samples': 1324224, 'steps': 2586, 'loss/train': 2.283604145050049} -09/20/2021 23:27:05 - INFO - __main__ - Step 41383: {'lr': 0.00019931497539246143, 'samples': 1324256, 'steps': 2586, 'loss/train': 2.3879952430725098} -09/20/2021 23:27:06 - INFO - __main__ - Step 41384: {'lr': 0.00019931497539246143, 'samples': 1324288, 'steps': 2586, 'loss/train': 1.972574234008789} -09/20/2021 23:27:07 - INFO - __main__ - Step 41385: {'lr': 0.00019931497539246143, 'samples': 1324320, 'steps': 2586, 'loss/train': 2.212695837020874} -09/20/2021 23:27:07 - INFO - __main__ - Step 41386: {'lr': 0.00019931497539246143, 'samples': 1324352, 'steps': 2586, 'loss/train': 2.293736219406128} -09/20/2021 23:27:08 - INFO - __main__ - Step 41387: {'lr': 0.00019931497539246143, 'samples': 1324384, 'steps': 2586, 'loss/train': 1.8183648586273193} -09/20/2021 23:27:09 - INFO - __main__ - Step 41388: {'lr': 0.00019931497539246143, 'samples': 1324416, 'steps': 2586, 'loss/train': 5.827042579650879} -09/20/2021 23:27:10 - INFO - __main__ - Step 41389: {'lr': 0.00019931497539246143, 'samples': 1324448, 'steps': 2586, 'loss/train': 6.0710062980651855} -09/20/2021 23:27:10 - INFO - __main__ - Step 41390: {'lr': 0.00019931497539246143, 'samples': 1324480, 'steps': 2586, 'loss/train': 5.971269130706787} -09/20/2021 23:27:11 - INFO - __main__ - Step 41391: {'lr': 0.00019931497539246143, 'samples': 1324512, 'steps': 2586, 'loss/train': 2.472949266433716} -09/20/2021 23:27:12 - INFO - __main__ - Step 41392: {'lr': 0.00019931497539246143, 'samples': 1324544, 'steps': 2586, 'loss/train': 1.469090223312378} -09/20/2021 23:27:13 - INFO - __main__ - Step 41393: {'lr': 0.00019931422982936433, 'samples': 1324576, 'steps': 2587, 'loss/train': 1.6330370903015137} -09/20/2021 23:27:14 - INFO - __main__ - Step 41394: {'lr': 0.00019931422982936433, 'samples': 1324608, 'steps': 2587, 'loss/train': 2.269901752471924} -09/20/2021 23:27:15 - INFO - __main__ - Step 41395: {'lr': 0.00019931422982936433, 'samples': 1324640, 'steps': 2587, 'loss/train': 1.6671544313430786} -09/20/2021 23:27:16 - INFO - __main__ - Step 41396: {'lr': 0.00019931422982936433, 'samples': 1324672, 'steps': 2587, 'loss/train': 1.6334083080291748} -09/20/2021 23:27:16 - INFO - __main__ - Step 41397: {'lr': 0.00019931422982936433, 'samples': 1324704, 'steps': 2587, 'loss/train': 2.0838754177093506} -09/20/2021 23:27:17 - INFO - __main__ - Step 41398: {'lr': 0.00019931422982936433, 'samples': 1324736, 'steps': 2587, 'loss/train': 1.6063380241394043} -09/20/2021 23:27:18 - INFO - __main__ - Step 41399: {'lr': 0.00019931422982936433, 'samples': 1324768, 'steps': 2587, 'loss/train': 2.1987996101379395} -09/20/2021 23:27:19 - INFO - __main__ - Step 41400: {'lr': 0.00019931422982936433, 'samples': 1324800, 'steps': 2587, 'loss/train': 2.623811960220337} -09/20/2021 23:27:19 - INFO - __main__ - Step 41401: {'lr': 0.00019931422982936433, 'samples': 1324832, 'steps': 2587, 'loss/train': 2.0335617065429688} -09/20/2021 23:27:20 - INFO - __main__ - Step 41402: {'lr': 0.00019931422982936433, 'samples': 1324864, 'steps': 2587, 'loss/train': 2.384638547897339} -09/20/2021 23:27:21 - INFO - __main__ - Step 41403: {'lr': 0.00019931422982936433, 'samples': 1324896, 'steps': 2587, 'loss/train': 2.4009203910827637} -09/20/2021 23:27:22 - INFO - __main__ - Step 41404: {'lr': 0.00019931422982936433, 'samples': 1324928, 'steps': 2587, 'loss/train': 1.7849273681640625} -09/20/2021 23:27:22 - INFO - __main__ - Step 41405: {'lr': 0.00019931422982936433, 'samples': 1324960, 'steps': 2587, 'loss/train': 2.342839002609253} -09/20/2021 23:27:23 - INFO - __main__ - Step 41406: {'lr': 0.00019931422982936433, 'samples': 1324992, 'steps': 2587, 'loss/train': 2.5241212844848633} -09/20/2021 23:27:24 - INFO - __main__ - Step 41407: {'lr': 0.00019931422982936433, 'samples': 1325024, 'steps': 2587, 'loss/train': 1.91368567943573} -09/20/2021 23:27:25 - INFO - __main__ - Step 41408: {'lr': 0.00019931422982936433, 'samples': 1325056, 'steps': 2587, 'loss/train': 1.486168622970581} -09/20/2021 23:27:25 - INFO - __main__ - Step 41409: {'lr': 0.00019931348386215803, 'samples': 1325088, 'steps': 2588, 'loss/train': 2.615662097930908} -09/20/2021 23:27:26 - INFO - __main__ - Step 41410: {'lr': 0.00019931348386215803, 'samples': 1325120, 'steps': 2588, 'loss/train': 1.5654619932174683} -09/20/2021 23:27:27 - INFO - __main__ - Step 41411: {'lr': 0.00019931348386215803, 'samples': 1325152, 'steps': 2588, 'loss/train': 2.3319270610809326} -09/20/2021 23:27:28 - INFO - __main__ - Step 41412: {'lr': 0.00019931348386215803, 'samples': 1325184, 'steps': 2588, 'loss/train': 2.4640324115753174} -09/20/2021 23:27:28 - INFO - __main__ - Step 41413: {'lr': 0.00019931348386215803, 'samples': 1325216, 'steps': 2588, 'loss/train': 2.2168173789978027} -09/20/2021 23:27:29 - INFO - __main__ - Step 41414: {'lr': 0.00019931348386215803, 'samples': 1325248, 'steps': 2588, 'loss/train': 2.0448241233825684} -09/20/2021 23:27:30 - INFO - __main__ - Step 41415: {'lr': 0.00019931348386215803, 'samples': 1325280, 'steps': 2588, 'loss/train': 2.7158615589141846} -09/20/2021 23:27:31 - INFO - __main__ - Step 41416: {'lr': 0.00019931348386215803, 'samples': 1325312, 'steps': 2588, 'loss/train': 1.474518060684204} -09/20/2021 23:27:31 - INFO - __main__ - Step 41417: {'lr': 0.00019931348386215803, 'samples': 1325344, 'steps': 2588, 'loss/train': 2.55125093460083} -09/20/2021 23:27:32 - INFO - __main__ - Step 41418: {'lr': 0.00019931348386215803, 'samples': 1325376, 'steps': 2588, 'loss/train': 2.5354151725769043} -09/20/2021 23:27:33 - INFO - __main__ - Step 41419: {'lr': 0.00019931348386215803, 'samples': 1325408, 'steps': 2588, 'loss/train': 2.3328187465667725} -09/20/2021 23:27:34 - INFO - __main__ - Step 41420: {'lr': 0.00019931348386215803, 'samples': 1325440, 'steps': 2588, 'loss/train': 1.8068912029266357} -09/20/2021 23:27:34 - INFO - __main__ - Step 41421: {'lr': 0.00019931348386215803, 'samples': 1325472, 'steps': 2588, 'loss/train': 0.4743615686893463} -09/20/2021 23:27:35 - INFO - __main__ - Step 41422: {'lr': 0.00019931348386215803, 'samples': 1325504, 'steps': 2588, 'loss/train': 2.1107521057128906} -09/20/2021 23:27:36 - INFO - __main__ - Step 41423: {'lr': 0.00019931348386215803, 'samples': 1325536, 'steps': 2588, 'loss/train': 0.6698944568634033} -09/20/2021 23:27:37 - INFO - __main__ - Step 41424: {'lr': 0.00019931348386215803, 'samples': 1325568, 'steps': 2588, 'loss/train': 1.807553768157959} -09/20/2021 23:27:38 - INFO - __main__ - Step 41425: {'lr': 0.00019931273749084554, 'samples': 1325600, 'steps': 2589, 'loss/train': 1.220781683921814} -09/20/2021 23:27:39 - INFO - __main__ - Step 41426: {'lr': 0.00019931273749084554, 'samples': 1325632, 'steps': 2589, 'loss/train': 3.054816246032715} -09/20/2021 23:27:40 - INFO - __main__ - Step 41427: {'lr': 0.00019931273749084554, 'samples': 1325664, 'steps': 2589, 'loss/train': 1.9072962999343872} -09/20/2021 23:27:40 - INFO - __main__ - Step 41428: {'lr': 0.00019931273749084554, 'samples': 1325696, 'steps': 2589, 'loss/train': 1.716256022453308} -09/20/2021 23:27:41 - INFO - __main__ - Step 41429: {'lr': 0.00019931273749084554, 'samples': 1325728, 'steps': 2589, 'loss/train': 0.8078406453132629} -09/20/2021 23:27:42 - INFO - __main__ - Step 41430: {'lr': 0.00019931273749084554, 'samples': 1325760, 'steps': 2589, 'loss/train': 1.6932753324508667} -09/20/2021 23:27:43 - INFO - __main__ - Step 41431: {'lr': 0.00019931273749084554, 'samples': 1325792, 'steps': 2589, 'loss/train': 2.8519062995910645} -09/20/2021 23:27:43 - INFO - __main__ - Step 41432: {'lr': 0.00019931273749084554, 'samples': 1325824, 'steps': 2589, 'loss/train': 2.86328387260437} -09/20/2021 23:27:44 - INFO - __main__ - Step 41433: {'lr': 0.00019931273749084554, 'samples': 1325856, 'steps': 2589, 'loss/train': 1.9383692741394043} -09/20/2021 23:27:45 - INFO - __main__ - Step 41434: {'lr': 0.00019931273749084554, 'samples': 1325888, 'steps': 2589, 'loss/train': 1.548107624053955} -09/20/2021 23:27:46 - INFO - __main__ - Step 41435: {'lr': 0.00019931273749084554, 'samples': 1325920, 'steps': 2589, 'loss/train': 0.38045668601989746} -09/20/2021 23:27:46 - INFO - __main__ - Step 41436: {'lr': 0.00019931273749084554, 'samples': 1325952, 'steps': 2589, 'loss/train': 1.7078849077224731} -09/20/2021 23:27:47 - INFO - __main__ - Step 41437: {'lr': 0.00019931273749084554, 'samples': 1325984, 'steps': 2589, 'loss/train': 2.2813398838043213} -09/20/2021 23:27:48 - INFO - __main__ - Step 41438: {'lr': 0.00019931273749084554, 'samples': 1326016, 'steps': 2589, 'loss/train': 1.7848756313323975} -09/20/2021 23:27:49 - INFO - __main__ - Step 41439: {'lr': 0.00019931273749084554, 'samples': 1326048, 'steps': 2589, 'loss/train': 2.9563708305358887} -09/20/2021 23:27:49 - INFO - __main__ - Step 41440: {'lr': 0.00019931273749084554, 'samples': 1326080, 'steps': 2589, 'loss/train': 2.3693909645080566} -09/20/2021 23:27:50 - INFO - __main__ - Step 41441: {'lr': 0.00019931199071542992, 'samples': 1326112, 'steps': 2590, 'loss/train': 2.171515703201294} -09/20/2021 23:27:51 - INFO - __main__ - Step 41442: {'lr': 0.00019931199071542992, 'samples': 1326144, 'steps': 2590, 'loss/train': 3.40622615814209} -09/20/2021 23:27:52 - INFO - __main__ - Step 41443: {'lr': 0.00019931199071542992, 'samples': 1326176, 'steps': 2590, 'loss/train': 1.7753316164016724} -09/20/2021 23:27:52 - INFO - __main__ - Step 41444: {'lr': 0.00019931199071542992, 'samples': 1326208, 'steps': 2590, 'loss/train': 2.6967146396636963} -09/20/2021 23:27:53 - INFO - __main__ - Step 41445: {'lr': 0.00019931199071542992, 'samples': 1326240, 'steps': 2590, 'loss/train': 1.951499342918396} -09/20/2021 23:27:54 - INFO - __main__ - Step 41446: {'lr': 0.00019931199071542992, 'samples': 1326272, 'steps': 2590, 'loss/train': 2.862346887588501} -09/20/2021 23:27:55 - INFO - __main__ - Step 41447: {'lr': 0.00019931199071542992, 'samples': 1326304, 'steps': 2590, 'loss/train': 1.5218029022216797} -09/20/2021 23:27:55 - INFO - __main__ - Step 41448: {'lr': 0.00019931199071542992, 'samples': 1326336, 'steps': 2590, 'loss/train': 2.527224540710449} -09/20/2021 23:27:56 - INFO - __main__ - Step 41449: {'lr': 0.00019931199071542992, 'samples': 1326368, 'steps': 2590, 'loss/train': 2.408672332763672} -09/20/2021 23:27:57 - INFO - __main__ - Step 41450: {'lr': 0.00019931199071542992, 'samples': 1326400, 'steps': 2590, 'loss/train': 2.0624330043792725} -09/20/2021 23:27:58 - INFO - __main__ - Step 41451: {'lr': 0.00019931199071542992, 'samples': 1326432, 'steps': 2590, 'loss/train': 1.7866191864013672} -09/20/2021 23:27:58 - INFO - __main__ - Step 41452: {'lr': 0.00019931199071542992, 'samples': 1326464, 'steps': 2590, 'loss/train': 2.4700839519500732} -09/20/2021 23:27:59 - INFO - __main__ - Step 41453: {'lr': 0.00019931199071542992, 'samples': 1326496, 'steps': 2590, 'loss/train': 3.1577587127685547} -09/20/2021 23:28:00 - INFO - __main__ - Step 41454: {'lr': 0.00019931199071542992, 'samples': 1326528, 'steps': 2590, 'loss/train': 2.2201449871063232} -09/20/2021 23:28:01 - INFO - __main__ - Step 41455: {'lr': 0.00019931199071542992, 'samples': 1326560, 'steps': 2590, 'loss/train': 2.5426337718963623} -09/20/2021 23:28:01 - INFO - __main__ - Step 41456: {'lr': 0.00019931199071542992, 'samples': 1326592, 'steps': 2590, 'loss/train': 2.5722315311431885} -09/20/2021 23:28:03 - INFO - __main__ - Step 41457: {'lr': 0.0001993112435359142, 'samples': 1326624, 'steps': 2591, 'loss/train': 1.3138816356658936} -09/20/2021 23:28:04 - INFO - __main__ - Step 41458: {'lr': 0.0001993112435359142, 'samples': 1326656, 'steps': 2591, 'loss/train': 1.8649826049804688} -09/20/2021 23:28:05 - INFO - __main__ - Step 41459: {'lr': 0.0001993112435359142, 'samples': 1326688, 'steps': 2591, 'loss/train': 1.8433727025985718} -09/20/2021 23:28:06 - INFO - __main__ - Step 41460: {'lr': 0.0001993112435359142, 'samples': 1326720, 'steps': 2591, 'loss/train': 1.4732879400253296} -09/20/2021 23:28:06 - INFO - __main__ - Step 41461: {'lr': 0.0001993112435359142, 'samples': 1326752, 'steps': 2591, 'loss/train': 1.8313978910446167} -09/20/2021 23:28:07 - INFO - __main__ - Step 41462: {'lr': 0.0001993112435359142, 'samples': 1326784, 'steps': 2591, 'loss/train': 1.4481183290481567} -09/20/2021 23:28:08 - INFO - __main__ - Step 41463: {'lr': 0.0001993112435359142, 'samples': 1326816, 'steps': 2591, 'loss/train': 2.850369691848755} -09/20/2021 23:28:09 - INFO - __main__ - Step 41464: {'lr': 0.0001993112435359142, 'samples': 1326848, 'steps': 2591, 'loss/train': 2.1475751399993896} -09/20/2021 23:28:09 - INFO - __main__ - Step 41465: {'lr': 0.0001993112435359142, 'samples': 1326880, 'steps': 2591, 'loss/train': 1.7643707990646362} -09/20/2021 23:28:10 - INFO - __main__ - Step 41466: {'lr': 0.0001993112435359142, 'samples': 1326912, 'steps': 2591, 'loss/train': 2.0775952339172363} -09/20/2021 23:28:11 - INFO - __main__ - Step 41467: {'lr': 0.0001993112435359142, 'samples': 1326944, 'steps': 2591, 'loss/train': 2.2376372814178467} -09/20/2021 23:28:12 - INFO - __main__ - Step 41468: {'lr': 0.0001993112435359142, 'samples': 1326976, 'steps': 2591, 'loss/train': 1.6051032543182373} -09/20/2021 23:28:12 - INFO - __main__ - Step 41469: {'lr': 0.0001993112435359142, 'samples': 1327008, 'steps': 2591, 'loss/train': 1.4616336822509766} -09/20/2021 23:28:13 - INFO - __main__ - Step 41470: {'lr': 0.0001993112435359142, 'samples': 1327040, 'steps': 2591, 'loss/train': 1.952043056488037} -09/20/2021 23:28:14 - INFO - __main__ - Step 41471: {'lr': 0.0001993112435359142, 'samples': 1327072, 'steps': 2591, 'loss/train': 2.1865062713623047} -09/20/2021 23:28:15 - INFO - __main__ - Step 41472: {'lr': 0.0001993112435359142, 'samples': 1327104, 'steps': 2591, 'loss/train': 2.6822280883789062} -09/20/2021 23:28:16 - INFO - __main__ - Step 41473: {'lr': 0.00019931049595230138, 'samples': 1327136, 'steps': 2592, 'loss/train': 2.1966774463653564} -09/20/2021 23:28:16 - INFO - __main__ - Step 41474: {'lr': 0.00019931049595230138, 'samples': 1327168, 'steps': 2592, 'loss/train': 2.2680671215057373} -09/20/2021 23:28:17 - INFO - __main__ - Step 41475: {'lr': 0.00019931049595230138, 'samples': 1327200, 'steps': 2592, 'loss/train': 2.231330156326294} -09/20/2021 23:28:18 - INFO - __main__ - Step 41476: {'lr': 0.00019931049595230138, 'samples': 1327232, 'steps': 2592, 'loss/train': 1.3838474750518799} -09/20/2021 23:28:19 - INFO - __main__ - Step 41477: {'lr': 0.00019931049595230138, 'samples': 1327264, 'steps': 2592, 'loss/train': 1.3428000211715698} -09/20/2021 23:28:19 - INFO - __main__ - Step 41478: {'lr': 0.00019931049595230138, 'samples': 1327296, 'steps': 2592, 'loss/train': 2.3243753910064697} -09/20/2021 23:28:20 - INFO - __main__ - Step 41479: {'lr': 0.00019931049595230138, 'samples': 1327328, 'steps': 2592, 'loss/train': 1.6685848236083984} -09/20/2021 23:28:21 - INFO - __main__ - Step 41480: {'lr': 0.00019931049595230138, 'samples': 1327360, 'steps': 2592, 'loss/train': 2.6160521507263184} -09/20/2021 23:28:22 - INFO - __main__ - Step 41481: {'lr': 0.00019931049595230138, 'samples': 1327392, 'steps': 2592, 'loss/train': 2.2356791496276855} -09/20/2021 23:28:22 - INFO - __main__ - Step 41482: {'lr': 0.00019931049595230138, 'samples': 1327424, 'steps': 2592, 'loss/train': 3.1633150577545166} -09/20/2021 23:28:23 - INFO - __main__ - Step 41483: {'lr': 0.00019931049595230138, 'samples': 1327456, 'steps': 2592, 'loss/train': 2.156373977661133} -09/20/2021 23:28:24 - INFO - __main__ - Step 41484: {'lr': 0.00019931049595230138, 'samples': 1327488, 'steps': 2592, 'loss/train': 1.9500941038131714} -09/20/2021 23:28:25 - INFO - __main__ - Step 41485: {'lr': 0.00019931049595230138, 'samples': 1327520, 'steps': 2592, 'loss/train': 2.284575939178467} -09/20/2021 23:28:25 - INFO - __main__ - Step 41486: {'lr': 0.00019931049595230138, 'samples': 1327552, 'steps': 2592, 'loss/train': 1.8698829412460327} -09/20/2021 23:28:26 - INFO - __main__ - Step 41487: {'lr': 0.00019931049595230138, 'samples': 1327584, 'steps': 2592, 'loss/train': 0.5722792148590088} -09/20/2021 23:28:27 - INFO - __main__ - Step 41488: {'lr': 0.00019931049595230138, 'samples': 1327616, 'steps': 2592, 'loss/train': 3.1346399784088135} -09/20/2021 23:28:28 - INFO - __main__ - Step 41489: {'lr': 0.00019930974796459458, 'samples': 1327648, 'steps': 2593, 'loss/train': 2.176720380783081} -09/20/2021 23:28:29 - INFO - __main__ - Step 41490: {'lr': 0.00019930974796459458, 'samples': 1327680, 'steps': 2593, 'loss/train': 2.5713911056518555} -09/20/2021 23:28:30 - INFO - __main__ - Step 41491: {'lr': 0.00019930974796459458, 'samples': 1327712, 'steps': 2593, 'loss/train': 1.4398566484451294} -09/20/2021 23:28:30 - INFO - __main__ - Step 41492: {'lr': 0.00019930974796459458, 'samples': 1327744, 'steps': 2593, 'loss/train': 2.7847020626068115} -09/20/2021 23:28:31 - INFO - __main__ - Step 41493: {'lr': 0.00019930974796459458, 'samples': 1327776, 'steps': 2593, 'loss/train': 2.659627914428711} -09/20/2021 23:28:32 - INFO - __main__ - Step 41494: {'lr': 0.00019930974796459458, 'samples': 1327808, 'steps': 2593, 'loss/train': 2.1164066791534424} -09/20/2021 23:28:33 - INFO - __main__ - Step 41495: {'lr': 0.00019930974796459458, 'samples': 1327840, 'steps': 2593, 'loss/train': 1.8670017719268799} -09/20/2021 23:28:33 - INFO - __main__ - Step 41496: {'lr': 0.00019930974796459458, 'samples': 1327872, 'steps': 2593, 'loss/train': 1.8754863739013672} -09/20/2021 23:28:34 - INFO - __main__ - Step 41497: {'lr': 0.00019930974796459458, 'samples': 1327904, 'steps': 2593, 'loss/train': 2.0382091999053955} -09/20/2021 23:28:35 - INFO - __main__ - Step 41498: {'lr': 0.00019930974796459458, 'samples': 1327936, 'steps': 2593, 'loss/train': 2.512913227081299} -09/20/2021 23:28:36 - INFO - __main__ - Step 41499: {'lr': 0.00019930974796459458, 'samples': 1327968, 'steps': 2593, 'loss/train': 2.121985912322998} -09/20/2021 23:28:36 - INFO - __main__ - Step 41500: {'lr': 0.00019930974796459458, 'samples': 1328000, 'steps': 2593, 'loss/train': 2.679908275604248} -09/20/2021 23:28:37 - INFO - __main__ - Step 41501: {'lr': 0.00019930974796459458, 'samples': 1328032, 'steps': 2593, 'loss/train': 1.7823177576065063} -09/20/2021 23:28:38 - INFO - __main__ - Step 41502: {'lr': 0.00019930974796459458, 'samples': 1328064, 'steps': 2593, 'loss/train': 2.1234874725341797} -09/20/2021 23:28:39 - INFO - __main__ - Step 41503: {'lr': 0.00019930974796459458, 'samples': 1328096, 'steps': 2593, 'loss/train': 1.5715945959091187} -09/20/2021 23:28:39 - INFO - __main__ - Step 41504: {'lr': 0.00019930974796459458, 'samples': 1328128, 'steps': 2593, 'loss/train': 1.8285794258117676} -09/20/2021 23:28:40 - INFO - __main__ - Step 41505: {'lr': 0.00019930899957279675, 'samples': 1328160, 'steps': 2594, 'loss/train': 2.446518659591675} -09/20/2021 23:28:41 - INFO - __main__ - Step 41506: {'lr': 0.00019930899957279675, 'samples': 1328192, 'steps': 2594, 'loss/train': 2.0287351608276367} -09/20/2021 23:28:42 - INFO - __main__ - Step 41507: {'lr': 0.00019930899957279675, 'samples': 1328224, 'steps': 2594, 'loss/train': 1.8211761713027954} -09/20/2021 23:28:43 - INFO - __main__ - Step 41508: {'lr': 0.00019930899957279675, 'samples': 1328256, 'steps': 2594, 'loss/train': 1.8430852890014648} -09/20/2021 23:28:43 - INFO - __main__ - Step 41509: {'lr': 0.00019930899957279675, 'samples': 1328288, 'steps': 2594, 'loss/train': 2.9144127368927} -09/20/2021 23:28:44 - INFO - __main__ - Step 41510: {'lr': 0.00019930899957279675, 'samples': 1328320, 'steps': 2594, 'loss/train': 1.8478069305419922} -09/20/2021 23:28:45 - INFO - __main__ - Step 41511: {'lr': 0.00019930899957279675, 'samples': 1328352, 'steps': 2594, 'loss/train': 2.5746288299560547} -09/20/2021 23:28:46 - INFO - __main__ - Step 41512: {'lr': 0.00019930899957279675, 'samples': 1328384, 'steps': 2594, 'loss/train': 3.479099750518799} -09/20/2021 23:28:46 - INFO - __main__ - Step 41513: {'lr': 0.00019930899957279675, 'samples': 1328416, 'steps': 2594, 'loss/train': 2.2215535640716553} -09/20/2021 23:28:47 - INFO - __main__ - Step 41514: {'lr': 0.00019930899957279675, 'samples': 1328448, 'steps': 2594, 'loss/train': 1.5943138599395752} -09/20/2021 23:28:48 - INFO - __main__ - Step 41515: {'lr': 0.00019930899957279675, 'samples': 1328480, 'steps': 2594, 'loss/train': 1.721184253692627} -09/20/2021 23:28:49 - INFO - __main__ - Step 41516: {'lr': 0.00019930899957279675, 'samples': 1328512, 'steps': 2594, 'loss/train': 2.712386131286621} -09/20/2021 23:28:49 - INFO - __main__ - Step 41517: {'lr': 0.00019930899957279675, 'samples': 1328544, 'steps': 2594, 'loss/train': 2.3566863536834717} -09/20/2021 23:28:50 - INFO - __main__ - Step 41518: {'lr': 0.00019930899957279675, 'samples': 1328576, 'steps': 2594, 'loss/train': 1.5720494985580444} -09/20/2021 23:28:52 - INFO - __main__ - Step 41519: {'lr': 0.00019930899957279675, 'samples': 1328608, 'steps': 2594, 'loss/train': 2.486922025680542} -09/20/2021 23:28:52 - INFO - __main__ - Step 41520: {'lr': 0.00019930899957279675, 'samples': 1328640, 'steps': 2594, 'loss/train': 2.6952145099639893} -09/20/2021 23:28:53 - INFO - __main__ - Step 41521: {'lr': 0.00019930825077691105, 'samples': 1328672, 'steps': 2595, 'loss/train': 0.5872771143913269} -09/20/2021 23:28:54 - INFO - __main__ - Step 41522: {'lr': 0.00019930825077691105, 'samples': 1328704, 'steps': 2595, 'loss/train': 2.3146309852600098} -09/20/2021 23:28:55 - INFO - __main__ - Step 41523: {'lr': 0.00019930825077691105, 'samples': 1328736, 'steps': 2595, 'loss/train': 2.599935531616211} -09/20/2021 23:28:56 - INFO - __main__ - Step 41524: {'lr': 0.00019930825077691105, 'samples': 1328768, 'steps': 2595, 'loss/train': 1.822271466255188} -09/20/2021 23:28:56 - INFO - __main__ - Step 41525: {'lr': 0.00019930825077691105, 'samples': 1328800, 'steps': 2595, 'loss/train': 1.7877999544143677} -09/20/2021 23:28:57 - INFO - __main__ - Step 41526: {'lr': 0.00019930825077691105, 'samples': 1328832, 'steps': 2595, 'loss/train': 1.5667263269424438} -09/20/2021 23:28:58 - INFO - __main__ - Step 41527: {'lr': 0.00019930825077691105, 'samples': 1328864, 'steps': 2595, 'loss/train': 1.6151331663131714} -09/20/2021 23:28:59 - INFO - __main__ - Step 41528: {'lr': 0.00019930825077691105, 'samples': 1328896, 'steps': 2595, 'loss/train': 1.135599970817566} -09/20/2021 23:28:59 - INFO - __main__ - Step 41529: {'lr': 0.00019930825077691105, 'samples': 1328928, 'steps': 2595, 'loss/train': 0.8929935693740845} -09/20/2021 23:29:00 - INFO - __main__ - Step 41530: {'lr': 0.00019930825077691105, 'samples': 1328960, 'steps': 2595, 'loss/train': 1.0761717557907104} -09/20/2021 23:29:01 - INFO - __main__ - Step 41531: {'lr': 0.00019930825077691105, 'samples': 1328992, 'steps': 2595, 'loss/train': 0.7511329650878906} -09/20/2021 23:29:02 - INFO - __main__ - Step 41532: {'lr': 0.00019930825077691105, 'samples': 1329024, 'steps': 2595, 'loss/train': 0.9571922421455383} -09/20/2021 23:29:02 - INFO - __main__ - Step 41533: {'lr': 0.00019930825077691105, 'samples': 1329056, 'steps': 2595, 'loss/train': 0.7575550079345703} -09/20/2021 23:29:03 - INFO - __main__ - Step 41534: {'lr': 0.00019930825077691105, 'samples': 1329088, 'steps': 2595, 'loss/train': 1.215061902999878} -09/20/2021 23:29:04 - INFO - __main__ - Step 41535: {'lr': 0.00019930825077691105, 'samples': 1329120, 'steps': 2595, 'loss/train': 1.4792300462722778} -09/20/2021 23:29:05 - INFO - __main__ - Step 41536: {'lr': 0.00019930825077691105, 'samples': 1329152, 'steps': 2595, 'loss/train': 3.0150015354156494} -09/20/2021 23:29:06 - INFO - __main__ - Step 41537: {'lr': 0.00019930750157694043, 'samples': 1329184, 'steps': 2596, 'loss/train': 2.044670820236206} -09/20/2021 23:29:06 - INFO - __main__ - Step 41538: {'lr': 0.00019930750157694043, 'samples': 1329216, 'steps': 2596, 'loss/train': 1.8738330602645874} -09/20/2021 23:29:07 - INFO - __main__ - Step 41539: {'lr': 0.00019930750157694043, 'samples': 1329248, 'steps': 2596, 'loss/train': 1.4363137483596802} -09/20/2021 23:29:08 - INFO - __main__ - Step 41540: {'lr': 0.00019930750157694043, 'samples': 1329280, 'steps': 2596, 'loss/train': 2.7783632278442383} -09/20/2021 23:29:09 - INFO - __main__ - Step 41541: {'lr': 0.00019930750157694043, 'samples': 1329312, 'steps': 2596, 'loss/train': 2.86733078956604} -09/20/2021 23:29:09 - INFO - __main__ - Step 41542: {'lr': 0.00019930750157694043, 'samples': 1329344, 'steps': 2596, 'loss/train': 2.005276679992676} -09/20/2021 23:29:10 - INFO - __main__ - Step 41543: {'lr': 0.00019930750157694043, 'samples': 1329376, 'steps': 2596, 'loss/train': 1.7801342010498047} -09/20/2021 23:29:11 - INFO - __main__ - Step 41544: {'lr': 0.00019930750157694043, 'samples': 1329408, 'steps': 2596, 'loss/train': 3.3427484035491943} -09/20/2021 23:29:12 - INFO - __main__ - Step 41545: {'lr': 0.00019930750157694043, 'samples': 1329440, 'steps': 2596, 'loss/train': 1.8671702146530151} -09/20/2021 23:29:12 - INFO - __main__ - Step 41546: {'lr': 0.00019930750157694043, 'samples': 1329472, 'steps': 2596, 'loss/train': 2.4405040740966797} -09/20/2021 23:29:13 - INFO - __main__ - Step 41547: {'lr': 0.00019930750157694043, 'samples': 1329504, 'steps': 2596, 'loss/train': 2.3514816761016846} -09/20/2021 23:29:14 - INFO - __main__ - Step 41548: {'lr': 0.00019930750157694043, 'samples': 1329536, 'steps': 2596, 'loss/train': 2.3010659217834473} -09/20/2021 23:29:15 - INFO - __main__ - Step 41549: {'lr': 0.00019930750157694043, 'samples': 1329568, 'steps': 2596, 'loss/train': 2.2930097579956055} -09/20/2021 23:29:15 - INFO - __main__ - Step 41550: {'lr': 0.00019930750157694043, 'samples': 1329600, 'steps': 2596, 'loss/train': 2.580737590789795} -09/20/2021 23:29:16 - INFO - __main__ - Step 41551: {'lr': 0.00019930750157694043, 'samples': 1329632, 'steps': 2596, 'loss/train': 2.4550631046295166} -09/20/2021 23:29:17 - INFO - __main__ - Step 41552: {'lr': 0.00019930750157694043, 'samples': 1329664, 'steps': 2596, 'loss/train': 2.1860907077789307} -09/20/2021 23:29:18 - INFO - __main__ - Step 41553: {'lr': 0.00019930675197288796, 'samples': 1329696, 'steps': 2597, 'loss/train': 2.033507823944092} -09/20/2021 23:29:18 - INFO - __main__ - Step 41554: {'lr': 0.00019930675197288796, 'samples': 1329728, 'steps': 2597, 'loss/train': 2.076443910598755} -09/20/2021 23:29:20 - INFO - __main__ - Step 41555: {'lr': 0.00019930675197288796, 'samples': 1329760, 'steps': 2597, 'loss/train': 1.8299956321716309} -09/20/2021 23:29:21 - INFO - __main__ - Step 41556: {'lr': 0.00019930675197288796, 'samples': 1329792, 'steps': 2597, 'loss/train': 1.9442042112350464} -09/20/2021 23:29:21 - INFO - __main__ - Step 41557: {'lr': 0.00019930675197288796, 'samples': 1329824, 'steps': 2597, 'loss/train': 1.798816442489624} -09/20/2021 23:29:22 - INFO - __main__ - Step 41558: {'lr': 0.00019930675197288796, 'samples': 1329856, 'steps': 2597, 'loss/train': 1.3693227767944336} -09/20/2021 23:29:23 - INFO - __main__ - Step 41559: {'lr': 0.00019930675197288796, 'samples': 1329888, 'steps': 2597, 'loss/train': 1.5696109533309937} -09/20/2021 23:29:24 - INFO - __main__ - Step 41560: {'lr': 0.00019930675197288796, 'samples': 1329920, 'steps': 2597, 'loss/train': 1.3176243305206299} -09/20/2021 23:29:24 - INFO - __main__ - Step 41561: {'lr': 0.00019930675197288796, 'samples': 1329952, 'steps': 2597, 'loss/train': 0.4968115985393524} -09/20/2021 23:29:25 - INFO - __main__ - Step 41562: {'lr': 0.00019930675197288796, 'samples': 1329984, 'steps': 2597, 'loss/train': 2.317519426345825} -09/20/2021 23:29:26 - INFO - __main__ - Step 41563: {'lr': 0.00019930675197288796, 'samples': 1330016, 'steps': 2597, 'loss/train': 2.215094804763794} -09/20/2021 23:29:27 - INFO - __main__ - Step 41564: {'lr': 0.00019930675197288796, 'samples': 1330048, 'steps': 2597, 'loss/train': 2.2978322505950928} -09/20/2021 23:29:27 - INFO - __main__ - Step 41565: {'lr': 0.00019930675197288796, 'samples': 1330080, 'steps': 2597, 'loss/train': 1.8100426197052002} -09/20/2021 23:29:28 - INFO - __main__ - Step 41566: {'lr': 0.00019930675197288796, 'samples': 1330112, 'steps': 2597, 'loss/train': 2.7885420322418213} -09/20/2021 23:29:29 - INFO - __main__ - Step 41567: {'lr': 0.00019930675197288796, 'samples': 1330144, 'steps': 2597, 'loss/train': 2.374837875366211} -09/20/2021 23:29:30 - INFO - __main__ - Step 41568: {'lr': 0.00019930675197288796, 'samples': 1330176, 'steps': 2597, 'loss/train': 2.5317938327789307} -09/20/2021 23:29:30 - INFO - __main__ - Step 41569: {'lr': 0.0001993060019647567, 'samples': 1330208, 'steps': 2598, 'loss/train': 2.8306162357330322} -09/20/2021 23:29:31 - INFO - __main__ - Step 41570: {'lr': 0.0001993060019647567, 'samples': 1330240, 'steps': 2598, 'loss/train': 1.5163987874984741} -09/20/2021 23:29:32 - INFO - __main__ - Step 41571: {'lr': 0.0001993060019647567, 'samples': 1330272, 'steps': 2598, 'loss/train': 1.6395410299301147} -09/20/2021 23:29:33 - INFO - __main__ - Step 41572: {'lr': 0.0001993060019647567, 'samples': 1330304, 'steps': 2598, 'loss/train': 1.336167573928833} -09/20/2021 23:29:33 - INFO - __main__ - Step 41573: {'lr': 0.0001993060019647567, 'samples': 1330336, 'steps': 2598, 'loss/train': 1.9628615379333496} -09/20/2021 23:29:34 - INFO - __main__ - Step 41574: {'lr': 0.0001993060019647567, 'samples': 1330368, 'steps': 2598, 'loss/train': 1.9124021530151367} -09/20/2021 23:29:35 - INFO - __main__ - Step 41575: {'lr': 0.0001993060019647567, 'samples': 1330400, 'steps': 2598, 'loss/train': 2.4832570552825928} -09/20/2021 23:29:36 - INFO - __main__ - Step 41576: {'lr': 0.0001993060019647567, 'samples': 1330432, 'steps': 2598, 'loss/train': 1.8301998376846313} -09/20/2021 23:29:36 - INFO - __main__ - Step 41577: {'lr': 0.0001993060019647567, 'samples': 1330464, 'steps': 2598, 'loss/train': 2.7662580013275146} -09/20/2021 23:29:37 - INFO - __main__ - Step 41578: {'lr': 0.0001993060019647567, 'samples': 1330496, 'steps': 2598, 'loss/train': 2.502452850341797} -09/20/2021 23:29:38 - INFO - __main__ - Step 41579: {'lr': 0.0001993060019647567, 'samples': 1330528, 'steps': 2598, 'loss/train': 0.7368454933166504} -09/20/2021 23:29:39 - INFO - __main__ - Step 41580: {'lr': 0.0001993060019647567, 'samples': 1330560, 'steps': 2598, 'loss/train': 2.1416049003601074} -09/20/2021 23:29:39 - INFO - __main__ - Step 41581: {'lr': 0.0001993060019647567, 'samples': 1330592, 'steps': 2598, 'loss/train': 1.6025055646896362} -09/20/2021 23:29:40 - INFO - __main__ - Step 41582: {'lr': 0.0001993060019647567, 'samples': 1330624, 'steps': 2598, 'loss/train': 0.1756005883216858} -09/20/2021 23:29:41 - INFO - __main__ - Step 41583: {'lr': 0.0001993060019647567, 'samples': 1330656, 'steps': 2598, 'loss/train': 0.15882772207260132} -09/20/2021 23:29:42 - INFO - __main__ - Step 41584: {'lr': 0.0001993060019647567, 'samples': 1330688, 'steps': 2598, 'loss/train': 1.8958559036254883} -09/20/2021 23:29:43 - INFO - __main__ - Step 41585: {'lr': 0.00019930525155254972, 'samples': 1330720, 'steps': 2599, 'loss/train': 2.401238203048706} -09/20/2021 23:29:44 - INFO - __main__ - Step 41586: {'lr': 0.00019930525155254972, 'samples': 1330752, 'steps': 2599, 'loss/train': 2.1316282749176025} -09/20/2021 23:29:45 - INFO - __main__ - Step 41587: {'lr': 0.00019930525155254972, 'samples': 1330784, 'steps': 2599, 'loss/train': 2.9441897869110107} -09/20/2021 23:29:45 - INFO - __main__ - Step 41588: {'lr': 0.00019930525155254972, 'samples': 1330816, 'steps': 2599, 'loss/train': 2.766066074371338} -09/20/2021 23:29:46 - INFO - __main__ - Step 41589: {'lr': 0.00019930525155254972, 'samples': 1330848, 'steps': 2599, 'loss/train': 2.314210891723633} -09/20/2021 23:29:47 - INFO - __main__ - Step 41590: {'lr': 0.00019930525155254972, 'samples': 1330880, 'steps': 2599, 'loss/train': 2.1615164279937744} -09/20/2021 23:29:48 - INFO - __main__ - Step 41591: {'lr': 0.00019930525155254972, 'samples': 1330912, 'steps': 2599, 'loss/train': 2.61515474319458} -09/20/2021 23:29:48 - INFO - __main__ - Step 41592: {'lr': 0.00019930525155254972, 'samples': 1330944, 'steps': 2599, 'loss/train': 2.17997145652771} -09/20/2021 23:29:49 - INFO - __main__ - Step 41593: {'lr': 0.00019930525155254972, 'samples': 1330976, 'steps': 2599, 'loss/train': 2.6513829231262207} -09/20/2021 23:29:50 - INFO - __main__ - Step 41594: {'lr': 0.00019930525155254972, 'samples': 1331008, 'steps': 2599, 'loss/train': 2.410710334777832} -09/20/2021 23:29:51 - INFO - __main__ - Step 41595: {'lr': 0.00019930525155254972, 'samples': 1331040, 'steps': 2599, 'loss/train': 1.993943214416504} -09/20/2021 23:29:51 - INFO - __main__ - Step 41596: {'lr': 0.00019930525155254972, 'samples': 1331072, 'steps': 2599, 'loss/train': 2.3290562629699707} -09/20/2021 23:29:52 - INFO - __main__ - Step 41597: {'lr': 0.00019930525155254972, 'samples': 1331104, 'steps': 2599, 'loss/train': 2.6011486053466797} -09/20/2021 23:29:53 - INFO - __main__ - Step 41598: {'lr': 0.00019930525155254972, 'samples': 1331136, 'steps': 2599, 'loss/train': 2.6320011615753174} -09/20/2021 23:29:54 - INFO - __main__ - Step 41599: {'lr': 0.00019930525155254972, 'samples': 1331168, 'steps': 2599, 'loss/train': 2.534410238265991} -09/20/2021 23:29:54 - INFO - __main__ - Step 41600: {'lr': 0.00019930525155254972, 'samples': 1331200, 'steps': 2599, 'loss/train': 2.381643056869507} -09/20/2021 23:29:55 - INFO - __main__ - Step 41601: {'lr': 0.00019930450073627008, 'samples': 1331232, 'steps': 2600, 'loss/train': 1.5446834564208984} -09/20/2021 23:29:56 - INFO - __main__ - Step 41602: {'lr': 0.00019930450073627008, 'samples': 1331264, 'steps': 2600, 'loss/train': 1.0547354221343994} -09/20/2021 23:29:57 - INFO - __main__ - Step 41603: {'lr': 0.00019930450073627008, 'samples': 1331296, 'steps': 2600, 'loss/train': 0.39083966612815857} -09/20/2021 23:29:57 - INFO - __main__ - Step 41604: {'lr': 0.00019930450073627008, 'samples': 1331328, 'steps': 2600, 'loss/train': 1.2794413566589355} -09/20/2021 23:29:58 - INFO - __main__ - Step 41605: {'lr': 0.00019930450073627008, 'samples': 1331360, 'steps': 2600, 'loss/train': 2.183109760284424} -09/20/2021 23:29:59 - INFO - __main__ - Step 41606: {'lr': 0.00019930450073627008, 'samples': 1331392, 'steps': 2600, 'loss/train': 3.0229272842407227} -09/20/2021 23:30:00 - INFO - __main__ - Step 41607: {'lr': 0.00019930450073627008, 'samples': 1331424, 'steps': 2600, 'loss/train': 1.8562138080596924} -09/20/2021 23:30:00 - INFO - __main__ - Step 41608: {'lr': 0.00019930450073627008, 'samples': 1331456, 'steps': 2600, 'loss/train': 2.171518564224243} -09/20/2021 23:30:01 - INFO - __main__ - Step 41609: {'lr': 0.00019930450073627008, 'samples': 1331488, 'steps': 2600, 'loss/train': 1.9860522747039795} -09/20/2021 23:30:02 - INFO - __main__ - Step 41610: {'lr': 0.00019930450073627008, 'samples': 1331520, 'steps': 2600, 'loss/train': 2.4487764835357666} -09/20/2021 23:30:03 - INFO - __main__ - Step 41611: {'lr': 0.00019930450073627008, 'samples': 1331552, 'steps': 2600, 'loss/train': 1.9210864305496216} -09/20/2021 23:30:03 - INFO - __main__ - Step 41612: {'lr': 0.00019930450073627008, 'samples': 1331584, 'steps': 2600, 'loss/train': 2.233180522918701} -09/20/2021 23:30:04 - INFO - __main__ - Step 41613: {'lr': 0.00019930450073627008, 'samples': 1331616, 'steps': 2600, 'loss/train': 2.127793550491333} -09/20/2021 23:30:05 - INFO - __main__ - Step 41614: {'lr': 0.00019930450073627008, 'samples': 1331648, 'steps': 2600, 'loss/train': 1.8518617153167725} -09/20/2021 23:30:06 - INFO - __main__ - Step 41615: {'lr': 0.00019930450073627008, 'samples': 1331680, 'steps': 2600, 'loss/train': 2.2743656635284424} -09/20/2021 23:30:07 - INFO - __main__ - Step 41616: {'lr': 0.00019930450073627008, 'samples': 1331712, 'steps': 2600, 'loss/train': 2.205897331237793} -09/20/2021 23:30:08 - INFO - __main__ - Step 41617: {'lr': 0.00019930374951592078, 'samples': 1331744, 'steps': 2601, 'loss/train': 3.305837869644165} -09/20/2021 23:30:09 - INFO - __main__ - Step 41618: {'lr': 0.00019930374951592078, 'samples': 1331776, 'steps': 2601, 'loss/train': 2.768828868865967} -09/20/2021 23:30:09 - INFO - __main__ - Step 41619: {'lr': 0.00019930374951592078, 'samples': 1331808, 'steps': 2601, 'loss/train': 2.021946907043457} -09/20/2021 23:30:10 - INFO - __main__ - Step 41620: {'lr': 0.00019930374951592078, 'samples': 1331840, 'steps': 2601, 'loss/train': 1.0152639150619507} -09/20/2021 23:30:11 - INFO - __main__ - Step 41621: {'lr': 0.00019930374951592078, 'samples': 1331872, 'steps': 2601, 'loss/train': 1.6766235828399658} -09/20/2021 23:30:12 - INFO - __main__ - Step 41622: {'lr': 0.00019930374951592078, 'samples': 1331904, 'steps': 2601, 'loss/train': 2.409183979034424} -09/20/2021 23:30:12 - INFO - __main__ - Step 41623: {'lr': 0.00019930374951592078, 'samples': 1331936, 'steps': 2601, 'loss/train': 0.4765813946723938} -09/20/2021 23:30:13 - INFO - __main__ - Step 41624: {'lr': 0.00019930374951592078, 'samples': 1331968, 'steps': 2601, 'loss/train': 2.1570887565612793} -09/20/2021 23:30:14 - INFO - __main__ - Step 41625: {'lr': 0.00019930374951592078, 'samples': 1332000, 'steps': 2601, 'loss/train': 2.1058452129364014} -09/20/2021 23:30:15 - INFO - __main__ - Step 41626: {'lr': 0.00019930374951592078, 'samples': 1332032, 'steps': 2601, 'loss/train': 1.9347890615463257} -09/20/2021 23:30:15 - INFO - __main__ - Step 41627: {'lr': 0.00019930374951592078, 'samples': 1332064, 'steps': 2601, 'loss/train': 1.9320154190063477} -09/20/2021 23:30:16 - INFO - __main__ - Step 41628: {'lr': 0.00019930374951592078, 'samples': 1332096, 'steps': 2601, 'loss/train': 1.8813601732254028} -09/20/2021 23:30:17 - INFO - __main__ - Step 41629: {'lr': 0.00019930374951592078, 'samples': 1332128, 'steps': 2601, 'loss/train': 2.084581136703491} -09/20/2021 23:30:18 - INFO - __main__ - Step 41630: {'lr': 0.00019930374951592078, 'samples': 1332160, 'steps': 2601, 'loss/train': 1.3990399837493896} -09/20/2021 23:30:18 - INFO - __main__ - Step 41631: {'lr': 0.00019930374951592078, 'samples': 1332192, 'steps': 2601, 'loss/train': 1.6747791767120361} -09/20/2021 23:30:19 - INFO - __main__ - Step 41632: {'lr': 0.00019930374951592078, 'samples': 1332224, 'steps': 2601, 'loss/train': 3.0828301906585693} -09/20/2021 23:30:20 - INFO - __main__ - Step 41633: {'lr': 0.0001993029978915049, 'samples': 1332256, 'steps': 2602, 'loss/train': 2.3658206462860107} -09/20/2021 23:30:21 - INFO - __main__ - Step 41634: {'lr': 0.0001993029978915049, 'samples': 1332288, 'steps': 2602, 'loss/train': 1.4179173707962036} -09/20/2021 23:30:22 - INFO - __main__ - Step 41635: {'lr': 0.0001993029978915049, 'samples': 1332320, 'steps': 2602, 'loss/train': 2.205857515335083} -09/20/2021 23:30:22 - INFO - __main__ - Step 41636: {'lr': 0.0001993029978915049, 'samples': 1332352, 'steps': 2602, 'loss/train': 1.8649463653564453} -09/20/2021 23:30:23 - INFO - __main__ - Step 41637: {'lr': 0.0001993029978915049, 'samples': 1332384, 'steps': 2602, 'loss/train': 1.9387285709381104} -09/20/2021 23:30:24 - INFO - __main__ - Step 41638: {'lr': 0.0001993029978915049, 'samples': 1332416, 'steps': 2602, 'loss/train': 2.060011386871338} -09/20/2021 23:30:25 - INFO - __main__ - Step 41639: {'lr': 0.0001993029978915049, 'samples': 1332448, 'steps': 2602, 'loss/train': 2.02346134185791} -09/20/2021 23:30:25 - INFO - __main__ - Step 41640: {'lr': 0.0001993029978915049, 'samples': 1332480, 'steps': 2602, 'loss/train': 1.4714117050170898} -09/20/2021 23:30:26 - INFO - __main__ - Step 41641: {'lr': 0.0001993029978915049, 'samples': 1332512, 'steps': 2602, 'loss/train': 2.51607084274292} -09/20/2021 23:30:27 - INFO - __main__ - Step 41642: {'lr': 0.0001993029978915049, 'samples': 1332544, 'steps': 2602, 'loss/train': 1.8182719945907593} -09/20/2021 23:30:28 - INFO - __main__ - Step 41643: {'lr': 0.0001993029978915049, 'samples': 1332576, 'steps': 2602, 'loss/train': 2.426767349243164} -09/20/2021 23:30:28 - INFO - __main__ - Step 41644: {'lr': 0.0001993029978915049, 'samples': 1332608, 'steps': 2602, 'loss/train': 2.123649835586548} -09/20/2021 23:30:29 - INFO - __main__ - Step 41645: {'lr': 0.0001993029978915049, 'samples': 1332640, 'steps': 2602, 'loss/train': 2.1892144680023193} -09/20/2021 23:30:30 - INFO - __main__ - Step 41646: {'lr': 0.0001993029978915049, 'samples': 1332672, 'steps': 2602, 'loss/train': 2.0433712005615234} -09/20/2021 23:30:31 - INFO - __main__ - Step 41647: {'lr': 0.0001993029978915049, 'samples': 1332704, 'steps': 2602, 'loss/train': 1.809553861618042} -09/20/2021 23:30:32 - INFO - __main__ - Step 41648: {'lr': 0.0001993029978915049, 'samples': 1332736, 'steps': 2602, 'loss/train': 2.4934475421905518} -09/20/2021 23:30:33 - INFO - __main__ - Step 41649: {'lr': 0.00019930224586302552, 'samples': 1332768, 'steps': 2603, 'loss/train': 2.157378911972046} -09/20/2021 23:30:34 - INFO - __main__ - Step 41650: {'lr': 0.00019930224586302552, 'samples': 1332800, 'steps': 2603, 'loss/train': 2.36191463470459} -09/20/2021 23:30:34 - INFO - __main__ - Step 41651: {'lr': 0.00019930224586302552, 'samples': 1332832, 'steps': 2603, 'loss/train': 2.2952351570129395} -09/20/2021 23:30:35 - INFO - __main__ - Step 41652: {'lr': 0.00019930224586302552, 'samples': 1332864, 'steps': 2603, 'loss/train': 1.749068260192871} -09/20/2021 23:30:36 - INFO - __main__ - Step 41653: {'lr': 0.00019930224586302552, 'samples': 1332896, 'steps': 2603, 'loss/train': 1.857751727104187} -09/20/2021 23:30:37 - INFO - __main__ - Step 41654: {'lr': 0.00019930224586302552, 'samples': 1332928, 'steps': 2603, 'loss/train': 2.6580593585968018} -09/20/2021 23:30:37 - INFO - __main__ - Step 41655: {'lr': 0.00019930224586302552, 'samples': 1332960, 'steps': 2603, 'loss/train': 2.791206121444702} -09/20/2021 23:30:38 - INFO - __main__ - Step 41656: {'lr': 0.00019930224586302552, 'samples': 1332992, 'steps': 2603, 'loss/train': 2.006108045578003} -09/20/2021 23:30:39 - INFO - __main__ - Step 41657: {'lr': 0.00019930224586302552, 'samples': 1333024, 'steps': 2603, 'loss/train': 2.6981911659240723} -09/20/2021 23:30:40 - INFO - __main__ - Step 41658: {'lr': 0.00019930224586302552, 'samples': 1333056, 'steps': 2603, 'loss/train': 2.9634621143341064} -09/20/2021 23:30:40 - INFO - __main__ - Step 41659: {'lr': 0.00019930224586302552, 'samples': 1333088, 'steps': 2603, 'loss/train': 2.835695266723633} -09/20/2021 23:30:41 - INFO - __main__ - Step 41660: {'lr': 0.00019930224586302552, 'samples': 1333120, 'steps': 2603, 'loss/train': 3.0047643184661865} -09/20/2021 23:30:42 - INFO - __main__ - Step 41661: {'lr': 0.00019930224586302552, 'samples': 1333152, 'steps': 2603, 'loss/train': 2.432847023010254} -09/20/2021 23:30:43 - INFO - __main__ - Step 41662: {'lr': 0.00019930224586302552, 'samples': 1333184, 'steps': 2603, 'loss/train': 2.6576738357543945} -09/20/2021 23:30:43 - INFO - __main__ - Step 41663: {'lr': 0.00019930224586302552, 'samples': 1333216, 'steps': 2603, 'loss/train': 2.091892719268799} -09/20/2021 23:30:44 - INFO - __main__ - Step 41664: {'lr': 0.00019930224586302552, 'samples': 1333248, 'steps': 2603, 'loss/train': 1.65378737449646} -09/20/2021 23:30:45 - INFO - __main__ - Step 41665: {'lr': 0.0001993014934304857, 'samples': 1333280, 'steps': 2604, 'loss/train': 2.6459903717041016} -09/20/2021 23:30:46 - INFO - __main__ - Step 41666: {'lr': 0.0001993014934304857, 'samples': 1333312, 'steps': 2604, 'loss/train': 2.1417534351348877} -09/20/2021 23:30:47 - INFO - __main__ - Step 41667: {'lr': 0.0001993014934304857, 'samples': 1333344, 'steps': 2604, 'loss/train': 0.6250811219215393} -09/20/2021 23:30:47 - INFO - __main__ - Step 41668: {'lr': 0.0001993014934304857, 'samples': 1333376, 'steps': 2604, 'loss/train': 2.3510844707489014} -09/20/2021 23:30:48 - INFO - __main__ - Step 41669: {'lr': 0.0001993014934304857, 'samples': 1333408, 'steps': 2604, 'loss/train': 2.0991368293762207} -09/20/2021 23:30:49 - INFO - __main__ - Step 41670: {'lr': 0.0001993014934304857, 'samples': 1333440, 'steps': 2604, 'loss/train': 2.3818788528442383} -09/20/2021 23:30:50 - INFO - __main__ - Step 41671: {'lr': 0.0001993014934304857, 'samples': 1333472, 'steps': 2604, 'loss/train': 2.0573344230651855} -09/20/2021 23:30:50 - INFO - __main__ - Step 41672: {'lr': 0.0001993014934304857, 'samples': 1333504, 'steps': 2604, 'loss/train': 1.430457353591919} -09/20/2021 23:30:51 - INFO - __main__ - Step 41673: {'lr': 0.0001993014934304857, 'samples': 1333536, 'steps': 2604, 'loss/train': 1.8615814447402954} -09/20/2021 23:30:52 - INFO - __main__ - Step 41674: {'lr': 0.0001993014934304857, 'samples': 1333568, 'steps': 2604, 'loss/train': 2.6800270080566406} -09/20/2021 23:30:53 - INFO - __main__ - Step 41675: {'lr': 0.0001993014934304857, 'samples': 1333600, 'steps': 2604, 'loss/train': 1.8906493186950684} -09/20/2021 23:30:53 - INFO - __main__ - Step 41676: {'lr': 0.0001993014934304857, 'samples': 1333632, 'steps': 2604, 'loss/train': 2.904695749282837} -09/20/2021 23:30:54 - INFO - __main__ - Step 41677: {'lr': 0.0001993014934304857, 'samples': 1333664, 'steps': 2604, 'loss/train': 3.703956127166748} -09/20/2021 23:30:55 - INFO - __main__ - Step 41678: {'lr': 0.0001993014934304857, 'samples': 1333696, 'steps': 2604, 'loss/train': 3.1181676387786865} -09/20/2021 23:30:56 - INFO - __main__ - Step 41679: {'lr': 0.0001993014934304857, 'samples': 1333728, 'steps': 2604, 'loss/train': 2.8441805839538574} -09/20/2021 23:30:57 - INFO - __main__ - Step 41680: {'lr': 0.0001993014934304857, 'samples': 1333760, 'steps': 2604, 'loss/train': 2.9478843212127686} -09/20/2021 23:30:58 - INFO - __main__ - Step 41681: {'lr': 0.00019930074059388848, 'samples': 1333792, 'steps': 2605, 'loss/train': 2.157221555709839} -09/20/2021 23:30:58 - INFO - __main__ - Step 41682: {'lr': 0.00019930074059388848, 'samples': 1333824, 'steps': 2605, 'loss/train': 1.7102099657058716} -09/20/2021 23:30:59 - INFO - __main__ - Step 41683: {'lr': 0.00019930074059388848, 'samples': 1333856, 'steps': 2605, 'loss/train': 1.9035371541976929} -09/20/2021 23:31:00 - INFO - __main__ - Step 41684: {'lr': 0.00019930074059388848, 'samples': 1333888, 'steps': 2605, 'loss/train': 1.715274453163147} -09/20/2021 23:31:01 - INFO - __main__ - Step 41685: {'lr': 0.00019930074059388848, 'samples': 1333920, 'steps': 2605, 'loss/train': 2.193040609359741} -09/20/2021 23:31:01 - INFO - __main__ - Step 41686: {'lr': 0.00019930074059388848, 'samples': 1333952, 'steps': 2605, 'loss/train': 2.6579384803771973} -09/20/2021 23:31:02 - INFO - __main__ - Step 41687: {'lr': 0.00019930074059388848, 'samples': 1333984, 'steps': 2605, 'loss/train': 1.8699723482131958} -09/20/2021 23:31:03 - INFO - __main__ - Step 41688: {'lr': 0.00019930074059388848, 'samples': 1334016, 'steps': 2605, 'loss/train': 1.5457465648651123} -09/20/2021 23:31:04 - INFO - __main__ - Step 41689: {'lr': 0.00019930074059388848, 'samples': 1334048, 'steps': 2605, 'loss/train': 1.9633424282073975} -09/20/2021 23:31:04 - INFO - __main__ - Step 41690: {'lr': 0.00019930074059388848, 'samples': 1334080, 'steps': 2605, 'loss/train': 2.693737030029297} -09/20/2021 23:31:05 - INFO - __main__ - Step 41691: {'lr': 0.00019930074059388848, 'samples': 1334112, 'steps': 2605, 'loss/train': 1.2053754329681396} -09/20/2021 23:31:06 - INFO - __main__ - Step 41692: {'lr': 0.00019930074059388848, 'samples': 1334144, 'steps': 2605, 'loss/train': 3.113184928894043} -09/20/2021 23:31:07 - INFO - __main__ - Step 41693: {'lr': 0.00019930074059388848, 'samples': 1334176, 'steps': 2605, 'loss/train': 3.3540403842926025} -09/20/2021 23:31:07 - INFO - __main__ - Step 41694: {'lr': 0.00019930074059388848, 'samples': 1334208, 'steps': 2605, 'loss/train': 1.2903896570205688} -09/20/2021 23:31:08 - INFO - __main__ - Step 41695: {'lr': 0.00019930074059388848, 'samples': 1334240, 'steps': 2605, 'loss/train': 1.9870885610580444} -09/20/2021 23:31:09 - INFO - __main__ - Step 41696: {'lr': 0.00019930074059388848, 'samples': 1334272, 'steps': 2605, 'loss/train': 1.5603915452957153} -09/20/2021 23:31:10 - INFO - __main__ - Step 41697: {'lr': 0.0001992999873532369, 'samples': 1334304, 'steps': 2606, 'loss/train': 2.577909469604492} -09/20/2021 23:31:11 - INFO - __main__ - Step 41698: {'lr': 0.0001992999873532369, 'samples': 1334336, 'steps': 2606, 'loss/train': 2.5392000675201416} -09/20/2021 23:31:11 - INFO - __main__ - Step 41699: {'lr': 0.0001992999873532369, 'samples': 1334368, 'steps': 2606, 'loss/train': 2.2346508502960205} -09/20/2021 23:31:12 - INFO - __main__ - Step 41700: {'lr': 0.0001992999873532369, 'samples': 1334400, 'steps': 2606, 'loss/train': 2.404606342315674} -09/20/2021 23:31:13 - INFO - __main__ - Step 41701: {'lr': 0.0001992999873532369, 'samples': 1334432, 'steps': 2606, 'loss/train': 2.6529643535614014} -09/20/2021 23:31:14 - INFO - __main__ - Step 41702: {'lr': 0.0001992999873532369, 'samples': 1334464, 'steps': 2606, 'loss/train': 1.8553550243377686} -09/20/2021 23:31:14 - INFO - __main__ - Step 41703: {'lr': 0.0001992999873532369, 'samples': 1334496, 'steps': 2606, 'loss/train': 2.3308420181274414} -09/20/2021 23:31:15 - INFO - __main__ - Step 41704: {'lr': 0.0001992999873532369, 'samples': 1334528, 'steps': 2606, 'loss/train': 1.8038314580917358} -09/20/2021 23:31:16 - INFO - __main__ - Step 41705: {'lr': 0.0001992999873532369, 'samples': 1334560, 'steps': 2606, 'loss/train': 1.4947186708450317} -09/20/2021 23:31:17 - INFO - __main__ - Step 41706: {'lr': 0.0001992999873532369, 'samples': 1334592, 'steps': 2606, 'loss/train': 1.9981353282928467} -09/20/2021 23:31:17 - INFO - __main__ - Step 41707: {'lr': 0.0001992999873532369, 'samples': 1334624, 'steps': 2606, 'loss/train': 1.4687985181808472} -09/20/2021 23:31:18 - INFO - __main__ - Step 41708: {'lr': 0.0001992999873532369, 'samples': 1334656, 'steps': 2606, 'loss/train': 2.489276647567749} -09/20/2021 23:31:19 - INFO - __main__ - Step 41709: {'lr': 0.0001992999873532369, 'samples': 1334688, 'steps': 2606, 'loss/train': 2.293156623840332} -09/20/2021 23:31:20 - INFO - __main__ - Step 41710: {'lr': 0.0001992999873532369, 'samples': 1334720, 'steps': 2606, 'loss/train': 2.982715368270874} -09/20/2021 23:31:21 - INFO - __main__ - Step 41711: {'lr': 0.0001992999873532369, 'samples': 1334752, 'steps': 2606, 'loss/train': 1.9444128274917603} -09/20/2021 23:31:22 - INFO - __main__ - Step 41712: {'lr': 0.0001992999873532369, 'samples': 1334784, 'steps': 2606, 'loss/train': 2.104177236557007} -09/20/2021 23:31:23 - INFO - __main__ - Step 41713: {'lr': 0.0001992992337085341, 'samples': 1334816, 'steps': 2607, 'loss/train': 1.9005728960037231} -09/20/2021 23:31:24 - INFO - __main__ - Step 41714: {'lr': 0.0001992992337085341, 'samples': 1334848, 'steps': 2607, 'loss/train': 1.674974799156189} -09/20/2021 23:31:24 - INFO - __main__ - Step 41715: {'lr': 0.0001992992337085341, 'samples': 1334880, 'steps': 2607, 'loss/train': 2.286487340927124} -09/20/2021 23:31:25 - INFO - __main__ - Step 41716: {'lr': 0.0001992992337085341, 'samples': 1334912, 'steps': 2607, 'loss/train': 2.5108137130737305} -09/20/2021 23:31:26 - INFO - __main__ - Step 41717: {'lr': 0.0001992992337085341, 'samples': 1334944, 'steps': 2607, 'loss/train': 2.496800184249878} -09/20/2021 23:31:27 - INFO - __main__ - Step 41718: {'lr': 0.0001992992337085341, 'samples': 1334976, 'steps': 2607, 'loss/train': 1.6636770963668823} -09/20/2021 23:31:27 - INFO - __main__ - Step 41719: {'lr': 0.0001992992337085341, 'samples': 1335008, 'steps': 2607, 'loss/train': 0.17910966277122498} -09/20/2021 23:31:28 - INFO - __main__ - Step 41720: {'lr': 0.0001992992337085341, 'samples': 1335040, 'steps': 2607, 'loss/train': 0.10652398318052292} -09/20/2021 23:31:29 - INFO - __main__ - Step 41721: {'lr': 0.0001992992337085341, 'samples': 1335072, 'steps': 2607, 'loss/train': 2.8185954093933105} -09/20/2021 23:31:30 - INFO - __main__ - Step 41722: {'lr': 0.0001992992337085341, 'samples': 1335104, 'steps': 2607, 'loss/train': 2.2360751628875732} -09/20/2021 23:31:30 - INFO - __main__ - Step 41723: {'lr': 0.0001992992337085341, 'samples': 1335136, 'steps': 2607, 'loss/train': 2.9158010482788086} -09/20/2021 23:31:31 - INFO - __main__ - Step 41724: {'lr': 0.0001992992337085341, 'samples': 1335168, 'steps': 2607, 'loss/train': 1.981595516204834} -09/20/2021 23:31:32 - INFO - __main__ - Step 41725: {'lr': 0.0001992992337085341, 'samples': 1335200, 'steps': 2607, 'loss/train': 2.1424477100372314} -09/20/2021 23:31:33 - INFO - __main__ - Step 41726: {'lr': 0.0001992992337085341, 'samples': 1335232, 'steps': 2607, 'loss/train': 2.1806557178497314} -09/20/2021 23:31:33 - INFO - __main__ - Step 41727: {'lr': 0.0001992992337085341, 'samples': 1335264, 'steps': 2607, 'loss/train': 1.902596354484558} -09/20/2021 23:31:34 - INFO - __main__ - Step 41728: {'lr': 0.0001992992337085341, 'samples': 1335296, 'steps': 2607, 'loss/train': 1.5506622791290283} -09/20/2021 23:31:35 - INFO - __main__ - Step 41729: {'lr': 0.0001992984796597831, 'samples': 1335328, 'steps': 2608, 'loss/train': 1.7589876651763916} -09/20/2021 23:31:36 - INFO - __main__ - Step 41730: {'lr': 0.0001992984796597831, 'samples': 1335360, 'steps': 2608, 'loss/train': 2.005661964416504} -09/20/2021 23:31:36 - INFO - __main__ - Step 41731: {'lr': 0.0001992984796597831, 'samples': 1335392, 'steps': 2608, 'loss/train': 2.5839874744415283} -09/20/2021 23:31:37 - INFO - __main__ - Step 41732: {'lr': 0.0001992984796597831, 'samples': 1335424, 'steps': 2608, 'loss/train': 1.9122328758239746} -09/20/2021 23:31:38 - INFO - __main__ - Step 41733: {'lr': 0.0001992984796597831, 'samples': 1335456, 'steps': 2608, 'loss/train': 1.809848427772522} -09/20/2021 23:31:39 - INFO - __main__ - Step 41734: {'lr': 0.0001992984796597831, 'samples': 1335488, 'steps': 2608, 'loss/train': 2.659118413925171} -09/20/2021 23:31:39 - INFO - __main__ - Step 41735: {'lr': 0.0001992984796597831, 'samples': 1335520, 'steps': 2608, 'loss/train': 1.8124221563339233} -09/20/2021 23:31:40 - INFO - __main__ - Step 41736: {'lr': 0.0001992984796597831, 'samples': 1335552, 'steps': 2608, 'loss/train': 2.0279948711395264} -09/20/2021 23:31:41 - INFO - __main__ - Step 41737: {'lr': 0.0001992984796597831, 'samples': 1335584, 'steps': 2608, 'loss/train': 0.5884419083595276} -09/20/2021 23:31:42 - INFO - __main__ - Step 41738: {'lr': 0.0001992984796597831, 'samples': 1335616, 'steps': 2608, 'loss/train': 0.4445495903491974} -09/20/2021 23:31:42 - INFO - __main__ - Step 41739: {'lr': 0.0001992984796597831, 'samples': 1335648, 'steps': 2608, 'loss/train': 0.46413159370422363} -09/20/2021 23:31:43 - INFO - __main__ - Step 41740: {'lr': 0.0001992984796597831, 'samples': 1335680, 'steps': 2608, 'loss/train': 0.4913856089115143} -09/20/2021 23:31:44 - INFO - __main__ - Step 41741: {'lr': 0.0001992984796597831, 'samples': 1335712, 'steps': 2608, 'loss/train': 0.6229147911071777} -09/20/2021 23:31:45 - INFO - __main__ - Step 41742: {'lr': 0.0001992984796597831, 'samples': 1335744, 'steps': 2608, 'loss/train': 0.5172604918479919} -09/20/2021 23:31:45 - INFO - __main__ - Step 41743: {'lr': 0.0001992984796597831, 'samples': 1335776, 'steps': 2608, 'loss/train': 0.7488278150558472} -09/20/2021 23:31:46 - INFO - __main__ - Step 41744: {'lr': 0.0001992984796597831, 'samples': 1335808, 'steps': 2608, 'loss/train': 0.5971229076385498} -09/20/2021 23:31:47 - INFO - __main__ - Step 41745: {'lr': 0.00019929772520698696, 'samples': 1335840, 'steps': 2609, 'loss/train': 1.7066458463668823} -09/20/2021 23:31:49 - INFO - __main__ - Step 41746: {'lr': 0.00019929772520698696, 'samples': 1335872, 'steps': 2609, 'loss/train': 2.072360038757324} -09/20/2021 23:31:50 - INFO - __main__ - Step 41747: {'lr': 0.00019929772520698696, 'samples': 1335904, 'steps': 2609, 'loss/train': 2.0981245040893555} -09/20/2021 23:31:50 - INFO - __main__ - Step 41748: {'lr': 0.00019929772520698696, 'samples': 1335936, 'steps': 2609, 'loss/train': 2.244168996810913} -09/20/2021 23:31:51 - INFO - __main__ - Step 41749: {'lr': 0.00019929772520698696, 'samples': 1335968, 'steps': 2609, 'loss/train': 2.5583231449127197} -09/20/2021 23:31:52 - INFO - __main__ - Step 41750: {'lr': 0.00019929772520698696, 'samples': 1336000, 'steps': 2609, 'loss/train': 2.6972765922546387} -09/20/2021 23:31:53 - INFO - __main__ - Step 41751: {'lr': 0.00019929772520698696, 'samples': 1336032, 'steps': 2609, 'loss/train': 1.803523302078247} -09/20/2021 23:31:53 - INFO - __main__ - Step 41752: {'lr': 0.00019929772520698696, 'samples': 1336064, 'steps': 2609, 'loss/train': 1.8697086572647095} -09/20/2021 23:31:54 - INFO - __main__ - Step 41753: {'lr': 0.00019929772520698696, 'samples': 1336096, 'steps': 2609, 'loss/train': 1.9400948286056519} -09/20/2021 23:31:55 - INFO - __main__ - Step 41754: {'lr': 0.00019929772520698696, 'samples': 1336128, 'steps': 2609, 'loss/train': 2.5204544067382812} -09/20/2021 23:31:56 - INFO - __main__ - Step 41755: {'lr': 0.00019929772520698696, 'samples': 1336160, 'steps': 2609, 'loss/train': 2.5041298866271973} -09/20/2021 23:31:56 - INFO - __main__ - Step 41756: {'lr': 0.00019929772520698696, 'samples': 1336192, 'steps': 2609, 'loss/train': 1.7847325801849365} -09/20/2021 23:31:57 - INFO - __main__ - Step 41757: {'lr': 0.00019929772520698696, 'samples': 1336224, 'steps': 2609, 'loss/train': 1.822022557258606} -09/20/2021 23:31:58 - INFO - __main__ - Step 41758: {'lr': 0.00019929772520698696, 'samples': 1336256, 'steps': 2609, 'loss/train': 1.767637014389038} -09/20/2021 23:31:59 - INFO - __main__ - Step 41759: {'lr': 0.00019929772520698696, 'samples': 1336288, 'steps': 2609, 'loss/train': 1.7784868478775024} -09/20/2021 23:31:59 - INFO - __main__ - Step 41760: {'lr': 0.00019929772520698696, 'samples': 1336320, 'steps': 2609, 'loss/train': 1.7706140279769897} -09/20/2021 23:32:00 - INFO - __main__ - Step 41761: {'lr': 0.00019929697035014877, 'samples': 1336352, 'steps': 2610, 'loss/train': 1.7817063331604004} -09/20/2021 23:32:01 - INFO - __main__ - Step 41762: {'lr': 0.00019929697035014877, 'samples': 1336384, 'steps': 2610, 'loss/train': 1.8611936569213867} -09/20/2021 23:32:02 - INFO - __main__ - Step 41763: {'lr': 0.00019929697035014877, 'samples': 1336416, 'steps': 2610, 'loss/train': 1.8580125570297241} -09/20/2021 23:32:02 - INFO - __main__ - Step 41764: {'lr': 0.00019929697035014877, 'samples': 1336448, 'steps': 2610, 'loss/train': 1.7502713203430176} -09/20/2021 23:32:03 - INFO - __main__ - Step 41765: {'lr': 0.00019929697035014877, 'samples': 1336480, 'steps': 2610, 'loss/train': 1.7178246974945068} -09/20/2021 23:32:04 - INFO - __main__ - Step 41766: {'lr': 0.00019929697035014877, 'samples': 1336512, 'steps': 2610, 'loss/train': 2.075636625289917} -09/20/2021 23:32:05 - INFO - __main__ - Step 41767: {'lr': 0.00019929697035014877, 'samples': 1336544, 'steps': 2610, 'loss/train': 2.5915677547454834} -09/20/2021 23:32:05 - INFO - __main__ - Step 41768: {'lr': 0.00019929697035014877, 'samples': 1336576, 'steps': 2610, 'loss/train': 1.4254404306411743} -09/20/2021 23:32:06 - INFO - __main__ - Step 41769: {'lr': 0.00019929697035014877, 'samples': 1336608, 'steps': 2610, 'loss/train': 1.5779376029968262} -09/20/2021 23:32:07 - INFO - __main__ - Step 41770: {'lr': 0.00019929697035014877, 'samples': 1336640, 'steps': 2610, 'loss/train': 2.5650529861450195} -09/20/2021 23:32:08 - INFO - __main__ - Step 41771: {'lr': 0.00019929697035014877, 'samples': 1336672, 'steps': 2610, 'loss/train': 3.028681516647339} -09/20/2021 23:32:08 - INFO - __main__ - Step 41772: {'lr': 0.00019929697035014877, 'samples': 1336704, 'steps': 2610, 'loss/train': 1.8487725257873535} -09/20/2021 23:32:09 - INFO - __main__ - Step 41773: {'lr': 0.00019929697035014877, 'samples': 1336736, 'steps': 2610, 'loss/train': 2.5804741382598877} -09/20/2021 23:32:10 - INFO - __main__ - Step 41774: {'lr': 0.00019929697035014877, 'samples': 1336768, 'steps': 2610, 'loss/train': 1.9188672304153442} -09/20/2021 23:32:11 - INFO - __main__ - Step 41775: {'lr': 0.00019929697035014877, 'samples': 1336800, 'steps': 2610, 'loss/train': 2.5531833171844482} -09/20/2021 23:32:12 - INFO - __main__ - Step 41776: {'lr': 0.00019929697035014877, 'samples': 1336832, 'steps': 2610, 'loss/train': 1.9149144887924194} -09/20/2021 23:32:12 - INFO - __main__ - Step 41777: {'lr': 0.00019929621508927157, 'samples': 1336864, 'steps': 2611, 'loss/train': 1.8504102230072021} -09/20/2021 23:32:13 - INFO - __main__ - Step 41778: {'lr': 0.00019929621508927157, 'samples': 1336896, 'steps': 2611, 'loss/train': 3.3371403217315674} -09/20/2021 23:32:14 - INFO - __main__ - Step 41779: {'lr': 0.00019929621508927157, 'samples': 1336928, 'steps': 2611, 'loss/train': 2.3330533504486084} -09/20/2021 23:32:15 - INFO - __main__ - Step 41780: {'lr': 0.00019929621508927157, 'samples': 1336960, 'steps': 2611, 'loss/train': 2.5204083919525146} -09/20/2021 23:32:15 - INFO - __main__ - Step 41781: {'lr': 0.00019929621508927157, 'samples': 1336992, 'steps': 2611, 'loss/train': 2.3183176517486572} -09/20/2021 23:32:16 - INFO - __main__ - Step 41782: {'lr': 0.00019929621508927157, 'samples': 1337024, 'steps': 2611, 'loss/train': 1.9932317733764648} -09/20/2021 23:32:17 - INFO - __main__ - Step 41783: {'lr': 0.00019929621508927157, 'samples': 1337056, 'steps': 2611, 'loss/train': 2.528665065765381} -09/20/2021 23:32:18 - INFO - __main__ - Step 41784: {'lr': 0.00019929621508927157, 'samples': 1337088, 'steps': 2611, 'loss/train': 1.4369127750396729} -09/20/2021 23:32:19 - INFO - __main__ - Step 41785: {'lr': 0.00019929621508927157, 'samples': 1337120, 'steps': 2611, 'loss/train': 1.8749467134475708} -09/20/2021 23:32:20 - INFO - __main__ - Step 41786: {'lr': 0.00019929621508927157, 'samples': 1337152, 'steps': 2611, 'loss/train': 2.343923807144165} -09/20/2021 23:32:20 - INFO - __main__ - Step 41787: {'lr': 0.00019929621508927157, 'samples': 1337184, 'steps': 2611, 'loss/train': 1.993775725364685} -09/20/2021 23:32:21 - INFO - __main__ - Step 41788: {'lr': 0.00019929621508927157, 'samples': 1337216, 'steps': 2611, 'loss/train': 2.185824394226074} -09/20/2021 23:32:22 - INFO - __main__ - Step 41789: {'lr': 0.00019929621508927157, 'samples': 1337248, 'steps': 2611, 'loss/train': 2.809724807739258} -09/20/2021 23:32:23 - INFO - __main__ - Step 41790: {'lr': 0.00019929621508927157, 'samples': 1337280, 'steps': 2611, 'loss/train': 2.231325149536133} -09/20/2021 23:32:23 - INFO - __main__ - Step 41791: {'lr': 0.00019929621508927157, 'samples': 1337312, 'steps': 2611, 'loss/train': 2.036865472793579} -09/20/2021 23:32:24 - INFO - __main__ - Step 41792: {'lr': 0.00019929621508927157, 'samples': 1337344, 'steps': 2611, 'loss/train': 2.3392069339752197} -09/20/2021 23:32:25 - INFO - __main__ - Step 41793: {'lr': 0.00019929545942435847, 'samples': 1337376, 'steps': 2612, 'loss/train': 2.1289048194885254} -09/20/2021 23:32:26 - INFO - __main__ - Step 41794: {'lr': 0.00019929545942435847, 'samples': 1337408, 'steps': 2612, 'loss/train': 1.6013566255569458} -09/20/2021 23:32:27 - INFO - __main__ - Step 41795: {'lr': 0.00019929545942435847, 'samples': 1337440, 'steps': 2612, 'loss/train': 3.20587158203125} -09/20/2021 23:32:27 - INFO - __main__ - Step 41796: {'lr': 0.00019929545942435847, 'samples': 1337472, 'steps': 2612, 'loss/train': 2.4432249069213867} -09/20/2021 23:32:28 - INFO - __main__ - Step 41797: {'lr': 0.00019929545942435847, 'samples': 1337504, 'steps': 2612, 'loss/train': 3.1910438537597656} -09/20/2021 23:32:29 - INFO - __main__ - Step 41798: {'lr': 0.00019929545942435847, 'samples': 1337536, 'steps': 2612, 'loss/train': 1.7071483135223389} -09/20/2021 23:32:30 - INFO - __main__ - Step 41799: {'lr': 0.00019929545942435847, 'samples': 1337568, 'steps': 2612, 'loss/train': 2.4380176067352295} -09/20/2021 23:32:30 - INFO - __main__ - Step 41800: {'lr': 0.00019929545942435847, 'samples': 1337600, 'steps': 2612, 'loss/train': 1.9121862649917603} -09/20/2021 23:32:31 - INFO - __main__ - Step 41801: {'lr': 0.00019929545942435847, 'samples': 1337632, 'steps': 2612, 'loss/train': 2.521212100982666} -09/20/2021 23:32:32 - INFO - __main__ - Step 41802: {'lr': 0.00019929545942435847, 'samples': 1337664, 'steps': 2612, 'loss/train': 2.155393600463867} -09/20/2021 23:32:33 - INFO - __main__ - Step 41803: {'lr': 0.00019929545942435847, 'samples': 1337696, 'steps': 2612, 'loss/train': 1.8634344339370728} -09/20/2021 23:32:33 - INFO - __main__ - Step 41804: {'lr': 0.00019929545942435847, 'samples': 1337728, 'steps': 2612, 'loss/train': 2.5352680683135986} -09/20/2021 23:32:34 - INFO - __main__ - Step 41805: {'lr': 0.00019929545942435847, 'samples': 1337760, 'steps': 2612, 'loss/train': 1.6927980184555054} -09/20/2021 23:32:35 - INFO - __main__ - Step 41806: {'lr': 0.00019929545942435847, 'samples': 1337792, 'steps': 2612, 'loss/train': 2.3814427852630615} -09/20/2021 23:32:36 - INFO - __main__ - Step 41807: {'lr': 0.00019929545942435847, 'samples': 1337824, 'steps': 2612, 'loss/train': 2.1556570529937744} -09/20/2021 23:32:36 - INFO - __main__ - Step 41808: {'lr': 0.00019929545942435847, 'samples': 1337856, 'steps': 2612, 'loss/train': 2.3348307609558105} -09/20/2021 23:32:37 - INFO - __main__ - Step 41809: {'lr': 0.00019929470335541255, 'samples': 1337888, 'steps': 2613, 'loss/train': 3.1546759605407715} -09/20/2021 23:32:38 - INFO - __main__ - Step 41810: {'lr': 0.00019929470335541255, 'samples': 1337920, 'steps': 2613, 'loss/train': 1.0112260580062866} -09/20/2021 23:32:39 - INFO - __main__ - Step 41811: {'lr': 0.00019929470335541255, 'samples': 1337952, 'steps': 2613, 'loss/train': 2.1651687622070312} -09/20/2021 23:32:39 - INFO - __main__ - Step 41812: {'lr': 0.00019929470335541255, 'samples': 1337984, 'steps': 2613, 'loss/train': 2.5724356174468994} -09/20/2021 23:32:40 - INFO - __main__ - Step 41813: {'lr': 0.00019929470335541255, 'samples': 1338016, 'steps': 2613, 'loss/train': 2.3655903339385986} -09/20/2021 23:32:42 - INFO - __main__ - Step 41814: {'lr': 0.00019929470335541255, 'samples': 1338048, 'steps': 2613, 'loss/train': 2.783572196960449} -09/20/2021 23:32:43 - INFO - __main__ - Step 41815: {'lr': 0.00019929470335541255, 'samples': 1338080, 'steps': 2613, 'loss/train': 2.0616536140441895} -09/20/2021 23:32:44 - INFO - __main__ - Step 41816: {'lr': 0.00019929470335541255, 'samples': 1338112, 'steps': 2613, 'loss/train': 1.6099966764450073} -09/20/2021 23:32:44 - INFO - __main__ - Step 41817: {'lr': 0.00019929470335541255, 'samples': 1338144, 'steps': 2613, 'loss/train': 2.018817186355591} -09/20/2021 23:32:45 - INFO - __main__ - Step 41818: {'lr': 0.00019929470335541255, 'samples': 1338176, 'steps': 2613, 'loss/train': 2.0713133811950684} -09/20/2021 23:32:46 - INFO - __main__ - Step 41819: {'lr': 0.00019929470335541255, 'samples': 1338208, 'steps': 2613, 'loss/train': 1.9464802742004395} -09/20/2021 23:32:47 - INFO - __main__ - Step 41820: {'lr': 0.00019929470335541255, 'samples': 1338240, 'steps': 2613, 'loss/train': 1.9256492853164673} -09/20/2021 23:32:47 - INFO - __main__ - Step 41821: {'lr': 0.00019929470335541255, 'samples': 1338272, 'steps': 2613, 'loss/train': 2.076719284057617} -09/20/2021 23:32:48 - INFO - __main__ - Step 41822: {'lr': 0.00019929470335541255, 'samples': 1338304, 'steps': 2613, 'loss/train': 2.2767181396484375} -09/20/2021 23:32:49 - INFO - __main__ - Step 41823: {'lr': 0.00019929470335541255, 'samples': 1338336, 'steps': 2613, 'loss/train': 1.8022929430007935} -09/20/2021 23:32:50 - INFO - __main__ - Step 41824: {'lr': 0.00019929470335541255, 'samples': 1338368, 'steps': 2613, 'loss/train': 1.7298884391784668} -09/20/2021 23:32:50 - INFO - __main__ - Step 41825: {'lr': 0.00019929394688243684, 'samples': 1338400, 'steps': 2614, 'loss/train': 1.8992339372634888} -09/20/2021 23:32:51 - INFO - __main__ - Step 41826: {'lr': 0.00019929394688243684, 'samples': 1338432, 'steps': 2614, 'loss/train': 3.364156484603882} -09/20/2021 23:32:52 - INFO - __main__ - Step 41827: {'lr': 0.00019929394688243684, 'samples': 1338464, 'steps': 2614, 'loss/train': 2.1321067810058594} -09/20/2021 23:32:53 - INFO - __main__ - Step 41828: {'lr': 0.00019929394688243684, 'samples': 1338496, 'steps': 2614, 'loss/train': 3.4990475177764893} -09/20/2021 23:32:53 - INFO - __main__ - Step 41829: {'lr': 0.00019929394688243684, 'samples': 1338528, 'steps': 2614, 'loss/train': 1.610357642173767} -09/20/2021 23:32:54 - INFO - __main__ - Step 41830: {'lr': 0.00019929394688243684, 'samples': 1338560, 'steps': 2614, 'loss/train': 1.0857793092727661} -09/20/2021 23:32:55 - INFO - __main__ - Step 41831: {'lr': 0.00019929394688243684, 'samples': 1338592, 'steps': 2614, 'loss/train': 1.941445231437683} -09/20/2021 23:32:56 - INFO - __main__ - Step 41832: {'lr': 0.00019929394688243684, 'samples': 1338624, 'steps': 2614, 'loss/train': 1.783205270767212} -09/20/2021 23:32:56 - INFO - __main__ - Step 41833: {'lr': 0.00019929394688243684, 'samples': 1338656, 'steps': 2614, 'loss/train': 2.0409607887268066} -09/20/2021 23:32:57 - INFO - __main__ - Step 41834: {'lr': 0.00019929394688243684, 'samples': 1338688, 'steps': 2614, 'loss/train': 2.4682369232177734} -09/20/2021 23:32:58 - INFO - __main__ - Step 41835: {'lr': 0.00019929394688243684, 'samples': 1338720, 'steps': 2614, 'loss/train': 2.7113449573516846} -09/20/2021 23:32:59 - INFO - __main__ - Step 41836: {'lr': 0.00019929394688243684, 'samples': 1338752, 'steps': 2614, 'loss/train': 2.8200082778930664} -09/20/2021 23:32:59 - INFO - __main__ - Step 41837: {'lr': 0.00019929394688243684, 'samples': 1338784, 'steps': 2614, 'loss/train': 2.1029882431030273} -09/20/2021 23:33:00 - INFO - __main__ - Step 41838: {'lr': 0.00019929394688243684, 'samples': 1338816, 'steps': 2614, 'loss/train': 2.9756176471710205} -09/20/2021 23:33:01 - INFO - __main__ - Step 41839: {'lr': 0.00019929394688243684, 'samples': 1338848, 'steps': 2614, 'loss/train': 1.8704441785812378} -09/20/2021 23:33:02 - INFO - __main__ - Step 41840: {'lr': 0.00019929394688243684, 'samples': 1338880, 'steps': 2614, 'loss/train': 2.1186347007751465} -09/20/2021 23:33:03 - INFO - __main__ - Step 41841: {'lr': 0.00019929319000543445, 'samples': 1338912, 'steps': 2615, 'loss/train': 1.6226775646209717} -09/20/2021 23:33:03 - INFO - __main__ - Step 41842: {'lr': 0.00019929319000543445, 'samples': 1338944, 'steps': 2615, 'loss/train': 0.7108607888221741} -09/20/2021 23:33:04 - INFO - __main__ - Step 41843: {'lr': 0.00019929319000543445, 'samples': 1338976, 'steps': 2615, 'loss/train': 1.4966930150985718} -09/20/2021 23:33:05 - INFO - __main__ - Step 41844: {'lr': 0.00019929319000543445, 'samples': 1339008, 'steps': 2615, 'loss/train': 2.7353811264038086} -09/20/2021 23:33:06 - INFO - __main__ - Step 41845: {'lr': 0.00019929319000543445, 'samples': 1339040, 'steps': 2615, 'loss/train': 1.902119755744934} -09/20/2021 23:33:07 - INFO - __main__ - Step 41846: {'lr': 0.00019929319000543445, 'samples': 1339072, 'steps': 2615, 'loss/train': 2.57002329826355} -09/20/2021 23:33:08 - INFO - __main__ - Step 41847: {'lr': 0.00019929319000543445, 'samples': 1339104, 'steps': 2615, 'loss/train': 2.0991835594177246} -09/20/2021 23:33:08 - INFO - __main__ - Step 41848: {'lr': 0.00019929319000543445, 'samples': 1339136, 'steps': 2615, 'loss/train': 2.379549741744995} -09/20/2021 23:33:09 - INFO - __main__ - Step 41849: {'lr': 0.00019929319000543445, 'samples': 1339168, 'steps': 2615, 'loss/train': 2.4754292964935303} -09/20/2021 23:33:10 - INFO - __main__ - Step 41850: {'lr': 0.00019929319000543445, 'samples': 1339200, 'steps': 2615, 'loss/train': 2.597228765487671} -09/20/2021 23:33:11 - INFO - __main__ - Step 41851: {'lr': 0.00019929319000543445, 'samples': 1339232, 'steps': 2615, 'loss/train': 0.7170040607452393} -09/20/2021 23:33:11 - INFO - __main__ - Step 41852: {'lr': 0.00019929319000543445, 'samples': 1339264, 'steps': 2615, 'loss/train': 2.090292453765869} -09/20/2021 23:33:12 - INFO - __main__ - Step 41853: {'lr': 0.00019929319000543445, 'samples': 1339296, 'steps': 2615, 'loss/train': 1.7791671752929688} -09/20/2021 23:33:13 - INFO - __main__ - Step 41854: {'lr': 0.00019929319000543445, 'samples': 1339328, 'steps': 2615, 'loss/train': 2.5059428215026855} -09/20/2021 23:33:14 - INFO - __main__ - Step 41855: {'lr': 0.00019929319000543445, 'samples': 1339360, 'steps': 2615, 'loss/train': 1.876569151878357} -09/20/2021 23:33:14 - INFO - __main__ - Step 41856: {'lr': 0.00019929319000543445, 'samples': 1339392, 'steps': 2615, 'loss/train': 2.2584145069122314} -09/20/2021 23:33:15 - INFO - __main__ - Step 41857: {'lr': 0.00019929243272440847, 'samples': 1339424, 'steps': 2616, 'loss/train': 2.4283294677734375} -09/20/2021 23:33:16 - INFO - __main__ - Step 41858: {'lr': 0.00019929243272440847, 'samples': 1339456, 'steps': 2616, 'loss/train': 2.483258008956909} -09/20/2021 23:33:17 - INFO - __main__ - Step 41859: {'lr': 0.00019929243272440847, 'samples': 1339488, 'steps': 2616, 'loss/train': 2.043064594268799} -09/20/2021 23:33:18 - INFO - __main__ - Step 41860: {'lr': 0.00019929243272440847, 'samples': 1339520, 'steps': 2616, 'loss/train': 2.317267894744873} -09/20/2021 23:33:18 - INFO - __main__ - Step 41861: {'lr': 0.00019929243272440847, 'samples': 1339552, 'steps': 2616, 'loss/train': 0.8545379042625427} -09/20/2021 23:33:19 - INFO - __main__ - Step 41862: {'lr': 0.00019929243272440847, 'samples': 1339584, 'steps': 2616, 'loss/train': 2.3313896656036377} -09/20/2021 23:33:20 - INFO - __main__ - Step 41863: {'lr': 0.00019929243272440847, 'samples': 1339616, 'steps': 2616, 'loss/train': 1.7157994508743286} -09/20/2021 23:33:21 - INFO - __main__ - Step 41864: {'lr': 0.00019929243272440847, 'samples': 1339648, 'steps': 2616, 'loss/train': 2.3352231979370117} -09/20/2021 23:33:21 - INFO - __main__ - Step 41865: {'lr': 0.00019929243272440847, 'samples': 1339680, 'steps': 2616, 'loss/train': 1.5841983556747437} -09/20/2021 23:33:22 - INFO - __main__ - Step 41866: {'lr': 0.00019929243272440847, 'samples': 1339712, 'steps': 2616, 'loss/train': 2.215148448944092} -09/20/2021 23:33:23 - INFO - __main__ - Step 41867: {'lr': 0.00019929243272440847, 'samples': 1339744, 'steps': 2616, 'loss/train': 1.4567067623138428} -09/20/2021 23:33:24 - INFO - __main__ - Step 41868: {'lr': 0.00019929243272440847, 'samples': 1339776, 'steps': 2616, 'loss/train': 1.77573823928833} -09/20/2021 23:33:24 - INFO - __main__ - Step 41869: {'lr': 0.00019929243272440847, 'samples': 1339808, 'steps': 2616, 'loss/train': 2.3407394886016846} -09/20/2021 23:33:25 - INFO - __main__ - Step 41870: {'lr': 0.00019929243272440847, 'samples': 1339840, 'steps': 2616, 'loss/train': 0.4173504114151001} -09/20/2021 23:33:26 - INFO - __main__ - Step 41871: {'lr': 0.00019929243272440847, 'samples': 1339872, 'steps': 2616, 'loss/train': 2.005312204360962} -09/20/2021 23:33:27 - INFO - __main__ - Step 41872: {'lr': 0.00019929243272440847, 'samples': 1339904, 'steps': 2616, 'loss/train': 2.0021626949310303} -09/20/2021 23:33:27 - INFO - __main__ - Step 41873: {'lr': 0.00019929167503936196, 'samples': 1339936, 'steps': 2617, 'loss/train': 1.949554204940796} -09/20/2021 23:33:28 - INFO - __main__ - Step 41874: {'lr': 0.00019929167503936196, 'samples': 1339968, 'steps': 2617, 'loss/train': 2.7266674041748047} -09/20/2021 23:33:29 - INFO - __main__ - Step 41875: {'lr': 0.00019929167503936196, 'samples': 1340000, 'steps': 2617, 'loss/train': 2.220593214035034} -09/20/2021 23:33:30 - INFO - __main__ - Step 41876: {'lr': 0.00019929167503936196, 'samples': 1340032, 'steps': 2617, 'loss/train': 1.5407217741012573} -09/20/2021 23:33:31 - INFO - __main__ - Step 41877: {'lr': 0.00019929167503936196, 'samples': 1340064, 'steps': 2617, 'loss/train': 2.3395681381225586} -09/20/2021 23:33:32 - INFO - __main__ - Step 41878: {'lr': 0.00019929167503936196, 'samples': 1340096, 'steps': 2617, 'loss/train': 2.1189699172973633} -09/20/2021 23:33:32 - INFO - __main__ - Step 41879: {'lr': 0.00019929167503936196, 'samples': 1340128, 'steps': 2617, 'loss/train': 2.7392938137054443} -09/20/2021 23:33:33 - INFO - __main__ - Step 41880: {'lr': 0.00019929167503936196, 'samples': 1340160, 'steps': 2617, 'loss/train': 2.7786054611206055} -09/20/2021 23:33:34 - INFO - __main__ - Step 41881: {'lr': 0.00019929167503936196, 'samples': 1340192, 'steps': 2617, 'loss/train': 2.25307035446167} -09/20/2021 23:33:35 - INFO - __main__ - Step 41882: {'lr': 0.00019929167503936196, 'samples': 1340224, 'steps': 2617, 'loss/train': 1.6573721170425415} -09/20/2021 23:33:35 - INFO - __main__ - Step 41883: {'lr': 0.00019929167503936196, 'samples': 1340256, 'steps': 2617, 'loss/train': 1.7052950859069824} -09/20/2021 23:33:36 - INFO - __main__ - Step 41884: {'lr': 0.00019929167503936196, 'samples': 1340288, 'steps': 2617, 'loss/train': 2.483840227127075} -09/20/2021 23:33:37 - INFO - __main__ - Step 41885: {'lr': 0.00019929167503936196, 'samples': 1340320, 'steps': 2617, 'loss/train': 0.6949535608291626} -09/20/2021 23:33:38 - INFO - __main__ - Step 41886: {'lr': 0.00019929167503936196, 'samples': 1340352, 'steps': 2617, 'loss/train': 2.7875735759735107} -09/20/2021 23:33:38 - INFO - __main__ - Step 41887: {'lr': 0.00019929167503936196, 'samples': 1340384, 'steps': 2617, 'loss/train': 2.450923204421997} -09/20/2021 23:33:39 - INFO - __main__ - Step 41888: {'lr': 0.00019929167503936196, 'samples': 1340416, 'steps': 2617, 'loss/train': 2.9186642169952393} -09/20/2021 23:33:40 - INFO - __main__ - Step 41889: {'lr': 0.000199290916950298, 'samples': 1340448, 'steps': 2618, 'loss/train': 2.381920099258423} -09/20/2021 23:33:41 - INFO - __main__ - Step 41890: {'lr': 0.000199290916950298, 'samples': 1340480, 'steps': 2618, 'loss/train': 3.087196111679077} -09/20/2021 23:33:42 - INFO - __main__ - Step 41891: {'lr': 0.000199290916950298, 'samples': 1340512, 'steps': 2618, 'loss/train': 2.621032953262329} -09/20/2021 23:33:42 - INFO - __main__ - Step 41892: {'lr': 0.000199290916950298, 'samples': 1340544, 'steps': 2618, 'loss/train': 1.872279167175293} -09/20/2021 23:33:43 - INFO - __main__ - Step 41893: {'lr': 0.000199290916950298, 'samples': 1340576, 'steps': 2618, 'loss/train': 1.8492588996887207} -09/20/2021 23:33:44 - INFO - __main__ - Step 41894: {'lr': 0.000199290916950298, 'samples': 1340608, 'steps': 2618, 'loss/train': 2.225602388381958} -09/20/2021 23:33:45 - INFO - __main__ - Step 41895: {'lr': 0.000199290916950298, 'samples': 1340640, 'steps': 2618, 'loss/train': 2.868306875228882} -09/20/2021 23:33:45 - INFO - __main__ - Step 41896: {'lr': 0.000199290916950298, 'samples': 1340672, 'steps': 2618, 'loss/train': 1.6101006269454956} -09/20/2021 23:33:46 - INFO - __main__ - Step 41897: {'lr': 0.000199290916950298, 'samples': 1340704, 'steps': 2618, 'loss/train': 2.0977060794830322} -09/20/2021 23:33:47 - INFO - __main__ - Step 41898: {'lr': 0.000199290916950298, 'samples': 1340736, 'steps': 2618, 'loss/train': 1.9729410409927368} -09/20/2021 23:33:48 - INFO - __main__ - Step 41899: {'lr': 0.000199290916950298, 'samples': 1340768, 'steps': 2618, 'loss/train': 3.4565250873565674} -09/20/2021 23:33:48 - INFO - __main__ - Step 41900: {'lr': 0.000199290916950298, 'samples': 1340800, 'steps': 2618, 'loss/train': 1.3166778087615967} -09/20/2021 23:33:49 - INFO - __main__ - Step 41901: {'lr': 0.000199290916950298, 'samples': 1340832, 'steps': 2618, 'loss/train': 3.151984691619873} -09/20/2021 23:33:50 - INFO - __main__ - Step 41902: {'lr': 0.000199290916950298, 'samples': 1340864, 'steps': 2618, 'loss/train': 3.1459052562713623} -09/20/2021 23:33:51 - INFO - __main__ - Step 41903: {'lr': 0.000199290916950298, 'samples': 1340896, 'steps': 2618, 'loss/train': 1.7540719509124756} -09/20/2021 23:33:51 - INFO - __main__ - Step 41904: {'lr': 0.000199290916950298, 'samples': 1340928, 'steps': 2618, 'loss/train': 1.4212621450424194} -09/20/2021 23:33:52 - INFO - __main__ - Step 41905: {'lr': 0.0001992901584572197, 'samples': 1340960, 'steps': 2619, 'loss/train': 1.824142336845398} -09/20/2021 23:33:54 - INFO - __main__ - Step 41906: {'lr': 0.0001992901584572197, 'samples': 1340992, 'steps': 2619, 'loss/train': 2.241617441177368} -09/20/2021 23:33:54 - INFO - __main__ - Step 41907: {'lr': 0.0001992901584572197, 'samples': 1341024, 'steps': 2619, 'loss/train': 2.419896364212036} -09/20/2021 23:33:55 - INFO - __main__ - Step 41908: {'lr': 0.0001992901584572197, 'samples': 1341056, 'steps': 2619, 'loss/train': 2.113981008529663} -09/20/2021 23:33:56 - INFO - __main__ - Step 41909: {'lr': 0.0001992901584572197, 'samples': 1341088, 'steps': 2619, 'loss/train': 1.7476314306259155} -09/20/2021 23:33:57 - INFO - __main__ - Step 41910: {'lr': 0.0001992901584572197, 'samples': 1341120, 'steps': 2619, 'loss/train': 2.873492479324341} -09/20/2021 23:33:57 - INFO - __main__ - Step 41911: {'lr': 0.0001992901584572197, 'samples': 1341152, 'steps': 2619, 'loss/train': 2.0778677463531494} -09/20/2021 23:33:58 - INFO - __main__ - Step 41912: {'lr': 0.0001992901584572197, 'samples': 1341184, 'steps': 2619, 'loss/train': 1.812197208404541} -09/20/2021 23:33:59 - INFO - __main__ - Step 41913: {'lr': 0.0001992901584572197, 'samples': 1341216, 'steps': 2619, 'loss/train': 3.3034141063690186} -09/20/2021 23:34:00 - INFO - __main__ - Step 41914: {'lr': 0.0001992901584572197, 'samples': 1341248, 'steps': 2619, 'loss/train': 2.2505085468292236} -09/20/2021 23:34:00 - INFO - __main__ - Step 41915: {'lr': 0.0001992901584572197, 'samples': 1341280, 'steps': 2619, 'loss/train': 0.5740155577659607} -09/20/2021 23:34:01 - INFO - __main__ - Step 41916: {'lr': 0.0001992901584572197, 'samples': 1341312, 'steps': 2619, 'loss/train': 2.128246545791626} -09/20/2021 23:34:02 - INFO - __main__ - Step 41917: {'lr': 0.0001992901584572197, 'samples': 1341344, 'steps': 2619, 'loss/train': 1.0170170068740845} -09/20/2021 23:34:03 - INFO - __main__ - Step 41918: {'lr': 0.0001992901584572197, 'samples': 1341376, 'steps': 2619, 'loss/train': 2.2528181076049805} -09/20/2021 23:34:03 - INFO - __main__ - Step 41919: {'lr': 0.0001992901584572197, 'samples': 1341408, 'steps': 2619, 'loss/train': 2.31174898147583} -09/20/2021 23:34:04 - INFO - __main__ - Step 41920: {'lr': 0.0001992901584572197, 'samples': 1341440, 'steps': 2619, 'loss/train': 2.7157790660858154} -09/20/2021 23:34:05 - INFO - __main__ - Step 41921: {'lr': 0.0001992893995601301, 'samples': 1341472, 'steps': 2620, 'loss/train': 2.947084426879883} -09/20/2021 23:34:06 - INFO - __main__ - Step 41922: {'lr': 0.0001992893995601301, 'samples': 1341504, 'steps': 2620, 'loss/train': 0.1621875762939453} -09/20/2021 23:34:06 - INFO - __main__ - Step 41923: {'lr': 0.0001992893995601301, 'samples': 1341536, 'steps': 2620, 'loss/train': 0.1614854335784912} -09/20/2021 23:34:07 - INFO - __main__ - Step 41924: {'lr': 0.0001992893995601301, 'samples': 1341568, 'steps': 2620, 'loss/train': 1.360939383506775} -09/20/2021 23:34:08 - INFO - __main__ - Step 41925: {'lr': 0.0001992893995601301, 'samples': 1341600, 'steps': 2620, 'loss/train': 2.982848644256592} -09/20/2021 23:34:09 - INFO - __main__ - Step 41926: {'lr': 0.0001992893995601301, 'samples': 1341632, 'steps': 2620, 'loss/train': 3.0233607292175293} -09/20/2021 23:34:09 - INFO - __main__ - Step 41927: {'lr': 0.0001992893995601301, 'samples': 1341664, 'steps': 2620, 'loss/train': 0.9611876606941223} -09/20/2021 23:34:10 - INFO - __main__ - Step 41928: {'lr': 0.0001992893995601301, 'samples': 1341696, 'steps': 2620, 'loss/train': 1.2116795778274536} -09/20/2021 23:34:11 - INFO - __main__ - Step 41929: {'lr': 0.0001992893995601301, 'samples': 1341728, 'steps': 2620, 'loss/train': 2.2575809955596924} -09/20/2021 23:34:12 - INFO - __main__ - Step 41930: {'lr': 0.0001992893995601301, 'samples': 1341760, 'steps': 2620, 'loss/train': 2.0344274044036865} -09/20/2021 23:34:12 - INFO - __main__ - Step 41931: {'lr': 0.0001992893995601301, 'samples': 1341792, 'steps': 2620, 'loss/train': 1.8897417783737183} -09/20/2021 23:34:13 - INFO - __main__ - Step 41932: {'lr': 0.0001992893995601301, 'samples': 1341824, 'steps': 2620, 'loss/train': 3.293395519256592} -09/20/2021 23:34:14 - INFO - __main__ - Step 41933: {'lr': 0.0001992893995601301, 'samples': 1341856, 'steps': 2620, 'loss/train': 2.058269500732422} -09/20/2021 23:34:15 - INFO - __main__ - Step 41934: {'lr': 0.0001992893995601301, 'samples': 1341888, 'steps': 2620, 'loss/train': 3.4943268299102783} -09/20/2021 23:34:15 - INFO - __main__ - Step 41935: {'lr': 0.0001992893995601301, 'samples': 1341920, 'steps': 2620, 'loss/train': 1.8274117708206177} -09/20/2021 23:34:16 - INFO - __main__ - Step 41936: {'lr': 0.0001992893995601301, 'samples': 1341952, 'steps': 2620, 'loss/train': 2.9410574436187744} -09/20/2021 23:34:17 - INFO - __main__ - Step 41937: {'lr': 0.00019928864025903236, 'samples': 1341984, 'steps': 2621, 'loss/train': 2.038113594055176} -09/20/2021 23:34:18 - INFO - __main__ - Step 41938: {'lr': 0.00019928864025903236, 'samples': 1342016, 'steps': 2621, 'loss/train': 2.1363675594329834} -09/20/2021 23:34:19 - INFO - __main__ - Step 41939: {'lr': 0.00019928864025903236, 'samples': 1342048, 'steps': 2621, 'loss/train': 2.383470058441162} -09/20/2021 23:34:20 - INFO - __main__ - Step 41940: {'lr': 0.00019928864025903236, 'samples': 1342080, 'steps': 2621, 'loss/train': 2.3475911617279053} -09/20/2021 23:34:21 - INFO - __main__ - Step 41941: {'lr': 0.00019928864025903236, 'samples': 1342112, 'steps': 2621, 'loss/train': 1.8034067153930664} -09/20/2021 23:34:21 - INFO - __main__ - Step 41942: {'lr': 0.00019928864025903236, 'samples': 1342144, 'steps': 2621, 'loss/train': 1.2000638246536255} -09/20/2021 23:34:22 - INFO - __main__ - Step 41943: {'lr': 0.00019928864025903236, 'samples': 1342176, 'steps': 2621, 'loss/train': 2.3477015495300293} -09/20/2021 23:34:23 - INFO - __main__ - Step 41944: {'lr': 0.00019928864025903236, 'samples': 1342208, 'steps': 2621, 'loss/train': 2.0554282665252686} -09/20/2021 23:34:24 - INFO - __main__ - Step 41945: {'lr': 0.00019928864025903236, 'samples': 1342240, 'steps': 2621, 'loss/train': 2.0509822368621826} -09/20/2021 23:34:24 - INFO - __main__ - Step 41946: {'lr': 0.00019928864025903236, 'samples': 1342272, 'steps': 2621, 'loss/train': 1.8602625131607056} -09/20/2021 23:34:25 - INFO - __main__ - Step 41947: {'lr': 0.00019928864025903236, 'samples': 1342304, 'steps': 2621, 'loss/train': 2.3943588733673096} -09/20/2021 23:34:26 - INFO - __main__ - Step 41948: {'lr': 0.00019928864025903236, 'samples': 1342336, 'steps': 2621, 'loss/train': 2.0429794788360596} -09/20/2021 23:34:27 - INFO - __main__ - Step 41949: {'lr': 0.00019928864025903236, 'samples': 1342368, 'steps': 2621, 'loss/train': 1.3712742328643799} -09/20/2021 23:34:27 - INFO - __main__ - Step 41950: {'lr': 0.00019928864025903236, 'samples': 1342400, 'steps': 2621, 'loss/train': 1.934901237487793} -09/20/2021 23:34:28 - INFO - __main__ - Step 41951: {'lr': 0.00019928864025903236, 'samples': 1342432, 'steps': 2621, 'loss/train': 1.7502204179763794} -09/20/2021 23:34:29 - INFO - __main__ - Step 41952: {'lr': 0.00019928864025903236, 'samples': 1342464, 'steps': 2621, 'loss/train': 0.36724865436553955} -09/20/2021 23:34:30 - INFO - __main__ - Step 41953: {'lr': 0.0001992878805539295, 'samples': 1342496, 'steps': 2622, 'loss/train': 2.900273323059082} -09/20/2021 23:34:31 - INFO - __main__ - Step 41954: {'lr': 0.0001992878805539295, 'samples': 1342528, 'steps': 2622, 'loss/train': 2.4193079471588135} -09/20/2021 23:34:31 - INFO - __main__ - Step 41955: {'lr': 0.0001992878805539295, 'samples': 1342560, 'steps': 2622, 'loss/train': 0.9479556679725647} -09/20/2021 23:34:32 - INFO - __main__ - Step 41956: {'lr': 0.0001992878805539295, 'samples': 1342592, 'steps': 2622, 'loss/train': 2.7102646827697754} -09/20/2021 23:34:33 - INFO - __main__ - Step 41957: {'lr': 0.0001992878805539295, 'samples': 1342624, 'steps': 2622, 'loss/train': 2.4497663974761963} -09/20/2021 23:34:34 - INFO - __main__ - Step 41958: {'lr': 0.0001992878805539295, 'samples': 1342656, 'steps': 2622, 'loss/train': 2.460404396057129} -09/20/2021 23:34:34 - INFO - __main__ - Step 41959: {'lr': 0.0001992878805539295, 'samples': 1342688, 'steps': 2622, 'loss/train': 0.39865878224372864} -09/20/2021 23:34:35 - INFO - __main__ - Step 41960: {'lr': 0.0001992878805539295, 'samples': 1342720, 'steps': 2622, 'loss/train': 2.745837688446045} -09/20/2021 23:34:36 - INFO - __main__ - Step 41961: {'lr': 0.0001992878805539295, 'samples': 1342752, 'steps': 2622, 'loss/train': 1.944654107093811} -09/20/2021 23:34:37 - INFO - __main__ - Step 41962: {'lr': 0.0001992878805539295, 'samples': 1342784, 'steps': 2622, 'loss/train': 0.8603934049606323} -09/20/2021 23:34:37 - INFO - __main__ - Step 41963: {'lr': 0.0001992878805539295, 'samples': 1342816, 'steps': 2622, 'loss/train': 3.19810152053833} -09/20/2021 23:34:38 - INFO - __main__ - Step 41964: {'lr': 0.0001992878805539295, 'samples': 1342848, 'steps': 2622, 'loss/train': 2.749063014984131} -09/20/2021 23:34:39 - INFO - __main__ - Step 41965: {'lr': 0.0001992878805539295, 'samples': 1342880, 'steps': 2622, 'loss/train': 2.55367112159729} -09/20/2021 23:34:40 - INFO - __main__ - Step 41966: {'lr': 0.0001992878805539295, 'samples': 1342912, 'steps': 2622, 'loss/train': 1.9425679445266724} -09/20/2021 23:34:40 - INFO - __main__ - Step 41967: {'lr': 0.0001992878805539295, 'samples': 1342944, 'steps': 2622, 'loss/train': 1.4543570280075073} -09/20/2021 23:34:41 - INFO - __main__ - Step 41968: {'lr': 0.0001992878805539295, 'samples': 1342976, 'steps': 2622, 'loss/train': 1.9285712242126465} -09/20/2021 23:34:43 - INFO - __main__ - Step 41969: {'lr': 0.00019928712044482464, 'samples': 1343008, 'steps': 2623, 'loss/train': 2.6946728229522705} -09/20/2021 23:34:43 - INFO - __main__ - Step 41970: {'lr': 0.00019928712044482464, 'samples': 1343040, 'steps': 2623, 'loss/train': 1.1184288263320923} -09/20/2021 23:34:44 - INFO - __main__ - Step 41971: {'lr': 0.00019928712044482464, 'samples': 1343072, 'steps': 2623, 'loss/train': 2.265275478363037} -09/20/2021 23:34:45 - INFO - __main__ - Step 41972: {'lr': 0.00019928712044482464, 'samples': 1343104, 'steps': 2623, 'loss/train': 0.5974849462509155} -09/20/2021 23:34:46 - INFO - __main__ - Step 41973: {'lr': 0.00019928712044482464, 'samples': 1343136, 'steps': 2623, 'loss/train': 1.8546746969223022} -09/20/2021 23:34:46 - INFO - __main__ - Step 41974: {'lr': 0.00019928712044482464, 'samples': 1343168, 'steps': 2623, 'loss/train': 2.364967107772827} -09/20/2021 23:34:47 - INFO - __main__ - Step 41975: {'lr': 0.00019928712044482464, 'samples': 1343200, 'steps': 2623, 'loss/train': 2.416442394256592} -09/20/2021 23:34:48 - INFO - __main__ - Step 41976: {'lr': 0.00019928712044482464, 'samples': 1343232, 'steps': 2623, 'loss/train': 1.4150060415267944} -09/20/2021 23:34:49 - INFO - __main__ - Step 41977: {'lr': 0.00019928712044482464, 'samples': 1343264, 'steps': 2623, 'loss/train': 0.33209648728370667} -09/20/2021 23:34:49 - INFO - __main__ - Step 41978: {'lr': 0.00019928712044482464, 'samples': 1343296, 'steps': 2623, 'loss/train': 0.1536608189344406} -09/20/2021 23:34:50 - INFO - __main__ - Step 41979: {'lr': 0.00019928712044482464, 'samples': 1343328, 'steps': 2623, 'loss/train': 0.10187339782714844} -09/20/2021 23:34:51 - INFO - __main__ - Step 41980: {'lr': 0.00019928712044482464, 'samples': 1343360, 'steps': 2623, 'loss/train': 2.6889231204986572} -09/20/2021 23:34:52 - INFO - __main__ - Step 41981: {'lr': 0.00019928712044482464, 'samples': 1343392, 'steps': 2623, 'loss/train': 1.5968509912490845} -09/20/2021 23:34:52 - INFO - __main__ - Step 41982: {'lr': 0.00019928712044482464, 'samples': 1343424, 'steps': 2623, 'loss/train': 1.7779446840286255} -09/20/2021 23:34:53 - INFO - __main__ - Step 41983: {'lr': 0.00019928712044482464, 'samples': 1343456, 'steps': 2623, 'loss/train': 1.3674954175949097} -09/20/2021 23:34:54 - INFO - __main__ - Step 41984: {'lr': 0.00019928712044482464, 'samples': 1343488, 'steps': 2623, 'loss/train': 1.915765643119812} -09/20/2021 23:34:55 - INFO - __main__ - Step 41985: {'lr': 0.00019928635993172092, 'samples': 1343520, 'steps': 2624, 'loss/train': 1.8735461235046387} -09/20/2021 23:34:55 - INFO - __main__ - Step 41986: {'lr': 0.00019928635993172092, 'samples': 1343552, 'steps': 2624, 'loss/train': 1.8954627513885498} -09/20/2021 23:34:56 - INFO - __main__ - Step 41987: {'lr': 0.00019928635993172092, 'samples': 1343584, 'steps': 2624, 'loss/train': 1.1833425760269165} -09/20/2021 23:34:57 - INFO - __main__ - Step 41988: {'lr': 0.00019928635993172092, 'samples': 1343616, 'steps': 2624, 'loss/train': 1.9049615859985352} -09/20/2021 23:34:58 - INFO - __main__ - Step 41989: {'lr': 0.00019928635993172092, 'samples': 1343648, 'steps': 2624, 'loss/train': 2.6931583881378174} -09/20/2021 23:34:58 - INFO - __main__ - Step 41990: {'lr': 0.00019928635993172092, 'samples': 1343680, 'steps': 2624, 'loss/train': 2.138338327407837} -09/20/2021 23:34:59 - INFO - __main__ - Step 41991: {'lr': 0.00019928635993172092, 'samples': 1343712, 'steps': 2624, 'loss/train': 3.3303415775299072} -09/20/2021 23:35:00 - INFO - __main__ - Step 41992: {'lr': 0.00019928635993172092, 'samples': 1343744, 'steps': 2624, 'loss/train': 2.50238299369812} -09/20/2021 23:35:01 - INFO - __main__ - Step 41993: {'lr': 0.00019928635993172092, 'samples': 1343776, 'steps': 2624, 'loss/train': 1.761338710784912} -09/20/2021 23:35:01 - INFO - __main__ - Step 41994: {'lr': 0.00019928635993172092, 'samples': 1343808, 'steps': 2624, 'loss/train': 2.3607287406921387} -09/20/2021 23:35:02 - INFO - __main__ - Step 41995: {'lr': 0.00019928635993172092, 'samples': 1343840, 'steps': 2624, 'loss/train': 1.4266858100891113} -09/20/2021 23:35:03 - INFO - __main__ - Step 41996: {'lr': 0.00019928635993172092, 'samples': 1343872, 'steps': 2624, 'loss/train': 2.639655113220215} -09/20/2021 23:35:04 - INFO - __main__ - Step 41997: {'lr': 0.00019928635993172092, 'samples': 1343904, 'steps': 2624, 'loss/train': 1.6894489526748657} -09/20/2021 23:35:04 - INFO - __main__ - Step 41998: {'lr': 0.00019928635993172092, 'samples': 1343936, 'steps': 2624, 'loss/train': 1.6621638536453247} -09/20/2021 23:35:05 - INFO - __main__ - Step 41999: {'lr': 0.00019928635993172092, 'samples': 1343968, 'steps': 2624, 'loss/train': 1.6182652711868286} -09/20/2021 23:35:06 - INFO - __main__ - Step 42000: {'lr': 0.00019928635993172092, 'samples': 1344000, 'steps': 2624, 'loss/train': 1.5764527320861816} -09/20/2021 23:35:07 - INFO - __main__ - Step 42001: {'lr': 0.00019928559901462133, 'samples': 1344032, 'steps': 2625, 'loss/train': 1.9113714694976807} -09/20/2021 23:35:08 - INFO - __main__ - Step 42002: {'lr': 0.00019928559901462133, 'samples': 1344064, 'steps': 2625, 'loss/train': 2.8127198219299316} -09/20/2021 23:35:09 - INFO - __main__ - Step 42003: {'lr': 0.00019928559901462133, 'samples': 1344096, 'steps': 2625, 'loss/train': 1.8859400749206543} -09/20/2021 23:35:10 - INFO - __main__ - Step 42004: {'lr': 0.00019928559901462133, 'samples': 1344128, 'steps': 2625, 'loss/train': 2.2658979892730713} -09/20/2021 23:35:10 - INFO - __main__ - Step 42005: {'lr': 0.00019928559901462133, 'samples': 1344160, 'steps': 2625, 'loss/train': 2.755873441696167} -09/20/2021 23:35:11 - INFO - __main__ - Step 42006: {'lr': 0.00019928559901462133, 'samples': 1344192, 'steps': 2625, 'loss/train': 1.417243242263794} -09/20/2021 23:35:12 - INFO - __main__ - Step 42007: {'lr': 0.00019928559901462133, 'samples': 1344224, 'steps': 2625, 'loss/train': 1.9793373346328735} -09/20/2021 23:35:13 - INFO - __main__ - Step 42008: {'lr': 0.00019928559901462133, 'samples': 1344256, 'steps': 2625, 'loss/train': 1.5542467832565308} -09/20/2021 23:35:13 - INFO - __main__ - Step 42009: {'lr': 0.00019928559901462133, 'samples': 1344288, 'steps': 2625, 'loss/train': 2.111116647720337} -09/20/2021 23:35:14 - INFO - __main__ - Step 42010: {'lr': 0.00019928559901462133, 'samples': 1344320, 'steps': 2625, 'loss/train': 2.1165404319763184} -09/20/2021 23:35:15 - INFO - __main__ - Step 42011: {'lr': 0.00019928559901462133, 'samples': 1344352, 'steps': 2625, 'loss/train': 1.8202648162841797} -09/20/2021 23:35:16 - INFO - __main__ - Step 42012: {'lr': 0.00019928559901462133, 'samples': 1344384, 'steps': 2625, 'loss/train': 2.912297248840332} -09/20/2021 23:35:16 - INFO - __main__ - Step 42013: {'lr': 0.00019928559901462133, 'samples': 1344416, 'steps': 2625, 'loss/train': 2.3067092895507812} -09/20/2021 23:35:17 - INFO - __main__ - Step 42014: {'lr': 0.00019928559901462133, 'samples': 1344448, 'steps': 2625, 'loss/train': 2.0392680168151855} -09/20/2021 23:35:18 - INFO - __main__ - Step 42015: {'lr': 0.00019928559901462133, 'samples': 1344480, 'steps': 2625, 'loss/train': 2.423050880432129} -09/20/2021 23:35:19 - INFO - __main__ - Step 42016: {'lr': 0.00019928559901462133, 'samples': 1344512, 'steps': 2625, 'loss/train': 2.824878215789795} -09/20/2021 23:35:19 - INFO - __main__ - Step 42017: {'lr': 0.00019928483769352903, 'samples': 1344544, 'steps': 2626, 'loss/train': 1.5163965225219727} -09/20/2021 23:35:20 - INFO - __main__ - Step 42018: {'lr': 0.00019928483769352903, 'samples': 1344576, 'steps': 2626, 'loss/train': 1.9092326164245605} -09/20/2021 23:35:21 - INFO - __main__ - Step 42019: {'lr': 0.00019928483769352903, 'samples': 1344608, 'steps': 2626, 'loss/train': 2.154783010482788} -09/20/2021 23:35:22 - INFO - __main__ - Step 42020: {'lr': 0.00019928483769352903, 'samples': 1344640, 'steps': 2626, 'loss/train': 1.5646089315414429} -09/20/2021 23:35:22 - INFO - __main__ - Step 42021: {'lr': 0.00019928483769352903, 'samples': 1344672, 'steps': 2626, 'loss/train': 1.9048079252243042} -09/20/2021 23:35:23 - INFO - __main__ - Step 42022: {'lr': 0.00019928483769352903, 'samples': 1344704, 'steps': 2626, 'loss/train': 2.3837926387786865} -09/20/2021 23:35:24 - INFO - __main__ - Step 42023: {'lr': 0.00019928483769352903, 'samples': 1344736, 'steps': 2626, 'loss/train': 3.6057116985321045} -09/20/2021 23:35:25 - INFO - __main__ - Step 42024: {'lr': 0.00019928483769352903, 'samples': 1344768, 'steps': 2626, 'loss/train': 2.0305662155151367} -09/20/2021 23:35:25 - INFO - __main__ - Step 42025: {'lr': 0.00019928483769352903, 'samples': 1344800, 'steps': 2626, 'loss/train': 1.9272191524505615} -09/20/2021 23:35:26 - INFO - __main__ - Step 42026: {'lr': 0.00019928483769352903, 'samples': 1344832, 'steps': 2626, 'loss/train': 1.7945011854171753} -09/20/2021 23:35:27 - INFO - __main__ - Step 42027: {'lr': 0.00019928483769352903, 'samples': 1344864, 'steps': 2626, 'loss/train': 2.6853315830230713} -09/20/2021 23:35:28 - INFO - __main__ - Step 42028: {'lr': 0.00019928483769352903, 'samples': 1344896, 'steps': 2626, 'loss/train': 0.5709139108657837} -09/20/2021 23:35:28 - INFO - __main__ - Step 42029: {'lr': 0.00019928483769352903, 'samples': 1344928, 'steps': 2626, 'loss/train': 0.809951901435852} -09/20/2021 23:35:29 - INFO - __main__ - Step 42030: {'lr': 0.00019928483769352903, 'samples': 1344960, 'steps': 2626, 'loss/train': 1.8598994016647339} -09/20/2021 23:35:31 - INFO - __main__ - Step 42031: {'lr': 0.00019928483769352903, 'samples': 1344992, 'steps': 2626, 'loss/train': 2.7719943523406982} -09/20/2021 23:35:31 - INFO - __main__ - Step 42032: {'lr': 0.00019928483769352903, 'samples': 1345024, 'steps': 2626, 'loss/train': 2.08520770072937} -09/20/2021 23:35:32 - INFO - __main__ - Step 42033: {'lr': 0.00019928407596844712, 'samples': 1345056, 'steps': 2627, 'loss/train': 2.2549991607666016} -09/20/2021 23:35:33 - INFO - __main__ - Step 42034: {'lr': 0.00019928407596844712, 'samples': 1345088, 'steps': 2627, 'loss/train': 2.026397228240967} -09/20/2021 23:35:34 - INFO - __main__ - Step 42035: {'lr': 0.00019928407596844712, 'samples': 1345120, 'steps': 2627, 'loss/train': 2.277787685394287} -09/20/2021 23:35:34 - INFO - __main__ - Step 42036: {'lr': 0.00019928407596844712, 'samples': 1345152, 'steps': 2627, 'loss/train': 2.275465250015259} -09/20/2021 23:35:35 - INFO - __main__ - Step 42037: {'lr': 0.00019928407596844712, 'samples': 1345184, 'steps': 2627, 'loss/train': 2.4507224559783936} -09/20/2021 23:35:36 - INFO - __main__ - Step 42038: {'lr': 0.00019928407596844712, 'samples': 1345216, 'steps': 2627, 'loss/train': 0.6600793600082397} -09/20/2021 23:35:37 - INFO - __main__ - Step 42039: {'lr': 0.00019928407596844712, 'samples': 1345248, 'steps': 2627, 'loss/train': 0.47350797057151794} -09/20/2021 23:35:37 - INFO - __main__ - Step 42040: {'lr': 0.00019928407596844712, 'samples': 1345280, 'steps': 2627, 'loss/train': 2.1834418773651123} -09/20/2021 23:35:38 - INFO - __main__ - Step 42041: {'lr': 0.00019928407596844712, 'samples': 1345312, 'steps': 2627, 'loss/train': 2.0802524089813232} -09/20/2021 23:35:39 - INFO - __main__ - Step 42042: {'lr': 0.00019928407596844712, 'samples': 1345344, 'steps': 2627, 'loss/train': 2.3891830444335938} -09/20/2021 23:35:40 - INFO - __main__ - Step 42043: {'lr': 0.00019928407596844712, 'samples': 1345376, 'steps': 2627, 'loss/train': 2.452880620956421} -09/20/2021 23:35:40 - INFO - __main__ - Step 42044: {'lr': 0.00019928407596844712, 'samples': 1345408, 'steps': 2627, 'loss/train': 0.21882955729961395} -09/20/2021 23:35:41 - INFO - __main__ - Step 42045: {'lr': 0.00019928407596844712, 'samples': 1345440, 'steps': 2627, 'loss/train': 0.1600208729505539} -09/20/2021 23:35:42 - INFO - __main__ - Step 42046: {'lr': 0.00019928407596844712, 'samples': 1345472, 'steps': 2627, 'loss/train': 2.8055903911590576} -09/20/2021 23:35:43 - INFO - __main__ - Step 42047: {'lr': 0.00019928407596844712, 'samples': 1345504, 'steps': 2627, 'loss/train': 1.1270335912704468} -09/20/2021 23:35:43 - INFO - __main__ - Step 42048: {'lr': 0.00019928407596844712, 'samples': 1345536, 'steps': 2627, 'loss/train': 3.2733495235443115} -09/20/2021 23:35:44 - INFO - __main__ - Step 42049: {'lr': 0.0001992833138393787, 'samples': 1345568, 'steps': 2628, 'loss/train': 1.6397793292999268} -09/20/2021 23:35:45 - INFO - __main__ - Step 42050: {'lr': 0.0001992833138393787, 'samples': 1345600, 'steps': 2628, 'loss/train': 2.5509939193725586} -09/20/2021 23:35:46 - INFO - __main__ - Step 42051: {'lr': 0.0001992833138393787, 'samples': 1345632, 'steps': 2628, 'loss/train': 2.232973337173462} -09/20/2021 23:35:47 - INFO - __main__ - Step 42052: {'lr': 0.0001992833138393787, 'samples': 1345664, 'steps': 2628, 'loss/train': 2.0354552268981934} -09/20/2021 23:35:47 - INFO - __main__ - Step 42053: {'lr': 0.0001992833138393787, 'samples': 1345696, 'steps': 2628, 'loss/train': 2.7273664474487305} -09/20/2021 23:35:48 - INFO - __main__ - Step 42054: {'lr': 0.0001992833138393787, 'samples': 1345728, 'steps': 2628, 'loss/train': 1.723237156867981} -09/20/2021 23:35:49 - INFO - __main__ - Step 42055: {'lr': 0.0001992833138393787, 'samples': 1345760, 'steps': 2628, 'loss/train': 2.550715684890747} -09/20/2021 23:35:50 - INFO - __main__ - Step 42056: {'lr': 0.0001992833138393787, 'samples': 1345792, 'steps': 2628, 'loss/train': 2.4482247829437256} -09/20/2021 23:35:50 - INFO - __main__ - Step 42057: {'lr': 0.0001992833138393787, 'samples': 1345824, 'steps': 2628, 'loss/train': 2.0928168296813965} -09/20/2021 23:35:51 - INFO - __main__ - Step 42058: {'lr': 0.0001992833138393787, 'samples': 1345856, 'steps': 2628, 'loss/train': 2.4077115058898926} -09/20/2021 23:35:52 - INFO - __main__ - Step 42059: {'lr': 0.0001992833138393787, 'samples': 1345888, 'steps': 2628, 'loss/train': 1.72187340259552} -09/20/2021 23:35:53 - INFO - __main__ - Step 42060: {'lr': 0.0001992833138393787, 'samples': 1345920, 'steps': 2628, 'loss/train': 2.810131788253784} -09/20/2021 23:35:54 - INFO - __main__ - Step 42061: {'lr': 0.0001992833138393787, 'samples': 1345952, 'steps': 2628, 'loss/train': 2.169234037399292} -09/20/2021 23:35:55 - INFO - __main__ - Step 42062: {'lr': 0.0001992833138393787, 'samples': 1345984, 'steps': 2628, 'loss/train': 2.0115158557891846} -09/20/2021 23:35:56 - INFO - __main__ - Step 42063: {'lr': 0.0001992833138393787, 'samples': 1346016, 'steps': 2628, 'loss/train': 2.037477970123291} -09/20/2021 23:35:57 - INFO - __main__ - Step 42064: {'lr': 0.0001992833138393787, 'samples': 1346048, 'steps': 2628, 'loss/train': 1.8919909000396729} -09/20/2021 23:35:57 - INFO - __main__ - Step 42065: {'lr': 0.00019928255130632685, 'samples': 1346080, 'steps': 2629, 'loss/train': 2.873054265975952} -09/20/2021 23:35:58 - INFO - __main__ - Step 42066: {'lr': 0.00019928255130632685, 'samples': 1346112, 'steps': 2629, 'loss/train': 2.041731119155884} -09/20/2021 23:35:59 - INFO - __main__ - Step 42067: {'lr': 0.00019928255130632685, 'samples': 1346144, 'steps': 2629, 'loss/train': 1.4259556531906128} -09/20/2021 23:36:00 - INFO - __main__ - Step 42068: {'lr': 0.00019928255130632685, 'samples': 1346176, 'steps': 2629, 'loss/train': 2.0797295570373535} -09/20/2021 23:36:00 - INFO - __main__ - Step 42069: {'lr': 0.00019928255130632685, 'samples': 1346208, 'steps': 2629, 'loss/train': 1.9079042673110962} -09/20/2021 23:36:01 - INFO - __main__ - Step 42070: {'lr': 0.00019928255130632685, 'samples': 1346240, 'steps': 2629, 'loss/train': 2.6468334197998047} -09/20/2021 23:36:02 - INFO - __main__ - Step 42071: {'lr': 0.00019928255130632685, 'samples': 1346272, 'steps': 2629, 'loss/train': 2.022934913635254} -09/20/2021 23:36:03 - INFO - __main__ - Step 42072: {'lr': 0.00019928255130632685, 'samples': 1346304, 'steps': 2629, 'loss/train': 1.8395427465438843} -09/20/2021 23:36:03 - INFO - __main__ - Step 42073: {'lr': 0.00019928255130632685, 'samples': 1346336, 'steps': 2629, 'loss/train': 2.3936049938201904} -09/20/2021 23:36:04 - INFO - __main__ - Step 42074: {'lr': 0.00019928255130632685, 'samples': 1346368, 'steps': 2629, 'loss/train': 0.2778661251068115} -09/20/2021 23:36:05 - INFO - __main__ - Step 42075: {'lr': 0.00019928255130632685, 'samples': 1346400, 'steps': 2629, 'loss/train': 0.3646582067012787} -09/20/2021 23:36:06 - INFO - __main__ - Step 42076: {'lr': 0.00019928255130632685, 'samples': 1346432, 'steps': 2629, 'loss/train': 0.2046055644750595} -09/20/2021 23:36:06 - INFO - __main__ - Step 42077: {'lr': 0.00019928255130632685, 'samples': 1346464, 'steps': 2629, 'loss/train': 0.10019674152135849} -09/20/2021 23:36:07 - INFO - __main__ - Step 42078: {'lr': 0.00019928255130632685, 'samples': 1346496, 'steps': 2629, 'loss/train': 0.18750248849391937} -09/20/2021 23:36:08 - INFO - __main__ - Step 42079: {'lr': 0.00019928255130632685, 'samples': 1346528, 'steps': 2629, 'loss/train': 0.1906505674123764} -09/20/2021 23:36:09 - INFO - __main__ - Step 42080: {'lr': 0.00019928255130632685, 'samples': 1346560, 'steps': 2629, 'loss/train': 2.069162368774414} -09/20/2021 23:36:10 - INFO - __main__ - Step 42081: {'lr': 0.0001992817883692947, 'samples': 1346592, 'steps': 2630, 'loss/train': 1.8222713470458984} -09/20/2021 23:36:10 - INFO - __main__ - Step 42082: {'lr': 0.0001992817883692947, 'samples': 1346624, 'steps': 2630, 'loss/train': 2.321451425552368} -09/20/2021 23:36:11 - INFO - __main__ - Step 42083: {'lr': 0.0001992817883692947, 'samples': 1346656, 'steps': 2630, 'loss/train': 2.5471231937408447} -09/20/2021 23:36:12 - INFO - __main__ - Step 42084: {'lr': 0.0001992817883692947, 'samples': 1346688, 'steps': 2630, 'loss/train': 1.13078773021698} -09/20/2021 23:36:13 - INFO - __main__ - Step 42085: {'lr': 0.0001992817883692947, 'samples': 1346720, 'steps': 2630, 'loss/train': 2.0477535724639893} -09/20/2021 23:36:13 - INFO - __main__ - Step 42086: {'lr': 0.0001992817883692947, 'samples': 1346752, 'steps': 2630, 'loss/train': 2.2912275791168213} -09/20/2021 23:36:14 - INFO - __main__ - Step 42087: {'lr': 0.0001992817883692947, 'samples': 1346784, 'steps': 2630, 'loss/train': 1.341356873512268} -09/20/2021 23:36:15 - INFO - __main__ - Step 42088: {'lr': 0.0001992817883692947, 'samples': 1346816, 'steps': 2630, 'loss/train': 1.8003836870193481} -09/20/2021 23:36:16 - INFO - __main__ - Step 42089: {'lr': 0.0001992817883692947, 'samples': 1346848, 'steps': 2630, 'loss/train': 1.681341528892517} -09/20/2021 23:36:16 - INFO - __main__ - Step 42090: {'lr': 0.0001992817883692947, 'samples': 1346880, 'steps': 2630, 'loss/train': 1.1231729984283447} -09/20/2021 23:36:18 - INFO - __main__ - Step 42091: {'lr': 0.0001992817883692947, 'samples': 1346912, 'steps': 2630, 'loss/train': 0.9290255904197693} -09/20/2021 23:36:18 - INFO - __main__ - Step 42092: {'lr': 0.0001992817883692947, 'samples': 1346944, 'steps': 2630, 'loss/train': 1.0747441053390503} -09/20/2021 23:36:19 - INFO - __main__ - Step 42093: {'lr': 0.0001992817883692947, 'samples': 1346976, 'steps': 2630, 'loss/train': 2.7005350589752197} -09/20/2021 23:36:20 - INFO - __main__ - Step 42094: {'lr': 0.0001992817883692947, 'samples': 1347008, 'steps': 2630, 'loss/train': 2.3095767498016357} -09/20/2021 23:36:21 - INFO - __main__ - Step 42095: {'lr': 0.0001992817883692947, 'samples': 1347040, 'steps': 2630, 'loss/train': 1.712424397468567} -09/20/2021 23:36:21 - INFO - __main__ - Step 42096: {'lr': 0.0001992817883692947, 'samples': 1347072, 'steps': 2630, 'loss/train': 2.821004867553711} -09/20/2021 23:36:22 - INFO - __main__ - Step 42097: {'lr': 0.00019928102502828532, 'samples': 1347104, 'steps': 2631, 'loss/train': 2.654707431793213} -09/20/2021 23:36:23 - INFO - __main__ - Step 42098: {'lr': 0.00019928102502828532, 'samples': 1347136, 'steps': 2631, 'loss/train': 2.0556423664093018} -09/20/2021 23:36:24 - INFO - __main__ - Step 42099: {'lr': 0.00019928102502828532, 'samples': 1347168, 'steps': 2631, 'loss/train': 2.4323344230651855} -09/20/2021 23:36:25 - INFO - __main__ - Step 42100: {'lr': 0.00019928102502828532, 'samples': 1347200, 'steps': 2631, 'loss/train': 2.3826985359191895} -09/20/2021 23:36:25 - INFO - __main__ - Step 42101: {'lr': 0.00019928102502828532, 'samples': 1347232, 'steps': 2631, 'loss/train': 2.4325456619262695} -09/20/2021 23:36:26 - INFO - __main__ - Step 42102: {'lr': 0.00019928102502828532, 'samples': 1347264, 'steps': 2631, 'loss/train': 1.5678077936172485} -09/20/2021 23:36:27 - INFO - __main__ - Step 42103: {'lr': 0.00019928102502828532, 'samples': 1347296, 'steps': 2631, 'loss/train': 1.8246045112609863} -09/20/2021 23:36:28 - INFO - __main__ - Step 42104: {'lr': 0.00019928102502828532, 'samples': 1347328, 'steps': 2631, 'loss/train': 1.7000852823257446} -09/20/2021 23:36:28 - INFO - __main__ - Step 42105: {'lr': 0.00019928102502828532, 'samples': 1347360, 'steps': 2631, 'loss/train': 2.261047601699829} -09/20/2021 23:36:29 - INFO - __main__ - Step 42106: {'lr': 0.00019928102502828532, 'samples': 1347392, 'steps': 2631, 'loss/train': 1.9833312034606934} -09/20/2021 23:36:30 - INFO - __main__ - Step 42107: {'lr': 0.00019928102502828532, 'samples': 1347424, 'steps': 2631, 'loss/train': 1.2798022031784058} -09/20/2021 23:36:31 - INFO - __main__ - Step 42108: {'lr': 0.00019928102502828532, 'samples': 1347456, 'steps': 2631, 'loss/train': 1.63743257522583} -09/20/2021 23:36:31 - INFO - __main__ - Step 42109: {'lr': 0.00019928102502828532, 'samples': 1347488, 'steps': 2631, 'loss/train': 1.9898899793624878} -09/20/2021 23:36:32 - INFO - __main__ - Step 42110: {'lr': 0.00019928102502828532, 'samples': 1347520, 'steps': 2631, 'loss/train': 3.1786298751831055} -09/20/2021 23:36:33 - INFO - __main__ - Step 42111: {'lr': 0.00019928102502828532, 'samples': 1347552, 'steps': 2631, 'loss/train': 2.4877543449401855} -09/20/2021 23:36:34 - INFO - __main__ - Step 42112: {'lr': 0.00019928102502828532, 'samples': 1347584, 'steps': 2631, 'loss/train': 3.1474921703338623} -09/20/2021 23:36:34 - INFO - __main__ - Step 42113: {'lr': 0.00019928026128330183, 'samples': 1347616, 'steps': 2632, 'loss/train': 2.125732898712158} -09/20/2021 23:36:35 - INFO - __main__ - Step 42114: {'lr': 0.00019928026128330183, 'samples': 1347648, 'steps': 2632, 'loss/train': 2.993229866027832} -09/20/2021 23:36:36 - INFO - __main__ - Step 42115: {'lr': 0.00019928026128330183, 'samples': 1347680, 'steps': 2632, 'loss/train': 2.1116573810577393} -09/20/2021 23:36:37 - INFO - __main__ - Step 42116: {'lr': 0.00019928026128330183, 'samples': 1347712, 'steps': 2632, 'loss/train': 1.3715704679489136} -09/20/2021 23:36:37 - INFO - __main__ - Step 42117: {'lr': 0.00019928026128330183, 'samples': 1347744, 'steps': 2632, 'loss/train': 1.9301573038101196} -09/20/2021 23:36:38 - INFO - __main__ - Step 42118: {'lr': 0.00019928026128330183, 'samples': 1347776, 'steps': 2632, 'loss/train': 1.9477829933166504} -09/20/2021 23:36:39 - INFO - __main__ - Step 42119: {'lr': 0.00019928026128330183, 'samples': 1347808, 'steps': 2632, 'loss/train': 1.8618727922439575} -09/20/2021 23:36:40 - INFO - __main__ - Step 42120: {'lr': 0.00019928026128330183, 'samples': 1347840, 'steps': 2632, 'loss/train': 2.0599348545074463} -09/20/2021 23:36:40 - INFO - __main__ - Step 42121: {'lr': 0.00019928026128330183, 'samples': 1347872, 'steps': 2632, 'loss/train': 1.9263713359832764} -09/20/2021 23:36:42 - INFO - __main__ - Step 42122: {'lr': 0.00019928026128330183, 'samples': 1347904, 'steps': 2632, 'loss/train': 2.599391460418701} -09/20/2021 23:36:42 - INFO - __main__ - Step 42123: {'lr': 0.00019928026128330183, 'samples': 1347936, 'steps': 2632, 'loss/train': 2.1578757762908936} -09/20/2021 23:36:43 - INFO - __main__ - Step 42124: {'lr': 0.00019928026128330183, 'samples': 1347968, 'steps': 2632, 'loss/train': 1.8029351234436035} -09/20/2021 23:36:44 - INFO - __main__ - Step 42125: {'lr': 0.00019928026128330183, 'samples': 1348000, 'steps': 2632, 'loss/train': 1.9637141227722168} -09/20/2021 23:36:45 - INFO - __main__ - Step 42126: {'lr': 0.00019928026128330183, 'samples': 1348032, 'steps': 2632, 'loss/train': 1.9240458011627197} -09/20/2021 23:36:45 - INFO - __main__ - Step 42127: {'lr': 0.00019928026128330183, 'samples': 1348064, 'steps': 2632, 'loss/train': 1.7129888534545898} -09/20/2021 23:36:46 - INFO - __main__ - Step 42128: {'lr': 0.00019928026128330183, 'samples': 1348096, 'steps': 2632, 'loss/train': 2.167707920074463} -09/20/2021 23:36:47 - INFO - __main__ - Step 42129: {'lr': 0.00019927949713434737, 'samples': 1348128, 'steps': 2633, 'loss/train': 2.408012866973877} -09/20/2021 23:36:48 - INFO - __main__ - Step 42130: {'lr': 0.00019927949713434737, 'samples': 1348160, 'steps': 2633, 'loss/train': 2.0699827671051025} -09/20/2021 23:36:49 - INFO - __main__ - Step 42131: {'lr': 0.00019927949713434737, 'samples': 1348192, 'steps': 2633, 'loss/train': 2.5036253929138184} -09/20/2021 23:36:49 - INFO - __main__ - Step 42132: {'lr': 0.00019927949713434737, 'samples': 1348224, 'steps': 2633, 'loss/train': 1.931381106376648} -09/20/2021 23:36:50 - INFO - __main__ - Step 42133: {'lr': 0.00019927949713434737, 'samples': 1348256, 'steps': 2633, 'loss/train': 1.553170919418335} -09/20/2021 23:36:51 - INFO - __main__ - Step 42134: {'lr': 0.00019927949713434737, 'samples': 1348288, 'steps': 2633, 'loss/train': 2.1051297187805176} -09/20/2021 23:36:52 - INFO - __main__ - Step 42135: {'lr': 0.00019927949713434737, 'samples': 1348320, 'steps': 2633, 'loss/train': 2.3559892177581787} -09/20/2021 23:36:52 - INFO - __main__ - Step 42136: {'lr': 0.00019927949713434737, 'samples': 1348352, 'steps': 2633, 'loss/train': 2.3270063400268555} -09/20/2021 23:36:53 - INFO - __main__ - Step 42137: {'lr': 0.00019927949713434737, 'samples': 1348384, 'steps': 2633, 'loss/train': 1.909307837486267} -09/20/2021 23:36:54 - INFO - __main__ - Step 42138: {'lr': 0.00019927949713434737, 'samples': 1348416, 'steps': 2633, 'loss/train': 2.4476048946380615} -09/20/2021 23:36:55 - INFO - __main__ - Step 42139: {'lr': 0.00019927949713434737, 'samples': 1348448, 'steps': 2633, 'loss/train': 2.551652431488037} -09/20/2021 23:36:55 - INFO - __main__ - Step 42140: {'lr': 0.00019927949713434737, 'samples': 1348480, 'steps': 2633, 'loss/train': 1.6122852563858032} -09/20/2021 23:36:56 - INFO - __main__ - Step 42141: {'lr': 0.00019927949713434737, 'samples': 1348512, 'steps': 2633, 'loss/train': 1.9857335090637207} -09/20/2021 23:36:57 - INFO - __main__ - Step 42142: {'lr': 0.00019927949713434737, 'samples': 1348544, 'steps': 2633, 'loss/train': 2.2685532569885254} -09/20/2021 23:36:58 - INFO - __main__ - Step 42143: {'lr': 0.00019927949713434737, 'samples': 1348576, 'steps': 2633, 'loss/train': 1.485710859298706} -09/20/2021 23:36:58 - INFO - __main__ - Step 42144: {'lr': 0.00019927949713434737, 'samples': 1348608, 'steps': 2633, 'loss/train': 1.594818115234375} -09/20/2021 23:36:59 - INFO - __main__ - Step 42145: {'lr': 0.00019927873258142496, 'samples': 1348640, 'steps': 2634, 'loss/train': 3.1094729900360107} -09/20/2021 23:37:00 - INFO - __main__ - Step 42146: {'lr': 0.00019927873258142496, 'samples': 1348672, 'steps': 2634, 'loss/train': 3.152517318725586} -09/20/2021 23:37:01 - INFO - __main__ - Step 42147: {'lr': 0.00019927873258142496, 'samples': 1348704, 'steps': 2634, 'loss/train': 2.539851188659668} -09/20/2021 23:37:01 - INFO - __main__ - Step 42148: {'lr': 0.00019927873258142496, 'samples': 1348736, 'steps': 2634, 'loss/train': 1.9156944751739502} -09/20/2021 23:37:02 - INFO - __main__ - Step 42149: {'lr': 0.00019927873258142496, 'samples': 1348768, 'steps': 2634, 'loss/train': 2.2100107669830322} -09/20/2021 23:37:03 - INFO - __main__ - Step 42150: {'lr': 0.00019927873258142496, 'samples': 1348800, 'steps': 2634, 'loss/train': 1.6923274993896484} -09/20/2021 23:37:04 - INFO - __main__ - Step 42151: {'lr': 0.00019927873258142496, 'samples': 1348832, 'steps': 2634, 'loss/train': 1.996397614479065} -09/20/2021 23:37:04 - INFO - __main__ - Step 42152: {'lr': 0.00019927873258142496, 'samples': 1348864, 'steps': 2634, 'loss/train': 1.319494366645813} -09/20/2021 23:37:06 - INFO - __main__ - Step 42153: {'lr': 0.00019927873258142496, 'samples': 1348896, 'steps': 2634, 'loss/train': 3.6258652210235596} -09/20/2021 23:37:07 - INFO - __main__ - Step 42154: {'lr': 0.00019927873258142496, 'samples': 1348928, 'steps': 2634, 'loss/train': 1.9838905334472656} -09/20/2021 23:37:08 - INFO - __main__ - Step 42155: {'lr': 0.00019927873258142496, 'samples': 1348960, 'steps': 2634, 'loss/train': 2.3805670738220215} -09/20/2021 23:37:08 - INFO - __main__ - Step 42156: {'lr': 0.00019927873258142496, 'samples': 1348992, 'steps': 2634, 'loss/train': 2.6555392742156982} -09/20/2021 23:37:09 - INFO - __main__ - Step 42157: {'lr': 0.00019927873258142496, 'samples': 1349024, 'steps': 2634, 'loss/train': 2.5856852531433105} -09/20/2021 23:37:10 - INFO - __main__ - Step 42158: {'lr': 0.00019927873258142496, 'samples': 1349056, 'steps': 2634, 'loss/train': 2.2543833255767822} -09/20/2021 23:37:11 - INFO - __main__ - Step 42159: {'lr': 0.00019927873258142496, 'samples': 1349088, 'steps': 2634, 'loss/train': 1.4687259197235107} -09/20/2021 23:37:11 - INFO - __main__ - Step 42160: {'lr': 0.00019927873258142496, 'samples': 1349120, 'steps': 2634, 'loss/train': 2.064457416534424} -09/20/2021 23:37:12 - INFO - __main__ - Step 42161: {'lr': 0.00019927796762453785, 'samples': 1349152, 'steps': 2635, 'loss/train': 1.9565589427947998} -09/20/2021 23:37:13 - INFO - __main__ - Step 42162: {'lr': 0.00019927796762453785, 'samples': 1349184, 'steps': 2635, 'loss/train': 1.2426594495773315} -09/20/2021 23:37:14 - INFO - __main__ - Step 42163: {'lr': 0.00019927796762453785, 'samples': 1349216, 'steps': 2635, 'loss/train': 1.7073043584823608} -09/20/2021 23:37:15 - INFO - __main__ - Step 42164: {'lr': 0.00019927796762453785, 'samples': 1349248, 'steps': 2635, 'loss/train': 2.4065113067626953} -09/20/2021 23:37:15 - INFO - __main__ - Step 42165: {'lr': 0.00019927796762453785, 'samples': 1349280, 'steps': 2635, 'loss/train': 2.280963659286499} -09/20/2021 23:37:16 - INFO - __main__ - Step 42166: {'lr': 0.00019927796762453785, 'samples': 1349312, 'steps': 2635, 'loss/train': 1.5327037572860718} -09/20/2021 23:37:17 - INFO - __main__ - Step 42167: {'lr': 0.00019927796762453785, 'samples': 1349344, 'steps': 2635, 'loss/train': 2.4067723751068115} -09/20/2021 23:37:18 - INFO - __main__ - Step 42168: {'lr': 0.00019927796762453785, 'samples': 1349376, 'steps': 2635, 'loss/train': 2.2065558433532715} -09/20/2021 23:37:18 - INFO - __main__ - Step 42169: {'lr': 0.00019927796762453785, 'samples': 1349408, 'steps': 2635, 'loss/train': 2.504560708999634} -09/20/2021 23:37:19 - INFO - __main__ - Step 42170: {'lr': 0.00019927796762453785, 'samples': 1349440, 'steps': 2635, 'loss/train': 1.712109088897705} -09/20/2021 23:37:20 - INFO - __main__ - Step 42171: {'lr': 0.00019927796762453785, 'samples': 1349472, 'steps': 2635, 'loss/train': 1.7681246995925903} -09/20/2021 23:37:21 - INFO - __main__ - Step 42172: {'lr': 0.00019927796762453785, 'samples': 1349504, 'steps': 2635, 'loss/train': 2.213008403778076} -09/20/2021 23:37:21 - INFO - __main__ - Step 42173: {'lr': 0.00019927796762453785, 'samples': 1349536, 'steps': 2635, 'loss/train': 2.043001651763916} -09/20/2021 23:37:22 - INFO - __main__ - Step 42174: {'lr': 0.00019927796762453785, 'samples': 1349568, 'steps': 2635, 'loss/train': 1.3154324293136597} -09/20/2021 23:37:23 - INFO - __main__ - Step 42175: {'lr': 0.00019927796762453785, 'samples': 1349600, 'steps': 2635, 'loss/train': 2.0130815505981445} -09/20/2021 23:37:24 - INFO - __main__ - Step 42176: {'lr': 0.00019927796762453785, 'samples': 1349632, 'steps': 2635, 'loss/train': 0.46839141845703125} -09/20/2021 23:37:25 - INFO - __main__ - Step 42177: {'lr': 0.00019927720226368904, 'samples': 1349664, 'steps': 2636, 'loss/train': 2.6573703289031982} -09/20/2021 23:37:25 - INFO - __main__ - Step 42178: {'lr': 0.00019927720226368904, 'samples': 1349696, 'steps': 2636, 'loss/train': 2.830190420150757} -09/20/2021 23:37:26 - INFO - __main__ - Step 42179: {'lr': 0.00019927720226368904, 'samples': 1349728, 'steps': 2636, 'loss/train': 1.5406103134155273} -09/20/2021 23:37:27 - INFO - __main__ - Step 42180: {'lr': 0.00019927720226368904, 'samples': 1349760, 'steps': 2636, 'loss/train': 2.2703940868377686} -09/20/2021 23:37:28 - INFO - __main__ - Step 42181: {'lr': 0.00019927720226368904, 'samples': 1349792, 'steps': 2636, 'loss/train': 2.2168121337890625} -09/20/2021 23:37:28 - INFO - __main__ - Step 42182: {'lr': 0.00019927720226368904, 'samples': 1349824, 'steps': 2636, 'loss/train': 1.7102986574172974} -09/20/2021 23:37:29 - INFO - __main__ - Step 42183: {'lr': 0.00019927720226368904, 'samples': 1349856, 'steps': 2636, 'loss/train': 0.3283449113368988} -09/20/2021 23:37:30 - INFO - __main__ - Step 42184: {'lr': 0.00019927720226368904, 'samples': 1349888, 'steps': 2636, 'loss/train': 1.0029631853103638} -09/20/2021 23:37:31 - INFO - __main__ - Step 42185: {'lr': 0.00019927720226368904, 'samples': 1349920, 'steps': 2636, 'loss/train': 2.366051197052002} -09/20/2021 23:37:32 - INFO - __main__ - Step 42186: {'lr': 0.00019927720226368904, 'samples': 1349952, 'steps': 2636, 'loss/train': 1.7324970960617065} -09/20/2021 23:37:33 - INFO - __main__ - Step 42187: {'lr': 0.00019927720226368904, 'samples': 1349984, 'steps': 2636, 'loss/train': 2.0161397457122803} -09/20/2021 23:37:33 - INFO - __main__ - Step 42188: {'lr': 0.00019927720226368904, 'samples': 1350016, 'steps': 2636, 'loss/train': 0.9674665331840515} -09/20/2021 23:37:34 - INFO - __main__ - Step 42189: {'lr': 0.00019927720226368904, 'samples': 1350048, 'steps': 2636, 'loss/train': 2.4543445110321045} -09/20/2021 23:37:35 - INFO - __main__ - Step 42190: {'lr': 0.00019927720226368904, 'samples': 1350080, 'steps': 2636, 'loss/train': 2.182119131088257} -09/20/2021 23:37:36 - INFO - __main__ - Step 42191: {'lr': 0.00019927720226368904, 'samples': 1350112, 'steps': 2636, 'loss/train': 4.206177711486816} -09/20/2021 23:37:36 - INFO - __main__ - Step 42192: {'lr': 0.00019927720226368904, 'samples': 1350144, 'steps': 2636, 'loss/train': 1.6030664443969727} -09/20/2021 23:37:37 - INFO - __main__ - Step 42193: {'lr': 0.00019927643649888168, 'samples': 1350176, 'steps': 2637, 'loss/train': 2.4064035415649414} -09/20/2021 23:37:38 - INFO - __main__ - Step 42194: {'lr': 0.00019927643649888168, 'samples': 1350208, 'steps': 2637, 'loss/train': 0.509461522102356} -09/20/2021 23:37:39 - INFO - __main__ - Step 42195: {'lr': 0.00019927643649888168, 'samples': 1350240, 'steps': 2637, 'loss/train': 2.252041816711426} -09/20/2021 23:37:39 - INFO - __main__ - Step 42196: {'lr': 0.00019927643649888168, 'samples': 1350272, 'steps': 2637, 'loss/train': 1.995411992073059} -09/20/2021 23:37:40 - INFO - __main__ - Step 42197: {'lr': 0.00019927643649888168, 'samples': 1350304, 'steps': 2637, 'loss/train': 2.310490846633911} -09/20/2021 23:37:41 - INFO - __main__ - Step 42198: {'lr': 0.00019927643649888168, 'samples': 1350336, 'steps': 2637, 'loss/train': 2.0828168392181396} -09/20/2021 23:37:42 - INFO - __main__ - Step 42199: {'lr': 0.00019927643649888168, 'samples': 1350368, 'steps': 2637, 'loss/train': 1.8428692817687988} -09/20/2021 23:37:42 - INFO - __main__ - Step 42200: {'lr': 0.00019927643649888168, 'samples': 1350400, 'steps': 2637, 'loss/train': 2.694902181625366} -09/20/2021 23:37:43 - INFO - __main__ - Step 42201: {'lr': 0.00019927643649888168, 'samples': 1350432, 'steps': 2637, 'loss/train': 1.7031431198120117} -09/20/2021 23:37:44 - INFO - __main__ - Step 42202: {'lr': 0.00019927643649888168, 'samples': 1350464, 'steps': 2637, 'loss/train': 1.598683476448059} -09/20/2021 23:37:45 - INFO - __main__ - Step 42203: {'lr': 0.00019927643649888168, 'samples': 1350496, 'steps': 2637, 'loss/train': 1.8308295011520386} -09/20/2021 23:37:45 - INFO - __main__ - Step 42204: {'lr': 0.00019927643649888168, 'samples': 1350528, 'steps': 2637, 'loss/train': 2.2028298377990723} -09/20/2021 23:37:46 - INFO - __main__ - Step 42205: {'lr': 0.00019927643649888168, 'samples': 1350560, 'steps': 2637, 'loss/train': 2.741243839263916} -09/20/2021 23:37:47 - INFO - __main__ - Step 42206: {'lr': 0.00019927643649888168, 'samples': 1350592, 'steps': 2637, 'loss/train': 1.7084381580352783} -09/20/2021 23:37:48 - INFO - __main__ - Step 42207: {'lr': 0.00019927643649888168, 'samples': 1350624, 'steps': 2637, 'loss/train': 2.143218755722046} -09/20/2021 23:37:48 - INFO - __main__ - Step 42208: {'lr': 0.00019927643649888168, 'samples': 1350656, 'steps': 2637, 'loss/train': 2.2925195693969727} -09/20/2021 23:37:49 - INFO - __main__ - Step 42209: {'lr': 0.0001992756703301189, 'samples': 1350688, 'steps': 2638, 'loss/train': 2.684145212173462} -09/20/2021 23:37:50 - INFO - __main__ - Step 42210: {'lr': 0.0001992756703301189, 'samples': 1350720, 'steps': 2638, 'loss/train': 2.4114999771118164} -09/20/2021 23:37:51 - INFO - __main__ - Step 42211: {'lr': 0.0001992756703301189, 'samples': 1350752, 'steps': 2638, 'loss/train': 1.8066967725753784} -09/20/2021 23:37:52 - INFO - __main__ - Step 42212: {'lr': 0.0001992756703301189, 'samples': 1350784, 'steps': 2638, 'loss/train': 1.7571324110031128} -09/20/2021 23:37:52 - INFO - __main__ - Step 42213: {'lr': 0.0001992756703301189, 'samples': 1350816, 'steps': 2638, 'loss/train': 2.605746030807495} -09/20/2021 23:37:54 - INFO - __main__ - Step 42214: {'lr': 0.0001992756703301189, 'samples': 1350848, 'steps': 2638, 'loss/train': 1.7566615343093872} -09/20/2021 23:37:54 - INFO - __main__ - Step 42215: {'lr': 0.0001992756703301189, 'samples': 1350880, 'steps': 2638, 'loss/train': 2.1286964416503906} -09/20/2021 23:37:55 - INFO - __main__ - Step 42216: {'lr': 0.0001992756703301189, 'samples': 1350912, 'steps': 2638, 'loss/train': 1.9320586919784546} -09/20/2021 23:37:56 - INFO - __main__ - Step 42217: {'lr': 0.0001992756703301189, 'samples': 1350944, 'steps': 2638, 'loss/train': 3.112952470779419} -09/20/2021 23:37:57 - INFO - __main__ - Step 42218: {'lr': 0.0001992756703301189, 'samples': 1350976, 'steps': 2638, 'loss/train': 1.755744457244873} -09/20/2021 23:37:57 - INFO - __main__ - Step 42219: {'lr': 0.0001992756703301189, 'samples': 1351008, 'steps': 2638, 'loss/train': 2.234219789505005} -09/20/2021 23:37:58 - INFO - __main__ - Step 42220: {'lr': 0.0001992756703301189, 'samples': 1351040, 'steps': 2638, 'loss/train': 1.534836769104004} -09/20/2021 23:37:59 - INFO - __main__ - Step 42221: {'lr': 0.0001992756703301189, 'samples': 1351072, 'steps': 2638, 'loss/train': 2.188871383666992} -09/20/2021 23:38:00 - INFO - __main__ - Step 42222: {'lr': 0.0001992756703301189, 'samples': 1351104, 'steps': 2638, 'loss/train': 2.678044080734253} -09/20/2021 23:38:00 - INFO - __main__ - Step 42223: {'lr': 0.0001992756703301189, 'samples': 1351136, 'steps': 2638, 'loss/train': 2.0481629371643066} -09/20/2021 23:38:01 - INFO - __main__ - Step 42224: {'lr': 0.0001992756703301189, 'samples': 1351168, 'steps': 2638, 'loss/train': 2.6692874431610107} -09/20/2021 23:38:02 - INFO - __main__ - Step 42225: {'lr': 0.00019927490375740376, 'samples': 1351200, 'steps': 2639, 'loss/train': 1.8796898126602173} -09/20/2021 23:38:03 - INFO - __main__ - Step 42226: {'lr': 0.00019927490375740376, 'samples': 1351232, 'steps': 2639, 'loss/train': 2.432417392730713} -09/20/2021 23:38:03 - INFO - __main__ - Step 42227: {'lr': 0.00019927490375740376, 'samples': 1351264, 'steps': 2639, 'loss/train': 2.3538999557495117} -09/20/2021 23:38:04 - INFO - __main__ - Step 42228: {'lr': 0.00019927490375740376, 'samples': 1351296, 'steps': 2639, 'loss/train': 1.95879328250885} -09/20/2021 23:38:05 - INFO - __main__ - Step 42229: {'lr': 0.00019927490375740376, 'samples': 1351328, 'steps': 2639, 'loss/train': 1.7946255207061768} -09/20/2021 23:38:06 - INFO - __main__ - Step 42230: {'lr': 0.00019927490375740376, 'samples': 1351360, 'steps': 2639, 'loss/train': 2.81699800491333} -09/20/2021 23:38:06 - INFO - __main__ - Step 42231: {'lr': 0.00019927490375740376, 'samples': 1351392, 'steps': 2639, 'loss/train': 2.198789596557617} -09/20/2021 23:38:07 - INFO - __main__ - Step 42232: {'lr': 0.00019927490375740376, 'samples': 1351424, 'steps': 2639, 'loss/train': 2.0624332427978516} -09/20/2021 23:38:08 - INFO - __main__ - Step 42233: {'lr': 0.00019927490375740376, 'samples': 1351456, 'steps': 2639, 'loss/train': 1.918738842010498} -09/20/2021 23:38:09 - INFO - __main__ - Step 42234: {'lr': 0.00019927490375740376, 'samples': 1351488, 'steps': 2639, 'loss/train': 1.1884177923202515} -09/20/2021 23:38:09 - INFO - __main__ - Step 42235: {'lr': 0.00019927490375740376, 'samples': 1351520, 'steps': 2639, 'loss/train': 2.825183391571045} -09/20/2021 23:38:10 - INFO - __main__ - Step 42236: {'lr': 0.00019927490375740376, 'samples': 1351552, 'steps': 2639, 'loss/train': 2.4512746334075928} -09/20/2021 23:38:11 - INFO - __main__ - Step 42237: {'lr': 0.00019927490375740376, 'samples': 1351584, 'steps': 2639, 'loss/train': 1.577353835105896} -09/20/2021 23:38:12 - INFO - __main__ - Step 42238: {'lr': 0.00019927490375740376, 'samples': 1351616, 'steps': 2639, 'loss/train': 2.063230276107788} -09/20/2021 23:38:12 - INFO - __main__ - Step 42239: {'lr': 0.00019927490375740376, 'samples': 1351648, 'steps': 2639, 'loss/train': 2.180903911590576} -09/20/2021 23:38:13 - INFO - __main__ - Step 42240: {'lr': 0.00019927490375740376, 'samples': 1351680, 'steps': 2639, 'loss/train': 1.6821638345718384} -09/20/2021 23:38:14 - INFO - __main__ - Step 42241: {'lr': 0.00019927413678073945, 'samples': 1351712, 'steps': 2640, 'loss/train': 1.7408024072647095} -09/20/2021 23:38:15 - INFO - __main__ - Step 42242: {'lr': 0.00019927413678073945, 'samples': 1351744, 'steps': 2640, 'loss/train': 2.0436501502990723} -09/20/2021 23:38:16 - INFO - __main__ - Step 42243: {'lr': 0.00019927413678073945, 'samples': 1351776, 'steps': 2640, 'loss/train': 1.548197865486145} -09/20/2021 23:38:16 - INFO - __main__ - Step 42244: {'lr': 0.00019927413678073945, 'samples': 1351808, 'steps': 2640, 'loss/train': 0.8207570910453796} -09/20/2021 23:38:18 - INFO - __main__ - Step 42245: {'lr': 0.00019927413678073945, 'samples': 1351840, 'steps': 2640, 'loss/train': 2.020846128463745} -09/20/2021 23:38:18 - INFO - __main__ - Step 42246: {'lr': 0.00019927413678073945, 'samples': 1351872, 'steps': 2640, 'loss/train': 2.4300050735473633} -09/20/2021 23:38:19 - INFO - __main__ - Step 42247: {'lr': 0.00019927413678073945, 'samples': 1351904, 'steps': 2640, 'loss/train': 1.8657039403915405} -09/20/2021 23:38:20 - INFO - __main__ - Step 42248: {'lr': 0.00019927413678073945, 'samples': 1351936, 'steps': 2640, 'loss/train': 1.7642686367034912} -09/20/2021 23:38:21 - INFO - __main__ - Step 42249: {'lr': 0.00019927413678073945, 'samples': 1351968, 'steps': 2640, 'loss/train': 2.2069358825683594} -09/20/2021 23:38:21 - INFO - __main__ - Step 42250: {'lr': 0.00019927413678073945, 'samples': 1352000, 'steps': 2640, 'loss/train': 2.3153293132781982} -09/20/2021 23:38:22 - INFO - __main__ - Step 42251: {'lr': 0.00019927413678073945, 'samples': 1352032, 'steps': 2640, 'loss/train': 1.9586504697799683} -09/20/2021 23:38:23 - INFO - __main__ - Step 42252: {'lr': 0.00019927413678073945, 'samples': 1352064, 'steps': 2640, 'loss/train': 2.0816614627838135} -09/20/2021 23:38:24 - INFO - __main__ - Step 42253: {'lr': 0.00019927413678073945, 'samples': 1352096, 'steps': 2640, 'loss/train': 0.7345438599586487} -09/20/2021 23:38:24 - INFO - __main__ - Step 42254: {'lr': 0.00019927413678073945, 'samples': 1352128, 'steps': 2640, 'loss/train': 3.219214916229248} -09/20/2021 23:38:25 - INFO - __main__ - Step 42255: {'lr': 0.00019927413678073945, 'samples': 1352160, 'steps': 2640, 'loss/train': 1.937219500541687} -09/20/2021 23:38:26 - INFO - __main__ - Step 42256: {'lr': 0.00019927413678073945, 'samples': 1352192, 'steps': 2640, 'loss/train': 2.3677990436553955} -09/20/2021 23:38:27 - INFO - __main__ - Step 42257: {'lr': 0.00019927336940012908, 'samples': 1352224, 'steps': 2641, 'loss/train': 1.541063904762268} -09/20/2021 23:38:28 - INFO - __main__ - Step 42258: {'lr': 0.00019927336940012908, 'samples': 1352256, 'steps': 2641, 'loss/train': 2.158245801925659} -09/20/2021 23:38:28 - INFO - __main__ - Step 42259: {'lr': 0.00019927336940012908, 'samples': 1352288, 'steps': 2641, 'loss/train': 2.1424405574798584} -09/20/2021 23:38:29 - INFO - __main__ - Step 42260: {'lr': 0.00019927336940012908, 'samples': 1352320, 'steps': 2641, 'loss/train': 2.1001009941101074} -09/20/2021 23:38:30 - INFO - __main__ - Step 42261: {'lr': 0.00019927336940012908, 'samples': 1352352, 'steps': 2641, 'loss/train': 1.7176450490951538} -09/20/2021 23:38:31 - INFO - __main__ - Step 42262: {'lr': 0.00019927336940012908, 'samples': 1352384, 'steps': 2641, 'loss/train': 2.3056259155273438} -09/20/2021 23:38:31 - INFO - __main__ - Step 42263: {'lr': 0.00019927336940012908, 'samples': 1352416, 'steps': 2641, 'loss/train': 1.5199265480041504} -09/20/2021 23:38:32 - INFO - __main__ - Step 42264: {'lr': 0.00019927336940012908, 'samples': 1352448, 'steps': 2641, 'loss/train': 2.5029544830322266} -09/20/2021 23:38:33 - INFO - __main__ - Step 42265: {'lr': 0.00019927336940012908, 'samples': 1352480, 'steps': 2641, 'loss/train': 0.2578110694885254} -09/20/2021 23:38:34 - INFO - __main__ - Step 42266: {'lr': 0.00019927336940012908, 'samples': 1352512, 'steps': 2641, 'loss/train': 0.9968517422676086} -09/20/2021 23:38:34 - INFO - __main__ - Step 42267: {'lr': 0.00019927336940012908, 'samples': 1352544, 'steps': 2641, 'loss/train': 1.7241065502166748} -09/20/2021 23:38:35 - INFO - __main__ - Step 42268: {'lr': 0.00019927336940012908, 'samples': 1352576, 'steps': 2641, 'loss/train': 2.3658080101013184} -09/20/2021 23:38:36 - INFO - __main__ - Step 42269: {'lr': 0.00019927336940012908, 'samples': 1352608, 'steps': 2641, 'loss/train': 2.2786176204681396} -09/20/2021 23:38:37 - INFO - __main__ - Step 42270: {'lr': 0.00019927336940012908, 'samples': 1352640, 'steps': 2641, 'loss/train': 2.6888694763183594} -09/20/2021 23:38:37 - INFO - __main__ - Step 42271: {'lr': 0.00019927336940012908, 'samples': 1352672, 'steps': 2641, 'loss/train': 2.0270285606384277} -09/20/2021 23:38:38 - INFO - __main__ - Step 42272: {'lr': 0.00019927336940012908, 'samples': 1352704, 'steps': 2641, 'loss/train': 2.7083375453948975} -09/20/2021 23:38:39 - INFO - __main__ - Step 42273: {'lr': 0.00019927260161557576, 'samples': 1352736, 'steps': 2642, 'loss/train': 3.237485885620117} -09/20/2021 23:38:40 - INFO - __main__ - Step 42274: {'lr': 0.00019927260161557576, 'samples': 1352768, 'steps': 2642, 'loss/train': 2.7391605377197266} -09/20/2021 23:38:40 - INFO - __main__ - Step 42275: {'lr': 0.00019927260161557576, 'samples': 1352800, 'steps': 2642, 'loss/train': 2.3352441787719727} -09/20/2021 23:38:42 - INFO - __main__ - Step 42276: {'lr': 0.00019927260161557576, 'samples': 1352832, 'steps': 2642, 'loss/train': 2.3261144161224365} -09/20/2021 23:38:43 - INFO - __main__ - Step 42277: {'lr': 0.00019927260161557576, 'samples': 1352864, 'steps': 2642, 'loss/train': 1.2850239276885986} -09/20/2021 23:38:43 - INFO - __main__ - Step 42278: {'lr': 0.00019927260161557576, 'samples': 1352896, 'steps': 2642, 'loss/train': 1.5928726196289062} -09/20/2021 23:38:44 - INFO - __main__ - Step 42279: {'lr': 0.00019927260161557576, 'samples': 1352928, 'steps': 2642, 'loss/train': 2.2245442867279053} -09/20/2021 23:38:45 - INFO - __main__ - Step 42280: {'lr': 0.00019927260161557576, 'samples': 1352960, 'steps': 2642, 'loss/train': 1.6355681419372559} -09/20/2021 23:38:46 - INFO - __main__ - Step 42281: {'lr': 0.00019927260161557576, 'samples': 1352992, 'steps': 2642, 'loss/train': 2.030454397201538} -09/20/2021 23:38:46 - INFO - __main__ - Step 42282: {'lr': 0.00019927260161557576, 'samples': 1353024, 'steps': 2642, 'loss/train': 2.1391656398773193} -09/20/2021 23:38:47 - INFO - __main__ - Step 42283: {'lr': 0.00019927260161557576, 'samples': 1353056, 'steps': 2642, 'loss/train': 1.8864532709121704} -09/20/2021 23:38:48 - INFO - __main__ - Step 42284: {'lr': 0.00019927260161557576, 'samples': 1353088, 'steps': 2642, 'loss/train': 2.4046852588653564} -09/20/2021 23:38:49 - INFO - __main__ - Step 42285: {'lr': 0.00019927260161557576, 'samples': 1353120, 'steps': 2642, 'loss/train': 2.210714817047119} -09/20/2021 23:38:49 - INFO - __main__ - Step 42286: {'lr': 0.00019927260161557576, 'samples': 1353152, 'steps': 2642, 'loss/train': 1.655397891998291} -09/20/2021 23:38:50 - INFO - __main__ - Step 42287: {'lr': 0.00019927260161557576, 'samples': 1353184, 'steps': 2642, 'loss/train': 2.7604176998138428} -09/20/2021 23:38:51 - INFO - __main__ - Step 42288: {'lr': 0.00019927260161557576, 'samples': 1353216, 'steps': 2642, 'loss/train': 1.873895525932312} -09/20/2021 23:38:52 - INFO - __main__ - Step 42289: {'lr': 0.00019927183342708258, 'samples': 1353248, 'steps': 2643, 'loss/train': 2.2423579692840576} -09/20/2021 23:38:52 - INFO - __main__ - Step 42290: {'lr': 0.00019927183342708258, 'samples': 1353280, 'steps': 2643, 'loss/train': 6.237076759338379} -09/20/2021 23:38:53 - INFO - __main__ - Step 42291: {'lr': 0.00019927183342708258, 'samples': 1353312, 'steps': 2643, 'loss/train': 4.684946060180664} -09/20/2021 23:38:54 - INFO - __main__ - Step 42292: {'lr': 0.00019927183342708258, 'samples': 1353344, 'steps': 2643, 'loss/train': 1.7603706121444702} -09/20/2021 23:38:55 - INFO - __main__ - Step 42293: {'lr': 0.00019927183342708258, 'samples': 1353376, 'steps': 2643, 'loss/train': 0.22551681101322174} -09/20/2021 23:38:55 - INFO - __main__ - Step 42294: {'lr': 0.00019927183342708258, 'samples': 1353408, 'steps': 2643, 'loss/train': 1.8094645738601685} -09/20/2021 23:38:56 - INFO - __main__ - Step 42295: {'lr': 0.00019927183342708258, 'samples': 1353440, 'steps': 2643, 'loss/train': 0.5613547563552856} -09/20/2021 23:38:57 - INFO - __main__ - Step 42296: {'lr': 0.00019927183342708258, 'samples': 1353472, 'steps': 2643, 'loss/train': 2.0089664459228516} -09/20/2021 23:38:58 - INFO - __main__ - Step 42297: {'lr': 0.00019927183342708258, 'samples': 1353504, 'steps': 2643, 'loss/train': 1.732415795326233} -09/20/2021 23:38:58 - INFO - __main__ - Step 42298: {'lr': 0.00019927183342708258, 'samples': 1353536, 'steps': 2643, 'loss/train': 0.9413031935691833} -09/20/2021 23:38:59 - INFO - __main__ - Step 42299: {'lr': 0.00019927183342708258, 'samples': 1353568, 'steps': 2643, 'loss/train': 2.7063827514648438} -09/20/2021 23:39:00 - INFO - __main__ - Step 42300: {'lr': 0.00019927183342708258, 'samples': 1353600, 'steps': 2643, 'loss/train': 1.1998974084854126} -09/20/2021 23:39:01 - INFO - __main__ - Step 42301: {'lr': 0.00019927183342708258, 'samples': 1353632, 'steps': 2643, 'loss/train': 1.7139045000076294} -09/20/2021 23:39:01 - INFO - __main__ - Step 42302: {'lr': 0.00019927183342708258, 'samples': 1353664, 'steps': 2643, 'loss/train': 2.216420888900757} -09/20/2021 23:39:02 - INFO - __main__ - Step 42303: {'lr': 0.00019927183342708258, 'samples': 1353696, 'steps': 2643, 'loss/train': 1.4577206373214722} -09/20/2021 23:39:03 - INFO - __main__ - Step 42304: {'lr': 0.00019927183342708258, 'samples': 1353728, 'steps': 2643, 'loss/train': 1.4591515064239502} -09/20/2021 23:39:04 - INFO - __main__ - Step 42305: {'lr': 0.0001992710648346527, 'samples': 1353760, 'steps': 2644, 'loss/train': 2.541797399520874} -09/20/2021 23:39:05 - INFO - __main__ - Step 42306: {'lr': 0.0001992710648346527, 'samples': 1353792, 'steps': 2644, 'loss/train': 2.6469788551330566} -09/20/2021 23:39:05 - INFO - __main__ - Step 42307: {'lr': 0.0001992710648346527, 'samples': 1353824, 'steps': 2644, 'loss/train': 2.022627592086792} -09/20/2021 23:39:06 - INFO - __main__ - Step 42308: {'lr': 0.0001992710648346527, 'samples': 1353856, 'steps': 2644, 'loss/train': 2.026041030883789} -09/20/2021 23:39:07 - INFO - __main__ - Step 42309: {'lr': 0.0001992710648346527, 'samples': 1353888, 'steps': 2644, 'loss/train': 2.497551679611206} -09/20/2021 23:39:08 - INFO - __main__ - Step 42310: {'lr': 0.0001992710648346527, 'samples': 1353920, 'steps': 2644, 'loss/train': 3.0099713802337646} -09/20/2021 23:39:09 - INFO - __main__ - Step 42311: {'lr': 0.0001992710648346527, 'samples': 1353952, 'steps': 2644, 'loss/train': 2.010394811630249} -09/20/2021 23:39:10 - INFO - __main__ - Step 42312: {'lr': 0.0001992710648346527, 'samples': 1353984, 'steps': 2644, 'loss/train': 2.4306702613830566} -09/20/2021 23:39:10 - INFO - __main__ - Step 42313: {'lr': 0.0001992710648346527, 'samples': 1354016, 'steps': 2644, 'loss/train': 1.183127522468567} -09/20/2021 23:39:11 - INFO - __main__ - Step 42314: {'lr': 0.0001992710648346527, 'samples': 1354048, 'steps': 2644, 'loss/train': 2.1411256790161133} -09/20/2021 23:39:12 - INFO - __main__ - Step 42315: {'lr': 0.0001992710648346527, 'samples': 1354080, 'steps': 2644, 'loss/train': 2.0215065479278564} -09/20/2021 23:39:13 - INFO - __main__ - Step 42316: {'lr': 0.0001992710648346527, 'samples': 1354112, 'steps': 2644, 'loss/train': 2.0074923038482666} -09/20/2021 23:39:13 - INFO - __main__ - Step 42317: {'lr': 0.0001992710648346527, 'samples': 1354144, 'steps': 2644, 'loss/train': 1.7731367349624634} -09/20/2021 23:39:14 - INFO - __main__ - Step 42318: {'lr': 0.0001992710648346527, 'samples': 1354176, 'steps': 2644, 'loss/train': 1.7108901739120483} -09/20/2021 23:39:15 - INFO - __main__ - Step 42319: {'lr': 0.0001992710648346527, 'samples': 1354208, 'steps': 2644, 'loss/train': 2.3657469749450684} -09/20/2021 23:39:16 - INFO - __main__ - Step 42320: {'lr': 0.0001992710648346527, 'samples': 1354240, 'steps': 2644, 'loss/train': 2.4307093620300293} -09/20/2021 23:39:16 - INFO - __main__ - Step 42321: {'lr': 0.00019927029583828923, 'samples': 1354272, 'steps': 2645, 'loss/train': 2.0759496688842773} -09/20/2021 23:39:17 - INFO - __main__ - Step 42322: {'lr': 0.00019927029583828923, 'samples': 1354304, 'steps': 2645, 'loss/train': 2.019676923751831} -09/20/2021 23:39:18 - INFO - __main__ - Step 42323: {'lr': 0.00019927029583828923, 'samples': 1354336, 'steps': 2645, 'loss/train': 2.3122105598449707} -09/20/2021 23:39:19 - INFO - __main__ - Step 42324: {'lr': 0.00019927029583828923, 'samples': 1354368, 'steps': 2645, 'loss/train': 1.9989933967590332} -09/20/2021 23:39:19 - INFO - __main__ - Step 42325: {'lr': 0.00019927029583828923, 'samples': 1354400, 'steps': 2645, 'loss/train': 0.16786400973796844} -09/20/2021 23:39:20 - INFO - __main__ - Step 42326: {'lr': 0.00019927029583828923, 'samples': 1354432, 'steps': 2645, 'loss/train': 0.17829835414886475} -09/20/2021 23:39:21 - INFO - __main__ - Step 42327: {'lr': 0.00019927029583828923, 'samples': 1354464, 'steps': 2645, 'loss/train': 2.322777271270752} -09/20/2021 23:39:22 - INFO - __main__ - Step 42328: {'lr': 0.00019927029583828923, 'samples': 1354496, 'steps': 2645, 'loss/train': 2.1694533824920654} -09/20/2021 23:39:22 - INFO - __main__ - Step 42329: {'lr': 0.00019927029583828923, 'samples': 1354528, 'steps': 2645, 'loss/train': 2.5444576740264893} -09/20/2021 23:39:23 - INFO - __main__ - Step 42330: {'lr': 0.00019927029583828923, 'samples': 1354560, 'steps': 2645, 'loss/train': 2.314650774002075} -09/20/2021 23:39:24 - INFO - __main__ - Step 42331: {'lr': 0.00019927029583828923, 'samples': 1354592, 'steps': 2645, 'loss/train': 2.416942834854126} -09/20/2021 23:39:25 - INFO - __main__ - Step 42332: {'lr': 0.00019927029583828923, 'samples': 1354624, 'steps': 2645, 'loss/train': 1.270263910293579} -09/20/2021 23:39:25 - INFO - __main__ - Step 42333: {'lr': 0.00019927029583828923, 'samples': 1354656, 'steps': 2645, 'loss/train': 1.9564417600631714} -09/20/2021 23:39:26 - INFO - __main__ - Step 42334: {'lr': 0.00019927029583828923, 'samples': 1354688, 'steps': 2645, 'loss/train': 3.098461627960205} -09/20/2021 23:39:27 - INFO - __main__ - Step 42335: {'lr': 0.00019927029583828923, 'samples': 1354720, 'steps': 2645, 'loss/train': 0.39958319067955017} -09/20/2021 23:39:28 - INFO - __main__ - Step 42336: {'lr': 0.00019927029583828923, 'samples': 1354752, 'steps': 2645, 'loss/train': 2.1274573802948} -09/20/2021 23:39:29 - INFO - __main__ - Step 42337: {'lr': 0.00019926952643799535, 'samples': 1354784, 'steps': 2646, 'loss/train': 1.804233193397522} -09/20/2021 23:39:29 - INFO - __main__ - Step 42338: {'lr': 0.00019926952643799535, 'samples': 1354816, 'steps': 2646, 'loss/train': 2.0135815143585205} -09/20/2021 23:39:30 - INFO - __main__ - Step 42339: {'lr': 0.00019926952643799535, 'samples': 1354848, 'steps': 2646, 'loss/train': 1.8679206371307373} -09/20/2021 23:39:31 - INFO - __main__ - Step 42340: {'lr': 0.00019926952643799535, 'samples': 1354880, 'steps': 2646, 'loss/train': 2.1046173572540283} -09/20/2021 23:39:32 - INFO - __main__ - Step 42341: {'lr': 0.00019926952643799535, 'samples': 1354912, 'steps': 2646, 'loss/train': 1.391680359840393} -09/20/2021 23:39:33 - INFO - __main__ - Step 42342: {'lr': 0.00019926952643799535, 'samples': 1354944, 'steps': 2646, 'loss/train': 2.5242197513580322} -09/20/2021 23:39:34 - INFO - __main__ - Step 42343: {'lr': 0.00019926952643799535, 'samples': 1354976, 'steps': 2646, 'loss/train': 1.8632960319519043} -09/20/2021 23:39:34 - INFO - __main__ - Step 42344: {'lr': 0.00019926952643799535, 'samples': 1355008, 'steps': 2646, 'loss/train': 2.3261666297912598} -09/20/2021 23:39:35 - INFO - __main__ - Step 42345: {'lr': 0.00019926952643799535, 'samples': 1355040, 'steps': 2646, 'loss/train': 1.583434820175171} -09/20/2021 23:39:36 - INFO - __main__ - Step 42346: {'lr': 0.00019926952643799535, 'samples': 1355072, 'steps': 2646, 'loss/train': 2.8277180194854736} -09/20/2021 23:39:37 - INFO - __main__ - Step 42347: {'lr': 0.00019926952643799535, 'samples': 1355104, 'steps': 2646, 'loss/train': 2.293184995651245} -09/20/2021 23:39:37 - INFO - __main__ - Step 42348: {'lr': 0.00019926952643799535, 'samples': 1355136, 'steps': 2646, 'loss/train': 2.5794665813446045} -09/20/2021 23:39:38 - INFO - __main__ - Step 42349: {'lr': 0.00019926952643799535, 'samples': 1355168, 'steps': 2646, 'loss/train': 1.9168312549591064} -09/20/2021 23:39:39 - INFO - __main__ - Step 42350: {'lr': 0.00019926952643799535, 'samples': 1355200, 'steps': 2646, 'loss/train': 1.9670326709747314} -09/20/2021 23:39:40 - INFO - __main__ - Step 42351: {'lr': 0.00019926952643799535, 'samples': 1355232, 'steps': 2646, 'loss/train': 2.7100961208343506} -09/20/2021 23:39:40 - INFO - __main__ - Step 42352: {'lr': 0.00019926952643799535, 'samples': 1355264, 'steps': 2646, 'loss/train': 1.9446028470993042} -09/20/2021 23:39:41 - INFO - __main__ - Step 42353: {'lr': 0.0001992687566337741, 'samples': 1355296, 'steps': 2647, 'loss/train': 1.4679193496704102} -09/20/2021 23:39:42 - INFO - __main__ - Step 42354: {'lr': 0.0001992687566337741, 'samples': 1355328, 'steps': 2647, 'loss/train': 1.5365904569625854} -09/20/2021 23:39:43 - INFO - __main__ - Step 42355: {'lr': 0.0001992687566337741, 'samples': 1355360, 'steps': 2647, 'loss/train': 1.3845961093902588} -09/20/2021 23:39:43 - INFO - __main__ - Step 42356: {'lr': 0.0001992687566337741, 'samples': 1355392, 'steps': 2647, 'loss/train': 0.37356266379356384} -09/20/2021 23:39:44 - INFO - __main__ - Step 42357: {'lr': 0.0001992687566337741, 'samples': 1355424, 'steps': 2647, 'loss/train': 1.858530879020691} -09/20/2021 23:39:45 - INFO - __main__ - Step 42358: {'lr': 0.0001992687566337741, 'samples': 1355456, 'steps': 2647, 'loss/train': 1.1334550380706787} -09/20/2021 23:39:46 - INFO - __main__ - Step 42359: {'lr': 0.0001992687566337741, 'samples': 1355488, 'steps': 2647, 'loss/train': 1.271328091621399} -09/20/2021 23:39:46 - INFO - __main__ - Step 42360: {'lr': 0.0001992687566337741, 'samples': 1355520, 'steps': 2647, 'loss/train': 2.1670045852661133} -09/20/2021 23:39:47 - INFO - __main__ - Step 42361: {'lr': 0.0001992687566337741, 'samples': 1355552, 'steps': 2647, 'loss/train': 1.5682705640792847} -09/20/2021 23:39:48 - INFO - __main__ - Step 42362: {'lr': 0.0001992687566337741, 'samples': 1355584, 'steps': 2647, 'loss/train': 2.208604097366333} -09/20/2021 23:39:49 - INFO - __main__ - Step 42363: {'lr': 0.0001992687566337741, 'samples': 1355616, 'steps': 2647, 'loss/train': 2.2363853454589844} -09/20/2021 23:39:49 - INFO - __main__ - Step 42364: {'lr': 0.0001992687566337741, 'samples': 1355648, 'steps': 2647, 'loss/train': 2.82332181930542} -09/20/2021 23:39:50 - INFO - __main__ - Step 42365: {'lr': 0.0001992687566337741, 'samples': 1355680, 'steps': 2647, 'loss/train': 2.339897394180298} -09/20/2021 23:39:51 - INFO - __main__ - Step 42366: {'lr': 0.0001992687566337741, 'samples': 1355712, 'steps': 2647, 'loss/train': 1.4325778484344482} -09/20/2021 23:39:52 - INFO - __main__ - Step 42367: {'lr': 0.0001992687566337741, 'samples': 1355744, 'steps': 2647, 'loss/train': 2.181177854537964} -09/20/2021 23:39:53 - INFO - __main__ - Step 42368: {'lr': 0.0001992687566337741, 'samples': 1355776, 'steps': 2647, 'loss/train': 2.57123064994812} -09/20/2021 23:39:53 - INFO - __main__ - Step 42369: {'lr': 0.0001992679864256287, 'samples': 1355808, 'steps': 2648, 'loss/train': 2.4057414531707764} -09/20/2021 23:39:54 - INFO - __main__ - Step 42370: {'lr': 0.0001992679864256287, 'samples': 1355840, 'steps': 2648, 'loss/train': 2.6688408851623535} -09/20/2021 23:39:55 - INFO - __main__ - Step 42371: {'lr': 0.0001992679864256287, 'samples': 1355872, 'steps': 2648, 'loss/train': 2.0174472332000732} -09/20/2021 23:39:56 - INFO - __main__ - Step 42372: {'lr': 0.0001992679864256287, 'samples': 1355904, 'steps': 2648, 'loss/train': 2.772834300994873} -09/20/2021 23:39:57 - INFO - __main__ - Step 42373: {'lr': 0.0001992679864256287, 'samples': 1355936, 'steps': 2648, 'loss/train': 2.1717662811279297} -09/20/2021 23:39:58 - INFO - __main__ - Step 42374: {'lr': 0.0001992679864256287, 'samples': 1355968, 'steps': 2648, 'loss/train': 2.3079566955566406} -09/20/2021 23:39:58 - INFO - __main__ - Step 42375: {'lr': 0.0001992679864256287, 'samples': 1356000, 'steps': 2648, 'loss/train': 2.633989095687866} -09/20/2021 23:39:59 - INFO - __main__ - Step 42376: {'lr': 0.0001992679864256287, 'samples': 1356032, 'steps': 2648, 'loss/train': 1.646873116493225} -09/20/2021 23:40:00 - INFO - __main__ - Step 42377: {'lr': 0.0001992679864256287, 'samples': 1356064, 'steps': 2648, 'loss/train': 1.9630024433135986} -09/20/2021 23:40:01 - INFO - __main__ - Step 42378: {'lr': 0.0001992679864256287, 'samples': 1356096, 'steps': 2648, 'loss/train': 1.7375314235687256} -09/20/2021 23:40:01 - INFO - __main__ - Step 42379: {'lr': 0.0001992679864256287, 'samples': 1356128, 'steps': 2648, 'loss/train': 0.36536598205566406} -09/20/2021 23:40:02 - INFO - __main__ - Step 42380: {'lr': 0.0001992679864256287, 'samples': 1356160, 'steps': 2648, 'loss/train': 3.5212838649749756} -09/20/2021 23:40:03 - INFO - __main__ - Step 42381: {'lr': 0.0001992679864256287, 'samples': 1356192, 'steps': 2648, 'loss/train': 2.852592706680298} -09/20/2021 23:40:04 - INFO - __main__ - Step 42382: {'lr': 0.0001992679864256287, 'samples': 1356224, 'steps': 2648, 'loss/train': 1.5980101823806763} -09/20/2021 23:40:04 - INFO - __main__ - Step 42383: {'lr': 0.0001992679864256287, 'samples': 1356256, 'steps': 2648, 'loss/train': 2.788658380508423} -09/20/2021 23:40:05 - INFO - __main__ - Step 42384: {'lr': 0.0001992679864256287, 'samples': 1356288, 'steps': 2648, 'loss/train': 2.193709373474121} -09/20/2021 23:40:06 - INFO - __main__ - Step 42385: {'lr': 0.00019926721581356224, 'samples': 1356320, 'steps': 2649, 'loss/train': 2.5137267112731934} -09/20/2021 23:40:07 - INFO - __main__ - Step 42386: {'lr': 0.00019926721581356224, 'samples': 1356352, 'steps': 2649, 'loss/train': 1.6131826639175415} -09/20/2021 23:40:08 - INFO - __main__ - Step 42387: {'lr': 0.00019926721581356224, 'samples': 1356384, 'steps': 2649, 'loss/train': 2.6225688457489014} -09/20/2021 23:40:08 - INFO - __main__ - Step 42388: {'lr': 0.00019926721581356224, 'samples': 1356416, 'steps': 2649, 'loss/train': 2.1078078746795654} -09/20/2021 23:40:09 - INFO - __main__ - Step 42389: {'lr': 0.00019926721581356224, 'samples': 1356448, 'steps': 2649, 'loss/train': 5.012269496917725} -09/20/2021 23:40:10 - INFO - __main__ - Step 42390: {'lr': 0.00019926721581356224, 'samples': 1356480, 'steps': 2649, 'loss/train': 2.3505489826202393} -09/20/2021 23:40:11 - INFO - __main__ - Step 42391: {'lr': 0.00019926721581356224, 'samples': 1356512, 'steps': 2649, 'loss/train': 1.5305644273757935} -09/20/2021 23:40:11 - INFO - __main__ - Step 42392: {'lr': 0.00019926721581356224, 'samples': 1356544, 'steps': 2649, 'loss/train': 2.4346301555633545} -09/20/2021 23:40:12 - INFO - __main__ - Step 42393: {'lr': 0.00019926721581356224, 'samples': 1356576, 'steps': 2649, 'loss/train': 1.4559882879257202} -09/20/2021 23:40:13 - INFO - __main__ - Step 42394: {'lr': 0.00019926721581356224, 'samples': 1356608, 'steps': 2649, 'loss/train': 2.11379075050354} -09/20/2021 23:40:14 - INFO - __main__ - Step 42395: {'lr': 0.00019926721581356224, 'samples': 1356640, 'steps': 2649, 'loss/train': 2.8493993282318115} -09/20/2021 23:40:14 - INFO - __main__ - Step 42396: {'lr': 0.00019926721581356224, 'samples': 1356672, 'steps': 2649, 'loss/train': 0.5909642577171326} -09/20/2021 23:40:15 - INFO - __main__ - Step 42397: {'lr': 0.00019926721581356224, 'samples': 1356704, 'steps': 2649, 'loss/train': 1.9278630018234253} -09/20/2021 23:40:16 - INFO - __main__ - Step 42398: {'lr': 0.00019926721581356224, 'samples': 1356736, 'steps': 2649, 'loss/train': 2.449711322784424} -09/20/2021 23:40:17 - INFO - __main__ - Step 42399: {'lr': 0.00019926721581356224, 'samples': 1356768, 'steps': 2649, 'loss/train': 2.6005024909973145} -09/20/2021 23:40:17 - INFO - __main__ - Step 42400: {'lr': 0.00019926721581356224, 'samples': 1356800, 'steps': 2649, 'loss/train': 2.225370407104492} -09/20/2021 23:40:18 - INFO - __main__ - Step 42401: {'lr': 0.00019926644479757787, 'samples': 1356832, 'steps': 2650, 'loss/train': 1.233134150505066} -09/20/2021 23:40:19 - INFO - __main__ - Step 42402: {'lr': 0.00019926644479757787, 'samples': 1356864, 'steps': 2650, 'loss/train': 1.4013124704360962} -09/20/2021 23:40:20 - INFO - __main__ - Step 42403: {'lr': 0.00019926644479757787, 'samples': 1356896, 'steps': 2650, 'loss/train': 1.54248046875} -09/20/2021 23:40:21 - INFO - __main__ - Step 42404: {'lr': 0.00019926644479757787, 'samples': 1356928, 'steps': 2650, 'loss/train': 2.3535120487213135} -09/20/2021 23:40:22 - INFO - __main__ - Step 42405: {'lr': 0.00019926644479757787, 'samples': 1356960, 'steps': 2650, 'loss/train': 2.0869405269622803} -09/20/2021 23:40:22 - INFO - __main__ - Step 42406: {'lr': 0.00019926644479757787, 'samples': 1356992, 'steps': 2650, 'loss/train': 2.199861526489258} -09/20/2021 23:40:23 - INFO - __main__ - Step 42407: {'lr': 0.00019926644479757787, 'samples': 1357024, 'steps': 2650, 'loss/train': 2.4931724071502686} -09/20/2021 23:40:24 - INFO - __main__ - Step 42408: {'lr': 0.00019926644479757787, 'samples': 1357056, 'steps': 2650, 'loss/train': 1.55430006980896} -09/20/2021 23:40:25 - INFO - __main__ - Step 42409: {'lr': 0.00019926644479757787, 'samples': 1357088, 'steps': 2650, 'loss/train': 2.3376717567443848} -09/20/2021 23:40:25 - INFO - __main__ - Step 42410: {'lr': 0.00019926644479757787, 'samples': 1357120, 'steps': 2650, 'loss/train': 2.9797964096069336} -09/20/2021 23:40:26 - INFO - __main__ - Step 42411: {'lr': 0.00019926644479757787, 'samples': 1357152, 'steps': 2650, 'loss/train': 1.5783278942108154} -09/20/2021 23:40:27 - INFO - __main__ - Step 42412: {'lr': 0.00019926644479757787, 'samples': 1357184, 'steps': 2650, 'loss/train': 2.334967613220215} -09/20/2021 23:40:28 - INFO - __main__ - Step 42413: {'lr': 0.00019926644479757787, 'samples': 1357216, 'steps': 2650, 'loss/train': 1.8830044269561768} -09/20/2021 23:40:28 - INFO - __main__ - Step 42414: {'lr': 0.00019926644479757787, 'samples': 1357248, 'steps': 2650, 'loss/train': 2.217620611190796} -09/20/2021 23:40:29 - INFO - __main__ - Step 42415: {'lr': 0.00019926644479757787, 'samples': 1357280, 'steps': 2650, 'loss/train': 1.5554418563842773} -09/20/2021 23:40:30 - INFO - __main__ - Step 42416: {'lr': 0.00019926644479757787, 'samples': 1357312, 'steps': 2650, 'loss/train': 1.895581841468811} -09/20/2021 23:40:31 - INFO - __main__ - Step 42417: {'lr': 0.00019926567337767871, 'samples': 1357344, 'steps': 2651, 'loss/train': 2.2664902210235596} -09/20/2021 23:40:32 - INFO - __main__ - Step 42418: {'lr': 0.00019926567337767871, 'samples': 1357376, 'steps': 2651, 'loss/train': 2.6839733123779297} -09/20/2021 23:40:32 - INFO - __main__ - Step 42419: {'lr': 0.00019926567337767871, 'samples': 1357408, 'steps': 2651, 'loss/train': 1.7053790092468262} -09/20/2021 23:40:33 - INFO - __main__ - Step 42420: {'lr': 0.00019926567337767871, 'samples': 1357440, 'steps': 2651, 'loss/train': 2.021995782852173} -09/20/2021 23:40:34 - INFO - __main__ - Step 42421: {'lr': 0.00019926567337767871, 'samples': 1357472, 'steps': 2651, 'loss/train': 2.1403968334198} -09/20/2021 23:40:35 - INFO - __main__ - Step 42422: {'lr': 0.00019926567337767871, 'samples': 1357504, 'steps': 2651, 'loss/train': 2.523265838623047} -09/20/2021 23:40:35 - INFO - __main__ - Step 42423: {'lr': 0.00019926567337767871, 'samples': 1357536, 'steps': 2651, 'loss/train': 1.7476723194122314} -09/20/2021 23:40:36 - INFO - __main__ - Step 42424: {'lr': 0.00019926567337767871, 'samples': 1357568, 'steps': 2651, 'loss/train': 2.6451244354248047} -09/20/2021 23:40:37 - INFO - __main__ - Step 42425: {'lr': 0.00019926567337767871, 'samples': 1357600, 'steps': 2651, 'loss/train': 2.2147791385650635} -09/20/2021 23:40:38 - INFO - __main__ - Step 42426: {'lr': 0.00019926567337767871, 'samples': 1357632, 'steps': 2651, 'loss/train': 2.0341804027557373} -09/20/2021 23:40:38 - INFO - __main__ - Step 42427: {'lr': 0.00019926567337767871, 'samples': 1357664, 'steps': 2651, 'loss/train': 3.102783441543579} -09/20/2021 23:40:39 - INFO - __main__ - Step 42428: {'lr': 0.00019926567337767871, 'samples': 1357696, 'steps': 2651, 'loss/train': 2.5448317527770996} -09/20/2021 23:40:40 - INFO - __main__ - Step 42429: {'lr': 0.00019926567337767871, 'samples': 1357728, 'steps': 2651, 'loss/train': 1.6169499158859253} -09/20/2021 23:40:41 - INFO - __main__ - Step 42430: {'lr': 0.00019926567337767871, 'samples': 1357760, 'steps': 2651, 'loss/train': 1.8920552730560303} -09/20/2021 23:40:41 - INFO - __main__ - Step 42431: {'lr': 0.00019926567337767871, 'samples': 1357792, 'steps': 2651, 'loss/train': 1.2470005750656128} -09/20/2021 23:40:42 - INFO - __main__ - Step 42432: {'lr': 0.00019926567337767871, 'samples': 1357824, 'steps': 2651, 'loss/train': 2.1262707710266113} -09/20/2021 23:40:44 - INFO - __main__ - Step 42433: {'lr': 0.00019926490155386793, 'samples': 1357856, 'steps': 2652, 'loss/train': 2.4595165252685547} -09/20/2021 23:40:45 - INFO - __main__ - Step 42434: {'lr': 0.00019926490155386793, 'samples': 1357888, 'steps': 2652, 'loss/train': 1.9559296369552612} -09/20/2021 23:40:45 - INFO - __main__ - Step 42435: {'lr': 0.00019926490155386793, 'samples': 1357920, 'steps': 2652, 'loss/train': 3.221574306488037} -09/20/2021 23:40:46 - INFO - __main__ - Step 42436: {'lr': 0.00019926490155386793, 'samples': 1357952, 'steps': 2652, 'loss/train': 1.4604755640029907} -09/20/2021 23:40:47 - INFO - __main__ - Step 42437: {'lr': 0.00019926490155386793, 'samples': 1357984, 'steps': 2652, 'loss/train': 1.6481883525848389} -09/20/2021 23:40:48 - INFO - __main__ - Step 42438: {'lr': 0.00019926490155386793, 'samples': 1358016, 'steps': 2652, 'loss/train': 1.6936094760894775} -09/20/2021 23:40:48 - INFO - __main__ - Step 42439: {'lr': 0.00019926490155386793, 'samples': 1358048, 'steps': 2652, 'loss/train': 2.0951364040374756} -09/20/2021 23:40:49 - INFO - __main__ - Step 42440: {'lr': 0.00019926490155386793, 'samples': 1358080, 'steps': 2652, 'loss/train': 2.6579558849334717} -09/20/2021 23:40:50 - INFO - __main__ - Step 42441: {'lr': 0.00019926490155386793, 'samples': 1358112, 'steps': 2652, 'loss/train': 2.8010640144348145} -09/20/2021 23:40:50 - INFO - __main__ - Step 42442: {'lr': 0.00019926490155386793, 'samples': 1358144, 'steps': 2652, 'loss/train': 2.2517402172088623} -09/20/2021 23:40:51 - INFO - __main__ - Step 42443: {'lr': 0.00019926490155386793, 'samples': 1358176, 'steps': 2652, 'loss/train': 1.713963508605957} -09/20/2021 23:40:52 - INFO - __main__ - Step 42444: {'lr': 0.00019926490155386793, 'samples': 1358208, 'steps': 2652, 'loss/train': 1.42909836769104} -09/20/2021 23:40:53 - INFO - __main__ - Step 42445: {'lr': 0.00019926490155386793, 'samples': 1358240, 'steps': 2652, 'loss/train': 2.4832048416137695} -09/20/2021 23:40:53 - INFO - __main__ - Step 42446: {'lr': 0.00019926490155386793, 'samples': 1358272, 'steps': 2652, 'loss/train': 2.634871006011963} -09/20/2021 23:40:54 - INFO - __main__ - Step 42447: {'lr': 0.00019926490155386793, 'samples': 1358304, 'steps': 2652, 'loss/train': 2.7413382530212402} -09/20/2021 23:40:55 - INFO - __main__ - Step 42448: {'lr': 0.00019926490155386793, 'samples': 1358336, 'steps': 2652, 'loss/train': 2.737700939178467} -09/20/2021 23:40:56 - INFO - __main__ - Step 42449: {'lr': 0.00019926412932614863, 'samples': 1358368, 'steps': 2653, 'loss/train': 2.586507558822632} -09/20/2021 23:40:57 - INFO - __main__ - Step 42450: {'lr': 0.00019926412932614863, 'samples': 1358400, 'steps': 2653, 'loss/train': 2.657841682434082} -09/20/2021 23:40:57 - INFO - __main__ - Step 42451: {'lr': 0.00019926412932614863, 'samples': 1358432, 'steps': 2653, 'loss/train': 2.3938887119293213} -09/20/2021 23:40:58 - INFO - __main__ - Step 42452: {'lr': 0.00019926412932614863, 'samples': 1358464, 'steps': 2653, 'loss/train': 2.4907801151275635} -09/20/2021 23:40:59 - INFO - __main__ - Step 42453: {'lr': 0.00019926412932614863, 'samples': 1358496, 'steps': 2653, 'loss/train': 1.8731030225753784} -09/20/2021 23:41:00 - INFO - __main__ - Step 42454: {'lr': 0.00019926412932614863, 'samples': 1358528, 'steps': 2653, 'loss/train': 2.2074790000915527} -09/20/2021 23:41:00 - INFO - __main__ - Step 42455: {'lr': 0.00019926412932614863, 'samples': 1358560, 'steps': 2653, 'loss/train': 2.658690929412842} -09/20/2021 23:41:01 - INFO - __main__ - Step 42456: {'lr': 0.00019926412932614863, 'samples': 1358592, 'steps': 2653, 'loss/train': 4.272883892059326} -09/20/2021 23:41:02 - INFO - __main__ - Step 42457: {'lr': 0.00019926412932614863, 'samples': 1358624, 'steps': 2653, 'loss/train': 2.5685763359069824} -09/20/2021 23:41:03 - INFO - __main__ - Step 42458: {'lr': 0.00019926412932614863, 'samples': 1358656, 'steps': 2653, 'loss/train': 2.0477097034454346} -09/20/2021 23:41:03 - INFO - __main__ - Step 42459: {'lr': 0.00019926412932614863, 'samples': 1358688, 'steps': 2653, 'loss/train': 2.986511468887329} -09/20/2021 23:41:04 - INFO - __main__ - Step 42460: {'lr': 0.00019926412932614863, 'samples': 1358720, 'steps': 2653, 'loss/train': 2.315640926361084} -09/20/2021 23:41:05 - INFO - __main__ - Step 42461: {'lr': 0.00019926412932614863, 'samples': 1358752, 'steps': 2653, 'loss/train': 1.9366846084594727} -09/20/2021 23:41:06 - INFO - __main__ - Step 42462: {'lr': 0.00019926412932614863, 'samples': 1358784, 'steps': 2653, 'loss/train': 2.2365520000457764} -09/20/2021 23:41:06 - INFO - __main__ - Step 42463: {'lr': 0.00019926412932614863, 'samples': 1358816, 'steps': 2653, 'loss/train': 0.6131717562675476} -09/20/2021 23:41:07 - INFO - __main__ - Step 42464: {'lr': 0.00019926412932614863, 'samples': 1358848, 'steps': 2653, 'loss/train': 0.5379205346107483} -09/20/2021 23:41:08 - INFO - __main__ - Step 42465: {'lr': 0.000199263356694524, 'samples': 1358880, 'steps': 2654, 'loss/train': 0.508701503276825} -09/20/2021 23:41:10 - INFO - __main__ - Step 42466: {'lr': 0.000199263356694524, 'samples': 1358912, 'steps': 2654, 'loss/train': 2.457589626312256} -09/20/2021 23:41:11 - INFO - __main__ - Step 42467: {'lr': 0.000199263356694524, 'samples': 1358944, 'steps': 2654, 'loss/train': 2.427460193634033} -09/20/2021 23:41:11 - INFO - __main__ - Step 42468: {'lr': 0.000199263356694524, 'samples': 1358976, 'steps': 2654, 'loss/train': 1.9862744808197021} -09/20/2021 23:41:12 - INFO - __main__ - Step 42469: {'lr': 0.000199263356694524, 'samples': 1359008, 'steps': 2654, 'loss/train': 2.7230477333068848} -09/20/2021 23:41:13 - INFO - __main__ - Step 42470: {'lr': 0.000199263356694524, 'samples': 1359040, 'steps': 2654, 'loss/train': 1.9059048891067505} -09/20/2021 23:41:14 - INFO - __main__ - Step 42471: {'lr': 0.000199263356694524, 'samples': 1359072, 'steps': 2654, 'loss/train': 2.6533405780792236} -09/20/2021 23:41:14 - INFO - __main__ - Step 42472: {'lr': 0.000199263356694524, 'samples': 1359104, 'steps': 2654, 'loss/train': 2.1767640113830566} -09/20/2021 23:41:15 - INFO - __main__ - Step 42473: {'lr': 0.000199263356694524, 'samples': 1359136, 'steps': 2654, 'loss/train': 2.278773546218872} -09/20/2021 23:41:16 - INFO - __main__ - Step 42474: {'lr': 0.000199263356694524, 'samples': 1359168, 'steps': 2654, 'loss/train': 1.963234782218933} -09/20/2021 23:41:17 - INFO - __main__ - Step 42475: {'lr': 0.000199263356694524, 'samples': 1359200, 'steps': 2654, 'loss/train': 1.7112960815429688} -09/20/2021 23:41:17 - INFO - __main__ - Step 42476: {'lr': 0.000199263356694524, 'samples': 1359232, 'steps': 2654, 'loss/train': 1.8897343873977661} -09/20/2021 23:41:18 - INFO - __main__ - Step 42477: {'lr': 0.000199263356694524, 'samples': 1359264, 'steps': 2654, 'loss/train': 2.2617061138153076} -09/20/2021 23:41:19 - INFO - __main__ - Step 42478: {'lr': 0.000199263356694524, 'samples': 1359296, 'steps': 2654, 'loss/train': 2.494295835494995} -09/20/2021 23:41:20 - INFO - __main__ - Step 42479: {'lr': 0.000199263356694524, 'samples': 1359328, 'steps': 2654, 'loss/train': 2.12450909614563} -09/20/2021 23:41:20 - INFO - __main__ - Step 42480: {'lr': 0.000199263356694524, 'samples': 1359360, 'steps': 2654, 'loss/train': 2.810967445373535} -09/20/2021 23:41:21 - INFO - __main__ - Step 42481: {'lr': 0.00019926258365899715, 'samples': 1359392, 'steps': 2655, 'loss/train': 2.07271671295166} -09/20/2021 23:41:22 - INFO - __main__ - Step 42482: {'lr': 0.00019926258365899715, 'samples': 1359424, 'steps': 2655, 'loss/train': 1.6130582094192505} -09/20/2021 23:41:23 - INFO - __main__ - Step 42483: {'lr': 0.00019926258365899715, 'samples': 1359456, 'steps': 2655, 'loss/train': 2.2531306743621826} -09/20/2021 23:41:24 - INFO - __main__ - Step 42484: {'lr': 0.00019926258365899715, 'samples': 1359488, 'steps': 2655, 'loss/train': 2.338977098464966} -09/20/2021 23:41:24 - INFO - __main__ - Step 42485: {'lr': 0.00019926258365899715, 'samples': 1359520, 'steps': 2655, 'loss/train': 2.7935523986816406} -09/20/2021 23:41:25 - INFO - __main__ - Step 42486: {'lr': 0.00019926258365899715, 'samples': 1359552, 'steps': 2655, 'loss/train': 1.7658746242523193} -09/20/2021 23:41:26 - INFO - __main__ - Step 42487: {'lr': 0.00019926258365899715, 'samples': 1359584, 'steps': 2655, 'loss/train': 2.177191972732544} -09/20/2021 23:41:27 - INFO - __main__ - Step 42488: {'lr': 0.00019926258365899715, 'samples': 1359616, 'steps': 2655, 'loss/train': 2.0970194339752197} -09/20/2021 23:41:27 - INFO - __main__ - Step 42489: {'lr': 0.00019926258365899715, 'samples': 1359648, 'steps': 2655, 'loss/train': 0.5816084742546082} -09/20/2021 23:41:28 - INFO - __main__ - Step 42490: {'lr': 0.00019926258365899715, 'samples': 1359680, 'steps': 2655, 'loss/train': 2.437830686569214} -09/20/2021 23:41:29 - INFO - __main__ - Step 42491: {'lr': 0.00019926258365899715, 'samples': 1359712, 'steps': 2655, 'loss/train': 2.2178773880004883} -09/20/2021 23:41:30 - INFO - __main__ - Step 42492: {'lr': 0.00019926258365899715, 'samples': 1359744, 'steps': 2655, 'loss/train': 2.2349507808685303} -09/20/2021 23:41:30 - INFO - __main__ - Step 42493: {'lr': 0.00019926258365899715, 'samples': 1359776, 'steps': 2655, 'loss/train': 3.0097885131835938} -09/20/2021 23:41:31 - INFO - __main__ - Step 42494: {'lr': 0.00019926258365899715, 'samples': 1359808, 'steps': 2655, 'loss/train': 3.18896484375} -09/20/2021 23:41:32 - INFO - __main__ - Step 42495: {'lr': 0.00019926258365899715, 'samples': 1359840, 'steps': 2655, 'loss/train': 2.892266035079956} -09/20/2021 23:41:33 - INFO - __main__ - Step 42496: {'lr': 0.00019926258365899715, 'samples': 1359872, 'steps': 2655, 'loss/train': 2.9967775344848633} -09/20/2021 23:41:33 - INFO - __main__ - Step 42497: {'lr': 0.0001992618102195712, 'samples': 1359904, 'steps': 2656, 'loss/train': 3.7008724212646484} -09/20/2021 23:41:34 - INFO - __main__ - Step 42498: {'lr': 0.0001992618102195712, 'samples': 1359936, 'steps': 2656, 'loss/train': 2.340947151184082} -09/20/2021 23:41:35 - INFO - __main__ - Step 42499: {'lr': 0.0001992618102195712, 'samples': 1359968, 'steps': 2656, 'loss/train': 1.9986121654510498} -09/20/2021 23:41:36 - INFO - __main__ - Step 42500: {'lr': 0.0001992618102195712, 'samples': 1360000, 'steps': 2656, 'loss/train': 1.5874863862991333} -09/20/2021 23:41:37 - INFO - __main__ - Step 42501: {'lr': 0.0001992618102195712, 'samples': 1360032, 'steps': 2656, 'loss/train': 2.114518880844116} -09/20/2021 23:41:38 - INFO - __main__ - Step 42502: {'lr': 0.0001992618102195712, 'samples': 1360064, 'steps': 2656, 'loss/train': 3.0267040729522705} -09/20/2021 23:41:38 - INFO - __main__ - Step 42503: {'lr': 0.0001992618102195712, 'samples': 1360096, 'steps': 2656, 'loss/train': 2.0754752159118652} -09/20/2021 23:41:39 - INFO - __main__ - Step 42504: {'lr': 0.0001992618102195712, 'samples': 1360128, 'steps': 2656, 'loss/train': 3.0819687843322754} -09/20/2021 23:41:40 - INFO - __main__ - Step 42505: {'lr': 0.0001992618102195712, 'samples': 1360160, 'steps': 2656, 'loss/train': 2.427948474884033} -09/20/2021 23:41:41 - INFO - __main__ - Step 42506: {'lr': 0.0001992618102195712, 'samples': 1360192, 'steps': 2656, 'loss/train': 1.8106436729431152} -09/20/2021 23:41:41 - INFO - __main__ - Step 42507: {'lr': 0.0001992618102195712, 'samples': 1360224, 'steps': 2656, 'loss/train': 2.5033154487609863} -09/20/2021 23:41:42 - INFO - __main__ - Step 42508: {'lr': 0.0001992618102195712, 'samples': 1360256, 'steps': 2656, 'loss/train': 1.739816665649414} -09/20/2021 23:41:43 - INFO - __main__ - Step 42509: {'lr': 0.0001992618102195712, 'samples': 1360288, 'steps': 2656, 'loss/train': 2.134221315383911} -09/20/2021 23:41:44 - INFO - __main__ - Step 42510: {'lr': 0.0001992618102195712, 'samples': 1360320, 'steps': 2656, 'loss/train': 2.4213955402374268} -09/20/2021 23:41:44 - INFO - __main__ - Step 42511: {'lr': 0.0001992618102195712, 'samples': 1360352, 'steps': 2656, 'loss/train': 1.5283676385879517} -09/20/2021 23:41:45 - INFO - __main__ - Step 42512: {'lr': 0.0001992618102195712, 'samples': 1360384, 'steps': 2656, 'loss/train': 2.576357364654541} -09/20/2021 23:41:46 - INFO - __main__ - Step 42513: {'lr': 0.00019926103637624935, 'samples': 1360416, 'steps': 2657, 'loss/train': 2.200092077255249} -09/20/2021 23:41:47 - INFO - __main__ - Step 42514: {'lr': 0.00019926103637624935, 'samples': 1360448, 'steps': 2657, 'loss/train': 2.785504102706909} -09/20/2021 23:41:48 - INFO - __main__ - Step 42515: {'lr': 0.00019926103637624935, 'samples': 1360480, 'steps': 2657, 'loss/train': 2.651625156402588} -09/20/2021 23:41:48 - INFO - __main__ - Step 42516: {'lr': 0.00019926103637624935, 'samples': 1360512, 'steps': 2657, 'loss/train': 3.4642937183380127} -09/20/2021 23:41:49 - INFO - __main__ - Step 42517: {'lr': 0.00019926103637624935, 'samples': 1360544, 'steps': 2657, 'loss/train': 1.6861367225646973} -09/20/2021 23:41:50 - INFO - __main__ - Step 42518: {'lr': 0.00019926103637624935, 'samples': 1360576, 'steps': 2657, 'loss/train': 2.236572742462158} -09/20/2021 23:41:51 - INFO - __main__ - Step 42519: {'lr': 0.00019926103637624935, 'samples': 1360608, 'steps': 2657, 'loss/train': 1.2436258792877197} -09/20/2021 23:41:51 - INFO - __main__ - Step 42520: {'lr': 0.00019926103637624935, 'samples': 1360640, 'steps': 2657, 'loss/train': 2.4489428997039795} -09/20/2021 23:41:52 - INFO - __main__ - Step 42521: {'lr': 0.00019926103637624935, 'samples': 1360672, 'steps': 2657, 'loss/train': 2.1301045417785645} -09/20/2021 23:41:53 - INFO - __main__ - Step 42522: {'lr': 0.00019926103637624935, 'samples': 1360704, 'steps': 2657, 'loss/train': 1.6276357173919678} -09/20/2021 23:41:54 - INFO - __main__ - Step 42523: {'lr': 0.00019926103637624935, 'samples': 1360736, 'steps': 2657, 'loss/train': 1.7097140550613403} -09/20/2021 23:41:54 - INFO - __main__ - Step 42524: {'lr': 0.00019926103637624935, 'samples': 1360768, 'steps': 2657, 'loss/train': 1.944685935974121} -09/20/2021 23:41:55 - INFO - __main__ - Step 42525: {'lr': 0.00019926103637624935, 'samples': 1360800, 'steps': 2657, 'loss/train': 2.060429334640503} -09/20/2021 23:41:56 - INFO - __main__ - Step 42526: {'lr': 0.00019926103637624935, 'samples': 1360832, 'steps': 2657, 'loss/train': 2.9829955101013184} -09/20/2021 23:41:57 - INFO - __main__ - Step 42527: {'lr': 0.00019926103637624935, 'samples': 1360864, 'steps': 2657, 'loss/train': 1.4648395776748657} -09/20/2021 23:41:57 - INFO - __main__ - Step 42528: {'lr': 0.00019926103637624935, 'samples': 1360896, 'steps': 2657, 'loss/train': 2.0742697715759277} -09/20/2021 23:41:59 - INFO - __main__ - Step 42529: {'lr': 0.00019926026212903475, 'samples': 1360928, 'steps': 2658, 'loss/train': 1.8234188556671143} -09/20/2021 23:42:00 - INFO - __main__ - Step 42530: {'lr': 0.00019926026212903475, 'samples': 1360960, 'steps': 2658, 'loss/train': 2.1562862396240234} -09/20/2021 23:42:00 - INFO - __main__ - Step 42531: {'lr': 0.00019926026212903475, 'samples': 1360992, 'steps': 2658, 'loss/train': 0.38927334547042847} -09/20/2021 23:42:01 - INFO - __main__ - Step 42532: {'lr': 0.00019926026212903475, 'samples': 1361024, 'steps': 2658, 'loss/train': 2.0516650676727295} -09/20/2021 23:42:02 - INFO - __main__ - Step 42533: {'lr': 0.00019926026212903475, 'samples': 1361056, 'steps': 2658, 'loss/train': 2.1208884716033936} -09/20/2021 23:42:03 - INFO - __main__ - Step 42534: {'lr': 0.00019926026212903475, 'samples': 1361088, 'steps': 2658, 'loss/train': 2.2819294929504395} -09/20/2021 23:42:03 - INFO - __main__ - Step 42535: {'lr': 0.00019926026212903475, 'samples': 1361120, 'steps': 2658, 'loss/train': 2.1270592212677} -09/20/2021 23:42:04 - INFO - __main__ - Step 42536: {'lr': 0.00019926026212903475, 'samples': 1361152, 'steps': 2658, 'loss/train': 1.8079699277877808} -09/20/2021 23:42:05 - INFO - __main__ - Step 42537: {'lr': 0.00019926026212903475, 'samples': 1361184, 'steps': 2658, 'loss/train': 2.1117849349975586} -09/20/2021 23:42:06 - INFO - __main__ - Step 42538: {'lr': 0.00019926026212903475, 'samples': 1361216, 'steps': 2658, 'loss/train': 1.527855396270752} -09/20/2021 23:42:06 - INFO - __main__ - Step 42539: {'lr': 0.00019926026212903475, 'samples': 1361248, 'steps': 2658, 'loss/train': 1.5161224603652954} -09/20/2021 23:42:07 - INFO - __main__ - Step 42540: {'lr': 0.00019926026212903475, 'samples': 1361280, 'steps': 2658, 'loss/train': 1.6254847049713135} -09/20/2021 23:42:08 - INFO - __main__ - Step 42541: {'lr': 0.00019926026212903475, 'samples': 1361312, 'steps': 2658, 'loss/train': 2.337012529373169} -09/20/2021 23:42:09 - INFO - __main__ - Step 42542: {'lr': 0.00019926026212903475, 'samples': 1361344, 'steps': 2658, 'loss/train': 2.017794132232666} -09/20/2021 23:42:09 - INFO - __main__ - Step 42543: {'lr': 0.00019926026212903475, 'samples': 1361376, 'steps': 2658, 'loss/train': 1.734775424003601} -09/20/2021 23:42:10 - INFO - __main__ - Step 42544: {'lr': 0.00019926026212903475, 'samples': 1361408, 'steps': 2658, 'loss/train': 0.9631147980690002} -09/20/2021 23:42:11 - INFO - __main__ - Step 42545: {'lr': 0.0001992594874779305, 'samples': 1361440, 'steps': 2659, 'loss/train': 2.0908074378967285} -09/20/2021 23:42:12 - INFO - __main__ - Step 42546: {'lr': 0.0001992594874779305, 'samples': 1361472, 'steps': 2659, 'loss/train': 2.09641170501709} -09/20/2021 23:42:12 - INFO - __main__ - Step 42547: {'lr': 0.0001992594874779305, 'samples': 1361504, 'steps': 2659, 'loss/train': 1.6409540176391602} -09/20/2021 23:42:13 - INFO - __main__ - Step 42548: {'lr': 0.0001992594874779305, 'samples': 1361536, 'steps': 2659, 'loss/train': 1.6924270391464233} -09/20/2021 23:42:14 - INFO - __main__ - Step 42549: {'lr': 0.0001992594874779305, 'samples': 1361568, 'steps': 2659, 'loss/train': 1.8854892253875732} -09/20/2021 23:42:15 - INFO - __main__ - Step 42550: {'lr': 0.0001992594874779305, 'samples': 1361600, 'steps': 2659, 'loss/train': 2.539086103439331} -09/20/2021 23:42:15 - INFO - __main__ - Step 42551: {'lr': 0.0001992594874779305, 'samples': 1361632, 'steps': 2659, 'loss/train': 0.626689076423645} -09/20/2021 23:42:16 - INFO - __main__ - Step 42552: {'lr': 0.0001992594874779305, 'samples': 1361664, 'steps': 2659, 'loss/train': 1.9367871284484863} -09/20/2021 23:42:17 - INFO - __main__ - Step 42553: {'lr': 0.0001992594874779305, 'samples': 1361696, 'steps': 2659, 'loss/train': 1.939742088317871} -09/20/2021 23:42:18 - INFO - __main__ - Step 42554: {'lr': 0.0001992594874779305, 'samples': 1361728, 'steps': 2659, 'loss/train': 2.734226942062378} -09/20/2021 23:42:18 - INFO - __main__ - Step 42555: {'lr': 0.0001992594874779305, 'samples': 1361760, 'steps': 2659, 'loss/train': 1.8307323455810547} -09/20/2021 23:42:19 - INFO - __main__ - Step 42556: {'lr': 0.0001992594874779305, 'samples': 1361792, 'steps': 2659, 'loss/train': 2.772339344024658} -09/20/2021 23:42:20 - INFO - __main__ - Step 42557: {'lr': 0.0001992594874779305, 'samples': 1361824, 'steps': 2659, 'loss/train': 1.7178676128387451} -09/20/2021 23:42:21 - INFO - __main__ - Step 42558: {'lr': 0.0001992594874779305, 'samples': 1361856, 'steps': 2659, 'loss/train': 2.057291269302368} -09/20/2021 23:42:21 - INFO - __main__ - Step 42559: {'lr': 0.0001992594874779305, 'samples': 1361888, 'steps': 2659, 'loss/train': 2.003192663192749} -09/20/2021 23:42:23 - INFO - __main__ - Step 42560: {'lr': 0.0001992594874779305, 'samples': 1361920, 'steps': 2659, 'loss/train': 2.2706382274627686} -09/20/2021 23:42:24 - INFO - __main__ - Step 42561: {'lr': 0.0001992587124229398, 'samples': 1361952, 'steps': 2660, 'loss/train': 2.283080816268921} -09/20/2021 23:42:24 - INFO - __main__ - Step 42562: {'lr': 0.0001992587124229398, 'samples': 1361984, 'steps': 2660, 'loss/train': 2.734772205352783} -09/20/2021 23:42:25 - INFO - __main__ - Step 42563: {'lr': 0.0001992587124229398, 'samples': 1362016, 'steps': 2660, 'loss/train': 2.7739388942718506} -09/20/2021 23:42:26 - INFO - __main__ - Step 42564: {'lr': 0.0001992587124229398, 'samples': 1362048, 'steps': 2660, 'loss/train': 1.5865365266799927} -09/20/2021 23:42:27 - INFO - __main__ - Step 42565: {'lr': 0.0001992587124229398, 'samples': 1362080, 'steps': 2660, 'loss/train': 1.3870623111724854} -09/20/2021 23:42:27 - INFO - __main__ - Step 42566: {'lr': 0.0001992587124229398, 'samples': 1362112, 'steps': 2660, 'loss/train': 1.963312029838562} -09/20/2021 23:42:28 - INFO - __main__ - Step 42567: {'lr': 0.0001992587124229398, 'samples': 1362144, 'steps': 2660, 'loss/train': 0.5065882205963135} -09/20/2021 23:42:29 - INFO - __main__ - Step 42568: {'lr': 0.0001992587124229398, 'samples': 1362176, 'steps': 2660, 'loss/train': 1.828762412071228} -09/20/2021 23:42:30 - INFO - __main__ - Step 42569: {'lr': 0.0001992587124229398, 'samples': 1362208, 'steps': 2660, 'loss/train': 2.3097305297851562} -09/20/2021 23:42:30 - INFO - __main__ - Step 42570: {'lr': 0.0001992587124229398, 'samples': 1362240, 'steps': 2660, 'loss/train': 2.2262086868286133} -09/20/2021 23:42:31 - INFO - __main__ - Step 42571: {'lr': 0.0001992587124229398, 'samples': 1362272, 'steps': 2660, 'loss/train': 2.3768107891082764} -09/20/2021 23:42:32 - INFO - __main__ - Step 42572: {'lr': 0.0001992587124229398, 'samples': 1362304, 'steps': 2660, 'loss/train': 1.7374780178070068} -09/20/2021 23:42:33 - INFO - __main__ - Step 42573: {'lr': 0.0001992587124229398, 'samples': 1362336, 'steps': 2660, 'loss/train': 1.7284783124923706} -09/20/2021 23:42:33 - INFO - __main__ - Step 42574: {'lr': 0.0001992587124229398, 'samples': 1362368, 'steps': 2660, 'loss/train': 1.6531729698181152} -09/20/2021 23:42:34 - INFO - __main__ - Step 42575: {'lr': 0.0001992587124229398, 'samples': 1362400, 'steps': 2660, 'loss/train': 1.8908296823501587} -09/20/2021 23:42:35 - INFO - __main__ - Step 42576: {'lr': 0.0001992587124229398, 'samples': 1362432, 'steps': 2660, 'loss/train': 2.279974937438965} -09/20/2021 23:42:36 - INFO - __main__ - Step 42577: {'lr': 0.00019925793696406573, 'samples': 1362464, 'steps': 2661, 'loss/train': 0.7157118916511536} -09/20/2021 23:42:37 - INFO - __main__ - Step 42578: {'lr': 0.00019925793696406573, 'samples': 1362496, 'steps': 2661, 'loss/train': 2.1031298637390137} -09/20/2021 23:42:37 - INFO - __main__ - Step 42579: {'lr': 0.00019925793696406573, 'samples': 1362528, 'steps': 2661, 'loss/train': 3.4446969032287598} -09/20/2021 23:42:38 - INFO - __main__ - Step 42580: {'lr': 0.00019925793696406573, 'samples': 1362560, 'steps': 2661, 'loss/train': 1.4265456199645996} -09/20/2021 23:42:39 - INFO - __main__ - Step 42581: {'lr': 0.00019925793696406573, 'samples': 1362592, 'steps': 2661, 'loss/train': 1.5817369222640991} -09/20/2021 23:42:40 - INFO - __main__ - Step 42582: {'lr': 0.00019925793696406573, 'samples': 1362624, 'steps': 2661, 'loss/train': 2.5367960929870605} -09/20/2021 23:42:40 - INFO - __main__ - Step 42583: {'lr': 0.00019925793696406573, 'samples': 1362656, 'steps': 2661, 'loss/train': 1.7466644048690796} -09/20/2021 23:42:41 - INFO - __main__ - Step 42584: {'lr': 0.00019925793696406573, 'samples': 1362688, 'steps': 2661, 'loss/train': 2.2408289909362793} -09/20/2021 23:42:42 - INFO - __main__ - Step 42585: {'lr': 0.00019925793696406573, 'samples': 1362720, 'steps': 2661, 'loss/train': 3.4306437969207764} -09/20/2021 23:42:43 - INFO - __main__ - Step 42586: {'lr': 0.00019925793696406573, 'samples': 1362752, 'steps': 2661, 'loss/train': 3.534635305404663} -09/20/2021 23:42:43 - INFO - __main__ - Step 42587: {'lr': 0.00019925793696406573, 'samples': 1362784, 'steps': 2661, 'loss/train': 3.459317922592163} -09/20/2021 23:42:44 - INFO - __main__ - Step 42588: {'lr': 0.00019925793696406573, 'samples': 1362816, 'steps': 2661, 'loss/train': 3.5810964107513428} -09/20/2021 23:42:45 - INFO - __main__ - Step 42589: {'lr': 0.00019925793696406573, 'samples': 1362848, 'steps': 2661, 'loss/train': 3.5859713554382324} -09/20/2021 23:42:46 - INFO - __main__ - Step 42590: {'lr': 0.00019925793696406573, 'samples': 1362880, 'steps': 2661, 'loss/train': 3.41572904586792} -09/20/2021 23:42:46 - INFO - __main__ - Step 42591: {'lr': 0.00019925793696406573, 'samples': 1362912, 'steps': 2661, 'loss/train': 1.6040412187576294} -09/20/2021 23:42:47 - INFO - __main__ - Step 42592: {'lr': 0.00019925793696406573, 'samples': 1362944, 'steps': 2661, 'loss/train': 2.101048707962036} -09/20/2021 23:42:48 - INFO - __main__ - Step 42593: {'lr': 0.00019925716110131156, 'samples': 1362976, 'steps': 2662, 'loss/train': 2.575080394744873} -09/20/2021 23:42:49 - INFO - __main__ - Step 42594: {'lr': 0.00019925716110131156, 'samples': 1363008, 'steps': 2662, 'loss/train': 0.7669646739959717} -09/20/2021 23:42:50 - INFO - __main__ - Step 42595: {'lr': 0.00019925716110131156, 'samples': 1363040, 'steps': 2662, 'loss/train': 3.1705853939056396} -09/20/2021 23:42:50 - INFO - __main__ - Step 42596: {'lr': 0.00019925716110131156, 'samples': 1363072, 'steps': 2662, 'loss/train': 2.8770174980163574} -09/20/2021 23:42:52 - INFO - __main__ - Step 42597: {'lr': 0.00019925716110131156, 'samples': 1363104, 'steps': 2662, 'loss/train': 2.2782626152038574} -09/20/2021 23:42:52 - INFO - __main__ - Step 42598: {'lr': 0.00019925716110131156, 'samples': 1363136, 'steps': 2662, 'loss/train': 0.6316856145858765} -09/20/2021 23:42:53 - INFO - __main__ - Step 42599: {'lr': 0.00019925716110131156, 'samples': 1363168, 'steps': 2662, 'loss/train': 2.247485876083374} -09/20/2021 23:42:54 - INFO - __main__ - Step 42600: {'lr': 0.00019925716110131156, 'samples': 1363200, 'steps': 2662, 'loss/train': 1.9775047302246094} -09/20/2021 23:42:55 - INFO - __main__ - Step 42601: {'lr': 0.00019925716110131156, 'samples': 1363232, 'steps': 2662, 'loss/train': 2.1655070781707764} -09/20/2021 23:42:55 - INFO - __main__ - Step 42602: {'lr': 0.00019925716110131156, 'samples': 1363264, 'steps': 2662, 'loss/train': 1.8572487831115723} -09/20/2021 23:42:56 - INFO - __main__ - Step 42603: {'lr': 0.00019925716110131156, 'samples': 1363296, 'steps': 2662, 'loss/train': 1.9747486114501953} -09/20/2021 23:42:57 - INFO - __main__ - Step 42604: {'lr': 0.00019925716110131156, 'samples': 1363328, 'steps': 2662, 'loss/train': 1.8318805694580078} -09/20/2021 23:42:58 - INFO - __main__ - Step 42605: {'lr': 0.00019925716110131156, 'samples': 1363360, 'steps': 2662, 'loss/train': 2.0744359493255615} -09/20/2021 23:42:58 - INFO - __main__ - Step 42606: {'lr': 0.00019925716110131156, 'samples': 1363392, 'steps': 2662, 'loss/train': 1.4037339687347412} -09/20/2021 23:42:59 - INFO - __main__ - Step 42607: {'lr': 0.00019925716110131156, 'samples': 1363424, 'steps': 2662, 'loss/train': 2.1737611293792725} -09/20/2021 23:43:00 - INFO - __main__ - Step 42608: {'lr': 0.00019925716110131156, 'samples': 1363456, 'steps': 2662, 'loss/train': 2.7256317138671875} -09/20/2021 23:43:01 - INFO - __main__ - Step 42609: {'lr': 0.00019925638483468038, 'samples': 1363488, 'steps': 2663, 'loss/train': 2.3538053035736084} -09/20/2021 23:43:01 - INFO - __main__ - Step 42610: {'lr': 0.00019925638483468038, 'samples': 1363520, 'steps': 2663, 'loss/train': 1.7381736040115356} -09/20/2021 23:43:02 - INFO - __main__ - Step 42611: {'lr': 0.00019925638483468038, 'samples': 1363552, 'steps': 2663, 'loss/train': 2.029292583465576} -09/20/2021 23:43:03 - INFO - __main__ - Step 42612: {'lr': 0.00019925638483468038, 'samples': 1363584, 'steps': 2663, 'loss/train': 2.739969253540039} -09/20/2021 23:43:04 - INFO - __main__ - Step 42613: {'lr': 0.00019925638483468038, 'samples': 1363616, 'steps': 2663, 'loss/train': 2.6934316158294678} -09/20/2021 23:43:04 - INFO - __main__ - Step 42614: {'lr': 0.00019925638483468038, 'samples': 1363648, 'steps': 2663, 'loss/train': 1.8099918365478516} -09/20/2021 23:43:05 - INFO - __main__ - Step 42615: {'lr': 0.00019925638483468038, 'samples': 1363680, 'steps': 2663, 'loss/train': 2.025928258895874} -09/20/2021 23:43:06 - INFO - __main__ - Step 42616: {'lr': 0.00019925638483468038, 'samples': 1363712, 'steps': 2663, 'loss/train': 2.540709972381592} -09/20/2021 23:43:07 - INFO - __main__ - Step 42617: {'lr': 0.00019925638483468038, 'samples': 1363744, 'steps': 2663, 'loss/train': 1.8398065567016602} -09/20/2021 23:43:07 - INFO - __main__ - Step 42618: {'lr': 0.00019925638483468038, 'samples': 1363776, 'steps': 2663, 'loss/train': 2.3083181381225586} -09/20/2021 23:43:08 - INFO - __main__ - Step 42619: {'lr': 0.00019925638483468038, 'samples': 1363808, 'steps': 2663, 'loss/train': 1.303452730178833} -09/20/2021 23:43:09 - INFO - __main__ - Step 42620: {'lr': 0.00019925638483468038, 'samples': 1363840, 'steps': 2663, 'loss/train': 1.4460538625717163} -09/20/2021 23:43:10 - INFO - __main__ - Step 42621: {'lr': 0.00019925638483468038, 'samples': 1363872, 'steps': 2663, 'loss/train': 1.3949576616287231} -09/20/2021 23:43:10 - INFO - __main__ - Step 42622: {'lr': 0.00019925638483468038, 'samples': 1363904, 'steps': 2663, 'loss/train': 0.4739743173122406} -09/20/2021 23:43:11 - INFO - __main__ - Step 42623: {'lr': 0.00019925638483468038, 'samples': 1363936, 'steps': 2663, 'loss/train': 1.6088454723358154} -09/20/2021 23:43:12 - INFO - __main__ - Step 42624: {'lr': 0.00019925638483468038, 'samples': 1363968, 'steps': 2663, 'loss/train': 1.6142780780792236} -09/20/2021 23:43:13 - INFO - __main__ - Step 42625: {'lr': 0.00019925560816417534, 'samples': 1364000, 'steps': 2664, 'loss/train': 1.7348463535308838} -09/20/2021 23:43:14 - INFO - __main__ - Step 42626: {'lr': 0.00019925560816417534, 'samples': 1364032, 'steps': 2664, 'loss/train': 1.6722854375839233} -09/20/2021 23:43:14 - INFO - __main__ - Step 42627: {'lr': 0.00019925560816417534, 'samples': 1364064, 'steps': 2664, 'loss/train': 1.268876552581787} -09/20/2021 23:43:15 - INFO - __main__ - Step 42628: {'lr': 0.00019925560816417534, 'samples': 1364096, 'steps': 2664, 'loss/train': 2.4238576889038086} -09/20/2021 23:43:16 - INFO - __main__ - Step 42629: {'lr': 0.00019925560816417534, 'samples': 1364128, 'steps': 2664, 'loss/train': 0.8282279372215271} -09/20/2021 23:43:17 - INFO - __main__ - Step 42630: {'lr': 0.00019925560816417534, 'samples': 1364160, 'steps': 2664, 'loss/train': 2.8189594745635986} -09/20/2021 23:43:18 - INFO - __main__ - Step 42631: {'lr': 0.00019925560816417534, 'samples': 1364192, 'steps': 2664, 'loss/train': 1.599212408065796} -09/20/2021 23:43:19 - INFO - __main__ - Step 42632: {'lr': 0.00019925560816417534, 'samples': 1364224, 'steps': 2664, 'loss/train': 2.099269390106201} -09/20/2021 23:43:19 - INFO - __main__ - Step 42633: {'lr': 0.00019925560816417534, 'samples': 1364256, 'steps': 2664, 'loss/train': 6.246743202209473} -09/20/2021 23:43:20 - INFO - __main__ - Step 42634: {'lr': 0.00019925560816417534, 'samples': 1364288, 'steps': 2664, 'loss/train': 6.1055097579956055} -09/20/2021 23:43:21 - INFO - __main__ - Step 42635: {'lr': 0.00019925560816417534, 'samples': 1364320, 'steps': 2664, 'loss/train': 6.18484354019165} -09/20/2021 23:43:22 - INFO - __main__ - Step 42636: {'lr': 0.00019925560816417534, 'samples': 1364352, 'steps': 2664, 'loss/train': 6.113645553588867} -09/20/2021 23:43:22 - INFO - __main__ - Step 42637: {'lr': 0.00019925560816417534, 'samples': 1364384, 'steps': 2664, 'loss/train': 6.191632270812988} -09/20/2021 23:43:23 - INFO - __main__ - Step 42638: {'lr': 0.00019925560816417534, 'samples': 1364416, 'steps': 2664, 'loss/train': 6.14054536819458} -09/20/2021 23:43:24 - INFO - __main__ - Step 42639: {'lr': 0.00019925560816417534, 'samples': 1364448, 'steps': 2664, 'loss/train': 6.181967735290527} -09/20/2021 23:43:25 - INFO - __main__ - Step 42640: {'lr': 0.00019925560816417534, 'samples': 1364480, 'steps': 2664, 'loss/train': 2.282017946243286} -09/20/2021 23:43:26 - INFO - __main__ - Step 42641: {'lr': 0.0001992548310897996, 'samples': 1364512, 'steps': 2665, 'loss/train': 2.414328098297119} -09/20/2021 23:43:26 - INFO - __main__ - Step 42642: {'lr': 0.0001992548310897996, 'samples': 1364544, 'steps': 2665, 'loss/train': 2.038687229156494} -09/20/2021 23:43:27 - INFO - __main__ - Step 42643: {'lr': 0.0001992548310897996, 'samples': 1364576, 'steps': 2665, 'loss/train': 0.3199550211429596} -09/20/2021 23:43:28 - INFO - __main__ - Step 42644: {'lr': 0.0001992548310897996, 'samples': 1364608, 'steps': 2665, 'loss/train': 1.5251866579055786} -09/20/2021 23:43:29 - INFO - __main__ - Step 42645: {'lr': 0.0001992548310897996, 'samples': 1364640, 'steps': 2665, 'loss/train': 2.546100616455078} -09/20/2021 23:43:29 - INFO - __main__ - Step 42646: {'lr': 0.0001992548310897996, 'samples': 1364672, 'steps': 2665, 'loss/train': 2.028141498565674} -09/20/2021 23:43:30 - INFO - __main__ - Step 42647: {'lr': 0.0001992548310897996, 'samples': 1364704, 'steps': 2665, 'loss/train': 1.997288465499878} -09/20/2021 23:43:31 - INFO - __main__ - Step 42648: {'lr': 0.0001992548310897996, 'samples': 1364736, 'steps': 2665, 'loss/train': 2.1064975261688232} -09/20/2021 23:43:32 - INFO - __main__ - Step 42649: {'lr': 0.0001992548310897996, 'samples': 1364768, 'steps': 2665, 'loss/train': 2.4904260635375977} -09/20/2021 23:43:32 - INFO - __main__ - Step 42650: {'lr': 0.0001992548310897996, 'samples': 1364800, 'steps': 2665, 'loss/train': 2.2364375591278076} -09/20/2021 23:43:33 - INFO - __main__ - Step 42651: {'lr': 0.0001992548310897996, 'samples': 1364832, 'steps': 2665, 'loss/train': 2.2971458435058594} -09/20/2021 23:43:34 - INFO - __main__ - Step 42652: {'lr': 0.0001992548310897996, 'samples': 1364864, 'steps': 2665, 'loss/train': 2.6354963779449463} -09/20/2021 23:43:35 - INFO - __main__ - Step 42653: {'lr': 0.0001992548310897996, 'samples': 1364896, 'steps': 2665, 'loss/train': 1.5762258768081665} -09/20/2021 23:43:35 - INFO - __main__ - Step 42654: {'lr': 0.0001992548310897996, 'samples': 1364928, 'steps': 2665, 'loss/train': 0.9323456883430481} -09/20/2021 23:43:36 - INFO - __main__ - Step 42655: {'lr': 0.0001992548310897996, 'samples': 1364960, 'steps': 2665, 'loss/train': 2.4963181018829346} -09/20/2021 23:43:37 - INFO - __main__ - Step 42656: {'lr': 0.0001992548310897996, 'samples': 1364992, 'steps': 2665, 'loss/train': 0.20813684165477753} -09/20/2021 23:43:38 - INFO - __main__ - Step 42657: {'lr': 0.00019925405361155638, 'samples': 1365024, 'steps': 2666, 'loss/train': 2.7390334606170654} -09/20/2021 23:43:39 - INFO - __main__ - Step 42658: {'lr': 0.00019925405361155638, 'samples': 1365056, 'steps': 2666, 'loss/train': 1.8463793992996216} -09/20/2021 23:43:39 - INFO - __main__ - Step 42659: {'lr': 0.00019925405361155638, 'samples': 1365088, 'steps': 2666, 'loss/train': 1.4737768173217773} -09/20/2021 23:43:40 - INFO - __main__ - Step 42660: {'lr': 0.00019925405361155638, 'samples': 1365120, 'steps': 2666, 'loss/train': 2.02148175239563} -09/20/2021 23:43:41 - INFO - __main__ - Step 42661: {'lr': 0.00019925405361155638, 'samples': 1365152, 'steps': 2666, 'loss/train': 2.049593448638916} -09/20/2021 23:43:42 - INFO - __main__ - Step 42662: {'lr': 0.00019925405361155638, 'samples': 1365184, 'steps': 2666, 'loss/train': 1.4812124967575073} -09/20/2021 23:43:43 - INFO - __main__ - Step 42663: {'lr': 0.00019925405361155638, 'samples': 1365216, 'steps': 2666, 'loss/train': 1.3963805437088013} -09/20/2021 23:43:44 - INFO - __main__ - Step 42664: {'lr': 0.00019925405361155638, 'samples': 1365248, 'steps': 2666, 'loss/train': 1.9508591890335083} -09/20/2021 23:43:44 - INFO - __main__ - Step 42665: {'lr': 0.00019925405361155638, 'samples': 1365280, 'steps': 2666, 'loss/train': 2.3005685806274414} -09/20/2021 23:43:45 - INFO - __main__ - Step 42666: {'lr': 0.00019925405361155638, 'samples': 1365312, 'steps': 2666, 'loss/train': 2.0281143188476562} -09/20/2021 23:43:46 - INFO - __main__ - Step 42667: {'lr': 0.00019925405361155638, 'samples': 1365344, 'steps': 2666, 'loss/train': 2.352238655090332} -09/20/2021 23:43:47 - INFO - __main__ - Step 42668: {'lr': 0.00019925405361155638, 'samples': 1365376, 'steps': 2666, 'loss/train': 2.0417771339416504} -09/20/2021 23:43:47 - INFO - __main__ - Step 42669: {'lr': 0.00019925405361155638, 'samples': 1365408, 'steps': 2666, 'loss/train': 1.9637258052825928} -09/20/2021 23:43:48 - INFO - __main__ - Step 42670: {'lr': 0.00019925405361155638, 'samples': 1365440, 'steps': 2666, 'loss/train': 1.7696155309677124} -09/20/2021 23:43:49 - INFO - __main__ - Step 42671: {'lr': 0.00019925405361155638, 'samples': 1365472, 'steps': 2666, 'loss/train': 2.420307159423828} -09/20/2021 23:43:50 - INFO - __main__ - Step 42672: {'lr': 0.00019925405361155638, 'samples': 1365504, 'steps': 2666, 'loss/train': 2.006105422973633} -09/20/2021 23:43:50 - INFO - __main__ - Step 42673: {'lr': 0.00019925327572944878, 'samples': 1365536, 'steps': 2667, 'loss/train': 2.079953670501709} -09/20/2021 23:43:51 - INFO - __main__ - Step 42674: {'lr': 0.00019925327572944878, 'samples': 1365568, 'steps': 2667, 'loss/train': 1.6939579248428345} -09/20/2021 23:43:52 - INFO - __main__ - Step 42675: {'lr': 0.00019925327572944878, 'samples': 1365600, 'steps': 2667, 'loss/train': 1.7943841218948364} -09/20/2021 23:43:53 - INFO - __main__ - Step 42676: {'lr': 0.00019925327572944878, 'samples': 1365632, 'steps': 2667, 'loss/train': 1.215754508972168} -09/20/2021 23:43:53 - INFO - __main__ - Step 42677: {'lr': 0.00019925327572944878, 'samples': 1365664, 'steps': 2667, 'loss/train': 1.4384819269180298} -09/20/2021 23:43:54 - INFO - __main__ - Step 42678: {'lr': 0.00019925327572944878, 'samples': 1365696, 'steps': 2667, 'loss/train': 1.1727732419967651} -09/20/2021 23:43:55 - INFO - __main__ - Step 42679: {'lr': 0.00019925327572944878, 'samples': 1365728, 'steps': 2667, 'loss/train': 0.16444775462150574} -09/20/2021 23:43:56 - INFO - __main__ - Step 42680: {'lr': 0.00019925327572944878, 'samples': 1365760, 'steps': 2667, 'loss/train': 3.731477975845337} -09/20/2021 23:43:56 - INFO - __main__ - Step 42681: {'lr': 0.00019925327572944878, 'samples': 1365792, 'steps': 2667, 'loss/train': 1.3239344358444214} -09/20/2021 23:43:57 - INFO - __main__ - Step 42682: {'lr': 0.00019925327572944878, 'samples': 1365824, 'steps': 2667, 'loss/train': 1.442236065864563} -09/20/2021 23:43:58 - INFO - __main__ - Step 42683: {'lr': 0.00019925327572944878, 'samples': 1365856, 'steps': 2667, 'loss/train': 2.3665101528167725} -09/20/2021 23:43:59 - INFO - __main__ - Step 42684: {'lr': 0.00019925327572944878, 'samples': 1365888, 'steps': 2667, 'loss/train': 2.249103546142578} -09/20/2021 23:43:59 - INFO - __main__ - Step 42685: {'lr': 0.00019925327572944878, 'samples': 1365920, 'steps': 2667, 'loss/train': 2.379718780517578} -09/20/2021 23:44:00 - INFO - __main__ - Step 42686: {'lr': 0.00019925327572944878, 'samples': 1365952, 'steps': 2667, 'loss/train': 1.5775080919265747} -09/20/2021 23:44:01 - INFO - __main__ - Step 42687: {'lr': 0.00019925327572944878, 'samples': 1365984, 'steps': 2667, 'loss/train': 1.9883300065994263} -09/20/2021 23:44:02 - INFO - __main__ - Step 42688: {'lr': 0.00019925327572944878, 'samples': 1366016, 'steps': 2667, 'loss/train': 2.5488169193267822} -09/20/2021 23:44:03 - INFO - __main__ - Step 42689: {'lr': 0.00019925249744348, 'samples': 1366048, 'steps': 2668, 'loss/train': 2.281691312789917} -09/20/2021 23:44:03 - INFO - __main__ - Step 42690: {'lr': 0.00019925249744348, 'samples': 1366080, 'steps': 2668, 'loss/train': 2.7812142372131348} -09/20/2021 23:44:04 - INFO - __main__ - Step 42691: {'lr': 0.00019925249744348, 'samples': 1366112, 'steps': 2668, 'loss/train': 2.0741961002349854} -09/20/2021 23:44:05 - INFO - __main__ - Step 42692: {'lr': 0.00019925249744348, 'samples': 1366144, 'steps': 2668, 'loss/train': 2.8608596324920654} -09/20/2021 23:44:06 - INFO - __main__ - Step 42693: {'lr': 0.00019925249744348, 'samples': 1366176, 'steps': 2668, 'loss/train': 1.9464550018310547} -09/20/2021 23:44:07 - INFO - __main__ - Step 42694: {'lr': 0.00019925249744348, 'samples': 1366208, 'steps': 2668, 'loss/train': 2.2142467498779297} -09/20/2021 23:44:08 - INFO - __main__ - Step 42695: {'lr': 0.00019925249744348, 'samples': 1366240, 'steps': 2668, 'loss/train': 2.3621881008148193} -09/20/2021 23:44:09 - INFO - __main__ - Step 42696: {'lr': 0.00019925249744348, 'samples': 1366272, 'steps': 2668, 'loss/train': 1.2573323249816895} -09/20/2021 23:44:09 - INFO - __main__ - Step 42697: {'lr': 0.00019925249744348, 'samples': 1366304, 'steps': 2668, 'loss/train': 4.119604110717773} -09/20/2021 23:44:10 - INFO - __main__ - Step 42698: {'lr': 0.00019925249744348, 'samples': 1366336, 'steps': 2668, 'loss/train': 1.6014389991760254} -09/20/2021 23:44:11 - INFO - __main__ - Step 42699: {'lr': 0.00019925249744348, 'samples': 1366368, 'steps': 2668, 'loss/train': 1.5334346294403076} -09/20/2021 23:44:12 - INFO - __main__ - Step 42700: {'lr': 0.00019925249744348, 'samples': 1366400, 'steps': 2668, 'loss/train': 2.5328433513641357} -09/20/2021 23:44:12 - INFO - __main__ - Step 42701: {'lr': 0.00019925249744348, 'samples': 1366432, 'steps': 2668, 'loss/train': 2.969388008117676} -09/20/2021 23:44:13 - INFO - __main__ - Step 42702: {'lr': 0.00019925249744348, 'samples': 1366464, 'steps': 2668, 'loss/train': 1.641452431678772} -09/20/2021 23:44:14 - INFO - __main__ - Step 42703: {'lr': 0.00019925249744348, 'samples': 1366496, 'steps': 2668, 'loss/train': 1.9081628322601318} -09/20/2021 23:44:15 - INFO - __main__ - Step 42704: {'lr': 0.00019925249744348, 'samples': 1366528, 'steps': 2668, 'loss/train': 2.5459280014038086} -09/20/2021 23:44:15 - INFO - __main__ - Step 42705: {'lr': 0.00019925171875365317, 'samples': 1366560, 'steps': 2669, 'loss/train': 1.9725309610366821} -09/20/2021 23:44:16 - INFO - __main__ - Step 42706: {'lr': 0.00019925171875365317, 'samples': 1366592, 'steps': 2669, 'loss/train': 1.9371587038040161} -09/20/2021 23:44:17 - INFO - __main__ - Step 42707: {'lr': 0.00019925171875365317, 'samples': 1366624, 'steps': 2669, 'loss/train': 1.9039493799209595} -09/20/2021 23:44:18 - INFO - __main__ - Step 42708: {'lr': 0.00019925171875365317, 'samples': 1366656, 'steps': 2669, 'loss/train': 2.3835010528564453} -09/20/2021 23:44:18 - INFO - __main__ - Step 42709: {'lr': 0.00019925171875365317, 'samples': 1366688, 'steps': 2669, 'loss/train': 3.0282719135284424} -09/20/2021 23:44:19 - INFO - __main__ - Step 42710: {'lr': 0.00019925171875365317, 'samples': 1366720, 'steps': 2669, 'loss/train': 1.2446789741516113} -09/20/2021 23:44:20 - INFO - __main__ - Step 42711: {'lr': 0.00019925171875365317, 'samples': 1366752, 'steps': 2669, 'loss/train': 1.9641661643981934} -09/20/2021 23:44:21 - INFO - __main__ - Step 42712: {'lr': 0.00019925171875365317, 'samples': 1366784, 'steps': 2669, 'loss/train': 1.950595736503601} -09/20/2021 23:44:21 - INFO - __main__ - Step 42713: {'lr': 0.00019925171875365317, 'samples': 1366816, 'steps': 2669, 'loss/train': 1.4240621328353882} -09/20/2021 23:44:22 - INFO - __main__ - Step 42714: {'lr': 0.00019925171875365317, 'samples': 1366848, 'steps': 2669, 'loss/train': 2.0330562591552734} -09/20/2021 23:44:23 - INFO - __main__ - Step 42715: {'lr': 0.00019925171875365317, 'samples': 1366880, 'steps': 2669, 'loss/train': 0.3150642216205597} -09/20/2021 23:44:24 - INFO - __main__ - Step 42716: {'lr': 0.00019925171875365317, 'samples': 1366912, 'steps': 2669, 'loss/train': 0.12752895057201385} -09/20/2021 23:44:24 - INFO - __main__ - Step 42717: {'lr': 0.00019925171875365317, 'samples': 1366944, 'steps': 2669, 'loss/train': 0.24150799214839935} -09/20/2021 23:44:25 - INFO - __main__ - Step 42718: {'lr': 0.00019925171875365317, 'samples': 1366976, 'steps': 2669, 'loss/train': 0.26963549852371216} -09/20/2021 23:44:26 - INFO - __main__ - Step 42719: {'lr': 0.00019925171875365317, 'samples': 1367008, 'steps': 2669, 'loss/train': 0.2788662910461426} -09/20/2021 23:44:27 - INFO - __main__ - Step 42720: {'lr': 0.00019925171875365317, 'samples': 1367040, 'steps': 2669, 'loss/train': 2.051520824432373} -09/20/2021 23:44:28 - INFO - __main__ - Step 42721: {'lr': 0.00019925093965997151, 'samples': 1367072, 'steps': 2670, 'loss/train': 1.4966171979904175} -09/20/2021 23:44:28 - INFO - __main__ - Step 42722: {'lr': 0.00019925093965997151, 'samples': 1367104, 'steps': 2670, 'loss/train': 2.0717883110046387} -09/20/2021 23:44:29 - INFO - __main__ - Step 42723: {'lr': 0.00019925093965997151, 'samples': 1367136, 'steps': 2670, 'loss/train': 2.538722276687622} -09/20/2021 23:44:30 - INFO - __main__ - Step 42724: {'lr': 0.00019925093965997151, 'samples': 1367168, 'steps': 2670, 'loss/train': 1.702850341796875} -09/20/2021 23:44:31 - INFO - __main__ - Step 42725: {'lr': 0.00019925093965997151, 'samples': 1367200, 'steps': 2670, 'loss/train': 1.8384140729904175} -09/20/2021 23:44:32 - INFO - __main__ - Step 42726: {'lr': 0.00019925093965997151, 'samples': 1367232, 'steps': 2670, 'loss/train': 3.3198368549346924} -09/20/2021 23:44:33 - INFO - __main__ - Step 42727: {'lr': 0.00019925093965997151, 'samples': 1367264, 'steps': 2670, 'loss/train': 0.2862876057624817} -09/20/2021 23:44:33 - INFO - __main__ - Step 42728: {'lr': 0.00019925093965997151, 'samples': 1367296, 'steps': 2670, 'loss/train': 0.20540514588356018} -09/20/2021 23:44:34 - INFO - __main__ - Step 42729: {'lr': 0.00019925093965997151, 'samples': 1367328, 'steps': 2670, 'loss/train': 1.695116639137268} -09/20/2021 23:44:35 - INFO - __main__ - Step 42730: {'lr': 0.00019925093965997151, 'samples': 1367360, 'steps': 2670, 'loss/train': 1.8009462356567383} -09/20/2021 23:44:36 - INFO - __main__ - Step 42731: {'lr': 0.00019925093965997151, 'samples': 1367392, 'steps': 2670, 'loss/train': 1.5811527967453003} -09/20/2021 23:44:36 - INFO - __main__ - Step 42732: {'lr': 0.00019925093965997151, 'samples': 1367424, 'steps': 2670, 'loss/train': 1.7012664079666138} -09/20/2021 23:44:37 - INFO - __main__ - Step 42733: {'lr': 0.00019925093965997151, 'samples': 1367456, 'steps': 2670, 'loss/train': 0.5477246046066284} -09/20/2021 23:44:38 - INFO - __main__ - Step 42734: {'lr': 0.00019925093965997151, 'samples': 1367488, 'steps': 2670, 'loss/train': 1.5744410753250122} -09/20/2021 23:44:39 - INFO - __main__ - Step 42735: {'lr': 0.00019925093965997151, 'samples': 1367520, 'steps': 2670, 'loss/train': 1.7177278995513916} -09/20/2021 23:44:39 - INFO - __main__ - Step 42736: {'lr': 0.00019925093965997151, 'samples': 1367552, 'steps': 2670, 'loss/train': 1.5332534313201904} -09/20/2021 23:44:40 - INFO - __main__ - Step 42737: {'lr': 0.00019925016016243813, 'samples': 1367584, 'steps': 2671, 'loss/train': 2.9014506340026855} -09/20/2021 23:44:41 - INFO - __main__ - Step 42738: {'lr': 0.00019925016016243813, 'samples': 1367616, 'steps': 2671, 'loss/train': 1.331935167312622} -09/20/2021 23:44:42 - INFO - __main__ - Step 42739: {'lr': 0.00019925016016243813, 'samples': 1367648, 'steps': 2671, 'loss/train': 0.5770506858825684} -09/20/2021 23:44:43 - INFO - __main__ - Step 42740: {'lr': 0.00019925016016243813, 'samples': 1367680, 'steps': 2671, 'loss/train': 1.9736828804016113} -09/20/2021 23:44:43 - INFO - __main__ - Step 42741: {'lr': 0.00019925016016243813, 'samples': 1367712, 'steps': 2671, 'loss/train': 2.3656156063079834} -09/20/2021 23:44:44 - INFO - __main__ - Step 42742: {'lr': 0.00019925016016243813, 'samples': 1367744, 'steps': 2671, 'loss/train': 2.2615976333618164} -09/20/2021 23:44:45 - INFO - __main__ - Step 42743: {'lr': 0.00019925016016243813, 'samples': 1367776, 'steps': 2671, 'loss/train': 2.431743621826172} -09/20/2021 23:44:46 - INFO - __main__ - Step 42744: {'lr': 0.00019925016016243813, 'samples': 1367808, 'steps': 2671, 'loss/train': 0.5255183577537537} -09/20/2021 23:44:46 - INFO - __main__ - Step 42745: {'lr': 0.00019925016016243813, 'samples': 1367840, 'steps': 2671, 'loss/train': 1.9648427963256836} -09/20/2021 23:44:47 - INFO - __main__ - Step 42746: {'lr': 0.00019925016016243813, 'samples': 1367872, 'steps': 2671, 'loss/train': 2.2725865840911865} -09/20/2021 23:44:48 - INFO - __main__ - Step 42747: {'lr': 0.00019925016016243813, 'samples': 1367904, 'steps': 2671, 'loss/train': 2.0669755935668945} -09/20/2021 23:44:49 - INFO - __main__ - Step 42748: {'lr': 0.00019925016016243813, 'samples': 1367936, 'steps': 2671, 'loss/train': 1.8696223497390747} -09/20/2021 23:44:49 - INFO - __main__ - Step 42749: {'lr': 0.00019925016016243813, 'samples': 1367968, 'steps': 2671, 'loss/train': 2.3409817218780518} -09/20/2021 23:44:50 - INFO - __main__ - Step 42750: {'lr': 0.00019925016016243813, 'samples': 1368000, 'steps': 2671, 'loss/train': 2.406505584716797} -09/20/2021 23:44:51 - INFO - __main__ - Step 42751: {'lr': 0.00019925016016243813, 'samples': 1368032, 'steps': 2671, 'loss/train': 1.7597843408584595} -09/20/2021 23:44:52 - INFO - __main__ - Step 42752: {'lr': 0.00019925016016243813, 'samples': 1368064, 'steps': 2671, 'loss/train': 2.314725399017334} -09/20/2021 23:44:52 - INFO - __main__ - Step 42753: {'lr': 0.00019924938026105623, 'samples': 1368096, 'steps': 2672, 'loss/train': 1.842078685760498} -09/20/2021 23:44:53 - INFO - __main__ - Step 42754: {'lr': 0.00019924938026105623, 'samples': 1368128, 'steps': 2672, 'loss/train': 1.8616724014282227} -09/20/2021 23:44:54 - INFO - __main__ - Step 42755: {'lr': 0.00019924938026105623, 'samples': 1368160, 'steps': 2672, 'loss/train': 1.504429578781128} -09/20/2021 23:44:55 - INFO - __main__ - Step 42756: {'lr': 0.00019924938026105623, 'samples': 1368192, 'steps': 2672, 'loss/train': 2.7781503200531006} -09/20/2021 23:44:56 - INFO - __main__ - Step 42757: {'lr': 0.00019924938026105623, 'samples': 1368224, 'steps': 2672, 'loss/train': 2.471926689147949} -09/20/2021 23:44:57 - INFO - __main__ - Step 42758: {'lr': 0.00019924938026105623, 'samples': 1368256, 'steps': 2672, 'loss/train': 2.3983678817749023} -09/20/2021 23:44:58 - INFO - __main__ - Step 42759: {'lr': 0.00019924938026105623, 'samples': 1368288, 'steps': 2672, 'loss/train': 4.491472244262695} -09/20/2021 23:44:58 - INFO - __main__ - Step 42760: {'lr': 0.00019924938026105623, 'samples': 1368320, 'steps': 2672, 'loss/train': 2.2562384605407715} -09/20/2021 23:44:59 - INFO - __main__ - Step 42761: {'lr': 0.00019924938026105623, 'samples': 1368352, 'steps': 2672, 'loss/train': 0.7073941230773926} -09/20/2021 23:45:00 - INFO - __main__ - Step 42762: {'lr': 0.00019924938026105623, 'samples': 1368384, 'steps': 2672, 'loss/train': 1.0266515016555786} -09/20/2021 23:45:01 - INFO - __main__ - Step 42763: {'lr': 0.00019924938026105623, 'samples': 1368416, 'steps': 2672, 'loss/train': 0.6759670376777649} -09/20/2021 23:45:01 - INFO - __main__ - Step 42764: {'lr': 0.00019924938026105623, 'samples': 1368448, 'steps': 2672, 'loss/train': 2.839303731918335} -09/20/2021 23:45:02 - INFO - __main__ - Step 42765: {'lr': 0.00019924938026105623, 'samples': 1368480, 'steps': 2672, 'loss/train': 2.2211766242980957} -09/20/2021 23:45:03 - INFO - __main__ - Step 42766: {'lr': 0.00019924938026105623, 'samples': 1368512, 'steps': 2672, 'loss/train': 2.9501516819000244} -09/20/2021 23:45:04 - INFO - __main__ - Step 42767: {'lr': 0.00019924938026105623, 'samples': 1368544, 'steps': 2672, 'loss/train': 1.2008945941925049} -09/20/2021 23:45:04 - INFO - __main__ - Step 42768: {'lr': 0.00019924938026105623, 'samples': 1368576, 'steps': 2672, 'loss/train': 1.449101209640503} -09/20/2021 23:45:05 - INFO - __main__ - Step 42769: {'lr': 0.000199248599955829, 'samples': 1368608, 'steps': 2673, 'loss/train': 2.7977993488311768} -09/20/2021 23:45:06 - INFO - __main__ - Step 42770: {'lr': 0.000199248599955829, 'samples': 1368640, 'steps': 2673, 'loss/train': 2.027771472930908} -09/20/2021 23:45:07 - INFO - __main__ - Step 42771: {'lr': 0.000199248599955829, 'samples': 1368672, 'steps': 2673, 'loss/train': 1.9361786842346191} -09/20/2021 23:45:07 - INFO - __main__ - Step 42772: {'lr': 0.000199248599955829, 'samples': 1368704, 'steps': 2673, 'loss/train': 2.007262706756592} -09/20/2021 23:45:08 - INFO - __main__ - Step 42773: {'lr': 0.000199248599955829, 'samples': 1368736, 'steps': 2673, 'loss/train': 2.2772159576416016} -09/20/2021 23:45:09 - INFO - __main__ - Step 42774: {'lr': 0.000199248599955829, 'samples': 1368768, 'steps': 2673, 'loss/train': 1.435824990272522} -09/20/2021 23:45:10 - INFO - __main__ - Step 42775: {'lr': 0.000199248599955829, 'samples': 1368800, 'steps': 2673, 'loss/train': 1.345996379852295} -09/20/2021 23:45:10 - INFO - __main__ - Step 42776: {'lr': 0.000199248599955829, 'samples': 1368832, 'steps': 2673, 'loss/train': 3.0141022205352783} -09/20/2021 23:45:11 - INFO - __main__ - Step 42777: {'lr': 0.000199248599955829, 'samples': 1368864, 'steps': 2673, 'loss/train': 2.3718302249908447} -09/20/2021 23:45:12 - INFO - __main__ - Step 42778: {'lr': 0.000199248599955829, 'samples': 1368896, 'steps': 2673, 'loss/train': 2.0442116260528564} -09/20/2021 23:45:13 - INFO - __main__ - Step 42779: {'lr': 0.000199248599955829, 'samples': 1368928, 'steps': 2673, 'loss/train': 2.64693021774292} -09/20/2021 23:45:13 - INFO - __main__ - Step 42780: {'lr': 0.000199248599955829, 'samples': 1368960, 'steps': 2673, 'loss/train': 2.0969362258911133} -09/20/2021 23:45:14 - INFO - __main__ - Step 42781: {'lr': 0.000199248599955829, 'samples': 1368992, 'steps': 2673, 'loss/train': 1.6844464540481567} -09/20/2021 23:45:15 - INFO - __main__ - Step 42782: {'lr': 0.000199248599955829, 'samples': 1369024, 'steps': 2673, 'loss/train': 1.3445791006088257} -09/20/2021 23:45:16 - INFO - __main__ - Step 42783: {'lr': 0.000199248599955829, 'samples': 1369056, 'steps': 2673, 'loss/train': 2.74202823638916} -09/20/2021 23:45:16 - INFO - __main__ - Step 42784: {'lr': 0.000199248599955829, 'samples': 1369088, 'steps': 2673, 'loss/train': 0.4973872900009155} -09/20/2021 23:45:17 - INFO - __main__ - Step 42785: {'lr': 0.00019924781924675962, 'samples': 1369120, 'steps': 2674, 'loss/train': 1.622215747833252} -09/20/2021 23:45:18 - INFO - __main__ - Step 42786: {'lr': 0.00019924781924675962, 'samples': 1369152, 'steps': 2674, 'loss/train': 2.3282177448272705} -09/20/2021 23:45:19 - INFO - __main__ - Step 42787: {'lr': 0.00019924781924675962, 'samples': 1369184, 'steps': 2674, 'loss/train': 1.9168246984481812} -09/20/2021 23:45:20 - INFO - __main__ - Step 42788: {'lr': 0.00019924781924675962, 'samples': 1369216, 'steps': 2674, 'loss/train': 2.384064197540283} -09/20/2021 23:45:20 - INFO - __main__ - Step 42789: {'lr': 0.00019924781924675962, 'samples': 1369248, 'steps': 2674, 'loss/train': 2.6338863372802734} -09/20/2021 23:45:22 - INFO - __main__ - Step 42790: {'lr': 0.00019924781924675962, 'samples': 1369280, 'steps': 2674, 'loss/train': 2.071660041809082} -09/20/2021 23:45:23 - INFO - __main__ - Step 42791: {'lr': 0.00019924781924675962, 'samples': 1369312, 'steps': 2674, 'loss/train': 2.4565436840057373} -09/20/2021 23:45:24 - INFO - __main__ - Step 42792: {'lr': 0.00019924781924675962, 'samples': 1369344, 'steps': 2674, 'loss/train': 1.4600766897201538} -09/20/2021 23:45:24 - INFO - __main__ - Step 42793: {'lr': 0.00019924781924675962, 'samples': 1369376, 'steps': 2674, 'loss/train': 1.600631833076477} -09/20/2021 23:45:25 - INFO - __main__ - Step 42794: {'lr': 0.00019924781924675962, 'samples': 1369408, 'steps': 2674, 'loss/train': 2.559948682785034} -09/20/2021 23:45:26 - INFO - __main__ - Step 42795: {'lr': 0.00019924781924675962, 'samples': 1369440, 'steps': 2674, 'loss/train': 1.9954904317855835} -09/20/2021 23:45:27 - INFO - __main__ - Step 42796: {'lr': 0.00019924781924675962, 'samples': 1369472, 'steps': 2674, 'loss/train': 2.0939207077026367} -09/20/2021 23:45:27 - INFO - __main__ - Step 42797: {'lr': 0.00019924781924675962, 'samples': 1369504, 'steps': 2674, 'loss/train': 2.2970330715179443} -09/20/2021 23:45:28 - INFO - __main__ - Step 42798: {'lr': 0.00019924781924675962, 'samples': 1369536, 'steps': 2674, 'loss/train': 3.242685317993164} -09/20/2021 23:45:29 - INFO - __main__ - Step 42799: {'lr': 0.00019924781924675962, 'samples': 1369568, 'steps': 2674, 'loss/train': 1.5563477277755737} -09/20/2021 23:45:30 - INFO - __main__ - Step 42800: {'lr': 0.00019924781924675962, 'samples': 1369600, 'steps': 2674, 'loss/train': 2.201475143432617} -09/20/2021 23:45:30 - INFO - __main__ - Step 42801: {'lr': 0.00019924703813385125, 'samples': 1369632, 'steps': 2675, 'loss/train': 2.288381338119507} -09/20/2021 23:45:31 - INFO - __main__ - Step 42802: {'lr': 0.00019924703813385125, 'samples': 1369664, 'steps': 2675, 'loss/train': 2.1111550331115723} -09/20/2021 23:45:32 - INFO - __main__ - Step 42803: {'lr': 0.00019924703813385125, 'samples': 1369696, 'steps': 2675, 'loss/train': 1.8791756629943848} -09/20/2021 23:45:33 - INFO - __main__ - Step 42804: {'lr': 0.00019924703813385125, 'samples': 1369728, 'steps': 2675, 'loss/train': 0.5628440976142883} -09/20/2021 23:45:33 - INFO - __main__ - Step 42805: {'lr': 0.00019924703813385125, 'samples': 1369760, 'steps': 2675, 'loss/train': 1.5895795822143555} -09/20/2021 23:45:34 - INFO - __main__ - Step 42806: {'lr': 0.00019924703813385125, 'samples': 1369792, 'steps': 2675, 'loss/train': 1.7603100538253784} -09/20/2021 23:45:35 - INFO - __main__ - Step 42807: {'lr': 0.00019924703813385125, 'samples': 1369824, 'steps': 2675, 'loss/train': 1.861014723777771} -09/20/2021 23:45:36 - INFO - __main__ - Step 42808: {'lr': 0.00019924703813385125, 'samples': 1369856, 'steps': 2675, 'loss/train': 2.549633502960205} -09/20/2021 23:45:36 - INFO - __main__ - Step 42809: {'lr': 0.00019924703813385125, 'samples': 1369888, 'steps': 2675, 'loss/train': 1.372705340385437} -09/20/2021 23:45:37 - INFO - __main__ - Step 42810: {'lr': 0.00019924703813385125, 'samples': 1369920, 'steps': 2675, 'loss/train': 2.1174066066741943} -09/20/2021 23:45:38 - INFO - __main__ - Step 42811: {'lr': 0.00019924703813385125, 'samples': 1369952, 'steps': 2675, 'loss/train': 2.070510149002075} -09/20/2021 23:45:39 - INFO - __main__ - Step 42812: {'lr': 0.00019924703813385125, 'samples': 1369984, 'steps': 2675, 'loss/train': 0.6398164629936218} -09/20/2021 23:45:39 - INFO - __main__ - Step 42813: {'lr': 0.00019924703813385125, 'samples': 1370016, 'steps': 2675, 'loss/train': 1.3917346000671387} -09/20/2021 23:45:40 - INFO - __main__ - Step 42814: {'lr': 0.00019924703813385125, 'samples': 1370048, 'steps': 2675, 'loss/train': 1.4328235387802124} -09/20/2021 23:45:41 - INFO - __main__ - Step 42815: {'lr': 0.00019924703813385125, 'samples': 1370080, 'steps': 2675, 'loss/train': 2.6846792697906494} -09/20/2021 23:45:42 - INFO - __main__ - Step 42816: {'lr': 0.00019924703813385125, 'samples': 1370112, 'steps': 2675, 'loss/train': 2.07539439201355} -09/20/2021 23:45:43 - INFO - __main__ - Step 42817: {'lr': 0.00019924625661710702, 'samples': 1370144, 'steps': 2676, 'loss/train': 2.02008056640625} -09/20/2021 23:45:43 - INFO - __main__ - Step 42818: {'lr': 0.00019924625661710702, 'samples': 1370176, 'steps': 2676, 'loss/train': 1.961094617843628} -09/20/2021 23:45:44 - INFO - __main__ - Step 42819: {'lr': 0.00019924625661710702, 'samples': 1370208, 'steps': 2676, 'loss/train': 2.7709248065948486} -09/20/2021 23:45:46 - INFO - __main__ - Step 42820: {'lr': 0.00019924625661710702, 'samples': 1370240, 'steps': 2676, 'loss/train': 1.7736624479293823} -09/20/2021 23:45:46 - INFO - __main__ - Step 42821: {'lr': 0.00019924625661710702, 'samples': 1370272, 'steps': 2676, 'loss/train': 1.6499847173690796} -09/20/2021 23:45:47 - INFO - __main__ - Step 42822: {'lr': 0.00019924625661710702, 'samples': 1370304, 'steps': 2676, 'loss/train': 1.8059087991714478} -09/20/2021 23:45:48 - INFO - __main__ - Step 42823: {'lr': 0.00019924625661710702, 'samples': 1370336, 'steps': 2676, 'loss/train': 2.0722620487213135} -09/20/2021 23:45:49 - INFO - __main__ - Step 42824: {'lr': 0.00019924625661710702, 'samples': 1370368, 'steps': 2676, 'loss/train': 1.7504198551177979} -09/20/2021 23:45:49 - INFO - __main__ - Step 42825: {'lr': 0.00019924625661710702, 'samples': 1370400, 'steps': 2676, 'loss/train': 1.8767033815383911} -09/20/2021 23:45:50 - INFO - __main__ - Step 42826: {'lr': 0.00019924625661710702, 'samples': 1370432, 'steps': 2676, 'loss/train': 2.2058892250061035} -09/20/2021 23:45:51 - INFO - __main__ - Step 42827: {'lr': 0.00019924625661710702, 'samples': 1370464, 'steps': 2676, 'loss/train': 2.6532156467437744} -09/20/2021 23:45:52 - INFO - __main__ - Step 42828: {'lr': 0.00019924625661710702, 'samples': 1370496, 'steps': 2676, 'loss/train': 1.7240411043167114} -09/20/2021 23:45:52 - INFO - __main__ - Step 42829: {'lr': 0.00019924625661710702, 'samples': 1370528, 'steps': 2676, 'loss/train': 1.4993950128555298} -09/20/2021 23:45:53 - INFO - __main__ - Step 42830: {'lr': 0.00019924625661710702, 'samples': 1370560, 'steps': 2676, 'loss/train': 3.2802093029022217} -09/20/2021 23:45:54 - INFO - __main__ - Step 42831: {'lr': 0.00019924625661710702, 'samples': 1370592, 'steps': 2676, 'loss/train': 1.9163825511932373} -09/20/2021 23:45:55 - INFO - __main__ - Step 42832: {'lr': 0.00019924625661710702, 'samples': 1370624, 'steps': 2676, 'loss/train': 2.582423210144043} -09/20/2021 23:45:55 - INFO - __main__ - Step 42833: {'lr': 0.0001992454746965302, 'samples': 1370656, 'steps': 2677, 'loss/train': 1.5662245750427246} -09/20/2021 23:45:56 - INFO - __main__ - Step 42834: {'lr': 0.0001992454746965302, 'samples': 1370688, 'steps': 2677, 'loss/train': 2.329376220703125} -09/20/2021 23:45:57 - INFO - __main__ - Step 42835: {'lr': 0.0001992454746965302, 'samples': 1370720, 'steps': 2677, 'loss/train': 2.570460081100464} -09/20/2021 23:45:58 - INFO - __main__ - Step 42836: {'lr': 0.0001992454746965302, 'samples': 1370752, 'steps': 2677, 'loss/train': 2.687472343444824} -09/20/2021 23:45:58 - INFO - __main__ - Step 42837: {'lr': 0.0001992454746965302, 'samples': 1370784, 'steps': 2677, 'loss/train': 2.734835386276245} -09/20/2021 23:45:59 - INFO - __main__ - Step 42838: {'lr': 0.0001992454746965302, 'samples': 1370816, 'steps': 2677, 'loss/train': 2.5424375534057617} -09/20/2021 23:46:00 - INFO - __main__ - Step 42839: {'lr': 0.0001992454746965302, 'samples': 1370848, 'steps': 2677, 'loss/train': 1.756474256515503} -09/20/2021 23:46:01 - INFO - __main__ - Step 42840: {'lr': 0.0001992454746965302, 'samples': 1370880, 'steps': 2677, 'loss/train': 2.571298837661743} -09/20/2021 23:46:01 - INFO - __main__ - Step 42841: {'lr': 0.0001992454746965302, 'samples': 1370912, 'steps': 2677, 'loss/train': 1.4987941980361938} -09/20/2021 23:46:02 - INFO - __main__ - Step 42842: {'lr': 0.0001992454746965302, 'samples': 1370944, 'steps': 2677, 'loss/train': 2.396888494491577} -09/20/2021 23:46:03 - INFO - __main__ - Step 42843: {'lr': 0.0001992454746965302, 'samples': 1370976, 'steps': 2677, 'loss/train': 2.149928092956543} -09/20/2021 23:46:04 - INFO - __main__ - Step 42844: {'lr': 0.0001992454746965302, 'samples': 1371008, 'steps': 2677, 'loss/train': 2.2177939414978027} -09/20/2021 23:46:04 - INFO - __main__ - Step 42845: {'lr': 0.0001992454746965302, 'samples': 1371040, 'steps': 2677, 'loss/train': 2.580010175704956} -09/20/2021 23:46:05 - INFO - __main__ - Step 42846: {'lr': 0.0001992454746965302, 'samples': 1371072, 'steps': 2677, 'loss/train': 2.2906155586242676} -09/20/2021 23:46:06 - INFO - __main__ - Step 42847: {'lr': 0.0001992454746965302, 'samples': 1371104, 'steps': 2677, 'loss/train': 1.6563445329666138} -09/20/2021 23:46:07 - INFO - __main__ - Step 42848: {'lr': 0.0001992454746965302, 'samples': 1371136, 'steps': 2677, 'loss/train': 2.3778109550476074} -09/20/2021 23:46:08 - INFO - __main__ - Step 42849: {'lr': 0.0001992446923721239, 'samples': 1371168, 'steps': 2678, 'loss/train': 2.2755727767944336} -09/20/2021 23:46:08 - INFO - __main__ - Step 42850: {'lr': 0.0001992446923721239, 'samples': 1371200, 'steps': 2678, 'loss/train': 1.6030144691467285} -09/20/2021 23:46:09 - INFO - __main__ - Step 42851: {'lr': 0.0001992446923721239, 'samples': 1371232, 'steps': 2678, 'loss/train': 2.9079933166503906} -09/20/2021 23:46:10 - INFO - __main__ - Step 42852: {'lr': 0.0001992446923721239, 'samples': 1371264, 'steps': 2678, 'loss/train': 1.4810761213302612} -09/20/2021 23:46:11 - INFO - __main__ - Step 42853: {'lr': 0.0001992446923721239, 'samples': 1371296, 'steps': 2678, 'loss/train': 1.5473122596740723} -09/20/2021 23:46:12 - INFO - __main__ - Step 42854: {'lr': 0.0001992446923721239, 'samples': 1371328, 'steps': 2678, 'loss/train': 1.428987741470337} -09/20/2021 23:46:13 - INFO - __main__ - Step 42855: {'lr': 0.0001992446923721239, 'samples': 1371360, 'steps': 2678, 'loss/train': 1.965053677558899} -09/20/2021 23:46:13 - INFO - __main__ - Step 42856: {'lr': 0.0001992446923721239, 'samples': 1371392, 'steps': 2678, 'loss/train': 2.125157356262207} -09/20/2021 23:46:14 - INFO - __main__ - Step 42857: {'lr': 0.0001992446923721239, 'samples': 1371424, 'steps': 2678, 'loss/train': 2.4954264163970947} -09/20/2021 23:46:15 - INFO - __main__ - Step 42858: {'lr': 0.0001992446923721239, 'samples': 1371456, 'steps': 2678, 'loss/train': 2.089538812637329} -09/20/2021 23:46:16 - INFO - __main__ - Step 42859: {'lr': 0.0001992446923721239, 'samples': 1371488, 'steps': 2678, 'loss/train': 2.0138306617736816} -09/20/2021 23:46:16 - INFO - __main__ - Step 42860: {'lr': 0.0001992446923721239, 'samples': 1371520, 'steps': 2678, 'loss/train': 1.716675877571106} -09/20/2021 23:46:17 - INFO - __main__ - Step 42861: {'lr': 0.0001992446923721239, 'samples': 1371552, 'steps': 2678, 'loss/train': 1.8045918941497803} -09/20/2021 23:46:18 - INFO - __main__ - Step 42862: {'lr': 0.0001992446923721239, 'samples': 1371584, 'steps': 2678, 'loss/train': 2.553759813308716} -09/20/2021 23:46:19 - INFO - __main__ - Step 42863: {'lr': 0.0001992446923721239, 'samples': 1371616, 'steps': 2678, 'loss/train': 2.3013670444488525} -09/20/2021 23:46:19 - INFO - __main__ - Step 42864: {'lr': 0.0001992446923721239, 'samples': 1371648, 'steps': 2678, 'loss/train': 2.20217227935791} -09/20/2021 23:46:20 - INFO - __main__ - Step 42865: {'lr': 0.00019924390964389134, 'samples': 1371680, 'steps': 2679, 'loss/train': 0.24410441517829895} -09/20/2021 23:46:21 - INFO - __main__ - Step 42866: {'lr': 0.00019924390964389134, 'samples': 1371712, 'steps': 2679, 'loss/train': 0.2682943344116211} -09/20/2021 23:46:22 - INFO - __main__ - Step 42867: {'lr': 0.00019924390964389134, 'samples': 1371744, 'steps': 2679, 'loss/train': 0.19743597507476807} -09/20/2021 23:46:23 - INFO - __main__ - Step 42868: {'lr': 0.00019924390964389134, 'samples': 1371776, 'steps': 2679, 'loss/train': 2.3105783462524414} -09/20/2021 23:46:23 - INFO - __main__ - Step 42869: {'lr': 0.00019924390964389134, 'samples': 1371808, 'steps': 2679, 'loss/train': 1.7382334470748901} -09/20/2021 23:46:24 - INFO - __main__ - Step 42870: {'lr': 0.00019924390964389134, 'samples': 1371840, 'steps': 2679, 'loss/train': 2.679351568222046} -09/20/2021 23:46:25 - INFO - __main__ - Step 42871: {'lr': 0.00019924390964389134, 'samples': 1371872, 'steps': 2679, 'loss/train': 2.559997081756592} -09/20/2021 23:46:26 - INFO - __main__ - Step 42872: {'lr': 0.00019924390964389134, 'samples': 1371904, 'steps': 2679, 'loss/train': 2.0403473377227783} -09/20/2021 23:46:26 - INFO - __main__ - Step 42873: {'lr': 0.00019924390964389134, 'samples': 1371936, 'steps': 2679, 'loss/train': 1.4145692586898804} -09/20/2021 23:46:27 - INFO - __main__ - Step 42874: {'lr': 0.00019924390964389134, 'samples': 1371968, 'steps': 2679, 'loss/train': 1.766584873199463} -09/20/2021 23:46:28 - INFO - __main__ - Step 42875: {'lr': 0.00019924390964389134, 'samples': 1372000, 'steps': 2679, 'loss/train': 1.9442609548568726} -09/20/2021 23:46:29 - INFO - __main__ - Step 42876: {'lr': 0.00019924390964389134, 'samples': 1372032, 'steps': 2679, 'loss/train': 1.4690520763397217} -09/20/2021 23:46:29 - INFO - __main__ - Step 42877: {'lr': 0.00019924390964389134, 'samples': 1372064, 'steps': 2679, 'loss/train': 2.2109057903289795} -09/20/2021 23:46:30 - INFO - __main__ - Step 42878: {'lr': 0.00019924390964389134, 'samples': 1372096, 'steps': 2679, 'loss/train': 1.319527268409729} -09/20/2021 23:46:31 - INFO - __main__ - Step 42879: {'lr': 0.00019924390964389134, 'samples': 1372128, 'steps': 2679, 'loss/train': 2.6724071502685547} -09/20/2021 23:46:32 - INFO - __main__ - Step 42880: {'lr': 0.00019924390964389134, 'samples': 1372160, 'steps': 2679, 'loss/train': 2.399261474609375} -09/20/2021 23:46:32 - INFO - __main__ - Step 42881: {'lr': 0.00019924312651183572, 'samples': 1372192, 'steps': 2680, 'loss/train': 2.219407320022583} -09/20/2021 23:46:33 - INFO - __main__ - Step 42882: {'lr': 0.00019924312651183572, 'samples': 1372224, 'steps': 2680, 'loss/train': 2.222628355026245} -09/20/2021 23:46:34 - INFO - __main__ - Step 42883: {'lr': 0.00019924312651183572, 'samples': 1372256, 'steps': 2680, 'loss/train': 1.8512052297592163} -09/20/2021 23:46:35 - INFO - __main__ - Step 42884: {'lr': 0.00019924312651183572, 'samples': 1372288, 'steps': 2680, 'loss/train': 1.6151056289672852} -09/20/2021 23:46:36 - INFO - __main__ - Step 42885: {'lr': 0.00019924312651183572, 'samples': 1372320, 'steps': 2680, 'loss/train': 1.5722367763519287} -09/20/2021 23:46:37 - INFO - __main__ - Step 42886: {'lr': 0.00019924312651183572, 'samples': 1372352, 'steps': 2680, 'loss/train': 1.6830276250839233} -09/20/2021 23:46:38 - INFO - __main__ - Step 42887: {'lr': 0.00019924312651183572, 'samples': 1372384, 'steps': 2680, 'loss/train': 1.756553053855896} -09/20/2021 23:46:38 - INFO - __main__ - Step 42888: {'lr': 0.00019924312651183572, 'samples': 1372416, 'steps': 2680, 'loss/train': 3.0117368698120117} -09/20/2021 23:46:39 - INFO - __main__ - Step 42889: {'lr': 0.00019924312651183572, 'samples': 1372448, 'steps': 2680, 'loss/train': 1.842755675315857} -09/20/2021 23:46:40 - INFO - __main__ - Step 42890: {'lr': 0.00019924312651183572, 'samples': 1372480, 'steps': 2680, 'loss/train': 0.9533494114875793} -09/20/2021 23:46:41 - INFO - __main__ - Step 42891: {'lr': 0.00019924312651183572, 'samples': 1372512, 'steps': 2680, 'loss/train': 2.5505359172821045} -09/20/2021 23:46:41 - INFO - __main__ - Step 42892: {'lr': 0.00019924312651183572, 'samples': 1372544, 'steps': 2680, 'loss/train': 2.4170119762420654} -09/20/2021 23:46:42 - INFO - __main__ - Step 42893: {'lr': 0.00019924312651183572, 'samples': 1372576, 'steps': 2680, 'loss/train': 2.3202919960021973} -09/20/2021 23:46:43 - INFO - __main__ - Step 42894: {'lr': 0.00019924312651183572, 'samples': 1372608, 'steps': 2680, 'loss/train': 0.4470170736312866} -09/20/2021 23:46:44 - INFO - __main__ - Step 42895: {'lr': 0.00019924312651183572, 'samples': 1372640, 'steps': 2680, 'loss/train': 2.1375491619110107} -09/20/2021 23:46:44 - INFO - __main__ - Step 42896: {'lr': 0.00019924312651183572, 'samples': 1372672, 'steps': 2680, 'loss/train': 1.8901736736297607} -09/20/2021 23:46:45 - INFO - __main__ - Step 42897: {'lr': 0.0001992423429759602, 'samples': 1372704, 'steps': 2681, 'loss/train': 0.6301231980323792} -09/20/2021 23:46:46 - INFO - __main__ - Step 42898: {'lr': 0.0001992423429759602, 'samples': 1372736, 'steps': 2681, 'loss/train': 0.5890215635299683} -09/20/2021 23:46:47 - INFO - __main__ - Step 42899: {'lr': 0.0001992423429759602, 'samples': 1372768, 'steps': 2681, 'loss/train': 0.7212051153182983} -09/20/2021 23:46:47 - INFO - __main__ - Step 42900: {'lr': 0.0001992423429759602, 'samples': 1372800, 'steps': 2681, 'loss/train': 0.7405229210853577} -09/20/2021 23:46:48 - INFO - __main__ - Step 42901: {'lr': 0.0001992423429759602, 'samples': 1372832, 'steps': 2681, 'loss/train': 0.671291172504425} -09/20/2021 23:46:49 - INFO - __main__ - Step 42902: {'lr': 0.0001992423429759602, 'samples': 1372864, 'steps': 2681, 'loss/train': 1.4900107383728027} -09/20/2021 23:46:50 - INFO - __main__ - Step 42903: {'lr': 0.0001992423429759602, 'samples': 1372896, 'steps': 2681, 'loss/train': 1.8682034015655518} -09/20/2021 23:46:50 - INFO - __main__ - Step 42904: {'lr': 0.0001992423429759602, 'samples': 1372928, 'steps': 2681, 'loss/train': 2.59904146194458} -09/20/2021 23:46:51 - INFO - __main__ - Step 42905: {'lr': 0.0001992423429759602, 'samples': 1372960, 'steps': 2681, 'loss/train': 0.7331857681274414} -09/20/2021 23:46:52 - INFO - __main__ - Step 42906: {'lr': 0.0001992423429759602, 'samples': 1372992, 'steps': 2681, 'loss/train': 0.6291201114654541} -09/20/2021 23:46:53 - INFO - __main__ - Step 42907: {'lr': 0.0001992423429759602, 'samples': 1373024, 'steps': 2681, 'loss/train': 2.6793577671051025} -09/20/2021 23:46:53 - INFO - __main__ - Step 42908: {'lr': 0.0001992423429759602, 'samples': 1373056, 'steps': 2681, 'loss/train': 0.7770540118217468} -09/20/2021 23:46:54 - INFO - __main__ - Step 42909: {'lr': 0.0001992423429759602, 'samples': 1373088, 'steps': 2681, 'loss/train': 2.1866614818573} -09/20/2021 23:46:55 - INFO - __main__ - Step 42910: {'lr': 0.0001992423429759602, 'samples': 1373120, 'steps': 2681, 'loss/train': 1.7833431959152222} -09/20/2021 23:46:56 - INFO - __main__ - Step 42911: {'lr': 0.0001992423429759602, 'samples': 1373152, 'steps': 2681, 'loss/train': 2.1445014476776123} -09/20/2021 23:46:56 - INFO - __main__ - Step 42912: {'lr': 0.0001992423429759602, 'samples': 1373184, 'steps': 2681, 'loss/train': 1.4646508693695068} -09/20/2021 23:46:57 - INFO - __main__ - Step 42913: {'lr': 0.00019924155903626795, 'samples': 1373216, 'steps': 2682, 'loss/train': 2.804987907409668} -09/20/2021 23:46:58 - INFO - __main__ - Step 42914: {'lr': 0.00019924155903626795, 'samples': 1373248, 'steps': 2682, 'loss/train': 2.2277519702911377} -09/20/2021 23:46:59 - INFO - __main__ - Step 42915: {'lr': 0.00019924155903626795, 'samples': 1373280, 'steps': 2682, 'loss/train': 1.784956455230713} -09/20/2021 23:47:00 - INFO - __main__ - Step 42916: {'lr': 0.00019924155903626795, 'samples': 1373312, 'steps': 2682, 'loss/train': 2.090400457382202} -09/20/2021 23:47:00 - INFO - __main__ - Step 42917: {'lr': 0.00019924155903626795, 'samples': 1373344, 'steps': 2682, 'loss/train': 2.00718355178833} -09/20/2021 23:47:02 - INFO - __main__ - Step 42918: {'lr': 0.00019924155903626795, 'samples': 1373376, 'steps': 2682, 'loss/train': 2.02858829498291} -09/20/2021 23:47:02 - INFO - __main__ - Step 42919: {'lr': 0.00019924155903626795, 'samples': 1373408, 'steps': 2682, 'loss/train': 1.451100468635559} -09/20/2021 23:47:03 - INFO - __main__ - Step 42920: {'lr': 0.00019924155903626795, 'samples': 1373440, 'steps': 2682, 'loss/train': 2.5144994258880615} -09/20/2021 23:47:04 - INFO - __main__ - Step 42921: {'lr': 0.00019924155903626795, 'samples': 1373472, 'steps': 2682, 'loss/train': 2.2396764755249023} -09/20/2021 23:47:05 - INFO - __main__ - Step 42922: {'lr': 0.00019924155903626795, 'samples': 1373504, 'steps': 2682, 'loss/train': 2.4529926776885986} -09/20/2021 23:47:05 - INFO - __main__ - Step 42923: {'lr': 0.00019924155903626795, 'samples': 1373536, 'steps': 2682, 'loss/train': 2.3838038444519043} -09/20/2021 23:47:06 - INFO - __main__ - Step 42924: {'lr': 0.00019924155903626795, 'samples': 1373568, 'steps': 2682, 'loss/train': 2.3404698371887207} -09/20/2021 23:47:07 - INFO - __main__ - Step 42925: {'lr': 0.00019924155903626795, 'samples': 1373600, 'steps': 2682, 'loss/train': 1.2988970279693604} -09/20/2021 23:47:08 - INFO - __main__ - Step 42926: {'lr': 0.00019924155903626795, 'samples': 1373632, 'steps': 2682, 'loss/train': 1.9523903131484985} -09/20/2021 23:47:08 - INFO - __main__ - Step 42927: {'lr': 0.00019924155903626795, 'samples': 1373664, 'steps': 2682, 'loss/train': 1.9357643127441406} -09/20/2021 23:47:09 - INFO - __main__ - Step 42928: {'lr': 0.00019924155903626795, 'samples': 1373696, 'steps': 2682, 'loss/train': 1.0410319566726685} -09/20/2021 23:47:10 - INFO - __main__ - Step 42929: {'lr': 0.00019924077469276222, 'samples': 1373728, 'steps': 2683, 'loss/train': 1.4779493808746338} -09/20/2021 23:47:11 - INFO - __main__ - Step 42930: {'lr': 0.00019924077469276222, 'samples': 1373760, 'steps': 2683, 'loss/train': 2.146872043609619} -09/20/2021 23:47:12 - INFO - __main__ - Step 42931: {'lr': 0.00019924077469276222, 'samples': 1373792, 'steps': 2683, 'loss/train': 1.9472734928131104} -09/20/2021 23:47:12 - INFO - __main__ - Step 42932: {'lr': 0.00019924077469276222, 'samples': 1373824, 'steps': 2683, 'loss/train': 2.2533884048461914} -09/20/2021 23:47:13 - INFO - __main__ - Step 42933: {'lr': 0.00019924077469276222, 'samples': 1373856, 'steps': 2683, 'loss/train': 1.8868452310562134} -09/20/2021 23:47:14 - INFO - __main__ - Step 42934: {'lr': 0.00019924077469276222, 'samples': 1373888, 'steps': 2683, 'loss/train': 1.797034740447998} -09/20/2021 23:47:15 - INFO - __main__ - Step 42935: {'lr': 0.00019924077469276222, 'samples': 1373920, 'steps': 2683, 'loss/train': 3.265096664428711} -09/20/2021 23:47:15 - INFO - __main__ - Step 42936: {'lr': 0.00019924077469276222, 'samples': 1373952, 'steps': 2683, 'loss/train': 3.2510199546813965} -09/20/2021 23:47:16 - INFO - __main__ - Step 42937: {'lr': 0.00019924077469276222, 'samples': 1373984, 'steps': 2683, 'loss/train': 2.927551031112671} -09/20/2021 23:47:17 - INFO - __main__ - Step 42938: {'lr': 0.00019924077469276222, 'samples': 1374016, 'steps': 2683, 'loss/train': 3.4584712982177734} -09/20/2021 23:47:18 - INFO - __main__ - Step 42939: {'lr': 0.00019924077469276222, 'samples': 1374048, 'steps': 2683, 'loss/train': 4.198868751525879} -09/20/2021 23:47:18 - INFO - __main__ - Step 42940: {'lr': 0.00019924077469276222, 'samples': 1374080, 'steps': 2683, 'loss/train': 1.6771347522735596} -09/20/2021 23:47:19 - INFO - __main__ - Step 42941: {'lr': 0.00019924077469276222, 'samples': 1374112, 'steps': 2683, 'loss/train': 1.659489631652832} -09/20/2021 23:47:20 - INFO - __main__ - Step 42942: {'lr': 0.00019924077469276222, 'samples': 1374144, 'steps': 2683, 'loss/train': 2.056607246398926} -09/20/2021 23:47:21 - INFO - __main__ - Step 42943: {'lr': 0.00019924077469276222, 'samples': 1374176, 'steps': 2683, 'loss/train': 2.976196765899658} -09/20/2021 23:47:21 - INFO - __main__ - Step 42944: {'lr': 0.00019924077469276222, 'samples': 1374208, 'steps': 2683, 'loss/train': 1.8893098831176758} -09/20/2021 23:47:22 - INFO - __main__ - Step 42945: {'lr': 0.0001992399899454461, 'samples': 1374240, 'steps': 2684, 'loss/train': 2.1354031562805176} -09/20/2021 23:47:23 - INFO - __main__ - Step 42946: {'lr': 0.0001992399899454461, 'samples': 1374272, 'steps': 2684, 'loss/train': 2.357494354248047} -09/20/2021 23:47:24 - INFO - __main__ - Step 42947: {'lr': 0.0001992399899454461, 'samples': 1374304, 'steps': 2684, 'loss/train': 2.3059277534484863} -09/20/2021 23:47:25 - INFO - __main__ - Step 42948: {'lr': 0.0001992399899454461, 'samples': 1374336, 'steps': 2684, 'loss/train': 2.2010622024536133} -09/20/2021 23:47:25 - INFO - __main__ - Step 42949: {'lr': 0.0001992399899454461, 'samples': 1374368, 'steps': 2684, 'loss/train': 1.184771180152893} -09/20/2021 23:47:26 - INFO - __main__ - Step 42950: {'lr': 0.0001992399899454461, 'samples': 1374400, 'steps': 2684, 'loss/train': 2.146552324295044} -09/20/2021 23:47:27 - INFO - __main__ - Step 42951: {'lr': 0.0001992399899454461, 'samples': 1374432, 'steps': 2684, 'loss/train': 2.333636522293091} -09/20/2021 23:47:28 - INFO - __main__ - Step 42952: {'lr': 0.0001992399899454461, 'samples': 1374464, 'steps': 2684, 'loss/train': 2.446927785873413} -09/20/2021 23:47:29 - INFO - __main__ - Step 42953: {'lr': 0.0001992399899454461, 'samples': 1374496, 'steps': 2684, 'loss/train': 1.877599835395813} -09/20/2021 23:47:30 - INFO - __main__ - Step 42954: {'lr': 0.0001992399899454461, 'samples': 1374528, 'steps': 2684, 'loss/train': 2.405917167663574} -09/20/2021 23:47:30 - INFO - __main__ - Step 42955: {'lr': 0.0001992399899454461, 'samples': 1374560, 'steps': 2684, 'loss/train': 2.5862348079681396} -09/20/2021 23:47:31 - INFO - __main__ - Step 42956: {'lr': 0.0001992399899454461, 'samples': 1374592, 'steps': 2684, 'loss/train': 0.2967073619365692} -09/20/2021 23:47:32 - INFO - __main__ - Step 42957: {'lr': 0.0001992399899454461, 'samples': 1374624, 'steps': 2684, 'loss/train': 1.3203274011611938} -09/20/2021 23:47:33 - INFO - __main__ - Step 42958: {'lr': 0.0001992399899454461, 'samples': 1374656, 'steps': 2684, 'loss/train': 2.045348644256592} -09/20/2021 23:47:33 - INFO - __main__ - Step 42959: {'lr': 0.0001992399899454461, 'samples': 1374688, 'steps': 2684, 'loss/train': 2.2617712020874023} -09/20/2021 23:47:34 - INFO - __main__ - Step 42960: {'lr': 0.0001992399899454461, 'samples': 1374720, 'steps': 2684, 'loss/train': 2.5582363605499268} -09/20/2021 23:47:35 - INFO - __main__ - Step 42961: {'lr': 0.00019923920479432287, 'samples': 1374752, 'steps': 2685, 'loss/train': 1.9919133186340332} -09/20/2021 23:47:36 - INFO - __main__ - Step 42962: {'lr': 0.00019923920479432287, 'samples': 1374784, 'steps': 2685, 'loss/train': 1.6254528760910034} -09/20/2021 23:47:36 - INFO - __main__ - Step 42963: {'lr': 0.00019923920479432287, 'samples': 1374816, 'steps': 2685, 'loss/train': 2.0850353240966797} -09/20/2021 23:47:37 - INFO - __main__ - Step 42964: {'lr': 0.00019923920479432287, 'samples': 1374848, 'steps': 2685, 'loss/train': 0.8025282025337219} -09/20/2021 23:47:38 - INFO - __main__ - Step 42965: {'lr': 0.00019923920479432287, 'samples': 1374880, 'steps': 2685, 'loss/train': 2.6784207820892334} -09/20/2021 23:47:39 - INFO - __main__ - Step 42966: {'lr': 0.00019923920479432287, 'samples': 1374912, 'steps': 2685, 'loss/train': 1.7833356857299805} -09/20/2021 23:47:39 - INFO - __main__ - Step 42967: {'lr': 0.00019923920479432287, 'samples': 1374944, 'steps': 2685, 'loss/train': 1.701821208000183} -09/20/2021 23:47:40 - INFO - __main__ - Step 42968: {'lr': 0.00019923920479432287, 'samples': 1374976, 'steps': 2685, 'loss/train': 2.0913279056549072} -09/20/2021 23:47:41 - INFO - __main__ - Step 42969: {'lr': 0.00019923920479432287, 'samples': 1375008, 'steps': 2685, 'loss/train': 3.247955560684204} -09/20/2021 23:47:42 - INFO - __main__ - Step 42970: {'lr': 0.00019923920479432287, 'samples': 1375040, 'steps': 2685, 'loss/train': 2.341618299484253} -09/20/2021 23:47:42 - INFO - __main__ - Step 42971: {'lr': 0.00019923920479432287, 'samples': 1375072, 'steps': 2685, 'loss/train': 2.497004270553589} -09/20/2021 23:47:43 - INFO - __main__ - Step 42972: {'lr': 0.00019923920479432287, 'samples': 1375104, 'steps': 2685, 'loss/train': 2.539675235748291} -09/20/2021 23:47:44 - INFO - __main__ - Step 42973: {'lr': 0.00019923920479432287, 'samples': 1375136, 'steps': 2685, 'loss/train': 2.3016977310180664} -09/20/2021 23:47:45 - INFO - __main__ - Step 42974: {'lr': 0.00019923920479432287, 'samples': 1375168, 'steps': 2685, 'loss/train': 2.290383815765381} -09/20/2021 23:47:45 - INFO - __main__ - Step 42975: {'lr': 0.00019923920479432287, 'samples': 1375200, 'steps': 2685, 'loss/train': 1.769402027130127} -09/20/2021 23:47:46 - INFO - __main__ - Step 42976: {'lr': 0.00019923920479432287, 'samples': 1375232, 'steps': 2685, 'loss/train': 1.3493165969848633} -09/20/2021 23:47:47 - INFO - __main__ - Step 42977: {'lr': 0.00019923841923939571, 'samples': 1375264, 'steps': 2686, 'loss/train': 1.7148505449295044} -09/20/2021 23:47:48 - INFO - __main__ - Step 42978: {'lr': 0.00019923841923939571, 'samples': 1375296, 'steps': 2686, 'loss/train': 2.284838914871216} -09/20/2021 23:47:49 - INFO - __main__ - Step 42979: {'lr': 0.00019923841923939571, 'samples': 1375328, 'steps': 2686, 'loss/train': 2.352456569671631} -09/20/2021 23:47:49 - INFO - __main__ - Step 42980: {'lr': 0.00019923841923939571, 'samples': 1375360, 'steps': 2686, 'loss/train': 2.2809040546417236} -09/20/2021 23:47:50 - INFO - __main__ - Step 42981: {'lr': 0.00019923841923939571, 'samples': 1375392, 'steps': 2686, 'loss/train': 2.2883548736572266} -09/20/2021 23:47:51 - INFO - __main__ - Step 42982: {'lr': 0.00019923841923939571, 'samples': 1375424, 'steps': 2686, 'loss/train': 2.5184569358825684} -09/20/2021 23:47:52 - INFO - __main__ - Step 42983: {'lr': 0.00019923841923939571, 'samples': 1375456, 'steps': 2686, 'loss/train': 0.713665783405304} -09/20/2021 23:47:53 - INFO - __main__ - Step 42984: {'lr': 0.00019923841923939571, 'samples': 1375488, 'steps': 2686, 'loss/train': 2.0305871963500977} -09/20/2021 23:47:54 - INFO - __main__ - Step 42985: {'lr': 0.00019923841923939571, 'samples': 1375520, 'steps': 2686, 'loss/train': 1.7150523662567139} -09/20/2021 23:47:54 - INFO - __main__ - Step 42986: {'lr': 0.00019923841923939571, 'samples': 1375552, 'steps': 2686, 'loss/train': 2.4348788261413574} -09/20/2021 23:47:55 - INFO - __main__ - Step 42987: {'lr': 0.00019923841923939571, 'samples': 1375584, 'steps': 2686, 'loss/train': 2.2378828525543213} -09/20/2021 23:47:56 - INFO - __main__ - Step 42988: {'lr': 0.00019923841923939571, 'samples': 1375616, 'steps': 2686, 'loss/train': 2.1185402870178223} -09/20/2021 23:47:57 - INFO - __main__ - Step 42989: {'lr': 0.00019923841923939571, 'samples': 1375648, 'steps': 2686, 'loss/train': 2.2636237144470215} -09/20/2021 23:47:57 - INFO - __main__ - Step 42990: {'lr': 0.00019923841923939571, 'samples': 1375680, 'steps': 2686, 'loss/train': 1.7760883569717407} -09/20/2021 23:47:58 - INFO - __main__ - Step 42991: {'lr': 0.00019923841923939571, 'samples': 1375712, 'steps': 2686, 'loss/train': 1.639162302017212} -09/20/2021 23:47:59 - INFO - __main__ - Step 42992: {'lr': 0.00019923841923939571, 'samples': 1375744, 'steps': 2686, 'loss/train': 2.4605472087860107} -09/20/2021 23:48:00 - INFO - __main__ - Step 42993: {'lr': 0.00019923763328066785, 'samples': 1375776, 'steps': 2687, 'loss/train': 2.5667927265167236} -09/20/2021 23:48:00 - INFO - __main__ - Step 42994: {'lr': 0.00019923763328066785, 'samples': 1375808, 'steps': 2687, 'loss/train': 2.5144317150115967} -09/20/2021 23:48:01 - INFO - __main__ - Step 42995: {'lr': 0.00019923763328066785, 'samples': 1375840, 'steps': 2687, 'loss/train': 1.6698939800262451} -09/20/2021 23:48:02 - INFO - __main__ - Step 42996: {'lr': 0.00019923763328066785, 'samples': 1375872, 'steps': 2687, 'loss/train': 0.8026064038276672} -09/20/2021 23:48:03 - INFO - __main__ - Step 42997: {'lr': 0.00019923763328066785, 'samples': 1375904, 'steps': 2687, 'loss/train': 2.7105705738067627} -09/20/2021 23:48:03 - INFO - __main__ - Step 42998: {'lr': 0.00019923763328066785, 'samples': 1375936, 'steps': 2687, 'loss/train': 2.230311155319214} -09/20/2021 23:48:04 - INFO - __main__ - Step 42999: {'lr': 0.00019923763328066785, 'samples': 1375968, 'steps': 2687, 'loss/train': 3.1246509552001953} -09/20/2021 23:48:05 - INFO - __main__ - Step 43000: {'lr': 0.00019923763328066785, 'samples': 1376000, 'steps': 2687, 'loss/train': 2.3578834533691406} -09/20/2021 23:48:06 - INFO - __main__ - Step 43001: {'lr': 0.00019923763328066785, 'samples': 1376032, 'steps': 2687, 'loss/train': 1.8348853588104248} -09/20/2021 23:48:06 - INFO - __main__ - Step 43002: {'lr': 0.00019923763328066785, 'samples': 1376064, 'steps': 2687, 'loss/train': 2.1169633865356445} -09/20/2021 23:48:07 - INFO - __main__ - Step 43003: {'lr': 0.00019923763328066785, 'samples': 1376096, 'steps': 2687, 'loss/train': 2.192063570022583} -09/20/2021 23:48:08 - INFO - __main__ - Step 43004: {'lr': 0.00019923763328066785, 'samples': 1376128, 'steps': 2687, 'loss/train': 1.8979485034942627} -09/20/2021 23:48:09 - INFO - __main__ - Step 43005: {'lr': 0.00019923763328066785, 'samples': 1376160, 'steps': 2687, 'loss/train': 1.6370306015014648} -09/20/2021 23:48:09 - INFO - __main__ - Step 43006: {'lr': 0.00019923763328066785, 'samples': 1376192, 'steps': 2687, 'loss/train': 1.3540695905685425} -09/20/2021 23:48:10 - INFO - __main__ - Step 43007: {'lr': 0.00019923763328066785, 'samples': 1376224, 'steps': 2687, 'loss/train': 2.0143399238586426} -09/20/2021 23:48:11 - INFO - __main__ - Step 43008: {'lr': 0.00019923763328066785, 'samples': 1376256, 'steps': 2687, 'loss/train': 2.1137914657592773} -09/20/2021 23:48:12 - INFO - __main__ - Step 43009: {'lr': 0.0001992368469181424, 'samples': 1376288, 'steps': 2688, 'loss/train': 2.1979713439941406} -09/20/2021 23:48:13 - INFO - __main__ - Step 43010: {'lr': 0.0001992368469181424, 'samples': 1376320, 'steps': 2688, 'loss/train': 1.7188652753829956} -09/20/2021 23:48:13 - INFO - __main__ - Step 43011: {'lr': 0.0001992368469181424, 'samples': 1376352, 'steps': 2688, 'loss/train': 2.5853805541992188} -09/20/2021 23:48:14 - INFO - __main__ - Step 43012: {'lr': 0.0001992368469181424, 'samples': 1376384, 'steps': 2688, 'loss/train': 2.2303967475891113} -09/20/2021 23:48:16 - INFO - __main__ - Step 43013: {'lr': 0.0001992368469181424, 'samples': 1376416, 'steps': 2688, 'loss/train': 1.5401583909988403} -09/20/2021 23:48:16 - INFO - __main__ - Step 43014: {'lr': 0.0001992368469181424, 'samples': 1376448, 'steps': 2688, 'loss/train': 2.5960049629211426} -09/20/2021 23:48:17 - INFO - __main__ - Step 43015: {'lr': 0.0001992368469181424, 'samples': 1376480, 'steps': 2688, 'loss/train': 1.825373888015747} -09/20/2021 23:48:18 - INFO - __main__ - Step 43016: {'lr': 0.0001992368469181424, 'samples': 1376512, 'steps': 2688, 'loss/train': 1.93299400806427} -09/20/2021 23:48:19 - INFO - __main__ - Step 43017: {'lr': 0.0001992368469181424, 'samples': 1376544, 'steps': 2688, 'loss/train': 1.8671568632125854} -09/20/2021 23:48:19 - INFO - __main__ - Step 43018: {'lr': 0.0001992368469181424, 'samples': 1376576, 'steps': 2688, 'loss/train': 1.8167039155960083} -09/20/2021 23:48:20 - INFO - __main__ - Step 43019: {'lr': 0.0001992368469181424, 'samples': 1376608, 'steps': 2688, 'loss/train': 1.9586275815963745} -09/20/2021 23:48:21 - INFO - __main__ - Step 43020: {'lr': 0.0001992368469181424, 'samples': 1376640, 'steps': 2688, 'loss/train': 1.6427412033081055} -09/20/2021 23:48:22 - INFO - __main__ - Step 43021: {'lr': 0.0001992368469181424, 'samples': 1376672, 'steps': 2688, 'loss/train': 1.6752550601959229} -09/20/2021 23:48:22 - INFO - __main__ - Step 43022: {'lr': 0.0001992368469181424, 'samples': 1376704, 'steps': 2688, 'loss/train': 1.9212640523910522} -09/20/2021 23:48:23 - INFO - __main__ - Step 43023: {'lr': 0.0001992368469181424, 'samples': 1376736, 'steps': 2688, 'loss/train': 2.3261406421661377} -09/20/2021 23:48:24 - INFO - __main__ - Step 43024: {'lr': 0.0001992368469181424, 'samples': 1376768, 'steps': 2688, 'loss/train': 1.7007899284362793} -09/20/2021 23:48:25 - INFO - __main__ - Step 43025: {'lr': 0.00019923606015182258, 'samples': 1376800, 'steps': 2689, 'loss/train': 2.107522964477539} -09/20/2021 23:48:25 - INFO - __main__ - Step 43026: {'lr': 0.00019923606015182258, 'samples': 1376832, 'steps': 2689, 'loss/train': 2.8122575283050537} -09/20/2021 23:48:26 - INFO - __main__ - Step 43027: {'lr': 0.00019923606015182258, 'samples': 1376864, 'steps': 2689, 'loss/train': 2.1300406455993652} -09/20/2021 23:48:27 - INFO - __main__ - Step 43028: {'lr': 0.00019923606015182258, 'samples': 1376896, 'steps': 2689, 'loss/train': 1.7929043769836426} -09/20/2021 23:48:28 - INFO - __main__ - Step 43029: {'lr': 0.00019923606015182258, 'samples': 1376928, 'steps': 2689, 'loss/train': 2.717357873916626} -09/20/2021 23:48:28 - INFO - __main__ - Step 43030: {'lr': 0.00019923606015182258, 'samples': 1376960, 'steps': 2689, 'loss/train': 2.557250499725342} -09/20/2021 23:48:29 - INFO - __main__ - Step 43031: {'lr': 0.00019923606015182258, 'samples': 1376992, 'steps': 2689, 'loss/train': 3.4053311347961426} -09/20/2021 23:48:30 - INFO - __main__ - Step 43032: {'lr': 0.00019923606015182258, 'samples': 1377024, 'steps': 2689, 'loss/train': 2.41256046295166} -09/20/2021 23:48:31 - INFO - __main__ - Step 43033: {'lr': 0.00019923606015182258, 'samples': 1377056, 'steps': 2689, 'loss/train': 0.7623983025550842} -09/20/2021 23:48:31 - INFO - __main__ - Step 43034: {'lr': 0.00019923606015182258, 'samples': 1377088, 'steps': 2689, 'loss/train': 2.7831602096557617} -09/20/2021 23:48:32 - INFO - __main__ - Step 43035: {'lr': 0.00019923606015182258, 'samples': 1377120, 'steps': 2689, 'loss/train': 2.7414958477020264} -09/20/2021 23:48:33 - INFO - __main__ - Step 43036: {'lr': 0.00019923606015182258, 'samples': 1377152, 'steps': 2689, 'loss/train': 2.0689940452575684} -09/20/2021 23:48:34 - INFO - __main__ - Step 43037: {'lr': 0.00019923606015182258, 'samples': 1377184, 'steps': 2689, 'loss/train': 0.13752992451190948} -09/20/2021 23:48:34 - INFO - __main__ - Step 43038: {'lr': 0.00019923606015182258, 'samples': 1377216, 'steps': 2689, 'loss/train': 0.25213199853897095} -09/20/2021 23:48:35 - INFO - __main__ - Step 43039: {'lr': 0.00019923606015182258, 'samples': 1377248, 'steps': 2689, 'loss/train': 0.16240115463733673} -09/20/2021 23:48:36 - INFO - __main__ - Step 43040: {'lr': 0.00019923606015182258, 'samples': 1377280, 'steps': 2689, 'loss/train': 0.394014835357666} -09/20/2021 23:48:37 - INFO - __main__ - Step 43041: {'lr': 0.00019923527298171164, 'samples': 1377312, 'steps': 2690, 'loss/train': 2.3923001289367676} -09/20/2021 23:48:38 - INFO - __main__ - Step 43042: {'lr': 0.00019923527298171164, 'samples': 1377344, 'steps': 2690, 'loss/train': 1.878875732421875} -09/20/2021 23:48:38 - INFO - __main__ - Step 43043: {'lr': 0.00019923527298171164, 'samples': 1377376, 'steps': 2690, 'loss/train': 2.014047384262085} -09/20/2021 23:48:40 - INFO - __main__ - Step 43044: {'lr': 0.00019923527298171164, 'samples': 1377408, 'steps': 2690, 'loss/train': 2.250082492828369} -09/20/2021 23:48:40 - INFO - __main__ - Step 43045: {'lr': 0.00019923527298171164, 'samples': 1377440, 'steps': 2690, 'loss/train': 1.936048984527588} -09/20/2021 23:48:41 - INFO - __main__ - Step 43046: {'lr': 0.00019923527298171164, 'samples': 1377472, 'steps': 2690, 'loss/train': 1.879631519317627} -09/20/2021 23:48:42 - INFO - __main__ - Step 43047: {'lr': 0.00019923527298171164, 'samples': 1377504, 'steps': 2690, 'loss/train': 1.0534707307815552} -09/20/2021 23:48:43 - INFO - __main__ - Step 43048: {'lr': 0.00019923527298171164, 'samples': 1377536, 'steps': 2690, 'loss/train': 2.108023166656494} -09/20/2021 23:48:43 - INFO - __main__ - Step 43049: {'lr': 0.00019923527298171164, 'samples': 1377568, 'steps': 2690, 'loss/train': 1.84971284866333} -09/20/2021 23:48:44 - INFO - __main__ - Step 43050: {'lr': 0.00019923527298171164, 'samples': 1377600, 'steps': 2690, 'loss/train': 3.074532985687256} -09/20/2021 23:48:45 - INFO - __main__ - Step 43051: {'lr': 0.00019923527298171164, 'samples': 1377632, 'steps': 2690, 'loss/train': 2.466395616531372} -09/20/2021 23:48:46 - INFO - __main__ - Step 43052: {'lr': 0.00019923527298171164, 'samples': 1377664, 'steps': 2690, 'loss/train': 1.525598168373108} -09/20/2021 23:48:46 - INFO - __main__ - Step 43053: {'lr': 0.00019923527298171164, 'samples': 1377696, 'steps': 2690, 'loss/train': 2.210799217224121} -09/20/2021 23:48:47 - INFO - __main__ - Step 43054: {'lr': 0.00019923527298171164, 'samples': 1377728, 'steps': 2690, 'loss/train': 1.4195696115493774} -09/20/2021 23:48:48 - INFO - __main__ - Step 43055: {'lr': 0.00019923527298171164, 'samples': 1377760, 'steps': 2690, 'loss/train': 2.17301869392395} -09/20/2021 23:48:49 - INFO - __main__ - Step 43056: {'lr': 0.00019923527298171164, 'samples': 1377792, 'steps': 2690, 'loss/train': 1.4891741275787354} -09/20/2021 23:48:50 - INFO - __main__ - Step 43057: {'lr': 0.0001992344854078128, 'samples': 1377824, 'steps': 2691, 'loss/train': 0.8866980075836182} -09/20/2021 23:48:50 - INFO - __main__ - Step 43058: {'lr': 0.0001992344854078128, 'samples': 1377856, 'steps': 2691, 'loss/train': 2.1371119022369385} -09/20/2021 23:48:51 - INFO - __main__ - Step 43059: {'lr': 0.0001992344854078128, 'samples': 1377888, 'steps': 2691, 'loss/train': 2.5816633701324463} -09/20/2021 23:48:52 - INFO - __main__ - Step 43060: {'lr': 0.0001992344854078128, 'samples': 1377920, 'steps': 2691, 'loss/train': 1.6981325149536133} -09/20/2021 23:48:53 - INFO - __main__ - Step 43061: {'lr': 0.0001992344854078128, 'samples': 1377952, 'steps': 2691, 'loss/train': 2.135068416595459} -09/20/2021 23:48:53 - INFO - __main__ - Step 43062: {'lr': 0.0001992344854078128, 'samples': 1377984, 'steps': 2691, 'loss/train': 1.6221938133239746} -09/20/2021 23:48:54 - INFO - __main__ - Step 43063: {'lr': 0.0001992344854078128, 'samples': 1378016, 'steps': 2691, 'loss/train': 2.087587833404541} -09/20/2021 23:48:55 - INFO - __main__ - Step 43064: {'lr': 0.0001992344854078128, 'samples': 1378048, 'steps': 2691, 'loss/train': 1.7217565774917603} -09/20/2021 23:48:56 - INFO - __main__ - Step 43065: {'lr': 0.0001992344854078128, 'samples': 1378080, 'steps': 2691, 'loss/train': 1.9287307262420654} -09/20/2021 23:48:56 - INFO - __main__ - Step 43066: {'lr': 0.0001992344854078128, 'samples': 1378112, 'steps': 2691, 'loss/train': 2.1163384914398193} -09/20/2021 23:48:57 - INFO - __main__ - Step 43067: {'lr': 0.0001992344854078128, 'samples': 1378144, 'steps': 2691, 'loss/train': 0.5851520299911499} -09/20/2021 23:48:58 - INFO - __main__ - Step 43068: {'lr': 0.0001992344854078128, 'samples': 1378176, 'steps': 2691, 'loss/train': 0.5354793667793274} -09/20/2021 23:48:59 - INFO - __main__ - Step 43069: {'lr': 0.0001992344854078128, 'samples': 1378208, 'steps': 2691, 'loss/train': 1.0290120840072632} -09/20/2021 23:48:59 - INFO - __main__ - Step 43070: {'lr': 0.0001992344854078128, 'samples': 1378240, 'steps': 2691, 'loss/train': 2.238950252532959} -09/20/2021 23:49:00 - INFO - __main__ - Step 43071: {'lr': 0.0001992344854078128, 'samples': 1378272, 'steps': 2691, 'loss/train': 1.7521958351135254} -09/20/2021 23:49:01 - INFO - __main__ - Step 43072: {'lr': 0.0001992344854078128, 'samples': 1378304, 'steps': 2691, 'loss/train': 2.306830883026123} -09/20/2021 23:49:02 - INFO - __main__ - Step 43073: {'lr': 0.00019923369743012916, 'samples': 1378336, 'steps': 2692, 'loss/train': 2.388873338699341} -09/20/2021 23:49:02 - INFO - __main__ - Step 43074: {'lr': 0.00019923369743012916, 'samples': 1378368, 'steps': 2692, 'loss/train': 1.6798112392425537} -09/20/2021 23:49:03 - INFO - __main__ - Step 43075: {'lr': 0.00019923369743012916, 'samples': 1378400, 'steps': 2692, 'loss/train': 2.374939441680908} -09/20/2021 23:49:05 - INFO - __main__ - Step 43076: {'lr': 0.00019923369743012916, 'samples': 1378432, 'steps': 2692, 'loss/train': 2.5807223320007324} -09/20/2021 23:49:05 - INFO - __main__ - Step 43077: {'lr': 0.00019923369743012916, 'samples': 1378464, 'steps': 2692, 'loss/train': 2.3599627017974854} -09/20/2021 23:49:06 - INFO - __main__ - Step 43078: {'lr': 0.00019923369743012916, 'samples': 1378496, 'steps': 2692, 'loss/train': 0.28780317306518555} -09/20/2021 23:49:07 - INFO - __main__ - Step 43079: {'lr': 0.00019923369743012916, 'samples': 1378528, 'steps': 2692, 'loss/train': 1.698202133178711} -09/20/2021 23:49:08 - INFO - __main__ - Step 43080: {'lr': 0.00019923369743012916, 'samples': 1378560, 'steps': 2692, 'loss/train': 2.227989435195923} -09/20/2021 23:49:08 - INFO - __main__ - Step 43081: {'lr': 0.00019923369743012916, 'samples': 1378592, 'steps': 2692, 'loss/train': 1.6464438438415527} -09/20/2021 23:49:09 - INFO - __main__ - Step 43082: {'lr': 0.00019923369743012916, 'samples': 1378624, 'steps': 2692, 'loss/train': 2.310772657394409} -09/20/2021 23:49:10 - INFO - __main__ - Step 43083: {'lr': 0.00019923369743012916, 'samples': 1378656, 'steps': 2692, 'loss/train': 2.2051219940185547} -09/20/2021 23:49:11 - INFO - __main__ - Step 43084: {'lr': 0.00019923369743012916, 'samples': 1378688, 'steps': 2692, 'loss/train': 1.8901993036270142} -09/20/2021 23:49:11 - INFO - __main__ - Step 43085: {'lr': 0.00019923369743012916, 'samples': 1378720, 'steps': 2692, 'loss/train': 2.5024731159210205} -09/20/2021 23:49:12 - INFO - __main__ - Step 43086: {'lr': 0.00019923369743012916, 'samples': 1378752, 'steps': 2692, 'loss/train': 2.7918989658355713} -09/20/2021 23:49:13 - INFO - __main__ - Step 43087: {'lr': 0.00019923369743012916, 'samples': 1378784, 'steps': 2692, 'loss/train': 1.9618996381759644} -09/20/2021 23:49:14 - INFO - __main__ - Step 43088: {'lr': 0.00019923369743012916, 'samples': 1378816, 'steps': 2692, 'loss/train': 1.8293508291244507} -09/20/2021 23:49:14 - INFO - __main__ - Step 43089: {'lr': 0.00019923290904866404, 'samples': 1378848, 'steps': 2693, 'loss/train': 2.4730727672576904} -09/20/2021 23:49:15 - INFO - __main__ - Step 43090: {'lr': 0.00019923290904866404, 'samples': 1378880, 'steps': 2693, 'loss/train': 0.9130778908729553} -09/20/2021 23:49:16 - INFO - __main__ - Step 43091: {'lr': 0.00019923290904866404, 'samples': 1378912, 'steps': 2693, 'loss/train': 0.3174988031387329} -09/20/2021 23:49:17 - INFO - __main__ - Step 43092: {'lr': 0.00019923290904866404, 'samples': 1378944, 'steps': 2693, 'loss/train': 2.3044395446777344} -09/20/2021 23:49:17 - INFO - __main__ - Step 43093: {'lr': 0.00019923290904866404, 'samples': 1378976, 'steps': 2693, 'loss/train': 2.370215654373169} -09/20/2021 23:49:18 - INFO - __main__ - Step 43094: {'lr': 0.00019923290904866404, 'samples': 1379008, 'steps': 2693, 'loss/train': 2.370163679122925} -09/20/2021 23:49:19 - INFO - __main__ - Step 43095: {'lr': 0.00019923290904866404, 'samples': 1379040, 'steps': 2693, 'loss/train': 2.6004176139831543} -09/20/2021 23:49:20 - INFO - __main__ - Step 43096: {'lr': 0.00019923290904866404, 'samples': 1379072, 'steps': 2693, 'loss/train': 3.916966438293457} -09/20/2021 23:49:20 - INFO - __main__ - Step 43097: {'lr': 0.00019923290904866404, 'samples': 1379104, 'steps': 2693, 'loss/train': 2.384692668914795} -09/20/2021 23:49:21 - INFO - __main__ - Step 43098: {'lr': 0.00019923290904866404, 'samples': 1379136, 'steps': 2693, 'loss/train': 3.0771546363830566} -09/20/2021 23:49:22 - INFO - __main__ - Step 43099: {'lr': 0.00019923290904866404, 'samples': 1379168, 'steps': 2693, 'loss/train': 2.9943339824676514} -09/20/2021 23:49:23 - INFO - __main__ - Step 43100: {'lr': 0.00019923290904866404, 'samples': 1379200, 'steps': 2693, 'loss/train': 3.7833969593048096} -09/20/2021 23:49:23 - INFO - __main__ - Step 43101: {'lr': 0.00019923290904866404, 'samples': 1379232, 'steps': 2693, 'loss/train': 0.38528990745544434} -09/20/2021 23:49:24 - INFO - __main__ - Step 43102: {'lr': 0.00019923290904866404, 'samples': 1379264, 'steps': 2693, 'loss/train': 2.274060010910034} -09/20/2021 23:49:25 - INFO - __main__ - Step 43103: {'lr': 0.00019923290904866404, 'samples': 1379296, 'steps': 2693, 'loss/train': 2.4008898735046387} -09/20/2021 23:49:26 - INFO - __main__ - Step 43104: {'lr': 0.00019923290904866404, 'samples': 1379328, 'steps': 2693, 'loss/train': 1.0422662496566772} -09/20/2021 23:49:27 - INFO - __main__ - Step 43105: {'lr': 0.00019923212026342057, 'samples': 1379360, 'steps': 2694, 'loss/train': 2.2809460163116455} -09/20/2021 23:49:27 - INFO - __main__ - Step 43106: {'lr': 0.00019923212026342057, 'samples': 1379392, 'steps': 2694, 'loss/train': 2.6538245677948} -09/20/2021 23:49:28 - INFO - __main__ - Step 43107: {'lr': 0.00019923212026342057, 'samples': 1379424, 'steps': 2694, 'loss/train': 1.7171653509140015} -09/20/2021 23:49:29 - INFO - __main__ - Step 43108: {'lr': 0.00019923212026342057, 'samples': 1379456, 'steps': 2694, 'loss/train': 2.6903514862060547} -09/20/2021 23:49:30 - INFO - __main__ - Step 43109: {'lr': 0.00019923212026342057, 'samples': 1379488, 'steps': 2694, 'loss/train': 2.25302791595459} -09/20/2021 23:49:31 - INFO - __main__ - Step 43110: {'lr': 0.00019923212026342057, 'samples': 1379520, 'steps': 2694, 'loss/train': 2.2729384899139404} -09/20/2021 23:49:32 - INFO - __main__ - Step 43111: {'lr': 0.00019923212026342057, 'samples': 1379552, 'steps': 2694, 'loss/train': 1.4728630781173706} -09/20/2021 23:49:33 - INFO - __main__ - Step 43112: {'lr': 0.00019923212026342057, 'samples': 1379584, 'steps': 2694, 'loss/train': 1.5607519149780273} -09/20/2021 23:49:34 - INFO - __main__ - Step 43113: {'lr': 0.00019923212026342057, 'samples': 1379616, 'steps': 2694, 'loss/train': 0.9555410742759705} -09/20/2021 23:49:34 - INFO - __main__ - Step 43114: {'lr': 0.00019923212026342057, 'samples': 1379648, 'steps': 2694, 'loss/train': 1.930304765701294} -09/20/2021 23:49:35 - INFO - __main__ - Step 43115: {'lr': 0.00019923212026342057, 'samples': 1379680, 'steps': 2694, 'loss/train': 2.347031354904175} -09/20/2021 23:49:36 - INFO - __main__ - Step 43116: {'lr': 0.00019923212026342057, 'samples': 1379712, 'steps': 2694, 'loss/train': 2.0194904804229736} -09/20/2021 23:49:37 - INFO - __main__ - Step 43117: {'lr': 0.00019923212026342057, 'samples': 1379744, 'steps': 2694, 'loss/train': 1.8046770095825195} -09/20/2021 23:49:37 - INFO - __main__ - Step 43118: {'lr': 0.00019923212026342057, 'samples': 1379776, 'steps': 2694, 'loss/train': 1.7837674617767334} -09/20/2021 23:49:38 - INFO - __main__ - Step 43119: {'lr': 0.00019923212026342057, 'samples': 1379808, 'steps': 2694, 'loss/train': 2.7852354049682617} -09/20/2021 23:49:39 - INFO - __main__ - Step 43120: {'lr': 0.00019923212026342057, 'samples': 1379840, 'steps': 2694, 'loss/train': 2.2283735275268555} -09/20/2021 23:49:40 - INFO - __main__ - Step 43121: {'lr': 0.000199231331074402, 'samples': 1379872, 'steps': 2695, 'loss/train': 3.066396713256836} -09/20/2021 23:49:40 - INFO - __main__ - Step 43122: {'lr': 0.000199231331074402, 'samples': 1379904, 'steps': 2695, 'loss/train': 2.6699109077453613} -09/20/2021 23:49:41 - INFO - __main__ - Step 43123: {'lr': 0.000199231331074402, 'samples': 1379936, 'steps': 2695, 'loss/train': 2.274402379989624} -09/20/2021 23:49:42 - INFO - __main__ - Step 43124: {'lr': 0.000199231331074402, 'samples': 1379968, 'steps': 2695, 'loss/train': 1.6165555715560913} -09/20/2021 23:49:43 - INFO - __main__ - Step 43125: {'lr': 0.000199231331074402, 'samples': 1380000, 'steps': 2695, 'loss/train': 1.6587543487548828} -09/20/2021 23:49:43 - INFO - __main__ - Step 43126: {'lr': 0.000199231331074402, 'samples': 1380032, 'steps': 2695, 'loss/train': 2.2349939346313477} -09/20/2021 23:49:44 - INFO - __main__ - Step 43127: {'lr': 0.000199231331074402, 'samples': 1380064, 'steps': 2695, 'loss/train': 1.8014401197433472} -09/20/2021 23:49:45 - INFO - __main__ - Step 43128: {'lr': 0.000199231331074402, 'samples': 1380096, 'steps': 2695, 'loss/train': 0.6714305281639099} -09/20/2021 23:49:46 - INFO - __main__ - Step 43129: {'lr': 0.000199231331074402, 'samples': 1380128, 'steps': 2695, 'loss/train': 1.4194236993789673} -09/20/2021 23:49:46 - INFO - __main__ - Step 43130: {'lr': 0.000199231331074402, 'samples': 1380160, 'steps': 2695, 'loss/train': 1.2519334554672241} -09/20/2021 23:49:47 - INFO - __main__ - Step 43131: {'lr': 0.000199231331074402, 'samples': 1380192, 'steps': 2695, 'loss/train': 2.5498013496398926} -09/20/2021 23:49:48 - INFO - __main__ - Step 43132: {'lr': 0.000199231331074402, 'samples': 1380224, 'steps': 2695, 'loss/train': 1.7380385398864746} -09/20/2021 23:49:49 - INFO - __main__ - Step 43133: {'lr': 0.000199231331074402, 'samples': 1380256, 'steps': 2695, 'loss/train': 2.332761526107788} -09/20/2021 23:49:49 - INFO - __main__ - Step 43134: {'lr': 0.000199231331074402, 'samples': 1380288, 'steps': 2695, 'loss/train': 2.181748151779175} -09/20/2021 23:49:50 - INFO - __main__ - Step 43135: {'lr': 0.000199231331074402, 'samples': 1380320, 'steps': 2695, 'loss/train': 1.303861379623413} -09/20/2021 23:49:51 - INFO - __main__ - Step 43136: {'lr': 0.000199231331074402, 'samples': 1380352, 'steps': 2695, 'loss/train': 1.6415536403656006} -09/20/2021 23:49:52 - INFO - __main__ - Step 43137: {'lr': 0.00019923054148161153, 'samples': 1380384, 'steps': 2696, 'loss/train': 2.263376474380493} -09/20/2021 23:49:53 - INFO - __main__ - Step 43138: {'lr': 0.00019923054148161153, 'samples': 1380416, 'steps': 2696, 'loss/train': 3.230358123779297} -09/20/2021 23:49:53 - INFO - __main__ - Step 43139: {'lr': 0.00019923054148161153, 'samples': 1380448, 'steps': 2696, 'loss/train': 1.8622523546218872} -09/20/2021 23:49:55 - INFO - __main__ - Step 43140: {'lr': 0.00019923054148161153, 'samples': 1380480, 'steps': 2696, 'loss/train': 2.2638823986053467} -09/20/2021 23:49:55 - INFO - __main__ - Step 43141: {'lr': 0.00019923054148161153, 'samples': 1380512, 'steps': 2696, 'loss/train': 2.1464641094207764} -09/20/2021 23:49:56 - INFO - __main__ - Step 43142: {'lr': 0.00019923054148161153, 'samples': 1380544, 'steps': 2696, 'loss/train': 2.3986012935638428} -09/20/2021 23:49:57 - INFO - __main__ - Step 43143: {'lr': 0.00019923054148161153, 'samples': 1380576, 'steps': 2696, 'loss/train': 2.1196582317352295} -09/20/2021 23:49:58 - INFO - __main__ - Step 43144: {'lr': 0.00019923054148161153, 'samples': 1380608, 'steps': 2696, 'loss/train': 1.9359716176986694} -09/20/2021 23:49:58 - INFO - __main__ - Step 43145: {'lr': 0.00019923054148161153, 'samples': 1380640, 'steps': 2696, 'loss/train': 1.7203094959259033} -09/20/2021 23:49:59 - INFO - __main__ - Step 43146: {'lr': 0.00019923054148161153, 'samples': 1380672, 'steps': 2696, 'loss/train': 2.0675249099731445} -09/20/2021 23:50:00 - INFO - __main__ - Step 43147: {'lr': 0.00019923054148161153, 'samples': 1380704, 'steps': 2696, 'loss/train': 0.8755913972854614} -09/20/2021 23:50:01 - INFO - __main__ - Step 43148: {'lr': 0.00019923054148161153, 'samples': 1380736, 'steps': 2696, 'loss/train': 1.0431427955627441} -09/20/2021 23:50:01 - INFO - __main__ - Step 43149: {'lr': 0.00019923054148161153, 'samples': 1380768, 'steps': 2696, 'loss/train': 1.2514656782150269} -09/20/2021 23:50:02 - INFO - __main__ - Step 43150: {'lr': 0.00019923054148161153, 'samples': 1380800, 'steps': 2696, 'loss/train': 0.7232975959777832} -09/20/2021 23:50:03 - INFO - __main__ - Step 43151: {'lr': 0.00019923054148161153, 'samples': 1380832, 'steps': 2696, 'loss/train': 2.4107210636138916} -09/20/2021 23:50:04 - INFO - __main__ - Step 43152: {'lr': 0.00019923054148161153, 'samples': 1380864, 'steps': 2696, 'loss/train': 2.4663279056549072} -09/20/2021 23:50:05 - INFO - __main__ - Step 43153: {'lr': 0.00019922975148505237, 'samples': 1380896, 'steps': 2697, 'loss/train': 2.385019063949585} -09/20/2021 23:50:05 - INFO - __main__ - Step 43154: {'lr': 0.00019922975148505237, 'samples': 1380928, 'steps': 2697, 'loss/train': 1.0300016403198242} -09/20/2021 23:50:06 - INFO - __main__ - Step 43155: {'lr': 0.00019922975148505237, 'samples': 1380960, 'steps': 2697, 'loss/train': 1.9118890762329102} -09/20/2021 23:50:07 - INFO - __main__ - Step 43156: {'lr': 0.00019922975148505237, 'samples': 1380992, 'steps': 2697, 'loss/train': 0.45645207166671753} -09/20/2021 23:50:08 - INFO - __main__ - Step 43157: {'lr': 0.00019922975148505237, 'samples': 1381024, 'steps': 2697, 'loss/train': 1.3139934539794922} -09/20/2021 23:50:08 - INFO - __main__ - Step 43158: {'lr': 0.00019922975148505237, 'samples': 1381056, 'steps': 2697, 'loss/train': 1.7747985124588013} -09/20/2021 23:50:09 - INFO - __main__ - Step 43159: {'lr': 0.00019922975148505237, 'samples': 1381088, 'steps': 2697, 'loss/train': 2.228412389755249} -09/20/2021 23:50:10 - INFO - __main__ - Step 43160: {'lr': 0.00019922975148505237, 'samples': 1381120, 'steps': 2697, 'loss/train': 3.132681369781494} -09/20/2021 23:50:11 - INFO - __main__ - Step 43161: {'lr': 0.00019922975148505237, 'samples': 1381152, 'steps': 2697, 'loss/train': 2.063286781311035} -09/20/2021 23:50:11 - INFO - __main__ - Step 43162: {'lr': 0.00019922975148505237, 'samples': 1381184, 'steps': 2697, 'loss/train': 0.9311800599098206} -09/20/2021 23:50:12 - INFO - __main__ - Step 43163: {'lr': 0.00019922975148505237, 'samples': 1381216, 'steps': 2697, 'loss/train': 1.8436267375946045} -09/20/2021 23:50:13 - INFO - __main__ - Step 43164: {'lr': 0.00019922975148505237, 'samples': 1381248, 'steps': 2697, 'loss/train': 2.664886713027954} -09/20/2021 23:50:14 - INFO - __main__ - Step 43165: {'lr': 0.00019922975148505237, 'samples': 1381280, 'steps': 2697, 'loss/train': 2.472830295562744} -09/20/2021 23:50:14 - INFO - __main__ - Step 43166: {'lr': 0.00019922975148505237, 'samples': 1381312, 'steps': 2697, 'loss/train': 1.9098153114318848} -09/20/2021 23:50:15 - INFO - __main__ - Step 43167: {'lr': 0.00019922975148505237, 'samples': 1381344, 'steps': 2697, 'loss/train': 2.4974801540374756} -09/20/2021 23:50:16 - INFO - __main__ - Step 43168: {'lr': 0.00019922975148505237, 'samples': 1381376, 'steps': 2697, 'loss/train': 1.893282175064087} -09/20/2021 23:50:17 - INFO - __main__ - Step 43169: {'lr': 0.00019922896108472772, 'samples': 1381408, 'steps': 2698, 'loss/train': 1.432824969291687} -09/20/2021 23:50:17 - INFO - __main__ - Step 43170: {'lr': 0.00019922896108472772, 'samples': 1381440, 'steps': 2698, 'loss/train': 1.8375906944274902} -09/20/2021 23:50:19 - INFO - __main__ - Step 43171: {'lr': 0.00019922896108472772, 'samples': 1381472, 'steps': 2698, 'loss/train': 2.564019203186035} -09/20/2021 23:50:20 - INFO - __main__ - Step 43172: {'lr': 0.00019922896108472772, 'samples': 1381504, 'steps': 2698, 'loss/train': 2.42028546333313} -09/20/2021 23:50:20 - INFO - __main__ - Step 43173: {'lr': 0.00019922896108472772, 'samples': 1381536, 'steps': 2698, 'loss/train': 1.5222740173339844} -09/20/2021 23:50:21 - INFO - __main__ - Step 43174: {'lr': 0.00019922896108472772, 'samples': 1381568, 'steps': 2698, 'loss/train': 2.1752283573150635} -09/20/2021 23:50:22 - INFO - __main__ - Step 43175: {'lr': 0.00019922896108472772, 'samples': 1381600, 'steps': 2698, 'loss/train': 1.3683476448059082} -09/20/2021 23:50:23 - INFO - __main__ - Step 43176: {'lr': 0.00019922896108472772, 'samples': 1381632, 'steps': 2698, 'loss/train': 1.9052351713180542} -09/20/2021 23:50:23 - INFO - __main__ - Step 43177: {'lr': 0.00019922896108472772, 'samples': 1381664, 'steps': 2698, 'loss/train': 1.6980775594711304} -09/20/2021 23:50:24 - INFO - __main__ - Step 43178: {'lr': 0.00019922896108472772, 'samples': 1381696, 'steps': 2698, 'loss/train': 2.1418707370758057} -09/20/2021 23:50:25 - INFO - __main__ - Step 43179: {'lr': 0.00019922896108472772, 'samples': 1381728, 'steps': 2698, 'loss/train': 2.4023208618164062} -09/20/2021 23:50:26 - INFO - __main__ - Step 43180: {'lr': 0.00019922896108472772, 'samples': 1381760, 'steps': 2698, 'loss/train': 1.7750084400177002} -09/20/2021 23:50:26 - INFO - __main__ - Step 43181: {'lr': 0.00019922896108472772, 'samples': 1381792, 'steps': 2698, 'loss/train': 2.5682425498962402} -09/20/2021 23:50:27 - INFO - __main__ - Step 43182: {'lr': 0.00019922896108472772, 'samples': 1381824, 'steps': 2698, 'loss/train': 1.6862528324127197} -09/20/2021 23:50:28 - INFO - __main__ - Step 43183: {'lr': 0.00019922896108472772, 'samples': 1381856, 'steps': 2698, 'loss/train': 1.9806979894638062} -09/20/2021 23:50:29 - INFO - __main__ - Step 43184: {'lr': 0.00019922896108472772, 'samples': 1381888, 'steps': 2698, 'loss/train': 2.025805711746216} -09/20/2021 23:50:29 - INFO - __main__ - Step 43185: {'lr': 0.00019922817028064082, 'samples': 1381920, 'steps': 2699, 'loss/train': 2.1340227127075195} -09/20/2021 23:50:30 - INFO - __main__ - Step 43186: {'lr': 0.00019922817028064082, 'samples': 1381952, 'steps': 2699, 'loss/train': 1.866144061088562} -09/20/2021 23:50:31 - INFO - __main__ - Step 43187: {'lr': 0.00019922817028064082, 'samples': 1381984, 'steps': 2699, 'loss/train': 2.799917697906494} -09/20/2021 23:50:32 - INFO - __main__ - Step 43188: {'lr': 0.00019922817028064082, 'samples': 1382016, 'steps': 2699, 'loss/train': 2.08143949508667} -09/20/2021 23:50:32 - INFO - __main__ - Step 43189: {'lr': 0.00019922817028064082, 'samples': 1382048, 'steps': 2699, 'loss/train': 1.8556067943572998} -09/20/2021 23:50:33 - INFO - __main__ - Step 43190: {'lr': 0.00019922817028064082, 'samples': 1382080, 'steps': 2699, 'loss/train': 3.732816457748413} -09/20/2021 23:50:34 - INFO - __main__ - Step 43191: {'lr': 0.00019922817028064082, 'samples': 1382112, 'steps': 2699, 'loss/train': 1.4763942956924438} -09/20/2021 23:50:35 - INFO - __main__ - Step 43192: {'lr': 0.00019922817028064082, 'samples': 1382144, 'steps': 2699, 'loss/train': 2.990208387374878} -09/20/2021 23:50:35 - INFO - __main__ - Step 43193: {'lr': 0.00019922817028064082, 'samples': 1382176, 'steps': 2699, 'loss/train': 2.16534686088562} -09/20/2021 23:50:36 - INFO - __main__ - Step 43194: {'lr': 0.00019922817028064082, 'samples': 1382208, 'steps': 2699, 'loss/train': 1.3291503190994263} -09/20/2021 23:50:37 - INFO - __main__ - Step 43195: {'lr': 0.00019922817028064082, 'samples': 1382240, 'steps': 2699, 'loss/train': 2.2543082237243652} -09/20/2021 23:50:38 - INFO - __main__ - Step 43196: {'lr': 0.00019922817028064082, 'samples': 1382272, 'steps': 2699, 'loss/train': 3.536367177963257} -09/20/2021 23:50:38 - INFO - __main__ - Step 43197: {'lr': 0.00019922817028064082, 'samples': 1382304, 'steps': 2699, 'loss/train': 2.041414499282837} -09/20/2021 23:50:39 - INFO - __main__ - Step 43198: {'lr': 0.00019922817028064082, 'samples': 1382336, 'steps': 2699, 'loss/train': 1.9208370447158813} -09/20/2021 23:50:40 - INFO - __main__ - Step 43199: {'lr': 0.00019922817028064082, 'samples': 1382368, 'steps': 2699, 'loss/train': 2.1884422302246094} -09/20/2021 23:50:41 - INFO - __main__ - Step 43200: {'lr': 0.00019922817028064082, 'samples': 1382400, 'steps': 2699, 'loss/train': 3.2333929538726807} -09/20/2021 23:50:42 - INFO - __main__ - Step 43201: {'lr': 0.0001992273790727949, 'samples': 1382432, 'steps': 2700, 'loss/train': 2.4134790897369385} -09/20/2021 23:50:42 - INFO - __main__ - Step 43202: {'lr': 0.0001992273790727949, 'samples': 1382464, 'steps': 2700, 'loss/train': 1.592769980430603} -09/20/2021 23:50:43 - INFO - __main__ - Step 43203: {'lr': 0.0001992273790727949, 'samples': 1382496, 'steps': 2700, 'loss/train': 1.6262141466140747} -09/20/2021 23:50:44 - INFO - __main__ - Step 43204: {'lr': 0.0001992273790727949, 'samples': 1382528, 'steps': 2700, 'loss/train': 1.5243148803710938} -09/20/2021 23:50:45 - INFO - __main__ - Step 43205: {'lr': 0.0001992273790727949, 'samples': 1382560, 'steps': 2700, 'loss/train': 1.462144374847412} -09/20/2021 23:50:46 - INFO - __main__ - Step 43206: {'lr': 0.0001992273790727949, 'samples': 1382592, 'steps': 2700, 'loss/train': 1.3337574005126953} -09/20/2021 23:50:47 - INFO - __main__ - Step 43207: {'lr': 0.0001992273790727949, 'samples': 1382624, 'steps': 2700, 'loss/train': 0.5930443406105042} -09/20/2021 23:50:47 - INFO - __main__ - Step 43208: {'lr': 0.0001992273790727949, 'samples': 1382656, 'steps': 2700, 'loss/train': 1.123368501663208} -09/20/2021 23:50:48 - INFO - __main__ - Step 43209: {'lr': 0.0001992273790727949, 'samples': 1382688, 'steps': 2700, 'loss/train': 1.8644055128097534} -09/20/2021 23:50:49 - INFO - __main__ - Step 43210: {'lr': 0.0001992273790727949, 'samples': 1382720, 'steps': 2700, 'loss/train': 1.8702198266983032} -09/20/2021 23:50:50 - INFO - __main__ - Step 43211: {'lr': 0.0001992273790727949, 'samples': 1382752, 'steps': 2700, 'loss/train': 1.9171087741851807} -09/20/2021 23:50:50 - INFO - __main__ - Step 43212: {'lr': 0.0001992273790727949, 'samples': 1382784, 'steps': 2700, 'loss/train': 1.5148779153823853} -09/20/2021 23:50:51 - INFO - __main__ - Step 43213: {'lr': 0.0001992273790727949, 'samples': 1382816, 'steps': 2700, 'loss/train': 1.6652438640594482} -09/20/2021 23:50:52 - INFO - __main__ - Step 43214: {'lr': 0.0001992273790727949, 'samples': 1382848, 'steps': 2700, 'loss/train': 0.7832881212234497} -09/20/2021 23:50:53 - INFO - __main__ - Step 43215: {'lr': 0.0001992273790727949, 'samples': 1382880, 'steps': 2700, 'loss/train': 2.1662282943725586} -09/20/2021 23:50:53 - INFO - __main__ - Step 43216: {'lr': 0.0001992273790727949, 'samples': 1382912, 'steps': 2700, 'loss/train': 2.140329360961914} -09/20/2021 23:50:54 - INFO - __main__ - Step 43217: {'lr': 0.00019922658746119313, 'samples': 1382944, 'steps': 2701, 'loss/train': 2.349266529083252} -09/20/2021 23:50:55 - INFO - __main__ - Step 43218: {'lr': 0.00019922658746119313, 'samples': 1382976, 'steps': 2701, 'loss/train': 2.124595880508423} -09/20/2021 23:50:56 - INFO - __main__ - Step 43219: {'lr': 0.00019922658746119313, 'samples': 1383008, 'steps': 2701, 'loss/train': 2.533642053604126} -09/20/2021 23:50:57 - INFO - __main__ - Step 43220: {'lr': 0.00019922658746119313, 'samples': 1383040, 'steps': 2701, 'loss/train': 1.828171968460083} -09/20/2021 23:50:57 - INFO - __main__ - Step 43221: {'lr': 0.00019922658746119313, 'samples': 1383072, 'steps': 2701, 'loss/train': 3.040602445602417} -09/20/2021 23:50:58 - INFO - __main__ - Step 43222: {'lr': 0.00019922658746119313, 'samples': 1383104, 'steps': 2701, 'loss/train': 1.5288282632827759} -09/20/2021 23:50:59 - INFO - __main__ - Step 43223: {'lr': 0.00019922658746119313, 'samples': 1383136, 'steps': 2701, 'loss/train': 2.0226340293884277} -09/20/2021 23:51:00 - INFO - __main__ - Step 43224: {'lr': 0.00019922658746119313, 'samples': 1383168, 'steps': 2701, 'loss/train': 1.708950161933899} -09/20/2021 23:51:00 - INFO - __main__ - Step 43225: {'lr': 0.00019922658746119313, 'samples': 1383200, 'steps': 2701, 'loss/train': 2.8132314682006836} -09/20/2021 23:51:01 - INFO - __main__ - Step 43226: {'lr': 0.00019922658746119313, 'samples': 1383232, 'steps': 2701, 'loss/train': 2.529618501663208} -09/20/2021 23:51:02 - INFO - __main__ - Step 43227: {'lr': 0.00019922658746119313, 'samples': 1383264, 'steps': 2701, 'loss/train': 0.7001511454582214} -09/20/2021 23:51:03 - INFO - __main__ - Step 43228: {'lr': 0.00019922658746119313, 'samples': 1383296, 'steps': 2701, 'loss/train': 2.3790488243103027} -09/20/2021 23:51:03 - INFO - __main__ - Step 43229: {'lr': 0.00019922658746119313, 'samples': 1383328, 'steps': 2701, 'loss/train': 1.4617340564727783} -09/20/2021 23:51:04 - INFO - __main__ - Step 43230: {'lr': 0.00019922658746119313, 'samples': 1383360, 'steps': 2701, 'loss/train': 1.5311473608016968} -09/20/2021 23:51:05 - INFO - __main__ - Step 43231: {'lr': 0.00019922658746119313, 'samples': 1383392, 'steps': 2701, 'loss/train': 2.0479323863983154} -09/20/2021 23:51:06 - INFO - __main__ - Step 43232: {'lr': 0.00019922658746119313, 'samples': 1383424, 'steps': 2701, 'loss/train': 2.4705655574798584} -09/20/2021 23:51:06 - INFO - __main__ - Step 43233: {'lr': 0.00019922579544583879, 'samples': 1383456, 'steps': 2702, 'loss/train': 2.0032901763916016} -09/20/2021 23:51:07 - INFO - __main__ - Step 43234: {'lr': 0.00019922579544583879, 'samples': 1383488, 'steps': 2702, 'loss/train': 2.0093774795532227} -09/20/2021 23:51:08 - INFO - __main__ - Step 43235: {'lr': 0.00019922579544583879, 'samples': 1383520, 'steps': 2702, 'loss/train': 3.0375187397003174} -09/20/2021 23:51:09 - INFO - __main__ - Step 43236: {'lr': 0.00019922579544583879, 'samples': 1383552, 'steps': 2702, 'loss/train': 1.1968235969543457} -09/20/2021 23:51:10 - INFO - __main__ - Step 43237: {'lr': 0.00019922579544583879, 'samples': 1383584, 'steps': 2702, 'loss/train': 2.08109188079834} -09/20/2021 23:51:11 - INFO - __main__ - Step 43238: {'lr': 0.00019922579544583879, 'samples': 1383616, 'steps': 2702, 'loss/train': 1.883514165878296} -09/20/2021 23:51:11 - INFO - __main__ - Step 43239: {'lr': 0.00019922579544583879, 'samples': 1383648, 'steps': 2702, 'loss/train': 2.1008031368255615} -09/20/2021 23:51:12 - INFO - __main__ - Step 43240: {'lr': 0.00019922579544583879, 'samples': 1383680, 'steps': 2702, 'loss/train': 1.7236779928207397} -09/20/2021 23:51:13 - INFO - __main__ - Step 43241: {'lr': 0.00019922579544583879, 'samples': 1383712, 'steps': 2702, 'loss/train': 3.0241689682006836} -09/20/2021 23:51:14 - INFO - __main__ - Step 43242: {'lr': 0.00019922579544583879, 'samples': 1383744, 'steps': 2702, 'loss/train': 2.6556687355041504} -09/20/2021 23:51:14 - INFO - __main__ - Step 43243: {'lr': 0.00019922579544583879, 'samples': 1383776, 'steps': 2702, 'loss/train': 1.8177191019058228} -09/20/2021 23:51:15 - INFO - __main__ - Step 43244: {'lr': 0.00019922579544583879, 'samples': 1383808, 'steps': 2702, 'loss/train': 1.8773623704910278} -09/20/2021 23:51:16 - INFO - __main__ - Step 43245: {'lr': 0.00019922579544583879, 'samples': 1383840, 'steps': 2702, 'loss/train': 1.9636131525039673} -09/20/2021 23:51:17 - INFO - __main__ - Step 43246: {'lr': 0.00019922579544583879, 'samples': 1383872, 'steps': 2702, 'loss/train': 1.3715667724609375} -09/20/2021 23:51:18 - INFO - __main__ - Step 43247: {'lr': 0.00019922579544583879, 'samples': 1383904, 'steps': 2702, 'loss/train': 1.3886594772338867} -09/20/2021 23:51:18 - INFO - __main__ - Step 43248: {'lr': 0.00019922579544583879, 'samples': 1383936, 'steps': 2702, 'loss/train': 2.1630024909973145} -09/20/2021 23:51:19 - INFO - __main__ - Step 43249: {'lr': 0.00019922500302673506, 'samples': 1383968, 'steps': 2703, 'loss/train': 2.2891244888305664} -09/20/2021 23:51:20 - INFO - __main__ - Step 43250: {'lr': 0.00019922500302673506, 'samples': 1384000, 'steps': 2703, 'loss/train': 0.47104451060295105} -09/20/2021 23:51:21 - INFO - __main__ - Step 43251: {'lr': 0.00019922500302673506, 'samples': 1384032, 'steps': 2703, 'loss/train': 2.3325719833374023} -09/20/2021 23:51:21 - INFO - __main__ - Step 43252: {'lr': 0.00019922500302673506, 'samples': 1384064, 'steps': 2703, 'loss/train': 1.6130685806274414} -09/20/2021 23:51:22 - INFO - __main__ - Step 43253: {'lr': 0.00019922500302673506, 'samples': 1384096, 'steps': 2703, 'loss/train': 3.529169797897339} -09/20/2021 23:51:23 - INFO - __main__ - Step 43254: {'lr': 0.00019922500302673506, 'samples': 1384128, 'steps': 2703, 'loss/train': 2.4799232482910156} -09/20/2021 23:51:24 - INFO - __main__ - Step 43255: {'lr': 0.00019922500302673506, 'samples': 1384160, 'steps': 2703, 'loss/train': 2.195749521255493} -09/20/2021 23:51:24 - INFO - __main__ - Step 43256: {'lr': 0.00019922500302673506, 'samples': 1384192, 'steps': 2703, 'loss/train': 3.4128284454345703} -09/20/2021 23:51:25 - INFO - __main__ - Step 43257: {'lr': 0.00019922500302673506, 'samples': 1384224, 'steps': 2703, 'loss/train': 1.7196297645568848} -09/20/2021 23:51:26 - INFO - __main__ - Step 43258: {'lr': 0.00019922500302673506, 'samples': 1384256, 'steps': 2703, 'loss/train': 1.530380129814148} -09/20/2021 23:51:27 - INFO - __main__ - Step 43259: {'lr': 0.00019922500302673506, 'samples': 1384288, 'steps': 2703, 'loss/train': 2.4087533950805664} -09/20/2021 23:51:27 - INFO - __main__ - Step 43260: {'lr': 0.00019922500302673506, 'samples': 1384320, 'steps': 2703, 'loss/train': 2.3082542419433594} -09/20/2021 23:51:28 - INFO - __main__ - Step 43261: {'lr': 0.00019922500302673506, 'samples': 1384352, 'steps': 2703, 'loss/train': 1.2089316844940186} -09/20/2021 23:51:29 - INFO - __main__ - Step 43262: {'lr': 0.00019922500302673506, 'samples': 1384384, 'steps': 2703, 'loss/train': 1.8227083683013916} -09/20/2021 23:51:30 - INFO - __main__ - Step 43263: {'lr': 0.00019922500302673506, 'samples': 1384416, 'steps': 2703, 'loss/train': 2.15217661857605} -09/20/2021 23:51:30 - INFO - __main__ - Step 43264: {'lr': 0.00019922500302673506, 'samples': 1384448, 'steps': 2703, 'loss/train': 1.8971710205078125} -09/20/2021 23:51:31 - INFO - __main__ - Step 43265: {'lr': 0.00019922421020388518, 'samples': 1384480, 'steps': 2704, 'loss/train': 1.4217140674591064} -09/20/2021 23:51:32 - INFO - __main__ - Step 43266: {'lr': 0.00019922421020388518, 'samples': 1384512, 'steps': 2704, 'loss/train': 1.9738826751708984} -09/20/2021 23:51:33 - INFO - __main__ - Step 43267: {'lr': 0.00019922421020388518, 'samples': 1384544, 'steps': 2704, 'loss/train': 2.074350118637085} -09/20/2021 23:51:34 - INFO - __main__ - Step 43268: {'lr': 0.00019922421020388518, 'samples': 1384576, 'steps': 2704, 'loss/train': 1.7769696712493896} -09/20/2021 23:51:35 - INFO - __main__ - Step 43269: {'lr': 0.00019922421020388518, 'samples': 1384608, 'steps': 2704, 'loss/train': 2.830469846725464} -09/20/2021 23:51:36 - INFO - __main__ - Step 43270: {'lr': 0.00019922421020388518, 'samples': 1384640, 'steps': 2704, 'loss/train': 3.2105109691619873} -09/20/2021 23:51:36 - INFO - __main__ - Step 43271: {'lr': 0.00019922421020388518, 'samples': 1384672, 'steps': 2704, 'loss/train': 2.0929393768310547} -09/20/2021 23:51:37 - INFO - __main__ - Step 43272: {'lr': 0.00019922421020388518, 'samples': 1384704, 'steps': 2704, 'loss/train': 2.1324450969696045} -09/20/2021 23:51:38 - INFO - __main__ - Step 43273: {'lr': 0.00019922421020388518, 'samples': 1384736, 'steps': 2704, 'loss/train': 5.566690921783447} -09/20/2021 23:51:39 - INFO - __main__ - Step 43274: {'lr': 0.00019922421020388518, 'samples': 1384768, 'steps': 2704, 'loss/train': 2.3377158641815186} -09/20/2021 23:51:39 - INFO - __main__ - Step 43275: {'lr': 0.00019922421020388518, 'samples': 1384800, 'steps': 2704, 'loss/train': 0.5690704584121704} -09/20/2021 23:51:40 - INFO - __main__ - Step 43276: {'lr': 0.00019922421020388518, 'samples': 1384832, 'steps': 2704, 'loss/train': 2.3315322399139404} -09/20/2021 23:51:41 - INFO - __main__ - Step 43277: {'lr': 0.00019922421020388518, 'samples': 1384864, 'steps': 2704, 'loss/train': 2.199312686920166} -09/20/2021 23:51:42 - INFO - __main__ - Step 43278: {'lr': 0.00019922421020388518, 'samples': 1384896, 'steps': 2704, 'loss/train': 2.065885305404663} -09/20/2021 23:51:42 - INFO - __main__ - Step 43279: {'lr': 0.00019922421020388518, 'samples': 1384928, 'steps': 2704, 'loss/train': 2.1845109462738037} -09/20/2021 23:51:43 - INFO - __main__ - Step 43280: {'lr': 0.00019922421020388518, 'samples': 1384960, 'steps': 2704, 'loss/train': 2.286054849624634} -09/20/2021 23:51:44 - INFO - __main__ - Step 43281: {'lr': 0.00019922341697729238, 'samples': 1384992, 'steps': 2705, 'loss/train': 1.9316651821136475} -09/20/2021 23:51:45 - INFO - __main__ - Step 43282: {'lr': 0.00019922341697729238, 'samples': 1385024, 'steps': 2705, 'loss/train': 2.252493381500244} -09/20/2021 23:51:45 - INFO - __main__ - Step 43283: {'lr': 0.00019922341697729238, 'samples': 1385056, 'steps': 2705, 'loss/train': 1.7656035423278809} -09/20/2021 23:51:46 - INFO - __main__ - Step 43284: {'lr': 0.00019922341697729238, 'samples': 1385088, 'steps': 2705, 'loss/train': 2.5439999103546143} -09/20/2021 23:51:47 - INFO - __main__ - Step 43285: {'lr': 0.00019922341697729238, 'samples': 1385120, 'steps': 2705, 'loss/train': 2.532696485519409} -09/20/2021 23:51:48 - INFO - __main__ - Step 43286: {'lr': 0.00019922341697729238, 'samples': 1385152, 'steps': 2705, 'loss/train': 2.2664072513580322} -09/20/2021 23:51:48 - INFO - __main__ - Step 43287: {'lr': 0.00019922341697729238, 'samples': 1385184, 'steps': 2705, 'loss/train': 2.064218282699585} -09/20/2021 23:51:49 - INFO - __main__ - Step 43288: {'lr': 0.00019922341697729238, 'samples': 1385216, 'steps': 2705, 'loss/train': 1.643074631690979} -09/20/2021 23:51:50 - INFO - __main__ - Step 43289: {'lr': 0.00019922341697729238, 'samples': 1385248, 'steps': 2705, 'loss/train': 1.5363903045654297} -09/20/2021 23:51:51 - INFO - __main__ - Step 43290: {'lr': 0.00019922341697729238, 'samples': 1385280, 'steps': 2705, 'loss/train': 1.8811225891113281} -09/20/2021 23:51:51 - INFO - __main__ - Step 43291: {'lr': 0.00019922341697729238, 'samples': 1385312, 'steps': 2705, 'loss/train': 1.467576026916504} -09/20/2021 23:51:52 - INFO - __main__ - Step 43292: {'lr': 0.00019922341697729238, 'samples': 1385344, 'steps': 2705, 'loss/train': 2.054044485092163} -09/20/2021 23:51:53 - INFO - __main__ - Step 43293: {'lr': 0.00019922341697729238, 'samples': 1385376, 'steps': 2705, 'loss/train': 1.8948489427566528} -09/20/2021 23:51:54 - INFO - __main__ - Step 43294: {'lr': 0.00019922341697729238, 'samples': 1385408, 'steps': 2705, 'loss/train': 1.905661702156067} -09/20/2021 23:51:54 - INFO - __main__ - Step 43295: {'lr': 0.00019922341697729238, 'samples': 1385440, 'steps': 2705, 'loss/train': 1.9079573154449463} -09/20/2021 23:51:55 - INFO - __main__ - Step 43296: {'lr': 0.00019922341697729238, 'samples': 1385472, 'steps': 2705, 'loss/train': 2.3510632514953613} -09/20/2021 23:51:56 - INFO - __main__ - Step 43297: {'lr': 0.00019922262334695984, 'samples': 1385504, 'steps': 2706, 'loss/train': 1.981640338897705} -09/20/2021 23:51:57 - INFO - __main__ - Step 43298: {'lr': 0.00019922262334695984, 'samples': 1385536, 'steps': 2706, 'loss/train': 1.249337911605835} -09/20/2021 23:51:58 - INFO - __main__ - Step 43299: {'lr': 0.00019922262334695984, 'samples': 1385568, 'steps': 2706, 'loss/train': 2.6226930618286133} -09/20/2021 23:51:59 - INFO - __main__ - Step 43300: {'lr': 0.00019922262334695984, 'samples': 1385600, 'steps': 2706, 'loss/train': 2.5373709201812744} -09/20/2021 23:52:00 - INFO - __main__ - Step 43301: {'lr': 0.00019922262334695984, 'samples': 1385632, 'steps': 2706, 'loss/train': 2.219531297683716} -09/20/2021 23:52:00 - INFO - __main__ - Step 43302: {'lr': 0.00019922262334695984, 'samples': 1385664, 'steps': 2706, 'loss/train': 1.6074331998825073} -09/20/2021 23:52:01 - INFO - __main__ - Step 43303: {'lr': 0.00019922262334695984, 'samples': 1385696, 'steps': 2706, 'loss/train': 2.5631303787231445} -09/20/2021 23:52:02 - INFO - __main__ - Step 43304: {'lr': 0.00019922262334695984, 'samples': 1385728, 'steps': 2706, 'loss/train': 2.1213064193725586} -09/20/2021 23:52:03 - INFO - __main__ - Step 43305: {'lr': 0.00019922262334695984, 'samples': 1385760, 'steps': 2706, 'loss/train': 0.4161757826805115} -09/20/2021 23:52:03 - INFO - __main__ - Step 43306: {'lr': 0.00019922262334695984, 'samples': 1385792, 'steps': 2706, 'loss/train': 2.5310442447662354} -09/20/2021 23:52:04 - INFO - __main__ - Step 43307: {'lr': 0.00019922262334695984, 'samples': 1385824, 'steps': 2706, 'loss/train': 2.31685471534729} -09/20/2021 23:52:05 - INFO - __main__ - Step 43308: {'lr': 0.00019922262334695984, 'samples': 1385856, 'steps': 2706, 'loss/train': 1.8983815908432007} -09/20/2021 23:52:06 - INFO - __main__ - Step 43309: {'lr': 0.00019922262334695984, 'samples': 1385888, 'steps': 2706, 'loss/train': 1.9789297580718994} -09/20/2021 23:52:06 - INFO - __main__ - Step 43310: {'lr': 0.00019922262334695984, 'samples': 1385920, 'steps': 2706, 'loss/train': 0.2658730149269104} -09/20/2021 23:52:07 - INFO - __main__ - Step 43311: {'lr': 0.00019922262334695984, 'samples': 1385952, 'steps': 2706, 'loss/train': 2.2215523719787598} -09/20/2021 23:52:08 - INFO - __main__ - Step 43312: {'lr': 0.00019922262334695984, 'samples': 1385984, 'steps': 2706, 'loss/train': 2.6463141441345215} -09/20/2021 23:52:09 - INFO - __main__ - Step 43313: {'lr': 0.0001992218293128909, 'samples': 1386016, 'steps': 2707, 'loss/train': 2.5990519523620605} -09/20/2021 23:52:10 - INFO - __main__ - Step 43314: {'lr': 0.0001992218293128909, 'samples': 1386048, 'steps': 2707, 'loss/train': 2.147831678390503} -09/20/2021 23:52:10 - INFO - __main__ - Step 43315: {'lr': 0.0001992218293128909, 'samples': 1386080, 'steps': 2707, 'loss/train': 1.8724035024642944} -09/20/2021 23:52:11 - INFO - __main__ - Step 43316: {'lr': 0.0001992218293128909, 'samples': 1386112, 'steps': 2707, 'loss/train': 1.752884864807129} -09/20/2021 23:52:12 - INFO - __main__ - Step 43317: {'lr': 0.0001992218293128909, 'samples': 1386144, 'steps': 2707, 'loss/train': 2.3650014400482178} -09/20/2021 23:52:13 - INFO - __main__ - Step 43318: {'lr': 0.0001992218293128909, 'samples': 1386176, 'steps': 2707, 'loss/train': 2.0984671115875244} -09/20/2021 23:52:13 - INFO - __main__ - Step 43319: {'lr': 0.0001992218293128909, 'samples': 1386208, 'steps': 2707, 'loss/train': 2.263106107711792} -09/20/2021 23:52:14 - INFO - __main__ - Step 43320: {'lr': 0.0001992218293128909, 'samples': 1386240, 'steps': 2707, 'loss/train': 0.31681716442108154} -09/20/2021 23:52:15 - INFO - __main__ - Step 43321: {'lr': 0.0001992218293128909, 'samples': 1386272, 'steps': 2707, 'loss/train': 0.22564417123794556} -09/20/2021 23:52:16 - INFO - __main__ - Step 43322: {'lr': 0.0001992218293128909, 'samples': 1386304, 'steps': 2707, 'loss/train': 0.13930435478687286} -09/20/2021 23:52:16 - INFO - __main__ - Step 43323: {'lr': 0.0001992218293128909, 'samples': 1386336, 'steps': 2707, 'loss/train': 0.27960604429244995} -09/20/2021 23:52:17 - INFO - __main__ - Step 43324: {'lr': 0.0001992218293128909, 'samples': 1386368, 'steps': 2707, 'loss/train': 3.6962430477142334} -09/20/2021 23:52:18 - INFO - __main__ - Step 43325: {'lr': 0.0001992218293128909, 'samples': 1386400, 'steps': 2707, 'loss/train': 2.398989200592041} -09/20/2021 23:52:19 - INFO - __main__ - Step 43326: {'lr': 0.0001992218293128909, 'samples': 1386432, 'steps': 2707, 'loss/train': 2.035595655441284} -09/20/2021 23:52:19 - INFO - __main__ - Step 43327: {'lr': 0.0001992218293128909, 'samples': 1386464, 'steps': 2707, 'loss/train': 1.8963929414749146} -09/20/2021 23:52:20 - INFO - __main__ - Step 43328: {'lr': 0.0001992218293128909, 'samples': 1386496, 'steps': 2707, 'loss/train': 2.014253616333008} -09/20/2021 23:52:21 - INFO - __main__ - Step 43329: {'lr': 0.00019922103487508865, 'samples': 1386528, 'steps': 2708, 'loss/train': 1.021102786064148} -09/20/2021 23:52:22 - INFO - __main__ - Step 43330: {'lr': 0.00019922103487508865, 'samples': 1386560, 'steps': 2708, 'loss/train': 0.8630848526954651} -09/20/2021 23:52:23 - INFO - __main__ - Step 43331: {'lr': 0.00019922103487508865, 'samples': 1386592, 'steps': 2708, 'loss/train': 1.8961824178695679} -09/20/2021 23:52:24 - INFO - __main__ - Step 43332: {'lr': 0.00019922103487508865, 'samples': 1386624, 'steps': 2708, 'loss/train': 2.0602617263793945} -09/20/2021 23:52:24 - INFO - __main__ - Step 43333: {'lr': 0.00019922103487508865, 'samples': 1386656, 'steps': 2708, 'loss/train': 2.013429641723633} -09/20/2021 23:52:25 - INFO - __main__ - Step 43334: {'lr': 0.00019922103487508865, 'samples': 1386688, 'steps': 2708, 'loss/train': 1.918412685394287} -09/20/2021 23:52:26 - INFO - __main__ - Step 43335: {'lr': 0.00019922103487508865, 'samples': 1386720, 'steps': 2708, 'loss/train': 2.505530834197998} -09/20/2021 23:52:27 - INFO - __main__ - Step 43336: {'lr': 0.00019922103487508865, 'samples': 1386752, 'steps': 2708, 'loss/train': 1.5324153900146484} -09/20/2021 23:52:27 - INFO - __main__ - Step 43337: {'lr': 0.00019922103487508865, 'samples': 1386784, 'steps': 2708, 'loss/train': 1.5774706602096558} -09/20/2021 23:52:28 - INFO - __main__ - Step 43338: {'lr': 0.00019922103487508865, 'samples': 1386816, 'steps': 2708, 'loss/train': 2.4015679359436035} -09/20/2021 23:52:29 - INFO - __main__ - Step 43339: {'lr': 0.00019922103487508865, 'samples': 1386848, 'steps': 2708, 'loss/train': 1.5260852575302124} -09/20/2021 23:52:30 - INFO - __main__ - Step 43340: {'lr': 0.00019922103487508865, 'samples': 1386880, 'steps': 2708, 'loss/train': 2.1060116291046143} -09/20/2021 23:52:30 - INFO - __main__ - Step 43341: {'lr': 0.00019922103487508865, 'samples': 1386912, 'steps': 2708, 'loss/train': 2.08478045463562} -09/20/2021 23:52:31 - INFO - __main__ - Step 43342: {'lr': 0.00019922103487508865, 'samples': 1386944, 'steps': 2708, 'loss/train': 2.172510862350464} -09/20/2021 23:52:32 - INFO - __main__ - Step 43343: {'lr': 0.00019922103487508865, 'samples': 1386976, 'steps': 2708, 'loss/train': 2.866687059402466} -09/20/2021 23:52:33 - INFO - __main__ - Step 43344: {'lr': 0.00019922103487508865, 'samples': 1387008, 'steps': 2708, 'loss/train': 0.3881005346775055} -09/20/2021 23:52:34 - INFO - __main__ - Step 43345: {'lr': 0.00019922024003355646, 'samples': 1387040, 'steps': 2709, 'loss/train': 2.1465773582458496} -09/20/2021 23:52:34 - INFO - __main__ - Step 43346: {'lr': 0.00019922024003355646, 'samples': 1387072, 'steps': 2709, 'loss/train': 2.1267497539520264} -09/20/2021 23:52:35 - INFO - __main__ - Step 43347: {'lr': 0.00019922024003355646, 'samples': 1387104, 'steps': 2709, 'loss/train': 2.2667229175567627} -09/20/2021 23:52:36 - INFO - __main__ - Step 43348: {'lr': 0.00019922024003355646, 'samples': 1387136, 'steps': 2709, 'loss/train': 2.376445770263672} -09/20/2021 23:52:37 - INFO - __main__ - Step 43349: {'lr': 0.00019922024003355646, 'samples': 1387168, 'steps': 2709, 'loss/train': 2.406290292739868} -09/20/2021 23:52:37 - INFO - __main__ - Step 43350: {'lr': 0.00019922024003355646, 'samples': 1387200, 'steps': 2709, 'loss/train': 1.9993501901626587} -09/20/2021 23:52:38 - INFO - __main__ - Step 43351: {'lr': 0.00019922024003355646, 'samples': 1387232, 'steps': 2709, 'loss/train': 2.650618553161621} -09/20/2021 23:52:39 - INFO - __main__ - Step 43352: {'lr': 0.00019922024003355646, 'samples': 1387264, 'steps': 2709, 'loss/train': 1.480367660522461} -09/20/2021 23:52:40 - INFO - __main__ - Step 43353: {'lr': 0.00019922024003355646, 'samples': 1387296, 'steps': 2709, 'loss/train': 1.942533016204834} -09/20/2021 23:52:40 - INFO - __main__ - Step 43354: {'lr': 0.00019922024003355646, 'samples': 1387328, 'steps': 2709, 'loss/train': 1.693014144897461} -09/20/2021 23:52:41 - INFO - __main__ - Step 43355: {'lr': 0.00019922024003355646, 'samples': 1387360, 'steps': 2709, 'loss/train': 3.1222891807556152} -09/20/2021 23:52:42 - INFO - __main__ - Step 43356: {'lr': 0.00019922024003355646, 'samples': 1387392, 'steps': 2709, 'loss/train': 1.78749418258667} -09/20/2021 23:52:43 - INFO - __main__ - Step 43357: {'lr': 0.00019922024003355646, 'samples': 1387424, 'steps': 2709, 'loss/train': 1.562476396560669} -09/20/2021 23:52:43 - INFO - __main__ - Step 43358: {'lr': 0.00019922024003355646, 'samples': 1387456, 'steps': 2709, 'loss/train': 1.3394207954406738} -09/20/2021 23:52:44 - INFO - __main__ - Step 43359: {'lr': 0.00019922024003355646, 'samples': 1387488, 'steps': 2709, 'loss/train': 2.451129198074341} -09/20/2021 23:52:45 - INFO - __main__ - Step 43360: {'lr': 0.00019922024003355646, 'samples': 1387520, 'steps': 2709, 'loss/train': 2.749946117401123} -09/20/2021 23:52:48 - INFO - __main__ - Step 43361: {'lr': 0.00019921944478829744, 'samples': 1387552, 'steps': 2710, 'loss/train': 1.212433099746704} -09/20/2021 23:52:48 - INFO - __main__ - Step 43362: {'lr': 0.00019921944478829744, 'samples': 1387584, 'steps': 2710, 'loss/train': 2.255558729171753} -09/20/2021 23:52:49 - INFO - __main__ - Step 43363: {'lr': 0.00019921944478829744, 'samples': 1387616, 'steps': 2710, 'loss/train': 1.7622978687286377} -09/20/2021 23:52:50 - INFO - __main__ - Step 43364: {'lr': 0.00019921944478829744, 'samples': 1387648, 'steps': 2710, 'loss/train': 1.8641799688339233} -09/20/2021 23:52:51 - INFO - __main__ - Step 43365: {'lr': 0.00019921944478829744, 'samples': 1387680, 'steps': 2710, 'loss/train': 2.089986801147461} -09/20/2021 23:52:51 - INFO - __main__ - Step 43366: {'lr': 0.00019921944478829744, 'samples': 1387712, 'steps': 2710, 'loss/train': 1.1136592626571655} -09/20/2021 23:52:52 - INFO - __main__ - Step 43367: {'lr': 0.00019921944478829744, 'samples': 1387744, 'steps': 2710, 'loss/train': 1.6337023973464966} -09/20/2021 23:52:53 - INFO - __main__ - Step 43368: {'lr': 0.00019921944478829744, 'samples': 1387776, 'steps': 2710, 'loss/train': 2.02347469329834} -09/20/2021 23:52:54 - INFO - __main__ - Step 43369: {'lr': 0.00019921944478829744, 'samples': 1387808, 'steps': 2710, 'loss/train': 2.5400259494781494} -09/20/2021 23:52:54 - INFO - __main__ - Step 43370: {'lr': 0.00019921944478829744, 'samples': 1387840, 'steps': 2710, 'loss/train': 2.024186134338379} -09/20/2021 23:52:55 - INFO - __main__ - Step 43371: {'lr': 0.00019921944478829744, 'samples': 1387872, 'steps': 2710, 'loss/train': 2.214895248413086} -09/20/2021 23:52:56 - INFO - __main__ - Step 43372: {'lr': 0.00019921944478829744, 'samples': 1387904, 'steps': 2710, 'loss/train': 2.1213338375091553} -09/20/2021 23:52:57 - INFO - __main__ - Step 43373: {'lr': 0.00019921944478829744, 'samples': 1387936, 'steps': 2710, 'loss/train': 2.170057535171509} -09/20/2021 23:52:57 - INFO - __main__ - Step 43374: {'lr': 0.00019921944478829744, 'samples': 1387968, 'steps': 2710, 'loss/train': 3.119647979736328} -09/20/2021 23:52:58 - INFO - __main__ - Step 43375: {'lr': 0.00019921944478829744, 'samples': 1388000, 'steps': 2710, 'loss/train': 3.316890001296997} -09/20/2021 23:52:59 - INFO - __main__ - Step 43376: {'lr': 0.00019921944478829744, 'samples': 1388032, 'steps': 2710, 'loss/train': 2.5411980152130127} -09/20/2021 23:53:00 - INFO - __main__ - Step 43377: {'lr': 0.00019921864913931492, 'samples': 1388064, 'steps': 2711, 'loss/train': 1.1279330253601074} -09/20/2021 23:53:00 - INFO - __main__ - Step 43378: {'lr': 0.00019921864913931492, 'samples': 1388096, 'steps': 2711, 'loss/train': 2.4198355674743652} -09/20/2021 23:53:01 - INFO - __main__ - Step 43379: {'lr': 0.00019921864913931492, 'samples': 1388128, 'steps': 2711, 'loss/train': 2.3346168994903564} -09/20/2021 23:53:02 - INFO - __main__ - Step 43380: {'lr': 0.00019921864913931492, 'samples': 1388160, 'steps': 2711, 'loss/train': 1.6284265518188477} -09/20/2021 23:53:03 - INFO - __main__ - Step 43381: {'lr': 0.00019921864913931492, 'samples': 1388192, 'steps': 2711, 'loss/train': 1.5548487901687622} -09/20/2021 23:53:03 - INFO - __main__ - Step 43382: {'lr': 0.00019921864913931492, 'samples': 1388224, 'steps': 2711, 'loss/train': 1.9129266738891602} -09/20/2021 23:53:04 - INFO - __main__ - Step 43383: {'lr': 0.00019921864913931492, 'samples': 1388256, 'steps': 2711, 'loss/train': 4.443511486053467} -09/20/2021 23:53:05 - INFO - __main__ - Step 43384: {'lr': 0.00019921864913931492, 'samples': 1388288, 'steps': 2711, 'loss/train': 1.3966753482818604} -09/20/2021 23:53:06 - INFO - __main__ - Step 43385: {'lr': 0.00019921864913931492, 'samples': 1388320, 'steps': 2711, 'loss/train': 2.968263864517212} -09/20/2021 23:53:06 - INFO - __main__ - Step 43386: {'lr': 0.00019921864913931492, 'samples': 1388352, 'steps': 2711, 'loss/train': 1.4923027753829956} -09/20/2021 23:53:07 - INFO - __main__ - Step 43387: {'lr': 0.00019921864913931492, 'samples': 1388384, 'steps': 2711, 'loss/train': 1.3131150007247925} -09/20/2021 23:53:08 - INFO - __main__ - Step 43388: {'lr': 0.00019921864913931492, 'samples': 1388416, 'steps': 2711, 'loss/train': 1.4952399730682373} -09/20/2021 23:53:09 - INFO - __main__ - Step 43389: {'lr': 0.00019921864913931492, 'samples': 1388448, 'steps': 2711, 'loss/train': 2.195763349533081} -09/20/2021 23:53:09 - INFO - __main__ - Step 43390: {'lr': 0.00019921864913931492, 'samples': 1388480, 'steps': 2711, 'loss/train': 2.231121063232422} -09/20/2021 23:53:10 - INFO - __main__ - Step 43391: {'lr': 0.00019921864913931492, 'samples': 1388512, 'steps': 2711, 'loss/train': 2.2518348693847656} -09/20/2021 23:53:11 - INFO - __main__ - Step 43392: {'lr': 0.00019921864913931492, 'samples': 1388544, 'steps': 2711, 'loss/train': 2.3006207942962646} -09/20/2021 23:53:12 - INFO - __main__ - Step 43393: {'lr': 0.0001992178530866121, 'samples': 1388576, 'steps': 2712, 'loss/train': 2.752337694168091} -09/20/2021 23:53:13 - INFO - __main__ - Step 43394: {'lr': 0.0001992178530866121, 'samples': 1388608, 'steps': 2712, 'loss/train': 2.72654128074646} -09/20/2021 23:53:13 - INFO - __main__ - Step 43395: {'lr': 0.0001992178530866121, 'samples': 1388640, 'steps': 2712, 'loss/train': 2.7844550609588623} -09/20/2021 23:53:14 - INFO - __main__ - Step 43396: {'lr': 0.0001992178530866121, 'samples': 1388672, 'steps': 2712, 'loss/train': 2.773409843444824} -09/20/2021 23:53:15 - INFO - __main__ - Step 43397: {'lr': 0.0001992178530866121, 'samples': 1388704, 'steps': 2712, 'loss/train': 2.8115134239196777} -09/20/2021 23:53:16 - INFO - __main__ - Step 43398: {'lr': 0.0001992178530866121, 'samples': 1388736, 'steps': 2712, 'loss/train': 2.8328731060028076} -09/20/2021 23:53:16 - INFO - __main__ - Step 43399: {'lr': 0.0001992178530866121, 'samples': 1388768, 'steps': 2712, 'loss/train': 2.72190523147583} -09/20/2021 23:53:17 - INFO - __main__ - Step 43400: {'lr': 0.0001992178530866121, 'samples': 1388800, 'steps': 2712, 'loss/train': 2.493222951889038} -09/20/2021 23:53:18 - INFO - __main__ - Step 43401: {'lr': 0.0001992178530866121, 'samples': 1388832, 'steps': 2712, 'loss/train': 2.509695053100586} -09/20/2021 23:53:19 - INFO - __main__ - Step 43402: {'lr': 0.0001992178530866121, 'samples': 1388864, 'steps': 2712, 'loss/train': 2.7417352199554443} -09/20/2021 23:53:19 - INFO - __main__ - Step 43403: {'lr': 0.0001992178530866121, 'samples': 1388896, 'steps': 2712, 'loss/train': 2.6065309047698975} -09/20/2021 23:53:20 - INFO - __main__ - Step 43404: {'lr': 0.0001992178530866121, 'samples': 1388928, 'steps': 2712, 'loss/train': 2.5775279998779297} -09/20/2021 23:53:21 - INFO - __main__ - Step 43405: {'lr': 0.0001992178530866121, 'samples': 1388960, 'steps': 2712, 'loss/train': 2.8272993564605713} -09/20/2021 23:53:22 - INFO - __main__ - Step 43406: {'lr': 0.0001992178530866121, 'samples': 1388992, 'steps': 2712, 'loss/train': 2.732071876525879} -09/20/2021 23:53:22 - INFO - __main__ - Step 43407: {'lr': 0.0001992178530866121, 'samples': 1389024, 'steps': 2712, 'loss/train': 2.7402942180633545} -09/20/2021 23:53:24 - INFO - __main__ - Step 43408: {'lr': 0.0001992178530866121, 'samples': 1389056, 'steps': 2712, 'loss/train': 2.8004469871520996} -09/20/2021 23:53:25 - INFO - __main__ - Step 43409: {'lr': 0.00019921705663019222, 'samples': 1389088, 'steps': 2713, 'loss/train': 2.1531569957733154} -09/20/2021 23:53:25 - INFO - __main__ - Step 43410: {'lr': 0.00019921705663019222, 'samples': 1389120, 'steps': 2713, 'loss/train': 2.596832513809204} -09/20/2021 23:53:26 - INFO - __main__ - Step 43411: {'lr': 0.00019921705663019222, 'samples': 1389152, 'steps': 2713, 'loss/train': 1.351471185684204} -09/20/2021 23:53:27 - INFO - __main__ - Step 43412: {'lr': 0.00019921705663019222, 'samples': 1389184, 'steps': 2713, 'loss/train': 2.578192949295044} -09/20/2021 23:53:28 - INFO - __main__ - Step 43413: {'lr': 0.00019921705663019222, 'samples': 1389216, 'steps': 2713, 'loss/train': 1.8071908950805664} -09/20/2021 23:53:28 - INFO - __main__ - Step 43414: {'lr': 0.00019921705663019222, 'samples': 1389248, 'steps': 2713, 'loss/train': 2.752826690673828} -09/20/2021 23:53:29 - INFO - __main__ - Step 43415: {'lr': 0.00019921705663019222, 'samples': 1389280, 'steps': 2713, 'loss/train': 1.7743868827819824} -09/20/2021 23:53:30 - INFO - __main__ - Step 43416: {'lr': 0.00019921705663019222, 'samples': 1389312, 'steps': 2713, 'loss/train': 1.9054042100906372} -09/20/2021 23:53:31 - INFO - __main__ - Step 43417: {'lr': 0.00019921705663019222, 'samples': 1389344, 'steps': 2713, 'loss/train': 0.5492837429046631} -09/20/2021 23:53:31 - INFO - __main__ - Step 43418: {'lr': 0.00019921705663019222, 'samples': 1389376, 'steps': 2713, 'loss/train': 2.678110122680664} -09/20/2021 23:53:32 - INFO - __main__ - Step 43419: {'lr': 0.00019921705663019222, 'samples': 1389408, 'steps': 2713, 'loss/train': 2.527886390686035} -09/20/2021 23:53:33 - INFO - __main__ - Step 43420: {'lr': 0.00019921705663019222, 'samples': 1389440, 'steps': 2713, 'loss/train': 1.516435146331787} -09/20/2021 23:53:34 - INFO - __main__ - Step 43421: {'lr': 0.00019921705663019222, 'samples': 1389472, 'steps': 2713, 'loss/train': 2.368088483810425} -09/20/2021 23:53:34 - INFO - __main__ - Step 43422: {'lr': 0.00019921705663019222, 'samples': 1389504, 'steps': 2713, 'loss/train': 2.6778268814086914} -09/20/2021 23:53:35 - INFO - __main__ - Step 43423: {'lr': 0.00019921705663019222, 'samples': 1389536, 'steps': 2713, 'loss/train': 2.108616590499878} -09/20/2021 23:53:36 - INFO - __main__ - Step 43424: {'lr': 0.00019921705663019222, 'samples': 1389568, 'steps': 2713, 'loss/train': 2.706914186477661} -09/20/2021 23:53:37 - INFO - __main__ - Step 43425: {'lr': 0.00019921625977005852, 'samples': 1389600, 'steps': 2714, 'loss/train': 2.613112449645996} -09/20/2021 23:53:37 - INFO - __main__ - Step 43426: {'lr': 0.00019921625977005852, 'samples': 1389632, 'steps': 2714, 'loss/train': 2.028001308441162} -09/20/2021 23:53:38 - INFO - __main__ - Step 43427: {'lr': 0.00019921625977005852, 'samples': 1389664, 'steps': 2714, 'loss/train': 2.6804826259613037} -09/20/2021 23:53:39 - INFO - __main__ - Step 43428: {'lr': 0.00019921625977005852, 'samples': 1389696, 'steps': 2714, 'loss/train': 3.5582077503204346} -09/20/2021 23:53:40 - INFO - __main__ - Step 43429: {'lr': 0.00019921625977005852, 'samples': 1389728, 'steps': 2714, 'loss/train': 3.5929324626922607} -09/20/2021 23:53:40 - INFO - __main__ - Step 43430: {'lr': 0.00019921625977005852, 'samples': 1389760, 'steps': 2714, 'loss/train': 2.5929672718048096} -09/20/2021 23:53:41 - INFO - __main__ - Step 43431: {'lr': 0.00019921625977005852, 'samples': 1389792, 'steps': 2714, 'loss/train': 1.781205654144287} -09/20/2021 23:53:42 - INFO - __main__ - Step 43432: {'lr': 0.00019921625977005852, 'samples': 1389824, 'steps': 2714, 'loss/train': 1.8457382917404175} -09/20/2021 23:53:43 - INFO - __main__ - Step 43433: {'lr': 0.00019921625977005852, 'samples': 1389856, 'steps': 2714, 'loss/train': 1.916815996170044} -09/20/2021 23:53:43 - INFO - __main__ - Step 43434: {'lr': 0.00019921625977005852, 'samples': 1389888, 'steps': 2714, 'loss/train': 1.7947338819503784} -09/20/2021 23:53:44 - INFO - __main__ - Step 43435: {'lr': 0.00019921625977005852, 'samples': 1389920, 'steps': 2714, 'loss/train': 2.560070276260376} -09/20/2021 23:53:45 - INFO - __main__ - Step 43436: {'lr': 0.00019921625977005852, 'samples': 1389952, 'steps': 2714, 'loss/train': 1.9983816146850586} -09/20/2021 23:53:46 - INFO - __main__ - Step 43437: {'lr': 0.00019921625977005852, 'samples': 1389984, 'steps': 2714, 'loss/train': 2.2053072452545166} -09/20/2021 23:53:46 - INFO - __main__ - Step 43438: {'lr': 0.00019921625977005852, 'samples': 1390016, 'steps': 2714, 'loss/train': 2.5916805267333984} -09/20/2021 23:53:47 - INFO - __main__ - Step 43439: {'lr': 0.00019921625977005852, 'samples': 1390048, 'steps': 2714, 'loss/train': 1.8642319440841675} -09/20/2021 23:53:49 - INFO - __main__ - Step 43440: {'lr': 0.00019921625977005852, 'samples': 1390080, 'steps': 2714, 'loss/train': 1.6325472593307495} -09/20/2021 23:53:50 - INFO - __main__ - Step 43441: {'lr': 0.00019921546250621424, 'samples': 1390112, 'steps': 2715, 'loss/train': 2.742013931274414} -09/20/2021 23:53:51 - INFO - __main__ - Step 43442: {'lr': 0.00019921546250621424, 'samples': 1390144, 'steps': 2715, 'loss/train': 3.0979039669036865} -09/20/2021 23:53:51 - INFO - __main__ - Step 43443: {'lr': 0.00019921546250621424, 'samples': 1390176, 'steps': 2715, 'loss/train': 3.7163264751434326} -09/20/2021 23:53:52 - INFO - __main__ - Step 43444: {'lr': 0.00019921546250621424, 'samples': 1390208, 'steps': 2715, 'loss/train': 3.974898099899292} -09/20/2021 23:53:53 - INFO - __main__ - Step 43445: {'lr': 0.00019921546250621424, 'samples': 1390240, 'steps': 2715, 'loss/train': 3.4782750606536865} -09/20/2021 23:53:54 - INFO - __main__ - Step 43446: {'lr': 0.00019921546250621424, 'samples': 1390272, 'steps': 2715, 'loss/train': 3.875894546508789} -09/20/2021 23:53:54 - INFO - __main__ - Step 43447: {'lr': 0.00019921546250621424, 'samples': 1390304, 'steps': 2715, 'loss/train': 1.505476474761963} -09/20/2021 23:53:55 - INFO - __main__ - Step 43448: {'lr': 0.00019921546250621424, 'samples': 1390336, 'steps': 2715, 'loss/train': 2.3441104888916016} -09/20/2021 23:53:56 - INFO - __main__ - Step 43449: {'lr': 0.00019921546250621424, 'samples': 1390368, 'steps': 2715, 'loss/train': 1.8204604387283325} -09/20/2021 23:53:57 - INFO - __main__ - Step 43450: {'lr': 0.00019921546250621424, 'samples': 1390400, 'steps': 2715, 'loss/train': 5.889391899108887} -09/20/2021 23:53:57 - INFO - __main__ - Step 43451: {'lr': 0.00019921546250621424, 'samples': 1390432, 'steps': 2715, 'loss/train': 5.951089859008789} -09/20/2021 23:53:58 - INFO - __main__ - Step 43452: {'lr': 0.00019921546250621424, 'samples': 1390464, 'steps': 2715, 'loss/train': 5.986616611480713} -09/20/2021 23:53:59 - INFO - __main__ - Step 43453: {'lr': 0.00019921546250621424, 'samples': 1390496, 'steps': 2715, 'loss/train': 5.916161060333252} -09/20/2021 23:54:00 - INFO - __main__ - Step 43454: {'lr': 0.00019921546250621424, 'samples': 1390528, 'steps': 2715, 'loss/train': 5.970296859741211} -09/20/2021 23:54:00 - INFO - __main__ - Step 43455: {'lr': 0.00019921546250621424, 'samples': 1390560, 'steps': 2715, 'loss/train': 5.985699653625488} -09/20/2021 23:54:01 - INFO - __main__ - Step 43456: {'lr': 0.00019921546250621424, 'samples': 1390592, 'steps': 2715, 'loss/train': 5.897940635681152} -09/20/2021 23:54:02 - INFO - __main__ - Step 43457: {'lr': 0.00019921466483866263, 'samples': 1390624, 'steps': 2716, 'loss/train': 5.882382392883301} -09/20/2021 23:54:03 - INFO - __main__ - Step 43458: {'lr': 0.00019921466483866263, 'samples': 1390656, 'steps': 2716, 'loss/train': 5.860616683959961} -09/20/2021 23:54:03 - INFO - __main__ - Step 43459: {'lr': 0.00019921466483866263, 'samples': 1390688, 'steps': 2716, 'loss/train': 5.858025550842285} -09/20/2021 23:54:04 - INFO - __main__ - Step 43460: {'lr': 0.00019921466483866263, 'samples': 1390720, 'steps': 2716, 'loss/train': 5.827043533325195} -09/20/2021 23:54:05 - INFO - __main__ - Step 43461: {'lr': 0.00019921466483866263, 'samples': 1390752, 'steps': 2716, 'loss/train': 1.2095588445663452} -09/20/2021 23:54:06 - INFO - __main__ - Step 43462: {'lr': 0.00019921466483866263, 'samples': 1390784, 'steps': 2716, 'loss/train': 3.213412046432495} -09/20/2021 23:54:06 - INFO - __main__ - Step 43463: {'lr': 0.00019921466483866263, 'samples': 1390816, 'steps': 2716, 'loss/train': 0.5914612412452698} -09/20/2021 23:54:07 - INFO - __main__ - Step 43464: {'lr': 0.00019921466483866263, 'samples': 1390848, 'steps': 2716, 'loss/train': 0.4365963637828827} -09/20/2021 23:54:08 - INFO - __main__ - Step 43465: {'lr': 0.00019921466483866263, 'samples': 1390880, 'steps': 2716, 'loss/train': 0.23138348758220673} -09/20/2021 23:54:09 - INFO - __main__ - Step 43466: {'lr': 0.00019921466483866263, 'samples': 1390912, 'steps': 2716, 'loss/train': 0.4763822853565216} -09/20/2021 23:54:09 - INFO - __main__ - Step 43467: {'lr': 0.00019921466483866263, 'samples': 1390944, 'steps': 2716, 'loss/train': 0.28898483514785767} -09/20/2021 23:54:10 - INFO - __main__ - Step 43468: {'lr': 0.00019921466483866263, 'samples': 1390976, 'steps': 2716, 'loss/train': 0.44795650243759155} -09/20/2021 23:54:11 - INFO - __main__ - Step 43469: {'lr': 0.00019921466483866263, 'samples': 1391008, 'steps': 2716, 'loss/train': 1.910637617111206} -09/20/2021 23:54:12 - INFO - __main__ - Step 43470: {'lr': 0.00019921466483866263, 'samples': 1391040, 'steps': 2716, 'loss/train': 3.225323438644409} -09/20/2021 23:54:12 - INFO - __main__ - Step 43471: {'lr': 0.00019921466483866263, 'samples': 1391072, 'steps': 2716, 'loss/train': 1.2871404886245728} -09/20/2021 23:54:13 - INFO - __main__ - Step 43472: {'lr': 0.00019921466483866263, 'samples': 1391104, 'steps': 2716, 'loss/train': 0.8548573851585388} -09/20/2021 23:54:14 - INFO - __main__ - Step 43473: {'lr': 0.00019921386676740693, 'samples': 1391136, 'steps': 2717, 'loss/train': 2.5996181964874268} -09/20/2021 23:54:15 - INFO - __main__ - Step 43474: {'lr': 0.00019921386676740693, 'samples': 1391168, 'steps': 2717, 'loss/train': 1.8698581457138062} -09/20/2021 23:54:16 - INFO - __main__ - Step 43475: {'lr': 0.00019921386676740693, 'samples': 1391200, 'steps': 2717, 'loss/train': 1.6899683475494385} -09/20/2021 23:54:16 - INFO - __main__ - Step 43476: {'lr': 0.00019921386676740693, 'samples': 1391232, 'steps': 2717, 'loss/train': 3.1153500080108643} -09/20/2021 23:54:17 - INFO - __main__ - Step 43477: {'lr': 0.00019921386676740693, 'samples': 1391264, 'steps': 2717, 'loss/train': 1.1468456983566284} -09/20/2021 23:54:18 - INFO - __main__ - Step 43478: {'lr': 0.00019921386676740693, 'samples': 1391296, 'steps': 2717, 'loss/train': 1.3728846311569214} -09/20/2021 23:54:19 - INFO - __main__ - Step 43479: {'lr': 0.00019921386676740693, 'samples': 1391328, 'steps': 2717, 'loss/train': 3.103311777114868} -09/20/2021 23:54:21 - INFO - __main__ - Step 43480: {'lr': 0.00019921386676740693, 'samples': 1391360, 'steps': 2717, 'loss/train': 2.6655993461608887} -09/20/2021 23:54:21 - INFO - __main__ - Step 43481: {'lr': 0.00019921386676740693, 'samples': 1391392, 'steps': 2717, 'loss/train': 2.9880778789520264} -09/20/2021 23:54:22 - INFO - __main__ - Step 43482: {'lr': 0.00019921386676740693, 'samples': 1391424, 'steps': 2717, 'loss/train': 2.0261423587799072} -09/20/2021 23:54:23 - INFO - __main__ - Step 43483: {'lr': 0.00019921386676740693, 'samples': 1391456, 'steps': 2717, 'loss/train': 3.2502102851867676} -09/20/2021 23:54:24 - INFO - __main__ - Step 43484: {'lr': 0.00019921386676740693, 'samples': 1391488, 'steps': 2717, 'loss/train': 2.3104333877563477} -09/20/2021 23:54:24 - INFO - __main__ - Step 43485: {'lr': 0.00019921386676740693, 'samples': 1391520, 'steps': 2717, 'loss/train': 2.239962100982666} -09/20/2021 23:54:25 - INFO - __main__ - Step 43486: {'lr': 0.00019921386676740693, 'samples': 1391552, 'steps': 2717, 'loss/train': 2.3119654655456543} -09/20/2021 23:54:26 - INFO - __main__ - Step 43487: {'lr': 0.00019921386676740693, 'samples': 1391584, 'steps': 2717, 'loss/train': 2.7972915172576904} -09/20/2021 23:54:27 - INFO - __main__ - Step 43488: {'lr': 0.00019921386676740693, 'samples': 1391616, 'steps': 2717, 'loss/train': 2.0426228046417236} -09/20/2021 23:54:28 - INFO - __main__ - Step 43489: {'lr': 0.0001992130682924504, 'samples': 1391648, 'steps': 2718, 'loss/train': 1.650762677192688} -09/20/2021 23:54:28 - INFO - __main__ - Step 43490: {'lr': 0.0001992130682924504, 'samples': 1391680, 'steps': 2718, 'loss/train': 3.002521514892578} -09/20/2021 23:54:29 - INFO - __main__ - Step 43491: {'lr': 0.0001992130682924504, 'samples': 1391712, 'steps': 2718, 'loss/train': 2.0257697105407715} -09/20/2021 23:54:30 - INFO - __main__ - Step 43492: {'lr': 0.0001992130682924504, 'samples': 1391744, 'steps': 2718, 'loss/train': 2.270322322845459} -09/20/2021 23:54:31 - INFO - __main__ - Step 43493: {'lr': 0.0001992130682924504, 'samples': 1391776, 'steps': 2718, 'loss/train': 0.16497646272182465} -09/20/2021 23:54:31 - INFO - __main__ - Step 43494: {'lr': 0.0001992130682924504, 'samples': 1391808, 'steps': 2718, 'loss/train': 0.14804160594940186} -09/20/2021 23:54:32 - INFO - __main__ - Step 43495: {'lr': 0.0001992130682924504, 'samples': 1391840, 'steps': 2718, 'loss/train': 0.5296812653541565} -09/20/2021 23:54:33 - INFO - __main__ - Step 43496: {'lr': 0.0001992130682924504, 'samples': 1391872, 'steps': 2718, 'loss/train': 1.6702409982681274} -09/20/2021 23:54:34 - INFO - __main__ - Step 43497: {'lr': 0.0001992130682924504, 'samples': 1391904, 'steps': 2718, 'loss/train': 1.9609609842300415} -09/20/2021 23:54:34 - INFO - __main__ - Step 43498: {'lr': 0.0001992130682924504, 'samples': 1391936, 'steps': 2718, 'loss/train': 3.5526154041290283} -09/20/2021 23:54:35 - INFO - __main__ - Step 43499: {'lr': 0.0001992130682924504, 'samples': 1391968, 'steps': 2718, 'loss/train': 2.439054012298584} -09/20/2021 23:54:36 - INFO - __main__ - Step 43500: {'lr': 0.0001992130682924504, 'samples': 1392000, 'steps': 2718, 'loss/train': 2.2374260425567627} -09/20/2021 23:54:37 - INFO - __main__ - Step 43501: {'lr': 0.0001992130682924504, 'samples': 1392032, 'steps': 2718, 'loss/train': 2.2644476890563965} -09/20/2021 23:54:37 - INFO - __main__ - Step 43502: {'lr': 0.0001992130682924504, 'samples': 1392064, 'steps': 2718, 'loss/train': 3.670100212097168} -09/20/2021 23:54:38 - INFO - __main__ - Step 43503: {'lr': 0.0001992130682924504, 'samples': 1392096, 'steps': 2718, 'loss/train': 4.5899248123168945} -09/20/2021 23:54:39 - INFO - __main__ - Step 43504: {'lr': 0.0001992130682924504, 'samples': 1392128, 'steps': 2718, 'loss/train': 3.3614258766174316} -09/20/2021 23:54:40 - INFO - __main__ - Step 43505: {'lr': 0.00019921226941379625, 'samples': 1392160, 'steps': 2719, 'loss/train': 3.4657700061798096} -09/20/2021 23:54:40 - INFO - __main__ - Step 43506: {'lr': 0.00019921226941379625, 'samples': 1392192, 'steps': 2719, 'loss/train': 4.023043632507324} -09/20/2021 23:54:41 - INFO - __main__ - Step 43507: {'lr': 0.00019921226941379625, 'samples': 1392224, 'steps': 2719, 'loss/train': 1.6821579933166504} -09/20/2021 23:54:42 - INFO - __main__ - Step 43508: {'lr': 0.00019921226941379625, 'samples': 1392256, 'steps': 2719, 'loss/train': 2.7218589782714844} -09/20/2021 23:54:43 - INFO - __main__ - Step 43509: {'lr': 0.00019921226941379625, 'samples': 1392288, 'steps': 2719, 'loss/train': 0.9615819454193115} -09/20/2021 23:54:43 - INFO - __main__ - Step 43510: {'lr': 0.00019921226941379625, 'samples': 1392320, 'steps': 2719, 'loss/train': 2.7724528312683105} -09/20/2021 23:54:44 - INFO - __main__ - Step 43511: {'lr': 0.00019921226941379625, 'samples': 1392352, 'steps': 2719, 'loss/train': 2.3215107917785645} -09/20/2021 23:54:45 - INFO - __main__ - Step 43512: {'lr': 0.00019921226941379625, 'samples': 1392384, 'steps': 2719, 'loss/train': 2.4414424896240234} -09/20/2021 23:54:46 - INFO - __main__ - Step 43513: {'lr': 0.00019921226941379625, 'samples': 1392416, 'steps': 2719, 'loss/train': 2.4495670795440674} -09/20/2021 23:54:46 - INFO - __main__ - Step 43514: {'lr': 0.00019921226941379625, 'samples': 1392448, 'steps': 2719, 'loss/train': 2.41060209274292} -09/20/2021 23:54:47 - INFO - __main__ - Step 43515: {'lr': 0.00019921226941379625, 'samples': 1392480, 'steps': 2719, 'loss/train': 2.441927194595337} -09/20/2021 23:54:48 - INFO - __main__ - Step 43516: {'lr': 0.00019921226941379625, 'samples': 1392512, 'steps': 2719, 'loss/train': 2.519082546234131} -09/20/2021 23:54:49 - INFO - __main__ - Step 43517: {'lr': 0.00019921226941379625, 'samples': 1392544, 'steps': 2719, 'loss/train': 2.432842254638672} -09/20/2021 23:54:49 - INFO - __main__ - Step 43518: {'lr': 0.00019921226941379625, 'samples': 1392576, 'steps': 2719, 'loss/train': 2.3747265338897705} -09/20/2021 23:54:50 - INFO - __main__ - Step 43519: {'lr': 0.00019921226941379625, 'samples': 1392608, 'steps': 2719, 'loss/train': 2.488308906555176} -09/20/2021 23:54:52 - INFO - __main__ - Step 43520: {'lr': 0.00019921226941379625, 'samples': 1392640, 'steps': 2719, 'loss/train': 2.4336209297180176} -09/20/2021 23:54:53 - INFO - __main__ - Step 43521: {'lr': 0.0001992114701314478, 'samples': 1392672, 'steps': 2720, 'loss/train': 2.185699462890625} -09/20/2021 23:54:53 - INFO - __main__ - Step 43522: {'lr': 0.0001992114701314478, 'samples': 1392704, 'steps': 2720, 'loss/train': 2.818774461746216} -09/20/2021 23:54:54 - INFO - __main__ - Step 43523: {'lr': 0.0001992114701314478, 'samples': 1392736, 'steps': 2720, 'loss/train': 2.0031399726867676} -09/20/2021 23:54:55 - INFO - __main__ - Step 43524: {'lr': 0.0001992114701314478, 'samples': 1392768, 'steps': 2720, 'loss/train': 2.2942044734954834} -09/20/2021 23:54:56 - INFO - __main__ - Step 43525: {'lr': 0.0001992114701314478, 'samples': 1392800, 'steps': 2720, 'loss/train': 3.228891134262085} -09/20/2021 23:54:56 - INFO - __main__ - Step 43526: {'lr': 0.0001992114701314478, 'samples': 1392832, 'steps': 2720, 'loss/train': 1.8729501962661743} -09/20/2021 23:54:57 - INFO - __main__ - Step 43527: {'lr': 0.0001992114701314478, 'samples': 1392864, 'steps': 2720, 'loss/train': 1.8628987073898315} -09/20/2021 23:54:58 - INFO - __main__ - Step 43528: {'lr': 0.0001992114701314478, 'samples': 1392896, 'steps': 2720, 'loss/train': 1.8166611194610596} -09/20/2021 23:54:59 - INFO - __main__ - Step 43529: {'lr': 0.0001992114701314478, 'samples': 1392928, 'steps': 2720, 'loss/train': 1.6616218090057373} -09/20/2021 23:54:59 - INFO - __main__ - Step 43530: {'lr': 0.0001992114701314478, 'samples': 1392960, 'steps': 2720, 'loss/train': 1.8492144346237183} -09/20/2021 23:55:00 - INFO - __main__ - Step 43531: {'lr': 0.0001992114701314478, 'samples': 1392992, 'steps': 2720, 'loss/train': 2.128857374191284} -09/20/2021 23:55:01 - INFO - __main__ - Step 43532: {'lr': 0.0001992114701314478, 'samples': 1393024, 'steps': 2720, 'loss/train': 1.645361304283142} -09/20/2021 23:55:02 - INFO - __main__ - Step 43533: {'lr': 0.0001992114701314478, 'samples': 1393056, 'steps': 2720, 'loss/train': 2.9173524379730225} -09/20/2021 23:55:02 - INFO - __main__ - Step 43534: {'lr': 0.0001992114701314478, 'samples': 1393088, 'steps': 2720, 'loss/train': 2.3628344535827637} -09/20/2021 23:55:03 - INFO - __main__ - Step 43535: {'lr': 0.0001992114701314478, 'samples': 1393120, 'steps': 2720, 'loss/train': 2.3523433208465576} -09/20/2021 23:55:04 - INFO - __main__ - Step 43536: {'lr': 0.0001992114701314478, 'samples': 1393152, 'steps': 2720, 'loss/train': 1.5720691680908203} -09/20/2021 23:55:05 - INFO - __main__ - Step 43537: {'lr': 0.00019921067044540824, 'samples': 1393184, 'steps': 2721, 'loss/train': 1.4071664810180664} -09/20/2021 23:55:05 - INFO - __main__ - Step 43538: {'lr': 0.00019921067044540824, 'samples': 1393216, 'steps': 2721, 'loss/train': 2.556790351867676} -09/20/2021 23:55:06 - INFO - __main__ - Step 43539: {'lr': 0.00019921067044540824, 'samples': 1393248, 'steps': 2721, 'loss/train': 2.0638723373413086} -09/20/2021 23:55:07 - INFO - __main__ - Step 43540: {'lr': 0.00019921067044540824, 'samples': 1393280, 'steps': 2721, 'loss/train': 1.7696326971054077} -09/20/2021 23:55:08 - INFO - __main__ - Step 43541: {'lr': 0.00019921067044540824, 'samples': 1393312, 'steps': 2721, 'loss/train': 1.9016156196594238} -09/20/2021 23:55:08 - INFO - __main__ - Step 43542: {'lr': 0.00019921067044540824, 'samples': 1393344, 'steps': 2721, 'loss/train': 1.9597089290618896} -09/20/2021 23:55:09 - INFO - __main__ - Step 43543: {'lr': 0.00019921067044540824, 'samples': 1393376, 'steps': 2721, 'loss/train': 2.3827195167541504} -09/20/2021 23:55:10 - INFO - __main__ - Step 43544: {'lr': 0.00019921067044540824, 'samples': 1393408, 'steps': 2721, 'loss/train': 2.3387889862060547} -09/20/2021 23:55:11 - INFO - __main__ - Step 43545: {'lr': 0.00019921067044540824, 'samples': 1393440, 'steps': 2721, 'loss/train': 1.8756709098815918} -09/20/2021 23:55:11 - INFO - __main__ - Step 43546: {'lr': 0.00019921067044540824, 'samples': 1393472, 'steps': 2721, 'loss/train': 1.6169816255569458} -09/20/2021 23:55:12 - INFO - __main__ - Step 43547: {'lr': 0.00019921067044540824, 'samples': 1393504, 'steps': 2721, 'loss/train': 1.9838119745254517} -09/20/2021 23:55:13 - INFO - __main__ - Step 43548: {'lr': 0.00019921067044540824, 'samples': 1393536, 'steps': 2721, 'loss/train': 1.330308198928833} -09/20/2021 23:55:14 - INFO - __main__ - Step 43549: {'lr': 0.00019921067044540824, 'samples': 1393568, 'steps': 2721, 'loss/train': 2.088779926300049} -09/20/2021 23:55:14 - INFO - __main__ - Step 43550: {'lr': 0.00019921067044540824, 'samples': 1393600, 'steps': 2721, 'loss/train': 2.150481700897217} -09/20/2021 23:55:16 - INFO - __main__ - Step 43551: {'lr': 0.00019921067044540824, 'samples': 1393632, 'steps': 2721, 'loss/train': 2.4438235759735107} -09/20/2021 23:55:16 - INFO - __main__ - Step 43552: {'lr': 0.00019921067044540824, 'samples': 1393664, 'steps': 2721, 'loss/train': 2.234042167663574} -09/20/2021 23:55:17 - INFO - __main__ - Step 43553: {'lr': 0.00019920987035568086, 'samples': 1393696, 'steps': 2722, 'loss/train': 2.2468206882476807} -09/20/2021 23:55:18 - INFO - __main__ - Step 43554: {'lr': 0.00019920987035568086, 'samples': 1393728, 'steps': 2722, 'loss/train': 2.287109136581421} -09/20/2021 23:55:19 - INFO - __main__ - Step 43555: {'lr': 0.00019920987035568086, 'samples': 1393760, 'steps': 2722, 'loss/train': 1.2455453872680664} -09/20/2021 23:55:20 - INFO - __main__ - Step 43556: {'lr': 0.00019920987035568086, 'samples': 1393792, 'steps': 2722, 'loss/train': 1.256398320198059} -09/20/2021 23:55:20 - INFO - __main__ - Step 43557: {'lr': 0.00019920987035568086, 'samples': 1393824, 'steps': 2722, 'loss/train': 1.1919161081314087} -09/20/2021 23:55:21 - INFO - __main__ - Step 43558: {'lr': 0.00019920987035568086, 'samples': 1393856, 'steps': 2722, 'loss/train': 3.1896109580993652} -09/20/2021 23:55:22 - INFO - __main__ - Step 43559: {'lr': 0.00019920987035568086, 'samples': 1393888, 'steps': 2722, 'loss/train': 1.1771637201309204} -09/20/2021 23:55:23 - INFO - __main__ - Step 43560: {'lr': 0.00019920987035568086, 'samples': 1393920, 'steps': 2722, 'loss/train': 2.034071922302246} -09/20/2021 23:55:23 - INFO - __main__ - Step 43561: {'lr': 0.00019920987035568086, 'samples': 1393952, 'steps': 2722, 'loss/train': 1.6390979290008545} -09/20/2021 23:55:24 - INFO - __main__ - Step 43562: {'lr': 0.00019920987035568086, 'samples': 1393984, 'steps': 2722, 'loss/train': 1.7699744701385498} -09/20/2021 23:55:25 - INFO - __main__ - Step 43563: {'lr': 0.00019920987035568086, 'samples': 1394016, 'steps': 2722, 'loss/train': 3.3947947025299072} -09/20/2021 23:55:26 - INFO - __main__ - Step 43564: {'lr': 0.00019920987035568086, 'samples': 1394048, 'steps': 2722, 'loss/train': 1.9797122478485107} -09/20/2021 23:55:26 - INFO - __main__ - Step 43565: {'lr': 0.00019920987035568086, 'samples': 1394080, 'steps': 2722, 'loss/train': 0.4940209984779358} -09/20/2021 23:55:27 - INFO - __main__ - Step 43566: {'lr': 0.00019920987035568086, 'samples': 1394112, 'steps': 2722, 'loss/train': 1.7999173402786255} -09/20/2021 23:55:28 - INFO - __main__ - Step 43567: {'lr': 0.00019920987035568086, 'samples': 1394144, 'steps': 2722, 'loss/train': 2.652550458908081} -09/20/2021 23:55:29 - INFO - __main__ - Step 43568: {'lr': 0.00019920987035568086, 'samples': 1394176, 'steps': 2722, 'loss/train': 2.3800323009490967} -09/20/2021 23:55:29 - INFO - __main__ - Step 43569: {'lr': 0.00019920906986226888, 'samples': 1394208, 'steps': 2723, 'loss/train': 1.6543099880218506} -09/20/2021 23:55:30 - INFO - __main__ - Step 43570: {'lr': 0.00019920906986226888, 'samples': 1394240, 'steps': 2723, 'loss/train': 3.0777394771575928} -09/20/2021 23:55:31 - INFO - __main__ - Step 43571: {'lr': 0.00019920906986226888, 'samples': 1394272, 'steps': 2723, 'loss/train': 2.0338997840881348} -09/20/2021 23:55:32 - INFO - __main__ - Step 43572: {'lr': 0.00019920906986226888, 'samples': 1394304, 'steps': 2723, 'loss/train': 2.7992911338806152} -09/20/2021 23:55:32 - INFO - __main__ - Step 43573: {'lr': 0.00019920906986226888, 'samples': 1394336, 'steps': 2723, 'loss/train': 2.0765812397003174} -09/20/2021 23:55:33 - INFO - __main__ - Step 43574: {'lr': 0.00019920906986226888, 'samples': 1394368, 'steps': 2723, 'loss/train': 2.312390089035034} -09/20/2021 23:55:34 - INFO - __main__ - Step 43575: {'lr': 0.00019920906986226888, 'samples': 1394400, 'steps': 2723, 'loss/train': 2.2796030044555664} -09/20/2021 23:55:35 - INFO - __main__ - Step 43576: {'lr': 0.00019920906986226888, 'samples': 1394432, 'steps': 2723, 'loss/train': 2.3987205028533936} -09/20/2021 23:55:35 - INFO - __main__ - Step 43577: {'lr': 0.00019920906986226888, 'samples': 1394464, 'steps': 2723, 'loss/train': 2.333608627319336} -09/20/2021 23:55:36 - INFO - __main__ - Step 43578: {'lr': 0.00019920906986226888, 'samples': 1394496, 'steps': 2723, 'loss/train': 2.528974771499634} -09/20/2021 23:55:37 - INFO - __main__ - Step 43579: {'lr': 0.00019920906986226888, 'samples': 1394528, 'steps': 2723, 'loss/train': 1.7381819486618042} -09/20/2021 23:55:38 - INFO - __main__ - Step 43580: {'lr': 0.00019920906986226888, 'samples': 1394560, 'steps': 2723, 'loss/train': 2.044658660888672} -09/20/2021 23:55:39 - INFO - __main__ - Step 43581: {'lr': 0.00019920906986226888, 'samples': 1394592, 'steps': 2723, 'loss/train': 2.286191940307617} -09/20/2021 23:55:40 - INFO - __main__ - Step 43582: {'lr': 0.00019920906986226888, 'samples': 1394624, 'steps': 2723, 'loss/train': 2.497222423553467} -09/20/2021 23:55:41 - INFO - __main__ - Step 43583: {'lr': 0.00019920906986226888, 'samples': 1394656, 'steps': 2723, 'loss/train': 3.100006341934204} -09/20/2021 23:55:41 - INFO - __main__ - Step 43584: {'lr': 0.00019920906986226888, 'samples': 1394688, 'steps': 2723, 'loss/train': 0.8012105822563171} -09/20/2021 23:55:42 - INFO - __main__ - Step 43585: {'lr': 0.0001992082689651756, 'samples': 1394720, 'steps': 2724, 'loss/train': 1.8898018598556519} -09/20/2021 23:55:43 - INFO - __main__ - Step 43586: {'lr': 0.0001992082689651756, 'samples': 1394752, 'steps': 2724, 'loss/train': 2.936128616333008} -09/20/2021 23:55:44 - INFO - __main__ - Step 43587: {'lr': 0.0001992082689651756, 'samples': 1394784, 'steps': 2724, 'loss/train': 2.4139087200164795} -09/20/2021 23:55:44 - INFO - __main__ - Step 43588: {'lr': 0.0001992082689651756, 'samples': 1394816, 'steps': 2724, 'loss/train': 1.7681244611740112} -09/20/2021 23:55:45 - INFO - __main__ - Step 43589: {'lr': 0.0001992082689651756, 'samples': 1394848, 'steps': 2724, 'loss/train': 2.129542112350464} -09/20/2021 23:55:46 - INFO - __main__ - Step 43590: {'lr': 0.0001992082689651756, 'samples': 1394880, 'steps': 2724, 'loss/train': 2.1209614276885986} -09/20/2021 23:55:47 - INFO - __main__ - Step 43591: {'lr': 0.0001992082689651756, 'samples': 1394912, 'steps': 2724, 'loss/train': 2.4092111587524414} -09/20/2021 23:55:47 - INFO - __main__ - Step 43592: {'lr': 0.0001992082689651756, 'samples': 1394944, 'steps': 2724, 'loss/train': 2.072204113006592} -09/20/2021 23:55:48 - INFO - __main__ - Step 43593: {'lr': 0.0001992082689651756, 'samples': 1394976, 'steps': 2724, 'loss/train': 2.0732421875} -09/20/2021 23:55:49 - INFO - __main__ - Step 43594: {'lr': 0.0001992082689651756, 'samples': 1395008, 'steps': 2724, 'loss/train': 3.195638656616211} -09/20/2021 23:55:50 - INFO - __main__ - Step 43595: {'lr': 0.0001992082689651756, 'samples': 1395040, 'steps': 2724, 'loss/train': 2.7562286853790283} -09/20/2021 23:55:50 - INFO - __main__ - Step 43596: {'lr': 0.0001992082689651756, 'samples': 1395072, 'steps': 2724, 'loss/train': 2.32377028465271} -09/20/2021 23:55:51 - INFO - __main__ - Step 43597: {'lr': 0.0001992082689651756, 'samples': 1395104, 'steps': 2724, 'loss/train': 0.5770837068557739} -09/20/2021 23:55:52 - INFO - __main__ - Step 43598: {'lr': 0.0001992082689651756, 'samples': 1395136, 'steps': 2724, 'loss/train': 1.800925374031067} -09/20/2021 23:55:53 - INFO - __main__ - Step 43599: {'lr': 0.0001992082689651756, 'samples': 1395168, 'steps': 2724, 'loss/train': 1.8409463167190552} -09/20/2021 23:55:53 - INFO - __main__ - Step 43600: {'lr': 0.0001992082689651756, 'samples': 1395200, 'steps': 2724, 'loss/train': 1.972386121749878} -09/20/2021 23:55:54 - INFO - __main__ - Step 43601: {'lr': 0.0001992074676644043, 'samples': 1395232, 'steps': 2725, 'loss/train': 2.070507287979126} -09/20/2021 23:55:55 - INFO - __main__ - Step 43602: {'lr': 0.0001992074676644043, 'samples': 1395264, 'steps': 2725, 'loss/train': 2.3921971321105957} -09/20/2021 23:55:56 - INFO - __main__ - Step 43603: {'lr': 0.0001992074676644043, 'samples': 1395296, 'steps': 2725, 'loss/train': 2.347142457962036} -09/20/2021 23:55:57 - INFO - __main__ - Step 43604: {'lr': 0.0001992074676644043, 'samples': 1395328, 'steps': 2725, 'loss/train': 1.2935364246368408} -09/20/2021 23:55:57 - INFO - __main__ - Step 43605: {'lr': 0.0001992074676644043, 'samples': 1395360, 'steps': 2725, 'loss/train': 0.9445818662643433} -09/20/2021 23:55:58 - INFO - __main__ - Step 43606: {'lr': 0.0001992074676644043, 'samples': 1395392, 'steps': 2725, 'loss/train': 2.4386308193206787} -09/20/2021 23:55:59 - INFO - __main__ - Step 43607: {'lr': 0.0001992074676644043, 'samples': 1395424, 'steps': 2725, 'loss/train': 1.2192823886871338} -09/20/2021 23:56:00 - INFO - __main__ - Step 43608: {'lr': 0.0001992074676644043, 'samples': 1395456, 'steps': 2725, 'loss/train': 1.8933275938034058} -09/20/2021 23:56:00 - INFO - __main__ - Step 43609: {'lr': 0.0001992074676644043, 'samples': 1395488, 'steps': 2725, 'loss/train': 1.7974770069122314} -09/20/2021 23:56:01 - INFO - __main__ - Step 43610: {'lr': 0.0001992074676644043, 'samples': 1395520, 'steps': 2725, 'loss/train': 1.7629683017730713} -09/20/2021 23:56:02 - INFO - __main__ - Step 43611: {'lr': 0.0001992074676644043, 'samples': 1395552, 'steps': 2725, 'loss/train': 2.395984649658203} -09/20/2021 23:56:03 - INFO - __main__ - Step 43612: {'lr': 0.0001992074676644043, 'samples': 1395584, 'steps': 2725, 'loss/train': 1.4214023351669312} -09/20/2021 23:56:04 - INFO - __main__ - Step 43613: {'lr': 0.0001992074676644043, 'samples': 1395616, 'steps': 2725, 'loss/train': 2.55168080329895} -09/20/2021 23:56:05 - INFO - __main__ - Step 43614: {'lr': 0.0001992074676644043, 'samples': 1395648, 'steps': 2725, 'loss/train': 1.3233722448349} -09/20/2021 23:56:05 - INFO - __main__ - Step 43615: {'lr': 0.0001992074676644043, 'samples': 1395680, 'steps': 2725, 'loss/train': 2.8869030475616455} -09/20/2021 23:56:06 - INFO - __main__ - Step 43616: {'lr': 0.0001992074676644043, 'samples': 1395712, 'steps': 2725, 'loss/train': 1.888781189918518} -09/20/2021 23:56:07 - INFO - __main__ - Step 43617: {'lr': 0.0001992066659599581, 'samples': 1395744, 'steps': 2726, 'loss/train': 2.01143217086792} -09/20/2021 23:56:08 - INFO - __main__ - Step 43618: {'lr': 0.0001992066659599581, 'samples': 1395776, 'steps': 2726, 'loss/train': 2.1396822929382324} -09/20/2021 23:56:09 - INFO - __main__ - Step 43619: {'lr': 0.0001992066659599581, 'samples': 1395808, 'steps': 2726, 'loss/train': 1.4330062866210938} -09/20/2021 23:56:09 - INFO - __main__ - Step 43620: {'lr': 0.0001992066659599581, 'samples': 1395840, 'steps': 2726, 'loss/train': 1.8133677244186401} -09/20/2021 23:56:10 - INFO - __main__ - Step 43621: {'lr': 0.0001992066659599581, 'samples': 1395872, 'steps': 2726, 'loss/train': 1.7882187366485596} -09/20/2021 23:56:11 - INFO - __main__ - Step 43622: {'lr': 0.0001992066659599581, 'samples': 1395904, 'steps': 2726, 'loss/train': 2.501514196395874} -09/20/2021 23:56:12 - INFO - __main__ - Step 43623: {'lr': 0.0001992066659599581, 'samples': 1395936, 'steps': 2726, 'loss/train': 2.494515895843506} -09/20/2021 23:56:12 - INFO - __main__ - Step 43624: {'lr': 0.0001992066659599581, 'samples': 1395968, 'steps': 2726, 'loss/train': 1.98759925365448} -09/20/2021 23:56:13 - INFO - __main__ - Step 43625: {'lr': 0.0001992066659599581, 'samples': 1396000, 'steps': 2726, 'loss/train': 1.2373584508895874} -09/20/2021 23:56:14 - INFO - __main__ - Step 43626: {'lr': 0.0001992066659599581, 'samples': 1396032, 'steps': 2726, 'loss/train': 3.0920000076293945} -09/20/2021 23:56:15 - INFO - __main__ - Step 43627: {'lr': 0.0001992066659599581, 'samples': 1396064, 'steps': 2726, 'loss/train': 2.3966784477233887} -09/20/2021 23:56:15 - INFO - __main__ - Step 43628: {'lr': 0.0001992066659599581, 'samples': 1396096, 'steps': 2726, 'loss/train': 1.884350299835205} -09/20/2021 23:56:16 - INFO - __main__ - Step 43629: {'lr': 0.0001992066659599581, 'samples': 1396128, 'steps': 2726, 'loss/train': 2.5177838802337646} -09/20/2021 23:56:17 - INFO - __main__ - Step 43630: {'lr': 0.0001992066659599581, 'samples': 1396160, 'steps': 2726, 'loss/train': 1.9757063388824463} -09/20/2021 23:56:18 - INFO - __main__ - Step 43631: {'lr': 0.0001992066659599581, 'samples': 1396192, 'steps': 2726, 'loss/train': 2.3066487312316895} -09/20/2021 23:56:18 - INFO - __main__ - Step 43632: {'lr': 0.0001992066659599581, 'samples': 1396224, 'steps': 2726, 'loss/train': 2.3394038677215576} -09/20/2021 23:56:19 - INFO - __main__ - Step 43633: {'lr': 0.00019920586385184044, 'samples': 1396256, 'steps': 2727, 'loss/train': 1.983099341392517} -09/20/2021 23:56:20 - INFO - __main__ - Step 43634: {'lr': 0.00019920586385184044, 'samples': 1396288, 'steps': 2727, 'loss/train': 2.354408025741577} -09/20/2021 23:56:21 - INFO - __main__ - Step 43635: {'lr': 0.00019920586385184044, 'samples': 1396320, 'steps': 2727, 'loss/train': 2.2669217586517334} -09/20/2021 23:56:21 - INFO - __main__ - Step 43636: {'lr': 0.00019920586385184044, 'samples': 1396352, 'steps': 2727, 'loss/train': 0.8149828910827637} -09/20/2021 23:56:22 - INFO - __main__ - Step 43637: {'lr': 0.00019920586385184044, 'samples': 1396384, 'steps': 2727, 'loss/train': 2.276667833328247} -09/20/2021 23:56:23 - INFO - __main__ - Step 43638: {'lr': 0.00019920586385184044, 'samples': 1396416, 'steps': 2727, 'loss/train': 1.6491498947143555} -09/20/2021 23:56:24 - INFO - __main__ - Step 43639: {'lr': 0.00019920586385184044, 'samples': 1396448, 'steps': 2727, 'loss/train': 2.139167547225952} -09/20/2021 23:56:24 - INFO - __main__ - Step 43640: {'lr': 0.00019920586385184044, 'samples': 1396480, 'steps': 2727, 'loss/train': 2.4155478477478027} -09/20/2021 23:56:25 - INFO - __main__ - Step 43641: {'lr': 0.00019920586385184044, 'samples': 1396512, 'steps': 2727, 'loss/train': 1.887584924697876} -09/20/2021 23:56:26 - INFO - __main__ - Step 43642: {'lr': 0.00019920586385184044, 'samples': 1396544, 'steps': 2727, 'loss/train': 2.6381676197052} -09/20/2021 23:56:27 - INFO - __main__ - Step 43643: {'lr': 0.00019920586385184044, 'samples': 1396576, 'steps': 2727, 'loss/train': 2.61112904548645} -09/20/2021 23:56:28 - INFO - __main__ - Step 43644: {'lr': 0.00019920586385184044, 'samples': 1396608, 'steps': 2727, 'loss/train': 2.268850326538086} -09/20/2021 23:56:29 - INFO - __main__ - Step 43645: {'lr': 0.00019920586385184044, 'samples': 1396640, 'steps': 2727, 'loss/train': 2.911963701248169} -09/20/2021 23:56:29 - INFO - __main__ - Step 43646: {'lr': 0.00019920586385184044, 'samples': 1396672, 'steps': 2727, 'loss/train': 2.1179580688476562} -09/20/2021 23:56:30 - INFO - __main__ - Step 43647: {'lr': 0.00019920586385184044, 'samples': 1396704, 'steps': 2727, 'loss/train': 1.4176619052886963} -09/20/2021 23:56:31 - INFO - __main__ - Step 43648: {'lr': 0.00019920586385184044, 'samples': 1396736, 'steps': 2727, 'loss/train': 1.4184695482254028} -09/20/2021 23:56:32 - INFO - __main__ - Step 43649: {'lr': 0.00019920506134005447, 'samples': 1396768, 'steps': 2728, 'loss/train': 1.7666587829589844} -09/20/2021 23:56:33 - INFO - __main__ - Step 43650: {'lr': 0.00019920506134005447, 'samples': 1396800, 'steps': 2728, 'loss/train': 1.9774216413497925} -09/20/2021 23:56:33 - INFO - __main__ - Step 43651: {'lr': 0.00019920506134005447, 'samples': 1396832, 'steps': 2728, 'loss/train': 2.090038299560547} -09/20/2021 23:56:34 - INFO - __main__ - Step 43652: {'lr': 0.00019920506134005447, 'samples': 1396864, 'steps': 2728, 'loss/train': 2.3897905349731445} -09/20/2021 23:56:35 - INFO - __main__ - Step 43653: {'lr': 0.00019920506134005447, 'samples': 1396896, 'steps': 2728, 'loss/train': 1.9427666664123535} -09/20/2021 23:56:36 - INFO - __main__ - Step 43654: {'lr': 0.00019920506134005447, 'samples': 1396928, 'steps': 2728, 'loss/train': 2.436600685119629} -09/20/2021 23:56:36 - INFO - __main__ - Step 43655: {'lr': 0.00019920506134005447, 'samples': 1396960, 'steps': 2728, 'loss/train': 1.5845905542373657} -09/20/2021 23:56:37 - INFO - __main__ - Step 43656: {'lr': 0.00019920506134005447, 'samples': 1396992, 'steps': 2728, 'loss/train': 2.21923565864563} -09/20/2021 23:56:38 - INFO - __main__ - Step 43657: {'lr': 0.00019920506134005447, 'samples': 1397024, 'steps': 2728, 'loss/train': 3.122415542602539} -09/20/2021 23:56:39 - INFO - __main__ - Step 43658: {'lr': 0.00019920506134005447, 'samples': 1397056, 'steps': 2728, 'loss/train': 1.0077626705169678} -09/20/2021 23:56:39 - INFO - __main__ - Step 43659: {'lr': 0.00019920506134005447, 'samples': 1397088, 'steps': 2728, 'loss/train': 2.1144847869873047} -09/20/2021 23:56:40 - INFO - __main__ - Step 43660: {'lr': 0.00019920506134005447, 'samples': 1397120, 'steps': 2728, 'loss/train': 2.655139446258545} -09/20/2021 23:56:41 - INFO - __main__ - Step 43661: {'lr': 0.00019920506134005447, 'samples': 1397152, 'steps': 2728, 'loss/train': 2.744945764541626} -09/20/2021 23:56:42 - INFO - __main__ - Step 43662: {'lr': 0.00019920506134005447, 'samples': 1397184, 'steps': 2728, 'loss/train': 2.35884690284729} -09/20/2021 23:56:42 - INFO - __main__ - Step 43663: {'lr': 0.00019920506134005447, 'samples': 1397216, 'steps': 2728, 'loss/train': 1.504653811454773} -09/20/2021 23:56:43 - INFO - __main__ - Step 43664: {'lr': 0.00019920506134005447, 'samples': 1397248, 'steps': 2728, 'loss/train': 3.4861860275268555} -09/20/2021 23:56:44 - INFO - __main__ - Step 43665: {'lr': 0.00019920425842460352, 'samples': 1397280, 'steps': 2729, 'loss/train': 2.473188638687134} -09/20/2021 23:56:45 - INFO - __main__ - Step 43666: {'lr': 0.00019920425842460352, 'samples': 1397312, 'steps': 2729, 'loss/train': 2.7525768280029297} -09/20/2021 23:56:45 - INFO - __main__ - Step 43667: {'lr': 0.00019920425842460352, 'samples': 1397344, 'steps': 2729, 'loss/train': 1.7790900468826294} -09/20/2021 23:56:46 - INFO - __main__ - Step 43668: {'lr': 0.00019920425842460352, 'samples': 1397376, 'steps': 2729, 'loss/train': 1.4026708602905273} -09/20/2021 23:56:47 - INFO - __main__ - Step 43669: {'lr': 0.00019920425842460352, 'samples': 1397408, 'steps': 2729, 'loss/train': 2.92486572265625} -09/20/2021 23:56:48 - INFO - __main__ - Step 43670: {'lr': 0.00019920425842460352, 'samples': 1397440, 'steps': 2729, 'loss/train': 2.1111667156219482} -09/20/2021 23:56:48 - INFO - __main__ - Step 43671: {'lr': 0.00019920425842460352, 'samples': 1397472, 'steps': 2729, 'loss/train': 2.391900062561035} -09/20/2021 23:56:49 - INFO - __main__ - Step 43672: {'lr': 0.00019920425842460352, 'samples': 1397504, 'steps': 2729, 'loss/train': 1.9907034635543823} -09/20/2021 23:56:51 - INFO - __main__ - Step 43673: {'lr': 0.00019920425842460352, 'samples': 1397536, 'steps': 2729, 'loss/train': 2.084116220474243} -09/20/2021 23:56:52 - INFO - __main__ - Step 43674: {'lr': 0.00019920425842460352, 'samples': 1397568, 'steps': 2729, 'loss/train': 2.037987232208252} -09/20/2021 23:56:53 - INFO - __main__ - Step 43675: {'lr': 0.00019920425842460352, 'samples': 1397600, 'steps': 2729, 'loss/train': 1.2247830629348755} -09/20/2021 23:56:53 - INFO - __main__ - Step 43676: {'lr': 0.00019920425842460352, 'samples': 1397632, 'steps': 2729, 'loss/train': 2.0595452785491943} -09/20/2021 23:56:54 - INFO - __main__ - Step 43677: {'lr': 0.00019920425842460352, 'samples': 1397664, 'steps': 2729, 'loss/train': 1.1742876768112183} -09/20/2021 23:56:55 - INFO - __main__ - Step 43678: {'lr': 0.00019920425842460352, 'samples': 1397696, 'steps': 2729, 'loss/train': 0.8440008163452148} -09/20/2021 23:56:56 - INFO - __main__ - Step 43679: {'lr': 0.00019920425842460352, 'samples': 1397728, 'steps': 2729, 'loss/train': 0.8597447872161865} -09/20/2021 23:56:56 - INFO - __main__ - Step 43680: {'lr': 0.00019920425842460352, 'samples': 1397760, 'steps': 2729, 'loss/train': 0.5437193512916565} -09/20/2021 23:56:57 - INFO - __main__ - Step 43681: {'lr': 0.0001992034551054908, 'samples': 1397792, 'steps': 2730, 'loss/train': 0.536967396736145} -09/20/2021 23:56:58 - INFO - __main__ - Step 43682: {'lr': 0.0001992034551054908, 'samples': 1397824, 'steps': 2730, 'loss/train': 0.592631995677948} -09/20/2021 23:56:59 - INFO - __main__ - Step 43683: {'lr': 0.0001992034551054908, 'samples': 1397856, 'steps': 2730, 'loss/train': 0.5034891366958618} -09/20/2021 23:56:59 - INFO - __main__ - Step 43684: {'lr': 0.0001992034551054908, 'samples': 1397888, 'steps': 2730, 'loss/train': 0.4795246124267578} -09/20/2021 23:57:00 - INFO - __main__ - Step 43685: {'lr': 0.0001992034551054908, 'samples': 1397920, 'steps': 2730, 'loss/train': 0.3288189172744751} -09/20/2021 23:57:01 - INFO - __main__ - Step 43686: {'lr': 0.0001992034551054908, 'samples': 1397952, 'steps': 2730, 'loss/train': 1.7966125011444092} -09/20/2021 23:57:02 - INFO - __main__ - Step 43687: {'lr': 0.0001992034551054908, 'samples': 1397984, 'steps': 2730, 'loss/train': 1.484116792678833} -09/20/2021 23:57:02 - INFO - __main__ - Step 43688: {'lr': 0.0001992034551054908, 'samples': 1398016, 'steps': 2730, 'loss/train': 2.191528797149658} -09/20/2021 23:57:03 - INFO - __main__ - Step 43689: {'lr': 0.0001992034551054908, 'samples': 1398048, 'steps': 2730, 'loss/train': 1.5553793907165527} -09/20/2021 23:57:04 - INFO - __main__ - Step 43690: {'lr': 0.0001992034551054908, 'samples': 1398080, 'steps': 2730, 'loss/train': 1.5178141593933105} -09/20/2021 23:57:05 - INFO - __main__ - Step 43691: {'lr': 0.0001992034551054908, 'samples': 1398112, 'steps': 2730, 'loss/train': 1.8020020723342896} -09/20/2021 23:57:05 - INFO - __main__ - Step 43692: {'lr': 0.0001992034551054908, 'samples': 1398144, 'steps': 2730, 'loss/train': 2.1565656661987305} -09/20/2021 23:57:06 - INFO - __main__ - Step 43693: {'lr': 0.0001992034551054908, 'samples': 1398176, 'steps': 2730, 'loss/train': 2.3912665843963623} -09/20/2021 23:57:07 - INFO - __main__ - Step 43694: {'lr': 0.0001992034551054908, 'samples': 1398208, 'steps': 2730, 'loss/train': 1.306049108505249} -09/20/2021 23:57:08 - INFO - __main__ - Step 43695: {'lr': 0.0001992034551054908, 'samples': 1398240, 'steps': 2730, 'loss/train': 2.6917238235473633} -09/20/2021 23:57:08 - INFO - __main__ - Step 43696: {'lr': 0.0001992034551054908, 'samples': 1398272, 'steps': 2730, 'loss/train': 0.4783334732055664} -09/20/2021 23:57:09 - INFO - __main__ - Step 43697: {'lr': 0.0001992026513827196, 'samples': 1398304, 'steps': 2731, 'loss/train': 0.2243451327085495} -09/20/2021 23:57:10 - INFO - __main__ - Step 43698: {'lr': 0.0001992026513827196, 'samples': 1398336, 'steps': 2731, 'loss/train': 0.2705034911632538} -09/20/2021 23:57:11 - INFO - __main__ - Step 43699: {'lr': 0.0001992026513827196, 'samples': 1398368, 'steps': 2731, 'loss/train': 0.2871164381504059} -09/20/2021 23:57:12 - INFO - __main__ - Step 43700: {'lr': 0.0001992026513827196, 'samples': 1398400, 'steps': 2731, 'loss/train': 0.2822129428386688} -09/20/2021 23:57:12 - INFO - __main__ - Step 43701: {'lr': 0.0001992026513827196, 'samples': 1398432, 'steps': 2731, 'loss/train': 5.520656585693359} -09/20/2021 23:57:13 - INFO - __main__ - Step 43702: {'lr': 0.0001992026513827196, 'samples': 1398464, 'steps': 2731, 'loss/train': 1.5394634008407593} -09/20/2021 23:57:14 - INFO - __main__ - Step 43703: {'lr': 0.0001992026513827196, 'samples': 1398496, 'steps': 2731, 'loss/train': 2.5150814056396484} -09/20/2021 23:57:15 - INFO - __main__ - Step 43704: {'lr': 0.0001992026513827196, 'samples': 1398528, 'steps': 2731, 'loss/train': 1.3459001779556274} -09/20/2021 23:57:16 - INFO - __main__ - Step 43705: {'lr': 0.0001992026513827196, 'samples': 1398560, 'steps': 2731, 'loss/train': 1.7887420654296875} -09/20/2021 23:57:17 - INFO - __main__ - Step 43706: {'lr': 0.0001992026513827196, 'samples': 1398592, 'steps': 2731, 'loss/train': 1.8502168655395508} -09/20/2021 23:57:17 - INFO - __main__ - Step 43707: {'lr': 0.0001992026513827196, 'samples': 1398624, 'steps': 2731, 'loss/train': 1.8674235343933105} -09/20/2021 23:57:18 - INFO - __main__ - Step 43708: {'lr': 0.0001992026513827196, 'samples': 1398656, 'steps': 2731, 'loss/train': 2.1206374168395996} -09/20/2021 23:57:19 - INFO - __main__ - Step 43709: {'lr': 0.0001992026513827196, 'samples': 1398688, 'steps': 2731, 'loss/train': 1.9091870784759521} -09/20/2021 23:57:20 - INFO - __main__ - Step 43710: {'lr': 0.0001992026513827196, 'samples': 1398720, 'steps': 2731, 'loss/train': 0.38257208466529846} -09/20/2021 23:57:20 - INFO - __main__ - Step 43711: {'lr': 0.0001992026513827196, 'samples': 1398752, 'steps': 2731, 'loss/train': 2.1402997970581055} -09/20/2021 23:57:21 - INFO - __main__ - Step 43712: {'lr': 0.0001992026513827196, 'samples': 1398784, 'steps': 2731, 'loss/train': 1.949687123298645} -09/20/2021 23:57:22 - INFO - __main__ - Step 43713: {'lr': 0.00019920184725629323, 'samples': 1398816, 'steps': 2732, 'loss/train': 1.635901927947998} -09/20/2021 23:57:23 - INFO - __main__ - Step 43714: {'lr': 0.00019920184725629323, 'samples': 1398848, 'steps': 2732, 'loss/train': 1.5199280977249146} -09/20/2021 23:57:24 - INFO - __main__ - Step 43715: {'lr': 0.00019920184725629323, 'samples': 1398880, 'steps': 2732, 'loss/train': 1.5920807123184204} -09/20/2021 23:57:24 - INFO - __main__ - Step 43716: {'lr': 0.00019920184725629323, 'samples': 1398912, 'steps': 2732, 'loss/train': 1.9601763486862183} -09/20/2021 23:57:25 - INFO - __main__ - Step 43717: {'lr': 0.00019920184725629323, 'samples': 1398944, 'steps': 2732, 'loss/train': 2.814951181411743} -09/20/2021 23:57:26 - INFO - __main__ - Step 43718: {'lr': 0.00019920184725629323, 'samples': 1398976, 'steps': 2732, 'loss/train': 1.0675382614135742} -09/20/2021 23:57:27 - INFO - __main__ - Step 43719: {'lr': 0.00019920184725629323, 'samples': 1399008, 'steps': 2732, 'loss/train': 0.5899993777275085} -09/20/2021 23:57:27 - INFO - __main__ - Step 43720: {'lr': 0.00019920184725629323, 'samples': 1399040, 'steps': 2732, 'loss/train': 0.653374433517456} -09/20/2021 23:57:28 - INFO - __main__ - Step 43721: {'lr': 0.00019920184725629323, 'samples': 1399072, 'steps': 2732, 'loss/train': 0.9472662210464478} -09/20/2021 23:57:29 - INFO - __main__ - Step 43722: {'lr': 0.00019920184725629323, 'samples': 1399104, 'steps': 2732, 'loss/train': 0.6392946839332581} -09/20/2021 23:57:30 - INFO - __main__ - Step 43723: {'lr': 0.00019920184725629323, 'samples': 1399136, 'steps': 2732, 'loss/train': 1.504490852355957} -09/20/2021 23:57:30 - INFO - __main__ - Step 43724: {'lr': 0.00019920184725629323, 'samples': 1399168, 'steps': 2732, 'loss/train': 2.276837110519409} -09/20/2021 23:57:31 - INFO - __main__ - Step 43725: {'lr': 0.00019920184725629323, 'samples': 1399200, 'steps': 2732, 'loss/train': 2.101166248321533} -09/20/2021 23:57:32 - INFO - __main__ - Step 43726: {'lr': 0.00019920184725629323, 'samples': 1399232, 'steps': 2732, 'loss/train': 2.5474061965942383} -09/20/2021 23:57:33 - INFO - __main__ - Step 43727: {'lr': 0.00019920184725629323, 'samples': 1399264, 'steps': 2732, 'loss/train': 2.6664156913757324} -09/20/2021 23:57:33 - INFO - __main__ - Step 43728: {'lr': 0.00019920184725629323, 'samples': 1399296, 'steps': 2732, 'loss/train': 2.7271015644073486} -09/20/2021 23:57:34 - INFO - __main__ - Step 43729: {'lr': 0.0001992010427262149, 'samples': 1399328, 'steps': 2733, 'loss/train': 2.089893341064453} -09/20/2021 23:57:35 - INFO - __main__ - Step 43730: {'lr': 0.0001992010427262149, 'samples': 1399360, 'steps': 2733, 'loss/train': 2.1748719215393066} -09/20/2021 23:57:36 - INFO - __main__ - Step 43731: {'lr': 0.0001992010427262149, 'samples': 1399392, 'steps': 2733, 'loss/train': 2.1344261169433594} -09/20/2021 23:57:36 - INFO - __main__ - Step 43732: {'lr': 0.0001992010427262149, 'samples': 1399424, 'steps': 2733, 'loss/train': 2.464078187942505} -09/20/2021 23:57:37 - INFO - __main__ - Step 43733: {'lr': 0.0001992010427262149, 'samples': 1399456, 'steps': 2733, 'loss/train': 2.7731635570526123} -09/20/2021 23:57:38 - INFO - __main__ - Step 43734: {'lr': 0.0001992010427262149, 'samples': 1399488, 'steps': 2733, 'loss/train': 2.660499095916748} -09/20/2021 23:57:39 - INFO - __main__ - Step 43735: {'lr': 0.0001992010427262149, 'samples': 1399520, 'steps': 2733, 'loss/train': 1.7385278940200806} -09/20/2021 23:57:39 - INFO - __main__ - Step 43736: {'lr': 0.0001992010427262149, 'samples': 1399552, 'steps': 2733, 'loss/train': 2.1265811920166016} -09/20/2021 23:57:41 - INFO - __main__ - Step 43737: {'lr': 0.0001992010427262149, 'samples': 1399584, 'steps': 2733, 'loss/train': 2.294513702392578} -09/20/2021 23:57:42 - INFO - __main__ - Step 43738: {'lr': 0.0001992010427262149, 'samples': 1399616, 'steps': 2733, 'loss/train': 1.494471549987793} -09/20/2021 23:57:42 - INFO - __main__ - Step 43739: {'lr': 0.0001992010427262149, 'samples': 1399648, 'steps': 2733, 'loss/train': 1.5255621671676636} -09/20/2021 23:57:43 - INFO - __main__ - Step 43740: {'lr': 0.0001992010427262149, 'samples': 1399680, 'steps': 2733, 'loss/train': 2.34163236618042} -09/20/2021 23:57:44 - INFO - __main__ - Step 43741: {'lr': 0.0001992010427262149, 'samples': 1399712, 'steps': 2733, 'loss/train': 1.5646724700927734} -09/20/2021 23:57:45 - INFO - __main__ - Step 43742: {'lr': 0.0001992010427262149, 'samples': 1399744, 'steps': 2733, 'loss/train': 2.4261105060577393} -09/20/2021 23:57:45 - INFO - __main__ - Step 43743: {'lr': 0.0001992010427262149, 'samples': 1399776, 'steps': 2733, 'loss/train': 1.9770712852478027} -09/20/2021 23:57:46 - INFO - __main__ - Step 43744: {'lr': 0.0001992010427262149, 'samples': 1399808, 'steps': 2733, 'loss/train': 2.0883708000183105} -09/20/2021 23:57:47 - INFO - __main__ - Step 43745: {'lr': 0.00019920023779248792, 'samples': 1399840, 'steps': 2734, 'loss/train': 2.9935827255249023} -09/20/2021 23:57:48 - INFO - __main__ - Step 43746: {'lr': 0.00019920023779248792, 'samples': 1399872, 'steps': 2734, 'loss/train': 2.7887680530548096} -09/20/2021 23:57:48 - INFO - __main__ - Step 43747: {'lr': 0.00019920023779248792, 'samples': 1399904, 'steps': 2734, 'loss/train': 2.162748098373413} -09/20/2021 23:57:49 - INFO - __main__ - Step 43748: {'lr': 0.00019920023779248792, 'samples': 1399936, 'steps': 2734, 'loss/train': 2.321035146713257} -09/20/2021 23:57:50 - INFO - __main__ - Step 43749: {'lr': 0.00019920023779248792, 'samples': 1399968, 'steps': 2734, 'loss/train': 2.3129522800445557} -09/20/2021 23:57:51 - INFO - __main__ - Step 43750: {'lr': 0.00019920023779248792, 'samples': 1400000, 'steps': 2734, 'loss/train': 3.435570001602173} -09/20/2021 23:57:51 - INFO - __main__ - Step 43751: {'lr': 0.00019920023779248792, 'samples': 1400032, 'steps': 2734, 'loss/train': 2.4458541870117188} -09/20/2021 23:57:52 - INFO - __main__ - Step 43752: {'lr': 0.00019920023779248792, 'samples': 1400064, 'steps': 2734, 'loss/train': 2.5196726322174072} -09/20/2021 23:57:53 - INFO - __main__ - Step 43753: {'lr': 0.00019920023779248792, 'samples': 1400096, 'steps': 2734, 'loss/train': 1.971867322921753} -09/20/2021 23:57:54 - INFO - __main__ - Step 43754: {'lr': 0.00019920023779248792, 'samples': 1400128, 'steps': 2734, 'loss/train': 1.4045920372009277} -09/20/2021 23:57:54 - INFO - __main__ - Step 43755: {'lr': 0.00019920023779248792, 'samples': 1400160, 'steps': 2734, 'loss/train': 2.4681098461151123} -09/20/2021 23:57:55 - INFO - __main__ - Step 43756: {'lr': 0.00019920023779248792, 'samples': 1400192, 'steps': 2734, 'loss/train': 1.9218488931655884} -09/20/2021 23:57:56 - INFO - __main__ - Step 43757: {'lr': 0.00019920023779248792, 'samples': 1400224, 'steps': 2734, 'loss/train': 2.02575421333313} -09/20/2021 23:57:57 - INFO - __main__ - Step 43758: {'lr': 0.00019920023779248792, 'samples': 1400256, 'steps': 2734, 'loss/train': 3.052332878112793} -09/20/2021 23:57:57 - INFO - __main__ - Step 43759: {'lr': 0.00019920023779248792, 'samples': 1400288, 'steps': 2734, 'loss/train': 2.2929275035858154} -09/20/2021 23:57:58 - INFO - __main__ - Step 43760: {'lr': 0.00019920023779248792, 'samples': 1400320, 'steps': 2734, 'loss/train': 1.8878085613250732} -09/20/2021 23:57:59 - INFO - __main__ - Step 43761: {'lr': 0.00019919943245511558, 'samples': 1400352, 'steps': 2735, 'loss/train': 2.9772634506225586} -09/20/2021 23:58:00 - INFO - __main__ - Step 43762: {'lr': 0.00019919943245511558, 'samples': 1400384, 'steps': 2735, 'loss/train': 2.4369871616363525} -09/20/2021 23:58:01 - INFO - __main__ - Step 43763: {'lr': 0.00019919943245511558, 'samples': 1400416, 'steps': 2735, 'loss/train': 2.988179922103882} -09/20/2021 23:58:01 - INFO - __main__ - Step 43764: {'lr': 0.00019919943245511558, 'samples': 1400448, 'steps': 2735, 'loss/train': 2.5882418155670166} -09/20/2021 23:58:02 - INFO - __main__ - Step 43765: {'lr': 0.00019919943245511558, 'samples': 1400480, 'steps': 2735, 'loss/train': 0.5243893265724182} -09/20/2021 23:58:03 - INFO - __main__ - Step 43766: {'lr': 0.00019919943245511558, 'samples': 1400512, 'steps': 2735, 'loss/train': 1.9412516355514526} -09/20/2021 23:58:04 - INFO - __main__ - Step 43767: {'lr': 0.00019919943245511558, 'samples': 1400544, 'steps': 2735, 'loss/train': 2.275118350982666} -09/20/2021 23:58:05 - INFO - __main__ - Step 43768: {'lr': 0.00019919943245511558, 'samples': 1400576, 'steps': 2735, 'loss/train': 1.3467767238616943} -09/20/2021 23:58:06 - INFO - __main__ - Step 43769: {'lr': 0.00019919943245511558, 'samples': 1400608, 'steps': 2735, 'loss/train': 1.919883131980896} -09/20/2021 23:58:07 - INFO - __main__ - Step 43770: {'lr': 0.00019919943245511558, 'samples': 1400640, 'steps': 2735, 'loss/train': 2.602328062057495} -09/20/2021 23:58:07 - INFO - __main__ - Step 43771: {'lr': 0.00019919943245511558, 'samples': 1400672, 'steps': 2735, 'loss/train': 1.9538462162017822} -09/20/2021 23:58:08 - INFO - __main__ - Step 43772: {'lr': 0.00019919943245511558, 'samples': 1400704, 'steps': 2735, 'loss/train': 2.491656541824341} -09/20/2021 23:58:09 - INFO - __main__ - Step 43773: {'lr': 0.00019919943245511558, 'samples': 1400736, 'steps': 2735, 'loss/train': 1.9767876863479614} -09/20/2021 23:58:10 - INFO - __main__ - Step 43774: {'lr': 0.00019919943245511558, 'samples': 1400768, 'steps': 2735, 'loss/train': 1.7244642972946167} -09/20/2021 23:58:10 - INFO - __main__ - Step 43775: {'lr': 0.00019919943245511558, 'samples': 1400800, 'steps': 2735, 'loss/train': 2.143071174621582} -09/20/2021 23:58:11 - INFO - __main__ - Step 43776: {'lr': 0.00019919943245511558, 'samples': 1400832, 'steps': 2735, 'loss/train': 2.254223108291626} -09/20/2021 23:58:12 - INFO - __main__ - Step 43777: {'lr': 0.0001991986267141011, 'samples': 1400864, 'steps': 2736, 'loss/train': 2.2520828247070312} -09/20/2021 23:58:13 - INFO - __main__ - Step 43778: {'lr': 0.0001991986267141011, 'samples': 1400896, 'steps': 2736, 'loss/train': 1.780096173286438} -09/20/2021 23:58:13 - INFO - __main__ - Step 43779: {'lr': 0.0001991986267141011, 'samples': 1400928, 'steps': 2736, 'loss/train': 1.2864269018173218} -09/20/2021 23:58:14 - INFO - __main__ - Step 43780: {'lr': 0.0001991986267141011, 'samples': 1400960, 'steps': 2736, 'loss/train': 1.4712377786636353} -09/20/2021 23:58:15 - INFO - __main__ - Step 43781: {'lr': 0.0001991986267141011, 'samples': 1400992, 'steps': 2736, 'loss/train': 2.5010080337524414} -09/20/2021 23:58:16 - INFO - __main__ - Step 43782: {'lr': 0.0001991986267141011, 'samples': 1401024, 'steps': 2736, 'loss/train': 2.600706100463867} -09/20/2021 23:58:16 - INFO - __main__ - Step 43783: {'lr': 0.0001991986267141011, 'samples': 1401056, 'steps': 2736, 'loss/train': 1.3891522884368896} -09/20/2021 23:58:17 - INFO - __main__ - Step 43784: {'lr': 0.0001991986267141011, 'samples': 1401088, 'steps': 2736, 'loss/train': 1.9355533123016357} -09/20/2021 23:58:18 - INFO - __main__ - Step 43785: {'lr': 0.0001991986267141011, 'samples': 1401120, 'steps': 2736, 'loss/train': 1.4852192401885986} -09/20/2021 23:58:19 - INFO - __main__ - Step 43786: {'lr': 0.0001991986267141011, 'samples': 1401152, 'steps': 2736, 'loss/train': 2.464540481567383} -09/20/2021 23:58:19 - INFO - __main__ - Step 43787: {'lr': 0.0001991986267141011, 'samples': 1401184, 'steps': 2736, 'loss/train': 3.356550693511963} -09/20/2021 23:58:20 - INFO - __main__ - Step 43788: {'lr': 0.0001991986267141011, 'samples': 1401216, 'steps': 2736, 'loss/train': 2.9227802753448486} -09/20/2021 23:58:21 - INFO - __main__ - Step 43789: {'lr': 0.0001991986267141011, 'samples': 1401248, 'steps': 2736, 'loss/train': 3.351313352584839} -09/20/2021 23:58:22 - INFO - __main__ - Step 43790: {'lr': 0.0001991986267141011, 'samples': 1401280, 'steps': 2736, 'loss/train': 3.4679715633392334} -09/20/2021 23:58:22 - INFO - __main__ - Step 43791: {'lr': 0.0001991986267141011, 'samples': 1401312, 'steps': 2736, 'loss/train': 3.106332778930664} -09/20/2021 23:58:23 - INFO - __main__ - Step 43792: {'lr': 0.0001991986267141011, 'samples': 1401344, 'steps': 2736, 'loss/train': 3.459592342376709} -09/20/2021 23:58:24 - INFO - __main__ - Step 43793: {'lr': 0.0001991978205694478, 'samples': 1401376, 'steps': 2737, 'loss/train': 2.189811944961548} -09/20/2021 23:58:25 - INFO - __main__ - Step 43794: {'lr': 0.0001991978205694478, 'samples': 1401408, 'steps': 2737, 'loss/train': 2.8105475902557373} -09/20/2021 23:58:26 - INFO - __main__ - Step 43795: {'lr': 0.0001991978205694478, 'samples': 1401440, 'steps': 2737, 'loss/train': 1.5428972244262695} -09/20/2021 23:58:26 - INFO - __main__ - Step 43796: {'lr': 0.0001991978205694478, 'samples': 1401472, 'steps': 2737, 'loss/train': 2.0018692016601562} -09/20/2021 23:58:27 - INFO - __main__ - Step 43797: {'lr': 0.0001991978205694478, 'samples': 1401504, 'steps': 2737, 'loss/train': 2.0565030574798584} -09/20/2021 23:58:28 - INFO - __main__ - Step 43798: {'lr': 0.0001991978205694478, 'samples': 1401536, 'steps': 2737, 'loss/train': 2.8931095600128174} -09/20/2021 23:58:30 - INFO - __main__ - Step 43799: {'lr': 0.0001991978205694478, 'samples': 1401568, 'steps': 2737, 'loss/train': 2.4293816089630127} -09/20/2021 23:58:31 - INFO - __main__ - Step 43800: {'lr': 0.0001991978205694478, 'samples': 1401600, 'steps': 2737, 'loss/train': 2.3656253814697266} -09/20/2021 23:58:32 - INFO - __main__ - Step 43801: {'lr': 0.0001991978205694478, 'samples': 1401632, 'steps': 2737, 'loss/train': 2.1139979362487793} -09/20/2021 23:58:32 - INFO - __main__ - Step 43802: {'lr': 0.0001991978205694478, 'samples': 1401664, 'steps': 2737, 'loss/train': 1.479985237121582} -09/20/2021 23:58:33 - INFO - __main__ - Step 43803: {'lr': 0.0001991978205694478, 'samples': 1401696, 'steps': 2737, 'loss/train': 2.1326446533203125} -09/20/2021 23:58:34 - INFO - __main__ - Step 43804: {'lr': 0.0001991978205694478, 'samples': 1401728, 'steps': 2737, 'loss/train': 1.432289719581604} -09/20/2021 23:58:35 - INFO - __main__ - Step 43805: {'lr': 0.0001991978205694478, 'samples': 1401760, 'steps': 2737, 'loss/train': 1.7970434427261353} -09/20/2021 23:58:35 - INFO - __main__ - Step 43806: {'lr': 0.0001991978205694478, 'samples': 1401792, 'steps': 2737, 'loss/train': 2.5311784744262695} -09/20/2021 23:58:36 - INFO - __main__ - Step 43807: {'lr': 0.0001991978205694478, 'samples': 1401824, 'steps': 2737, 'loss/train': 1.5042704343795776} -09/20/2021 23:58:37 - INFO - __main__ - Step 43808: {'lr': 0.0001991978205694478, 'samples': 1401856, 'steps': 2737, 'loss/train': 2.658851146697998} -09/20/2021 23:58:38 - INFO - __main__ - Step 43809: {'lr': 0.000199197014021159, 'samples': 1401888, 'steps': 2738, 'loss/train': 2.1239802837371826} -09/20/2021 23:58:39 - INFO - __main__ - Step 43810: {'lr': 0.000199197014021159, 'samples': 1401920, 'steps': 2738, 'loss/train': 1.3668206930160522} -09/20/2021 23:58:39 - INFO - __main__ - Step 43811: {'lr': 0.000199197014021159, 'samples': 1401952, 'steps': 2738, 'loss/train': 2.354712724685669} -09/20/2021 23:58:40 - INFO - __main__ - Step 43812: {'lr': 0.000199197014021159, 'samples': 1401984, 'steps': 2738, 'loss/train': 2.6703267097473145} -09/20/2021 23:58:41 - INFO - __main__ - Step 43813: {'lr': 0.000199197014021159, 'samples': 1402016, 'steps': 2738, 'loss/train': 2.1340949535369873} -09/20/2021 23:58:42 - INFO - __main__ - Step 43814: {'lr': 0.000199197014021159, 'samples': 1402048, 'steps': 2738, 'loss/train': 2.339621067047119} -09/20/2021 23:58:42 - INFO - __main__ - Step 43815: {'lr': 0.000199197014021159, 'samples': 1402080, 'steps': 2738, 'loss/train': 2.865774393081665} -09/20/2021 23:58:43 - INFO - __main__ - Step 43816: {'lr': 0.000199197014021159, 'samples': 1402112, 'steps': 2738, 'loss/train': 1.7070425748825073} -09/20/2021 23:58:44 - INFO - __main__ - Step 43817: {'lr': 0.000199197014021159, 'samples': 1402144, 'steps': 2738, 'loss/train': 2.0850725173950195} -09/20/2021 23:58:45 - INFO - __main__ - Step 43818: {'lr': 0.000199197014021159, 'samples': 1402176, 'steps': 2738, 'loss/train': 2.2374191284179688} -09/20/2021 23:58:45 - INFO - __main__ - Step 43819: {'lr': 0.000199197014021159, 'samples': 1402208, 'steps': 2738, 'loss/train': 2.8435721397399902} -09/20/2021 23:58:46 - INFO - __main__ - Step 43820: {'lr': 0.000199197014021159, 'samples': 1402240, 'steps': 2738, 'loss/train': 1.5009164810180664} -09/20/2021 23:58:47 - INFO - __main__ - Step 43821: {'lr': 0.000199197014021159, 'samples': 1402272, 'steps': 2738, 'loss/train': 2.0081119537353516} -09/20/2021 23:58:48 - INFO - __main__ - Step 43822: {'lr': 0.000199197014021159, 'samples': 1402304, 'steps': 2738, 'loss/train': 1.370060682296753} -09/20/2021 23:58:48 - INFO - __main__ - Step 43823: {'lr': 0.000199197014021159, 'samples': 1402336, 'steps': 2738, 'loss/train': 1.3687517642974854} -09/20/2021 23:58:49 - INFO - __main__ - Step 43824: {'lr': 0.000199197014021159, 'samples': 1402368, 'steps': 2738, 'loss/train': 1.8519821166992188} -09/20/2021 23:58:50 - INFO - __main__ - Step 43825: {'lr': 0.00019919620706923788, 'samples': 1402400, 'steps': 2739, 'loss/train': 0.49355626106262207} -09/20/2021 23:58:51 - INFO - __main__ - Step 43826: {'lr': 0.00019919620706923788, 'samples': 1402432, 'steps': 2739, 'loss/train': 2.121378183364868} -09/20/2021 23:58:52 - INFO - __main__ - Step 43827: {'lr': 0.00019919620706923788, 'samples': 1402464, 'steps': 2739, 'loss/train': 0.45078346133232117} -09/20/2021 23:58:52 - INFO - __main__ - Step 43828: {'lr': 0.00019919620706923788, 'samples': 1402496, 'steps': 2739, 'loss/train': 0.3379513919353485} -09/20/2021 23:58:53 - INFO - __main__ - Step 43829: {'lr': 0.00019919620706923788, 'samples': 1402528, 'steps': 2739, 'loss/train': 0.5380942821502686} -09/20/2021 23:58:54 - INFO - __main__ - Step 43830: {'lr': 0.00019919620706923788, 'samples': 1402560, 'steps': 2739, 'loss/train': 0.38397371768951416} -09/20/2021 23:58:55 - INFO - __main__ - Step 43831: {'lr': 0.00019919620706923788, 'samples': 1402592, 'steps': 2739, 'loss/train': 0.5801599025726318} -09/20/2021 23:58:55 - INFO - __main__ - Step 43832: {'lr': 0.00019919620706923788, 'samples': 1402624, 'steps': 2739, 'loss/train': 0.4347091019153595} -09/20/2021 23:58:56 - INFO - __main__ - Step 43833: {'lr': 0.00019919620706923788, 'samples': 1402656, 'steps': 2739, 'loss/train': 0.5473398566246033} -09/20/2021 23:58:57 - INFO - __main__ - Step 43834: {'lr': 0.00019919620706923788, 'samples': 1402688, 'steps': 2739, 'loss/train': 0.6912961006164551} -09/20/2021 23:58:58 - INFO - __main__ - Step 43835: {'lr': 0.00019919620706923788, 'samples': 1402720, 'steps': 2739, 'loss/train': 1.7502769231796265} -09/20/2021 23:58:59 - INFO - __main__ - Step 43836: {'lr': 0.00019919620706923788, 'samples': 1402752, 'steps': 2739, 'loss/train': 1.0566867589950562} -09/20/2021 23:59:00 - INFO - __main__ - Step 43837: {'lr': 0.00019919620706923788, 'samples': 1402784, 'steps': 2739, 'loss/train': 1.3920077085494995} -09/20/2021 23:59:00 - INFO - __main__ - Step 43838: {'lr': 0.00019919620706923788, 'samples': 1402816, 'steps': 2739, 'loss/train': 1.1415668725967407} -09/20/2021 23:59:01 - INFO - __main__ - Step 43839: {'lr': 0.00019919620706923788, 'samples': 1402848, 'steps': 2739, 'loss/train': 2.6597468852996826} -09/20/2021 23:59:02 - INFO - __main__ - Step 43840: {'lr': 0.00019919620706923788, 'samples': 1402880, 'steps': 2739, 'loss/train': 3.2007670402526855} -09/20/2021 23:59:03 - INFO - __main__ - Step 43841: {'lr': 0.0001991953997136878, 'samples': 1402912, 'steps': 2740, 'loss/train': 2.9514193534851074} -09/20/2021 23:59:04 - INFO - __main__ - Step 43842: {'lr': 0.0001991953997136878, 'samples': 1402944, 'steps': 2740, 'loss/train': 2.5444846153259277} -09/20/2021 23:59:04 - INFO - __main__ - Step 43843: {'lr': 0.0001991953997136878, 'samples': 1402976, 'steps': 2740, 'loss/train': 2.450092077255249} -09/20/2021 23:59:05 - INFO - __main__ - Step 43844: {'lr': 0.0001991953997136878, 'samples': 1403008, 'steps': 2740, 'loss/train': 2.3788886070251465} -09/20/2021 23:59:06 - INFO - __main__ - Step 43845: {'lr': 0.0001991953997136878, 'samples': 1403040, 'steps': 2740, 'loss/train': 1.6705288887023926} -09/20/2021 23:59:07 - INFO - __main__ - Step 43846: {'lr': 0.0001991953997136878, 'samples': 1403072, 'steps': 2740, 'loss/train': 1.6338331699371338} -09/20/2021 23:59:07 - INFO - __main__ - Step 43847: {'lr': 0.0001991953997136878, 'samples': 1403104, 'steps': 2740, 'loss/train': 2.2609243392944336} -09/20/2021 23:59:08 - INFO - __main__ - Step 43848: {'lr': 0.0001991953997136878, 'samples': 1403136, 'steps': 2740, 'loss/train': 2.5166258811950684} -09/20/2021 23:59:09 - INFO - __main__ - Step 43849: {'lr': 0.0001991953997136878, 'samples': 1403168, 'steps': 2740, 'loss/train': 2.6081724166870117} -09/20/2021 23:59:10 - INFO - __main__ - Step 43850: {'lr': 0.0001991953997136878, 'samples': 1403200, 'steps': 2740, 'loss/train': 0.7195882201194763} -09/20/2021 23:59:10 - INFO - __main__ - Step 43851: {'lr': 0.0001991953997136878, 'samples': 1403232, 'steps': 2740, 'loss/train': 1.3205996751785278} -09/20/2021 23:59:11 - INFO - __main__ - Step 43852: {'lr': 0.0001991953997136878, 'samples': 1403264, 'steps': 2740, 'loss/train': 1.536655306816101} -09/20/2021 23:59:12 - INFO - __main__ - Step 43853: {'lr': 0.0001991953997136878, 'samples': 1403296, 'steps': 2740, 'loss/train': 2.1029627323150635} -09/20/2021 23:59:13 - INFO - __main__ - Step 43854: {'lr': 0.0001991953997136878, 'samples': 1403328, 'steps': 2740, 'loss/train': 2.6686952114105225} -09/20/2021 23:59:13 - INFO - __main__ - Step 43855: {'lr': 0.0001991953997136878, 'samples': 1403360, 'steps': 2740, 'loss/train': 2.3837029933929443} -09/20/2021 23:59:14 - INFO - __main__ - Step 43856: {'lr': 0.0001991953997136878, 'samples': 1403392, 'steps': 2740, 'loss/train': 1.82594633102417} -09/20/2021 23:59:15 - INFO - __main__ - Step 43857: {'lr': 0.000199194591954512, 'samples': 1403424, 'steps': 2741, 'loss/train': 2.5297625064849854} -09/20/2021 23:59:16 - INFO - __main__ - Step 43858: {'lr': 0.000199194591954512, 'samples': 1403456, 'steps': 2741, 'loss/train': 2.0849971771240234} -09/20/2021 23:59:16 - INFO - __main__ - Step 43859: {'lr': 0.000199194591954512, 'samples': 1403488, 'steps': 2741, 'loss/train': 2.2778782844543457} -09/20/2021 23:59:17 - INFO - __main__ - Step 43860: {'lr': 0.000199194591954512, 'samples': 1403520, 'steps': 2741, 'loss/train': 2.712608575820923} -09/20/2021 23:59:18 - INFO - __main__ - Step 43861: {'lr': 0.000199194591954512, 'samples': 1403552, 'steps': 2741, 'loss/train': 2.6372694969177246} -09/20/2021 23:59:19 - INFO - __main__ - Step 43862: {'lr': 0.000199194591954512, 'samples': 1403584, 'steps': 2741, 'loss/train': 1.043885350227356} -09/20/2021 23:59:19 - INFO - __main__ - Step 43863: {'lr': 0.000199194591954512, 'samples': 1403616, 'steps': 2741, 'loss/train': 2.074721574783325} -09/20/2021 23:59:21 - INFO - __main__ - Step 43864: {'lr': 0.000199194591954512, 'samples': 1403648, 'steps': 2741, 'loss/train': 2.217888593673706} -09/20/2021 23:59:21 - INFO - __main__ - Step 43865: {'lr': 0.000199194591954512, 'samples': 1403680, 'steps': 2741, 'loss/train': 1.8337147235870361} -09/20/2021 23:59:22 - INFO - __main__ - Step 43866: {'lr': 0.000199194591954512, 'samples': 1403712, 'steps': 2741, 'loss/train': 2.151980400085449} -09/20/2021 23:59:23 - INFO - __main__ - Step 43867: {'lr': 0.000199194591954512, 'samples': 1403744, 'steps': 2741, 'loss/train': 1.7787201404571533} -09/20/2021 23:59:24 - INFO - __main__ - Step 43868: {'lr': 0.000199194591954512, 'samples': 1403776, 'steps': 2741, 'loss/train': 2.439574718475342} -09/20/2021 23:59:24 - INFO - __main__ - Step 43869: {'lr': 0.000199194591954512, 'samples': 1403808, 'steps': 2741, 'loss/train': 1.9780330657958984} -09/20/2021 23:59:25 - INFO - __main__ - Step 43870: {'lr': 0.000199194591954512, 'samples': 1403840, 'steps': 2741, 'loss/train': 1.9898979663848877} -09/20/2021 23:59:26 - INFO - __main__ - Step 43871: {'lr': 0.000199194591954512, 'samples': 1403872, 'steps': 2741, 'loss/train': 1.9772734642028809} -09/20/2021 23:59:27 - INFO - __main__ - Step 43872: {'lr': 0.000199194591954512, 'samples': 1403904, 'steps': 2741, 'loss/train': 0.7889479398727417} -09/20/2021 23:59:28 - INFO - __main__ - Step 43873: {'lr': 0.0001991937837917138, 'samples': 1403936, 'steps': 2742, 'loss/train': 2.572141408920288} -09/20/2021 23:59:28 - INFO - __main__ - Step 43874: {'lr': 0.0001991937837917138, 'samples': 1403968, 'steps': 2742, 'loss/train': 2.540109634399414} -09/20/2021 23:59:29 - INFO - __main__ - Step 43875: {'lr': 0.0001991937837917138, 'samples': 1404000, 'steps': 2742, 'loss/train': 1.9659985303878784} -09/20/2021 23:59:30 - INFO - __main__ - Step 43876: {'lr': 0.0001991937837917138, 'samples': 1404032, 'steps': 2742, 'loss/train': 2.3810226917266846} -09/20/2021 23:59:31 - INFO - __main__ - Step 43877: {'lr': 0.0001991937837917138, 'samples': 1404064, 'steps': 2742, 'loss/train': 1.2375363111495972} -09/20/2021 23:59:31 - INFO - __main__ - Step 43878: {'lr': 0.0001991937837917138, 'samples': 1404096, 'steps': 2742, 'loss/train': 2.0584945678710938} -09/20/2021 23:59:32 - INFO - __main__ - Step 43879: {'lr': 0.0001991937837917138, 'samples': 1404128, 'steps': 2742, 'loss/train': 2.2095792293548584} -09/20/2021 23:59:33 - INFO - __main__ - Step 43880: {'lr': 0.0001991937837917138, 'samples': 1404160, 'steps': 2742, 'loss/train': 2.712486505508423} -09/20/2021 23:59:34 - INFO - __main__ - Step 43881: {'lr': 0.0001991937837917138, 'samples': 1404192, 'steps': 2742, 'loss/train': 2.6798787117004395} -09/20/2021 23:59:34 - INFO - __main__ - Step 43882: {'lr': 0.0001991937837917138, 'samples': 1404224, 'steps': 2742, 'loss/train': 2.5870742797851562} -09/20/2021 23:59:35 - INFO - __main__ - Step 43883: {'lr': 0.0001991937837917138, 'samples': 1404256, 'steps': 2742, 'loss/train': 2.65549635887146} -09/20/2021 23:59:36 - INFO - __main__ - Step 43884: {'lr': 0.0001991937837917138, 'samples': 1404288, 'steps': 2742, 'loss/train': 2.0452041625976562} -09/20/2021 23:59:37 - INFO - __main__ - Step 43885: {'lr': 0.0001991937837917138, 'samples': 1404320, 'steps': 2742, 'loss/train': 0.7620249390602112} -09/20/2021 23:59:37 - INFO - __main__ - Step 43886: {'lr': 0.0001991937837917138, 'samples': 1404352, 'steps': 2742, 'loss/train': 2.289717674255371} -09/20/2021 23:59:38 - INFO - __main__ - Step 43887: {'lr': 0.0001991937837917138, 'samples': 1404384, 'steps': 2742, 'loss/train': 2.274345636367798} -09/20/2021 23:59:39 - INFO - __main__ - Step 43888: {'lr': 0.0001991937837917138, 'samples': 1404416, 'steps': 2742, 'loss/train': 2.0366992950439453} -09/20/2021 23:59:40 - INFO - __main__ - Step 43889: {'lr': 0.0001991929752252965, 'samples': 1404448, 'steps': 2743, 'loss/train': 2.527235984802246} -09/20/2021 23:59:41 - INFO - __main__ - Step 43890: {'lr': 0.0001991929752252965, 'samples': 1404480, 'steps': 2743, 'loss/train': 1.4658963680267334} -09/20/2021 23:59:41 - INFO - __main__ - Step 43891: {'lr': 0.0001991929752252965, 'samples': 1404512, 'steps': 2743, 'loss/train': 2.313878059387207} -09/20/2021 23:59:42 - INFO - __main__ - Step 43892: {'lr': 0.0001991929752252965, 'samples': 1404544, 'steps': 2743, 'loss/train': 2.5661754608154297} -09/20/2021 23:59:43 - INFO - __main__ - Step 43893: {'lr': 0.0001991929752252965, 'samples': 1404576, 'steps': 2743, 'loss/train': 1.7906458377838135} -09/20/2021 23:59:44 - INFO - __main__ - Step 43894: {'lr': 0.0001991929752252965, 'samples': 1404608, 'steps': 2743, 'loss/train': 1.21794855594635} -09/20/2021 23:59:45 - INFO - __main__ - Step 43895: {'lr': 0.0001991929752252965, 'samples': 1404640, 'steps': 2743, 'loss/train': 2.7672994136810303} -09/20/2021 23:59:46 - INFO - __main__ - Step 43896: {'lr': 0.0001991929752252965, 'samples': 1404672, 'steps': 2743, 'loss/train': 1.7284393310546875} -09/20/2021 23:59:46 - INFO - __main__ - Step 43897: {'lr': 0.0001991929752252965, 'samples': 1404704, 'steps': 2743, 'loss/train': 1.6519337892532349} -09/20/2021 23:59:47 - INFO - __main__ - Step 43898: {'lr': 0.0001991929752252965, 'samples': 1404736, 'steps': 2743, 'loss/train': 2.3322110176086426} -09/20/2021 23:59:48 - INFO - __main__ - Step 43899: {'lr': 0.0001991929752252965, 'samples': 1404768, 'steps': 2743, 'loss/train': 2.147965669631958} -09/20/2021 23:59:49 - INFO - __main__ - Step 43900: {'lr': 0.0001991929752252965, 'samples': 1404800, 'steps': 2743, 'loss/train': 1.7358192205429077} -09/20/2021 23:59:49 - INFO - __main__ - Step 43901: {'lr': 0.0001991929752252965, 'samples': 1404832, 'steps': 2743, 'loss/train': 0.7878614664077759} -09/20/2021 23:59:50 - INFO - __main__ - Step 43902: {'lr': 0.0001991929752252965, 'samples': 1404864, 'steps': 2743, 'loss/train': 0.7427376508712769} -09/20/2021 23:59:51 - INFO - __main__ - Step 43903: {'lr': 0.0001991929752252965, 'samples': 1404896, 'steps': 2743, 'loss/train': 2.1735758781433105} -09/20/2021 23:59:52 - INFO - __main__ - Step 43904: {'lr': 0.0001991929752252965, 'samples': 1404928, 'steps': 2743, 'loss/train': 2.7893948554992676} -09/20/2021 23:59:53 - INFO - __main__ - Step 43905: {'lr': 0.00019919216625526335, 'samples': 1404960, 'steps': 2744, 'loss/train': 1.6277633905410767} -09/20/2021 23:59:53 - INFO - __main__ - Step 43906: {'lr': 0.00019919216625526335, 'samples': 1404992, 'steps': 2744, 'loss/train': 2.908273696899414} -09/20/2021 23:59:54 - INFO - __main__ - Step 43907: {'lr': 0.00019919216625526335, 'samples': 1405024, 'steps': 2744, 'loss/train': 2.1292049884796143} -09/20/2021 23:59:55 - INFO - __main__ - Step 43908: {'lr': 0.00019919216625526335, 'samples': 1405056, 'steps': 2744, 'loss/train': 0.40192052721977234} -09/20/2021 23:59:56 - INFO - __main__ - Step 43909: {'lr': 0.00019919216625526335, 'samples': 1405088, 'steps': 2744, 'loss/train': 1.3625391721725464} -09/20/2021 23:59:56 - INFO - __main__ - Step 43910: {'lr': 0.00019919216625526335, 'samples': 1405120, 'steps': 2744, 'loss/train': 1.911307692527771} -09/20/2021 23:59:57 - INFO - __main__ - Step 43911: {'lr': 0.00019919216625526335, 'samples': 1405152, 'steps': 2744, 'loss/train': 1.698085069656372} -09/20/2021 23:59:58 - INFO - __main__ - Step 43912: {'lr': 0.00019919216625526335, 'samples': 1405184, 'steps': 2744, 'loss/train': 1.1738828420639038} -09/20/2021 23:59:59 - INFO - __main__ - Step 43913: {'lr': 0.00019919216625526335, 'samples': 1405216, 'steps': 2744, 'loss/train': 1.8889272212982178} -09/20/2021 23:59:59 - INFO - __main__ - Step 43914: {'lr': 0.00019919216625526335, 'samples': 1405248, 'steps': 2744, 'loss/train': 2.119135618209839} -09/21/2021 00:00:00 - INFO - __main__ - Step 43915: {'lr': 0.00019919216625526335, 'samples': 1405280, 'steps': 2744, 'loss/train': 1.8480173349380493} -09/21/2021 00:00:01 - INFO - __main__ - Step 43916: {'lr': 0.00019919216625526335, 'samples': 1405312, 'steps': 2744, 'loss/train': 2.264686107635498} -09/21/2021 00:00:02 - INFO - __main__ - Step 43917: {'lr': 0.00019919216625526335, 'samples': 1405344, 'steps': 2744, 'loss/train': 2.2259063720703125} -09/21/2021 00:00:02 - INFO - __main__ - Step 43918: {'lr': 0.00019919216625526335, 'samples': 1405376, 'steps': 2744, 'loss/train': 2.12900447845459} -09/21/2021 00:00:03 - INFO - __main__ - Step 43919: {'lr': 0.00019919216625526335, 'samples': 1405408, 'steps': 2744, 'loss/train': 2.569444179534912} -09/21/2021 00:00:04 - INFO - __main__ - Step 43920: {'lr': 0.00019919216625526335, 'samples': 1405440, 'steps': 2744, 'loss/train': 2.407473087310791} -09/21/2021 00:00:05 - INFO - __main__ - Step 43921: {'lr': 0.00019919135688161767, 'samples': 1405472, 'steps': 2745, 'loss/train': 2.1358156204223633} -09/21/2021 00:00:05 - INFO - __main__ - Step 43922: {'lr': 0.00019919135688161767, 'samples': 1405504, 'steps': 2745, 'loss/train': 1.3172998428344727} -09/21/2021 00:00:06 - INFO - __main__ - Step 43923: {'lr': 0.00019919135688161767, 'samples': 1405536, 'steps': 2745, 'loss/train': 2.8071038722991943} -09/21/2021 00:00:07 - INFO - __main__ - Step 43924: {'lr': 0.00019919135688161767, 'samples': 1405568, 'steps': 2745, 'loss/train': 3.1617162227630615} -09/21/2021 00:00:08 - INFO - __main__ - Step 43925: {'lr': 0.00019919135688161767, 'samples': 1405600, 'steps': 2745, 'loss/train': 2.119203567504883} -09/21/2021 00:00:09 - INFO - __main__ - Step 43926: {'lr': 0.00019919135688161767, 'samples': 1405632, 'steps': 2745, 'loss/train': 0.8006832599639893} -09/21/2021 00:00:10 - INFO - __main__ - Step 43927: {'lr': 0.00019919135688161767, 'samples': 1405664, 'steps': 2745, 'loss/train': 1.5950422286987305} -09/21/2021 00:00:11 - INFO - __main__ - Step 43928: {'lr': 0.00019919135688161767, 'samples': 1405696, 'steps': 2745, 'loss/train': 2.1426331996917725} -09/21/2021 00:00:11 - INFO - __main__ - Step 43929: {'lr': 0.00019919135688161767, 'samples': 1405728, 'steps': 2745, 'loss/train': 2.252147912979126} -09/21/2021 00:00:12 - INFO - __main__ - Step 43930: {'lr': 0.00019919135688161767, 'samples': 1405760, 'steps': 2745, 'loss/train': 1.2738388776779175} -09/21/2021 00:00:13 - INFO - __main__ - Step 43931: {'lr': 0.00019919135688161767, 'samples': 1405792, 'steps': 2745, 'loss/train': 1.2665085792541504} -09/21/2021 00:00:14 - INFO - __main__ - Step 43932: {'lr': 0.00019919135688161767, 'samples': 1405824, 'steps': 2745, 'loss/train': 3.325307846069336} -09/21/2021 00:00:14 - INFO - __main__ - Step 43933: {'lr': 0.00019919135688161767, 'samples': 1405856, 'steps': 2745, 'loss/train': 2.31203293800354} -09/21/2021 00:00:15 - INFO - __main__ - Step 43934: {'lr': 0.00019919135688161767, 'samples': 1405888, 'steps': 2745, 'loss/train': 1.80311119556427} -09/21/2021 00:00:16 - INFO - __main__ - Step 43935: {'lr': 0.00019919135688161767, 'samples': 1405920, 'steps': 2745, 'loss/train': 2.2004551887512207} -09/21/2021 00:00:17 - INFO - __main__ - Step 43936: {'lr': 0.00019919135688161767, 'samples': 1405952, 'steps': 2745, 'loss/train': 2.341729164123535} -09/21/2021 00:00:17 - INFO - __main__ - Step 43937: {'lr': 0.00019919054710436273, 'samples': 1405984, 'steps': 2746, 'loss/train': 2.0381925106048584} -09/21/2021 00:00:18 - INFO - __main__ - Step 43938: {'lr': 0.00019919054710436273, 'samples': 1406016, 'steps': 2746, 'loss/train': 3.0117430686950684} -09/21/2021 00:00:19 - INFO - __main__ - Step 43939: {'lr': 0.00019919054710436273, 'samples': 1406048, 'steps': 2746, 'loss/train': 2.1904540061950684} -09/21/2021 00:00:20 - INFO - __main__ - Step 43940: {'lr': 0.00019919054710436273, 'samples': 1406080, 'steps': 2746, 'loss/train': 2.9272143840789795} -09/21/2021 00:00:20 - INFO - __main__ - Step 43941: {'lr': 0.00019919054710436273, 'samples': 1406112, 'steps': 2746, 'loss/train': 1.9693580865859985} -09/21/2021 00:00:21 - INFO - __main__ - Step 43942: {'lr': 0.00019919054710436273, 'samples': 1406144, 'steps': 2746, 'loss/train': 2.5497803688049316} -09/21/2021 00:00:22 - INFO - __main__ - Step 43943: {'lr': 0.00019919054710436273, 'samples': 1406176, 'steps': 2746, 'loss/train': 2.2235350608825684} -09/21/2021 00:00:23 - INFO - __main__ - Step 43944: {'lr': 0.00019919054710436273, 'samples': 1406208, 'steps': 2746, 'loss/train': 2.4822781085968018} -09/21/2021 00:00:23 - INFO - __main__ - Step 43945: {'lr': 0.00019919054710436273, 'samples': 1406240, 'steps': 2746, 'loss/train': 2.3701889514923096} -09/21/2021 00:00:24 - INFO - __main__ - Step 43946: {'lr': 0.00019919054710436273, 'samples': 1406272, 'steps': 2746, 'loss/train': 2.5183515548706055} -09/21/2021 00:00:25 - INFO - __main__ - Step 43947: {'lr': 0.00019919054710436273, 'samples': 1406304, 'steps': 2746, 'loss/train': 1.5919287204742432} -09/21/2021 00:00:26 - INFO - __main__ - Step 43948: {'lr': 0.00019919054710436273, 'samples': 1406336, 'steps': 2746, 'loss/train': 0.938090443611145} -09/21/2021 00:00:26 - INFO - __main__ - Step 43949: {'lr': 0.00019919054710436273, 'samples': 1406368, 'steps': 2746, 'loss/train': 2.7287633419036865} -09/21/2021 00:00:27 - INFO - __main__ - Step 43950: {'lr': 0.00019919054710436273, 'samples': 1406400, 'steps': 2746, 'loss/train': 2.067186117172241} -09/21/2021 00:00:28 - INFO - __main__ - Step 43951: {'lr': 0.00019919054710436273, 'samples': 1406432, 'steps': 2746, 'loss/train': 2.667052745819092} -09/21/2021 00:00:29 - INFO - __main__ - Step 43952: {'lr': 0.00019919054710436273, 'samples': 1406464, 'steps': 2746, 'loss/train': 2.377979040145874} -09/21/2021 00:00:30 - INFO - __main__ - Step 43953: {'lr': 0.00019918973692350186, 'samples': 1406496, 'steps': 2747, 'loss/train': 3.2359542846679688} -09/21/2021 00:00:30 - INFO - __main__ - Step 43954: {'lr': 0.00019918973692350186, 'samples': 1406528, 'steps': 2747, 'loss/train': 2.850367784500122} -09/21/2021 00:00:31 - INFO - __main__ - Step 43955: {'lr': 0.00019918973692350186, 'samples': 1406560, 'steps': 2747, 'loss/train': 2.457867383956909} -09/21/2021 00:00:32 - INFO - __main__ - Step 43956: {'lr': 0.00019918973692350186, 'samples': 1406592, 'steps': 2747, 'loss/train': 2.2922399044036865} -09/21/2021 00:00:33 - INFO - __main__ - Step 43957: {'lr': 0.00019918973692350186, 'samples': 1406624, 'steps': 2747, 'loss/train': 1.818061351776123} -09/21/2021 00:00:34 - INFO - __main__ - Step 43958: {'lr': 0.00019918973692350186, 'samples': 1406656, 'steps': 2747, 'loss/train': 1.8397449254989624} -09/21/2021 00:00:35 - INFO - __main__ - Step 43959: {'lr': 0.00019918973692350186, 'samples': 1406688, 'steps': 2747, 'loss/train': 1.925157070159912} -09/21/2021 00:00:35 - INFO - __main__ - Step 43960: {'lr': 0.00019918973692350186, 'samples': 1406720, 'steps': 2747, 'loss/train': 2.5756359100341797} -09/21/2021 00:00:36 - INFO - __main__ - Step 43961: {'lr': 0.00019918973692350186, 'samples': 1406752, 'steps': 2747, 'loss/train': 1.6203219890594482} -09/21/2021 00:00:37 - INFO - __main__ - Step 43962: {'lr': 0.00019918973692350186, 'samples': 1406784, 'steps': 2747, 'loss/train': 1.0004398822784424} -09/21/2021 00:00:38 - INFO - __main__ - Step 43963: {'lr': 0.00019918973692350186, 'samples': 1406816, 'steps': 2747, 'loss/train': 0.904202401638031} -09/21/2021 00:00:38 - INFO - __main__ - Step 43964: {'lr': 0.00019918973692350186, 'samples': 1406848, 'steps': 2747, 'loss/train': 2.8477590084075928} -09/21/2021 00:00:39 - INFO - __main__ - Step 43965: {'lr': 0.00019918973692350186, 'samples': 1406880, 'steps': 2747, 'loss/train': 2.317028522491455} -09/21/2021 00:00:40 - INFO - __main__ - Step 43966: {'lr': 0.00019918973692350186, 'samples': 1406912, 'steps': 2747, 'loss/train': 1.3671338558197021} -09/21/2021 00:00:41 - INFO - __main__ - Step 43967: {'lr': 0.00019918973692350186, 'samples': 1406944, 'steps': 2747, 'loss/train': 1.8646537065505981} -09/21/2021 00:00:41 - INFO - __main__ - Step 43968: {'lr': 0.00019918973692350186, 'samples': 1406976, 'steps': 2747, 'loss/train': 1.3246607780456543} -09/21/2021 00:00:42 - INFO - __main__ - Step 43969: {'lr': 0.00019918892633903834, 'samples': 1407008, 'steps': 2748, 'loss/train': 0.20013581216335297} -09/21/2021 00:00:43 - INFO - __main__ - Step 43970: {'lr': 0.00019918892633903834, 'samples': 1407040, 'steps': 2748, 'loss/train': 0.2174229621887207} -09/21/2021 00:00:44 - INFO - __main__ - Step 43971: {'lr': 0.00019918892633903834, 'samples': 1407072, 'steps': 2748, 'loss/train': 0.4988415241241455} -09/21/2021 00:00:45 - INFO - __main__ - Step 43972: {'lr': 0.00019918892633903834, 'samples': 1407104, 'steps': 2748, 'loss/train': 0.2867238223552704} -09/21/2021 00:00:45 - INFO - __main__ - Step 43973: {'lr': 0.00019918892633903834, 'samples': 1407136, 'steps': 2748, 'loss/train': 1.7501517534255981} -09/21/2021 00:00:46 - INFO - __main__ - Step 43974: {'lr': 0.00019918892633903834, 'samples': 1407168, 'steps': 2748, 'loss/train': 1.5933750867843628} -09/21/2021 00:00:47 - INFO - __main__ - Step 43975: {'lr': 0.00019918892633903834, 'samples': 1407200, 'steps': 2748, 'loss/train': 3.169968605041504} -09/21/2021 00:00:48 - INFO - __main__ - Step 43976: {'lr': 0.00019918892633903834, 'samples': 1407232, 'steps': 2748, 'loss/train': 2.5528109073638916} -09/21/2021 00:00:48 - INFO - __main__ - Step 43977: {'lr': 0.00019918892633903834, 'samples': 1407264, 'steps': 2748, 'loss/train': 0.8546589016914368} -09/21/2021 00:00:49 - INFO - __main__ - Step 43978: {'lr': 0.00019918892633903834, 'samples': 1407296, 'steps': 2748, 'loss/train': 1.6380709409713745} -09/21/2021 00:00:50 - INFO - __main__ - Step 43979: {'lr': 0.00019918892633903834, 'samples': 1407328, 'steps': 2748, 'loss/train': 2.1382339000701904} -09/21/2021 00:00:51 - INFO - __main__ - Step 43980: {'lr': 0.00019918892633903834, 'samples': 1407360, 'steps': 2748, 'loss/train': 1.2806469202041626} -09/21/2021 00:00:51 - INFO - __main__ - Step 43981: {'lr': 0.00019918892633903834, 'samples': 1407392, 'steps': 2748, 'loss/train': 1.8089216947555542} -09/21/2021 00:00:52 - INFO - __main__ - Step 43982: {'lr': 0.00019918892633903834, 'samples': 1407424, 'steps': 2748, 'loss/train': 2.3244829177856445} -09/21/2021 00:00:53 - INFO - __main__ - Step 43983: {'lr': 0.00019918892633903834, 'samples': 1407456, 'steps': 2748, 'loss/train': 2.412909984588623} -09/21/2021 00:00:54 - INFO - __main__ - Step 43984: {'lr': 0.00019918892633903834, 'samples': 1407488, 'steps': 2748, 'loss/train': 2.6233716011047363} -09/21/2021 00:00:54 - INFO - __main__ - Step 43985: {'lr': 0.00019918811535097543, 'samples': 1407520, 'steps': 2749, 'loss/train': 2.1609013080596924} -09/21/2021 00:00:55 - INFO - __main__ - Step 43986: {'lr': 0.00019918811535097543, 'samples': 1407552, 'steps': 2749, 'loss/train': 2.1056573390960693} -09/21/2021 00:00:56 - INFO - __main__ - Step 43987: {'lr': 0.00019918811535097543, 'samples': 1407584, 'steps': 2749, 'loss/train': 2.4229886531829834} -09/21/2021 00:00:57 - INFO - __main__ - Step 43988: {'lr': 0.00019918811535097543, 'samples': 1407616, 'steps': 2749, 'loss/train': 0.2326723337173462} -09/21/2021 00:00:57 - INFO - __main__ - Step 43989: {'lr': 0.00019918811535097543, 'samples': 1407648, 'steps': 2749, 'loss/train': 2.4607906341552734} -09/21/2021 00:00:59 - INFO - __main__ - Step 43990: {'lr': 0.00019918811535097543, 'samples': 1407680, 'steps': 2749, 'loss/train': 2.1056346893310547} -09/21/2021 00:00:59 - INFO - __main__ - Step 43991: {'lr': 0.00019918811535097543, 'samples': 1407712, 'steps': 2749, 'loss/train': 1.870975136756897} -09/21/2021 00:01:00 - INFO - __main__ - Step 43992: {'lr': 0.00019918811535097543, 'samples': 1407744, 'steps': 2749, 'loss/train': 0.3788890540599823} -09/21/2021 00:01:01 - INFO - __main__ - Step 43993: {'lr': 0.00019918811535097543, 'samples': 1407776, 'steps': 2749, 'loss/train': 2.237624406814575} -09/21/2021 00:01:02 - INFO - __main__ - Step 43994: {'lr': 0.00019918811535097543, 'samples': 1407808, 'steps': 2749, 'loss/train': 0.6318562030792236} -09/21/2021 00:01:02 - INFO - __main__ - Step 43995: {'lr': 0.00019918811535097543, 'samples': 1407840, 'steps': 2749, 'loss/train': 2.1265010833740234} -09/21/2021 00:01:03 - INFO - __main__ - Step 43996: {'lr': 0.00019918811535097543, 'samples': 1407872, 'steps': 2749, 'loss/train': 3.046416997909546} -09/21/2021 00:01:04 - INFO - __main__ - Step 43997: {'lr': 0.00019918811535097543, 'samples': 1407904, 'steps': 2749, 'loss/train': 1.976608157157898} -09/21/2021 00:01:05 - INFO - __main__ - Step 43998: {'lr': 0.00019918811535097543, 'samples': 1407936, 'steps': 2749, 'loss/train': 1.6572163105010986} -09/21/2021 00:01:05 - INFO - __main__ - Step 43999: {'lr': 0.00019918811535097543, 'samples': 1407968, 'steps': 2749, 'loss/train': 1.4218554496765137} -09/21/2021 00:01:06 - INFO - __main__ - Step 44000: {'lr': 0.00019918811535097543, 'samples': 1408000, 'steps': 2749, 'loss/train': 2.846083641052246} -09/21/2021 00:01:07 - INFO - __main__ - Step 44001: {'lr': 0.00019918730395931649, 'samples': 1408032, 'steps': 2750, 'loss/train': 2.4953224658966064} -09/21/2021 00:01:08 - INFO - __main__ - Step 44002: {'lr': 0.00019918730395931649, 'samples': 1408064, 'steps': 2750, 'loss/train': 1.8915504217147827} -09/21/2021 00:01:09 - INFO - __main__ - Step 44003: {'lr': 0.00019918730395931649, 'samples': 1408096, 'steps': 2750, 'loss/train': 1.5882630348205566} -09/21/2021 00:01:09 - INFO - __main__ - Step 44004: {'lr': 0.00019918730395931649, 'samples': 1408128, 'steps': 2750, 'loss/train': 1.7042137384414673} -09/21/2021 00:01:10 - INFO - __main__ - Step 44005: {'lr': 0.00019918730395931649, 'samples': 1408160, 'steps': 2750, 'loss/train': 1.4949893951416016} -09/21/2021 00:01:11 - INFO - __main__ - Step 44006: {'lr': 0.00019918730395931649, 'samples': 1408192, 'steps': 2750, 'loss/train': 1.8852074146270752} -09/21/2021 00:01:12 - INFO - __main__ - Step 44007: {'lr': 0.00019918730395931649, 'samples': 1408224, 'steps': 2750, 'loss/train': 1.150416612625122} -09/21/2021 00:01:12 - INFO - __main__ - Step 44008: {'lr': 0.00019918730395931649, 'samples': 1408256, 'steps': 2750, 'loss/train': 2.489071846008301} -09/21/2021 00:01:13 - INFO - __main__ - Step 44009: {'lr': 0.00019918730395931649, 'samples': 1408288, 'steps': 2750, 'loss/train': 2.3547449111938477} -09/21/2021 00:01:14 - INFO - __main__ - Step 44010: {'lr': 0.00019918730395931649, 'samples': 1408320, 'steps': 2750, 'loss/train': 2.652200222015381} -09/21/2021 00:01:15 - INFO - __main__ - Step 44011: {'lr': 0.00019918730395931649, 'samples': 1408352, 'steps': 2750, 'loss/train': 2.4073336124420166} -09/21/2021 00:01:15 - INFO - __main__ - Step 44012: {'lr': 0.00019918730395931649, 'samples': 1408384, 'steps': 2750, 'loss/train': 1.7336740493774414} -09/21/2021 00:01:16 - INFO - __main__ - Step 44013: {'lr': 0.00019918730395931649, 'samples': 1408416, 'steps': 2750, 'loss/train': 2.2966151237487793} -09/21/2021 00:01:17 - INFO - __main__ - Step 44014: {'lr': 0.00019918730395931649, 'samples': 1408448, 'steps': 2750, 'loss/train': 2.5861494541168213} -09/21/2021 00:01:18 - INFO - __main__ - Step 44015: {'lr': 0.00019918730395931649, 'samples': 1408480, 'steps': 2750, 'loss/train': 1.71122145652771} -09/21/2021 00:01:18 - INFO - __main__ - Step 44016: {'lr': 0.00019918730395931649, 'samples': 1408512, 'steps': 2750, 'loss/train': 2.037238359451294} -09/21/2021 00:01:19 - INFO - __main__ - Step 44017: {'lr': 0.0001991864921640648, 'samples': 1408544, 'steps': 2751, 'loss/train': 1.6483285427093506} -09/21/2021 00:01:20 - INFO - __main__ - Step 44018: {'lr': 0.0001991864921640648, 'samples': 1408576, 'steps': 2751, 'loss/train': 1.9661694765090942} -09/21/2021 00:01:21 - INFO - __main__ - Step 44019: {'lr': 0.0001991864921640648, 'samples': 1408608, 'steps': 2751, 'loss/train': 2.1383564472198486} -09/21/2021 00:01:22 - INFO - __main__ - Step 44020: {'lr': 0.0001991864921640648, 'samples': 1408640, 'steps': 2751, 'loss/train': 2.1900765895843506} -09/21/2021 00:01:23 - INFO - __main__ - Step 44021: {'lr': 0.0001991864921640648, 'samples': 1408672, 'steps': 2751, 'loss/train': 2.805431365966797} -09/21/2021 00:01:24 - INFO - __main__ - Step 44022: {'lr': 0.0001991864921640648, 'samples': 1408704, 'steps': 2751, 'loss/train': 2.7375972270965576} -09/21/2021 00:01:24 - INFO - __main__ - Step 44023: {'lr': 0.0001991864921640648, 'samples': 1408736, 'steps': 2751, 'loss/train': 2.303658962249756} -09/21/2021 00:01:25 - INFO - __main__ - Step 44024: {'lr': 0.0001991864921640648, 'samples': 1408768, 'steps': 2751, 'loss/train': 2.189335346221924} -09/21/2021 00:01:26 - INFO - __main__ - Step 44025: {'lr': 0.0001991864921640648, 'samples': 1408800, 'steps': 2751, 'loss/train': 2.570392370223999} -09/21/2021 00:01:27 - INFO - __main__ - Step 44026: {'lr': 0.0001991864921640648, 'samples': 1408832, 'steps': 2751, 'loss/train': 1.9689056873321533} -09/21/2021 00:01:27 - INFO - __main__ - Step 44027: {'lr': 0.0001991864921640648, 'samples': 1408864, 'steps': 2751, 'loss/train': 2.2767765522003174} -09/21/2021 00:01:28 - INFO - __main__ - Step 44028: {'lr': 0.0001991864921640648, 'samples': 1408896, 'steps': 2751, 'loss/train': 1.4595998525619507} -09/21/2021 00:01:29 - INFO - __main__ - Step 44029: {'lr': 0.0001991864921640648, 'samples': 1408928, 'steps': 2751, 'loss/train': 3.3987343311309814} -09/21/2021 00:01:30 - INFO - __main__ - Step 44030: {'lr': 0.0001991864921640648, 'samples': 1408960, 'steps': 2751, 'loss/train': 2.3306100368499756} -09/21/2021 00:01:30 - INFO - __main__ - Step 44031: {'lr': 0.0001991864921640648, 'samples': 1408992, 'steps': 2751, 'loss/train': 1.9602627754211426} -09/21/2021 00:01:31 - INFO - __main__ - Step 44032: {'lr': 0.0001991864921640648, 'samples': 1409024, 'steps': 2751, 'loss/train': 1.2083311080932617} -09/21/2021 00:01:32 - INFO - __main__ - Step 44033: {'lr': 0.00019918567996522364, 'samples': 1409056, 'steps': 2752, 'loss/train': 2.1089913845062256} -09/21/2021 00:01:33 - INFO - __main__ - Step 44034: {'lr': 0.00019918567996522364, 'samples': 1409088, 'steps': 2752, 'loss/train': 1.083640694618225} -09/21/2021 00:01:33 - INFO - __main__ - Step 44035: {'lr': 0.00019918567996522364, 'samples': 1409120, 'steps': 2752, 'loss/train': 2.6893410682678223} -09/21/2021 00:01:34 - INFO - __main__ - Step 44036: {'lr': 0.00019918567996522364, 'samples': 1409152, 'steps': 2752, 'loss/train': 2.7884130477905273} -09/21/2021 00:01:35 - INFO - __main__ - Step 44037: {'lr': 0.00019918567996522364, 'samples': 1409184, 'steps': 2752, 'loss/train': 2.3591043949127197} -09/21/2021 00:01:36 - INFO - __main__ - Step 44038: {'lr': 0.00019918567996522364, 'samples': 1409216, 'steps': 2752, 'loss/train': 1.8090182542800903} -09/21/2021 00:01:36 - INFO - __main__ - Step 44039: {'lr': 0.00019918567996522364, 'samples': 1409248, 'steps': 2752, 'loss/train': 1.6404199600219727} -09/21/2021 00:01:37 - INFO - __main__ - Step 44040: {'lr': 0.00019918567996522364, 'samples': 1409280, 'steps': 2752, 'loss/train': 2.101395845413208} -09/21/2021 00:01:38 - INFO - __main__ - Step 44041: {'lr': 0.00019918567996522364, 'samples': 1409312, 'steps': 2752, 'loss/train': 1.4764387607574463} -09/21/2021 00:01:39 - INFO - __main__ - Step 44042: {'lr': 0.00019918567996522364, 'samples': 1409344, 'steps': 2752, 'loss/train': 1.8531140089035034} -09/21/2021 00:01:39 - INFO - __main__ - Step 44043: {'lr': 0.00019918567996522364, 'samples': 1409376, 'steps': 2752, 'loss/train': 1.674148440361023} -09/21/2021 00:01:40 - INFO - __main__ - Step 44044: {'lr': 0.00019918567996522364, 'samples': 1409408, 'steps': 2752, 'loss/train': 2.2872321605682373} -09/21/2021 00:01:41 - INFO - __main__ - Step 44045: {'lr': 0.00019918567996522364, 'samples': 1409440, 'steps': 2752, 'loss/train': 1.7856354713439941} -09/21/2021 00:01:42 - INFO - __main__ - Step 44046: {'lr': 0.00019918567996522364, 'samples': 1409472, 'steps': 2752, 'loss/train': 1.7564711570739746} -09/21/2021 00:01:42 - INFO - __main__ - Step 44047: {'lr': 0.00019918567996522364, 'samples': 1409504, 'steps': 2752, 'loss/train': 2.333519697189331} -09/21/2021 00:01:43 - INFO - __main__ - Step 44048: {'lr': 0.00019918567996522364, 'samples': 1409536, 'steps': 2752, 'loss/train': 1.6614372730255127} -09/21/2021 00:01:44 - INFO - __main__ - Step 44049: {'lr': 0.00019918486736279634, 'samples': 1409568, 'steps': 2753, 'loss/train': 3.055891513824463} -09/21/2021 00:01:45 - INFO - __main__ - Step 44050: {'lr': 0.00019918486736279634, 'samples': 1409600, 'steps': 2753, 'loss/train': 1.674820899963379} -09/21/2021 00:01:46 - INFO - __main__ - Step 44051: {'lr': 0.00019918486736279634, 'samples': 1409632, 'steps': 2753, 'loss/train': 2.472670793533325} -09/21/2021 00:01:47 - INFO - __main__ - Step 44052: {'lr': 0.00019918486736279634, 'samples': 1409664, 'steps': 2753, 'loss/train': 2.1697909832000732} -09/21/2021 00:01:48 - INFO - __main__ - Step 44053: {'lr': 0.00019918486736279634, 'samples': 1409696, 'steps': 2753, 'loss/train': 1.543900489807129} -09/21/2021 00:01:48 - INFO - __main__ - Step 44054: {'lr': 0.00019918486736279634, 'samples': 1409728, 'steps': 2753, 'loss/train': 1.0887454748153687} -09/21/2021 00:01:49 - INFO - __main__ - Step 44055: {'lr': 0.00019918486736279634, 'samples': 1409760, 'steps': 2753, 'loss/train': 1.5376640558242798} -09/21/2021 00:01:50 - INFO - __main__ - Step 44056: {'lr': 0.00019918486736279634, 'samples': 1409792, 'steps': 2753, 'loss/train': 2.6668031215667725} -09/21/2021 00:01:51 - INFO - __main__ - Step 44057: {'lr': 0.00019918486736279634, 'samples': 1409824, 'steps': 2753, 'loss/train': 0.5438374876976013} -09/21/2021 00:01:51 - INFO - __main__ - Step 44058: {'lr': 0.00019918486736279634, 'samples': 1409856, 'steps': 2753, 'loss/train': 1.8141337633132935} -09/21/2021 00:01:52 - INFO - __main__ - Step 44059: {'lr': 0.00019918486736279634, 'samples': 1409888, 'steps': 2753, 'loss/train': 2.3588593006134033} -09/21/2021 00:01:53 - INFO - __main__ - Step 44060: {'lr': 0.00019918486736279634, 'samples': 1409920, 'steps': 2753, 'loss/train': 2.0912110805511475} -09/21/2021 00:01:54 - INFO - __main__ - Step 44061: {'lr': 0.00019918486736279634, 'samples': 1409952, 'steps': 2753, 'loss/train': 2.1524417400360107} -09/21/2021 00:01:54 - INFO - __main__ - Step 44062: {'lr': 0.00019918486736279634, 'samples': 1409984, 'steps': 2753, 'loss/train': 2.3382456302642822} -09/21/2021 00:01:55 - INFO - __main__ - Step 44063: {'lr': 0.00019918486736279634, 'samples': 1410016, 'steps': 2753, 'loss/train': 2.252998113632202} -09/21/2021 00:01:56 - INFO - __main__ - Step 44064: {'lr': 0.00019918486736279634, 'samples': 1410048, 'steps': 2753, 'loss/train': 2.247910261154175} -09/21/2021 00:01:57 - INFO - __main__ - Step 44065: {'lr': 0.00019918405435678617, 'samples': 1410080, 'steps': 2754, 'loss/train': 1.577308177947998} -09/21/2021 00:01:57 - INFO - __main__ - Step 44066: {'lr': 0.00019918405435678617, 'samples': 1410112, 'steps': 2754, 'loss/train': 1.9708547592163086} -09/21/2021 00:01:58 - INFO - __main__ - Step 44067: {'lr': 0.00019918405435678617, 'samples': 1410144, 'steps': 2754, 'loss/train': 1.2679007053375244} -09/21/2021 00:01:59 - INFO - __main__ - Step 44068: {'lr': 0.00019918405435678617, 'samples': 1410176, 'steps': 2754, 'loss/train': 1.5979704856872559} -09/21/2021 00:02:00 - INFO - __main__ - Step 44069: {'lr': 0.00019918405435678617, 'samples': 1410208, 'steps': 2754, 'loss/train': 2.3985626697540283} -09/21/2021 00:02:00 - INFO - __main__ - Step 44070: {'lr': 0.00019918405435678617, 'samples': 1410240, 'steps': 2754, 'loss/train': 1.9566278457641602} -09/21/2021 00:02:01 - INFO - __main__ - Step 44071: {'lr': 0.00019918405435678617, 'samples': 1410272, 'steps': 2754, 'loss/train': 1.6128003597259521} -09/21/2021 00:02:02 - INFO - __main__ - Step 44072: {'lr': 0.00019918405435678617, 'samples': 1410304, 'steps': 2754, 'loss/train': 1.9330730438232422} -09/21/2021 00:02:03 - INFO - __main__ - Step 44073: {'lr': 0.00019918405435678617, 'samples': 1410336, 'steps': 2754, 'loss/train': 2.374089002609253} -09/21/2021 00:02:03 - INFO - __main__ - Step 44074: {'lr': 0.00019918405435678617, 'samples': 1410368, 'steps': 2754, 'loss/train': 2.4980227947235107} -09/21/2021 00:02:04 - INFO - __main__ - Step 44075: {'lr': 0.00019918405435678617, 'samples': 1410400, 'steps': 2754, 'loss/train': 2.260230779647827} -09/21/2021 00:02:05 - INFO - __main__ - Step 44076: {'lr': 0.00019918405435678617, 'samples': 1410432, 'steps': 2754, 'loss/train': 2.3790082931518555} -09/21/2021 00:02:06 - INFO - __main__ - Step 44077: {'lr': 0.00019918405435678617, 'samples': 1410464, 'steps': 2754, 'loss/train': 2.5129244327545166} -09/21/2021 00:02:06 - INFO - __main__ - Step 44078: {'lr': 0.00019918405435678617, 'samples': 1410496, 'steps': 2754, 'loss/train': 3.6298794746398926} -09/21/2021 00:02:07 - INFO - __main__ - Step 44079: {'lr': 0.00019918405435678617, 'samples': 1410528, 'steps': 2754, 'loss/train': 1.9322429895401} -09/21/2021 00:02:08 - INFO - __main__ - Step 44080: {'lr': 0.00019918405435678617, 'samples': 1410560, 'steps': 2754, 'loss/train': 2.1441845893859863} -09/21/2021 00:02:09 - INFO - __main__ - Step 44081: {'lr': 0.00019918324094719651, 'samples': 1410592, 'steps': 2755, 'loss/train': 2.3294782638549805} -09/21/2021 00:02:10 - INFO - __main__ - Step 44082: {'lr': 0.00019918324094719651, 'samples': 1410624, 'steps': 2755, 'loss/train': 1.8058667182922363} -09/21/2021 00:02:11 - INFO - __main__ - Step 44083: {'lr': 0.00019918324094719651, 'samples': 1410656, 'steps': 2755, 'loss/train': 2.5459113121032715} -09/21/2021 00:02:12 - INFO - __main__ - Step 44084: {'lr': 0.00019918324094719651, 'samples': 1410688, 'steps': 2755, 'loss/train': 2.5513620376586914} -09/21/2021 00:02:13 - INFO - __main__ - Step 44085: {'lr': 0.00019918324094719651, 'samples': 1410720, 'steps': 2755, 'loss/train': 1.6005859375} -09/21/2021 00:02:14 - INFO - __main__ - Step 44086: {'lr': 0.00019918324094719651, 'samples': 1410752, 'steps': 2755, 'loss/train': 1.5799976587295532} -09/21/2021 00:02:14 - INFO - __main__ - Step 44087: {'lr': 0.00019918324094719651, 'samples': 1410784, 'steps': 2755, 'loss/train': 2.2575747966766357} -09/21/2021 00:02:15 - INFO - __main__ - Step 44088: {'lr': 0.00019918324094719651, 'samples': 1410816, 'steps': 2755, 'loss/train': 2.124742269515991} -09/21/2021 00:02:16 - INFO - __main__ - Step 44089: {'lr': 0.00019918324094719651, 'samples': 1410848, 'steps': 2755, 'loss/train': 1.4308130741119385} -09/21/2021 00:02:17 - INFO - __main__ - Step 44090: {'lr': 0.00019918324094719651, 'samples': 1410880, 'steps': 2755, 'loss/train': 2.4800164699554443} -09/21/2021 00:02:17 - INFO - __main__ - Step 44091: {'lr': 0.00019918324094719651, 'samples': 1410912, 'steps': 2755, 'loss/train': 2.1643736362457275} -09/21/2021 00:02:18 - INFO - __main__ - Step 44092: {'lr': 0.00019918324094719651, 'samples': 1410944, 'steps': 2755, 'loss/train': 1.9091744422912598} -09/21/2021 00:02:19 - INFO - __main__ - Step 44093: {'lr': 0.00019918324094719651, 'samples': 1410976, 'steps': 2755, 'loss/train': 2.7200980186462402} -09/21/2021 00:02:20 - INFO - __main__ - Step 44094: {'lr': 0.00019918324094719651, 'samples': 1411008, 'steps': 2755, 'loss/train': 0.25109782814979553} -09/21/2021 00:02:20 - INFO - __main__ - Step 44095: {'lr': 0.00019918324094719651, 'samples': 1411040, 'steps': 2755, 'loss/train': 0.2116667926311493} -09/21/2021 00:02:21 - INFO - __main__ - Step 44096: {'lr': 0.00019918324094719651, 'samples': 1411072, 'steps': 2755, 'loss/train': 0.26608163118362427} -09/21/2021 00:02:22 - INFO - __main__ - Step 44097: {'lr': 0.00019918242713403062, 'samples': 1411104, 'steps': 2756, 'loss/train': 2.5828158855438232} -09/21/2021 00:02:23 - INFO - __main__ - Step 44098: {'lr': 0.00019918242713403062, 'samples': 1411136, 'steps': 2756, 'loss/train': 1.9097325801849365} -09/21/2021 00:02:23 - INFO - __main__ - Step 44099: {'lr': 0.00019918242713403062, 'samples': 1411168, 'steps': 2756, 'loss/train': 2.529592990875244} -09/21/2021 00:02:24 - INFO - __main__ - Step 44100: {'lr': 0.00019918242713403062, 'samples': 1411200, 'steps': 2756, 'loss/train': 1.4433941841125488} -09/21/2021 00:02:25 - INFO - __main__ - Step 44101: {'lr': 0.00019918242713403062, 'samples': 1411232, 'steps': 2756, 'loss/train': 3.3155014514923096} -09/21/2021 00:02:26 - INFO - __main__ - Step 44102: {'lr': 0.00019918242713403062, 'samples': 1411264, 'steps': 2756, 'loss/train': 1.4340555667877197} -09/21/2021 00:02:26 - INFO - __main__ - Step 44103: {'lr': 0.00019918242713403062, 'samples': 1411296, 'steps': 2756, 'loss/train': 0.9112686514854431} -09/21/2021 00:02:27 - INFO - __main__ - Step 44104: {'lr': 0.00019918242713403062, 'samples': 1411328, 'steps': 2756, 'loss/train': 1.1012717485427856} -09/21/2021 00:02:28 - INFO - __main__ - Step 44105: {'lr': 0.00019918242713403062, 'samples': 1411360, 'steps': 2756, 'loss/train': 2.608107805252075} -09/21/2021 00:02:29 - INFO - __main__ - Step 44106: {'lr': 0.00019918242713403062, 'samples': 1411392, 'steps': 2756, 'loss/train': 1.9492402076721191} -09/21/2021 00:02:29 - INFO - __main__ - Step 44107: {'lr': 0.00019918242713403062, 'samples': 1411424, 'steps': 2756, 'loss/train': 2.407426118850708} -09/21/2021 00:02:30 - INFO - __main__ - Step 44108: {'lr': 0.00019918242713403062, 'samples': 1411456, 'steps': 2756, 'loss/train': 1.8061981201171875} -09/21/2021 00:02:31 - INFO - __main__ - Step 44109: {'lr': 0.00019918242713403062, 'samples': 1411488, 'steps': 2756, 'loss/train': 2.0149006843566895} -09/21/2021 00:02:32 - INFO - __main__ - Step 44110: {'lr': 0.00019918242713403062, 'samples': 1411520, 'steps': 2756, 'loss/train': 2.631279230117798} -09/21/2021 00:02:32 - INFO - __main__ - Step 44111: {'lr': 0.00019918242713403062, 'samples': 1411552, 'steps': 2756, 'loss/train': 0.6320576667785645} -09/21/2021 00:02:33 - INFO - __main__ - Step 44112: {'lr': 0.00019918242713403062, 'samples': 1411584, 'steps': 2756, 'loss/train': 0.4712580740451813} -09/21/2021 00:02:34 - INFO - __main__ - Step 44113: {'lr': 0.00019918161291729183, 'samples': 1411616, 'steps': 2757, 'loss/train': 0.5588498711585999} -09/21/2021 00:02:35 - INFO - __main__ - Step 44114: {'lr': 0.00019918161291729183, 'samples': 1411648, 'steps': 2757, 'loss/train': 0.3874741494655609} -09/21/2021 00:02:36 - INFO - __main__ - Step 44115: {'lr': 0.00019918161291729183, 'samples': 1411680, 'steps': 2757, 'loss/train': 0.3556886911392212} -09/21/2021 00:02:36 - INFO - __main__ - Step 44116: {'lr': 0.00019918161291729183, 'samples': 1411712, 'steps': 2757, 'loss/train': 0.3780757784843445} -09/21/2021 00:02:37 - INFO - __main__ - Step 44117: {'lr': 0.00019918161291729183, 'samples': 1411744, 'steps': 2757, 'loss/train': 0.3949335515499115} -09/21/2021 00:02:38 - INFO - __main__ - Step 44118: {'lr': 0.00019918161291729183, 'samples': 1411776, 'steps': 2757, 'loss/train': 0.38414567708969116} -09/21/2021 00:02:39 - INFO - __main__ - Step 44119: {'lr': 0.00019918161291729183, 'samples': 1411808, 'steps': 2757, 'loss/train': 0.6685134768486023} -09/21/2021 00:02:40 - INFO - __main__ - Step 44120: {'lr': 0.00019918161291729183, 'samples': 1411840, 'steps': 2757, 'loss/train': 1.8584322929382324} -09/21/2021 00:02:41 - INFO - __main__ - Step 44121: {'lr': 0.00019918161291729183, 'samples': 1411872, 'steps': 2757, 'loss/train': 2.0478694438934326} -09/21/2021 00:02:41 - INFO - __main__ - Step 44122: {'lr': 0.00019918161291729183, 'samples': 1411904, 'steps': 2757, 'loss/train': 1.982539415359497} -09/21/2021 00:02:42 - INFO - __main__ - Step 44123: {'lr': 0.00019918161291729183, 'samples': 1411936, 'steps': 2757, 'loss/train': 2.483414888381958} -09/21/2021 00:02:43 - INFO - __main__ - Step 44124: {'lr': 0.00019918161291729183, 'samples': 1411968, 'steps': 2757, 'loss/train': 0.6451221704483032} -09/21/2021 00:02:44 - INFO - __main__ - Step 44125: {'lr': 0.00019918161291729183, 'samples': 1412000, 'steps': 2757, 'loss/train': 2.273076295852661} -09/21/2021 00:02:44 - INFO - __main__ - Step 44126: {'lr': 0.00019918161291729183, 'samples': 1412032, 'steps': 2757, 'loss/train': 2.5208420753479004} -09/21/2021 00:02:45 - INFO - __main__ - Step 44127: {'lr': 0.00019918161291729183, 'samples': 1412064, 'steps': 2757, 'loss/train': 2.767012357711792} -09/21/2021 00:02:46 - INFO - __main__ - Step 44128: {'lr': 0.00019918161291729183, 'samples': 1412096, 'steps': 2757, 'loss/train': 0.7280303835868835} -09/21/2021 00:02:47 - INFO - __main__ - Step 44129: {'lr': 0.00019918079829698342, 'samples': 1412128, 'steps': 2758, 'loss/train': 1.9620782136917114} -09/21/2021 00:02:48 - INFO - __main__ - Step 44130: {'lr': 0.00019918079829698342, 'samples': 1412160, 'steps': 2758, 'loss/train': 2.225471019744873} -09/21/2021 00:02:48 - INFO - __main__ - Step 44131: {'lr': 0.00019918079829698342, 'samples': 1412192, 'steps': 2758, 'loss/train': 2.1120080947875977} -09/21/2021 00:02:49 - INFO - __main__ - Step 44132: {'lr': 0.00019918079829698342, 'samples': 1412224, 'steps': 2758, 'loss/train': 2.0821564197540283} -09/21/2021 00:02:50 - INFO - __main__ - Step 44133: {'lr': 0.00019918079829698342, 'samples': 1412256, 'steps': 2758, 'loss/train': 2.877357244491577} -09/21/2021 00:02:51 - INFO - __main__ - Step 44134: {'lr': 0.00019918079829698342, 'samples': 1412288, 'steps': 2758, 'loss/train': 2.714890956878662} -09/21/2021 00:02:51 - INFO - __main__ - Step 44135: {'lr': 0.00019918079829698342, 'samples': 1412320, 'steps': 2758, 'loss/train': 2.765514850616455} -09/21/2021 00:02:52 - INFO - __main__ - Step 44136: {'lr': 0.00019918079829698342, 'samples': 1412352, 'steps': 2758, 'loss/train': 2.0210938453674316} -09/21/2021 00:02:53 - INFO - __main__ - Step 44137: {'lr': 0.00019918079829698342, 'samples': 1412384, 'steps': 2758, 'loss/train': 2.250181198120117} -09/21/2021 00:02:54 - INFO - __main__ - Step 44138: {'lr': 0.00019918079829698342, 'samples': 1412416, 'steps': 2758, 'loss/train': 2.699051856994629} -09/21/2021 00:02:54 - INFO - __main__ - Step 44139: {'lr': 0.00019918079829698342, 'samples': 1412448, 'steps': 2758, 'loss/train': 0.6635119915008545} -09/21/2021 00:02:55 - INFO - __main__ - Step 44140: {'lr': 0.00019918079829698342, 'samples': 1412480, 'steps': 2758, 'loss/train': 1.631209135055542} -09/21/2021 00:02:56 - INFO - __main__ - Step 44141: {'lr': 0.00019918079829698342, 'samples': 1412512, 'steps': 2758, 'loss/train': 0.4208945035934448} -09/21/2021 00:02:57 - INFO - __main__ - Step 44142: {'lr': 0.00019918079829698342, 'samples': 1412544, 'steps': 2758, 'loss/train': 1.506787896156311} -09/21/2021 00:02:57 - INFO - __main__ - Step 44143: {'lr': 0.00019918079829698342, 'samples': 1412576, 'steps': 2758, 'loss/train': 3.3623971939086914} -09/21/2021 00:02:58 - INFO - __main__ - Step 44144: {'lr': 0.00019918079829698342, 'samples': 1412608, 'steps': 2758, 'loss/train': 1.962652325630188} -09/21/2021 00:02:59 - INFO - __main__ - Step 44145: {'lr': 0.00019917998327310873, 'samples': 1412640, 'steps': 2759, 'loss/train': 1.9516456127166748} -09/21/2021 00:03:00 - INFO - __main__ - Step 44146: {'lr': 0.00019917998327310873, 'samples': 1412672, 'steps': 2759, 'loss/train': 3.446256160736084} -09/21/2021 00:03:00 - INFO - __main__ - Step 44147: {'lr': 0.00019917998327310873, 'samples': 1412704, 'steps': 2759, 'loss/train': 0.3496793508529663} -09/21/2021 00:03:01 - INFO - __main__ - Step 44148: {'lr': 0.00019917998327310873, 'samples': 1412736, 'steps': 2759, 'loss/train': 1.9304946660995483} -09/21/2021 00:03:02 - INFO - __main__ - Step 44149: {'lr': 0.00019917998327310873, 'samples': 1412768, 'steps': 2759, 'loss/train': 1.5785911083221436} -09/21/2021 00:03:03 - INFO - __main__ - Step 44150: {'lr': 0.00019917998327310873, 'samples': 1412800, 'steps': 2759, 'loss/train': 2.1217808723449707} -09/21/2021 00:03:03 - INFO - __main__ - Step 44151: {'lr': 0.00019917998327310873, 'samples': 1412832, 'steps': 2759, 'loss/train': 2.198800563812256} -09/21/2021 00:03:04 - INFO - __main__ - Step 44152: {'lr': 0.00019917998327310873, 'samples': 1412864, 'steps': 2759, 'loss/train': 1.856325626373291} -09/21/2021 00:03:05 - INFO - __main__ - Step 44153: {'lr': 0.00019917998327310873, 'samples': 1412896, 'steps': 2759, 'loss/train': 2.394415855407715} -09/21/2021 00:03:06 - INFO - __main__ - Step 44154: {'lr': 0.00019917998327310873, 'samples': 1412928, 'steps': 2759, 'loss/train': 1.5857534408569336} -09/21/2021 00:03:07 - INFO - __main__ - Step 44155: {'lr': 0.00019917998327310873, 'samples': 1412960, 'steps': 2759, 'loss/train': 1.9591975212097168} -09/21/2021 00:03:08 - INFO - __main__ - Step 44156: {'lr': 0.00019917998327310873, 'samples': 1412992, 'steps': 2759, 'loss/train': 2.954650402069092} -09/21/2021 00:03:08 - INFO - __main__ - Step 44157: {'lr': 0.00019917998327310873, 'samples': 1413024, 'steps': 2759, 'loss/train': 2.257075071334839} -09/21/2021 00:03:09 - INFO - __main__ - Step 44158: {'lr': 0.00019917998327310873, 'samples': 1413056, 'steps': 2759, 'loss/train': 4.194089889526367} -09/21/2021 00:03:10 - INFO - __main__ - Step 44159: {'lr': 0.00019917998327310873, 'samples': 1413088, 'steps': 2759, 'loss/train': 2.379307270050049} -09/21/2021 00:03:11 - INFO - __main__ - Step 44160: {'lr': 0.00019917998327310873, 'samples': 1413120, 'steps': 2759, 'loss/train': 2.413668632507324} -09/21/2021 00:03:12 - INFO - __main__ - Step 44161: {'lr': 0.00019917916784567105, 'samples': 1413152, 'steps': 2760, 'loss/train': 2.4709722995758057} -09/21/2021 00:03:12 - INFO - __main__ - Step 44162: {'lr': 0.00019917916784567105, 'samples': 1413184, 'steps': 2760, 'loss/train': 2.4371581077575684} -09/21/2021 00:03:13 - INFO - __main__ - Step 44163: {'lr': 0.00019917916784567105, 'samples': 1413216, 'steps': 2760, 'loss/train': 1.891503930091858} -09/21/2021 00:03:14 - INFO - __main__ - Step 44164: {'lr': 0.00019917916784567105, 'samples': 1413248, 'steps': 2760, 'loss/train': 0.7942416667938232} -09/21/2021 00:03:15 - INFO - __main__ - Step 44165: {'lr': 0.00019917916784567105, 'samples': 1413280, 'steps': 2760, 'loss/train': 1.0649586915969849} -09/21/2021 00:03:15 - INFO - __main__ - Step 44166: {'lr': 0.00019917916784567105, 'samples': 1413312, 'steps': 2760, 'loss/train': 2.82210373878479} -09/21/2021 00:03:16 - INFO - __main__ - Step 44167: {'lr': 0.00019917916784567105, 'samples': 1413344, 'steps': 2760, 'loss/train': 1.9875363111495972} -09/21/2021 00:03:17 - INFO - __main__ - Step 44168: {'lr': 0.00019917916784567105, 'samples': 1413376, 'steps': 2760, 'loss/train': 2.7340023517608643} -09/21/2021 00:03:18 - INFO - __main__ - Step 44169: {'lr': 0.00019917916784567105, 'samples': 1413408, 'steps': 2760, 'loss/train': 1.908670425415039} -09/21/2021 00:03:18 - INFO - __main__ - Step 44170: {'lr': 0.00019917916784567105, 'samples': 1413440, 'steps': 2760, 'loss/train': 3.7015535831451416} -09/21/2021 00:03:19 - INFO - __main__ - Step 44171: {'lr': 0.00019917916784567105, 'samples': 1413472, 'steps': 2760, 'loss/train': 3.5044872760772705} -09/21/2021 00:03:20 - INFO - __main__ - Step 44172: {'lr': 0.00019917916784567105, 'samples': 1413504, 'steps': 2760, 'loss/train': 2.9913501739501953} -09/21/2021 00:03:21 - INFO - __main__ - Step 44173: {'lr': 0.00019917916784567105, 'samples': 1413536, 'steps': 2760, 'loss/train': 1.7641403675079346} -09/21/2021 00:03:21 - INFO - __main__ - Step 44174: {'lr': 0.00019917916784567105, 'samples': 1413568, 'steps': 2760, 'loss/train': 3.010979652404785} -09/21/2021 00:03:22 - INFO - __main__ - Step 44175: {'lr': 0.00019917916784567105, 'samples': 1413600, 'steps': 2760, 'loss/train': 2.2347500324249268} -09/21/2021 00:03:23 - INFO - __main__ - Step 44176: {'lr': 0.00019917916784567105, 'samples': 1413632, 'steps': 2760, 'loss/train': 1.8790020942687988} -09/21/2021 00:03:24 - INFO - __main__ - Step 44177: {'lr': 0.00019917835201467375, 'samples': 1413664, 'steps': 2761, 'loss/train': 2.136143207550049} -09/21/2021 00:03:25 - INFO - __main__ - Step 44178: {'lr': 0.00019917835201467375, 'samples': 1413696, 'steps': 2761, 'loss/train': 2.263983964920044} -09/21/2021 00:03:25 - INFO - __main__ - Step 44179: {'lr': 0.00019917835201467375, 'samples': 1413728, 'steps': 2761, 'loss/train': 2.4255058765411377} -09/21/2021 00:03:26 - INFO - __main__ - Step 44180: {'lr': 0.00019917835201467375, 'samples': 1413760, 'steps': 2761, 'loss/train': 2.130530595779419} -09/21/2021 00:03:27 - INFO - __main__ - Step 44181: {'lr': 0.00019917835201467375, 'samples': 1413792, 'steps': 2761, 'loss/train': 1.9312617778778076} -09/21/2021 00:03:27 - INFO - __main__ - Step 44182: {'lr': 0.00019917835201467375, 'samples': 1413824, 'steps': 2761, 'loss/train': 1.6952322721481323} -09/21/2021 00:03:29 - INFO - __main__ - Step 44183: {'lr': 0.00019917835201467375, 'samples': 1413856, 'steps': 2761, 'loss/train': 1.1869827508926392} -09/21/2021 00:03:30 - INFO - __main__ - Step 44184: {'lr': 0.00019917835201467375, 'samples': 1413888, 'steps': 2761, 'loss/train': 1.7567353248596191} -09/21/2021 00:03:30 - INFO - __main__ - Step 44185: {'lr': 0.00019917835201467375, 'samples': 1413920, 'steps': 2761, 'loss/train': 1.305261492729187} -09/21/2021 00:03:31 - INFO - __main__ - Step 44186: {'lr': 0.00019917835201467375, 'samples': 1413952, 'steps': 2761, 'loss/train': 2.278718948364258} -09/21/2021 00:03:32 - INFO - __main__ - Step 44187: {'lr': 0.00019917835201467375, 'samples': 1413984, 'steps': 2761, 'loss/train': 1.642391324043274} -09/21/2021 00:03:33 - INFO - __main__ - Step 44188: {'lr': 0.00019917835201467375, 'samples': 1414016, 'steps': 2761, 'loss/train': 0.9841243624687195} -09/21/2021 00:03:33 - INFO - __main__ - Step 44189: {'lr': 0.00019917835201467375, 'samples': 1414048, 'steps': 2761, 'loss/train': 1.8467670679092407} -09/21/2021 00:03:34 - INFO - __main__ - Step 44190: {'lr': 0.00019917835201467375, 'samples': 1414080, 'steps': 2761, 'loss/train': 2.65740704536438} -09/21/2021 00:03:35 - INFO - __main__ - Step 44191: {'lr': 0.00019917835201467375, 'samples': 1414112, 'steps': 2761, 'loss/train': 1.5249239206314087} -09/21/2021 00:03:36 - INFO - __main__ - Step 44192: {'lr': 0.00019917835201467375, 'samples': 1414144, 'steps': 2761, 'loss/train': 2.781074285507202} -09/21/2021 00:03:37 - INFO - __main__ - Step 44193: {'lr': 0.00019917753578012012, 'samples': 1414176, 'steps': 2762, 'loss/train': 2.3089332580566406} -09/21/2021 00:03:37 - INFO - __main__ - Step 44194: {'lr': 0.00019917753578012012, 'samples': 1414208, 'steps': 2762, 'loss/train': 2.0832788944244385} -09/21/2021 00:03:38 - INFO - __main__ - Step 44195: {'lr': 0.00019917753578012012, 'samples': 1414240, 'steps': 2762, 'loss/train': 0.5177257657051086} -09/21/2021 00:03:39 - INFO - __main__ - Step 44196: {'lr': 0.00019917753578012012, 'samples': 1414272, 'steps': 2762, 'loss/train': 1.0533798933029175} -09/21/2021 00:03:40 - INFO - __main__ - Step 44197: {'lr': 0.00019917753578012012, 'samples': 1414304, 'steps': 2762, 'loss/train': 3.151292085647583} -09/21/2021 00:03:40 - INFO - __main__ - Step 44198: {'lr': 0.00019917753578012012, 'samples': 1414336, 'steps': 2762, 'loss/train': 2.0382089614868164} -09/21/2021 00:03:41 - INFO - __main__ - Step 44199: {'lr': 0.00019917753578012012, 'samples': 1414368, 'steps': 2762, 'loss/train': 1.6885035037994385} -09/21/2021 00:03:42 - INFO - __main__ - Step 44200: {'lr': 0.00019917753578012012, 'samples': 1414400, 'steps': 2762, 'loss/train': 1.913435935974121} -09/21/2021 00:03:43 - INFO - __main__ - Step 44201: {'lr': 0.00019917753578012012, 'samples': 1414432, 'steps': 2762, 'loss/train': 1.74830961227417} -09/21/2021 00:03:43 - INFO - __main__ - Step 44202: {'lr': 0.00019917753578012012, 'samples': 1414464, 'steps': 2762, 'loss/train': 1.8722954988479614} -09/21/2021 00:03:44 - INFO - __main__ - Step 44203: {'lr': 0.00019917753578012012, 'samples': 1414496, 'steps': 2762, 'loss/train': 2.506591558456421} -09/21/2021 00:03:45 - INFO - __main__ - Step 44204: {'lr': 0.00019917753578012012, 'samples': 1414528, 'steps': 2762, 'loss/train': 2.8860316276550293} -09/21/2021 00:03:46 - INFO - __main__ - Step 44205: {'lr': 0.00019917753578012012, 'samples': 1414560, 'steps': 2762, 'loss/train': 1.983992338180542} -09/21/2021 00:03:46 - INFO - __main__ - Step 44206: {'lr': 0.00019917753578012012, 'samples': 1414592, 'steps': 2762, 'loss/train': 1.903939127922058} -09/21/2021 00:03:47 - INFO - __main__ - Step 44207: {'lr': 0.00019917753578012012, 'samples': 1414624, 'steps': 2762, 'loss/train': 1.4163100719451904} -09/21/2021 00:03:48 - INFO - __main__ - Step 44208: {'lr': 0.00019917753578012012, 'samples': 1414656, 'steps': 2762, 'loss/train': 2.0674705505371094} -09/21/2021 00:03:49 - INFO - __main__ - Step 44209: {'lr': 0.00019917671914201348, 'samples': 1414688, 'steps': 2763, 'loss/train': 2.1475236415863037} -09/21/2021 00:03:49 - INFO - __main__ - Step 44210: {'lr': 0.00019917671914201348, 'samples': 1414720, 'steps': 2763, 'loss/train': 2.0824172496795654} -09/21/2021 00:03:50 - INFO - __main__ - Step 44211: {'lr': 0.00019917671914201348, 'samples': 1414752, 'steps': 2763, 'loss/train': 1.9916369915008545} -09/21/2021 00:03:51 - INFO - __main__ - Step 44212: {'lr': 0.00019917671914201348, 'samples': 1414784, 'steps': 2763, 'loss/train': 0.9801046848297119} -09/21/2021 00:03:53 - INFO - __main__ - Step 44213: {'lr': 0.00019917671914201348, 'samples': 1414816, 'steps': 2763, 'loss/train': 1.9815574884414673} -09/21/2021 00:03:53 - INFO - __main__ - Step 44214: {'lr': 0.00019917671914201348, 'samples': 1414848, 'steps': 2763, 'loss/train': 2.4460017681121826} -09/21/2021 00:03:54 - INFO - __main__ - Step 44215: {'lr': 0.00019917671914201348, 'samples': 1414880, 'steps': 2763, 'loss/train': 2.3645670413970947} -09/21/2021 00:03:55 - INFO - __main__ - Step 44216: {'lr': 0.00019917671914201348, 'samples': 1414912, 'steps': 2763, 'loss/train': 1.8899658918380737} -09/21/2021 00:03:56 - INFO - __main__ - Step 44217: {'lr': 0.00019917671914201348, 'samples': 1414944, 'steps': 2763, 'loss/train': 2.9887351989746094} -09/21/2021 00:03:56 - INFO - __main__ - Step 44218: {'lr': 0.00019917671914201348, 'samples': 1414976, 'steps': 2763, 'loss/train': 1.7375643253326416} -09/21/2021 00:03:57 - INFO - __main__ - Step 44219: {'lr': 0.00019917671914201348, 'samples': 1415008, 'steps': 2763, 'loss/train': 0.7893490791320801} -09/21/2021 00:03:58 - INFO - __main__ - Step 44220: {'lr': 0.00019917671914201348, 'samples': 1415040, 'steps': 2763, 'loss/train': 1.6226577758789062} -09/21/2021 00:03:59 - INFO - __main__ - Step 44221: {'lr': 0.00019917671914201348, 'samples': 1415072, 'steps': 2763, 'loss/train': 1.6730504035949707} -09/21/2021 00:03:59 - INFO - __main__ - Step 44222: {'lr': 0.00019917671914201348, 'samples': 1415104, 'steps': 2763, 'loss/train': 0.4932379126548767} -09/21/2021 00:04:00 - INFO - __main__ - Step 44223: {'lr': 0.00019917671914201348, 'samples': 1415136, 'steps': 2763, 'loss/train': 2.031707763671875} -09/21/2021 00:04:01 - INFO - __main__ - Step 44224: {'lr': 0.00019917671914201348, 'samples': 1415168, 'steps': 2763, 'loss/train': 2.2516000270843506} -09/21/2021 00:04:02 - INFO - __main__ - Step 44225: {'lr': 0.00019917590210035715, 'samples': 1415200, 'steps': 2764, 'loss/train': 2.2820987701416016} -09/21/2021 00:04:03 - INFO - __main__ - Step 44226: {'lr': 0.00019917590210035715, 'samples': 1415232, 'steps': 2764, 'loss/train': 2.50180721282959} -09/21/2021 00:04:03 - INFO - __main__ - Step 44227: {'lr': 0.00019917590210035715, 'samples': 1415264, 'steps': 2764, 'loss/train': 2.4027862548828125} -09/21/2021 00:04:04 - INFO - __main__ - Step 44228: {'lr': 0.00019917590210035715, 'samples': 1415296, 'steps': 2764, 'loss/train': 2.180094003677368} -09/21/2021 00:04:05 - INFO - __main__ - Step 44229: {'lr': 0.00019917590210035715, 'samples': 1415328, 'steps': 2764, 'loss/train': 2.2917206287384033} -09/21/2021 00:04:06 - INFO - __main__ - Step 44230: {'lr': 0.00019917590210035715, 'samples': 1415360, 'steps': 2764, 'loss/train': 2.0346012115478516} -09/21/2021 00:04:06 - INFO - __main__ - Step 44231: {'lr': 0.00019917590210035715, 'samples': 1415392, 'steps': 2764, 'loss/train': 1.9480416774749756} -09/21/2021 00:04:07 - INFO - __main__ - Step 44232: {'lr': 0.00019917590210035715, 'samples': 1415424, 'steps': 2764, 'loss/train': 2.6234912872314453} -09/21/2021 00:04:08 - INFO - __main__ - Step 44233: {'lr': 0.00019917590210035715, 'samples': 1415456, 'steps': 2764, 'loss/train': 2.8617331981658936} -09/21/2021 00:04:09 - INFO - __main__ - Step 44234: {'lr': 0.00019917590210035715, 'samples': 1415488, 'steps': 2764, 'loss/train': 2.26452898979187} -09/21/2021 00:04:09 - INFO - __main__ - Step 44235: {'lr': 0.00019917590210035715, 'samples': 1415520, 'steps': 2764, 'loss/train': 1.1343344449996948} -09/21/2021 00:04:10 - INFO - __main__ - Step 44236: {'lr': 0.00019917590210035715, 'samples': 1415552, 'steps': 2764, 'loss/train': 1.1804568767547607} -09/21/2021 00:04:11 - INFO - __main__ - Step 44237: {'lr': 0.00019917590210035715, 'samples': 1415584, 'steps': 2764, 'loss/train': 2.721665620803833} -09/21/2021 00:04:12 - INFO - __main__ - Step 44238: {'lr': 0.00019917590210035715, 'samples': 1415616, 'steps': 2764, 'loss/train': 2.0360941886901855} -09/21/2021 00:04:12 - INFO - __main__ - Step 44239: {'lr': 0.00019917590210035715, 'samples': 1415648, 'steps': 2764, 'loss/train': 2.042262554168701} -09/21/2021 00:04:13 - INFO - __main__ - Step 44240: {'lr': 0.00019917590210035715, 'samples': 1415680, 'steps': 2764, 'loss/train': 2.678889751434326} -09/21/2021 00:04:14 - INFO - __main__ - Step 44241: {'lr': 0.00019917508465515447, 'samples': 1415712, 'steps': 2765, 'loss/train': 1.955530047416687} -09/21/2021 00:04:15 - INFO - __main__ - Step 44242: {'lr': 0.00019917508465515447, 'samples': 1415744, 'steps': 2765, 'loss/train': 1.0533159971237183} -09/21/2021 00:04:15 - INFO - __main__ - Step 44243: {'lr': 0.00019917508465515447, 'samples': 1415776, 'steps': 2765, 'loss/train': 1.8978159427642822} -09/21/2021 00:04:17 - INFO - __main__ - Step 44244: {'lr': 0.00019917508465515447, 'samples': 1415808, 'steps': 2765, 'loss/train': 1.2381290197372437} -09/21/2021 00:04:17 - INFO - __main__ - Step 44245: {'lr': 0.00019917508465515447, 'samples': 1415840, 'steps': 2765, 'loss/train': 2.1569762229919434} -09/21/2021 00:04:18 - INFO - __main__ - Step 44246: {'lr': 0.00019917508465515447, 'samples': 1415872, 'steps': 2765, 'loss/train': 1.8118603229522705} -09/21/2021 00:04:19 - INFO - __main__ - Step 44247: {'lr': 0.00019917508465515447, 'samples': 1415904, 'steps': 2765, 'loss/train': 1.579803228378296} -09/21/2021 00:04:20 - INFO - __main__ - Step 44248: {'lr': 0.00019917508465515447, 'samples': 1415936, 'steps': 2765, 'loss/train': 2.264402389526367} -09/21/2021 00:04:20 - INFO - __main__ - Step 44249: {'lr': 0.00019917508465515447, 'samples': 1415968, 'steps': 2765, 'loss/train': 1.779167890548706} -09/21/2021 00:04:21 - INFO - __main__ - Step 44250: {'lr': 0.00019917508465515447, 'samples': 1416000, 'steps': 2765, 'loss/train': 1.692546010017395} -09/21/2021 00:04:22 - INFO - __main__ - Step 44251: {'lr': 0.00019917508465515447, 'samples': 1416032, 'steps': 2765, 'loss/train': 3.15470290184021} -09/21/2021 00:04:23 - INFO - __main__ - Step 44252: {'lr': 0.00019917508465515447, 'samples': 1416064, 'steps': 2765, 'loss/train': 2.905134439468384} -09/21/2021 00:04:23 - INFO - __main__ - Step 44253: {'lr': 0.00019917508465515447, 'samples': 1416096, 'steps': 2765, 'loss/train': 2.0066816806793213} -09/21/2021 00:04:24 - INFO - __main__ - Step 44254: {'lr': 0.00019917508465515447, 'samples': 1416128, 'steps': 2765, 'loss/train': 1.8665292263031006} -09/21/2021 00:04:25 - INFO - __main__ - Step 44255: {'lr': 0.00019917508465515447, 'samples': 1416160, 'steps': 2765, 'loss/train': 1.3930081129074097} -09/21/2021 00:04:26 - INFO - __main__ - Step 44256: {'lr': 0.00019917508465515447, 'samples': 1416192, 'steps': 2765, 'loss/train': 1.9537888765335083} -09/21/2021 00:04:27 - INFO - __main__ - Step 44257: {'lr': 0.00019917426680640877, 'samples': 1416224, 'steps': 2766, 'loss/train': 2.537102699279785} -09/21/2021 00:04:27 - INFO - __main__ - Step 44258: {'lr': 0.00019917426680640877, 'samples': 1416256, 'steps': 2766, 'loss/train': 2.6344661712646484} -09/21/2021 00:04:28 - INFO - __main__ - Step 44259: {'lr': 0.00019917426680640877, 'samples': 1416288, 'steps': 2766, 'loss/train': 1.5329703092575073} -09/21/2021 00:04:29 - INFO - __main__ - Step 44260: {'lr': 0.00019917426680640877, 'samples': 1416320, 'steps': 2766, 'loss/train': 2.264181137084961} -09/21/2021 00:04:30 - INFO - __main__ - Step 44261: {'lr': 0.00019917426680640877, 'samples': 1416352, 'steps': 2766, 'loss/train': 1.768984079360962} -09/21/2021 00:04:30 - INFO - __main__ - Step 44262: {'lr': 0.00019917426680640877, 'samples': 1416384, 'steps': 2766, 'loss/train': 1.22559654712677} -09/21/2021 00:04:31 - INFO - __main__ - Step 44263: {'lr': 0.00019917426680640877, 'samples': 1416416, 'steps': 2766, 'loss/train': 2.982140064239502} -09/21/2021 00:04:32 - INFO - __main__ - Step 44264: {'lr': 0.00019917426680640877, 'samples': 1416448, 'steps': 2766, 'loss/train': 1.627711296081543} -09/21/2021 00:04:33 - INFO - __main__ - Step 44265: {'lr': 0.00019917426680640877, 'samples': 1416480, 'steps': 2766, 'loss/train': 2.3371710777282715} -09/21/2021 00:04:33 - INFO - __main__ - Step 44266: {'lr': 0.00019917426680640877, 'samples': 1416512, 'steps': 2766, 'loss/train': 1.9325352907180786} -09/21/2021 00:04:34 - INFO - __main__ - Step 44267: {'lr': 0.00019917426680640877, 'samples': 1416544, 'steps': 2766, 'loss/train': 2.978006362915039} -09/21/2021 00:04:35 - INFO - __main__ - Step 44268: {'lr': 0.00019917426680640877, 'samples': 1416576, 'steps': 2766, 'loss/train': 1.6736047267913818} -09/21/2021 00:04:36 - INFO - __main__ - Step 44269: {'lr': 0.00019917426680640877, 'samples': 1416608, 'steps': 2766, 'loss/train': 1.8184834718704224} -09/21/2021 00:04:36 - INFO - __main__ - Step 44270: {'lr': 0.00019917426680640877, 'samples': 1416640, 'steps': 2766, 'loss/train': 1.9969180822372437} -09/21/2021 00:04:37 - INFO - __main__ - Step 44271: {'lr': 0.00019917426680640877, 'samples': 1416672, 'steps': 2766, 'loss/train': 2.0365846157073975} -09/21/2021 00:04:38 - INFO - __main__ - Step 44272: {'lr': 0.00019917426680640877, 'samples': 1416704, 'steps': 2766, 'loss/train': 1.9099904298782349} -09/21/2021 00:04:39 - INFO - __main__ - Step 44273: {'lr': 0.00019917344855412331, 'samples': 1416736, 'steps': 2767, 'loss/train': 2.222419023513794} -09/21/2021 00:04:39 - INFO - __main__ - Step 44274: {'lr': 0.00019917344855412331, 'samples': 1416768, 'steps': 2767, 'loss/train': 1.6534024477005005} -09/21/2021 00:04:40 - INFO - __main__ - Step 44275: {'lr': 0.00019917344855412331, 'samples': 1416800, 'steps': 2767, 'loss/train': 1.3061884641647339} -09/21/2021 00:04:41 - INFO - __main__ - Step 44276: {'lr': 0.00019917344855412331, 'samples': 1416832, 'steps': 2767, 'loss/train': 2.557262659072876} -09/21/2021 00:04:42 - INFO - __main__ - Step 44277: {'lr': 0.00019917344855412331, 'samples': 1416864, 'steps': 2767, 'loss/train': 2.3616268634796143} -09/21/2021 00:04:43 - INFO - __main__ - Step 44278: {'lr': 0.00019917344855412331, 'samples': 1416896, 'steps': 2767, 'loss/train': 1.5377395153045654} -09/21/2021 00:04:44 - INFO - __main__ - Step 44279: {'lr': 0.00019917344855412331, 'samples': 1416928, 'steps': 2767, 'loss/train': 2.88629412651062} -09/21/2021 00:04:44 - INFO - __main__ - Step 44280: {'lr': 0.00019917344855412331, 'samples': 1416960, 'steps': 2767, 'loss/train': 1.616791844367981} -09/21/2021 00:04:45 - INFO - __main__ - Step 44281: {'lr': 0.00019917344855412331, 'samples': 1416992, 'steps': 2767, 'loss/train': 2.0385658740997314} -09/21/2021 00:04:46 - INFO - __main__ - Step 44282: {'lr': 0.00019917344855412331, 'samples': 1417024, 'steps': 2767, 'loss/train': 2.338487386703491} -09/21/2021 00:04:47 - INFO - __main__ - Step 44283: {'lr': 0.00019917344855412331, 'samples': 1417056, 'steps': 2767, 'loss/train': 2.435438394546509} -09/21/2021 00:04:47 - INFO - __main__ - Step 44284: {'lr': 0.00019917344855412331, 'samples': 1417088, 'steps': 2767, 'loss/train': 2.489671230316162} -09/21/2021 00:04:48 - INFO - __main__ - Step 44285: {'lr': 0.00019917344855412331, 'samples': 1417120, 'steps': 2767, 'loss/train': 2.6231391429901123} -09/21/2021 00:04:49 - INFO - __main__ - Step 44286: {'lr': 0.00019917344855412331, 'samples': 1417152, 'steps': 2767, 'loss/train': 1.7843371629714966} -09/21/2021 00:04:50 - INFO - __main__ - Step 44287: {'lr': 0.00019917344855412331, 'samples': 1417184, 'steps': 2767, 'loss/train': 2.4225473403930664} -09/21/2021 00:04:50 - INFO - __main__ - Step 44288: {'lr': 0.00019917344855412331, 'samples': 1417216, 'steps': 2767, 'loss/train': 2.0986721515655518} -09/21/2021 00:04:51 - INFO - __main__ - Step 44289: {'lr': 0.00019917262989830152, 'samples': 1417248, 'steps': 2768, 'loss/train': 1.6700350046157837} -09/21/2021 00:04:52 - INFO - __main__ - Step 44290: {'lr': 0.00019917262989830152, 'samples': 1417280, 'steps': 2768, 'loss/train': 1.4866611957550049} -09/21/2021 00:04:53 - INFO - __main__ - Step 44291: {'lr': 0.00019917262989830152, 'samples': 1417312, 'steps': 2768, 'loss/train': 2.051218271255493} -09/21/2021 00:04:54 - INFO - __main__ - Step 44292: {'lr': 0.00019917262989830152, 'samples': 1417344, 'steps': 2768, 'loss/train': 1.9813787937164307} -09/21/2021 00:04:54 - INFO - __main__ - Step 44293: {'lr': 0.00019917262989830152, 'samples': 1417376, 'steps': 2768, 'loss/train': 2.239060163497925} -09/21/2021 00:04:55 - INFO - __main__ - Step 44294: {'lr': 0.00019917262989830152, 'samples': 1417408, 'steps': 2768, 'loss/train': 1.0021343231201172} -09/21/2021 00:04:56 - INFO - __main__ - Step 44295: {'lr': 0.00019917262989830152, 'samples': 1417440, 'steps': 2768, 'loss/train': 2.3722307682037354} -09/21/2021 00:04:57 - INFO - __main__ - Step 44296: {'lr': 0.00019917262989830152, 'samples': 1417472, 'steps': 2768, 'loss/train': 2.2314140796661377} -09/21/2021 00:04:57 - INFO - __main__ - Step 44297: {'lr': 0.00019917262989830152, 'samples': 1417504, 'steps': 2768, 'loss/train': 1.9769484996795654} -09/21/2021 00:04:58 - INFO - __main__ - Step 44298: {'lr': 0.00019917262989830152, 'samples': 1417536, 'steps': 2768, 'loss/train': 2.3507089614868164} -09/21/2021 00:04:59 - INFO - __main__ - Step 44299: {'lr': 0.00019917262989830152, 'samples': 1417568, 'steps': 2768, 'loss/train': 2.7416067123413086} -09/21/2021 00:05:00 - INFO - __main__ - Step 44300: {'lr': 0.00019917262989830152, 'samples': 1417600, 'steps': 2768, 'loss/train': 2.4291927814483643} -09/21/2021 00:05:00 - INFO - __main__ - Step 44301: {'lr': 0.00019917262989830152, 'samples': 1417632, 'steps': 2768, 'loss/train': 1.0342073440551758} -09/21/2021 00:05:01 - INFO - __main__ - Step 44302: {'lr': 0.00019917262989830152, 'samples': 1417664, 'steps': 2768, 'loss/train': 2.324907064437866} -09/21/2021 00:05:02 - INFO - __main__ - Step 44303: {'lr': 0.00019917262989830152, 'samples': 1417696, 'steps': 2768, 'loss/train': 1.544111728668213} -09/21/2021 00:05:03 - INFO - __main__ - Step 44304: {'lr': 0.00019917262989830152, 'samples': 1417728, 'steps': 2768, 'loss/train': 1.7211589813232422} -09/21/2021 00:05:03 - INFO - __main__ - Step 44305: {'lr': 0.00019917181083894665, 'samples': 1417760, 'steps': 2769, 'loss/train': 1.550541639328003} -09/21/2021 00:05:05 - INFO - __main__ - Step 44306: {'lr': 0.00019917181083894665, 'samples': 1417792, 'steps': 2769, 'loss/train': 1.9605556726455688} -09/21/2021 00:05:05 - INFO - __main__ - Step 44307: {'lr': 0.00019917181083894665, 'samples': 1417824, 'steps': 2769, 'loss/train': 2.3727610111236572} -09/21/2021 00:05:06 - INFO - __main__ - Step 44308: {'lr': 0.00019917181083894665, 'samples': 1417856, 'steps': 2769, 'loss/train': 1.8893145322799683} -09/21/2021 00:05:07 - INFO - __main__ - Step 44309: {'lr': 0.00019917181083894665, 'samples': 1417888, 'steps': 2769, 'loss/train': 1.1334822177886963} -09/21/2021 00:05:08 - INFO - __main__ - Step 44310: {'lr': 0.00019917181083894665, 'samples': 1417920, 'steps': 2769, 'loss/train': 2.079317808151245} -09/21/2021 00:05:08 - INFO - __main__ - Step 44311: {'lr': 0.00019917181083894665, 'samples': 1417952, 'steps': 2769, 'loss/train': 2.521451234817505} -09/21/2021 00:05:09 - INFO - __main__ - Step 44312: {'lr': 0.00019917181083894665, 'samples': 1417984, 'steps': 2769, 'loss/train': 1.8813813924789429} -09/21/2021 00:05:10 - INFO - __main__ - Step 44313: {'lr': 0.00019917181083894665, 'samples': 1418016, 'steps': 2769, 'loss/train': 2.486908197402954} -09/21/2021 00:05:11 - INFO - __main__ - Step 44314: {'lr': 0.00019917181083894665, 'samples': 1418048, 'steps': 2769, 'loss/train': 2.1948306560516357} -09/21/2021 00:05:11 - INFO - __main__ - Step 44315: {'lr': 0.00019917181083894665, 'samples': 1418080, 'steps': 2769, 'loss/train': 2.1975746154785156} -09/21/2021 00:05:12 - INFO - __main__ - Step 44316: {'lr': 0.00019917181083894665, 'samples': 1418112, 'steps': 2769, 'loss/train': 2.4143455028533936} -09/21/2021 00:05:13 - INFO - __main__ - Step 44317: {'lr': 0.00019917181083894665, 'samples': 1418144, 'steps': 2769, 'loss/train': 2.1000070571899414} -09/21/2021 00:05:14 - INFO - __main__ - Step 44318: {'lr': 0.00019917181083894665, 'samples': 1418176, 'steps': 2769, 'loss/train': 2.6120448112487793} -09/21/2021 00:05:14 - INFO - __main__ - Step 44319: {'lr': 0.00019917181083894665, 'samples': 1418208, 'steps': 2769, 'loss/train': 1.3443729877471924} -09/21/2021 00:05:15 - INFO - __main__ - Step 44320: {'lr': 0.00019917181083894665, 'samples': 1418240, 'steps': 2769, 'loss/train': 2.2663803100585938} -09/21/2021 00:05:16 - INFO - __main__ - Step 44321: {'lr': 0.00019917099137606209, 'samples': 1418272, 'steps': 2770, 'loss/train': 2.276604652404785} -09/21/2021 00:05:17 - INFO - __main__ - Step 44322: {'lr': 0.00019917099137606209, 'samples': 1418304, 'steps': 2770, 'loss/train': 0.29543623328208923} -09/21/2021 00:05:18 - INFO - __main__ - Step 44323: {'lr': 0.00019917099137606209, 'samples': 1418336, 'steps': 2770, 'loss/train': 2.654874563217163} -09/21/2021 00:05:18 - INFO - __main__ - Step 44324: {'lr': 0.00019917099137606209, 'samples': 1418368, 'steps': 2770, 'loss/train': 1.7959645986557007} -09/21/2021 00:05:19 - INFO - __main__ - Step 44325: {'lr': 0.00019917099137606209, 'samples': 1418400, 'steps': 2770, 'loss/train': 1.5491385459899902} -09/21/2021 00:05:20 - INFO - __main__ - Step 44326: {'lr': 0.00019917099137606209, 'samples': 1418432, 'steps': 2770, 'loss/train': 2.0121350288391113} -09/21/2021 00:05:21 - INFO - __main__ - Step 44327: {'lr': 0.00019917099137606209, 'samples': 1418464, 'steps': 2770, 'loss/train': 1.7318106889724731} -09/21/2021 00:05:21 - INFO - __main__ - Step 44328: {'lr': 0.00019917099137606209, 'samples': 1418496, 'steps': 2770, 'loss/train': 1.5947260856628418} -09/21/2021 00:05:22 - INFO - __main__ - Step 44329: {'lr': 0.00019917099137606209, 'samples': 1418528, 'steps': 2770, 'loss/train': 1.7651631832122803} -09/21/2021 00:05:23 - INFO - __main__ - Step 44330: {'lr': 0.00019917099137606209, 'samples': 1418560, 'steps': 2770, 'loss/train': 2.0057992935180664} -09/21/2021 00:05:24 - INFO - __main__ - Step 44331: {'lr': 0.00019917099137606209, 'samples': 1418592, 'steps': 2770, 'loss/train': 1.025359869003296} -09/21/2021 00:05:24 - INFO - __main__ - Step 44332: {'lr': 0.00019917099137606209, 'samples': 1418624, 'steps': 2770, 'loss/train': 2.256711483001709} -09/21/2021 00:05:25 - INFO - __main__ - Step 44333: {'lr': 0.00019917099137606209, 'samples': 1418656, 'steps': 2770, 'loss/train': 1.9319580793380737} -09/21/2021 00:05:26 - INFO - __main__ - Step 44334: {'lr': 0.00019917099137606209, 'samples': 1418688, 'steps': 2770, 'loss/train': 1.7582650184631348} -09/21/2021 00:05:27 - INFO - __main__ - Step 44335: {'lr': 0.00019917099137606209, 'samples': 1418720, 'steps': 2770, 'loss/train': 1.2394527196884155} -09/21/2021 00:05:27 - INFO - __main__ - Step 44336: {'lr': 0.00019917099137606209, 'samples': 1418752, 'steps': 2770, 'loss/train': 0.3943954110145569} -09/21/2021 00:05:29 - INFO - __main__ - Step 44337: {'lr': 0.00019917017150965113, 'samples': 1418784, 'steps': 2771, 'loss/train': 2.6392226219177246} -09/21/2021 00:05:30 - INFO - __main__ - Step 44338: {'lr': 0.00019917017150965113, 'samples': 1418816, 'steps': 2771, 'loss/train': 1.755894422531128} -09/21/2021 00:05:30 - INFO - __main__ - Step 44339: {'lr': 0.00019917017150965113, 'samples': 1418848, 'steps': 2771, 'loss/train': 2.1495652198791504} -09/21/2021 00:05:31 - INFO - __main__ - Step 44340: {'lr': 0.00019917017150965113, 'samples': 1418880, 'steps': 2771, 'loss/train': 0.48115184903144836} -09/21/2021 00:05:32 - INFO - __main__ - Step 44341: {'lr': 0.00019917017150965113, 'samples': 1418912, 'steps': 2771, 'loss/train': 2.2297921180725098} -09/21/2021 00:05:33 - INFO - __main__ - Step 44342: {'lr': 0.00019917017150965113, 'samples': 1418944, 'steps': 2771, 'loss/train': 1.5777822732925415} -09/21/2021 00:05:33 - INFO - __main__ - Step 44343: {'lr': 0.00019917017150965113, 'samples': 1418976, 'steps': 2771, 'loss/train': 2.383044481277466} -09/21/2021 00:05:34 - INFO - __main__ - Step 44344: {'lr': 0.00019917017150965113, 'samples': 1419008, 'steps': 2771, 'loss/train': 2.81559681892395} -09/21/2021 00:05:35 - INFO - __main__ - Step 44345: {'lr': 0.00019917017150965113, 'samples': 1419040, 'steps': 2771, 'loss/train': 2.497669219970703} -09/21/2021 00:05:36 - INFO - __main__ - Step 44346: {'lr': 0.00019917017150965113, 'samples': 1419072, 'steps': 2771, 'loss/train': 1.7125836610794067} -09/21/2021 00:05:36 - INFO - __main__ - Step 44347: {'lr': 0.00019917017150965113, 'samples': 1419104, 'steps': 2771, 'loss/train': 3.2972137928009033} -09/21/2021 00:05:37 - INFO - __main__ - Step 44348: {'lr': 0.00019917017150965113, 'samples': 1419136, 'steps': 2771, 'loss/train': 2.7121450901031494} -09/21/2021 00:05:38 - INFO - __main__ - Step 44349: {'lr': 0.00019917017150965113, 'samples': 1419168, 'steps': 2771, 'loss/train': 2.1994056701660156} -09/21/2021 00:05:39 - INFO - __main__ - Step 44350: {'lr': 0.00019917017150965113, 'samples': 1419200, 'steps': 2771, 'loss/train': 2.3055005073547363} -09/21/2021 00:05:39 - INFO - __main__ - Step 44351: {'lr': 0.00019917017150965113, 'samples': 1419232, 'steps': 2771, 'loss/train': 1.5519497394561768} -09/21/2021 00:05:40 - INFO - __main__ - Step 44352: {'lr': 0.00019917017150965113, 'samples': 1419264, 'steps': 2771, 'loss/train': 1.8444080352783203} -09/21/2021 00:05:41 - INFO - __main__ - Step 44353: {'lr': 0.00019916935123971715, 'samples': 1419296, 'steps': 2772, 'loss/train': 2.8400516510009766} -09/21/2021 00:05:42 - INFO - __main__ - Step 44354: {'lr': 0.00019916935123971715, 'samples': 1419328, 'steps': 2772, 'loss/train': 2.0075109004974365} -09/21/2021 00:05:43 - INFO - __main__ - Step 44355: {'lr': 0.00019916935123971715, 'samples': 1419360, 'steps': 2772, 'loss/train': 2.64180064201355} -09/21/2021 00:05:43 - INFO - __main__ - Step 44356: {'lr': 0.00019916935123971715, 'samples': 1419392, 'steps': 2772, 'loss/train': 2.504112720489502} -09/21/2021 00:05:44 - INFO - __main__ - Step 44357: {'lr': 0.00019916935123971715, 'samples': 1419424, 'steps': 2772, 'loss/train': 2.1819493770599365} -09/21/2021 00:05:45 - INFO - __main__ - Step 44358: {'lr': 0.00019916935123971715, 'samples': 1419456, 'steps': 2772, 'loss/train': 1.6301512718200684} -09/21/2021 00:05:46 - INFO - __main__ - Step 44359: {'lr': 0.00019916935123971715, 'samples': 1419488, 'steps': 2772, 'loss/train': 1.366368293762207} -09/21/2021 00:05:46 - INFO - __main__ - Step 44360: {'lr': 0.00019916935123971715, 'samples': 1419520, 'steps': 2772, 'loss/train': 1.725081443786621} -09/21/2021 00:05:47 - INFO - __main__ - Step 44361: {'lr': 0.00019916935123971715, 'samples': 1419552, 'steps': 2772, 'loss/train': 2.1709892749786377} -09/21/2021 00:05:48 - INFO - __main__ - Step 44362: {'lr': 0.00019916935123971715, 'samples': 1419584, 'steps': 2772, 'loss/train': 2.4370269775390625} -09/21/2021 00:05:49 - INFO - __main__ - Step 44363: {'lr': 0.00019916935123971715, 'samples': 1419616, 'steps': 2772, 'loss/train': 1.8839428424835205} -09/21/2021 00:05:49 - INFO - __main__ - Step 44364: {'lr': 0.00019916935123971715, 'samples': 1419648, 'steps': 2772, 'loss/train': 2.273627281188965} -09/21/2021 00:05:50 - INFO - __main__ - Step 44365: {'lr': 0.00019916935123971715, 'samples': 1419680, 'steps': 2772, 'loss/train': 2.3580265045166016} -09/21/2021 00:05:51 - INFO - __main__ - Step 44366: {'lr': 0.00019916935123971715, 'samples': 1419712, 'steps': 2772, 'loss/train': 1.8176994323730469} -09/21/2021 00:05:52 - INFO - __main__ - Step 44367: {'lr': 0.00019916935123971715, 'samples': 1419744, 'steps': 2772, 'loss/train': 2.3604044914245605} -09/21/2021 00:05:53 - INFO - __main__ - Step 44368: {'lr': 0.00019916935123971715, 'samples': 1419776, 'steps': 2772, 'loss/train': 1.227855920791626} -09/21/2021 00:05:54 - INFO - __main__ - Step 44369: {'lr': 0.00019916853056626348, 'samples': 1419808, 'steps': 2773, 'loss/train': 1.8845902681350708} -09/21/2021 00:05:54 - INFO - __main__ - Step 44370: {'lr': 0.00019916853056626348, 'samples': 1419840, 'steps': 2773, 'loss/train': 1.5909706354141235} -09/21/2021 00:05:55 - INFO - __main__ - Step 44371: {'lr': 0.00019916853056626348, 'samples': 1419872, 'steps': 2773, 'loss/train': 1.0024417638778687} -09/21/2021 00:05:56 - INFO - __main__ - Step 44372: {'lr': 0.00019916853056626348, 'samples': 1419904, 'steps': 2773, 'loss/train': 1.6987249851226807} -09/21/2021 00:05:57 - INFO - __main__ - Step 44373: {'lr': 0.00019916853056626348, 'samples': 1419936, 'steps': 2773, 'loss/train': 2.576850175857544} -09/21/2021 00:05:57 - INFO - __main__ - Step 44374: {'lr': 0.00019916853056626348, 'samples': 1419968, 'steps': 2773, 'loss/train': 2.050196647644043} -09/21/2021 00:05:58 - INFO - __main__ - Step 44375: {'lr': 0.00019916853056626348, 'samples': 1420000, 'steps': 2773, 'loss/train': 1.3479706048965454} -09/21/2021 00:05:59 - INFO - __main__ - Step 44376: {'lr': 0.00019916853056626348, 'samples': 1420032, 'steps': 2773, 'loss/train': 1.616263747215271} -09/21/2021 00:06:00 - INFO - __main__ - Step 44377: {'lr': 0.00019916853056626348, 'samples': 1420064, 'steps': 2773, 'loss/train': 2.026386260986328} -09/21/2021 00:06:00 - INFO - __main__ - Step 44378: {'lr': 0.00019916853056626348, 'samples': 1420096, 'steps': 2773, 'loss/train': 2.344764232635498} -09/21/2021 00:06:01 - INFO - __main__ - Step 44379: {'lr': 0.00019916853056626348, 'samples': 1420128, 'steps': 2773, 'loss/train': 2.307175874710083} -09/21/2021 00:06:02 - INFO - __main__ - Step 44380: {'lr': 0.00019916853056626348, 'samples': 1420160, 'steps': 2773, 'loss/train': 2.261352062225342} -09/21/2021 00:06:03 - INFO - __main__ - Step 44381: {'lr': 0.00019916853056626348, 'samples': 1420192, 'steps': 2773, 'loss/train': 2.069242000579834} -09/21/2021 00:06:03 - INFO - __main__ - Step 44382: {'lr': 0.00019916853056626348, 'samples': 1420224, 'steps': 2773, 'loss/train': 2.3567843437194824} -09/21/2021 00:06:04 - INFO - __main__ - Step 44383: {'lr': 0.00019916853056626348, 'samples': 1420256, 'steps': 2773, 'loss/train': 1.7874048948287964} -09/21/2021 00:06:05 - INFO - __main__ - Step 44384: {'lr': 0.00019916853056626348, 'samples': 1420288, 'steps': 2773, 'loss/train': 1.975183129310608} -09/21/2021 00:06:06 - INFO - __main__ - Step 44385: {'lr': 0.00019916770948929342, 'samples': 1420320, 'steps': 2774, 'loss/train': 2.576484203338623} -09/21/2021 00:06:07 - INFO - __main__ - Step 44386: {'lr': 0.00019916770948929342, 'samples': 1420352, 'steps': 2774, 'loss/train': 2.3107588291168213} -09/21/2021 00:06:07 - INFO - __main__ - Step 44387: {'lr': 0.00019916770948929342, 'samples': 1420384, 'steps': 2774, 'loss/train': 1.993969440460205} -09/21/2021 00:06:08 - INFO - __main__ - Step 44388: {'lr': 0.00019916770948929342, 'samples': 1420416, 'steps': 2774, 'loss/train': 2.7203660011291504} -09/21/2021 00:06:09 - INFO - __main__ - Step 44389: {'lr': 0.00019916770948929342, 'samples': 1420448, 'steps': 2774, 'loss/train': 1.6333167552947998} -09/21/2021 00:06:10 - INFO - __main__ - Step 44390: {'lr': 0.00019916770948929342, 'samples': 1420480, 'steps': 2774, 'loss/train': 2.9571895599365234} -09/21/2021 00:06:10 - INFO - __main__ - Step 44391: {'lr': 0.00019916770948929342, 'samples': 1420512, 'steps': 2774, 'loss/train': 1.4628729820251465} -09/21/2021 00:06:11 - INFO - __main__ - Step 44392: {'lr': 0.00019916770948929342, 'samples': 1420544, 'steps': 2774, 'loss/train': 1.9848216772079468} -09/21/2021 00:06:12 - INFO - __main__ - Step 44393: {'lr': 0.00019916770948929342, 'samples': 1420576, 'steps': 2774, 'loss/train': 1.1039659976959229} -09/21/2021 00:06:13 - INFO - __main__ - Step 44394: {'lr': 0.00019916770948929342, 'samples': 1420608, 'steps': 2774, 'loss/train': 1.9959938526153564} -09/21/2021 00:06:13 - INFO - __main__ - Step 44395: {'lr': 0.00019916770948929342, 'samples': 1420640, 'steps': 2774, 'loss/train': 1.8216222524642944} -09/21/2021 00:06:15 - INFO - __main__ - Step 44396: {'lr': 0.00019916770948929342, 'samples': 1420672, 'steps': 2774, 'loss/train': 2.3223319053649902} -09/21/2021 00:06:15 - INFO - __main__ - Step 44397: {'lr': 0.00019916770948929342, 'samples': 1420704, 'steps': 2774, 'loss/train': 2.1521975994110107} -09/21/2021 00:06:16 - INFO - __main__ - Step 44398: {'lr': 0.00019916770948929342, 'samples': 1420736, 'steps': 2774, 'loss/train': 1.8090519905090332} -09/21/2021 00:06:17 - INFO - __main__ - Step 44399: {'lr': 0.00019916770948929342, 'samples': 1420768, 'steps': 2774, 'loss/train': 1.9071236848831177} -09/21/2021 00:06:18 - INFO - __main__ - Step 44400: {'lr': 0.00019916770948929342, 'samples': 1420800, 'steps': 2774, 'loss/train': 2.693276882171631} -09/21/2021 00:06:18 - INFO - __main__ - Step 44401: {'lr': 0.0001991668880088103, 'samples': 1420832, 'steps': 2775, 'loss/train': 1.6343982219696045} -09/21/2021 00:06:19 - INFO - __main__ - Step 44402: {'lr': 0.0001991668880088103, 'samples': 1420864, 'steps': 2775, 'loss/train': 2.0623221397399902} -09/21/2021 00:06:20 - INFO - __main__ - Step 44403: {'lr': 0.0001991668880088103, 'samples': 1420896, 'steps': 2775, 'loss/train': 0.5249242186546326} -09/21/2021 00:06:21 - INFO - __main__ - Step 44404: {'lr': 0.0001991668880088103, 'samples': 1420928, 'steps': 2775, 'loss/train': 1.777381420135498} -09/21/2021 00:06:21 - INFO - __main__ - Step 44405: {'lr': 0.0001991668880088103, 'samples': 1420960, 'steps': 2775, 'loss/train': 2.0598485469818115} -09/21/2021 00:06:22 - INFO - __main__ - Step 44406: {'lr': 0.0001991668880088103, 'samples': 1420992, 'steps': 2775, 'loss/train': 2.466765880584717} -09/21/2021 00:06:23 - INFO - __main__ - Step 44407: {'lr': 0.0001991668880088103, 'samples': 1421024, 'steps': 2775, 'loss/train': 2.50077748298645} -09/21/2021 00:06:24 - INFO - __main__ - Step 44408: {'lr': 0.0001991668880088103, 'samples': 1421056, 'steps': 2775, 'loss/train': 2.378955125808716} -09/21/2021 00:06:24 - INFO - __main__ - Step 44409: {'lr': 0.0001991668880088103, 'samples': 1421088, 'steps': 2775, 'loss/train': 1.7315107583999634} -09/21/2021 00:06:25 - INFO - __main__ - Step 44410: {'lr': 0.0001991668880088103, 'samples': 1421120, 'steps': 2775, 'loss/train': 1.7813527584075928} -09/21/2021 00:06:26 - INFO - __main__ - Step 44411: {'lr': 0.0001991668880088103, 'samples': 1421152, 'steps': 2775, 'loss/train': 2.0605149269104004} -09/21/2021 00:06:27 - INFO - __main__ - Step 44412: {'lr': 0.0001991668880088103, 'samples': 1421184, 'steps': 2775, 'loss/train': 2.4354686737060547} -09/21/2021 00:06:27 - INFO - __main__ - Step 44413: {'lr': 0.0001991668880088103, 'samples': 1421216, 'steps': 2775, 'loss/train': 2.1491801738739014} -09/21/2021 00:06:28 - INFO - __main__ - Step 44414: {'lr': 0.0001991668880088103, 'samples': 1421248, 'steps': 2775, 'loss/train': 1.7493212223052979} -09/21/2021 00:06:29 - INFO - __main__ - Step 44415: {'lr': 0.0001991668880088103, 'samples': 1421280, 'steps': 2775, 'loss/train': 2.3126003742218018} -09/21/2021 00:06:30 - INFO - __main__ - Step 44416: {'lr': 0.0001991668880088103, 'samples': 1421312, 'steps': 2775, 'loss/train': 2.581486940383911} -09/21/2021 00:06:31 - INFO - __main__ - Step 44417: {'lr': 0.00019916606612481753, 'samples': 1421344, 'steps': 2776, 'loss/train': 2.3135244846343994} -09/21/2021 00:06:31 - INFO - __main__ - Step 44418: {'lr': 0.00019916606612481753, 'samples': 1421376, 'steps': 2776, 'loss/train': 2.7242870330810547} -09/21/2021 00:06:32 - INFO - __main__ - Step 44419: {'lr': 0.00019916606612481753, 'samples': 1421408, 'steps': 2776, 'loss/train': 1.9619680643081665} -09/21/2021 00:06:33 - INFO - __main__ - Step 44420: {'lr': 0.00019916606612481753, 'samples': 1421440, 'steps': 2776, 'loss/train': 1.6835116147994995} -09/21/2021 00:06:34 - INFO - __main__ - Step 44421: {'lr': 0.00019916606612481753, 'samples': 1421472, 'steps': 2776, 'loss/train': 2.289928436279297} -09/21/2021 00:06:34 - INFO - __main__ - Step 44422: {'lr': 0.00019916606612481753, 'samples': 1421504, 'steps': 2776, 'loss/train': 2.4981422424316406} -09/21/2021 00:06:35 - INFO - __main__ - Step 44423: {'lr': 0.00019916606612481753, 'samples': 1421536, 'steps': 2776, 'loss/train': 2.6384668350219727} -09/21/2021 00:06:36 - INFO - __main__ - Step 44424: {'lr': 0.00019916606612481753, 'samples': 1421568, 'steps': 2776, 'loss/train': 2.0884671211242676} -09/21/2021 00:06:37 - INFO - __main__ - Step 44425: {'lr': 0.00019916606612481753, 'samples': 1421600, 'steps': 2776, 'loss/train': 2.059326410293579} -09/21/2021 00:06:37 - INFO - __main__ - Step 44426: {'lr': 0.00019916606612481753, 'samples': 1421632, 'steps': 2776, 'loss/train': 1.3999836444854736} -09/21/2021 00:06:39 - INFO - __main__ - Step 44427: {'lr': 0.00019916606612481753, 'samples': 1421664, 'steps': 2776, 'loss/train': 1.3186535835266113} -09/21/2021 00:06:39 - INFO - __main__ - Step 44428: {'lr': 0.00019916606612481753, 'samples': 1421696, 'steps': 2776, 'loss/train': 2.3392999172210693} -09/21/2021 00:06:40 - INFO - __main__ - Step 44429: {'lr': 0.00019916606612481753, 'samples': 1421728, 'steps': 2776, 'loss/train': 2.0632805824279785} -09/21/2021 00:06:41 - INFO - __main__ - Step 44430: {'lr': 0.00019916606612481753, 'samples': 1421760, 'steps': 2776, 'loss/train': 2.523829460144043} -09/21/2021 00:06:42 - INFO - __main__ - Step 44431: {'lr': 0.00019916606612481753, 'samples': 1421792, 'steps': 2776, 'loss/train': 1.9018034934997559} -09/21/2021 00:06:42 - INFO - __main__ - Step 44432: {'lr': 0.00019916606612481753, 'samples': 1421824, 'steps': 2776, 'loss/train': 1.7196768522262573} -09/21/2021 00:06:43 - INFO - __main__ - Step 44433: {'lr': 0.00019916524383731845, 'samples': 1421856, 'steps': 2777, 'loss/train': 2.0912554264068604} -09/21/2021 00:06:44 - INFO - __main__ - Step 44434: {'lr': 0.00019916524383731845, 'samples': 1421888, 'steps': 2777, 'loss/train': 0.6737768650054932} -09/21/2021 00:06:45 - INFO - __main__ - Step 44435: {'lr': 0.00019916524383731845, 'samples': 1421920, 'steps': 2777, 'loss/train': 2.080756664276123} -09/21/2021 00:06:45 - INFO - __main__ - Step 44436: {'lr': 0.00019916524383731845, 'samples': 1421952, 'steps': 2777, 'loss/train': 2.2497918605804443} -09/21/2021 00:06:46 - INFO - __main__ - Step 44437: {'lr': 0.00019916524383731845, 'samples': 1421984, 'steps': 2777, 'loss/train': 3.3816771507263184} -09/21/2021 00:06:47 - INFO - __main__ - Step 44438: {'lr': 0.00019916524383731845, 'samples': 1422016, 'steps': 2777, 'loss/train': 1.5307997465133667} -09/21/2021 00:06:48 - INFO - __main__ - Step 44439: {'lr': 0.00019916524383731845, 'samples': 1422048, 'steps': 2777, 'loss/train': 1.897485375404358} -09/21/2021 00:06:48 - INFO - __main__ - Step 44440: {'lr': 0.00019916524383731845, 'samples': 1422080, 'steps': 2777, 'loss/train': 1.79961359500885} -09/21/2021 00:06:49 - INFO - __main__ - Step 44441: {'lr': 0.00019916524383731845, 'samples': 1422112, 'steps': 2777, 'loss/train': 0.9023051261901855} -09/21/2021 00:06:50 - INFO - __main__ - Step 44442: {'lr': 0.00019916524383731845, 'samples': 1422144, 'steps': 2777, 'loss/train': 1.9553760290145874} -09/21/2021 00:06:51 - INFO - __main__ - Step 44443: {'lr': 0.00019916524383731845, 'samples': 1422176, 'steps': 2777, 'loss/train': 2.220625400543213} -09/21/2021 00:06:51 - INFO - __main__ - Step 44444: {'lr': 0.00019916524383731845, 'samples': 1422208, 'steps': 2777, 'loss/train': 2.2404584884643555} -09/21/2021 00:06:52 - INFO - __main__ - Step 44445: {'lr': 0.00019916524383731845, 'samples': 1422240, 'steps': 2777, 'loss/train': 1.3972270488739014} -09/21/2021 00:06:53 - INFO - __main__ - Step 44446: {'lr': 0.00019916524383731845, 'samples': 1422272, 'steps': 2777, 'loss/train': 1.5803213119506836} -09/21/2021 00:06:54 - INFO - __main__ - Step 44447: {'lr': 0.00019916524383731845, 'samples': 1422304, 'steps': 2777, 'loss/train': 1.893963098526001} -09/21/2021 00:06:54 - INFO - __main__ - Step 44448: {'lr': 0.00019916524383731845, 'samples': 1422336, 'steps': 2777, 'loss/train': 1.710233211517334} -09/21/2021 00:06:55 - INFO - __main__ - Step 44449: {'lr': 0.00019916442114631635, 'samples': 1422368, 'steps': 2778, 'loss/train': 1.501634955406189} -09/21/2021 00:06:56 - INFO - __main__ - Step 44450: {'lr': 0.00019916442114631635, 'samples': 1422400, 'steps': 2778, 'loss/train': 1.3179327249526978} -09/21/2021 00:06:57 - INFO - __main__ - Step 44451: {'lr': 0.00019916442114631635, 'samples': 1422432, 'steps': 2778, 'loss/train': 1.970985770225525} -09/21/2021 00:06:58 - INFO - __main__ - Step 44452: {'lr': 0.00019916442114631635, 'samples': 1422464, 'steps': 2778, 'loss/train': 1.5483051538467407} -09/21/2021 00:06:58 - INFO - __main__ - Step 44453: {'lr': 0.00019916442114631635, 'samples': 1422496, 'steps': 2778, 'loss/train': 2.0294137001037598} -09/21/2021 00:06:59 - INFO - __main__ - Step 44454: {'lr': 0.00019916442114631635, 'samples': 1422528, 'steps': 2778, 'loss/train': 1.849934697151184} -09/21/2021 00:07:00 - INFO - __main__ - Step 44455: {'lr': 0.00019916442114631635, 'samples': 1422560, 'steps': 2778, 'loss/train': 2.948495388031006} -09/21/2021 00:07:01 - INFO - __main__ - Step 44456: {'lr': 0.00019916442114631635, 'samples': 1422592, 'steps': 2778, 'loss/train': 1.4609698057174683} -09/21/2021 00:07:01 - INFO - __main__ - Step 44457: {'lr': 0.00019916442114631635, 'samples': 1422624, 'steps': 2778, 'loss/train': 2.559654951095581} -09/21/2021 00:07:02 - INFO - __main__ - Step 44458: {'lr': 0.00019916442114631635, 'samples': 1422656, 'steps': 2778, 'loss/train': 1.8453789949417114} -09/21/2021 00:07:03 - INFO - __main__ - Step 44459: {'lr': 0.00019916442114631635, 'samples': 1422688, 'steps': 2778, 'loss/train': 1.8705103397369385} -09/21/2021 00:07:04 - INFO - __main__ - Step 44460: {'lr': 0.00019916442114631635, 'samples': 1422720, 'steps': 2778, 'loss/train': 1.4484498500823975} -09/21/2021 00:07:05 - INFO - __main__ - Step 44461: {'lr': 0.00019916442114631635, 'samples': 1422752, 'steps': 2778, 'loss/train': 0.6821973323822021} -09/21/2021 00:07:06 - INFO - __main__ - Step 44462: {'lr': 0.00019916442114631635, 'samples': 1422784, 'steps': 2778, 'loss/train': 1.7789024114608765} -09/21/2021 00:07:06 - INFO - __main__ - Step 44463: {'lr': 0.00019916442114631635, 'samples': 1422816, 'steps': 2778, 'loss/train': 2.3633599281311035} -09/21/2021 00:07:07 - INFO - __main__ - Step 44464: {'lr': 0.00019916442114631635, 'samples': 1422848, 'steps': 2778, 'loss/train': 2.913738489151001} -09/21/2021 00:07:08 - INFO - __main__ - Step 44465: {'lr': 0.00019916359805181462, 'samples': 1422880, 'steps': 2779, 'loss/train': 2.7135210037231445} -09/21/2021 00:07:09 - INFO - __main__ - Step 44466: {'lr': 0.00019916359805181462, 'samples': 1422912, 'steps': 2779, 'loss/train': 2.0874106884002686} -09/21/2021 00:07:10 - INFO - __main__ - Step 44467: {'lr': 0.00019916359805181462, 'samples': 1422944, 'steps': 2779, 'loss/train': 2.1384036540985107} -09/21/2021 00:07:10 - INFO - __main__ - Step 44468: {'lr': 0.00019916359805181462, 'samples': 1422976, 'steps': 2779, 'loss/train': 2.294863700866699} -09/21/2021 00:07:11 - INFO - __main__ - Step 44469: {'lr': 0.00019916359805181462, 'samples': 1423008, 'steps': 2779, 'loss/train': 2.1142585277557373} -09/21/2021 00:07:12 - INFO - __main__ - Step 44470: {'lr': 0.00019916359805181462, 'samples': 1423040, 'steps': 2779, 'loss/train': 2.036358594894409} -09/21/2021 00:07:13 - INFO - __main__ - Step 44471: {'lr': 0.00019916359805181462, 'samples': 1423072, 'steps': 2779, 'loss/train': 1.8850361108779907} -09/21/2021 00:07:13 - INFO - __main__ - Step 44472: {'lr': 0.00019916359805181462, 'samples': 1423104, 'steps': 2779, 'loss/train': 1.407131314277649} -09/21/2021 00:07:14 - INFO - __main__ - Step 44473: {'lr': 0.00019916359805181462, 'samples': 1423136, 'steps': 2779, 'loss/train': 2.5182244777679443} -09/21/2021 00:07:15 - INFO - __main__ - Step 44474: {'lr': 0.00019916359805181462, 'samples': 1423168, 'steps': 2779, 'loss/train': 2.0910215377807617} -09/21/2021 00:07:16 - INFO - __main__ - Step 44475: {'lr': 0.00019916359805181462, 'samples': 1423200, 'steps': 2779, 'loss/train': 1.8054693937301636} -09/21/2021 00:07:16 - INFO - __main__ - Step 44476: {'lr': 0.00019916359805181462, 'samples': 1423232, 'steps': 2779, 'loss/train': 2.8691015243530273} -09/21/2021 00:07:17 - INFO - __main__ - Step 44477: {'lr': 0.00019916359805181462, 'samples': 1423264, 'steps': 2779, 'loss/train': 2.258820056915283} -09/21/2021 00:07:18 - INFO - __main__ - Step 44478: {'lr': 0.00019916359805181462, 'samples': 1423296, 'steps': 2779, 'loss/train': 2.2977731227874756} -09/21/2021 00:07:19 - INFO - __main__ - Step 44479: {'lr': 0.00019916359805181462, 'samples': 1423328, 'steps': 2779, 'loss/train': 1.571168303489685} -09/21/2021 00:07:19 - INFO - __main__ - Step 44480: {'lr': 0.00019916359805181462, 'samples': 1423360, 'steps': 2779, 'loss/train': 0.3269725739955902} -09/21/2021 00:07:20 - INFO - __main__ - Step 44481: {'lr': 0.00019916277455381658, 'samples': 1423392, 'steps': 2780, 'loss/train': 3.1437747478485107} -09/21/2021 00:07:21 - INFO - __main__ - Step 44482: {'lr': 0.00019916277455381658, 'samples': 1423424, 'steps': 2780, 'loss/train': 1.9465996026992798} -09/21/2021 00:07:22 - INFO - __main__ - Step 44483: {'lr': 0.00019916277455381658, 'samples': 1423456, 'steps': 2780, 'loss/train': 1.3022136688232422} -09/21/2021 00:07:22 - INFO - __main__ - Step 44484: {'lr': 0.00019916277455381658, 'samples': 1423488, 'steps': 2780, 'loss/train': 2.0748915672302246} -09/21/2021 00:07:23 - INFO - __main__ - Step 44485: {'lr': 0.00019916277455381658, 'samples': 1423520, 'steps': 2780, 'loss/train': 2.852077007293701} -09/21/2021 00:07:24 - INFO - __main__ - Step 44486: {'lr': 0.00019916277455381658, 'samples': 1423552, 'steps': 2780, 'loss/train': 0.8251991868019104} -09/21/2021 00:07:25 - INFO - __main__ - Step 44487: {'lr': 0.00019916277455381658, 'samples': 1423584, 'steps': 2780, 'loss/train': 1.938122272491455} -09/21/2021 00:07:25 - INFO - __main__ - Step 44488: {'lr': 0.00019916277455381658, 'samples': 1423616, 'steps': 2780, 'loss/train': 1.8932467699050903} -09/21/2021 00:07:26 - INFO - __main__ - Step 44489: {'lr': 0.00019916277455381658, 'samples': 1423648, 'steps': 2780, 'loss/train': 1.551369547843933} -09/21/2021 00:07:27 - INFO - __main__ - Step 44490: {'lr': 0.00019916277455381658, 'samples': 1423680, 'steps': 2780, 'loss/train': 0.5203750133514404} -09/21/2021 00:07:28 - INFO - __main__ - Step 44491: {'lr': 0.00019916277455381658, 'samples': 1423712, 'steps': 2780, 'loss/train': 1.6550554037094116} -09/21/2021 00:07:29 - INFO - __main__ - Step 44492: {'lr': 0.00019916277455381658, 'samples': 1423744, 'steps': 2780, 'loss/train': 2.219627857208252} -09/21/2021 00:07:30 - INFO - __main__ - Step 44493: {'lr': 0.00019916277455381658, 'samples': 1423776, 'steps': 2780, 'loss/train': 1.8312830924987793} -09/21/2021 00:07:31 - INFO - __main__ - Step 44494: {'lr': 0.00019916277455381658, 'samples': 1423808, 'steps': 2780, 'loss/train': 2.5255818367004395} -09/21/2021 00:07:31 - INFO - __main__ - Step 44495: {'lr': 0.00019916277455381658, 'samples': 1423840, 'steps': 2780, 'loss/train': 2.009815216064453} -09/21/2021 00:07:32 - INFO - __main__ - Step 44496: {'lr': 0.00019916277455381658, 'samples': 1423872, 'steps': 2780, 'loss/train': 1.9658600091934204} -09/21/2021 00:07:33 - INFO - __main__ - Step 44497: {'lr': 0.0001991619506523256, 'samples': 1423904, 'steps': 2781, 'loss/train': 1.3866349458694458} -09/21/2021 00:07:34 - INFO - __main__ - Step 44498: {'lr': 0.0001991619506523256, 'samples': 1423936, 'steps': 2781, 'loss/train': 2.116034507751465} -09/21/2021 00:07:34 - INFO - __main__ - Step 44499: {'lr': 0.0001991619506523256, 'samples': 1423968, 'steps': 2781, 'loss/train': 1.3332114219665527} -09/21/2021 00:07:35 - INFO - __main__ - Step 44500: {'lr': 0.0001991619506523256, 'samples': 1424000, 'steps': 2781, 'loss/train': 1.0867054462432861} -09/21/2021 00:07:36 - INFO - __main__ - Step 44501: {'lr': 0.0001991619506523256, 'samples': 1424032, 'steps': 2781, 'loss/train': 2.354825735092163} -09/21/2021 00:07:37 - INFO - __main__ - Step 44502: {'lr': 0.0001991619506523256, 'samples': 1424064, 'steps': 2781, 'loss/train': 1.5373777151107788} -09/21/2021 00:07:37 - INFO - __main__ - Step 44503: {'lr': 0.0001991619506523256, 'samples': 1424096, 'steps': 2781, 'loss/train': 0.40203604102134705} -09/21/2021 00:07:38 - INFO - __main__ - Step 44504: {'lr': 0.0001991619506523256, 'samples': 1424128, 'steps': 2781, 'loss/train': 2.0034549236297607} -09/21/2021 00:07:39 - INFO - __main__ - Step 44505: {'lr': 0.0001991619506523256, 'samples': 1424160, 'steps': 2781, 'loss/train': 1.8651937246322632} -09/21/2021 00:07:40 - INFO - __main__ - Step 44506: {'lr': 0.0001991619506523256, 'samples': 1424192, 'steps': 2781, 'loss/train': 2.1902871131896973} -09/21/2021 00:07:40 - INFO - __main__ - Step 44507: {'lr': 0.0001991619506523256, 'samples': 1424224, 'steps': 2781, 'loss/train': 1.6049655675888062} -09/21/2021 00:07:41 - INFO - __main__ - Step 44508: {'lr': 0.0001991619506523256, 'samples': 1424256, 'steps': 2781, 'loss/train': 1.9532016515731812} -09/21/2021 00:07:42 - INFO - __main__ - Step 44509: {'lr': 0.0001991619506523256, 'samples': 1424288, 'steps': 2781, 'loss/train': 1.9241154193878174} -09/21/2021 00:07:43 - INFO - __main__ - Step 44510: {'lr': 0.0001991619506523256, 'samples': 1424320, 'steps': 2781, 'loss/train': 2.289501905441284} -09/21/2021 00:07:43 - INFO - __main__ - Step 44511: {'lr': 0.0001991619506523256, 'samples': 1424352, 'steps': 2781, 'loss/train': 1.4909281730651855} -09/21/2021 00:07:44 - INFO - __main__ - Step 44512: {'lr': 0.0001991619506523256, 'samples': 1424384, 'steps': 2781, 'loss/train': 1.2914619445800781} -09/21/2021 00:07:45 - INFO - __main__ - Step 44513: {'lr': 0.000199161126347345, 'samples': 1424416, 'steps': 2782, 'loss/train': 2.1841506958007812} -09/21/2021 00:07:46 - INFO - __main__ - Step 44514: {'lr': 0.000199161126347345, 'samples': 1424448, 'steps': 2782, 'loss/train': 1.5932906866073608} -09/21/2021 00:07:47 - INFO - __main__ - Step 44515: {'lr': 0.000199161126347345, 'samples': 1424480, 'steps': 2782, 'loss/train': 2.8033266067504883} -09/21/2021 00:07:47 - INFO - __main__ - Step 44516: {'lr': 0.000199161126347345, 'samples': 1424512, 'steps': 2782, 'loss/train': 3.4941041469573975} -09/21/2021 00:07:48 - INFO - __main__ - Step 44517: {'lr': 0.000199161126347345, 'samples': 1424544, 'steps': 2782, 'loss/train': 1.8978357315063477} -09/21/2021 00:07:49 - INFO - __main__ - Step 44518: {'lr': 0.000199161126347345, 'samples': 1424576, 'steps': 2782, 'loss/train': 2.2001891136169434} -09/21/2021 00:07:50 - INFO - __main__ - Step 44519: {'lr': 0.000199161126347345, 'samples': 1424608, 'steps': 2782, 'loss/train': 1.8038877248764038} -09/21/2021 00:07:50 - INFO - __main__ - Step 44520: {'lr': 0.000199161126347345, 'samples': 1424640, 'steps': 2782, 'loss/train': 2.0221996307373047} -09/21/2021 00:07:51 - INFO - __main__ - Step 44521: {'lr': 0.000199161126347345, 'samples': 1424672, 'steps': 2782, 'loss/train': 1.9860697984695435} -09/21/2021 00:07:53 - INFO - __main__ - Step 44522: {'lr': 0.000199161126347345, 'samples': 1424704, 'steps': 2782, 'loss/train': 1.8149834871292114} -09/21/2021 00:07:54 - INFO - __main__ - Step 44523: {'lr': 0.000199161126347345, 'samples': 1424736, 'steps': 2782, 'loss/train': 1.8173710107803345} -09/21/2021 00:07:54 - INFO - __main__ - Step 44524: {'lr': 0.000199161126347345, 'samples': 1424768, 'steps': 2782, 'loss/train': 1.6919106245040894} -09/21/2021 00:07:55 - INFO - __main__ - Step 44525: {'lr': 0.000199161126347345, 'samples': 1424800, 'steps': 2782, 'loss/train': 1.8204371929168701} -09/21/2021 00:07:56 - INFO - __main__ - Step 44526: {'lr': 0.000199161126347345, 'samples': 1424832, 'steps': 2782, 'loss/train': 1.1332308053970337} -09/21/2021 00:07:57 - INFO - __main__ - Step 44527: {'lr': 0.000199161126347345, 'samples': 1424864, 'steps': 2782, 'loss/train': 2.1321818828582764} -09/21/2021 00:07:57 - INFO - __main__ - Step 44528: {'lr': 0.000199161126347345, 'samples': 1424896, 'steps': 2782, 'loss/train': 1.831300973892212} -09/21/2021 00:07:58 - INFO - __main__ - Step 44529: {'lr': 0.0001991603016388782, 'samples': 1424928, 'steps': 2783, 'loss/train': 2.251945734024048} -09/21/2021 00:07:59 - INFO - __main__ - Step 44530: {'lr': 0.0001991603016388782, 'samples': 1424960, 'steps': 2783, 'loss/train': 2.1890792846679688} -09/21/2021 00:08:00 - INFO - __main__ - Step 44531: {'lr': 0.0001991603016388782, 'samples': 1424992, 'steps': 2783, 'loss/train': 1.4871033430099487} -09/21/2021 00:08:00 - INFO - __main__ - Step 44532: {'lr': 0.0001991603016388782, 'samples': 1425024, 'steps': 2783, 'loss/train': 0.9580008387565613} -09/21/2021 00:08:01 - INFO - __main__ - Step 44533: {'lr': 0.0001991603016388782, 'samples': 1425056, 'steps': 2783, 'loss/train': 1.1250051259994507} -09/21/2021 00:08:02 - INFO - __main__ - Step 44534: {'lr': 0.0001991603016388782, 'samples': 1425088, 'steps': 2783, 'loss/train': 2.654613733291626} -09/21/2021 00:08:03 - INFO - __main__ - Step 44535: {'lr': 0.0001991603016388782, 'samples': 1425120, 'steps': 2783, 'loss/train': 1.9608098268508911} -09/21/2021 00:08:03 - INFO - __main__ - Step 44536: {'lr': 0.0001991603016388782, 'samples': 1425152, 'steps': 2783, 'loss/train': 2.8949761390686035} -09/21/2021 00:08:04 - INFO - __main__ - Step 44537: {'lr': 0.0001991603016388782, 'samples': 1425184, 'steps': 2783, 'loss/train': 2.3083696365356445} -09/21/2021 00:08:05 - INFO - __main__ - Step 44538: {'lr': 0.0001991603016388782, 'samples': 1425216, 'steps': 2783, 'loss/train': 2.049760580062866} -09/21/2021 00:08:06 - INFO - __main__ - Step 44539: {'lr': 0.0001991603016388782, 'samples': 1425248, 'steps': 2783, 'loss/train': 1.7827980518341064} -09/21/2021 00:08:06 - INFO - __main__ - Step 44540: {'lr': 0.0001991603016388782, 'samples': 1425280, 'steps': 2783, 'loss/train': 2.5498046875} -09/21/2021 00:08:07 - INFO - __main__ - Step 44541: {'lr': 0.0001991603016388782, 'samples': 1425312, 'steps': 2783, 'loss/train': 2.141019821166992} -09/21/2021 00:08:08 - INFO - __main__ - Step 44542: {'lr': 0.0001991603016388782, 'samples': 1425344, 'steps': 2783, 'loss/train': 1.880225658416748} -09/21/2021 00:08:09 - INFO - __main__ - Step 44543: {'lr': 0.0001991603016388782, 'samples': 1425376, 'steps': 2783, 'loss/train': 2.1681623458862305} -09/21/2021 00:08:09 - INFO - __main__ - Step 44544: {'lr': 0.0001991603016388782, 'samples': 1425408, 'steps': 2783, 'loss/train': 1.8045985698699951} -09/21/2021 00:08:10 - INFO - __main__ - Step 44545: {'lr': 0.0001991594765269285, 'samples': 1425440, 'steps': 2784, 'loss/train': 2.269737958908081} -09/21/2021 00:08:11 - INFO - __main__ - Step 44546: {'lr': 0.0001991594765269285, 'samples': 1425472, 'steps': 2784, 'loss/train': 1.785784363746643} -09/21/2021 00:08:12 - INFO - __main__ - Step 44547: {'lr': 0.0001991594765269285, 'samples': 1425504, 'steps': 2784, 'loss/train': 1.438711404800415} -09/21/2021 00:08:13 - INFO - __main__ - Step 44548: {'lr': 0.0001991594765269285, 'samples': 1425536, 'steps': 2784, 'loss/train': 0.41776153445243835} -09/21/2021 00:08:13 - INFO - __main__ - Step 44549: {'lr': 0.0001991594765269285, 'samples': 1425568, 'steps': 2784, 'loss/train': 2.7206003665924072} -09/21/2021 00:08:14 - INFO - __main__ - Step 44550: {'lr': 0.0001991594765269285, 'samples': 1425600, 'steps': 2784, 'loss/train': 2.4178476333618164} -09/21/2021 00:08:15 - INFO - __main__ - Step 44551: {'lr': 0.0001991594765269285, 'samples': 1425632, 'steps': 2784, 'loss/train': 2.2453837394714355} -09/21/2021 00:08:16 - INFO - __main__ - Step 44552: {'lr': 0.0001991594765269285, 'samples': 1425664, 'steps': 2784, 'loss/train': 1.2420369386672974} -09/21/2021 00:08:16 - INFO - __main__ - Step 44553: {'lr': 0.0001991594765269285, 'samples': 1425696, 'steps': 2784, 'loss/train': 2.1189091205596924} -09/21/2021 00:08:18 - INFO - __main__ - Step 44554: {'lr': 0.0001991594765269285, 'samples': 1425728, 'steps': 2784, 'loss/train': 1.4678760766983032} -09/21/2021 00:08:19 - INFO - __main__ - Step 44555: {'lr': 0.0001991594765269285, 'samples': 1425760, 'steps': 2784, 'loss/train': 2.213426351547241} -09/21/2021 00:08:19 - INFO - __main__ - Step 44556: {'lr': 0.0001991594765269285, 'samples': 1425792, 'steps': 2784, 'loss/train': 0.3848705589771271} -09/21/2021 00:08:20 - INFO - __main__ - Step 44557: {'lr': 0.0001991594765269285, 'samples': 1425824, 'steps': 2784, 'loss/train': 0.4223778247833252} -09/21/2021 00:08:21 - INFO - __main__ - Step 44558: {'lr': 0.0001991594765269285, 'samples': 1425856, 'steps': 2784, 'loss/train': 0.2940104305744171} -09/21/2021 00:08:22 - INFO - __main__ - Step 44559: {'lr': 0.0001991594765269285, 'samples': 1425888, 'steps': 2784, 'loss/train': 0.3328239619731903} -09/21/2021 00:08:22 - INFO - __main__ - Step 44560: {'lr': 0.0001991594765269285, 'samples': 1425920, 'steps': 2784, 'loss/train': 0.3609475791454315} -09/21/2021 00:08:23 - INFO - __main__ - Step 44561: {'lr': 0.0001991586510114993, 'samples': 1425952, 'steps': 2785, 'loss/train': 0.22133038938045502} -09/21/2021 00:08:24 - INFO - __main__ - Step 44562: {'lr': 0.0001991586510114993, 'samples': 1425984, 'steps': 2785, 'loss/train': 0.28081151843070984} -09/21/2021 00:08:25 - INFO - __main__ - Step 44563: {'lr': 0.0001991586510114993, 'samples': 1426016, 'steps': 2785, 'loss/train': 0.29409119486808777} -09/21/2021 00:08:26 - INFO - __main__ - Step 44564: {'lr': 0.0001991586510114993, 'samples': 1426048, 'steps': 2785, 'loss/train': 1.2651687860488892} -09/21/2021 00:08:26 - INFO - __main__ - Step 44565: {'lr': 0.0001991586510114993, 'samples': 1426080, 'steps': 2785, 'loss/train': 0.430042028427124} -09/21/2021 00:08:27 - INFO - __main__ - Step 44566: {'lr': 0.0001991586510114993, 'samples': 1426112, 'steps': 2785, 'loss/train': 2.0960774421691895} -09/21/2021 00:08:28 - INFO - __main__ - Step 44567: {'lr': 0.0001991586510114993, 'samples': 1426144, 'steps': 2785, 'loss/train': 1.3593612909317017} -09/21/2021 00:08:29 - INFO - __main__ - Step 44568: {'lr': 0.0001991586510114993, 'samples': 1426176, 'steps': 2785, 'loss/train': 2.4887499809265137} -09/21/2021 00:08:29 - INFO - __main__ - Step 44569: {'lr': 0.0001991586510114993, 'samples': 1426208, 'steps': 2785, 'loss/train': 2.009533166885376} -09/21/2021 00:08:30 - INFO - __main__ - Step 44570: {'lr': 0.0001991586510114993, 'samples': 1426240, 'steps': 2785, 'loss/train': 2.2699694633483887} -09/21/2021 00:08:31 - INFO - __main__ - Step 44571: {'lr': 0.0001991586510114993, 'samples': 1426272, 'steps': 2785, 'loss/train': 1.8575025796890259} -09/21/2021 00:08:32 - INFO - __main__ - Step 44572: {'lr': 0.0001991586510114993, 'samples': 1426304, 'steps': 2785, 'loss/train': 2.144747018814087} -09/21/2021 00:08:32 - INFO - __main__ - Step 44573: {'lr': 0.0001991586510114993, 'samples': 1426336, 'steps': 2785, 'loss/train': 1.3636702299118042} -09/21/2021 00:08:33 - INFO - __main__ - Step 44574: {'lr': 0.0001991586510114993, 'samples': 1426368, 'steps': 2785, 'loss/train': 1.789933443069458} -09/21/2021 00:08:34 - INFO - __main__ - Step 44575: {'lr': 0.0001991586510114993, 'samples': 1426400, 'steps': 2785, 'loss/train': 1.5560544729232788} -09/21/2021 00:08:35 - INFO - __main__ - Step 44576: {'lr': 0.0001991586510114993, 'samples': 1426432, 'steps': 2785, 'loss/train': 2.175286054611206} -09/21/2021 00:08:35 - INFO - __main__ - Step 44577: {'lr': 0.0001991578250925939, 'samples': 1426464, 'steps': 2786, 'loss/train': 1.9627220630645752} -09/21/2021 00:08:36 - INFO - __main__ - Step 44578: {'lr': 0.0001991578250925939, 'samples': 1426496, 'steps': 2786, 'loss/train': 1.2481892108917236} -09/21/2021 00:08:37 - INFO - __main__ - Step 44579: {'lr': 0.0001991578250925939, 'samples': 1426528, 'steps': 2786, 'loss/train': 0.42091166973114014} -09/21/2021 00:08:38 - INFO - __main__ - Step 44580: {'lr': 0.0001991578250925939, 'samples': 1426560, 'steps': 2786, 'loss/train': 2.6468355655670166} -09/21/2021 00:08:38 - INFO - __main__ - Step 44581: {'lr': 0.0001991578250925939, 'samples': 1426592, 'steps': 2786, 'loss/train': 2.5159196853637695} -09/21/2021 00:08:39 - INFO - __main__ - Step 44582: {'lr': 0.0001991578250925939, 'samples': 1426624, 'steps': 2786, 'loss/train': 0.9022814035415649} -09/21/2021 00:08:40 - INFO - __main__ - Step 44583: {'lr': 0.0001991578250925939, 'samples': 1426656, 'steps': 2786, 'loss/train': 0.9756106734275818} -09/21/2021 00:08:41 - INFO - __main__ - Step 44584: {'lr': 0.0001991578250925939, 'samples': 1426688, 'steps': 2786, 'loss/train': 0.9282281994819641} -09/21/2021 00:08:41 - INFO - __main__ - Step 44585: {'lr': 0.0001991578250925939, 'samples': 1426720, 'steps': 2786, 'loss/train': 1.9489011764526367} -09/21/2021 00:08:42 - INFO - __main__ - Step 44586: {'lr': 0.0001991578250925939, 'samples': 1426752, 'steps': 2786, 'loss/train': 2.835495948791504} -09/21/2021 00:08:43 - INFO - __main__ - Step 44587: {'lr': 0.0001991578250925939, 'samples': 1426784, 'steps': 2786, 'loss/train': 2.323125123977661} -09/21/2021 00:08:44 - INFO - __main__ - Step 44588: {'lr': 0.0001991578250925939, 'samples': 1426816, 'steps': 2786, 'loss/train': 0.4410744309425354} -09/21/2021 00:08:44 - INFO - __main__ - Step 44589: {'lr': 0.0001991578250925939, 'samples': 1426848, 'steps': 2786, 'loss/train': 1.3981714248657227} -09/21/2021 00:08:46 - INFO - __main__ - Step 44590: {'lr': 0.0001991578250925939, 'samples': 1426880, 'steps': 2786, 'loss/train': 2.092874526977539} -09/21/2021 00:08:46 - INFO - __main__ - Step 44591: {'lr': 0.0001991578250925939, 'samples': 1426912, 'steps': 2786, 'loss/train': 2.5620901584625244} -09/21/2021 00:08:47 - INFO - __main__ - Step 44592: {'lr': 0.0001991578250925939, 'samples': 1426944, 'steps': 2786, 'loss/train': 1.3967233896255493} -09/21/2021 00:08:48 - INFO - __main__ - Step 44593: {'lr': 0.00019915699877021573, 'samples': 1426976, 'steps': 2787, 'loss/train': 1.1991571187973022} -09/21/2021 00:08:49 - INFO - __main__ - Step 44594: {'lr': 0.00019915699877021573, 'samples': 1427008, 'steps': 2787, 'loss/train': 2.685845136642456} -09/21/2021 00:08:50 - INFO - __main__ - Step 44595: {'lr': 0.00019915699877021573, 'samples': 1427040, 'steps': 2787, 'loss/train': 1.622678279876709} -09/21/2021 00:08:50 - INFO - __main__ - Step 44596: {'lr': 0.00019915699877021573, 'samples': 1427072, 'steps': 2787, 'loss/train': 2.0421395301818848} -09/21/2021 00:08:51 - INFO - __main__ - Step 44597: {'lr': 0.00019915699877021573, 'samples': 1427104, 'steps': 2787, 'loss/train': 1.9040513038635254} -09/21/2021 00:08:52 - INFO - __main__ - Step 44598: {'lr': 0.00019915699877021573, 'samples': 1427136, 'steps': 2787, 'loss/train': 1.882769227027893} -09/21/2021 00:08:53 - INFO - __main__ - Step 44599: {'lr': 0.00019915699877021573, 'samples': 1427168, 'steps': 2787, 'loss/train': 1.0015376806259155} -09/21/2021 00:08:53 - INFO - __main__ - Step 44600: {'lr': 0.00019915699877021573, 'samples': 1427200, 'steps': 2787, 'loss/train': 3.7717843055725098} -09/21/2021 00:08:54 - INFO - __main__ - Step 44601: {'lr': 0.00019915699877021573, 'samples': 1427232, 'steps': 2787, 'loss/train': 0.8510698676109314} -09/21/2021 00:08:55 - INFO - __main__ - Step 44602: {'lr': 0.00019915699877021573, 'samples': 1427264, 'steps': 2787, 'loss/train': 1.275827407836914} -09/21/2021 00:08:56 - INFO - __main__ - Step 44603: {'lr': 0.00019915699877021573, 'samples': 1427296, 'steps': 2787, 'loss/train': 3.0366804599761963} -09/21/2021 00:08:56 - INFO - __main__ - Step 44604: {'lr': 0.00019915699877021573, 'samples': 1427328, 'steps': 2787, 'loss/train': 1.5688477754592896} -09/21/2021 00:08:57 - INFO - __main__ - Step 44605: {'lr': 0.00019915699877021573, 'samples': 1427360, 'steps': 2787, 'loss/train': 2.1933135986328125} -09/21/2021 00:08:58 - INFO - __main__ - Step 44606: {'lr': 0.00019915699877021573, 'samples': 1427392, 'steps': 2787, 'loss/train': 2.9846413135528564} -09/21/2021 00:08:59 - INFO - __main__ - Step 44607: {'lr': 0.00019915699877021573, 'samples': 1427424, 'steps': 2787, 'loss/train': 1.7987948656082153} -09/21/2021 00:08:59 - INFO - __main__ - Step 44608: {'lr': 0.00019915699877021573, 'samples': 1427456, 'steps': 2787, 'loss/train': 2.036619186401367} -09/21/2021 00:09:00 - INFO - __main__ - Step 44609: {'lr': 0.00019915617204436807, 'samples': 1427488, 'steps': 2788, 'loss/train': 3.4153926372528076} -09/21/2021 00:09:01 - INFO - __main__ - Step 44610: {'lr': 0.00019915617204436807, 'samples': 1427520, 'steps': 2788, 'loss/train': 2.3067376613616943} -09/21/2021 00:09:02 - INFO - __main__ - Step 44611: {'lr': 0.00019915617204436807, 'samples': 1427552, 'steps': 2788, 'loss/train': 1.7912650108337402} -09/21/2021 00:09:02 - INFO - __main__ - Step 44612: {'lr': 0.00019915617204436807, 'samples': 1427584, 'steps': 2788, 'loss/train': 2.7019190788269043} -09/21/2021 00:09:03 - INFO - __main__ - Step 44613: {'lr': 0.00019915617204436807, 'samples': 1427616, 'steps': 2788, 'loss/train': 2.6001081466674805} -09/21/2021 00:09:04 - INFO - __main__ - Step 44614: {'lr': 0.00019915617204436807, 'samples': 1427648, 'steps': 2788, 'loss/train': 2.105691909790039} -09/21/2021 00:09:05 - INFO - __main__ - Step 44615: {'lr': 0.00019915617204436807, 'samples': 1427680, 'steps': 2788, 'loss/train': 2.0657923221588135} -09/21/2021 00:09:05 - INFO - __main__ - Step 44616: {'lr': 0.00019915617204436807, 'samples': 1427712, 'steps': 2788, 'loss/train': 1.6720333099365234} -09/21/2021 00:09:06 - INFO - __main__ - Step 44617: {'lr': 0.00019915617204436807, 'samples': 1427744, 'steps': 2788, 'loss/train': 0.4708402752876282} -09/21/2021 00:09:07 - INFO - __main__ - Step 44618: {'lr': 0.00019915617204436807, 'samples': 1427776, 'steps': 2788, 'loss/train': 2.0894787311553955} -09/21/2021 00:09:08 - INFO - __main__ - Step 44619: {'lr': 0.00019915617204436807, 'samples': 1427808, 'steps': 2788, 'loss/train': 2.0369434356689453} -09/21/2021 00:09:08 - INFO - __main__ - Step 44620: {'lr': 0.00019915617204436807, 'samples': 1427840, 'steps': 2788, 'loss/train': 1.7778226137161255} -09/21/2021 00:09:09 - INFO - __main__ - Step 44621: {'lr': 0.00019915617204436807, 'samples': 1427872, 'steps': 2788, 'loss/train': 1.8002619743347168} -09/21/2021 00:09:11 - INFO - __main__ - Step 44622: {'lr': 0.00019915617204436807, 'samples': 1427904, 'steps': 2788, 'loss/train': 1.432877779006958} -09/21/2021 00:09:11 - INFO - __main__ - Step 44623: {'lr': 0.00019915617204436807, 'samples': 1427936, 'steps': 2788, 'loss/train': 2.105057716369629} -09/21/2021 00:09:12 - INFO - __main__ - Step 44624: {'lr': 0.00019915617204436807, 'samples': 1427968, 'steps': 2788, 'loss/train': 1.6850123405456543} -09/21/2021 00:09:13 - INFO - __main__ - Step 44625: {'lr': 0.00019915534491505438, 'samples': 1428000, 'steps': 2789, 'loss/train': 2.3100359439849854} -09/21/2021 00:09:14 - INFO - __main__ - Step 44626: {'lr': 0.00019915534491505438, 'samples': 1428032, 'steps': 2789, 'loss/train': 1.8939943313598633} -09/21/2021 00:09:14 - INFO - __main__ - Step 44627: {'lr': 0.00019915534491505438, 'samples': 1428064, 'steps': 2789, 'loss/train': 2.643195152282715} -09/21/2021 00:09:15 - INFO - __main__ - Step 44628: {'lr': 0.00019915534491505438, 'samples': 1428096, 'steps': 2789, 'loss/train': 1.6654142141342163} -09/21/2021 00:09:16 - INFO - __main__ - Step 44629: {'lr': 0.00019915534491505438, 'samples': 1428128, 'steps': 2789, 'loss/train': 1.8150490522384644} -09/21/2021 00:09:17 - INFO - __main__ - Step 44630: {'lr': 0.00019915534491505438, 'samples': 1428160, 'steps': 2789, 'loss/train': 1.398346185684204} -09/21/2021 00:09:17 - INFO - __main__ - Step 44631: {'lr': 0.00019915534491505438, 'samples': 1428192, 'steps': 2789, 'loss/train': 1.7704485654830933} -09/21/2021 00:09:18 - INFO - __main__ - Step 44632: {'lr': 0.00019915534491505438, 'samples': 1428224, 'steps': 2789, 'loss/train': 2.7609832286834717} -09/21/2021 00:09:19 - INFO - __main__ - Step 44633: {'lr': 0.00019915534491505438, 'samples': 1428256, 'steps': 2789, 'loss/train': 2.480855941772461} -09/21/2021 00:09:20 - INFO - __main__ - Step 44634: {'lr': 0.00019915534491505438, 'samples': 1428288, 'steps': 2789, 'loss/train': 1.9992691278457642} -09/21/2021 00:09:20 - INFO - __main__ - Step 44635: {'lr': 0.00019915534491505438, 'samples': 1428320, 'steps': 2789, 'loss/train': 2.9633255004882812} -09/21/2021 00:09:21 - INFO - __main__ - Step 44636: {'lr': 0.00019915534491505438, 'samples': 1428352, 'steps': 2789, 'loss/train': 2.4272780418395996} -09/21/2021 00:09:22 - INFO - __main__ - Step 44637: {'lr': 0.00019915534491505438, 'samples': 1428384, 'steps': 2789, 'loss/train': 2.2184364795684814} -09/21/2021 00:09:23 - INFO - __main__ - Step 44638: {'lr': 0.00019915534491505438, 'samples': 1428416, 'steps': 2789, 'loss/train': 2.4885642528533936} -09/21/2021 00:09:23 - INFO - __main__ - Step 44639: {'lr': 0.00019915534491505438, 'samples': 1428448, 'steps': 2789, 'loss/train': 2.262024164199829} -09/21/2021 00:09:24 - INFO - __main__ - Step 44640: {'lr': 0.00019915534491505438, 'samples': 1428480, 'steps': 2789, 'loss/train': 2.490206718444824} -09/21/2021 00:09:25 - INFO - __main__ - Step 44641: {'lr': 0.00019915451738227791, 'samples': 1428512, 'steps': 2790, 'loss/train': 2.2576119899749756} -09/21/2021 00:09:26 - INFO - __main__ - Step 44642: {'lr': 0.00019915451738227791, 'samples': 1428544, 'steps': 2790, 'loss/train': 2.699018955230713} -09/21/2021 00:09:27 - INFO - __main__ - Step 44643: {'lr': 0.00019915451738227791, 'samples': 1428576, 'steps': 2790, 'loss/train': 0.5188458561897278} -09/21/2021 00:09:27 - INFO - __main__ - Step 44644: {'lr': 0.00019915451738227791, 'samples': 1428608, 'steps': 2790, 'loss/train': 0.754204273223877} -09/21/2021 00:09:28 - INFO - __main__ - Step 44645: {'lr': 0.00019915451738227791, 'samples': 1428640, 'steps': 2790, 'loss/train': 2.595728635787964} -09/21/2021 00:09:29 - INFO - __main__ - Step 44646: {'lr': 0.00019915451738227791, 'samples': 1428672, 'steps': 2790, 'loss/train': 0.4717545509338379} -09/21/2021 00:09:30 - INFO - __main__ - Step 44647: {'lr': 0.00019915451738227791, 'samples': 1428704, 'steps': 2790, 'loss/train': 1.4871504306793213} -09/21/2021 00:09:30 - INFO - __main__ - Step 44648: {'lr': 0.00019915451738227791, 'samples': 1428736, 'steps': 2790, 'loss/train': 2.3494205474853516} -09/21/2021 00:09:31 - INFO - __main__ - Step 44649: {'lr': 0.00019915451738227791, 'samples': 1428768, 'steps': 2790, 'loss/train': 1.5667908191680908} -09/21/2021 00:09:32 - INFO - __main__ - Step 44650: {'lr': 0.00019915451738227791, 'samples': 1428800, 'steps': 2790, 'loss/train': 2.3435354232788086} -09/21/2021 00:09:33 - INFO - __main__ - Step 44651: {'lr': 0.00019915451738227791, 'samples': 1428832, 'steps': 2790, 'loss/train': 2.3224949836730957} -09/21/2021 00:09:33 - INFO - __main__ - Step 44652: {'lr': 0.00019915451738227791, 'samples': 1428864, 'steps': 2790, 'loss/train': 1.4797788858413696} -09/21/2021 00:09:34 - INFO - __main__ - Step 44653: {'lr': 0.00019915451738227791, 'samples': 1428896, 'steps': 2790, 'loss/train': 1.0293763875961304} -09/21/2021 00:09:35 - INFO - __main__ - Step 44654: {'lr': 0.00019915451738227791, 'samples': 1428928, 'steps': 2790, 'loss/train': 2.6098618507385254} -09/21/2021 00:09:36 - INFO - __main__ - Step 44655: {'lr': 0.00019915451738227791, 'samples': 1428960, 'steps': 2790, 'loss/train': 1.8921672105789185} -09/21/2021 00:09:37 - INFO - __main__ - Step 44656: {'lr': 0.00019915451738227791, 'samples': 1428992, 'steps': 2790, 'loss/train': 1.573879599571228} -09/21/2021 00:09:38 - INFO - __main__ - Step 44657: {'lr': 0.00019915368944604218, 'samples': 1429024, 'steps': 2791, 'loss/train': 2.621408224105835} -09/21/2021 00:09:38 - INFO - __main__ - Step 44658: {'lr': 0.00019915368944604218, 'samples': 1429056, 'steps': 2791, 'loss/train': 1.0420796871185303} -09/21/2021 00:09:39 - INFO - __main__ - Step 44659: {'lr': 0.00019915368944604218, 'samples': 1429088, 'steps': 2791, 'loss/train': 1.9774574041366577} -09/21/2021 00:09:40 - INFO - __main__ - Step 44660: {'lr': 0.00019915368944604218, 'samples': 1429120, 'steps': 2791, 'loss/train': 2.415459156036377} -09/21/2021 00:09:41 - INFO - __main__ - Step 44661: {'lr': 0.00019915368944604218, 'samples': 1429152, 'steps': 2791, 'loss/train': 1.3188098669052124} -09/21/2021 00:09:41 - INFO - __main__ - Step 44662: {'lr': 0.00019915368944604218, 'samples': 1429184, 'steps': 2791, 'loss/train': 2.0599281787872314} -09/21/2021 00:09:42 - INFO - __main__ - Step 44663: {'lr': 0.00019915368944604218, 'samples': 1429216, 'steps': 2791, 'loss/train': 1.75137197971344} -09/21/2021 00:09:43 - INFO - __main__ - Step 44664: {'lr': 0.00019915368944604218, 'samples': 1429248, 'steps': 2791, 'loss/train': 1.9561302661895752} -09/21/2021 00:09:44 - INFO - __main__ - Step 44665: {'lr': 0.00019915368944604218, 'samples': 1429280, 'steps': 2791, 'loss/train': 2.7021565437316895} -09/21/2021 00:09:44 - INFO - __main__ - Step 44666: {'lr': 0.00019915368944604218, 'samples': 1429312, 'steps': 2791, 'loss/train': 1.409488320350647} -09/21/2021 00:09:45 - INFO - __main__ - Step 44667: {'lr': 0.00019915368944604218, 'samples': 1429344, 'steps': 2791, 'loss/train': 1.623645544052124} -09/21/2021 00:09:46 - INFO - __main__ - Step 44668: {'lr': 0.00019915368944604218, 'samples': 1429376, 'steps': 2791, 'loss/train': 1.7345291376113892} -09/21/2021 00:09:47 - INFO - __main__ - Step 44669: {'lr': 0.00019915368944604218, 'samples': 1429408, 'steps': 2791, 'loss/train': 2.039299249649048} -09/21/2021 00:09:47 - INFO - __main__ - Step 44670: {'lr': 0.00019915368944604218, 'samples': 1429440, 'steps': 2791, 'loss/train': 2.579352617263794} -09/21/2021 00:09:48 - INFO - __main__ - Step 44671: {'lr': 0.00019915368944604218, 'samples': 1429472, 'steps': 2791, 'loss/train': 0.3583274483680725} -09/21/2021 00:09:49 - INFO - __main__ - Step 44672: {'lr': 0.00019915368944604218, 'samples': 1429504, 'steps': 2791, 'loss/train': 1.145285725593567} -09/21/2021 00:09:50 - INFO - __main__ - Step 44673: {'lr': 0.00019915286110635042, 'samples': 1429536, 'steps': 2792, 'loss/train': 2.4281768798828125} -09/21/2021 00:09:51 - INFO - __main__ - Step 44674: {'lr': 0.00019915286110635042, 'samples': 1429568, 'steps': 2792, 'loss/train': 1.8209635019302368} -09/21/2021 00:09:51 - INFO - __main__ - Step 44675: {'lr': 0.00019915286110635042, 'samples': 1429600, 'steps': 2792, 'loss/train': 3.0274858474731445} -09/21/2021 00:09:52 - INFO - __main__ - Step 44676: {'lr': 0.00019915286110635042, 'samples': 1429632, 'steps': 2792, 'loss/train': 1.6725493669509888} -09/21/2021 00:09:53 - INFO - __main__ - Step 44677: {'lr': 0.00019915286110635042, 'samples': 1429664, 'steps': 2792, 'loss/train': 1.5447324514389038} -09/21/2021 00:09:54 - INFO - __main__ - Step 44678: {'lr': 0.00019915286110635042, 'samples': 1429696, 'steps': 2792, 'loss/train': 1.6574677228927612} -09/21/2021 00:09:54 - INFO - __main__ - Step 44679: {'lr': 0.00019915286110635042, 'samples': 1429728, 'steps': 2792, 'loss/train': 1.757810354232788} -09/21/2021 00:09:55 - INFO - __main__ - Step 44680: {'lr': 0.00019915286110635042, 'samples': 1429760, 'steps': 2792, 'loss/train': 2.482140302658081} -09/21/2021 00:09:56 - INFO - __main__ - Step 44681: {'lr': 0.00019915286110635042, 'samples': 1429792, 'steps': 2792, 'loss/train': 1.9248871803283691} -09/21/2021 00:09:57 - INFO - __main__ - Step 44682: {'lr': 0.00019915286110635042, 'samples': 1429824, 'steps': 2792, 'loss/train': 1.7109676599502563} -09/21/2021 00:09:57 - INFO - __main__ - Step 44683: {'lr': 0.00019915286110635042, 'samples': 1429856, 'steps': 2792, 'loss/train': 2.6729586124420166} -09/21/2021 00:09:59 - INFO - __main__ - Step 44684: {'lr': 0.00019915286110635042, 'samples': 1429888, 'steps': 2792, 'loss/train': 2.3245134353637695} -09/21/2021 00:10:00 - INFO - __main__ - Step 44685: {'lr': 0.00019915286110635042, 'samples': 1429920, 'steps': 2792, 'loss/train': 1.5712268352508545} -09/21/2021 00:10:00 - INFO - __main__ - Step 44686: {'lr': 0.00019915286110635042, 'samples': 1429952, 'steps': 2792, 'loss/train': 0.3730154037475586} -09/21/2021 00:10:01 - INFO - __main__ - Step 44687: {'lr': 0.00019915286110635042, 'samples': 1429984, 'steps': 2792, 'loss/train': 1.9728124141693115} -09/21/2021 00:10:02 - INFO - __main__ - Step 44688: {'lr': 0.00019915286110635042, 'samples': 1430016, 'steps': 2792, 'loss/train': 1.8298861980438232} -09/21/2021 00:10:03 - INFO - __main__ - Step 44689: {'lr': 0.00019915203236320605, 'samples': 1430048, 'steps': 2793, 'loss/train': 1.5047862529754639} -09/21/2021 00:10:04 - INFO - __main__ - Step 44690: {'lr': 0.00019915203236320605, 'samples': 1430080, 'steps': 2793, 'loss/train': 0.4697090983390808} -09/21/2021 00:10:04 - INFO - __main__ - Step 44691: {'lr': 0.00019915203236320605, 'samples': 1430112, 'steps': 2793, 'loss/train': 1.4898186922073364} -09/21/2021 00:10:05 - INFO - __main__ - Step 44692: {'lr': 0.00019915203236320605, 'samples': 1430144, 'steps': 2793, 'loss/train': 1.671034812927246} -09/21/2021 00:10:06 - INFO - __main__ - Step 44693: {'lr': 0.00019915203236320605, 'samples': 1430176, 'steps': 2793, 'loss/train': 2.250756025314331} -09/21/2021 00:10:07 - INFO - __main__ - Step 44694: {'lr': 0.00019915203236320605, 'samples': 1430208, 'steps': 2793, 'loss/train': 1.9586520195007324} -09/21/2021 00:10:07 - INFO - __main__ - Step 44695: {'lr': 0.00019915203236320605, 'samples': 1430240, 'steps': 2793, 'loss/train': 1.9998505115509033} -09/21/2021 00:10:08 - INFO - __main__ - Step 44696: {'lr': 0.00019915203236320605, 'samples': 1430272, 'steps': 2793, 'loss/train': 2.3802645206451416} -09/21/2021 00:10:09 - INFO - __main__ - Step 44697: {'lr': 0.00019915203236320605, 'samples': 1430304, 'steps': 2793, 'loss/train': 2.366788387298584} -09/21/2021 00:10:10 - INFO - __main__ - Step 44698: {'lr': 0.00019915203236320605, 'samples': 1430336, 'steps': 2793, 'loss/train': 1.8478899002075195} -09/21/2021 00:10:10 - INFO - __main__ - Step 44699: {'lr': 0.00019915203236320605, 'samples': 1430368, 'steps': 2793, 'loss/train': 1.4543267488479614} -09/21/2021 00:10:11 - INFO - __main__ - Step 44700: {'lr': 0.00019915203236320605, 'samples': 1430400, 'steps': 2793, 'loss/train': 3.883843421936035} -09/21/2021 00:10:12 - INFO - __main__ - Step 44701: {'lr': 0.00019915203236320605, 'samples': 1430432, 'steps': 2793, 'loss/train': 3.904524326324463} -09/21/2021 00:10:13 - INFO - __main__ - Step 44702: {'lr': 0.00019915203236320605, 'samples': 1430464, 'steps': 2793, 'loss/train': 1.7948042154312134} -09/21/2021 00:10:13 - INFO - __main__ - Step 44703: {'lr': 0.00019915203236320605, 'samples': 1430496, 'steps': 2793, 'loss/train': 2.419835090637207} -09/21/2021 00:10:14 - INFO - __main__ - Step 44704: {'lr': 0.00019915203236320605, 'samples': 1430528, 'steps': 2793, 'loss/train': 2.425135612487793} -09/21/2021 00:10:15 - INFO - __main__ - Step 44705: {'lr': 0.00019915120321661246, 'samples': 1430560, 'steps': 2794, 'loss/train': 1.2763822078704834} -09/21/2021 00:10:16 - INFO - __main__ - Step 44706: {'lr': 0.00019915120321661246, 'samples': 1430592, 'steps': 2794, 'loss/train': 1.8244956731796265} -09/21/2021 00:10:16 - INFO - __main__ - Step 44707: {'lr': 0.00019915120321661246, 'samples': 1430624, 'steps': 2794, 'loss/train': 1.6637519598007202} -09/21/2021 00:10:17 - INFO - __main__ - Step 44708: {'lr': 0.00019915120321661246, 'samples': 1430656, 'steps': 2794, 'loss/train': 1.5346081256866455} -09/21/2021 00:10:18 - INFO - __main__ - Step 44709: {'lr': 0.00019915120321661246, 'samples': 1430688, 'steps': 2794, 'loss/train': 1.6935614347457886} -09/21/2021 00:10:19 - INFO - __main__ - Step 44710: {'lr': 0.00019915120321661246, 'samples': 1430720, 'steps': 2794, 'loss/train': 1.6655141115188599} -09/21/2021 00:10:19 - INFO - __main__ - Step 44711: {'lr': 0.00019915120321661246, 'samples': 1430752, 'steps': 2794, 'loss/train': 1.0514155626296997} -09/21/2021 00:10:20 - INFO - __main__ - Step 44712: {'lr': 0.00019915120321661246, 'samples': 1430784, 'steps': 2794, 'loss/train': 2.060823917388916} -09/21/2021 00:10:21 - INFO - __main__ - Step 44713: {'lr': 0.00019915120321661246, 'samples': 1430816, 'steps': 2794, 'loss/train': 1.8267314434051514} -09/21/2021 00:10:22 - INFO - __main__ - Step 44714: {'lr': 0.00019915120321661246, 'samples': 1430848, 'steps': 2794, 'loss/train': 2.5049819946289062} -09/21/2021 00:10:22 - INFO - __main__ - Step 44715: {'lr': 0.00019915120321661246, 'samples': 1430880, 'steps': 2794, 'loss/train': 0.4867062270641327} -09/21/2021 00:10:23 - INFO - __main__ - Step 44716: {'lr': 0.00019915120321661246, 'samples': 1430912, 'steps': 2794, 'loss/train': 0.4619224965572357} -09/21/2021 00:10:24 - INFO - __main__ - Step 44717: {'lr': 0.00019915120321661246, 'samples': 1430944, 'steps': 2794, 'loss/train': 0.5826117396354675} -09/21/2021 00:10:25 - INFO - __main__ - Step 44718: {'lr': 0.00019915120321661246, 'samples': 1430976, 'steps': 2794, 'loss/train': 0.4537779986858368} -09/21/2021 00:10:25 - INFO - __main__ - Step 44719: {'lr': 0.00019915120321661246, 'samples': 1431008, 'steps': 2794, 'loss/train': 0.3755296766757965} -09/21/2021 00:10:26 - INFO - __main__ - Step 44720: {'lr': 0.00019915120321661246, 'samples': 1431040, 'steps': 2794, 'loss/train': 0.5320300459861755} -09/21/2021 00:10:27 - INFO - __main__ - Step 44721: {'lr': 0.00019915037366657301, 'samples': 1431072, 'steps': 2795, 'loss/train': 0.34760725498199463} -09/21/2021 00:10:28 - INFO - __main__ - Step 44722: {'lr': 0.00019915037366657301, 'samples': 1431104, 'steps': 2795, 'loss/train': 0.3101786971092224} -09/21/2021 00:10:29 - INFO - __main__ - Step 44723: {'lr': 0.00019915037366657301, 'samples': 1431136, 'steps': 2795, 'loss/train': 0.39926692843437195} -09/21/2021 00:10:30 - INFO - __main__ - Step 44724: {'lr': 0.00019915037366657301, 'samples': 1431168, 'steps': 2795, 'loss/train': 2.0609073638916016} -09/21/2021 00:10:31 - INFO - __main__ - Step 44725: {'lr': 0.00019915037366657301, 'samples': 1431200, 'steps': 2795, 'loss/train': 1.6018677949905396} -09/21/2021 00:10:31 - INFO - __main__ - Step 44726: {'lr': 0.00019915037366657301, 'samples': 1431232, 'steps': 2795, 'loss/train': 3.3054277896881104} -09/21/2021 00:10:32 - INFO - __main__ - Step 44727: {'lr': 0.00019915037366657301, 'samples': 1431264, 'steps': 2795, 'loss/train': 2.3448004722595215} -09/21/2021 00:10:33 - INFO - __main__ - Step 44728: {'lr': 0.00019915037366657301, 'samples': 1431296, 'steps': 2795, 'loss/train': 1.5737671852111816} -09/21/2021 00:10:34 - INFO - __main__ - Step 44729: {'lr': 0.00019915037366657301, 'samples': 1431328, 'steps': 2795, 'loss/train': 2.6480906009674072} -09/21/2021 00:10:34 - INFO - __main__ - Step 44730: {'lr': 0.00019915037366657301, 'samples': 1431360, 'steps': 2795, 'loss/train': 1.7298879623413086} -09/21/2021 00:10:35 - INFO - __main__ - Step 44731: {'lr': 0.00019915037366657301, 'samples': 1431392, 'steps': 2795, 'loss/train': 1.8964661359786987} -09/21/2021 00:10:36 - INFO - __main__ - Step 44732: {'lr': 0.00019915037366657301, 'samples': 1431424, 'steps': 2795, 'loss/train': 2.4697022438049316} -09/21/2021 00:10:37 - INFO - __main__ - Step 44733: {'lr': 0.00019915037366657301, 'samples': 1431456, 'steps': 2795, 'loss/train': 1.5424211025238037} -09/21/2021 00:10:37 - INFO - __main__ - Step 44734: {'lr': 0.00019915037366657301, 'samples': 1431488, 'steps': 2795, 'loss/train': 1.9134868383407593} -09/21/2021 00:10:38 - INFO - __main__ - Step 44735: {'lr': 0.00019915037366657301, 'samples': 1431520, 'steps': 2795, 'loss/train': 2.488353729248047} -09/21/2021 00:10:39 - INFO - __main__ - Step 44736: {'lr': 0.00019915037366657301, 'samples': 1431552, 'steps': 2795, 'loss/train': 2.198699951171875} -09/21/2021 00:10:40 - INFO - __main__ - Step 44737: {'lr': 0.00019914954371309107, 'samples': 1431584, 'steps': 2796, 'loss/train': 1.7486321926116943} -09/21/2021 00:10:41 - INFO - __main__ - Step 44738: {'lr': 0.00019914954371309107, 'samples': 1431616, 'steps': 2796, 'loss/train': 1.4639222621917725} -09/21/2021 00:10:41 - INFO - __main__ - Step 44739: {'lr': 0.00019914954371309107, 'samples': 1431648, 'steps': 2796, 'loss/train': 1.7232738733291626} -09/21/2021 00:10:42 - INFO - __main__ - Step 44740: {'lr': 0.00019914954371309107, 'samples': 1431680, 'steps': 2796, 'loss/train': 2.302032709121704} -09/21/2021 00:10:43 - INFO - __main__ - Step 44741: {'lr': 0.00019914954371309107, 'samples': 1431712, 'steps': 2796, 'loss/train': 2.454531192779541} -09/21/2021 00:10:44 - INFO - __main__ - Step 44742: {'lr': 0.00019914954371309107, 'samples': 1431744, 'steps': 2796, 'loss/train': 2.1493449211120605} -09/21/2021 00:10:44 - INFO - __main__ - Step 44743: {'lr': 0.00019914954371309107, 'samples': 1431776, 'steps': 2796, 'loss/train': 3.042421817779541} -09/21/2021 00:10:45 - INFO - __main__ - Step 44744: {'lr': 0.00019914954371309107, 'samples': 1431808, 'steps': 2796, 'loss/train': 2.9801125526428223} -09/21/2021 00:10:46 - INFO - __main__ - Step 44745: {'lr': 0.00019914954371309107, 'samples': 1431840, 'steps': 2796, 'loss/train': 1.8758578300476074} -09/21/2021 00:10:47 - INFO - __main__ - Step 44746: {'lr': 0.00019914954371309107, 'samples': 1431872, 'steps': 2796, 'loss/train': 1.2840632200241089} -09/21/2021 00:10:47 - INFO - __main__ - Step 44747: {'lr': 0.00019914954371309107, 'samples': 1431904, 'steps': 2796, 'loss/train': 2.0224063396453857} -09/21/2021 00:10:48 - INFO - __main__ - Step 44748: {'lr': 0.00019914954371309107, 'samples': 1431936, 'steps': 2796, 'loss/train': 2.8019909858703613} -09/21/2021 00:10:49 - INFO - __main__ - Step 44749: {'lr': 0.00019914954371309107, 'samples': 1431968, 'steps': 2796, 'loss/train': 3.3134734630584717} -09/21/2021 00:10:50 - INFO - __main__ - Step 44750: {'lr': 0.00019914954371309107, 'samples': 1432000, 'steps': 2796, 'loss/train': 1.7881487607955933} -09/21/2021 00:10:50 - INFO - __main__ - Step 44751: {'lr': 0.00019914954371309107, 'samples': 1432032, 'steps': 2796, 'loss/train': 2.1533126831054688} -09/21/2021 00:10:51 - INFO - __main__ - Step 44752: {'lr': 0.00019914954371309107, 'samples': 1432064, 'steps': 2796, 'loss/train': 2.0685079097747803} -09/21/2021 00:10:52 - INFO - __main__ - Step 44753: {'lr': 0.00019914871335617002, 'samples': 1432096, 'steps': 2797, 'loss/train': 1.420582890510559} -09/21/2021 00:10:53 - INFO - __main__ - Step 44754: {'lr': 0.00019914871335617002, 'samples': 1432128, 'steps': 2797, 'loss/train': 1.7122440338134766} -09/21/2021 00:10:54 - INFO - __main__ - Step 44755: {'lr': 0.00019914871335617002, 'samples': 1432160, 'steps': 2797, 'loss/train': 2.9838154315948486} -09/21/2021 00:10:55 - INFO - __main__ - Step 44756: {'lr': 0.00019914871335617002, 'samples': 1432192, 'steps': 2797, 'loss/train': 2.147139310836792} -09/21/2021 00:10:55 - INFO - __main__ - Step 44757: {'lr': 0.00019914871335617002, 'samples': 1432224, 'steps': 2797, 'loss/train': 2.602638006210327} -09/21/2021 00:10:56 - INFO - __main__ - Step 44758: {'lr': 0.00019914871335617002, 'samples': 1432256, 'steps': 2797, 'loss/train': 2.032274007797241} -09/21/2021 00:10:57 - INFO - __main__ - Step 44759: {'lr': 0.00019914871335617002, 'samples': 1432288, 'steps': 2797, 'loss/train': 1.930935025215149} -09/21/2021 00:10:58 - INFO - __main__ - Step 44760: {'lr': 0.00019914871335617002, 'samples': 1432320, 'steps': 2797, 'loss/train': 2.053030490875244} -09/21/2021 00:10:58 - INFO - __main__ - Step 44761: {'lr': 0.00019914871335617002, 'samples': 1432352, 'steps': 2797, 'loss/train': 3.3665473461151123} -09/21/2021 00:10:59 - INFO - __main__ - Step 44762: {'lr': 0.00019914871335617002, 'samples': 1432384, 'steps': 2797, 'loss/train': 2.137486219406128} -09/21/2021 00:11:00 - INFO - __main__ - Step 44763: {'lr': 0.00019914871335617002, 'samples': 1432416, 'steps': 2797, 'loss/train': 2.555823564529419} -09/21/2021 00:11:01 - INFO - __main__ - Step 44764: {'lr': 0.00019914871335617002, 'samples': 1432448, 'steps': 2797, 'loss/train': 1.4398335218429565} -09/21/2021 00:11:01 - INFO - __main__ - Step 44765: {'lr': 0.00019914871335617002, 'samples': 1432480, 'steps': 2797, 'loss/train': 1.382561445236206} -09/21/2021 00:11:02 - INFO - __main__ - Step 44766: {'lr': 0.00019914871335617002, 'samples': 1432512, 'steps': 2797, 'loss/train': 2.120542049407959} -09/21/2021 00:11:03 - INFO - __main__ - Step 44767: {'lr': 0.00019914871335617002, 'samples': 1432544, 'steps': 2797, 'loss/train': 1.9498114585876465} -09/21/2021 00:11:04 - INFO - __main__ - Step 44768: {'lr': 0.00019914871335617002, 'samples': 1432576, 'steps': 2797, 'loss/train': 2.9128386974334717} -09/21/2021 00:11:05 - INFO - __main__ - Step 44769: {'lr': 0.00019914788259581324, 'samples': 1432608, 'steps': 2798, 'loss/train': 2.417036771774292} -09/21/2021 00:11:05 - INFO - __main__ - Step 44770: {'lr': 0.00019914788259581324, 'samples': 1432640, 'steps': 2798, 'loss/train': 1.8300644159317017} -09/21/2021 00:11:06 - INFO - __main__ - Step 44771: {'lr': 0.00019914788259581324, 'samples': 1432672, 'steps': 2798, 'loss/train': 1.915494441986084} -09/21/2021 00:11:07 - INFO - __main__ - Step 44772: {'lr': 0.00019914788259581324, 'samples': 1432704, 'steps': 2798, 'loss/train': 2.0137453079223633} -09/21/2021 00:11:08 - INFO - __main__ - Step 44773: {'lr': 0.00019914788259581324, 'samples': 1432736, 'steps': 2798, 'loss/train': 2.7611658573150635} -09/21/2021 00:11:08 - INFO - __main__ - Step 44774: {'lr': 0.00019914788259581324, 'samples': 1432768, 'steps': 2798, 'loss/train': 2.2950353622436523} -09/21/2021 00:11:09 - INFO - __main__ - Step 44775: {'lr': 0.00019914788259581324, 'samples': 1432800, 'steps': 2798, 'loss/train': 1.561308741569519} -09/21/2021 00:11:10 - INFO - __main__ - Step 44776: {'lr': 0.00019914788259581324, 'samples': 1432832, 'steps': 2798, 'loss/train': 1.9492472410202026} -09/21/2021 00:11:11 - INFO - __main__ - Step 44777: {'lr': 0.00019914788259581324, 'samples': 1432864, 'steps': 2798, 'loss/train': 0.6654841303825378} -09/21/2021 00:11:11 - INFO - __main__ - Step 44778: {'lr': 0.00019914788259581324, 'samples': 1432896, 'steps': 2798, 'loss/train': 1.2736610174179077} -09/21/2021 00:11:12 - INFO - __main__ - Step 44779: {'lr': 0.00019914788259581324, 'samples': 1432928, 'steps': 2798, 'loss/train': 1.70911705493927} -09/21/2021 00:11:13 - INFO - __main__ - Step 44780: {'lr': 0.00019914788259581324, 'samples': 1432960, 'steps': 2798, 'loss/train': 2.428830862045288} -09/21/2021 00:11:14 - INFO - __main__ - Step 44781: {'lr': 0.00019914788259581324, 'samples': 1432992, 'steps': 2798, 'loss/train': 1.5456022024154663} -09/21/2021 00:11:14 - INFO - __main__ - Step 44782: {'lr': 0.00019914788259581324, 'samples': 1433024, 'steps': 2798, 'loss/train': 2.6485345363616943} -09/21/2021 00:11:15 - INFO - __main__ - Step 44783: {'lr': 0.00019914788259581324, 'samples': 1433056, 'steps': 2798, 'loss/train': 2.0081281661987305} -09/21/2021 00:11:16 - INFO - __main__ - Step 44784: {'lr': 0.00019914788259581324, 'samples': 1433088, 'steps': 2798, 'loss/train': 2.425057888031006} -09/21/2021 00:11:17 - INFO - __main__ - Step 44785: {'lr': 0.00019914705143202414, 'samples': 1433120, 'steps': 2799, 'loss/train': 2.175116777420044} -09/21/2021 00:11:18 - INFO - __main__ - Step 44786: {'lr': 0.00019914705143202414, 'samples': 1433152, 'steps': 2799, 'loss/train': 2.993687629699707} -09/21/2021 00:11:19 - INFO - __main__ - Step 44787: {'lr': 0.00019914705143202414, 'samples': 1433184, 'steps': 2799, 'loss/train': 2.7901885509490967} -09/21/2021 00:11:19 - INFO - __main__ - Step 44788: {'lr': 0.00019914705143202414, 'samples': 1433216, 'steps': 2799, 'loss/train': 2.4135868549346924} -09/21/2021 00:11:20 - INFO - __main__ - Step 44789: {'lr': 0.00019914705143202414, 'samples': 1433248, 'steps': 2799, 'loss/train': 1.7452765703201294} -09/21/2021 00:11:21 - INFO - __main__ - Step 44790: {'lr': 0.00019914705143202414, 'samples': 1433280, 'steps': 2799, 'loss/train': 0.4342111647129059} -09/21/2021 00:11:22 - INFO - __main__ - Step 44791: {'lr': 0.00019914705143202414, 'samples': 1433312, 'steps': 2799, 'loss/train': 1.9695194959640503} -09/21/2021 00:11:22 - INFO - __main__ - Step 44792: {'lr': 0.00019914705143202414, 'samples': 1433344, 'steps': 2799, 'loss/train': 2.072751998901367} -09/21/2021 00:11:23 - INFO - __main__ - Step 44793: {'lr': 0.00019914705143202414, 'samples': 1433376, 'steps': 2799, 'loss/train': 1.991988182067871} -09/21/2021 00:11:24 - INFO - __main__ - Step 44794: {'lr': 0.00019914705143202414, 'samples': 1433408, 'steps': 2799, 'loss/train': 1.9871597290039062} -09/21/2021 00:11:25 - INFO - __main__ - Step 44795: {'lr': 0.00019914705143202414, 'samples': 1433440, 'steps': 2799, 'loss/train': 1.6670243740081787} -09/21/2021 00:11:25 - INFO - __main__ - Step 44796: {'lr': 0.00019914705143202414, 'samples': 1433472, 'steps': 2799, 'loss/train': 1.3489574193954468} -09/21/2021 00:11:26 - INFO - __main__ - Step 44797: {'lr': 0.00019914705143202414, 'samples': 1433504, 'steps': 2799, 'loss/train': 2.960432767868042} -09/21/2021 00:11:27 - INFO - __main__ - Step 44798: {'lr': 0.00019914705143202414, 'samples': 1433536, 'steps': 2799, 'loss/train': 1.7651206254959106} -09/21/2021 00:11:28 - INFO - __main__ - Step 44799: {'lr': 0.00019914705143202414, 'samples': 1433568, 'steps': 2799, 'loss/train': 2.0322306156158447} -09/21/2021 00:11:28 - INFO - __main__ - Step 44800: {'lr': 0.00019914705143202414, 'samples': 1433600, 'steps': 2799, 'loss/train': 4.116482257843018} -09/21/2021 00:11:29 - INFO - __main__ - Step 44801: {'lr': 0.00019914621986480603, 'samples': 1433632, 'steps': 2800, 'loss/train': 2.479490041732788} -09/21/2021 00:11:30 - INFO - __main__ - Step 44802: {'lr': 0.00019914621986480603, 'samples': 1433664, 'steps': 2800, 'loss/train': 3.066638469696045} -09/21/2021 00:11:31 - INFO - __main__ - Step 44803: {'lr': 0.00019914621986480603, 'samples': 1433696, 'steps': 2800, 'loss/train': 2.334082841873169} -09/21/2021 00:11:32 - INFO - __main__ - Step 44804: {'lr': 0.00019914621986480603, 'samples': 1433728, 'steps': 2800, 'loss/train': 2.3165128231048584} -09/21/2021 00:11:32 - INFO - __main__ - Step 44805: {'lr': 0.00019914621986480603, 'samples': 1433760, 'steps': 2800, 'loss/train': 1.4489684104919434} -09/21/2021 00:11:33 - INFO - __main__ - Step 44806: {'lr': 0.00019914621986480603, 'samples': 1433792, 'steps': 2800, 'loss/train': 2.7953684329986572} -09/21/2021 00:11:34 - INFO - __main__ - Step 44807: {'lr': 0.00019914621986480603, 'samples': 1433824, 'steps': 2800, 'loss/train': 1.8770732879638672} -09/21/2021 00:11:35 - INFO - __main__ - Step 44808: {'lr': 0.00019914621986480603, 'samples': 1433856, 'steps': 2800, 'loss/train': 2.9863457679748535} -09/21/2021 00:11:35 - INFO - __main__ - Step 44809: {'lr': 0.00019914621986480603, 'samples': 1433888, 'steps': 2800, 'loss/train': 2.1063246726989746} -09/21/2021 00:11:36 - INFO - __main__ - Step 44810: {'lr': 0.00019914621986480603, 'samples': 1433920, 'steps': 2800, 'loss/train': 2.084245204925537} -09/21/2021 00:11:37 - INFO - __main__ - Step 44811: {'lr': 0.00019914621986480603, 'samples': 1433952, 'steps': 2800, 'loss/train': 1.626763105392456} -09/21/2021 00:11:38 - INFO - __main__ - Step 44812: {'lr': 0.00019914621986480603, 'samples': 1433984, 'steps': 2800, 'loss/train': 2.254572629928589} -09/21/2021 00:11:38 - INFO - __main__ - Step 44813: {'lr': 0.00019914621986480603, 'samples': 1434016, 'steps': 2800, 'loss/train': 1.4491347074508667} -09/21/2021 00:11:39 - INFO - __main__ - Step 44814: {'lr': 0.00019914621986480603, 'samples': 1434048, 'steps': 2800, 'loss/train': 1.4049807786941528} -09/21/2021 00:11:40 - INFO - __main__ - Step 44815: {'lr': 0.00019914621986480603, 'samples': 1434080, 'steps': 2800, 'loss/train': 2.02433705329895} -09/21/2021 00:11:41 - INFO - __main__ - Step 44816: {'lr': 0.00019914621986480603, 'samples': 1434112, 'steps': 2800, 'loss/train': 3.5285613536834717} -09/21/2021 00:11:42 - INFO - __main__ - Step 44817: {'lr': 0.00019914538789416234, 'samples': 1434144, 'steps': 2801, 'loss/train': 1.3719395399093628} -09/21/2021 00:11:43 - INFO - __main__ - Step 44818: {'lr': 0.00019914538789416234, 'samples': 1434176, 'steps': 2801, 'loss/train': 1.62959885597229} -09/21/2021 00:11:43 - INFO - __main__ - Step 44819: {'lr': 0.00019914538789416234, 'samples': 1434208, 'steps': 2801, 'loss/train': 1.4737924337387085} -09/21/2021 00:11:44 - INFO - __main__ - Step 44820: {'lr': 0.00019914538789416234, 'samples': 1434240, 'steps': 2801, 'loss/train': 0.8928424119949341} -09/21/2021 00:11:45 - INFO - __main__ - Step 44821: {'lr': 0.00019914538789416234, 'samples': 1434272, 'steps': 2801, 'loss/train': 1.28726327419281} -09/21/2021 00:11:46 - INFO - __main__ - Step 44822: {'lr': 0.00019914538789416234, 'samples': 1434304, 'steps': 2801, 'loss/train': 1.7550686597824097} -09/21/2021 00:11:46 - INFO - __main__ - Step 44823: {'lr': 0.00019914538789416234, 'samples': 1434336, 'steps': 2801, 'loss/train': 2.2318170070648193} -09/21/2021 00:11:47 - INFO - __main__ - Step 44824: {'lr': 0.00019914538789416234, 'samples': 1434368, 'steps': 2801, 'loss/train': 2.2100484371185303} -09/21/2021 00:11:48 - INFO - __main__ - Step 44825: {'lr': 0.00019914538789416234, 'samples': 1434400, 'steps': 2801, 'loss/train': 2.319725513458252} -09/21/2021 00:11:49 - INFO - __main__ - Step 44826: {'lr': 0.00019914538789416234, 'samples': 1434432, 'steps': 2801, 'loss/train': 2.113525867462158} -09/21/2021 00:11:49 - INFO - __main__ - Step 44827: {'lr': 0.00019914538789416234, 'samples': 1434464, 'steps': 2801, 'loss/train': 2.3913280963897705} -09/21/2021 00:11:50 - INFO - __main__ - Step 44828: {'lr': 0.00019914538789416234, 'samples': 1434496, 'steps': 2801, 'loss/train': 1.5516868829727173} -09/21/2021 00:11:51 - INFO - __main__ - Step 44829: {'lr': 0.00019914538789416234, 'samples': 1434528, 'steps': 2801, 'loss/train': 2.154353141784668} -09/21/2021 00:11:52 - INFO - __main__ - Step 44830: {'lr': 0.00019914538789416234, 'samples': 1434560, 'steps': 2801, 'loss/train': 1.6830613613128662} -09/21/2021 00:11:52 - INFO - __main__ - Step 44831: {'lr': 0.00019914538789416234, 'samples': 1434592, 'steps': 2801, 'loss/train': 2.6378965377807617} -09/21/2021 00:11:53 - INFO - __main__ - Step 44832: {'lr': 0.00019914538789416234, 'samples': 1434624, 'steps': 2801, 'loss/train': 0.8503473401069641} -09/21/2021 00:11:54 - INFO - __main__ - Step 44833: {'lr': 0.00019914455552009645, 'samples': 1434656, 'steps': 2802, 'loss/train': 2.0512819290161133} -09/21/2021 00:11:55 - INFO - __main__ - Step 44834: {'lr': 0.00019914455552009645, 'samples': 1434688, 'steps': 2802, 'loss/train': 2.075683832168579} -09/21/2021 00:11:56 - INFO - __main__ - Step 44835: {'lr': 0.00019914455552009645, 'samples': 1434720, 'steps': 2802, 'loss/train': 1.9944802522659302} -09/21/2021 00:11:56 - INFO - __main__ - Step 44836: {'lr': 0.00019914455552009645, 'samples': 1434752, 'steps': 2802, 'loss/train': 2.006134271621704} -09/21/2021 00:11:57 - INFO - __main__ - Step 44837: {'lr': 0.00019914455552009645, 'samples': 1434784, 'steps': 2802, 'loss/train': 1.185592770576477} -09/21/2021 00:11:58 - INFO - __main__ - Step 44838: {'lr': 0.00019914455552009645, 'samples': 1434816, 'steps': 2802, 'loss/train': 2.1971871852874756} -09/21/2021 00:11:59 - INFO - __main__ - Step 44839: {'lr': 0.00019914455552009645, 'samples': 1434848, 'steps': 2802, 'loss/train': 1.4438954591751099} -09/21/2021 00:11:59 - INFO - __main__ - Step 44840: {'lr': 0.00019914455552009645, 'samples': 1434880, 'steps': 2802, 'loss/train': 2.9941837787628174} -09/21/2021 00:12:00 - INFO - __main__ - Step 44841: {'lr': 0.00019914455552009645, 'samples': 1434912, 'steps': 2802, 'loss/train': 1.8228102922439575} -09/21/2021 00:12:01 - INFO - __main__ - Step 44842: {'lr': 0.00019914455552009645, 'samples': 1434944, 'steps': 2802, 'loss/train': 2.1982619762420654} -09/21/2021 00:12:02 - INFO - __main__ - Step 44843: {'lr': 0.00019914455552009645, 'samples': 1434976, 'steps': 2802, 'loss/train': 2.5191268920898438} -09/21/2021 00:12:02 - INFO - __main__ - Step 44844: {'lr': 0.00019914455552009645, 'samples': 1435008, 'steps': 2802, 'loss/train': 2.72011399269104} -09/21/2021 00:12:03 - INFO - __main__ - Step 44845: {'lr': 0.00019914455552009645, 'samples': 1435040, 'steps': 2802, 'loss/train': 2.7670156955718994} -09/21/2021 00:12:05 - INFO - __main__ - Step 44846: {'lr': 0.00019914455552009645, 'samples': 1435072, 'steps': 2802, 'loss/train': 2.3471286296844482} -09/21/2021 00:12:06 - INFO - __main__ - Step 44847: {'lr': 0.00019914455552009645, 'samples': 1435104, 'steps': 2802, 'loss/train': 1.5723366737365723} -09/21/2021 00:12:06 - INFO - __main__ - Step 44848: {'lr': 0.00019914455552009645, 'samples': 1435136, 'steps': 2802, 'loss/train': 2.3297553062438965} -09/21/2021 00:12:07 - INFO - __main__ - Step 44849: {'lr': 0.00019914372274261176, 'samples': 1435168, 'steps': 2803, 'loss/train': 1.7786600589752197} -09/21/2021 00:12:08 - INFO - __main__ - Step 44850: {'lr': 0.00019914372274261176, 'samples': 1435200, 'steps': 2803, 'loss/train': 1.6946451663970947} -09/21/2021 00:12:09 - INFO - __main__ - Step 44851: {'lr': 0.00019914372274261176, 'samples': 1435232, 'steps': 2803, 'loss/train': 2.1025054454803467} -09/21/2021 00:12:10 - INFO - __main__ - Step 44852: {'lr': 0.00019914372274261176, 'samples': 1435264, 'steps': 2803, 'loss/train': 2.5827555656433105} -09/21/2021 00:12:10 - INFO - __main__ - Step 44853: {'lr': 0.00019914372274261176, 'samples': 1435296, 'steps': 2803, 'loss/train': 0.5979241132736206} -09/21/2021 00:12:11 - INFO - __main__ - Step 44854: {'lr': 0.00019914372274261176, 'samples': 1435328, 'steps': 2803, 'loss/train': 2.5040781497955322} -09/21/2021 00:12:12 - INFO - __main__ - Step 44855: {'lr': 0.00019914372274261176, 'samples': 1435360, 'steps': 2803, 'loss/train': 1.3493213653564453} -09/21/2021 00:12:13 - INFO - __main__ - Step 44856: {'lr': 0.00019914372274261176, 'samples': 1435392, 'steps': 2803, 'loss/train': 0.285845011472702} -09/21/2021 00:12:13 - INFO - __main__ - Step 44857: {'lr': 0.00019914372274261176, 'samples': 1435424, 'steps': 2803, 'loss/train': 1.6169687509536743} -09/21/2021 00:12:14 - INFO - __main__ - Step 44858: {'lr': 0.00019914372274261176, 'samples': 1435456, 'steps': 2803, 'loss/train': 2.2973132133483887} -09/21/2021 00:12:15 - INFO - __main__ - Step 44859: {'lr': 0.00019914372274261176, 'samples': 1435488, 'steps': 2803, 'loss/train': 1.6709697246551514} -09/21/2021 00:12:16 - INFO - __main__ - Step 44860: {'lr': 0.00019914372274261176, 'samples': 1435520, 'steps': 2803, 'loss/train': 2.8660542964935303} -09/21/2021 00:12:16 - INFO - __main__ - Step 44861: {'lr': 0.00019914372274261176, 'samples': 1435552, 'steps': 2803, 'loss/train': 1.0799239873886108} -09/21/2021 00:12:17 - INFO - __main__ - Step 44862: {'lr': 0.00019914372274261176, 'samples': 1435584, 'steps': 2803, 'loss/train': 3.412782907485962} -09/21/2021 00:12:18 - INFO - __main__ - Step 44863: {'lr': 0.00019914372274261176, 'samples': 1435616, 'steps': 2803, 'loss/train': 2.61051869392395} -09/21/2021 00:12:19 - INFO - __main__ - Step 44864: {'lr': 0.00019914372274261176, 'samples': 1435648, 'steps': 2803, 'loss/train': 2.349917411804199} -09/21/2021 00:12:19 - INFO - __main__ - Step 44865: {'lr': 0.00019914288956171164, 'samples': 1435680, 'steps': 2804, 'loss/train': 2.4950106143951416} -09/21/2021 00:12:20 - INFO - __main__ - Step 44866: {'lr': 0.00019914288956171164, 'samples': 1435712, 'steps': 2804, 'loss/train': 1.96153724193573} -09/21/2021 00:12:21 - INFO - __main__ - Step 44867: {'lr': 0.00019914288956171164, 'samples': 1435744, 'steps': 2804, 'loss/train': 1.8923958539962769} -09/21/2021 00:12:22 - INFO - __main__ - Step 44868: {'lr': 0.00019914288956171164, 'samples': 1435776, 'steps': 2804, 'loss/train': 2.779123306274414} -09/21/2021 00:12:22 - INFO - __main__ - Step 44869: {'lr': 0.00019914288956171164, 'samples': 1435808, 'steps': 2804, 'loss/train': 2.6924309730529785} -09/21/2021 00:12:23 - INFO - __main__ - Step 44870: {'lr': 0.00019914288956171164, 'samples': 1435840, 'steps': 2804, 'loss/train': 2.095358371734619} -09/21/2021 00:12:24 - INFO - __main__ - Step 44871: {'lr': 0.00019914288956171164, 'samples': 1435872, 'steps': 2804, 'loss/train': 3.400376081466675} -09/21/2021 00:12:25 - INFO - __main__ - Step 44872: {'lr': 0.00019914288956171164, 'samples': 1435904, 'steps': 2804, 'loss/train': 1.8496170043945312} -09/21/2021 00:12:25 - INFO - __main__ - Step 44873: {'lr': 0.00019914288956171164, 'samples': 1435936, 'steps': 2804, 'loss/train': 0.27940309047698975} -09/21/2021 00:12:26 - INFO - __main__ - Step 44874: {'lr': 0.00019914288956171164, 'samples': 1435968, 'steps': 2804, 'loss/train': 1.9527549743652344} -09/21/2021 00:12:27 - INFO - __main__ - Step 44875: {'lr': 0.00019914288956171164, 'samples': 1436000, 'steps': 2804, 'loss/train': 1.9092603921890259} -09/21/2021 00:12:28 - INFO - __main__ - Step 44876: {'lr': 0.00019914288956171164, 'samples': 1436032, 'steps': 2804, 'loss/train': 2.292539358139038} -09/21/2021 00:12:29 - INFO - __main__ - Step 44877: {'lr': 0.00019914288956171164, 'samples': 1436064, 'steps': 2804, 'loss/train': 2.7616562843322754} -09/21/2021 00:12:30 - INFO - __main__ - Step 44878: {'lr': 0.00019914288956171164, 'samples': 1436096, 'steps': 2804, 'loss/train': 2.061077117919922} -09/21/2021 00:12:31 - INFO - __main__ - Step 44879: {'lr': 0.00019914288956171164, 'samples': 1436128, 'steps': 2804, 'loss/train': 2.073805093765259} -09/21/2021 00:12:31 - INFO - __main__ - Step 44880: {'lr': 0.00019914288956171164, 'samples': 1436160, 'steps': 2804, 'loss/train': 2.209139823913574} -09/21/2021 00:12:32 - INFO - __main__ - Step 44881: {'lr': 0.00019914205597739953, 'samples': 1436192, 'steps': 2805, 'loss/train': 2.472665309906006} -09/21/2021 00:12:33 - INFO - __main__ - Step 44882: {'lr': 0.00019914205597739953, 'samples': 1436224, 'steps': 2805, 'loss/train': 1.9953134059906006} -09/21/2021 00:12:34 - INFO - __main__ - Step 44883: {'lr': 0.00019914205597739953, 'samples': 1436256, 'steps': 2805, 'loss/train': 2.716087818145752} -09/21/2021 00:12:35 - INFO - __main__ - Step 44884: {'lr': 0.00019914205597739953, 'samples': 1436288, 'steps': 2805, 'loss/train': 2.2479608058929443} -09/21/2021 00:12:35 - INFO - __main__ - Step 44885: {'lr': 0.00019914205597739953, 'samples': 1436320, 'steps': 2805, 'loss/train': 2.5834529399871826} -09/21/2021 00:12:36 - INFO - __main__ - Step 44886: {'lr': 0.00019914205597739953, 'samples': 1436352, 'steps': 2805, 'loss/train': 2.336667776107788} -09/21/2021 00:12:37 - INFO - __main__ - Step 44887: {'lr': 0.00019914205597739953, 'samples': 1436384, 'steps': 2805, 'loss/train': 1.519195556640625} -09/21/2021 00:12:38 - INFO - __main__ - Step 44888: {'lr': 0.00019914205597739953, 'samples': 1436416, 'steps': 2805, 'loss/train': 2.152135133743286} -09/21/2021 00:12:38 - INFO - __main__ - Step 44889: {'lr': 0.00019914205597739953, 'samples': 1436448, 'steps': 2805, 'loss/train': 2.1548752784729004} -09/21/2021 00:12:39 - INFO - __main__ - Step 44890: {'lr': 0.00019914205597739953, 'samples': 1436480, 'steps': 2805, 'loss/train': 1.6578998565673828} -09/21/2021 00:12:40 - INFO - __main__ - Step 44891: {'lr': 0.00019914205597739953, 'samples': 1436512, 'steps': 2805, 'loss/train': 2.4421746730804443} -09/21/2021 00:12:41 - INFO - __main__ - Step 44892: {'lr': 0.00019914205597739953, 'samples': 1436544, 'steps': 2805, 'loss/train': 2.467034101486206} -09/21/2021 00:12:41 - INFO - __main__ - Step 44893: {'lr': 0.00019914205597739953, 'samples': 1436576, 'steps': 2805, 'loss/train': 2.432682752609253} -09/21/2021 00:12:42 - INFO - __main__ - Step 44894: {'lr': 0.00019914205597739953, 'samples': 1436608, 'steps': 2805, 'loss/train': 1.6738111972808838} -09/21/2021 00:12:43 - INFO - __main__ - Step 44895: {'lr': 0.00019914205597739953, 'samples': 1436640, 'steps': 2805, 'loss/train': 2.2171359062194824} -09/21/2021 00:12:44 - INFO - __main__ - Step 44896: {'lr': 0.00019914205597739953, 'samples': 1436672, 'steps': 2805, 'loss/train': 1.9244587421417236} -09/21/2021 00:12:45 - INFO - __main__ - Step 44897: {'lr': 0.00019914122198967874, 'samples': 1436704, 'steps': 2806, 'loss/train': 2.484175443649292} -09/21/2021 00:12:45 - INFO - __main__ - Step 44898: {'lr': 0.00019914122198967874, 'samples': 1436736, 'steps': 2806, 'loss/train': 2.0481655597686768} -09/21/2021 00:12:46 - INFO - __main__ - Step 44899: {'lr': 0.00019914122198967874, 'samples': 1436768, 'steps': 2806, 'loss/train': 1.7321317195892334} -09/21/2021 00:12:47 - INFO - __main__ - Step 44900: {'lr': 0.00019914122198967874, 'samples': 1436800, 'steps': 2806, 'loss/train': 1.6888034343719482} -09/21/2021 00:12:48 - INFO - __main__ - Step 44901: {'lr': 0.00019914122198967874, 'samples': 1436832, 'steps': 2806, 'loss/train': 1.4864952564239502} -09/21/2021 00:12:48 - INFO - __main__ - Step 44902: {'lr': 0.00019914122198967874, 'samples': 1436864, 'steps': 2806, 'loss/train': 1.932857632637024} -09/21/2021 00:12:49 - INFO - __main__ - Step 44903: {'lr': 0.00019914122198967874, 'samples': 1436896, 'steps': 2806, 'loss/train': 1.973341703414917} -09/21/2021 00:12:50 - INFO - __main__ - Step 44904: {'lr': 0.00019914122198967874, 'samples': 1436928, 'steps': 2806, 'loss/train': 1.8448415994644165} -09/21/2021 00:12:50 - INFO - __main__ - Step 44905: {'lr': 0.00019914122198967874, 'samples': 1436960, 'steps': 2806, 'loss/train': 1.5610910654067993} -09/21/2021 00:12:51 - INFO - __main__ - Step 44906: {'lr': 0.00019914122198967874, 'samples': 1436992, 'steps': 2806, 'loss/train': 1.722561240196228} -09/21/2021 00:12:52 - INFO - __main__ - Step 44907: {'lr': 0.00019914122198967874, 'samples': 1437024, 'steps': 2806, 'loss/train': 2.594757318496704} -09/21/2021 00:12:54 - INFO - __main__ - Step 44908: {'lr': 0.00019914122198967874, 'samples': 1437056, 'steps': 2806, 'loss/train': 1.115877628326416} -09/21/2021 00:12:54 - INFO - __main__ - Step 44909: {'lr': 0.00019914122198967874, 'samples': 1437088, 'steps': 2806, 'loss/train': 1.8234550952911377} -09/21/2021 00:12:55 - INFO - __main__ - Step 44910: {'lr': 0.00019914122198967874, 'samples': 1437120, 'steps': 2806, 'loss/train': 1.5891822576522827} -09/21/2021 00:12:56 - INFO - __main__ - Step 44911: {'lr': 0.00019914122198967874, 'samples': 1437152, 'steps': 2806, 'loss/train': 5.863142967224121} -09/21/2021 00:12:57 - INFO - __main__ - Step 44912: {'lr': 0.00019914122198967874, 'samples': 1437184, 'steps': 2806, 'loss/train': 5.7043256759643555} -09/21/2021 00:12:57 - INFO - __main__ - Step 44913: {'lr': 0.0001991403875985527, 'samples': 1437216, 'steps': 2807, 'loss/train': 5.988603115081787} -09/21/2021 00:12:58 - INFO - __main__ - Step 44914: {'lr': 0.0001991403875985527, 'samples': 1437248, 'steps': 2807, 'loss/train': 6.083599090576172} -09/21/2021 00:12:59 - INFO - __main__ - Step 44915: {'lr': 0.0001991403875985527, 'samples': 1437280, 'steps': 2807, 'loss/train': 5.894504547119141} -09/21/2021 00:13:00 - INFO - __main__ - Step 44916: {'lr': 0.0001991403875985527, 'samples': 1437312, 'steps': 2807, 'loss/train': 5.886882305145264} -09/21/2021 00:13:00 - INFO - __main__ - Step 44917: {'lr': 0.0001991403875985527, 'samples': 1437344, 'steps': 2807, 'loss/train': 5.908447742462158} -09/21/2021 00:13:01 - INFO - __main__ - Step 44918: {'lr': 0.0001991403875985527, 'samples': 1437376, 'steps': 2807, 'loss/train': 5.670368671417236} -09/21/2021 00:13:02 - INFO - __main__ - Step 44919: {'lr': 0.0001991403875985527, 'samples': 1437408, 'steps': 2807, 'loss/train': 6.046610355377197} -09/21/2021 00:13:03 - INFO - __main__ - Step 44920: {'lr': 0.0001991403875985527, 'samples': 1437440, 'steps': 2807, 'loss/train': 5.810815811157227} -09/21/2021 00:13:03 - INFO - __main__ - Step 44921: {'lr': 0.0001991403875985527, 'samples': 1437472, 'steps': 2807, 'loss/train': 1.622979998588562} -09/21/2021 00:13:04 - INFO - __main__ - Step 44922: {'lr': 0.0001991403875985527, 'samples': 1437504, 'steps': 2807, 'loss/train': 1.9752150774002075} -09/21/2021 00:13:05 - INFO - __main__ - Step 44923: {'lr': 0.0001991403875985527, 'samples': 1437536, 'steps': 2807, 'loss/train': 0.6763580441474915} -09/21/2021 00:13:06 - INFO - __main__ - Step 44924: {'lr': 0.0001991403875985527, 'samples': 1437568, 'steps': 2807, 'loss/train': 0.8960887789726257} -09/21/2021 00:13:06 - INFO - __main__ - Step 44925: {'lr': 0.0001991403875985527, 'samples': 1437600, 'steps': 2807, 'loss/train': 2.0696911811828613} -09/21/2021 00:13:07 - INFO - __main__ - Step 44926: {'lr': 0.0001991403875985527, 'samples': 1437632, 'steps': 2807, 'loss/train': 2.231278657913208} -09/21/2021 00:13:08 - INFO - __main__ - Step 44927: {'lr': 0.0001991403875985527, 'samples': 1437664, 'steps': 2807, 'loss/train': 1.7144646644592285} -09/21/2021 00:13:09 - INFO - __main__ - Step 44928: {'lr': 0.0001991403875985527, 'samples': 1437696, 'steps': 2807, 'loss/train': 0.2359514981508255} -09/21/2021 00:13:10 - INFO - __main__ - Step 44929: {'lr': 0.00019913955280402484, 'samples': 1437728, 'steps': 2808, 'loss/train': 0.24526450037956238} -09/21/2021 00:13:10 - INFO - __main__ - Step 44930: {'lr': 0.00019913955280402484, 'samples': 1437760, 'steps': 2808, 'loss/train': 0.21673829853534698} -09/21/2021 00:13:11 - INFO - __main__ - Step 44931: {'lr': 0.00019913955280402484, 'samples': 1437792, 'steps': 2808, 'loss/train': 0.17737451195716858} -09/21/2021 00:13:12 - INFO - __main__ - Step 44932: {'lr': 0.00019913955280402484, 'samples': 1437824, 'steps': 2808, 'loss/train': 0.6962541937828064} -09/21/2021 00:13:13 - INFO - __main__ - Step 44933: {'lr': 0.00019913955280402484, 'samples': 1437856, 'steps': 2808, 'loss/train': 2.014359951019287} -09/21/2021 00:13:13 - INFO - __main__ - Step 44934: {'lr': 0.00019913955280402484, 'samples': 1437888, 'steps': 2808, 'loss/train': 2.150193691253662} -09/21/2021 00:13:14 - INFO - __main__ - Step 44935: {'lr': 0.00019913955280402484, 'samples': 1437920, 'steps': 2808, 'loss/train': 2.0740654468536377} -09/21/2021 00:13:15 - INFO - __main__ - Step 44936: {'lr': 0.00019913955280402484, 'samples': 1437952, 'steps': 2808, 'loss/train': 0.37991058826446533} -09/21/2021 00:13:16 - INFO - __main__ - Step 44937: {'lr': 0.00019913955280402484, 'samples': 1437984, 'steps': 2808, 'loss/train': 0.21663792431354523} -09/21/2021 00:13:16 - INFO - __main__ - Step 44938: {'lr': 0.00019913955280402484, 'samples': 1438016, 'steps': 2808, 'loss/train': 0.32469555735588074} -09/21/2021 00:13:17 - INFO - __main__ - Step 44939: {'lr': 0.00019913955280402484, 'samples': 1438048, 'steps': 2808, 'loss/train': 1.3627276420593262} -09/21/2021 00:13:18 - INFO - __main__ - Step 44940: {'lr': 0.00019913955280402484, 'samples': 1438080, 'steps': 2808, 'loss/train': 2.4679675102233887} -09/21/2021 00:13:19 - INFO - __main__ - Step 44941: {'lr': 0.00019913955280402484, 'samples': 1438112, 'steps': 2808, 'loss/train': 4.083931922912598} -09/21/2021 00:13:19 - INFO - __main__ - Step 44942: {'lr': 0.00019913955280402484, 'samples': 1438144, 'steps': 2808, 'loss/train': 1.2608797550201416} -09/21/2021 00:13:20 - INFO - __main__ - Step 44943: {'lr': 0.00019913955280402484, 'samples': 1438176, 'steps': 2808, 'loss/train': 2.387568950653076} -09/21/2021 00:13:21 - INFO - __main__ - Step 44944: {'lr': 0.00019913955280402484, 'samples': 1438208, 'steps': 2808, 'loss/train': 2.377673387527466} -09/21/2021 00:13:22 - INFO - __main__ - Step 44945: {'lr': 0.00019913871760609848, 'samples': 1438240, 'steps': 2809, 'loss/train': 2.3651905059814453} -09/21/2021 00:13:23 - INFO - __main__ - Step 44946: {'lr': 0.00019913871760609848, 'samples': 1438272, 'steps': 2809, 'loss/train': 1.2471399307250977} -09/21/2021 00:13:24 - INFO - __main__ - Step 44947: {'lr': 0.00019913871760609848, 'samples': 1438304, 'steps': 2809, 'loss/train': 3.3653604984283447} -09/21/2021 00:13:25 - INFO - __main__ - Step 44948: {'lr': 0.00019913871760609848, 'samples': 1438336, 'steps': 2809, 'loss/train': 2.767578601837158} -09/21/2021 00:13:25 - INFO - __main__ - Step 44949: {'lr': 0.00019913871760609848, 'samples': 1438368, 'steps': 2809, 'loss/train': 2.23249888420105} -09/21/2021 00:13:26 - INFO - __main__ - Step 44950: {'lr': 0.00019913871760609848, 'samples': 1438400, 'steps': 2809, 'loss/train': 2.7912213802337646} -09/21/2021 00:13:27 - INFO - __main__ - Step 44951: {'lr': 0.00019913871760609848, 'samples': 1438432, 'steps': 2809, 'loss/train': 1.949354887008667} -09/21/2021 00:13:28 - INFO - __main__ - Step 44952: {'lr': 0.00019913871760609848, 'samples': 1438464, 'steps': 2809, 'loss/train': 2.918226957321167} -09/21/2021 00:13:28 - INFO - __main__ - Step 44953: {'lr': 0.00019913871760609848, 'samples': 1438496, 'steps': 2809, 'loss/train': 1.7255629301071167} -09/21/2021 00:13:29 - INFO - __main__ - Step 44954: {'lr': 0.00019913871760609848, 'samples': 1438528, 'steps': 2809, 'loss/train': 2.2830240726470947} -09/21/2021 00:13:30 - INFO - __main__ - Step 44955: {'lr': 0.00019913871760609848, 'samples': 1438560, 'steps': 2809, 'loss/train': 2.43062686920166} -09/21/2021 00:13:31 - INFO - __main__ - Step 44956: {'lr': 0.00019913871760609848, 'samples': 1438592, 'steps': 2809, 'loss/train': 1.8654206991195679} -09/21/2021 00:13:31 - INFO - __main__ - Step 44957: {'lr': 0.00019913871760609848, 'samples': 1438624, 'steps': 2809, 'loss/train': 2.8275930881500244} -09/21/2021 00:13:32 - INFO - __main__ - Step 44958: {'lr': 0.00019913871760609848, 'samples': 1438656, 'steps': 2809, 'loss/train': 2.627122163772583} -09/21/2021 00:13:33 - INFO - __main__ - Step 44959: {'lr': 0.00019913871760609848, 'samples': 1438688, 'steps': 2809, 'loss/train': 1.7799861431121826} -09/21/2021 00:13:34 - INFO - __main__ - Step 44960: {'lr': 0.00019913871760609848, 'samples': 1438720, 'steps': 2809, 'loss/train': 2.324293851852417} -09/21/2021 00:13:34 - INFO - __main__ - Step 44961: {'lr': 0.00019913788200477708, 'samples': 1438752, 'steps': 2810, 'loss/train': 2.656846761703491} -09/21/2021 00:13:35 - INFO - __main__ - Step 44962: {'lr': 0.00019913788200477708, 'samples': 1438784, 'steps': 2810, 'loss/train': 0.46965160965919495} -09/21/2021 00:13:36 - INFO - __main__ - Step 44963: {'lr': 0.00019913788200477708, 'samples': 1438816, 'steps': 2810, 'loss/train': 2.1558218002319336} -09/21/2021 00:13:37 - INFO - __main__ - Step 44964: {'lr': 0.00019913788200477708, 'samples': 1438848, 'steps': 2810, 'loss/train': 2.4751360416412354} -09/21/2021 00:13:37 - INFO - __main__ - Step 44965: {'lr': 0.00019913788200477708, 'samples': 1438880, 'steps': 2810, 'loss/train': 1.7382699251174927} -09/21/2021 00:13:38 - INFO - __main__ - Step 44966: {'lr': 0.00019913788200477708, 'samples': 1438912, 'steps': 2810, 'loss/train': 2.4909377098083496} -09/21/2021 00:13:39 - INFO - __main__ - Step 44967: {'lr': 0.00019913788200477708, 'samples': 1438944, 'steps': 2810, 'loss/train': 1.3556275367736816} -09/21/2021 00:13:40 - INFO - __main__ - Step 44968: {'lr': 0.00019913788200477708, 'samples': 1438976, 'steps': 2810, 'loss/train': 2.1206600666046143} -09/21/2021 00:13:40 - INFO - __main__ - Step 44969: {'lr': 0.00019913788200477708, 'samples': 1439008, 'steps': 2810, 'loss/train': 1.1445579528808594} -09/21/2021 00:13:41 - INFO - __main__ - Step 44970: {'lr': 0.00019913788200477708, 'samples': 1439040, 'steps': 2810, 'loss/train': 1.6029380559921265} -09/21/2021 00:13:42 - INFO - __main__ - Step 44971: {'lr': 0.00019913788200477708, 'samples': 1439072, 'steps': 2810, 'loss/train': 1.8347605466842651} -09/21/2021 00:13:43 - INFO - __main__ - Step 44972: {'lr': 0.00019913788200477708, 'samples': 1439104, 'steps': 2810, 'loss/train': 1.327808141708374} -09/21/2021 00:13:43 - INFO - __main__ - Step 44973: {'lr': 0.00019913788200477708, 'samples': 1439136, 'steps': 2810, 'loss/train': 1.646288275718689} -09/21/2021 00:13:44 - INFO - __main__ - Step 44974: {'lr': 0.00019913788200477708, 'samples': 1439168, 'steps': 2810, 'loss/train': 2.966291904449463} -09/21/2021 00:13:45 - INFO - __main__ - Step 44975: {'lr': 0.00019913788200477708, 'samples': 1439200, 'steps': 2810, 'loss/train': 1.9209377765655518} -09/21/2021 00:13:46 - INFO - __main__ - Step 44976: {'lr': 0.00019913788200477708, 'samples': 1439232, 'steps': 2810, 'loss/train': 1.7528364658355713} -09/21/2021 00:13:47 - INFO - __main__ - Step 44977: {'lr': 0.00019913704600006403, 'samples': 1439264, 'steps': 2811, 'loss/train': 2.0518579483032227} -09/21/2021 00:13:48 - INFO - __main__ - Step 44978: {'lr': 0.00019913704600006403, 'samples': 1439296, 'steps': 2811, 'loss/train': 2.4973509311676025} -09/21/2021 00:13:49 - INFO - __main__ - Step 44979: {'lr': 0.00019913704600006403, 'samples': 1439328, 'steps': 2811, 'loss/train': 2.4076731204986572} -09/21/2021 00:13:49 - INFO - __main__ - Step 44980: {'lr': 0.00019913704600006403, 'samples': 1439360, 'steps': 2811, 'loss/train': 1.4614454507827759} -09/21/2021 00:13:50 - INFO - __main__ - Step 44981: {'lr': 0.00019913704600006403, 'samples': 1439392, 'steps': 2811, 'loss/train': 2.318131446838379} -09/21/2021 00:13:51 - INFO - __main__ - Step 44982: {'lr': 0.00019913704600006403, 'samples': 1439424, 'steps': 2811, 'loss/train': 1.9512784481048584} -09/21/2021 00:13:52 - INFO - __main__ - Step 44983: {'lr': 0.00019913704600006403, 'samples': 1439456, 'steps': 2811, 'loss/train': 1.7799043655395508} -09/21/2021 00:13:52 - INFO - __main__ - Step 44984: {'lr': 0.00019913704600006403, 'samples': 1439488, 'steps': 2811, 'loss/train': 1.7046904563903809} -09/21/2021 00:13:53 - INFO - __main__ - Step 44985: {'lr': 0.00019913704600006403, 'samples': 1439520, 'steps': 2811, 'loss/train': 2.73367977142334} -09/21/2021 00:13:54 - INFO - __main__ - Step 44986: {'lr': 0.00019913704600006403, 'samples': 1439552, 'steps': 2811, 'loss/train': 3.699796199798584} -09/21/2021 00:13:55 - INFO - __main__ - Step 44987: {'lr': 0.00019913704600006403, 'samples': 1439584, 'steps': 2811, 'loss/train': 1.7778215408325195} -09/21/2021 00:13:55 - INFO - __main__ - Step 44988: {'lr': 0.00019913704600006403, 'samples': 1439616, 'steps': 2811, 'loss/train': 1.476021647453308} -09/21/2021 00:13:56 - INFO - __main__ - Step 44989: {'lr': 0.00019913704600006403, 'samples': 1439648, 'steps': 2811, 'loss/train': 1.5343046188354492} -09/21/2021 00:13:57 - INFO - __main__ - Step 44990: {'lr': 0.00019913704600006403, 'samples': 1439680, 'steps': 2811, 'loss/train': 2.4582619667053223} -09/21/2021 00:13:58 - INFO - __main__ - Step 44991: {'lr': 0.00019913704600006403, 'samples': 1439712, 'steps': 2811, 'loss/train': 2.812753915786743} -09/21/2021 00:13:58 - INFO - __main__ - Step 44992: {'lr': 0.00019913704600006403, 'samples': 1439744, 'steps': 2811, 'loss/train': 2.6103572845458984} -09/21/2021 00:13:59 - INFO - __main__ - Step 44993: {'lr': 0.00019913620959196272, 'samples': 1439776, 'steps': 2812, 'loss/train': 1.9809495210647583} -09/21/2021 00:14:00 - INFO - __main__ - Step 44994: {'lr': 0.00019913620959196272, 'samples': 1439808, 'steps': 2812, 'loss/train': 2.4587278366088867} -09/21/2021 00:14:01 - INFO - __main__ - Step 44995: {'lr': 0.00019913620959196272, 'samples': 1439840, 'steps': 2812, 'loss/train': 2.3429017066955566} -09/21/2021 00:14:01 - INFO - __main__ - Step 44996: {'lr': 0.00019913620959196272, 'samples': 1439872, 'steps': 2812, 'loss/train': 2.795560359954834} -09/21/2021 00:14:02 - INFO - __main__ - Step 44997: {'lr': 0.00019913620959196272, 'samples': 1439904, 'steps': 2812, 'loss/train': 1.851952075958252} -09/21/2021 00:14:03 - INFO - __main__ - Step 44998: {'lr': 0.00019913620959196272, 'samples': 1439936, 'steps': 2812, 'loss/train': 1.0913523435592651} -09/21/2021 00:14:04 - INFO - __main__ - Step 44999: {'lr': 0.00019913620959196272, 'samples': 1439968, 'steps': 2812, 'loss/train': 1.755674958229065} -09/21/2021 00:14:04 - INFO - __main__ - Step 45000: {'lr': 0.00019913620959196272, 'samples': 1440000, 'steps': 2812, 'loss/train': 1.5427954196929932} -09/21/2021 00:14:05 - INFO - __main__ - Step 45001: {'lr': 0.00019913620959196272, 'samples': 1440032, 'steps': 2812, 'loss/train': 0.4720998704433441} -09/21/2021 00:14:06 - INFO - __main__ - Step 45002: {'lr': 0.00019913620959196272, 'samples': 1440064, 'steps': 2812, 'loss/train': 1.9808119535446167} -09/21/2021 00:14:07 - INFO - __main__ - Step 45003: {'lr': 0.00019913620959196272, 'samples': 1440096, 'steps': 2812, 'loss/train': 2.5670251846313477} -09/21/2021 00:14:07 - INFO - __main__ - Step 45004: {'lr': 0.00019913620959196272, 'samples': 1440128, 'steps': 2812, 'loss/train': 2.1877758502960205} -09/21/2021 00:14:08 - INFO - __main__ - Step 45005: {'lr': 0.00019913620959196272, 'samples': 1440160, 'steps': 2812, 'loss/train': 1.2069084644317627} -09/21/2021 00:14:09 - INFO - __main__ - Step 45006: {'lr': 0.00019913620959196272, 'samples': 1440192, 'steps': 2812, 'loss/train': 2.5361440181732178} -09/21/2021 00:14:10 - INFO - __main__ - Step 45007: {'lr': 0.00019913620959196272, 'samples': 1440224, 'steps': 2812, 'loss/train': 1.8502014875411987} -09/21/2021 00:14:10 - INFO - __main__ - Step 45008: {'lr': 0.00019913620959196272, 'samples': 1440256, 'steps': 2812, 'loss/train': 2.693401336669922} -09/21/2021 00:14:12 - INFO - __main__ - Step 45009: {'lr': 0.00019913537278047657, 'samples': 1440288, 'steps': 2813, 'loss/train': 1.6316213607788086} -09/21/2021 00:14:13 - INFO - __main__ - Step 45010: {'lr': 0.00019913537278047657, 'samples': 1440320, 'steps': 2813, 'loss/train': 2.1253018379211426} -09/21/2021 00:14:13 - INFO - __main__ - Step 45011: {'lr': 0.00019913537278047657, 'samples': 1440352, 'steps': 2813, 'loss/train': 2.303387403488159} -09/21/2021 00:14:14 - INFO - __main__ - Step 45012: {'lr': 0.00019913537278047657, 'samples': 1440384, 'steps': 2813, 'loss/train': 2.358682155609131} -09/21/2021 00:14:15 - INFO - __main__ - Step 45013: {'lr': 0.00019913537278047657, 'samples': 1440416, 'steps': 2813, 'loss/train': 1.8539059162139893} -09/21/2021 00:14:16 - INFO - __main__ - Step 45014: {'lr': 0.00019913537278047657, 'samples': 1440448, 'steps': 2813, 'loss/train': 1.9200313091278076} -09/21/2021 00:14:16 - INFO - __main__ - Step 45015: {'lr': 0.00019913537278047657, 'samples': 1440480, 'steps': 2813, 'loss/train': 2.085122585296631} -09/21/2021 00:14:17 - INFO - __main__ - Step 45016: {'lr': 0.00019913537278047657, 'samples': 1440512, 'steps': 2813, 'loss/train': 1.9514933824539185} -09/21/2021 00:14:18 - INFO - __main__ - Step 45017: {'lr': 0.00019913537278047657, 'samples': 1440544, 'steps': 2813, 'loss/train': 2.115565061569214} -09/21/2021 00:14:19 - INFO - __main__ - Step 45018: {'lr': 0.00019913537278047657, 'samples': 1440576, 'steps': 2813, 'loss/train': 1.8362414836883545} -09/21/2021 00:14:19 - INFO - __main__ - Step 45019: {'lr': 0.00019913537278047657, 'samples': 1440608, 'steps': 2813, 'loss/train': 2.6044762134552} -09/21/2021 00:14:20 - INFO - __main__ - Step 45020: {'lr': 0.00019913537278047657, 'samples': 1440640, 'steps': 2813, 'loss/train': 1.6931573152542114} -09/21/2021 00:14:21 - INFO - __main__ - Step 45021: {'lr': 0.00019913537278047657, 'samples': 1440672, 'steps': 2813, 'loss/train': 2.7733888626098633} -09/21/2021 00:14:22 - INFO - __main__ - Step 45022: {'lr': 0.00019913537278047657, 'samples': 1440704, 'steps': 2813, 'loss/train': 1.9250470399856567} -09/21/2021 00:14:22 - INFO - __main__ - Step 45023: {'lr': 0.00019913537278047657, 'samples': 1440736, 'steps': 2813, 'loss/train': 2.3321940898895264} -09/21/2021 00:14:23 - INFO - __main__ - Step 45024: {'lr': 0.00019913537278047657, 'samples': 1440768, 'steps': 2813, 'loss/train': 2.103652000427246} -09/21/2021 00:14:24 - INFO - __main__ - Step 45025: {'lr': 0.00019913453556560896, 'samples': 1440800, 'steps': 2814, 'loss/train': 1.9121179580688477} -09/21/2021 00:14:25 - INFO - __main__ - Step 45026: {'lr': 0.00019913453556560896, 'samples': 1440832, 'steps': 2814, 'loss/train': 1.6409956216812134} -09/21/2021 00:14:26 - INFO - __main__ - Step 45027: {'lr': 0.00019913453556560896, 'samples': 1440864, 'steps': 2814, 'loss/train': 1.873260259628296} -09/21/2021 00:14:26 - INFO - __main__ - Step 45028: {'lr': 0.00019913453556560896, 'samples': 1440896, 'steps': 2814, 'loss/train': 2.0281119346618652} -09/21/2021 00:14:27 - INFO - __main__ - Step 45029: {'lr': 0.00019913453556560896, 'samples': 1440928, 'steps': 2814, 'loss/train': 1.0552834272384644} -09/21/2021 00:14:28 - INFO - __main__ - Step 45030: {'lr': 0.00019913453556560896, 'samples': 1440960, 'steps': 2814, 'loss/train': 1.8521132469177246} -09/21/2021 00:14:29 - INFO - __main__ - Step 45031: {'lr': 0.00019913453556560896, 'samples': 1440992, 'steps': 2814, 'loss/train': 2.1449785232543945} -09/21/2021 00:14:29 - INFO - __main__ - Step 45032: {'lr': 0.00019913453556560896, 'samples': 1441024, 'steps': 2814, 'loss/train': 2.1906120777130127} -09/21/2021 00:14:30 - INFO - __main__ - Step 45033: {'lr': 0.00019913453556560896, 'samples': 1441056, 'steps': 2814, 'loss/train': 2.3143317699432373} -09/21/2021 00:14:31 - INFO - __main__ - Step 45034: {'lr': 0.00019913453556560896, 'samples': 1441088, 'steps': 2814, 'loss/train': 2.1924057006835938} -09/21/2021 00:14:32 - INFO - __main__ - Step 45035: {'lr': 0.00019913453556560896, 'samples': 1441120, 'steps': 2814, 'loss/train': 0.577482283115387} -09/21/2021 00:14:32 - INFO - __main__ - Step 45036: {'lr': 0.00019913453556560896, 'samples': 1441152, 'steps': 2814, 'loss/train': 1.473923683166504} -09/21/2021 00:14:33 - INFO - __main__ - Step 45037: {'lr': 0.00019913453556560896, 'samples': 1441184, 'steps': 2814, 'loss/train': 1.757075548171997} -09/21/2021 00:14:34 - INFO - __main__ - Step 45038: {'lr': 0.00019913453556560896, 'samples': 1441216, 'steps': 2814, 'loss/train': 1.8012138605117798} -09/21/2021 00:14:35 - INFO - __main__ - Step 45039: {'lr': 0.00019913453556560896, 'samples': 1441248, 'steps': 2814, 'loss/train': 2.190415859222412} -09/21/2021 00:14:36 - INFO - __main__ - Step 45040: {'lr': 0.00019913453556560896, 'samples': 1441280, 'steps': 2814, 'loss/train': 1.6446864604949951} -09/21/2021 00:14:37 - INFO - __main__ - Step 45041: {'lr': 0.0001991336979473633, 'samples': 1441312, 'steps': 2815, 'loss/train': 1.5929182767868042} -09/21/2021 00:14:38 - INFO - __main__ - Step 45042: {'lr': 0.0001991336979473633, 'samples': 1441344, 'steps': 2815, 'loss/train': 1.8123235702514648} -09/21/2021 00:14:38 - INFO - __main__ - Step 45043: {'lr': 0.0001991336979473633, 'samples': 1441376, 'steps': 2815, 'loss/train': 2.208685874938965} -09/21/2021 00:14:39 - INFO - __main__ - Step 45044: {'lr': 0.0001991336979473633, 'samples': 1441408, 'steps': 2815, 'loss/train': 2.1722793579101562} -09/21/2021 00:14:40 - INFO - __main__ - Step 45045: {'lr': 0.0001991336979473633, 'samples': 1441440, 'steps': 2815, 'loss/train': 2.004690647125244} -09/21/2021 00:14:41 - INFO - __main__ - Step 45046: {'lr': 0.0001991336979473633, 'samples': 1441472, 'steps': 2815, 'loss/train': 2.359874725341797} -09/21/2021 00:14:41 - INFO - __main__ - Step 45047: {'lr': 0.0001991336979473633, 'samples': 1441504, 'steps': 2815, 'loss/train': 2.2960150241851807} -09/21/2021 00:14:42 - INFO - __main__ - Step 45048: {'lr': 0.0001991336979473633, 'samples': 1441536, 'steps': 2815, 'loss/train': 2.6154046058654785} -09/21/2021 00:14:43 - INFO - __main__ - Step 45049: {'lr': 0.0001991336979473633, 'samples': 1441568, 'steps': 2815, 'loss/train': 2.2612884044647217} -09/21/2021 00:14:44 - INFO - __main__ - Step 45050: {'lr': 0.0001991336979473633, 'samples': 1441600, 'steps': 2815, 'loss/train': 2.1896400451660156} -09/21/2021 00:14:44 - INFO - __main__ - Step 45051: {'lr': 0.0001991336979473633, 'samples': 1441632, 'steps': 2815, 'loss/train': 2.4343879222869873} -09/21/2021 00:14:45 - INFO - __main__ - Step 45052: {'lr': 0.0001991336979473633, 'samples': 1441664, 'steps': 2815, 'loss/train': 1.3177374601364136} -09/21/2021 00:14:46 - INFO - __main__ - Step 45053: {'lr': 0.0001991336979473633, 'samples': 1441696, 'steps': 2815, 'loss/train': 2.1540448665618896} -09/21/2021 00:14:47 - INFO - __main__ - Step 45054: {'lr': 0.0001991336979473633, 'samples': 1441728, 'steps': 2815, 'loss/train': 1.9928624629974365} -09/21/2021 00:14:47 - INFO - __main__ - Step 45055: {'lr': 0.0001991336979473633, 'samples': 1441760, 'steps': 2815, 'loss/train': 3.111238718032837} -09/21/2021 00:14:48 - INFO - __main__ - Step 45056: {'lr': 0.0001991336979473633, 'samples': 1441792, 'steps': 2815, 'loss/train': 3.1731297969818115} -09/21/2021 00:14:49 - INFO - __main__ - Step 45057: {'lr': 0.00019913285992574303, 'samples': 1441824, 'steps': 2816, 'loss/train': 2.8896162509918213} -09/21/2021 00:14:50 - INFO - __main__ - Step 45058: {'lr': 0.00019913285992574303, 'samples': 1441856, 'steps': 2816, 'loss/train': 2.2391834259033203} -09/21/2021 00:14:50 - INFO - __main__ - Step 45059: {'lr': 0.00019913285992574303, 'samples': 1441888, 'steps': 2816, 'loss/train': 1.2723922729492188} -09/21/2021 00:14:51 - INFO - __main__ - Step 45060: {'lr': 0.00019913285992574303, 'samples': 1441920, 'steps': 2816, 'loss/train': 1.8371198177337646} -09/21/2021 00:14:52 - INFO - __main__ - Step 45061: {'lr': 0.00019913285992574303, 'samples': 1441952, 'steps': 2816, 'loss/train': 1.2657500505447388} -09/21/2021 00:14:53 - INFO - __main__ - Step 45062: {'lr': 0.00019913285992574303, 'samples': 1441984, 'steps': 2816, 'loss/train': 1.7185635566711426} -09/21/2021 00:14:53 - INFO - __main__ - Step 45063: {'lr': 0.00019913285992574303, 'samples': 1442016, 'steps': 2816, 'loss/train': 2.25626802444458} -09/21/2021 00:14:54 - INFO - __main__ - Step 45064: {'lr': 0.00019913285992574303, 'samples': 1442048, 'steps': 2816, 'loss/train': 1.5956887006759644} -09/21/2021 00:14:55 - INFO - __main__ - Step 45065: {'lr': 0.00019913285992574303, 'samples': 1442080, 'steps': 2816, 'loss/train': 1.3186808824539185} -09/21/2021 00:14:56 - INFO - __main__ - Step 45066: {'lr': 0.00019913285992574303, 'samples': 1442112, 'steps': 2816, 'loss/train': 1.62303626537323} -09/21/2021 00:14:56 - INFO - __main__ - Step 45067: {'lr': 0.00019913285992574303, 'samples': 1442144, 'steps': 2816, 'loss/train': 1.2536112070083618} -09/21/2021 00:14:57 - INFO - __main__ - Step 45068: {'lr': 0.00019913285992574303, 'samples': 1442176, 'steps': 2816, 'loss/train': 1.4407918453216553} -09/21/2021 00:14:58 - INFO - __main__ - Step 45069: {'lr': 0.00019913285992574303, 'samples': 1442208, 'steps': 2816, 'loss/train': 2.451785087585449} -09/21/2021 00:14:59 - INFO - __main__ - Step 45070: {'lr': 0.00019913285992574303, 'samples': 1442240, 'steps': 2816, 'loss/train': 1.756044864654541} -09/21/2021 00:15:00 - INFO - __main__ - Step 45071: {'lr': 0.00019913285992574303, 'samples': 1442272, 'steps': 2816, 'loss/train': 0.649699866771698} -09/21/2021 00:15:01 - INFO - __main__ - Step 45072: {'lr': 0.00019913285992574303, 'samples': 1442304, 'steps': 2816, 'loss/train': 1.675694227218628} -09/21/2021 00:15:02 - INFO - __main__ - Step 45073: {'lr': 0.0001991320215007515, 'samples': 1442336, 'steps': 2817, 'loss/train': 2.1983542442321777} -09/21/2021 00:15:02 - INFO - __main__ - Step 45074: {'lr': 0.0001991320215007515, 'samples': 1442368, 'steps': 2817, 'loss/train': 2.774456024169922} -09/21/2021 00:15:03 - INFO - __main__ - Step 45075: {'lr': 0.0001991320215007515, 'samples': 1442400, 'steps': 2817, 'loss/train': 1.961239218711853} -09/21/2021 00:15:04 - INFO - __main__ - Step 45076: {'lr': 0.0001991320215007515, 'samples': 1442432, 'steps': 2817, 'loss/train': 1.726123332977295} -09/21/2021 00:15:05 - INFO - __main__ - Step 45077: {'lr': 0.0001991320215007515, 'samples': 1442464, 'steps': 2817, 'loss/train': 1.963210940361023} -09/21/2021 00:15:05 - INFO - __main__ - Step 45078: {'lr': 0.0001991320215007515, 'samples': 1442496, 'steps': 2817, 'loss/train': 1.854155421257019} -09/21/2021 00:15:06 - INFO - __main__ - Step 45079: {'lr': 0.0001991320215007515, 'samples': 1442528, 'steps': 2817, 'loss/train': 1.3795866966247559} -09/21/2021 00:15:07 - INFO - __main__ - Step 45080: {'lr': 0.0001991320215007515, 'samples': 1442560, 'steps': 2817, 'loss/train': 1.860209584236145} -09/21/2021 00:15:08 - INFO - __main__ - Step 45081: {'lr': 0.0001991320215007515, 'samples': 1442592, 'steps': 2817, 'loss/train': 2.261590003967285} -09/21/2021 00:15:08 - INFO - __main__ - Step 45082: {'lr': 0.0001991320215007515, 'samples': 1442624, 'steps': 2817, 'loss/train': 1.7358150482177734} -09/21/2021 00:15:09 - INFO - __main__ - Step 45083: {'lr': 0.0001991320215007515, 'samples': 1442656, 'steps': 2817, 'loss/train': 2.2366061210632324} -09/21/2021 00:15:10 - INFO - __main__ - Step 45084: {'lr': 0.0001991320215007515, 'samples': 1442688, 'steps': 2817, 'loss/train': 2.052696466445923} -09/21/2021 00:15:11 - INFO - __main__ - Step 45085: {'lr': 0.0001991320215007515, 'samples': 1442720, 'steps': 2817, 'loss/train': 1.1892753839492798} -09/21/2021 00:15:11 - INFO - __main__ - Step 45086: {'lr': 0.0001991320215007515, 'samples': 1442752, 'steps': 2817, 'loss/train': 2.273930549621582} -09/21/2021 00:15:12 - INFO - __main__ - Step 45087: {'lr': 0.0001991320215007515, 'samples': 1442784, 'steps': 2817, 'loss/train': 2.156378746032715} -09/21/2021 00:15:13 - INFO - __main__ - Step 45088: {'lr': 0.0001991320215007515, 'samples': 1442816, 'steps': 2817, 'loss/train': 1.6617238521575928} -09/21/2021 00:15:14 - INFO - __main__ - Step 45089: {'lr': 0.0001991311826723922, 'samples': 1442848, 'steps': 2818, 'loss/train': 2.323960065841675} -09/21/2021 00:15:15 - INFO - __main__ - Step 45090: {'lr': 0.0001991311826723922, 'samples': 1442880, 'steps': 2818, 'loss/train': 3.653719425201416} -09/21/2021 00:15:15 - INFO - __main__ - Step 45091: {'lr': 0.0001991311826723922, 'samples': 1442912, 'steps': 2818, 'loss/train': 1.9960912466049194} -09/21/2021 00:15:16 - INFO - __main__ - Step 45092: {'lr': 0.0001991311826723922, 'samples': 1442944, 'steps': 2818, 'loss/train': 2.47495436668396} -09/21/2021 00:15:17 - INFO - __main__ - Step 45093: {'lr': 0.0001991311826723922, 'samples': 1442976, 'steps': 2818, 'loss/train': 1.9100192785263062} -09/21/2021 00:15:18 - INFO - __main__ - Step 45094: {'lr': 0.0001991311826723922, 'samples': 1443008, 'steps': 2818, 'loss/train': 2.875297784805298} -09/21/2021 00:15:18 - INFO - __main__ - Step 45095: {'lr': 0.0001991311826723922, 'samples': 1443040, 'steps': 2818, 'loss/train': 1.6498056650161743} -09/21/2021 00:15:19 - INFO - __main__ - Step 45096: {'lr': 0.0001991311826723922, 'samples': 1443072, 'steps': 2818, 'loss/train': 2.3211331367492676} -09/21/2021 00:15:20 - INFO - __main__ - Step 45097: {'lr': 0.0001991311826723922, 'samples': 1443104, 'steps': 2818, 'loss/train': 1.7488447427749634} -09/21/2021 00:15:21 - INFO - __main__ - Step 45098: {'lr': 0.0001991311826723922, 'samples': 1443136, 'steps': 2818, 'loss/train': 2.494987726211548} -09/21/2021 00:15:21 - INFO - __main__ - Step 45099: {'lr': 0.0001991311826723922, 'samples': 1443168, 'steps': 2818, 'loss/train': 1.6176968812942505} -09/21/2021 00:15:22 - INFO - __main__ - Step 45100: {'lr': 0.0001991311826723922, 'samples': 1443200, 'steps': 2818, 'loss/train': 2.284055709838867} -09/21/2021 00:15:23 - INFO - __main__ - Step 45101: {'lr': 0.0001991311826723922, 'samples': 1443232, 'steps': 2818, 'loss/train': 2.4780654907226562} -09/21/2021 00:15:24 - INFO - __main__ - Step 45102: {'lr': 0.0001991311826723922, 'samples': 1443264, 'steps': 2818, 'loss/train': 2.3977012634277344} -09/21/2021 00:15:25 - INFO - __main__ - Step 45103: {'lr': 0.0001991311826723922, 'samples': 1443296, 'steps': 2818, 'loss/train': 1.744389295578003} -09/21/2021 00:15:26 - INFO - __main__ - Step 45104: {'lr': 0.0001991311826723922, 'samples': 1443328, 'steps': 2818, 'loss/train': 2.3038880825042725} -09/21/2021 00:15:26 - INFO - __main__ - Step 45105: {'lr': 0.00019913034344066848, 'samples': 1443360, 'steps': 2819, 'loss/train': 1.7591021060943604} -09/21/2021 00:15:27 - INFO - __main__ - Step 45106: {'lr': 0.00019913034344066848, 'samples': 1443392, 'steps': 2819, 'loss/train': 2.185537338256836} -09/21/2021 00:15:28 - INFO - __main__ - Step 45107: {'lr': 0.00019913034344066848, 'samples': 1443424, 'steps': 2819, 'loss/train': 1.9353399276733398} -09/21/2021 00:15:29 - INFO - __main__ - Step 45108: {'lr': 0.00019913034344066848, 'samples': 1443456, 'steps': 2819, 'loss/train': 1.3056987524032593} -09/21/2021 00:15:29 - INFO - __main__ - Step 45109: {'lr': 0.00019913034344066848, 'samples': 1443488, 'steps': 2819, 'loss/train': 1.8531748056411743} -09/21/2021 00:15:30 - INFO - __main__ - Step 45110: {'lr': 0.00019913034344066848, 'samples': 1443520, 'steps': 2819, 'loss/train': 1.8918930292129517} -09/21/2021 00:15:31 - INFO - __main__ - Step 45111: {'lr': 0.00019913034344066848, 'samples': 1443552, 'steps': 2819, 'loss/train': 2.494136333465576} -09/21/2021 00:15:32 - INFO - __main__ - Step 45112: {'lr': 0.00019913034344066848, 'samples': 1443584, 'steps': 2819, 'loss/train': 1.928024411201477} -09/21/2021 00:15:32 - INFO - __main__ - Step 45113: {'lr': 0.00019913034344066848, 'samples': 1443616, 'steps': 2819, 'loss/train': 1.9633086919784546} -09/21/2021 00:15:33 - INFO - __main__ - Step 45114: {'lr': 0.00019913034344066848, 'samples': 1443648, 'steps': 2819, 'loss/train': 2.180565595626831} -09/21/2021 00:15:34 - INFO - __main__ - Step 45115: {'lr': 0.00019913034344066848, 'samples': 1443680, 'steps': 2819, 'loss/train': 2.084555149078369} -09/21/2021 00:15:35 - INFO - __main__ - Step 45116: {'lr': 0.00019913034344066848, 'samples': 1443712, 'steps': 2819, 'loss/train': 1.7759531736373901} -09/21/2021 00:15:35 - INFO - __main__ - Step 45117: {'lr': 0.00019913034344066848, 'samples': 1443744, 'steps': 2819, 'loss/train': 2.1279191970825195} -09/21/2021 00:15:36 - INFO - __main__ - Step 45118: {'lr': 0.00019913034344066848, 'samples': 1443776, 'steps': 2819, 'loss/train': 2.0770273208618164} -09/21/2021 00:15:37 - INFO - __main__ - Step 45119: {'lr': 0.00019913034344066848, 'samples': 1443808, 'steps': 2819, 'loss/train': 2.394104242324829} -09/21/2021 00:15:38 - INFO - __main__ - Step 45120: {'lr': 0.00019913034344066848, 'samples': 1443840, 'steps': 2819, 'loss/train': 2.637423276901245} -09/21/2021 00:15:39 - INFO - __main__ - Step 45121: {'lr': 0.00019912950380558377, 'samples': 1443872, 'steps': 2820, 'loss/train': 2.1638810634613037} -09/21/2021 00:15:39 - INFO - __main__ - Step 45122: {'lr': 0.00019912950380558377, 'samples': 1443904, 'steps': 2820, 'loss/train': 2.2796685695648193} -09/21/2021 00:15:40 - INFO - __main__ - Step 45123: {'lr': 0.00019912950380558377, 'samples': 1443936, 'steps': 2820, 'loss/train': 2.154810905456543} -09/21/2021 00:15:41 - INFO - __main__ - Step 45124: {'lr': 0.00019912950380558377, 'samples': 1443968, 'steps': 2820, 'loss/train': 2.061847686767578} -09/21/2021 00:15:42 - INFO - __main__ - Step 45125: {'lr': 0.00019912950380558377, 'samples': 1444000, 'steps': 2820, 'loss/train': 1.5825064182281494} -09/21/2021 00:15:42 - INFO - __main__ - Step 45126: {'lr': 0.00019912950380558377, 'samples': 1444032, 'steps': 2820, 'loss/train': 1.739296793937683} -09/21/2021 00:15:43 - INFO - __main__ - Step 45127: {'lr': 0.00019912950380558377, 'samples': 1444064, 'steps': 2820, 'loss/train': 2.956836462020874} -09/21/2021 00:15:44 - INFO - __main__ - Step 45128: {'lr': 0.00019912950380558377, 'samples': 1444096, 'steps': 2820, 'loss/train': 2.9068353176116943} -09/21/2021 00:15:45 - INFO - __main__ - Step 45129: {'lr': 0.00019912950380558377, 'samples': 1444128, 'steps': 2820, 'loss/train': 1.8275463581085205} -09/21/2021 00:15:45 - INFO - __main__ - Step 45130: {'lr': 0.00019912950380558377, 'samples': 1444160, 'steps': 2820, 'loss/train': 2.8166074752807617} -09/21/2021 00:15:46 - INFO - __main__ - Step 45131: {'lr': 0.00019912950380558377, 'samples': 1444192, 'steps': 2820, 'loss/train': 1.9772261381149292} -09/21/2021 00:15:47 - INFO - __main__ - Step 45132: {'lr': 0.00019912950380558377, 'samples': 1444224, 'steps': 2820, 'loss/train': 1.7492743730545044} -09/21/2021 00:15:48 - INFO - __main__ - Step 45133: {'lr': 0.00019912950380558377, 'samples': 1444256, 'steps': 2820, 'loss/train': 1.9512155055999756} -09/21/2021 00:15:49 - INFO - __main__ - Step 45134: {'lr': 0.00019912950380558377, 'samples': 1444288, 'steps': 2820, 'loss/train': 2.379143714904785} -09/21/2021 00:15:50 - INFO - __main__ - Step 45135: {'lr': 0.00019912950380558377, 'samples': 1444320, 'steps': 2820, 'loss/train': 2.2299208641052246} -09/21/2021 00:15:50 - INFO - __main__ - Step 45136: {'lr': 0.00019912950380558377, 'samples': 1444352, 'steps': 2820, 'loss/train': 2.1404812335968018} -09/21/2021 00:15:51 - INFO - __main__ - Step 45137: {'lr': 0.00019912866376714153, 'samples': 1444384, 'steps': 2821, 'loss/train': 2.0552124977111816} -09/21/2021 00:15:52 - INFO - __main__ - Step 45138: {'lr': 0.00019912866376714153, 'samples': 1444416, 'steps': 2821, 'loss/train': 2.043564796447754} -09/21/2021 00:15:53 - INFO - __main__ - Step 45139: {'lr': 0.00019912866376714153, 'samples': 1444448, 'steps': 2821, 'loss/train': 3.106405258178711} -09/21/2021 00:15:54 - INFO - __main__ - Step 45140: {'lr': 0.00019912866376714153, 'samples': 1444480, 'steps': 2821, 'loss/train': 1.8162540197372437} -09/21/2021 00:15:54 - INFO - __main__ - Step 45141: {'lr': 0.00019912866376714153, 'samples': 1444512, 'steps': 2821, 'loss/train': 2.269294261932373} -09/21/2021 00:15:55 - INFO - __main__ - Step 45142: {'lr': 0.00019912866376714153, 'samples': 1444544, 'steps': 2821, 'loss/train': 7.329026222229004} -09/21/2021 00:15:56 - INFO - __main__ - Step 45143: {'lr': 0.00019912866376714153, 'samples': 1444576, 'steps': 2821, 'loss/train': 1.9583848714828491} -09/21/2021 00:15:57 - INFO - __main__ - Step 45144: {'lr': 0.00019912866376714153, 'samples': 1444608, 'steps': 2821, 'loss/train': 1.7854115962982178} -09/21/2021 00:15:57 - INFO - __main__ - Step 45145: {'lr': 0.00019912866376714153, 'samples': 1444640, 'steps': 2821, 'loss/train': 1.3535374402999878} -09/21/2021 00:15:58 - INFO - __main__ - Step 45146: {'lr': 0.00019912866376714153, 'samples': 1444672, 'steps': 2821, 'loss/train': 2.2124252319335938} -09/21/2021 00:15:59 - INFO - __main__ - Step 45147: {'lr': 0.00019912866376714153, 'samples': 1444704, 'steps': 2821, 'loss/train': 1.6406410932540894} -09/21/2021 00:16:00 - INFO - __main__ - Step 45148: {'lr': 0.00019912866376714153, 'samples': 1444736, 'steps': 2821, 'loss/train': 2.076526165008545} -09/21/2021 00:16:00 - INFO - __main__ - Step 45149: {'lr': 0.00019912866376714153, 'samples': 1444768, 'steps': 2821, 'loss/train': 1.8947242498397827} -09/21/2021 00:16:01 - INFO - __main__ - Step 45150: {'lr': 0.00019912866376714153, 'samples': 1444800, 'steps': 2821, 'loss/train': 0.45395633578300476} -09/21/2021 00:16:02 - INFO - __main__ - Step 45151: {'lr': 0.00019912866376714153, 'samples': 1444832, 'steps': 2821, 'loss/train': 2.34505295753479} -09/21/2021 00:16:03 - INFO - __main__ - Step 45152: {'lr': 0.00019912866376714153, 'samples': 1444864, 'steps': 2821, 'loss/train': 1.6810970306396484} -09/21/2021 00:16:03 - INFO - __main__ - Step 45153: {'lr': 0.0001991278233253451, 'samples': 1444896, 'steps': 2822, 'loss/train': 1.410710096359253} -09/21/2021 00:16:04 - INFO - __main__ - Step 45154: {'lr': 0.0001991278233253451, 'samples': 1444928, 'steps': 2822, 'loss/train': 2.5298798084259033} -09/21/2021 00:16:05 - INFO - __main__ - Step 45155: {'lr': 0.0001991278233253451, 'samples': 1444960, 'steps': 2822, 'loss/train': 2.096215009689331} -09/21/2021 00:16:06 - INFO - __main__ - Step 45156: {'lr': 0.0001991278233253451, 'samples': 1444992, 'steps': 2822, 'loss/train': 2.259014368057251} -09/21/2021 00:16:06 - INFO - __main__ - Step 45157: {'lr': 0.0001991278233253451, 'samples': 1445024, 'steps': 2822, 'loss/train': 1.90095853805542} -09/21/2021 00:16:07 - INFO - __main__ - Step 45158: {'lr': 0.0001991278233253451, 'samples': 1445056, 'steps': 2822, 'loss/train': 2.4698522090911865} -09/21/2021 00:16:08 - INFO - __main__ - Step 45159: {'lr': 0.0001991278233253451, 'samples': 1445088, 'steps': 2822, 'loss/train': 0.9627260565757751} -09/21/2021 00:16:09 - INFO - __main__ - Step 45160: {'lr': 0.0001991278233253451, 'samples': 1445120, 'steps': 2822, 'loss/train': 1.4777765274047852} -09/21/2021 00:16:09 - INFO - __main__ - Step 45161: {'lr': 0.0001991278233253451, 'samples': 1445152, 'steps': 2822, 'loss/train': 1.8879499435424805} -09/21/2021 00:16:10 - INFO - __main__ - Step 45162: {'lr': 0.0001991278233253451, 'samples': 1445184, 'steps': 2822, 'loss/train': 1.638418436050415} -09/21/2021 00:16:12 - INFO - __main__ - Step 45163: {'lr': 0.0001991278233253451, 'samples': 1445216, 'steps': 2822, 'loss/train': 2.34848690032959} -09/21/2021 00:16:13 - INFO - __main__ - Step 45164: {'lr': 0.0001991278233253451, 'samples': 1445248, 'steps': 2822, 'loss/train': 2.139011859893799} -09/21/2021 00:16:13 - INFO - __main__ - Step 45165: {'lr': 0.0001991278233253451, 'samples': 1445280, 'steps': 2822, 'loss/train': 2.167985439300537} -09/21/2021 00:16:14 - INFO - __main__ - Step 45166: {'lr': 0.0001991278233253451, 'samples': 1445312, 'steps': 2822, 'loss/train': 1.3674203157424927} -09/21/2021 00:16:15 - INFO - __main__ - Step 45167: {'lr': 0.0001991278233253451, 'samples': 1445344, 'steps': 2822, 'loss/train': 1.3423480987548828} -09/21/2021 00:16:16 - INFO - __main__ - Step 45168: {'lr': 0.0001991278233253451, 'samples': 1445376, 'steps': 2822, 'loss/train': 1.640272855758667} -09/21/2021 00:16:16 - INFO - __main__ - Step 45169: {'lr': 0.00019912698248019796, 'samples': 1445408, 'steps': 2823, 'loss/train': 1.408091425895691} -09/21/2021 00:16:17 - INFO - __main__ - Step 45170: {'lr': 0.00019912698248019796, 'samples': 1445440, 'steps': 2823, 'loss/train': 1.4013104438781738} -09/21/2021 00:16:18 - INFO - __main__ - Step 45171: {'lr': 0.00019912698248019796, 'samples': 1445472, 'steps': 2823, 'loss/train': 2.209926128387451} -09/21/2021 00:16:19 - INFO - __main__ - Step 45172: {'lr': 0.00019912698248019796, 'samples': 1445504, 'steps': 2823, 'loss/train': 1.6259398460388184} -09/21/2021 00:16:19 - INFO - __main__ - Step 45173: {'lr': 0.00019912698248019796, 'samples': 1445536, 'steps': 2823, 'loss/train': 1.9629708528518677} -09/21/2021 00:16:20 - INFO - __main__ - Step 45174: {'lr': 0.00019912698248019796, 'samples': 1445568, 'steps': 2823, 'loss/train': 2.2744712829589844} -09/21/2021 00:16:21 - INFO - __main__ - Step 45175: {'lr': 0.00019912698248019796, 'samples': 1445600, 'steps': 2823, 'loss/train': 1.973178505897522} -09/21/2021 00:16:22 - INFO - __main__ - Step 45176: {'lr': 0.00019912698248019796, 'samples': 1445632, 'steps': 2823, 'loss/train': 2.6121034622192383} -09/21/2021 00:16:22 - INFO - __main__ - Step 45177: {'lr': 0.00019912698248019796, 'samples': 1445664, 'steps': 2823, 'loss/train': 1.4915779829025269} -09/21/2021 00:16:23 - INFO - __main__ - Step 45178: {'lr': 0.00019912698248019796, 'samples': 1445696, 'steps': 2823, 'loss/train': 0.638559877872467} -09/21/2021 00:16:24 - INFO - __main__ - Step 45179: {'lr': 0.00019912698248019796, 'samples': 1445728, 'steps': 2823, 'loss/train': 1.6417133808135986} -09/21/2021 00:16:25 - INFO - __main__ - Step 45180: {'lr': 0.00019912698248019796, 'samples': 1445760, 'steps': 2823, 'loss/train': 2.4940879344940186} -09/21/2021 00:16:25 - INFO - __main__ - Step 45181: {'lr': 0.00019912698248019796, 'samples': 1445792, 'steps': 2823, 'loss/train': 1.6268279552459717} -09/21/2021 00:16:26 - INFO - __main__ - Step 45182: {'lr': 0.00019912698248019796, 'samples': 1445824, 'steps': 2823, 'loss/train': 2.190793991088867} -09/21/2021 00:16:27 - INFO - __main__ - Step 45183: {'lr': 0.00019912698248019796, 'samples': 1445856, 'steps': 2823, 'loss/train': 0.6546878218650818} -09/21/2021 00:16:28 - INFO - __main__ - Step 45184: {'lr': 0.00019912698248019796, 'samples': 1445888, 'steps': 2823, 'loss/train': 1.6326860189437866} -09/21/2021 00:16:29 - INFO - __main__ - Step 45185: {'lr': 0.00019912614123170351, 'samples': 1445920, 'steps': 2824, 'loss/train': 2.334393262863159} -09/21/2021 00:16:29 - INFO - __main__ - Step 45186: {'lr': 0.00019912614123170351, 'samples': 1445952, 'steps': 2824, 'loss/train': 2.144660234451294} -09/21/2021 00:16:30 - INFO - __main__ - Step 45187: {'lr': 0.00019912614123170351, 'samples': 1445984, 'steps': 2824, 'loss/train': 2.5961050987243652} -09/21/2021 00:16:31 - INFO - __main__ - Step 45188: {'lr': 0.00019912614123170351, 'samples': 1446016, 'steps': 2824, 'loss/train': 2.4986588954925537} -09/21/2021 00:16:32 - INFO - __main__ - Step 45189: {'lr': 0.00019912614123170351, 'samples': 1446048, 'steps': 2824, 'loss/train': 1.83021879196167} -09/21/2021 00:16:32 - INFO - __main__ - Step 45190: {'lr': 0.00019912614123170351, 'samples': 1446080, 'steps': 2824, 'loss/train': 2.3928885459899902} -09/21/2021 00:16:33 - INFO - __main__ - Step 45191: {'lr': 0.00019912614123170351, 'samples': 1446112, 'steps': 2824, 'loss/train': 2.2482199668884277} -09/21/2021 00:16:34 - INFO - __main__ - Step 45192: {'lr': 0.00019912614123170351, 'samples': 1446144, 'steps': 2824, 'loss/train': 1.6694159507751465} -09/21/2021 00:16:35 - INFO - __main__ - Step 45193: {'lr': 0.00019912614123170351, 'samples': 1446176, 'steps': 2824, 'loss/train': 0.24006129801273346} -09/21/2021 00:16:35 - INFO - __main__ - Step 45194: {'lr': 0.00019912614123170351, 'samples': 1446208, 'steps': 2824, 'loss/train': 0.23624935746192932} -09/21/2021 00:16:37 - INFO - __main__ - Step 45195: {'lr': 0.00019912614123170351, 'samples': 1446240, 'steps': 2824, 'loss/train': 0.3043558597564697} -09/21/2021 00:16:38 - INFO - __main__ - Step 45196: {'lr': 0.00019912614123170351, 'samples': 1446272, 'steps': 2824, 'loss/train': 2.3488848209381104} -09/21/2021 00:16:39 - INFO - __main__ - Step 45197: {'lr': 0.00019912614123170351, 'samples': 1446304, 'steps': 2824, 'loss/train': 2.327192544937134} -09/21/2021 00:16:39 - INFO - __main__ - Step 45198: {'lr': 0.00019912614123170351, 'samples': 1446336, 'steps': 2824, 'loss/train': 1.6939268112182617} -09/21/2021 00:16:40 - INFO - __main__ - Step 45199: {'lr': 0.00019912614123170351, 'samples': 1446368, 'steps': 2824, 'loss/train': 2.997664213180542} -09/21/2021 00:16:41 - INFO - __main__ - Step 45200: {'lr': 0.00019912614123170351, 'samples': 1446400, 'steps': 2824, 'loss/train': 1.2938966751098633} -09/21/2021 00:16:42 - INFO - __main__ - Step 45201: {'lr': 0.00019912529957986518, 'samples': 1446432, 'steps': 2825, 'loss/train': 1.96767258644104} -09/21/2021 00:16:42 - INFO - __main__ - Step 45202: {'lr': 0.00019912529957986518, 'samples': 1446464, 'steps': 2825, 'loss/train': 0.20545722544193268} -09/21/2021 00:16:43 - INFO - __main__ - Step 45203: {'lr': 0.00019912529957986518, 'samples': 1446496, 'steps': 2825, 'loss/train': 0.18011482059955597} -09/21/2021 00:16:44 - INFO - __main__ - Step 45204: {'lr': 0.00019912529957986518, 'samples': 1446528, 'steps': 2825, 'loss/train': 1.513745665550232} -09/21/2021 00:16:45 - INFO - __main__ - Step 45205: {'lr': 0.00019912529957986518, 'samples': 1446560, 'steps': 2825, 'loss/train': 0.46364903450012207} -09/21/2021 00:16:45 - INFO - __main__ - Step 45206: {'lr': 0.00019912529957986518, 'samples': 1446592, 'steps': 2825, 'loss/train': 1.703273892402649} -09/21/2021 00:16:46 - INFO - __main__ - Step 45207: {'lr': 0.00019912529957986518, 'samples': 1446624, 'steps': 2825, 'loss/train': 1.6884061098098755} -09/21/2021 00:16:47 - INFO - __main__ - Step 45208: {'lr': 0.00019912529957986518, 'samples': 1446656, 'steps': 2825, 'loss/train': 1.6828888654708862} -09/21/2021 00:16:48 - INFO - __main__ - Step 45209: {'lr': 0.00019912529957986518, 'samples': 1446688, 'steps': 2825, 'loss/train': 2.8362977504730225} -09/21/2021 00:16:48 - INFO - __main__ - Step 45210: {'lr': 0.00019912529957986518, 'samples': 1446720, 'steps': 2825, 'loss/train': 2.1507229804992676} -09/21/2021 00:16:49 - INFO - __main__ - Step 45211: {'lr': 0.00019912529957986518, 'samples': 1446752, 'steps': 2825, 'loss/train': 1.0356898307800293} -09/21/2021 00:16:50 - INFO - __main__ - Step 45212: {'lr': 0.00019912529957986518, 'samples': 1446784, 'steps': 2825, 'loss/train': 2.1748464107513428} -09/21/2021 00:16:51 - INFO - __main__ - Step 45213: {'lr': 0.00019912529957986518, 'samples': 1446816, 'steps': 2825, 'loss/train': 2.2063164710998535} -09/21/2021 00:16:51 - INFO - __main__ - Step 45214: {'lr': 0.00019912529957986518, 'samples': 1446848, 'steps': 2825, 'loss/train': 1.7596937417984009} -09/21/2021 00:16:52 - INFO - __main__ - Step 45215: {'lr': 0.00019912529957986518, 'samples': 1446880, 'steps': 2825, 'loss/train': 1.5296893119812012} -09/21/2021 00:16:53 - INFO - __main__ - Step 45216: {'lr': 0.00019912529957986518, 'samples': 1446912, 'steps': 2825, 'loss/train': 3.1728227138519287} -09/21/2021 00:16:54 - INFO - __main__ - Step 45217: {'lr': 0.0001991244575246864, 'samples': 1446944, 'steps': 2826, 'loss/train': 2.1275203227996826} -09/21/2021 00:16:55 - INFO - __main__ - Step 45218: {'lr': 0.0001991244575246864, 'samples': 1446976, 'steps': 2826, 'loss/train': 3.130718231201172} -09/21/2021 00:16:55 - INFO - __main__ - Step 45219: {'lr': 0.0001991244575246864, 'samples': 1447008, 'steps': 2826, 'loss/train': 3.05749773979187} -09/21/2021 00:16:56 - INFO - __main__ - Step 45220: {'lr': 0.0001991244575246864, 'samples': 1447040, 'steps': 2826, 'loss/train': 1.8973661661148071} -09/21/2021 00:16:57 - INFO - __main__ - Step 45221: {'lr': 0.0001991244575246864, 'samples': 1447072, 'steps': 2826, 'loss/train': 1.8055713176727295} -09/21/2021 00:16:58 - INFO - __main__ - Step 45222: {'lr': 0.0001991244575246864, 'samples': 1447104, 'steps': 2826, 'loss/train': 2.1694867610931396} -09/21/2021 00:16:58 - INFO - __main__ - Step 45223: {'lr': 0.0001991244575246864, 'samples': 1447136, 'steps': 2826, 'loss/train': 1.9136039018630981} -09/21/2021 00:16:59 - INFO - __main__ - Step 45224: {'lr': 0.0001991244575246864, 'samples': 1447168, 'steps': 2826, 'loss/train': 1.5931689739227295} -09/21/2021 00:17:00 - INFO - __main__ - Step 45225: {'lr': 0.0001991244575246864, 'samples': 1447200, 'steps': 2826, 'loss/train': 2.352642774581909} -09/21/2021 00:17:01 - INFO - __main__ - Step 45226: {'lr': 0.0001991244575246864, 'samples': 1447232, 'steps': 2826, 'loss/train': 2.0534932613372803} -09/21/2021 00:17:02 - INFO - __main__ - Step 45227: {'lr': 0.0001991244575246864, 'samples': 1447264, 'steps': 2826, 'loss/train': 2.2719950675964355} -09/21/2021 00:17:03 - INFO - __main__ - Step 45228: {'lr': 0.0001991244575246864, 'samples': 1447296, 'steps': 2826, 'loss/train': 2.2872021198272705} -09/21/2021 00:17:03 - INFO - __main__ - Step 45229: {'lr': 0.0001991244575246864, 'samples': 1447328, 'steps': 2826, 'loss/train': 1.97373366355896} -09/21/2021 00:17:04 - INFO - __main__ - Step 45230: {'lr': 0.0001991244575246864, 'samples': 1447360, 'steps': 2826, 'loss/train': 3.1402931213378906} -09/21/2021 00:17:05 - INFO - __main__ - Step 45231: {'lr': 0.0001991244575246864, 'samples': 1447392, 'steps': 2826, 'loss/train': 1.2042003870010376} -09/21/2021 00:17:06 - INFO - __main__ - Step 45232: {'lr': 0.0001991244575246864, 'samples': 1447424, 'steps': 2826, 'loss/train': 2.333976984024048} -09/21/2021 00:17:07 - INFO - __main__ - Step 45233: {'lr': 0.0001991236150661706, 'samples': 1447456, 'steps': 2827, 'loss/train': 2.464700937271118} -09/21/2021 00:17:07 - INFO - __main__ - Step 45234: {'lr': 0.0001991236150661706, 'samples': 1447488, 'steps': 2827, 'loss/train': 1.7749401330947876} -09/21/2021 00:17:08 - INFO - __main__ - Step 45235: {'lr': 0.0001991236150661706, 'samples': 1447520, 'steps': 2827, 'loss/train': 1.150948166847229} -09/21/2021 00:17:09 - INFO - __main__ - Step 45236: {'lr': 0.0001991236150661706, 'samples': 1447552, 'steps': 2827, 'loss/train': 2.211430788040161} -09/21/2021 00:17:10 - INFO - __main__ - Step 45237: {'lr': 0.0001991236150661706, 'samples': 1447584, 'steps': 2827, 'loss/train': 2.4113214015960693} -09/21/2021 00:17:10 - INFO - __main__ - Step 45238: {'lr': 0.0001991236150661706, 'samples': 1447616, 'steps': 2827, 'loss/train': 1.7607309818267822} -09/21/2021 00:17:11 - INFO - __main__ - Step 45239: {'lr': 0.0001991236150661706, 'samples': 1447648, 'steps': 2827, 'loss/train': 0.4603959918022156} -09/21/2021 00:17:12 - INFO - __main__ - Step 45240: {'lr': 0.0001991236150661706, 'samples': 1447680, 'steps': 2827, 'loss/train': 1.9805442094802856} -09/21/2021 00:17:13 - INFO - __main__ - Step 45241: {'lr': 0.0001991236150661706, 'samples': 1447712, 'steps': 2827, 'loss/train': 1.6656304597854614} -09/21/2021 00:17:13 - INFO - __main__ - Step 45242: {'lr': 0.0001991236150661706, 'samples': 1447744, 'steps': 2827, 'loss/train': 0.5155513286590576} -09/21/2021 00:17:14 - INFO - __main__ - Step 45243: {'lr': 0.0001991236150661706, 'samples': 1447776, 'steps': 2827, 'loss/train': 2.239745616912842} -09/21/2021 00:17:15 - INFO - __main__ - Step 45244: {'lr': 0.0001991236150661706, 'samples': 1447808, 'steps': 2827, 'loss/train': 1.2060641050338745} -09/21/2021 00:17:16 - INFO - __main__ - Step 45245: {'lr': 0.0001991236150661706, 'samples': 1447840, 'steps': 2827, 'loss/train': 1.9837795495986938} -09/21/2021 00:17:16 - INFO - __main__ - Step 45246: {'lr': 0.0001991236150661706, 'samples': 1447872, 'steps': 2827, 'loss/train': 2.656484365463257} -09/21/2021 00:17:17 - INFO - __main__ - Step 45247: {'lr': 0.0001991236150661706, 'samples': 1447904, 'steps': 2827, 'loss/train': 1.6654669046401978} -09/21/2021 00:17:18 - INFO - __main__ - Step 45248: {'lr': 0.0001991236150661706, 'samples': 1447936, 'steps': 2827, 'loss/train': 1.868532657623291} -09/21/2021 00:17:19 - INFO - __main__ - Step 45249: {'lr': 0.00019912277220432117, 'samples': 1447968, 'steps': 2828, 'loss/train': 1.8862345218658447} -09/21/2021 00:17:19 - INFO - __main__ - Step 45250: {'lr': 0.00019912277220432117, 'samples': 1448000, 'steps': 2828, 'loss/train': 1.9555219411849976} -09/21/2021 00:17:20 - INFO - __main__ - Step 45251: {'lr': 0.00019912277220432117, 'samples': 1448032, 'steps': 2828, 'loss/train': 2.140549659729004} -09/21/2021 00:17:21 - INFO - __main__ - Step 45252: {'lr': 0.00019912277220432117, 'samples': 1448064, 'steps': 2828, 'loss/train': 0.9872394800186157} -09/21/2021 00:17:22 - INFO - __main__ - Step 45253: {'lr': 0.00019912277220432117, 'samples': 1448096, 'steps': 2828, 'loss/train': 1.3790388107299805} -09/21/2021 00:17:22 - INFO - __main__ - Step 45254: {'lr': 0.00019912277220432117, 'samples': 1448128, 'steps': 2828, 'loss/train': 2.2445852756500244} -09/21/2021 00:17:23 - INFO - __main__ - Step 45255: {'lr': 0.00019912277220432117, 'samples': 1448160, 'steps': 2828, 'loss/train': 2.0846381187438965} -09/21/2021 00:17:24 - INFO - __main__ - Step 45256: {'lr': 0.00019912277220432117, 'samples': 1448192, 'steps': 2828, 'loss/train': 1.681182861328125} -09/21/2021 00:17:25 - INFO - __main__ - Step 45257: {'lr': 0.00019912277220432117, 'samples': 1448224, 'steps': 2828, 'loss/train': 2.642251491546631} -09/21/2021 00:17:26 - INFO - __main__ - Step 45258: {'lr': 0.00019912277220432117, 'samples': 1448256, 'steps': 2828, 'loss/train': 2.716277837753296} -09/21/2021 00:17:27 - INFO - __main__ - Step 45259: {'lr': 0.00019912277220432117, 'samples': 1448288, 'steps': 2828, 'loss/train': 2.38558292388916} -09/21/2021 00:17:27 - INFO - __main__ - Step 45260: {'lr': 0.00019912277220432117, 'samples': 1448320, 'steps': 2828, 'loss/train': 2.8033053874969482} -09/21/2021 00:17:28 - INFO - __main__ - Step 45261: {'lr': 0.00019912277220432117, 'samples': 1448352, 'steps': 2828, 'loss/train': 1.7932555675506592} -09/21/2021 00:17:29 - INFO - __main__ - Step 45262: {'lr': 0.00019912277220432117, 'samples': 1448384, 'steps': 2828, 'loss/train': 2.434190034866333} -09/21/2021 00:17:30 - INFO - __main__ - Step 45263: {'lr': 0.00019912277220432117, 'samples': 1448416, 'steps': 2828, 'loss/train': 1.9913536310195923} -09/21/2021 00:17:30 - INFO - __main__ - Step 45264: {'lr': 0.00019912277220432117, 'samples': 1448448, 'steps': 2828, 'loss/train': 2.4293324947357178} -09/21/2021 00:17:31 - INFO - __main__ - Step 45265: {'lr': 0.00019912192893914153, 'samples': 1448480, 'steps': 2829, 'loss/train': 1.7330394983291626} -09/21/2021 00:17:32 - INFO - __main__ - Step 45266: {'lr': 0.00019912192893914153, 'samples': 1448512, 'steps': 2829, 'loss/train': 1.8404091596603394} -09/21/2021 00:17:33 - INFO - __main__ - Step 45267: {'lr': 0.00019912192893914153, 'samples': 1448544, 'steps': 2829, 'loss/train': 2.468747854232788} -09/21/2021 00:17:34 - INFO - __main__ - Step 45268: {'lr': 0.00019912192893914153, 'samples': 1448576, 'steps': 2829, 'loss/train': 2.827232837677002} -09/21/2021 00:17:34 - INFO - __main__ - Step 45269: {'lr': 0.00019912192893914153, 'samples': 1448608, 'steps': 2829, 'loss/train': 1.0306357145309448} -09/21/2021 00:17:35 - INFO - __main__ - Step 45270: {'lr': 0.00019912192893914153, 'samples': 1448640, 'steps': 2829, 'loss/train': 2.4913923740386963} -09/21/2021 00:17:36 - INFO - __main__ - Step 45271: {'lr': 0.00019912192893914153, 'samples': 1448672, 'steps': 2829, 'loss/train': 1.450103759765625} -09/21/2021 00:17:37 - INFO - __main__ - Step 45272: {'lr': 0.00019912192893914153, 'samples': 1448704, 'steps': 2829, 'loss/train': 2.100860595703125} -09/21/2021 00:17:37 - INFO - __main__ - Step 45273: {'lr': 0.00019912192893914153, 'samples': 1448736, 'steps': 2829, 'loss/train': 2.215348958969116} -09/21/2021 00:17:38 - INFO - __main__ - Step 45274: {'lr': 0.00019912192893914153, 'samples': 1448768, 'steps': 2829, 'loss/train': 2.1735358238220215} -09/21/2021 00:17:39 - INFO - __main__ - Step 45275: {'lr': 0.00019912192893914153, 'samples': 1448800, 'steps': 2829, 'loss/train': 1.5422660112380981} -09/21/2021 00:17:40 - INFO - __main__ - Step 45276: {'lr': 0.00019912192893914153, 'samples': 1448832, 'steps': 2829, 'loss/train': 2.4420201778411865} -09/21/2021 00:17:40 - INFO - __main__ - Step 45277: {'lr': 0.00019912192893914153, 'samples': 1448864, 'steps': 2829, 'loss/train': 1.4583312273025513} -09/21/2021 00:17:41 - INFO - __main__ - Step 45278: {'lr': 0.00019912192893914153, 'samples': 1448896, 'steps': 2829, 'loss/train': 2.453364372253418} -09/21/2021 00:17:42 - INFO - __main__ - Step 45279: {'lr': 0.00019912192893914153, 'samples': 1448928, 'steps': 2829, 'loss/train': 1.8436853885650635} -09/21/2021 00:17:43 - INFO - __main__ - Step 45280: {'lr': 0.00019912192893914153, 'samples': 1448960, 'steps': 2829, 'loss/train': 1.5509687662124634} -09/21/2021 00:17:43 - INFO - __main__ - Step 45281: {'lr': 0.0001991210852706352, 'samples': 1448992, 'steps': 2830, 'loss/train': 1.3047091960906982} -09/21/2021 00:17:44 - INFO - __main__ - Step 45282: {'lr': 0.0001991210852706352, 'samples': 1449024, 'steps': 2830, 'loss/train': 2.026024103164673} -09/21/2021 00:17:45 - INFO - __main__ - Step 45283: {'lr': 0.0001991210852706352, 'samples': 1449056, 'steps': 2830, 'loss/train': 0.7455807328224182} -09/21/2021 00:17:46 - INFO - __main__ - Step 45284: {'lr': 0.0001991210852706352, 'samples': 1449088, 'steps': 2830, 'loss/train': 1.779370903968811} -09/21/2021 00:17:46 - INFO - __main__ - Step 45285: {'lr': 0.0001991210852706352, 'samples': 1449120, 'steps': 2830, 'loss/train': 2.1466732025146484} -09/21/2021 00:17:47 - INFO - __main__ - Step 45286: {'lr': 0.0001991210852706352, 'samples': 1449152, 'steps': 2830, 'loss/train': 1.581610918045044} -09/21/2021 00:17:48 - INFO - __main__ - Step 45287: {'lr': 0.0001991210852706352, 'samples': 1449184, 'steps': 2830, 'loss/train': 2.4686107635498047} -09/21/2021 00:17:49 - INFO - __main__ - Step 45288: {'lr': 0.0001991210852706352, 'samples': 1449216, 'steps': 2830, 'loss/train': 2.473984479904175} -09/21/2021 00:17:50 - INFO - __main__ - Step 45289: {'lr': 0.0001991210852706352, 'samples': 1449248, 'steps': 2830, 'loss/train': 2.4089152812957764} -09/21/2021 00:17:51 - INFO - __main__ - Step 45290: {'lr': 0.0001991210852706352, 'samples': 1449280, 'steps': 2830, 'loss/train': 2.886833906173706} -09/21/2021 00:17:52 - INFO - __main__ - Step 45291: {'lr': 0.0001991210852706352, 'samples': 1449312, 'steps': 2830, 'loss/train': 1.8288618326187134} -09/21/2021 00:17:52 - INFO - __main__ - Step 45292: {'lr': 0.0001991210852706352, 'samples': 1449344, 'steps': 2830, 'loss/train': 0.2168438732624054} -09/21/2021 00:17:53 - INFO - __main__ - Step 45293: {'lr': 0.0001991210852706352, 'samples': 1449376, 'steps': 2830, 'loss/train': 0.16370762884616852} -09/21/2021 00:17:54 - INFO - __main__ - Step 45294: {'lr': 0.0001991210852706352, 'samples': 1449408, 'steps': 2830, 'loss/train': 0.28486528992652893} -09/21/2021 00:17:55 - INFO - __main__ - Step 45295: {'lr': 0.0001991210852706352, 'samples': 1449440, 'steps': 2830, 'loss/train': 2.0863258838653564} -09/21/2021 00:17:55 - INFO - __main__ - Step 45296: {'lr': 0.0001991210852706352, 'samples': 1449472, 'steps': 2830, 'loss/train': 1.6675130128860474} -09/21/2021 00:17:56 - INFO - __main__ - Step 45297: {'lr': 0.00019912024119880556, 'samples': 1449504, 'steps': 2831, 'loss/train': 1.4759804010391235} -09/21/2021 00:17:57 - INFO - __main__ - Step 45298: {'lr': 0.00019912024119880556, 'samples': 1449536, 'steps': 2831, 'loss/train': 2.3350234031677246} -09/21/2021 00:17:58 - INFO - __main__ - Step 45299: {'lr': 0.00019912024119880556, 'samples': 1449568, 'steps': 2831, 'loss/train': 2.0949747562408447} -09/21/2021 00:17:58 - INFO - __main__ - Step 45300: {'lr': 0.00019912024119880556, 'samples': 1449600, 'steps': 2831, 'loss/train': 2.237569808959961} -09/21/2021 00:17:59 - INFO - __main__ - Step 45301: {'lr': 0.00019912024119880556, 'samples': 1449632, 'steps': 2831, 'loss/train': 1.6828166246414185} -09/21/2021 00:18:00 - INFO - __main__ - Step 45302: {'lr': 0.00019912024119880556, 'samples': 1449664, 'steps': 2831, 'loss/train': 2.3494224548339844} -09/21/2021 00:18:01 - INFO - __main__ - Step 45303: {'lr': 0.00019912024119880556, 'samples': 1449696, 'steps': 2831, 'loss/train': 2.005095958709717} -09/21/2021 00:18:01 - INFO - __main__ - Step 45304: {'lr': 0.00019912024119880556, 'samples': 1449728, 'steps': 2831, 'loss/train': 2.4952354431152344} -09/21/2021 00:18:02 - INFO - __main__ - Step 45305: {'lr': 0.00019912024119880556, 'samples': 1449760, 'steps': 2831, 'loss/train': 2.8071651458740234} -09/21/2021 00:18:03 - INFO - __main__ - Step 45306: {'lr': 0.00019912024119880556, 'samples': 1449792, 'steps': 2831, 'loss/train': 2.1488492488861084} -09/21/2021 00:18:04 - INFO - __main__ - Step 45307: {'lr': 0.00019912024119880556, 'samples': 1449824, 'steps': 2831, 'loss/train': 2.1290082931518555} -09/21/2021 00:18:04 - INFO - __main__ - Step 45308: {'lr': 0.00019912024119880556, 'samples': 1449856, 'steps': 2831, 'loss/train': 2.4266867637634277} -09/21/2021 00:18:05 - INFO - __main__ - Step 45309: {'lr': 0.00019912024119880556, 'samples': 1449888, 'steps': 2831, 'loss/train': 0.4521244168281555} -09/21/2021 00:18:06 - INFO - __main__ - Step 45310: {'lr': 0.00019912024119880556, 'samples': 1449920, 'steps': 2831, 'loss/train': 2.53157639503479} -09/21/2021 00:18:07 - INFO - __main__ - Step 45311: {'lr': 0.00019912024119880556, 'samples': 1449952, 'steps': 2831, 'loss/train': 0.20491018891334534} -09/21/2021 00:18:07 - INFO - __main__ - Step 45312: {'lr': 0.00019912024119880556, 'samples': 1449984, 'steps': 2831, 'loss/train': 1.1336504220962524} -09/21/2021 00:18:08 - INFO - __main__ - Step 45313: {'lr': 0.00019911939672365603, 'samples': 1450016, 'steps': 2832, 'loss/train': 2.610140800476074} -09/21/2021 00:18:09 - INFO - __main__ - Step 45314: {'lr': 0.00019911939672365603, 'samples': 1450048, 'steps': 2832, 'loss/train': 1.9789543151855469} -09/21/2021 00:18:10 - INFO - __main__ - Step 45315: {'lr': 0.00019911939672365603, 'samples': 1450080, 'steps': 2832, 'loss/train': 2.4519224166870117} -09/21/2021 00:18:11 - INFO - __main__ - Step 45316: {'lr': 0.00019911939672365603, 'samples': 1450112, 'steps': 2832, 'loss/train': 2.0595219135284424} -09/21/2021 00:18:11 - INFO - __main__ - Step 45317: {'lr': 0.00019911939672365603, 'samples': 1450144, 'steps': 2832, 'loss/train': 1.4383785724639893} -09/21/2021 00:18:12 - INFO - __main__ - Step 45318: {'lr': 0.00019911939672365603, 'samples': 1450176, 'steps': 2832, 'loss/train': 1.380675196647644} -09/21/2021 00:18:13 - INFO - __main__ - Step 45319: {'lr': 0.00019911939672365603, 'samples': 1450208, 'steps': 2832, 'loss/train': 1.6119204759597778} -09/21/2021 00:18:14 - INFO - __main__ - Step 45320: {'lr': 0.00019911939672365603, 'samples': 1450240, 'steps': 2832, 'loss/train': 1.1203820705413818} -09/21/2021 00:18:15 - INFO - __main__ - Step 45321: {'lr': 0.00019911939672365603, 'samples': 1450272, 'steps': 2832, 'loss/train': 2.0251173973083496} -09/21/2021 00:18:16 - INFO - __main__ - Step 45322: {'lr': 0.00019911939672365603, 'samples': 1450304, 'steps': 2832, 'loss/train': 1.9895621538162231} -09/21/2021 00:18:16 - INFO - __main__ - Step 45323: {'lr': 0.00019911939672365603, 'samples': 1450336, 'steps': 2832, 'loss/train': 3.3608295917510986} -09/21/2021 00:18:17 - INFO - __main__ - Step 45324: {'lr': 0.00019911939672365603, 'samples': 1450368, 'steps': 2832, 'loss/train': 1.5165852308273315} -09/21/2021 00:18:18 - INFO - __main__ - Step 45325: {'lr': 0.00019911939672365603, 'samples': 1450400, 'steps': 2832, 'loss/train': 1.96152663230896} -09/21/2021 00:18:19 - INFO - __main__ - Step 45326: {'lr': 0.00019911939672365603, 'samples': 1450432, 'steps': 2832, 'loss/train': 2.0330350399017334} -09/21/2021 00:18:19 - INFO - __main__ - Step 45327: {'lr': 0.00019911939672365603, 'samples': 1450464, 'steps': 2832, 'loss/train': 1.728024959564209} -09/21/2021 00:18:20 - INFO - __main__ - Step 45328: {'lr': 0.00019911939672365603, 'samples': 1450496, 'steps': 2832, 'loss/train': 1.9899753332138062} -09/21/2021 00:18:21 - INFO - __main__ - Step 45329: {'lr': 0.00019911855184519004, 'samples': 1450528, 'steps': 2833, 'loss/train': 0.7581819295883179} -09/21/2021 00:18:22 - INFO - __main__ - Step 45330: {'lr': 0.00019911855184519004, 'samples': 1450560, 'steps': 2833, 'loss/train': 2.4740147590637207} -09/21/2021 00:18:23 - INFO - __main__ - Step 45331: {'lr': 0.00019911855184519004, 'samples': 1450592, 'steps': 2833, 'loss/train': 2.8459115028381348} -09/21/2021 00:18:23 - INFO - __main__ - Step 45332: {'lr': 0.00019911855184519004, 'samples': 1450624, 'steps': 2833, 'loss/train': 1.7552448511123657} -09/21/2021 00:18:24 - INFO - __main__ - Step 45333: {'lr': 0.00019911855184519004, 'samples': 1450656, 'steps': 2833, 'loss/train': 3.0238382816314697} -09/21/2021 00:18:25 - INFO - __main__ - Step 45334: {'lr': 0.00019911855184519004, 'samples': 1450688, 'steps': 2833, 'loss/train': 2.49792218208313} -09/21/2021 00:18:26 - INFO - __main__ - Step 45335: {'lr': 0.00019911855184519004, 'samples': 1450720, 'steps': 2833, 'loss/train': 1.5873242616653442} -09/21/2021 00:18:26 - INFO - __main__ - Step 45336: {'lr': 0.00019911855184519004, 'samples': 1450752, 'steps': 2833, 'loss/train': 1.5136305093765259} -09/21/2021 00:18:27 - INFO - __main__ - Step 45337: {'lr': 0.00019911855184519004, 'samples': 1450784, 'steps': 2833, 'loss/train': 1.977656364440918} -09/21/2021 00:18:28 - INFO - __main__ - Step 45338: {'lr': 0.00019911855184519004, 'samples': 1450816, 'steps': 2833, 'loss/train': 1.5170007944107056} -09/21/2021 00:18:29 - INFO - __main__ - Step 45339: {'lr': 0.00019911855184519004, 'samples': 1450848, 'steps': 2833, 'loss/train': 2.535737991333008} -09/21/2021 00:18:29 - INFO - __main__ - Step 45340: {'lr': 0.00019911855184519004, 'samples': 1450880, 'steps': 2833, 'loss/train': 1.6671925783157349} -09/21/2021 00:18:30 - INFO - __main__ - Step 45341: {'lr': 0.00019911855184519004, 'samples': 1450912, 'steps': 2833, 'loss/train': 2.24601149559021} -09/21/2021 00:18:31 - INFO - __main__ - Step 45342: {'lr': 0.00019911855184519004, 'samples': 1450944, 'steps': 2833, 'loss/train': 2.381269931793213} -09/21/2021 00:18:32 - INFO - __main__ - Step 45343: {'lr': 0.00019911855184519004, 'samples': 1450976, 'steps': 2833, 'loss/train': 2.3838703632354736} -09/21/2021 00:18:32 - INFO - __main__ - Step 45344: {'lr': 0.00019911855184519004, 'samples': 1451008, 'steps': 2833, 'loss/train': 1.3966370820999146} -09/21/2021 00:18:33 - INFO - __main__ - Step 45345: {'lr': 0.00019911770656341106, 'samples': 1451040, 'steps': 2834, 'loss/train': 1.8239904642105103} -09/21/2021 00:18:34 - INFO - __main__ - Step 45346: {'lr': 0.00019911770656341106, 'samples': 1451072, 'steps': 2834, 'loss/train': 1.463773250579834} -09/21/2021 00:18:35 - INFO - __main__ - Step 45347: {'lr': 0.00019911770656341106, 'samples': 1451104, 'steps': 2834, 'loss/train': 1.3725608587265015} -09/21/2021 00:18:35 - INFO - __main__ - Step 45348: {'lr': 0.00019911770656341106, 'samples': 1451136, 'steps': 2834, 'loss/train': 1.7819557189941406} -09/21/2021 00:18:36 - INFO - __main__ - Step 45349: {'lr': 0.00019911770656341106, 'samples': 1451168, 'steps': 2834, 'loss/train': 1.9202121496200562} -09/21/2021 00:18:37 - INFO - __main__ - Step 45350: {'lr': 0.00019911770656341106, 'samples': 1451200, 'steps': 2834, 'loss/train': 1.829158067703247} -09/21/2021 00:18:38 - INFO - __main__ - Step 45351: {'lr': 0.00019911770656341106, 'samples': 1451232, 'steps': 2834, 'loss/train': 2.7377147674560547} -09/21/2021 00:18:39 - INFO - __main__ - Step 45352: {'lr': 0.00019911770656341106, 'samples': 1451264, 'steps': 2834, 'loss/train': 1.5901498794555664} -09/21/2021 00:18:40 - INFO - __main__ - Step 45353: {'lr': 0.00019911770656341106, 'samples': 1451296, 'steps': 2834, 'loss/train': 0.5055565237998962} -09/21/2021 00:18:40 - INFO - __main__ - Step 45354: {'lr': 0.00019911770656341106, 'samples': 1451328, 'steps': 2834, 'loss/train': 2.3004214763641357} -09/21/2021 00:18:41 - INFO - __main__ - Step 45355: {'lr': 0.00019911770656341106, 'samples': 1451360, 'steps': 2834, 'loss/train': 2.248145818710327} -09/21/2021 00:18:42 - INFO - __main__ - Step 45356: {'lr': 0.00019911770656341106, 'samples': 1451392, 'steps': 2834, 'loss/train': 2.2661590576171875} -09/21/2021 00:18:43 - INFO - __main__ - Step 45357: {'lr': 0.00019911770656341106, 'samples': 1451424, 'steps': 2834, 'loss/train': 2.7874932289123535} -09/21/2021 00:18:43 - INFO - __main__ - Step 45358: {'lr': 0.00019911770656341106, 'samples': 1451456, 'steps': 2834, 'loss/train': 2.278285026550293} -09/21/2021 00:18:44 - INFO - __main__ - Step 45359: {'lr': 0.00019911770656341106, 'samples': 1451488, 'steps': 2834, 'loss/train': 1.9776067733764648} -09/21/2021 00:18:45 - INFO - __main__ - Step 45360: {'lr': 0.00019911770656341106, 'samples': 1451520, 'steps': 2834, 'loss/train': 1.694573998451233} -09/21/2021 00:18:46 - INFO - __main__ - Step 45361: {'lr': 0.00019911686087832254, 'samples': 1451552, 'steps': 2835, 'loss/train': 2.2915923595428467} -09/21/2021 00:18:47 - INFO - __main__ - Step 45362: {'lr': 0.00019911686087832254, 'samples': 1451584, 'steps': 2835, 'loss/train': 3.2217776775360107} -09/21/2021 00:18:47 - INFO - __main__ - Step 45363: {'lr': 0.00019911686087832254, 'samples': 1451616, 'steps': 2835, 'loss/train': 1.3712220191955566} -09/21/2021 00:18:48 - INFO - __main__ - Step 45364: {'lr': 0.00019911686087832254, 'samples': 1451648, 'steps': 2835, 'loss/train': 0.790530800819397} -09/21/2021 00:18:49 - INFO - __main__ - Step 45365: {'lr': 0.00019911686087832254, 'samples': 1451680, 'steps': 2835, 'loss/train': 3.03393292427063} -09/21/2021 00:18:50 - INFO - __main__ - Step 45366: {'lr': 0.00019911686087832254, 'samples': 1451712, 'steps': 2835, 'loss/train': 1.951517105102539} -09/21/2021 00:18:50 - INFO - __main__ - Step 45367: {'lr': 0.00019911686087832254, 'samples': 1451744, 'steps': 2835, 'loss/train': 0.835395097732544} -09/21/2021 00:18:51 - INFO - __main__ - Step 45368: {'lr': 0.00019911686087832254, 'samples': 1451776, 'steps': 2835, 'loss/train': 2.552429676055908} -09/21/2021 00:18:52 - INFO - __main__ - Step 45369: {'lr': 0.00019911686087832254, 'samples': 1451808, 'steps': 2835, 'loss/train': 3.042950391769409} -09/21/2021 00:18:53 - INFO - __main__ - Step 45370: {'lr': 0.00019911686087832254, 'samples': 1451840, 'steps': 2835, 'loss/train': 3.370290517807007} -09/21/2021 00:18:53 - INFO - __main__ - Step 45371: {'lr': 0.00019911686087832254, 'samples': 1451872, 'steps': 2835, 'loss/train': 2.4779763221740723} -09/21/2021 00:18:54 - INFO - __main__ - Step 45372: {'lr': 0.00019911686087832254, 'samples': 1451904, 'steps': 2835, 'loss/train': 0.4080277383327484} -09/21/2021 00:18:55 - INFO - __main__ - Step 45373: {'lr': 0.00019911686087832254, 'samples': 1451936, 'steps': 2835, 'loss/train': 1.8777943849563599} -09/21/2021 00:18:56 - INFO - __main__ - Step 45374: {'lr': 0.00019911686087832254, 'samples': 1451968, 'steps': 2835, 'loss/train': 1.737752914428711} -09/21/2021 00:18:56 - INFO - __main__ - Step 45375: {'lr': 0.00019911686087832254, 'samples': 1452000, 'steps': 2835, 'loss/train': 1.8574360609054565} -09/21/2021 00:18:57 - INFO - __main__ - Step 45376: {'lr': 0.00019911686087832254, 'samples': 1452032, 'steps': 2835, 'loss/train': 1.8024524450302124} -09/21/2021 00:18:58 - INFO - __main__ - Step 45377: {'lr': 0.00019911601478992788, 'samples': 1452064, 'steps': 2836, 'loss/train': 1.293363332748413} -09/21/2021 00:18:59 - INFO - __main__ - Step 45378: {'lr': 0.00019911601478992788, 'samples': 1452096, 'steps': 2836, 'loss/train': 0.9685549139976501} -09/21/2021 00:18:59 - INFO - __main__ - Step 45379: {'lr': 0.00019911601478992788, 'samples': 1452128, 'steps': 2836, 'loss/train': 1.5187506675720215} -09/21/2021 00:19:00 - INFO - __main__ - Step 45380: {'lr': 0.00019911601478992788, 'samples': 1452160, 'steps': 2836, 'loss/train': 2.01995587348938} -09/21/2021 00:19:01 - INFO - __main__ - Step 45381: {'lr': 0.00019911601478992788, 'samples': 1452192, 'steps': 2836, 'loss/train': 1.8197163343429565} -09/21/2021 00:19:02 - INFO - __main__ - Step 45382: {'lr': 0.00019911601478992788, 'samples': 1452224, 'steps': 2836, 'loss/train': 1.2129673957824707} -09/21/2021 00:19:03 - INFO - __main__ - Step 45383: {'lr': 0.00019911601478992788, 'samples': 1452256, 'steps': 2836, 'loss/train': 1.5379880666732788} -09/21/2021 00:19:04 - INFO - __main__ - Step 45384: {'lr': 0.00019911601478992788, 'samples': 1452288, 'steps': 2836, 'loss/train': 2.5438950061798096} -09/21/2021 00:19:05 - INFO - __main__ - Step 45385: {'lr': 0.00019911601478992788, 'samples': 1452320, 'steps': 2836, 'loss/train': 1.933516263961792} -09/21/2021 00:19:05 - INFO - __main__ - Step 45386: {'lr': 0.00019911601478992788, 'samples': 1452352, 'steps': 2836, 'loss/train': 2.155839443206787} -09/21/2021 00:19:06 - INFO - __main__ - Step 45387: {'lr': 0.00019911601478992788, 'samples': 1452384, 'steps': 2836, 'loss/train': 2.3760855197906494} -09/21/2021 00:19:07 - INFO - __main__ - Step 45388: {'lr': 0.00019911601478992788, 'samples': 1452416, 'steps': 2836, 'loss/train': 2.2545201778411865} -09/21/2021 00:19:08 - INFO - __main__ - Step 45389: {'lr': 0.00019911601478992788, 'samples': 1452448, 'steps': 2836, 'loss/train': 1.6668800115585327} -09/21/2021 00:19:08 - INFO - __main__ - Step 45390: {'lr': 0.00019911601478992788, 'samples': 1452480, 'steps': 2836, 'loss/train': 2.6585562229156494} -09/21/2021 00:19:09 - INFO - __main__ - Step 45391: {'lr': 0.00019911601478992788, 'samples': 1452512, 'steps': 2836, 'loss/train': 2.0647192001342773} -09/21/2021 00:19:10 - INFO - __main__ - Step 45392: {'lr': 0.00019911601478992788, 'samples': 1452544, 'steps': 2836, 'loss/train': 2.85908842086792} -09/21/2021 00:19:11 - INFO - __main__ - Step 45393: {'lr': 0.00019911516829823053, 'samples': 1452576, 'steps': 2837, 'loss/train': 2.1539134979248047} -09/21/2021 00:19:11 - INFO - __main__ - Step 45394: {'lr': 0.00019911516829823053, 'samples': 1452608, 'steps': 2837, 'loss/train': 1.9611937999725342} -09/21/2021 00:19:12 - INFO - __main__ - Step 45395: {'lr': 0.00019911516829823053, 'samples': 1452640, 'steps': 2837, 'loss/train': 1.990681767463684} -09/21/2021 00:19:13 - INFO - __main__ - Step 45396: {'lr': 0.00019911516829823053, 'samples': 1452672, 'steps': 2837, 'loss/train': 1.7385493516921997} -09/21/2021 00:19:14 - INFO - __main__ - Step 45397: {'lr': 0.00019911516829823053, 'samples': 1452704, 'steps': 2837, 'loss/train': 2.4691567420959473} -09/21/2021 00:19:14 - INFO - __main__ - Step 45398: {'lr': 0.00019911516829823053, 'samples': 1452736, 'steps': 2837, 'loss/train': 2.2742390632629395} -09/21/2021 00:19:15 - INFO - __main__ - Step 45399: {'lr': 0.00019911516829823053, 'samples': 1452768, 'steps': 2837, 'loss/train': 1.2683570384979248} -09/21/2021 00:19:16 - INFO - __main__ - Step 45400: {'lr': 0.00019911516829823053, 'samples': 1452800, 'steps': 2837, 'loss/train': 2.3131227493286133} -09/21/2021 00:19:17 - INFO - __main__ - Step 45401: {'lr': 0.00019911516829823053, 'samples': 1452832, 'steps': 2837, 'loss/train': 1.9040051698684692} -09/21/2021 00:19:17 - INFO - __main__ - Step 45402: {'lr': 0.00019911516829823053, 'samples': 1452864, 'steps': 2837, 'loss/train': 1.5736606121063232} -09/21/2021 00:19:18 - INFO - __main__ - Step 45403: {'lr': 0.00019911516829823053, 'samples': 1452896, 'steps': 2837, 'loss/train': 1.072507381439209} -09/21/2021 00:19:19 - INFO - __main__ - Step 45404: {'lr': 0.00019911516829823053, 'samples': 1452928, 'steps': 2837, 'loss/train': 2.4707016944885254} -09/21/2021 00:19:20 - INFO - __main__ - Step 45405: {'lr': 0.00019911516829823053, 'samples': 1452960, 'steps': 2837, 'loss/train': 2.235154151916504} -09/21/2021 00:19:21 - INFO - __main__ - Step 45406: {'lr': 0.00019911516829823053, 'samples': 1452992, 'steps': 2837, 'loss/train': 1.983171820640564} -09/21/2021 00:19:21 - INFO - __main__ - Step 45407: {'lr': 0.00019911516829823053, 'samples': 1453024, 'steps': 2837, 'loss/train': 1.471412181854248} -09/21/2021 00:19:22 - INFO - __main__ - Step 45408: {'lr': 0.00019911516829823053, 'samples': 1453056, 'steps': 2837, 'loss/train': 2.408710241317749} -09/21/2021 00:19:23 - INFO - __main__ - Step 45409: {'lr': 0.00019911432140323396, 'samples': 1453088, 'steps': 2838, 'loss/train': 2.2490997314453125} -09/21/2021 00:19:24 - INFO - __main__ - Step 45410: {'lr': 0.00019911432140323396, 'samples': 1453120, 'steps': 2838, 'loss/train': 1.4185388088226318} -09/21/2021 00:19:24 - INFO - __main__ - Step 45411: {'lr': 0.00019911432140323396, 'samples': 1453152, 'steps': 2838, 'loss/train': 1.9122533798217773} -09/21/2021 00:19:25 - INFO - __main__ - Step 45412: {'lr': 0.00019911432140323396, 'samples': 1453184, 'steps': 2838, 'loss/train': 1.841651439666748} -09/21/2021 00:19:26 - INFO - __main__ - Step 45413: {'lr': 0.00019911432140323396, 'samples': 1453216, 'steps': 2838, 'loss/train': 1.8885345458984375} -09/21/2021 00:19:27 - INFO - __main__ - Step 45414: {'lr': 0.00019911432140323396, 'samples': 1453248, 'steps': 2838, 'loss/train': 2.0656981468200684} -09/21/2021 00:19:28 - INFO - __main__ - Step 45415: {'lr': 0.00019911432140323396, 'samples': 1453280, 'steps': 2838, 'loss/train': 1.7375353574752808} -09/21/2021 00:19:29 - INFO - __main__ - Step 45416: {'lr': 0.00019911432140323396, 'samples': 1453312, 'steps': 2838, 'loss/train': 1.609750747680664} -09/21/2021 00:19:29 - INFO - __main__ - Step 45417: {'lr': 0.00019911432140323396, 'samples': 1453344, 'steps': 2838, 'loss/train': 3.380265474319458} -09/21/2021 00:19:30 - INFO - __main__ - Step 45418: {'lr': 0.00019911432140323396, 'samples': 1453376, 'steps': 2838, 'loss/train': 2.329897880554199} -09/21/2021 00:19:31 - INFO - __main__ - Step 45419: {'lr': 0.00019911432140323396, 'samples': 1453408, 'steps': 2838, 'loss/train': 1.5996005535125732} -09/21/2021 00:19:32 - INFO - __main__ - Step 45420: {'lr': 0.00019911432140323396, 'samples': 1453440, 'steps': 2838, 'loss/train': 1.923793077468872} -09/21/2021 00:19:32 - INFO - __main__ - Step 45421: {'lr': 0.00019911432140323396, 'samples': 1453472, 'steps': 2838, 'loss/train': 2.1151654720306396} -09/21/2021 00:19:33 - INFO - __main__ - Step 45422: {'lr': 0.00019911432140323396, 'samples': 1453504, 'steps': 2838, 'loss/train': 2.080763578414917} -09/21/2021 00:19:34 - INFO - __main__ - Step 45423: {'lr': 0.00019911432140323396, 'samples': 1453536, 'steps': 2838, 'loss/train': 1.963977336883545} -09/21/2021 00:19:35 - INFO - __main__ - Step 45424: {'lr': 0.00019911432140323396, 'samples': 1453568, 'steps': 2838, 'loss/train': 1.596766471862793} -09/21/2021 00:19:36 - INFO - __main__ - Step 45425: {'lr': 0.0001991134741049416, 'samples': 1453600, 'steps': 2839, 'loss/train': 2.8415310382843018} -09/21/2021 00:19:36 - INFO - __main__ - Step 45426: {'lr': 0.0001991134741049416, 'samples': 1453632, 'steps': 2839, 'loss/train': 1.6904572248458862} -09/21/2021 00:19:37 - INFO - __main__ - Step 45427: {'lr': 0.0001991134741049416, 'samples': 1453664, 'steps': 2839, 'loss/train': 2.0757224559783936} -09/21/2021 00:19:38 - INFO - __main__ - Step 45428: {'lr': 0.0001991134741049416, 'samples': 1453696, 'steps': 2839, 'loss/train': 1.8383400440216064} -09/21/2021 00:19:39 - INFO - __main__ - Step 45429: {'lr': 0.0001991134741049416, 'samples': 1453728, 'steps': 2839, 'loss/train': 1.7943252325057983} -09/21/2021 00:19:39 - INFO - __main__ - Step 45430: {'lr': 0.0001991134741049416, 'samples': 1453760, 'steps': 2839, 'loss/train': 2.3835601806640625} -09/21/2021 00:19:40 - INFO - __main__ - Step 45431: {'lr': 0.0001991134741049416, 'samples': 1453792, 'steps': 2839, 'loss/train': 1.6253108978271484} -09/21/2021 00:19:41 - INFO - __main__ - Step 45432: {'lr': 0.0001991134741049416, 'samples': 1453824, 'steps': 2839, 'loss/train': 2.7265357971191406} -09/21/2021 00:19:42 - INFO - __main__ - Step 45433: {'lr': 0.0001991134741049416, 'samples': 1453856, 'steps': 2839, 'loss/train': 2.1538643836975098} -09/21/2021 00:19:42 - INFO - __main__ - Step 45434: {'lr': 0.0001991134741049416, 'samples': 1453888, 'steps': 2839, 'loss/train': 2.8026375770568848} -09/21/2021 00:19:43 - INFO - __main__ - Step 45435: {'lr': 0.0001991134741049416, 'samples': 1453920, 'steps': 2839, 'loss/train': 2.6103360652923584} -09/21/2021 00:19:44 - INFO - __main__ - Step 45436: {'lr': 0.0001991134741049416, 'samples': 1453952, 'steps': 2839, 'loss/train': 2.2965004444122314} -09/21/2021 00:19:45 - INFO - __main__ - Step 45437: {'lr': 0.0001991134741049416, 'samples': 1453984, 'steps': 2839, 'loss/train': 1.5084102153778076} -09/21/2021 00:19:45 - INFO - __main__ - Step 45438: {'lr': 0.0001991134741049416, 'samples': 1454016, 'steps': 2839, 'loss/train': 2.1724774837493896} -09/21/2021 00:19:46 - INFO - __main__ - Step 45439: {'lr': 0.0001991134741049416, 'samples': 1454048, 'steps': 2839, 'loss/train': 1.5845386981964111} -09/21/2021 00:19:47 - INFO - __main__ - Step 45440: {'lr': 0.0001991134741049416, 'samples': 1454080, 'steps': 2839, 'loss/train': 1.5195943117141724} -09/21/2021 00:19:48 - INFO - __main__ - Step 45441: {'lr': 0.00019911262640335688, 'samples': 1454112, 'steps': 2840, 'loss/train': 1.6161658763885498} -09/21/2021 00:19:48 - INFO - __main__ - Step 45442: {'lr': 0.00019911262640335688, 'samples': 1454144, 'steps': 2840, 'loss/train': 1.0671241283416748} -09/21/2021 00:19:49 - INFO - __main__ - Step 45443: {'lr': 0.00019911262640335688, 'samples': 1454176, 'steps': 2840, 'loss/train': 2.218005657196045} -09/21/2021 00:19:50 - INFO - __main__ - Step 45444: {'lr': 0.00019911262640335688, 'samples': 1454208, 'steps': 2840, 'loss/train': 1.7544300556182861} -09/21/2021 00:19:51 - INFO - __main__ - Step 45445: {'lr': 0.00019911262640335688, 'samples': 1454240, 'steps': 2840, 'loss/train': 2.738218307495117} -09/21/2021 00:19:52 - INFO - __main__ - Step 45446: {'lr': 0.00019911262640335688, 'samples': 1454272, 'steps': 2840, 'loss/train': 1.9147011041641235} -09/21/2021 00:19:53 - INFO - __main__ - Step 45447: {'lr': 0.00019911262640335688, 'samples': 1454304, 'steps': 2840, 'loss/train': 1.7965000867843628} -09/21/2021 00:19:53 - INFO - __main__ - Step 45448: {'lr': 0.00019911262640335688, 'samples': 1454336, 'steps': 2840, 'loss/train': 2.0261716842651367} -09/21/2021 00:19:54 - INFO - __main__ - Step 45449: {'lr': 0.00019911262640335688, 'samples': 1454368, 'steps': 2840, 'loss/train': 2.4013757705688477} -09/21/2021 00:19:55 - INFO - __main__ - Step 45450: {'lr': 0.00019911262640335688, 'samples': 1454400, 'steps': 2840, 'loss/train': 1.8139361143112183} -09/21/2021 00:19:56 - INFO - __main__ - Step 45451: {'lr': 0.00019911262640335688, 'samples': 1454432, 'steps': 2840, 'loss/train': 2.50612473487854} -09/21/2021 00:19:56 - INFO - __main__ - Step 45452: {'lr': 0.00019911262640335688, 'samples': 1454464, 'steps': 2840, 'loss/train': 2.5657010078430176} -09/21/2021 00:19:57 - INFO - __main__ - Step 45453: {'lr': 0.00019911262640335688, 'samples': 1454496, 'steps': 2840, 'loss/train': 1.9057027101516724} -09/21/2021 00:19:58 - INFO - __main__ - Step 45454: {'lr': 0.00019911262640335688, 'samples': 1454528, 'steps': 2840, 'loss/train': 2.187838554382324} -09/21/2021 00:19:59 - INFO - __main__ - Step 45455: {'lr': 0.00019911262640335688, 'samples': 1454560, 'steps': 2840, 'loss/train': 1.9392125606536865} -09/21/2021 00:19:59 - INFO - __main__ - Step 45456: {'lr': 0.00019911262640335688, 'samples': 1454592, 'steps': 2840, 'loss/train': 2.089393377304077} -09/21/2021 00:20:00 - INFO - __main__ - Step 45457: {'lr': 0.00019911177829848328, 'samples': 1454624, 'steps': 2841, 'loss/train': 2.7114665508270264} -09/21/2021 00:20:01 - INFO - __main__ - Step 45458: {'lr': 0.00019911177829848328, 'samples': 1454656, 'steps': 2841, 'loss/train': 2.5847551822662354} -09/21/2021 00:20:02 - INFO - __main__ - Step 45459: {'lr': 0.00019911177829848328, 'samples': 1454688, 'steps': 2841, 'loss/train': 2.5916390419006348} -09/21/2021 00:20:03 - INFO - __main__ - Step 45460: {'lr': 0.00019911177829848328, 'samples': 1454720, 'steps': 2841, 'loss/train': 1.4154767990112305} -09/21/2021 00:20:03 - INFO - __main__ - Step 45461: {'lr': 0.00019911177829848328, 'samples': 1454752, 'steps': 2841, 'loss/train': 1.6043459177017212} -09/21/2021 00:20:04 - INFO - __main__ - Step 45462: {'lr': 0.00019911177829848328, 'samples': 1454784, 'steps': 2841, 'loss/train': 2.310215473175049} -09/21/2021 00:20:05 - INFO - __main__ - Step 45463: {'lr': 0.00019911177829848328, 'samples': 1454816, 'steps': 2841, 'loss/train': 1.8021317720413208} -09/21/2021 00:20:06 - INFO - __main__ - Step 45464: {'lr': 0.00019911177829848328, 'samples': 1454848, 'steps': 2841, 'loss/train': 1.0114046335220337} -09/21/2021 00:20:06 - INFO - __main__ - Step 45465: {'lr': 0.00019911177829848328, 'samples': 1454880, 'steps': 2841, 'loss/train': 2.490520715713501} -09/21/2021 00:20:07 - INFO - __main__ - Step 45466: {'lr': 0.00019911177829848328, 'samples': 1454912, 'steps': 2841, 'loss/train': 1.939801573753357} -09/21/2021 00:20:08 - INFO - __main__ - Step 45467: {'lr': 0.00019911177829848328, 'samples': 1454944, 'steps': 2841, 'loss/train': 2.3810813426971436} -09/21/2021 00:20:09 - INFO - __main__ - Step 45468: {'lr': 0.00019911177829848328, 'samples': 1454976, 'steps': 2841, 'loss/train': 2.3416836261749268} -09/21/2021 00:20:09 - INFO - __main__ - Step 45469: {'lr': 0.00019911177829848328, 'samples': 1455008, 'steps': 2841, 'loss/train': 2.3387019634246826} -09/21/2021 00:20:10 - INFO - __main__ - Step 45470: {'lr': 0.00019911177829848328, 'samples': 1455040, 'steps': 2841, 'loss/train': 1.9852195978164673} -09/21/2021 00:20:11 - INFO - __main__ - Step 45471: {'lr': 0.00019911177829848328, 'samples': 1455072, 'steps': 2841, 'loss/train': 0.21125009655952454} -09/21/2021 00:20:12 - INFO - __main__ - Step 45472: {'lr': 0.00019911177829848328, 'samples': 1455104, 'steps': 2841, 'loss/train': 1.8796287775039673} -09/21/2021 00:20:13 - INFO - __main__ - Step 45473: {'lr': 0.00019911092979032425, 'samples': 1455136, 'steps': 2842, 'loss/train': 2.408479928970337} -09/21/2021 00:20:13 - INFO - __main__ - Step 45474: {'lr': 0.00019911092979032425, 'samples': 1455168, 'steps': 2842, 'loss/train': 2.7291746139526367} -09/21/2021 00:20:14 - INFO - __main__ - Step 45475: {'lr': 0.00019911092979032425, 'samples': 1455200, 'steps': 2842, 'loss/train': 1.820712685585022} -09/21/2021 00:20:15 - INFO - __main__ - Step 45476: {'lr': 0.00019911092979032425, 'samples': 1455232, 'steps': 2842, 'loss/train': 2.2605388164520264} -09/21/2021 00:20:16 - INFO - __main__ - Step 45477: {'lr': 0.00019911092979032425, 'samples': 1455264, 'steps': 2842, 'loss/train': 2.6758856773376465} -09/21/2021 00:20:17 - INFO - __main__ - Step 45478: {'lr': 0.00019911092979032425, 'samples': 1455296, 'steps': 2842, 'loss/train': 1.500808835029602} -09/21/2021 00:20:18 - INFO - __main__ - Step 45479: {'lr': 0.00019911092979032425, 'samples': 1455328, 'steps': 2842, 'loss/train': 1.3680694103240967} -09/21/2021 00:20:18 - INFO - __main__ - Step 45480: {'lr': 0.00019911092979032425, 'samples': 1455360, 'steps': 2842, 'loss/train': 2.575254201889038} -09/21/2021 00:20:19 - INFO - __main__ - Step 45481: {'lr': 0.00019911092979032425, 'samples': 1455392, 'steps': 2842, 'loss/train': 2.2825193405151367} -09/21/2021 00:20:20 - INFO - __main__ - Step 45482: {'lr': 0.00019911092979032425, 'samples': 1455424, 'steps': 2842, 'loss/train': 1.9523872137069702} -09/21/2021 00:20:21 - INFO - __main__ - Step 45483: {'lr': 0.00019911092979032425, 'samples': 1455456, 'steps': 2842, 'loss/train': 2.2532429695129395} -09/21/2021 00:20:21 - INFO - __main__ - Step 45484: {'lr': 0.00019911092979032425, 'samples': 1455488, 'steps': 2842, 'loss/train': 2.564422369003296} -09/21/2021 00:20:22 - INFO - __main__ - Step 45485: {'lr': 0.00019911092979032425, 'samples': 1455520, 'steps': 2842, 'loss/train': 2.2884039878845215} -09/21/2021 00:20:23 - INFO - __main__ - Step 45486: {'lr': 0.00019911092979032425, 'samples': 1455552, 'steps': 2842, 'loss/train': 2.2178168296813965} -09/21/2021 00:20:24 - INFO - __main__ - Step 45487: {'lr': 0.00019911092979032425, 'samples': 1455584, 'steps': 2842, 'loss/train': 2.1755497455596924} -09/21/2021 00:20:24 - INFO - __main__ - Step 45488: {'lr': 0.00019911092979032425, 'samples': 1455616, 'steps': 2842, 'loss/train': 2.392672300338745} -09/21/2021 00:20:25 - INFO - __main__ - Step 45489: {'lr': 0.00019911008087888322, 'samples': 1455648, 'steps': 2843, 'loss/train': 2.0680623054504395} -09/21/2021 00:20:26 - INFO - __main__ - Step 45490: {'lr': 0.00019911008087888322, 'samples': 1455680, 'steps': 2843, 'loss/train': 2.133958339691162} -09/21/2021 00:20:27 - INFO - __main__ - Step 45491: {'lr': 0.00019911008087888322, 'samples': 1455712, 'steps': 2843, 'loss/train': 1.8516818284988403} -09/21/2021 00:20:27 - INFO - __main__ - Step 45492: {'lr': 0.00019911008087888322, 'samples': 1455744, 'steps': 2843, 'loss/train': 1.6395930051803589} -09/21/2021 00:20:28 - INFO - __main__ - Step 45493: {'lr': 0.00019911008087888322, 'samples': 1455776, 'steps': 2843, 'loss/train': 2.511705160140991} -09/21/2021 00:20:29 - INFO - __main__ - Step 45494: {'lr': 0.00019911008087888322, 'samples': 1455808, 'steps': 2843, 'loss/train': 2.6047279834747314} -09/21/2021 00:20:30 - INFO - __main__ - Step 45495: {'lr': 0.00019911008087888322, 'samples': 1455840, 'steps': 2843, 'loss/train': 3.002798080444336} -09/21/2021 00:20:30 - INFO - __main__ - Step 45496: {'lr': 0.00019911008087888322, 'samples': 1455872, 'steps': 2843, 'loss/train': 2.1758744716644287} -09/21/2021 00:20:31 - INFO - __main__ - Step 45497: {'lr': 0.00019911008087888322, 'samples': 1455904, 'steps': 2843, 'loss/train': 0.6804308891296387} -09/21/2021 00:20:32 - INFO - __main__ - Step 45498: {'lr': 0.00019911008087888322, 'samples': 1455936, 'steps': 2843, 'loss/train': 1.751800298690796} -09/21/2021 00:20:33 - INFO - __main__ - Step 45499: {'lr': 0.00019911008087888322, 'samples': 1455968, 'steps': 2843, 'loss/train': 1.9352657794952393} -09/21/2021 00:20:33 - INFO - __main__ - Step 45500: {'lr': 0.00019911008087888322, 'samples': 1456000, 'steps': 2843, 'loss/train': 1.538751482963562} -09/21/2021 00:20:34 - INFO - __main__ - Step 45501: {'lr': 0.00019911008087888322, 'samples': 1456032, 'steps': 2843, 'loss/train': 2.7367751598358154} -09/21/2021 00:20:35 - INFO - __main__ - Step 45502: {'lr': 0.00019911008087888322, 'samples': 1456064, 'steps': 2843, 'loss/train': 2.416196823120117} -09/21/2021 00:20:36 - INFO - __main__ - Step 45503: {'lr': 0.00019911008087888322, 'samples': 1456096, 'steps': 2843, 'loss/train': 1.9141658544540405} -09/21/2021 00:20:36 - INFO - __main__ - Step 45504: {'lr': 0.00019911008087888322, 'samples': 1456128, 'steps': 2843, 'loss/train': 1.9760923385620117} -09/21/2021 00:20:37 - INFO - __main__ - Step 45505: {'lr': 0.00019910923156416364, 'samples': 1456160, 'steps': 2844, 'loss/train': 2.591883897781372} -09/21/2021 00:20:38 - INFO - __main__ - Step 45506: {'lr': 0.00019910923156416364, 'samples': 1456192, 'steps': 2844, 'loss/train': 1.8714767694473267} -09/21/2021 00:20:40 - INFO - __main__ - Step 45507: {'lr': 0.00019910923156416364, 'samples': 1456224, 'steps': 2844, 'loss/train': 0.9799448847770691} -09/21/2021 00:20:41 - INFO - __main__ - Step 45508: {'lr': 0.00019910923156416364, 'samples': 1456256, 'steps': 2844, 'loss/train': 1.627525806427002} -09/21/2021 00:20:41 - INFO - __main__ - Step 45509: {'lr': 0.00019910923156416364, 'samples': 1456288, 'steps': 2844, 'loss/train': 2.893369197845459} -09/21/2021 00:20:42 - INFO - __main__ - Step 45510: {'lr': 0.00019910923156416364, 'samples': 1456320, 'steps': 2844, 'loss/train': 2.72735595703125} -09/21/2021 00:20:43 - INFO - __main__ - Step 45511: {'lr': 0.00019910923156416364, 'samples': 1456352, 'steps': 2844, 'loss/train': 0.3436777889728546} -09/21/2021 00:20:44 - INFO - __main__ - Step 45512: {'lr': 0.00019910923156416364, 'samples': 1456384, 'steps': 2844, 'loss/train': 1.7498358488082886} -09/21/2021 00:20:44 - INFO - __main__ - Step 45513: {'lr': 0.00019910923156416364, 'samples': 1456416, 'steps': 2844, 'loss/train': 2.122122049331665} -09/21/2021 00:20:45 - INFO - __main__ - Step 45514: {'lr': 0.00019910923156416364, 'samples': 1456448, 'steps': 2844, 'loss/train': 0.5608875751495361} -09/21/2021 00:20:46 - INFO - __main__ - Step 45515: {'lr': 0.00019910923156416364, 'samples': 1456480, 'steps': 2844, 'loss/train': 0.4156298339366913} -09/21/2021 00:20:47 - INFO - __main__ - Step 45516: {'lr': 0.00019910923156416364, 'samples': 1456512, 'steps': 2844, 'loss/train': 0.8663639426231384} -09/21/2021 00:20:47 - INFO - __main__ - Step 45517: {'lr': 0.00019910923156416364, 'samples': 1456544, 'steps': 2844, 'loss/train': 1.7755217552185059} -09/21/2021 00:20:48 - INFO - __main__ - Step 45518: {'lr': 0.00019910923156416364, 'samples': 1456576, 'steps': 2844, 'loss/train': 1.5446572303771973} -09/21/2021 00:20:49 - INFO - __main__ - Step 45519: {'lr': 0.00019910923156416364, 'samples': 1456608, 'steps': 2844, 'loss/train': 1.5730750560760498} -09/21/2021 00:20:50 - INFO - __main__ - Step 45520: {'lr': 0.00019910923156416364, 'samples': 1456640, 'steps': 2844, 'loss/train': 2.1357991695404053} -09/21/2021 00:20:51 - INFO - __main__ - Step 45521: {'lr': 0.000199108381846169, 'samples': 1456672, 'steps': 2845, 'loss/train': 2.1116015911102295} -09/21/2021 00:20:51 - INFO - __main__ - Step 45522: {'lr': 0.000199108381846169, 'samples': 1456704, 'steps': 2845, 'loss/train': 1.9898273944854736} -09/21/2021 00:20:52 - INFO - __main__ - Step 45523: {'lr': 0.000199108381846169, 'samples': 1456736, 'steps': 2845, 'loss/train': 1.2086248397827148} -09/21/2021 00:20:53 - INFO - __main__ - Step 45524: {'lr': 0.000199108381846169, 'samples': 1456768, 'steps': 2845, 'loss/train': 1.900633692741394} -09/21/2021 00:20:54 - INFO - __main__ - Step 45525: {'lr': 0.000199108381846169, 'samples': 1456800, 'steps': 2845, 'loss/train': 1.7827725410461426} -09/21/2021 00:20:54 - INFO - __main__ - Step 45526: {'lr': 0.000199108381846169, 'samples': 1456832, 'steps': 2845, 'loss/train': 2.0217068195343018} -09/21/2021 00:20:55 - INFO - __main__ - Step 45527: {'lr': 0.000199108381846169, 'samples': 1456864, 'steps': 2845, 'loss/train': 1.3973701000213623} -09/21/2021 00:20:56 - INFO - __main__ - Step 45528: {'lr': 0.000199108381846169, 'samples': 1456896, 'steps': 2845, 'loss/train': 1.44444739818573} -09/21/2021 00:20:57 - INFO - __main__ - Step 45529: {'lr': 0.000199108381846169, 'samples': 1456928, 'steps': 2845, 'loss/train': 2.3728249073028564} -09/21/2021 00:20:57 - INFO - __main__ - Step 45530: {'lr': 0.000199108381846169, 'samples': 1456960, 'steps': 2845, 'loss/train': 0.5708069205284119} -09/21/2021 00:20:58 - INFO - __main__ - Step 45531: {'lr': 0.000199108381846169, 'samples': 1456992, 'steps': 2845, 'loss/train': 0.13783608376979828} -09/21/2021 00:20:59 - INFO - __main__ - Step 45532: {'lr': 0.000199108381846169, 'samples': 1457024, 'steps': 2845, 'loss/train': 0.2772214114665985} -09/21/2021 00:21:00 - INFO - __main__ - Step 45533: {'lr': 0.000199108381846169, 'samples': 1457056, 'steps': 2845, 'loss/train': 0.17867012321949005} -09/21/2021 00:21:00 - INFO - __main__ - Step 45534: {'lr': 0.000199108381846169, 'samples': 1457088, 'steps': 2845, 'loss/train': 2.221554756164551} -09/21/2021 00:21:01 - INFO - __main__ - Step 45535: {'lr': 0.000199108381846169, 'samples': 1457120, 'steps': 2845, 'loss/train': 2.111269474029541} -09/21/2021 00:21:02 - INFO - __main__ - Step 45536: {'lr': 0.000199108381846169, 'samples': 1457152, 'steps': 2845, 'loss/train': 2.6652145385742188} -09/21/2021 00:21:03 - INFO - __main__ - Step 45537: {'lr': 0.00019910753172490276, 'samples': 1457184, 'steps': 2846, 'loss/train': 2.731735944747925} -09/21/2021 00:21:03 - INFO - __main__ - Step 45538: {'lr': 0.00019910753172490276, 'samples': 1457216, 'steps': 2846, 'loss/train': 0.13921767473220825} -09/21/2021 00:21:05 - INFO - __main__ - Step 45539: {'lr': 0.00019910753172490276, 'samples': 1457248, 'steps': 2846, 'loss/train': 0.22828584909439087} -09/21/2021 00:21:06 - INFO - __main__ - Step 45540: {'lr': 0.00019910753172490276, 'samples': 1457280, 'steps': 2846, 'loss/train': 1.5589306354522705} -09/21/2021 00:21:07 - INFO - __main__ - Step 45541: {'lr': 0.00019910753172490276, 'samples': 1457312, 'steps': 2846, 'loss/train': 2.727421998977661} -09/21/2021 00:21:07 - INFO - __main__ - Step 45542: {'lr': 0.00019910753172490276, 'samples': 1457344, 'steps': 2846, 'loss/train': 2.509168863296509} -09/21/2021 00:21:08 - INFO - __main__ - Step 45543: {'lr': 0.00019910753172490276, 'samples': 1457376, 'steps': 2846, 'loss/train': 1.9793853759765625} -09/21/2021 00:21:09 - INFO - __main__ - Step 45544: {'lr': 0.00019910753172490276, 'samples': 1457408, 'steps': 2846, 'loss/train': 1.511366844177246} -09/21/2021 00:21:10 - INFO - __main__ - Step 45545: {'lr': 0.00019910753172490276, 'samples': 1457440, 'steps': 2846, 'loss/train': 2.508025884628296} -09/21/2021 00:21:10 - INFO - __main__ - Step 45546: {'lr': 0.00019910753172490276, 'samples': 1457472, 'steps': 2846, 'loss/train': 1.8590084314346313} -09/21/2021 00:21:11 - INFO - __main__ - Step 45547: {'lr': 0.00019910753172490276, 'samples': 1457504, 'steps': 2846, 'loss/train': 3.5455472469329834} -09/21/2021 00:21:12 - INFO - __main__ - Step 45548: {'lr': 0.00019910753172490276, 'samples': 1457536, 'steps': 2846, 'loss/train': 2.9027504920959473} -09/21/2021 00:21:13 - INFO - __main__ - Step 45549: {'lr': 0.00019910753172490276, 'samples': 1457568, 'steps': 2846, 'loss/train': 2.2120726108551025} -09/21/2021 00:21:13 - INFO - __main__ - Step 45550: {'lr': 0.00019910753172490276, 'samples': 1457600, 'steps': 2846, 'loss/train': 2.5165486335754395} -09/21/2021 00:21:14 - INFO - __main__ - Step 45551: {'lr': 0.00019910753172490276, 'samples': 1457632, 'steps': 2846, 'loss/train': 1.969594955444336} -09/21/2021 00:21:15 - INFO - __main__ - Step 45552: {'lr': 0.00019910753172490276, 'samples': 1457664, 'steps': 2846, 'loss/train': 2.0019614696502686} -09/21/2021 00:21:16 - INFO - __main__ - Step 45553: {'lr': 0.0001991066812003683, 'samples': 1457696, 'steps': 2847, 'loss/train': 2.035475492477417} -09/21/2021 00:21:16 - INFO - __main__ - Step 45554: {'lr': 0.0001991066812003683, 'samples': 1457728, 'steps': 2847, 'loss/train': 1.7428208589553833} -09/21/2021 00:21:17 - INFO - __main__ - Step 45555: {'lr': 0.0001991066812003683, 'samples': 1457760, 'steps': 2847, 'loss/train': 2.8484609127044678} -09/21/2021 00:21:18 - INFO - __main__ - Step 45556: {'lr': 0.0001991066812003683, 'samples': 1457792, 'steps': 2847, 'loss/train': 1.7617346048355103} -09/21/2021 00:21:19 - INFO - __main__ - Step 45557: {'lr': 0.0001991066812003683, 'samples': 1457824, 'steps': 2847, 'loss/train': 1.9783918857574463} -09/21/2021 00:21:19 - INFO - __main__ - Step 45558: {'lr': 0.0001991066812003683, 'samples': 1457856, 'steps': 2847, 'loss/train': 0.32589811086654663} -09/21/2021 00:21:20 - INFO - __main__ - Step 45559: {'lr': 0.0001991066812003683, 'samples': 1457888, 'steps': 2847, 'loss/train': 0.360340416431427} -09/21/2021 00:21:21 - INFO - __main__ - Step 45560: {'lr': 0.0001991066812003683, 'samples': 1457920, 'steps': 2847, 'loss/train': 0.3062232434749603} -09/21/2021 00:21:22 - INFO - __main__ - Step 45561: {'lr': 0.0001991066812003683, 'samples': 1457952, 'steps': 2847, 'loss/train': 0.41952329874038696} -09/21/2021 00:21:22 - INFO - __main__ - Step 45562: {'lr': 0.0001991066812003683, 'samples': 1457984, 'steps': 2847, 'loss/train': 0.3901723325252533} -09/21/2021 00:21:23 - INFO - __main__ - Step 45563: {'lr': 0.0001991066812003683, 'samples': 1458016, 'steps': 2847, 'loss/train': 0.2564191520214081} -09/21/2021 00:21:24 - INFO - __main__ - Step 45564: {'lr': 0.0001991066812003683, 'samples': 1458048, 'steps': 2847, 'loss/train': 0.3325371742248535} -09/21/2021 00:21:25 - INFO - __main__ - Step 45565: {'lr': 0.0001991066812003683, 'samples': 1458080, 'steps': 2847, 'loss/train': 0.3248063623905182} -09/21/2021 00:21:25 - INFO - __main__ - Step 45566: {'lr': 0.0001991066812003683, 'samples': 1458112, 'steps': 2847, 'loss/train': 1.0934141874313354} -09/21/2021 00:21:26 - INFO - __main__ - Step 45567: {'lr': 0.0001991066812003683, 'samples': 1458144, 'steps': 2847, 'loss/train': 1.4320507049560547} -09/21/2021 00:21:27 - INFO - __main__ - Step 45568: {'lr': 0.0001991066812003683, 'samples': 1458176, 'steps': 2847, 'loss/train': 1.3302040100097656} -09/21/2021 00:21:28 - INFO - __main__ - Step 45569: {'lr': 0.0001991058302725692, 'samples': 1458208, 'steps': 2848, 'loss/train': 2.513242721557617} -09/21/2021 00:21:29 - INFO - __main__ - Step 45570: {'lr': 0.0001991058302725692, 'samples': 1458240, 'steps': 2848, 'loss/train': 1.9509600400924683} -09/21/2021 00:21:29 - INFO - __main__ - Step 45571: {'lr': 0.0001991058302725692, 'samples': 1458272, 'steps': 2848, 'loss/train': 1.2018429040908813} -09/21/2021 00:21:30 - INFO - __main__ - Step 45572: {'lr': 0.0001991058302725692, 'samples': 1458304, 'steps': 2848, 'loss/train': 0.7608073949813843} -09/21/2021 00:21:31 - INFO - __main__ - Step 45573: {'lr': 0.0001991058302725692, 'samples': 1458336, 'steps': 2848, 'loss/train': 0.8829887509346008} -09/21/2021 00:21:32 - INFO - __main__ - Step 45574: {'lr': 0.0001991058302725692, 'samples': 1458368, 'steps': 2848, 'loss/train': 1.007318139076233} -09/21/2021 00:21:32 - INFO - __main__ - Step 45575: {'lr': 0.0001991058302725692, 'samples': 1458400, 'steps': 2848, 'loss/train': 2.457115888595581} -09/21/2021 00:21:33 - INFO - __main__ - Step 45576: {'lr': 0.0001991058302725692, 'samples': 1458432, 'steps': 2848, 'loss/train': 1.2432483434677124} -09/21/2021 00:21:34 - INFO - __main__ - Step 45577: {'lr': 0.0001991058302725692, 'samples': 1458464, 'steps': 2848, 'loss/train': 1.9320058822631836} -09/21/2021 00:21:35 - INFO - __main__ - Step 45578: {'lr': 0.0001991058302725692, 'samples': 1458496, 'steps': 2848, 'loss/train': 1.898601770401001} -09/21/2021 00:21:36 - INFO - __main__ - Step 45579: {'lr': 0.0001991058302725692, 'samples': 1458528, 'steps': 2848, 'loss/train': 1.5477797985076904} -09/21/2021 00:21:37 - INFO - __main__ - Step 45580: {'lr': 0.0001991058302725692, 'samples': 1458560, 'steps': 2848, 'loss/train': 1.0673387050628662} -09/21/2021 00:21:37 - INFO - __main__ - Step 45581: {'lr': 0.0001991058302725692, 'samples': 1458592, 'steps': 2848, 'loss/train': 2.4296834468841553} -09/21/2021 00:21:38 - INFO - __main__ - Step 45582: {'lr': 0.0001991058302725692, 'samples': 1458624, 'steps': 2848, 'loss/train': 2.3165297508239746} -09/21/2021 00:21:39 - INFO - __main__ - Step 45583: {'lr': 0.0001991058302725692, 'samples': 1458656, 'steps': 2848, 'loss/train': 1.5278688669204712} -09/21/2021 00:21:40 - INFO - __main__ - Step 45584: {'lr': 0.0001991058302725692, 'samples': 1458688, 'steps': 2848, 'loss/train': 3.090890645980835} -09/21/2021 00:21:40 - INFO - __main__ - Step 45585: {'lr': 0.00019910497894150883, 'samples': 1458720, 'steps': 2849, 'loss/train': 2.469428062438965} -09/21/2021 00:21:41 - INFO - __main__ - Step 45586: {'lr': 0.00019910497894150883, 'samples': 1458752, 'steps': 2849, 'loss/train': 1.6373738050460815} -09/21/2021 00:21:42 - INFO - __main__ - Step 45587: {'lr': 0.00019910497894150883, 'samples': 1458784, 'steps': 2849, 'loss/train': 1.4138720035552979} -09/21/2021 00:21:43 - INFO - __main__ - Step 45588: {'lr': 0.00019910497894150883, 'samples': 1458816, 'steps': 2849, 'loss/train': 1.8836994171142578} -09/21/2021 00:21:43 - INFO - __main__ - Step 45589: {'lr': 0.00019910497894150883, 'samples': 1458848, 'steps': 2849, 'loss/train': 2.7412891387939453} -09/21/2021 00:21:44 - INFO - __main__ - Step 45590: {'lr': 0.00019910497894150883, 'samples': 1458880, 'steps': 2849, 'loss/train': 1.922342300415039} -09/21/2021 00:21:45 - INFO - __main__ - Step 45591: {'lr': 0.00019910497894150883, 'samples': 1458912, 'steps': 2849, 'loss/train': 2.9710493087768555} -09/21/2021 00:21:46 - INFO - __main__ - Step 45592: {'lr': 0.00019910497894150883, 'samples': 1458944, 'steps': 2849, 'loss/train': 1.3726128339767456} -09/21/2021 00:21:46 - INFO - __main__ - Step 45593: {'lr': 0.00019910497894150883, 'samples': 1458976, 'steps': 2849, 'loss/train': 2.4473936557769775} -09/21/2021 00:21:47 - INFO - __main__ - Step 45594: {'lr': 0.00019910497894150883, 'samples': 1459008, 'steps': 2849, 'loss/train': 2.034792184829712} -09/21/2021 00:21:48 - INFO - __main__ - Step 45595: {'lr': 0.00019910497894150883, 'samples': 1459040, 'steps': 2849, 'loss/train': 1.9299602508544922} -09/21/2021 00:21:49 - INFO - __main__ - Step 45596: {'lr': 0.00019910497894150883, 'samples': 1459072, 'steps': 2849, 'loss/train': 1.8163866996765137} -09/21/2021 00:21:49 - INFO - __main__ - Step 45597: {'lr': 0.00019910497894150883, 'samples': 1459104, 'steps': 2849, 'loss/train': 0.45857515931129456} -09/21/2021 00:21:50 - INFO - __main__ - Step 45598: {'lr': 0.00019910497894150883, 'samples': 1459136, 'steps': 2849, 'loss/train': 2.6243534088134766} -09/21/2021 00:21:51 - INFO - __main__ - Step 45599: {'lr': 0.00019910497894150883, 'samples': 1459168, 'steps': 2849, 'loss/train': 0.5391198992729187} -09/21/2021 00:21:52 - INFO - __main__ - Step 45600: {'lr': 0.00019910497894150883, 'samples': 1459200, 'steps': 2849, 'loss/train': 2.3495922088623047} -09/21/2021 00:21:53 - INFO - __main__ - Step 45601: {'lr': 0.0001991041272071907, 'samples': 1459232, 'steps': 2850, 'loss/train': 2.6203150749206543} -09/21/2021 00:21:53 - INFO - __main__ - Step 45602: {'lr': 0.0001991041272071907, 'samples': 1459264, 'steps': 2850, 'loss/train': 1.7430177927017212} -09/21/2021 00:21:54 - INFO - __main__ - Step 45603: {'lr': 0.0001991041272071907, 'samples': 1459296, 'steps': 2850, 'loss/train': 3.137650489807129} -09/21/2021 00:21:55 - INFO - __main__ - Step 45604: {'lr': 0.0001991041272071907, 'samples': 1459328, 'steps': 2850, 'loss/train': 2.377082347869873} -09/21/2021 00:21:56 - INFO - __main__ - Step 45605: {'lr': 0.0001991041272071907, 'samples': 1459360, 'steps': 2850, 'loss/train': 2.4063072204589844} -09/21/2021 00:21:56 - INFO - __main__ - Step 45606: {'lr': 0.0001991041272071907, 'samples': 1459392, 'steps': 2850, 'loss/train': 3.1331570148468018} -09/21/2021 00:21:57 - INFO - __main__ - Step 45607: {'lr': 0.0001991041272071907, 'samples': 1459424, 'steps': 2850, 'loss/train': 2.1889913082122803} -09/21/2021 00:21:59 - INFO - __main__ - Step 45608: {'lr': 0.0001991041272071907, 'samples': 1459456, 'steps': 2850, 'loss/train': 2.130373477935791} -09/21/2021 00:22:00 - INFO - __main__ - Step 45609: {'lr': 0.0001991041272071907, 'samples': 1459488, 'steps': 2850, 'loss/train': 1.919140100479126} -09/21/2021 00:22:00 - INFO - __main__ - Step 45610: {'lr': 0.0001991041272071907, 'samples': 1459520, 'steps': 2850, 'loss/train': 1.446630597114563} -09/21/2021 00:22:01 - INFO - __main__ - Step 45611: {'lr': 0.0001991041272071907, 'samples': 1459552, 'steps': 2850, 'loss/train': 2.3392984867095947} -09/21/2021 00:22:02 - INFO - __main__ - Step 45612: {'lr': 0.0001991041272071907, 'samples': 1459584, 'steps': 2850, 'loss/train': 2.3207011222839355} -09/21/2021 00:22:03 - INFO - __main__ - Step 45613: {'lr': 0.0001991041272071907, 'samples': 1459616, 'steps': 2850, 'loss/train': 0.3067587614059448} -09/21/2021 00:22:03 - INFO - __main__ - Step 45614: {'lr': 0.0001991041272071907, 'samples': 1459648, 'steps': 2850, 'loss/train': 2.4409210681915283} -09/21/2021 00:22:04 - INFO - __main__ - Step 45615: {'lr': 0.0001991041272071907, 'samples': 1459680, 'steps': 2850, 'loss/train': 2.382841110229492} -09/21/2021 00:22:05 - INFO - __main__ - Step 45616: {'lr': 0.0001991041272071907, 'samples': 1459712, 'steps': 2850, 'loss/train': 2.4750733375549316} -09/21/2021 00:22:06 - INFO - __main__ - Step 45617: {'lr': 0.00019910327506961824, 'samples': 1459744, 'steps': 2851, 'loss/train': 0.5669282078742981} -09/21/2021 00:22:07 - INFO - __main__ - Step 45618: {'lr': 0.00019910327506961824, 'samples': 1459776, 'steps': 2851, 'loss/train': 0.14344894886016846} -09/21/2021 00:22:07 - INFO - __main__ - Step 45619: {'lr': 0.00019910327506961824, 'samples': 1459808, 'steps': 2851, 'loss/train': 0.22254402935504913} -09/21/2021 00:22:08 - INFO - __main__ - Step 45620: {'lr': 0.00019910327506961824, 'samples': 1459840, 'steps': 2851, 'loss/train': 0.27885615825653076} -09/21/2021 00:22:09 - INFO - __main__ - Step 45621: {'lr': 0.00019910327506961824, 'samples': 1459872, 'steps': 2851, 'loss/train': 0.39422866702079773} -09/21/2021 00:22:10 - INFO - __main__ - Step 45622: {'lr': 0.00019910327506961824, 'samples': 1459904, 'steps': 2851, 'loss/train': 0.23418936133384705} -09/21/2021 00:22:10 - INFO - __main__ - Step 45623: {'lr': 0.00019910327506961824, 'samples': 1459936, 'steps': 2851, 'loss/train': 0.19611287117004395} -09/21/2021 00:22:11 - INFO - __main__ - Step 45624: {'lr': 0.00019910327506961824, 'samples': 1459968, 'steps': 2851, 'loss/train': 0.5923670530319214} -09/21/2021 00:22:12 - INFO - __main__ - Step 45625: {'lr': 0.00019910327506961824, 'samples': 1460000, 'steps': 2851, 'loss/train': 3.020028591156006} -09/21/2021 00:22:13 - INFO - __main__ - Step 45626: {'lr': 0.00019910327506961824, 'samples': 1460032, 'steps': 2851, 'loss/train': 1.8772220611572266} -09/21/2021 00:22:13 - INFO - __main__ - Step 45627: {'lr': 0.00019910327506961824, 'samples': 1460064, 'steps': 2851, 'loss/train': 2.0681345462799072} -09/21/2021 00:22:14 - INFO - __main__ - Step 45628: {'lr': 0.00019910327506961824, 'samples': 1460096, 'steps': 2851, 'loss/train': 2.0582404136657715} -09/21/2021 00:22:15 - INFO - __main__ - Step 45629: {'lr': 0.00019910327506961824, 'samples': 1460128, 'steps': 2851, 'loss/train': 1.5857406854629517} -09/21/2021 00:22:16 - INFO - __main__ - Step 45630: {'lr': 0.00019910327506961824, 'samples': 1460160, 'steps': 2851, 'loss/train': 2.3594632148742676} -09/21/2021 00:22:16 - INFO - __main__ - Step 45631: {'lr': 0.00019910327506961824, 'samples': 1460192, 'steps': 2851, 'loss/train': 1.570048213005066} -09/21/2021 00:22:17 - INFO - __main__ - Step 45632: {'lr': 0.00019910327506961824, 'samples': 1460224, 'steps': 2851, 'loss/train': 2.515029191970825} -09/21/2021 00:22:18 - INFO - __main__ - Step 45633: {'lr': 0.00019910242252879496, 'samples': 1460256, 'steps': 2852, 'loss/train': 2.4263288974761963} -09/21/2021 00:22:19 - INFO - __main__ - Step 45634: {'lr': 0.00019910242252879496, 'samples': 1460288, 'steps': 2852, 'loss/train': 1.0952030420303345} -09/21/2021 00:22:19 - INFO - __main__ - Step 45635: {'lr': 0.00019910242252879496, 'samples': 1460320, 'steps': 2852, 'loss/train': 2.0661234855651855} -09/21/2021 00:22:20 - INFO - __main__ - Step 45636: {'lr': 0.00019910242252879496, 'samples': 1460352, 'steps': 2852, 'loss/train': 1.8456850051879883} -09/21/2021 00:22:21 - INFO - __main__ - Step 45637: {'lr': 0.00019910242252879496, 'samples': 1460384, 'steps': 2852, 'loss/train': 0.5021089315414429} -09/21/2021 00:22:22 - INFO - __main__ - Step 45638: {'lr': 0.00019910242252879496, 'samples': 1460416, 'steps': 2852, 'loss/train': 1.4871389865875244} -09/21/2021 00:22:23 - INFO - __main__ - Step 45639: {'lr': 0.00019910242252879496, 'samples': 1460448, 'steps': 2852, 'loss/train': 2.4705162048339844} -09/21/2021 00:22:24 - INFO - __main__ - Step 45640: {'lr': 0.00019910242252879496, 'samples': 1460480, 'steps': 2852, 'loss/train': 1.632361650466919} -09/21/2021 00:22:24 - INFO - __main__ - Step 45641: {'lr': 0.00019910242252879496, 'samples': 1460512, 'steps': 2852, 'loss/train': 1.3087537288665771} -09/21/2021 00:22:25 - INFO - __main__ - Step 45642: {'lr': 0.00019910242252879496, 'samples': 1460544, 'steps': 2852, 'loss/train': 2.3666141033172607} -09/21/2021 00:22:26 - INFO - __main__ - Step 45643: {'lr': 0.00019910242252879496, 'samples': 1460576, 'steps': 2852, 'loss/train': 2.8220009803771973} -09/21/2021 00:22:27 - INFO - __main__ - Step 45644: {'lr': 0.00019910242252879496, 'samples': 1460608, 'steps': 2852, 'loss/train': 2.258937358856201} -09/21/2021 00:22:27 - INFO - __main__ - Step 45645: {'lr': 0.00019910242252879496, 'samples': 1460640, 'steps': 2852, 'loss/train': 1.919002652168274} -09/21/2021 00:22:28 - INFO - __main__ - Step 45646: {'lr': 0.00019910242252879496, 'samples': 1460672, 'steps': 2852, 'loss/train': 2.4024436473846436} -09/21/2021 00:22:29 - INFO - __main__ - Step 45647: {'lr': 0.00019910242252879496, 'samples': 1460704, 'steps': 2852, 'loss/train': 1.0486726760864258} -09/21/2021 00:22:30 - INFO - __main__ - Step 45648: {'lr': 0.00019910242252879496, 'samples': 1460736, 'steps': 2852, 'loss/train': 2.0070369243621826} -09/21/2021 00:22:31 - INFO - __main__ - Step 45649: {'lr': 0.00019910156958472428, 'samples': 1460768, 'steps': 2853, 'loss/train': 2.103679895401001} -09/21/2021 00:22:31 - INFO - __main__ - Step 45650: {'lr': 0.00019910156958472428, 'samples': 1460800, 'steps': 2853, 'loss/train': 2.975642681121826} -09/21/2021 00:22:32 - INFO - __main__ - Step 45651: {'lr': 0.00019910156958472428, 'samples': 1460832, 'steps': 2853, 'loss/train': 3.562610149383545} -09/21/2021 00:22:33 - INFO - __main__ - Step 45652: {'lr': 0.00019910156958472428, 'samples': 1460864, 'steps': 2853, 'loss/train': 1.8755398988723755} -09/21/2021 00:22:34 - INFO - __main__ - Step 45653: {'lr': 0.00019910156958472428, 'samples': 1460896, 'steps': 2853, 'loss/train': 3.0654215812683105} -09/21/2021 00:22:34 - INFO - __main__ - Step 45654: {'lr': 0.00019910156958472428, 'samples': 1460928, 'steps': 2853, 'loss/train': 2.394796848297119} -09/21/2021 00:22:35 - INFO - __main__ - Step 45655: {'lr': 0.00019910156958472428, 'samples': 1460960, 'steps': 2853, 'loss/train': 2.662862777709961} -09/21/2021 00:22:36 - INFO - __main__ - Step 45656: {'lr': 0.00019910156958472428, 'samples': 1460992, 'steps': 2853, 'loss/train': 1.338446855545044} -09/21/2021 00:22:37 - INFO - __main__ - Step 45657: {'lr': 0.00019910156958472428, 'samples': 1461024, 'steps': 2853, 'loss/train': 1.5466196537017822} -09/21/2021 00:22:37 - INFO - __main__ - Step 45658: {'lr': 0.00019910156958472428, 'samples': 1461056, 'steps': 2853, 'loss/train': 1.8323036432266235} -09/21/2021 00:22:38 - INFO - __main__ - Step 45659: {'lr': 0.00019910156958472428, 'samples': 1461088, 'steps': 2853, 'loss/train': 1.9272724390029907} -09/21/2021 00:22:39 - INFO - __main__ - Step 45660: {'lr': 0.00019910156958472428, 'samples': 1461120, 'steps': 2853, 'loss/train': 2.407367706298828} -09/21/2021 00:22:40 - INFO - __main__ - Step 45661: {'lr': 0.00019910156958472428, 'samples': 1461152, 'steps': 2853, 'loss/train': 1.5129112005233765} -09/21/2021 00:22:40 - INFO - __main__ - Step 45662: {'lr': 0.00019910156958472428, 'samples': 1461184, 'steps': 2853, 'loss/train': 2.0269792079925537} -09/21/2021 00:22:41 - INFO - __main__ - Step 45663: {'lr': 0.00019910156958472428, 'samples': 1461216, 'steps': 2853, 'loss/train': 1.842637538909912} -09/21/2021 00:22:42 - INFO - __main__ - Step 45664: {'lr': 0.00019910156958472428, 'samples': 1461248, 'steps': 2853, 'loss/train': 2.7364180088043213} -09/21/2021 00:22:43 - INFO - __main__ - Step 45665: {'lr': 0.0001991007162374097, 'samples': 1461280, 'steps': 2854, 'loss/train': 2.140655279159546} -09/21/2021 00:22:44 - INFO - __main__ - Step 45666: {'lr': 0.0001991007162374097, 'samples': 1461312, 'steps': 2854, 'loss/train': 2.8301477432250977} -09/21/2021 00:22:44 - INFO - __main__ - Step 45667: {'lr': 0.0001991007162374097, 'samples': 1461344, 'steps': 2854, 'loss/train': 1.9316797256469727} -09/21/2021 00:22:45 - INFO - __main__ - Step 45668: {'lr': 0.0001991007162374097, 'samples': 1461376, 'steps': 2854, 'loss/train': 2.531855821609497} -09/21/2021 00:22:46 - INFO - __main__ - Step 45669: {'lr': 0.0001991007162374097, 'samples': 1461408, 'steps': 2854, 'loss/train': 1.9316902160644531} -09/21/2021 00:22:47 - INFO - __main__ - Step 45670: {'lr': 0.0001991007162374097, 'samples': 1461440, 'steps': 2854, 'loss/train': 2.58026385307312} -09/21/2021 00:22:48 - INFO - __main__ - Step 45671: {'lr': 0.0001991007162374097, 'samples': 1461472, 'steps': 2854, 'loss/train': 2.191157341003418} -09/21/2021 00:22:49 - INFO - __main__ - Step 45672: {'lr': 0.0001991007162374097, 'samples': 1461504, 'steps': 2854, 'loss/train': 2.555523157119751} -09/21/2021 00:22:49 - INFO - __main__ - Step 45673: {'lr': 0.0001991007162374097, 'samples': 1461536, 'steps': 2854, 'loss/train': 1.9781192541122437} -09/21/2021 00:22:50 - INFO - __main__ - Step 45674: {'lr': 0.0001991007162374097, 'samples': 1461568, 'steps': 2854, 'loss/train': 0.6885474920272827} -09/21/2021 00:22:51 - INFO - __main__ - Step 45675: {'lr': 0.0001991007162374097, 'samples': 1461600, 'steps': 2854, 'loss/train': 2.112614870071411} -09/21/2021 00:22:52 - INFO - __main__ - Step 45676: {'lr': 0.0001991007162374097, 'samples': 1461632, 'steps': 2854, 'loss/train': 3.651675224304199} -09/21/2021 00:22:52 - INFO - __main__ - Step 45677: {'lr': 0.0001991007162374097, 'samples': 1461664, 'steps': 2854, 'loss/train': 1.7573716640472412} -09/21/2021 00:22:53 - INFO - __main__ - Step 45678: {'lr': 0.0001991007162374097, 'samples': 1461696, 'steps': 2854, 'loss/train': 1.6603809595108032} -09/21/2021 00:22:54 - INFO - __main__ - Step 45679: {'lr': 0.0001991007162374097, 'samples': 1461728, 'steps': 2854, 'loss/train': 1.4329824447631836} -09/21/2021 00:22:55 - INFO - __main__ - Step 45680: {'lr': 0.0001991007162374097, 'samples': 1461760, 'steps': 2854, 'loss/train': 2.0124616622924805} -09/21/2021 00:22:55 - INFO - __main__ - Step 45681: {'lr': 0.00019909986248685472, 'samples': 1461792, 'steps': 2855, 'loss/train': 1.456440806388855} -09/21/2021 00:22:56 - INFO - __main__ - Step 45682: {'lr': 0.00019909986248685472, 'samples': 1461824, 'steps': 2855, 'loss/train': 1.228518009185791} -09/21/2021 00:22:57 - INFO - __main__ - Step 45683: {'lr': 0.00019909986248685472, 'samples': 1461856, 'steps': 2855, 'loss/train': 2.1085658073425293} -09/21/2021 00:22:58 - INFO - __main__ - Step 45684: {'lr': 0.00019909986248685472, 'samples': 1461888, 'steps': 2855, 'loss/train': 1.877588152885437} -09/21/2021 00:22:58 - INFO - __main__ - Step 45685: {'lr': 0.00019909986248685472, 'samples': 1461920, 'steps': 2855, 'loss/train': 2.828366279602051} -09/21/2021 00:22:59 - INFO - __main__ - Step 45686: {'lr': 0.00019909986248685472, 'samples': 1461952, 'steps': 2855, 'loss/train': 0.4573300778865814} -09/21/2021 00:23:00 - INFO - __main__ - Step 45687: {'lr': 0.00019909986248685472, 'samples': 1461984, 'steps': 2855, 'loss/train': 1.7105298042297363} -09/21/2021 00:23:01 - INFO - __main__ - Step 45688: {'lr': 0.00019909986248685472, 'samples': 1462016, 'steps': 2855, 'loss/train': 2.1960153579711914} -09/21/2021 00:23:01 - INFO - __main__ - Step 45689: {'lr': 0.00019909986248685472, 'samples': 1462048, 'steps': 2855, 'loss/train': 1.888074517250061} -09/21/2021 00:23:02 - INFO - __main__ - Step 45690: {'lr': 0.00019909986248685472, 'samples': 1462080, 'steps': 2855, 'loss/train': 1.5583099126815796} -09/21/2021 00:23:03 - INFO - __main__ - Step 45691: {'lr': 0.00019909986248685472, 'samples': 1462112, 'steps': 2855, 'loss/train': 1.8521922826766968} -09/21/2021 00:23:04 - INFO - __main__ - Step 45692: {'lr': 0.00019909986248685472, 'samples': 1462144, 'steps': 2855, 'loss/train': 2.063340902328491} -09/21/2021 00:23:04 - INFO - __main__ - Step 45693: {'lr': 0.00019909986248685472, 'samples': 1462176, 'steps': 2855, 'loss/train': 1.4885220527648926} -09/21/2021 00:23:05 - INFO - __main__ - Step 45694: {'lr': 0.00019909986248685472, 'samples': 1462208, 'steps': 2855, 'loss/train': 1.7256453037261963} -09/21/2021 00:23:06 - INFO - __main__ - Step 45695: {'lr': 0.00019909986248685472, 'samples': 1462240, 'steps': 2855, 'loss/train': 1.1283619403839111} -09/21/2021 00:23:07 - INFO - __main__ - Step 45696: {'lr': 0.00019909986248685472, 'samples': 1462272, 'steps': 2855, 'loss/train': 2.329228162765503} -09/21/2021 00:23:08 - INFO - __main__ - Step 45697: {'lr': 0.00019909900833306278, 'samples': 1462304, 'steps': 2856, 'loss/train': 2.340880870819092} -09/21/2021 00:23:08 - INFO - __main__ - Step 45698: {'lr': 0.00019909900833306278, 'samples': 1462336, 'steps': 2856, 'loss/train': 2.044642925262451} -09/21/2021 00:23:09 - INFO - __main__ - Step 45699: {'lr': 0.00019909900833306278, 'samples': 1462368, 'steps': 2856, 'loss/train': 3.015611171722412} -09/21/2021 00:23:10 - INFO - __main__ - Step 45700: {'lr': 0.00019909900833306278, 'samples': 1462400, 'steps': 2856, 'loss/train': 1.4908562898635864} -09/21/2021 00:23:11 - INFO - __main__ - Step 45701: {'lr': 0.00019909900833306278, 'samples': 1462432, 'steps': 2856, 'loss/train': 2.477198362350464} -09/21/2021 00:23:11 - INFO - __main__ - Step 45702: {'lr': 0.00019909900833306278, 'samples': 1462464, 'steps': 2856, 'loss/train': 1.9502631425857544} -09/21/2021 00:23:13 - INFO - __main__ - Step 45703: {'lr': 0.00019909900833306278, 'samples': 1462496, 'steps': 2856, 'loss/train': 2.134084701538086} -09/21/2021 00:23:13 - INFO - __main__ - Step 45704: {'lr': 0.00019909900833306278, 'samples': 1462528, 'steps': 2856, 'loss/train': 1.4421874284744263} -09/21/2021 00:23:14 - INFO - __main__ - Step 45705: {'lr': 0.00019909900833306278, 'samples': 1462560, 'steps': 2856, 'loss/train': 1.2747682332992554} -09/21/2021 00:23:15 - INFO - __main__ - Step 45706: {'lr': 0.00019909900833306278, 'samples': 1462592, 'steps': 2856, 'loss/train': 1.2721290588378906} -09/21/2021 00:23:16 - INFO - __main__ - Step 45707: {'lr': 0.00019909900833306278, 'samples': 1462624, 'steps': 2856, 'loss/train': 2.55241060256958} -09/21/2021 00:23:16 - INFO - __main__ - Step 45708: {'lr': 0.00019909900833306278, 'samples': 1462656, 'steps': 2856, 'loss/train': 4.810369491577148} -09/21/2021 00:23:17 - INFO - __main__ - Step 45709: {'lr': 0.00019909900833306278, 'samples': 1462688, 'steps': 2856, 'loss/train': 1.4715989828109741} -09/21/2021 00:23:18 - INFO - __main__ - Step 45710: {'lr': 0.00019909900833306278, 'samples': 1462720, 'steps': 2856, 'loss/train': 1.1846054792404175} -09/21/2021 00:23:19 - INFO - __main__ - Step 45711: {'lr': 0.00019909900833306278, 'samples': 1462752, 'steps': 2856, 'loss/train': 1.3544988632202148} -09/21/2021 00:23:19 - INFO - __main__ - Step 45712: {'lr': 0.00019909900833306278, 'samples': 1462784, 'steps': 2856, 'loss/train': 1.9274017810821533} -09/21/2021 00:23:20 - INFO - __main__ - Step 45713: {'lr': 0.00019909815377603732, 'samples': 1462816, 'steps': 2857, 'loss/train': 1.8826467990875244} -09/21/2021 00:23:21 - INFO - __main__ - Step 45714: {'lr': 0.00019909815377603732, 'samples': 1462848, 'steps': 2857, 'loss/train': 1.6065298318862915} -09/21/2021 00:23:22 - INFO - __main__ - Step 45715: {'lr': 0.00019909815377603732, 'samples': 1462880, 'steps': 2857, 'loss/train': 1.850794792175293} -09/21/2021 00:23:23 - INFO - __main__ - Step 45716: {'lr': 0.00019909815377603732, 'samples': 1462912, 'steps': 2857, 'loss/train': 2.1685945987701416} -09/21/2021 00:23:23 - INFO - __main__ - Step 45717: {'lr': 0.00019909815377603732, 'samples': 1462944, 'steps': 2857, 'loss/train': 2.2606379985809326} -09/21/2021 00:23:24 - INFO - __main__ - Step 45718: {'lr': 0.00019909815377603732, 'samples': 1462976, 'steps': 2857, 'loss/train': 1.4452402591705322} -09/21/2021 00:23:25 - INFO - __main__ - Step 45719: {'lr': 0.00019909815377603732, 'samples': 1463008, 'steps': 2857, 'loss/train': 2.486513614654541} -09/21/2021 00:23:26 - INFO - __main__ - Step 45720: {'lr': 0.00019909815377603732, 'samples': 1463040, 'steps': 2857, 'loss/train': 2.8440091609954834} -09/21/2021 00:23:26 - INFO - __main__ - Step 45721: {'lr': 0.00019909815377603732, 'samples': 1463072, 'steps': 2857, 'loss/train': 1.9382612705230713} -09/21/2021 00:23:27 - INFO - __main__ - Step 45722: {'lr': 0.00019909815377603732, 'samples': 1463104, 'steps': 2857, 'loss/train': 1.755562663078308} -09/21/2021 00:23:28 - INFO - __main__ - Step 45723: {'lr': 0.00019909815377603732, 'samples': 1463136, 'steps': 2857, 'loss/train': 2.5899853706359863} -09/21/2021 00:23:29 - INFO - __main__ - Step 45724: {'lr': 0.00019909815377603732, 'samples': 1463168, 'steps': 2857, 'loss/train': 1.5716861486434937} -09/21/2021 00:23:29 - INFO - __main__ - Step 45725: {'lr': 0.00019909815377603732, 'samples': 1463200, 'steps': 2857, 'loss/train': 1.7499189376831055} -09/21/2021 00:23:30 - INFO - __main__ - Step 45726: {'lr': 0.00019909815377603732, 'samples': 1463232, 'steps': 2857, 'loss/train': 2.166938066482544} -09/21/2021 00:23:31 - INFO - __main__ - Step 45727: {'lr': 0.00019909815377603732, 'samples': 1463264, 'steps': 2857, 'loss/train': 1.8771483898162842} -09/21/2021 00:23:32 - INFO - __main__ - Step 45728: {'lr': 0.00019909815377603732, 'samples': 1463296, 'steps': 2857, 'loss/train': 1.5011441707611084} -09/21/2021 00:23:32 - INFO - __main__ - Step 45729: {'lr': 0.0001990972988157819, 'samples': 1463328, 'steps': 2858, 'loss/train': 2.2200450897216797} -09/21/2021 00:23:33 - INFO - __main__ - Step 45730: {'lr': 0.0001990972988157819, 'samples': 1463360, 'steps': 2858, 'loss/train': 1.5506852865219116} -09/21/2021 00:23:34 - INFO - __main__ - Step 45731: {'lr': 0.0001990972988157819, 'samples': 1463392, 'steps': 2858, 'loss/train': 1.4214389324188232} -09/21/2021 00:23:35 - INFO - __main__ - Step 45732: {'lr': 0.0001990972988157819, 'samples': 1463424, 'steps': 2858, 'loss/train': 1.879167079925537} -09/21/2021 00:23:35 - INFO - __main__ - Step 45733: {'lr': 0.0001990972988157819, 'samples': 1463456, 'steps': 2858, 'loss/train': 2.126875638961792} -09/21/2021 00:23:37 - INFO - __main__ - Step 45734: {'lr': 0.0001990972988157819, 'samples': 1463488, 'steps': 2858, 'loss/train': 2.015151023864746} -09/21/2021 00:23:37 - INFO - __main__ - Step 45735: {'lr': 0.0001990972988157819, 'samples': 1463520, 'steps': 2858, 'loss/train': 2.03005313873291} -09/21/2021 00:23:38 - INFO - __main__ - Step 45736: {'lr': 0.0001990972988157819, 'samples': 1463552, 'steps': 2858, 'loss/train': 1.8209465742111206} -09/21/2021 00:23:39 - INFO - __main__ - Step 45737: {'lr': 0.0001990972988157819, 'samples': 1463584, 'steps': 2858, 'loss/train': 2.1599843502044678} -09/21/2021 00:23:40 - INFO - __main__ - Step 45738: {'lr': 0.0001990972988157819, 'samples': 1463616, 'steps': 2858, 'loss/train': 2.093634843826294} -09/21/2021 00:23:40 - INFO - __main__ - Step 45739: {'lr': 0.0001990972988157819, 'samples': 1463648, 'steps': 2858, 'loss/train': 2.072951316833496} -09/21/2021 00:23:41 - INFO - __main__ - Step 45740: {'lr': 0.0001990972988157819, 'samples': 1463680, 'steps': 2858, 'loss/train': 1.4565891027450562} -09/21/2021 00:23:42 - INFO - __main__ - Step 45741: {'lr': 0.0001990972988157819, 'samples': 1463712, 'steps': 2858, 'loss/train': 2.17219614982605} -09/21/2021 00:23:43 - INFO - __main__ - Step 45742: {'lr': 0.0001990972988157819, 'samples': 1463744, 'steps': 2858, 'loss/train': 0.7863460779190063} -09/21/2021 00:23:43 - INFO - __main__ - Step 45743: {'lr': 0.0001990972988157819, 'samples': 1463776, 'steps': 2858, 'loss/train': 1.9166676998138428} -09/21/2021 00:23:44 - INFO - __main__ - Step 45744: {'lr': 0.0001990972988157819, 'samples': 1463808, 'steps': 2858, 'loss/train': 1.7555360794067383} -09/21/2021 00:23:45 - INFO - __main__ - Step 45745: {'lr': 0.00019909644345229995, 'samples': 1463840, 'steps': 2859, 'loss/train': 2.3416907787323} -09/21/2021 00:23:46 - INFO - __main__ - Step 45746: {'lr': 0.00019909644345229995, 'samples': 1463872, 'steps': 2859, 'loss/train': 0.48616302013397217} -09/21/2021 00:23:47 - INFO - __main__ - Step 45747: {'lr': 0.00019909644345229995, 'samples': 1463904, 'steps': 2859, 'loss/train': 1.9939515590667725} -09/21/2021 00:23:47 - INFO - __main__ - Step 45748: {'lr': 0.00019909644345229995, 'samples': 1463936, 'steps': 2859, 'loss/train': 2.6273365020751953} -09/21/2021 00:23:48 - INFO - __main__ - Step 45749: {'lr': 0.00019909644345229995, 'samples': 1463968, 'steps': 2859, 'loss/train': 2.271075487136841} -09/21/2021 00:23:49 - INFO - __main__ - Step 45750: {'lr': 0.00019909644345229995, 'samples': 1464000, 'steps': 2859, 'loss/train': 1.8725827932357788} -09/21/2021 00:23:50 - INFO - __main__ - Step 45751: {'lr': 0.00019909644345229995, 'samples': 1464032, 'steps': 2859, 'loss/train': 1.964431643486023} -09/21/2021 00:23:50 - INFO - __main__ - Step 45752: {'lr': 0.00019909644345229995, 'samples': 1464064, 'steps': 2859, 'loss/train': 1.1319655179977417} -09/21/2021 00:23:51 - INFO - __main__ - Step 45753: {'lr': 0.00019909644345229995, 'samples': 1464096, 'steps': 2859, 'loss/train': 2.0400166511535645} -09/21/2021 00:23:52 - INFO - __main__ - Step 45754: {'lr': 0.00019909644345229995, 'samples': 1464128, 'steps': 2859, 'loss/train': 2.1332733631134033} -09/21/2021 00:23:53 - INFO - __main__ - Step 45755: {'lr': 0.00019909644345229995, 'samples': 1464160, 'steps': 2859, 'loss/train': 1.2222439050674438} -09/21/2021 00:23:53 - INFO - __main__ - Step 45756: {'lr': 0.00019909644345229995, 'samples': 1464192, 'steps': 2859, 'loss/train': 2.0291731357574463} -09/21/2021 00:23:54 - INFO - __main__ - Step 45757: {'lr': 0.00019909644345229995, 'samples': 1464224, 'steps': 2859, 'loss/train': 2.0410046577453613} -09/21/2021 00:23:55 - INFO - __main__ - Step 45758: {'lr': 0.00019909644345229995, 'samples': 1464256, 'steps': 2859, 'loss/train': 2.1306915283203125} -09/21/2021 00:23:56 - INFO - __main__ - Step 45759: {'lr': 0.00019909644345229995, 'samples': 1464288, 'steps': 2859, 'loss/train': 2.914177894592285} -09/21/2021 00:23:56 - INFO - __main__ - Step 45760: {'lr': 0.00019909644345229995, 'samples': 1464320, 'steps': 2859, 'loss/train': 1.6732017993927002} -09/21/2021 00:23:57 - INFO - __main__ - Step 45761: {'lr': 0.00019909558768559495, 'samples': 1464352, 'steps': 2860, 'loss/train': 2.2663207054138184} -09/21/2021 00:23:58 - INFO - __main__ - Step 45762: {'lr': 0.00019909558768559495, 'samples': 1464384, 'steps': 2860, 'loss/train': 0.9441612362861633} -09/21/2021 00:23:59 - INFO - __main__ - Step 45763: {'lr': 0.00019909558768559495, 'samples': 1464416, 'steps': 2860, 'loss/train': 0.9605840444564819} -09/21/2021 00:24:00 - INFO - __main__ - Step 45764: {'lr': 0.00019909558768559495, 'samples': 1464448, 'steps': 2860, 'loss/train': 1.3597415685653687} -09/21/2021 00:24:01 - INFO - __main__ - Step 45765: {'lr': 0.00019909558768559495, 'samples': 1464480, 'steps': 2860, 'loss/train': 2.26517915725708} -09/21/2021 00:24:02 - INFO - __main__ - Step 45766: {'lr': 0.00019909558768559495, 'samples': 1464512, 'steps': 2860, 'loss/train': 2.539381265640259} -09/21/2021 00:24:02 - INFO - __main__ - Step 45767: {'lr': 0.00019909558768559495, 'samples': 1464544, 'steps': 2860, 'loss/train': 2.1279780864715576} -09/21/2021 00:24:03 - INFO - __main__ - Step 45768: {'lr': 0.00019909558768559495, 'samples': 1464576, 'steps': 2860, 'loss/train': 1.6208109855651855} -09/21/2021 00:24:04 - INFO - __main__ - Step 45769: {'lr': 0.00019909558768559495, 'samples': 1464608, 'steps': 2860, 'loss/train': 1.7500219345092773} -09/21/2021 00:24:05 - INFO - __main__ - Step 45770: {'lr': 0.00019909558768559495, 'samples': 1464640, 'steps': 2860, 'loss/train': 1.7719318866729736} -09/21/2021 00:24:05 - INFO - __main__ - Step 45771: {'lr': 0.00019909558768559495, 'samples': 1464672, 'steps': 2860, 'loss/train': 2.109924077987671} -09/21/2021 00:24:06 - INFO - __main__ - Step 45772: {'lr': 0.00019909558768559495, 'samples': 1464704, 'steps': 2860, 'loss/train': 1.2146574258804321} -09/21/2021 00:24:07 - INFO - __main__ - Step 45773: {'lr': 0.00019909558768559495, 'samples': 1464736, 'steps': 2860, 'loss/train': 1.8539263010025024} -09/21/2021 00:24:08 - INFO - __main__ - Step 45774: {'lr': 0.00019909558768559495, 'samples': 1464768, 'steps': 2860, 'loss/train': 1.0337839126586914} -09/21/2021 00:24:08 - INFO - __main__ - Step 45775: {'lr': 0.00019909558768559495, 'samples': 1464800, 'steps': 2860, 'loss/train': 2.4914653301239014} -09/21/2021 00:24:09 - INFO - __main__ - Step 45776: {'lr': 0.00019909558768559495, 'samples': 1464832, 'steps': 2860, 'loss/train': 1.7349516153335571} -09/21/2021 00:24:10 - INFO - __main__ - Step 45777: {'lr': 0.0001990947315156704, 'samples': 1464864, 'steps': 2861, 'loss/train': 0.7290442585945129} -09/21/2021 00:24:11 - INFO - __main__ - Step 45778: {'lr': 0.0001990947315156704, 'samples': 1464896, 'steps': 2861, 'loss/train': 0.9661502242088318} -09/21/2021 00:24:11 - INFO - __main__ - Step 45779: {'lr': 0.0001990947315156704, 'samples': 1464928, 'steps': 2861, 'loss/train': 1.1598565578460693} -09/21/2021 00:24:12 - INFO - __main__ - Step 45780: {'lr': 0.0001990947315156704, 'samples': 1464960, 'steps': 2861, 'loss/train': 0.7169561386108398} -09/21/2021 00:24:13 - INFO - __main__ - Step 45781: {'lr': 0.0001990947315156704, 'samples': 1464992, 'steps': 2861, 'loss/train': 2.6428017616271973} -09/21/2021 00:24:14 - INFO - __main__ - Step 45782: {'lr': 0.0001990947315156704, 'samples': 1465024, 'steps': 2861, 'loss/train': 2.4889822006225586} -09/21/2021 00:24:14 - INFO - __main__ - Step 45783: {'lr': 0.0001990947315156704, 'samples': 1465056, 'steps': 2861, 'loss/train': 1.7420077323913574} -09/21/2021 00:24:15 - INFO - __main__ - Step 45784: {'lr': 0.0001990947315156704, 'samples': 1465088, 'steps': 2861, 'loss/train': 2.220285415649414} -09/21/2021 00:24:16 - INFO - __main__ - Step 45785: {'lr': 0.0001990947315156704, 'samples': 1465120, 'steps': 2861, 'loss/train': 2.7836453914642334} -09/21/2021 00:24:17 - INFO - __main__ - Step 45786: {'lr': 0.0001990947315156704, 'samples': 1465152, 'steps': 2861, 'loss/train': 2.2787511348724365} -09/21/2021 00:24:17 - INFO - __main__ - Step 45787: {'lr': 0.0001990947315156704, 'samples': 1465184, 'steps': 2861, 'loss/train': 1.6989879608154297} -09/21/2021 00:24:18 - INFO - __main__ - Step 45788: {'lr': 0.0001990947315156704, 'samples': 1465216, 'steps': 2861, 'loss/train': 1.6284269094467163} -09/21/2021 00:24:19 - INFO - __main__ - Step 45789: {'lr': 0.0001990947315156704, 'samples': 1465248, 'steps': 2861, 'loss/train': 2.1088333129882812} -09/21/2021 00:24:20 - INFO - __main__ - Step 45790: {'lr': 0.0001990947315156704, 'samples': 1465280, 'steps': 2861, 'loss/train': 2.699329137802124} -09/21/2021 00:24:20 - INFO - __main__ - Step 45791: {'lr': 0.0001990947315156704, 'samples': 1465312, 'steps': 2861, 'loss/train': 2.317729949951172} -09/21/2021 00:24:21 - INFO - __main__ - Step 45792: {'lr': 0.0001990947315156704, 'samples': 1465344, 'steps': 2861, 'loss/train': 2.5189273357391357} -09/21/2021 00:24:22 - INFO - __main__ - Step 45793: {'lr': 0.00019909387494252974, 'samples': 1465376, 'steps': 2862, 'loss/train': 1.4662597179412842} -09/21/2021 00:24:23 - INFO - __main__ - Step 45794: {'lr': 0.00019909387494252974, 'samples': 1465408, 'steps': 2862, 'loss/train': 2.2976467609405518} -09/21/2021 00:24:24 - INFO - __main__ - Step 45795: {'lr': 0.00019909387494252974, 'samples': 1465440, 'steps': 2862, 'loss/train': 2.1308414936065674} -09/21/2021 00:24:25 - INFO - __main__ - Step 45796: {'lr': 0.00019909387494252974, 'samples': 1465472, 'steps': 2862, 'loss/train': 2.555341958999634} -09/21/2021 00:24:26 - INFO - __main__ - Step 45797: {'lr': 0.00019909387494252974, 'samples': 1465504, 'steps': 2862, 'loss/train': 1.8250850439071655} -09/21/2021 00:24:27 - INFO - __main__ - Step 45798: {'lr': 0.00019909387494252974, 'samples': 1465536, 'steps': 2862, 'loss/train': 1.7445191144943237} -09/21/2021 00:24:28 - INFO - __main__ - Step 45799: {'lr': 0.00019909387494252974, 'samples': 1465568, 'steps': 2862, 'loss/train': 2.137583017349243} -09/21/2021 00:24:28 - INFO - __main__ - Step 45800: {'lr': 0.00019909387494252974, 'samples': 1465600, 'steps': 2862, 'loss/train': 2.0973706245422363} -09/21/2021 00:24:29 - INFO - __main__ - Step 45801: {'lr': 0.00019909387494252974, 'samples': 1465632, 'steps': 2862, 'loss/train': 1.9894201755523682} -09/21/2021 00:24:30 - INFO - __main__ - Step 45802: {'lr': 0.00019909387494252974, 'samples': 1465664, 'steps': 2862, 'loss/train': 2.0099289417266846} -09/21/2021 00:24:31 - INFO - __main__ - Step 45803: {'lr': 0.00019909387494252974, 'samples': 1465696, 'steps': 2862, 'loss/train': 1.8038020133972168} -09/21/2021 00:24:31 - INFO - __main__ - Step 45804: {'lr': 0.00019909387494252974, 'samples': 1465728, 'steps': 2862, 'loss/train': 1.7376587390899658} -09/21/2021 00:24:32 - INFO - __main__ - Step 45805: {'lr': 0.00019909387494252974, 'samples': 1465760, 'steps': 2862, 'loss/train': 2.568675994873047} -09/21/2021 00:24:33 - INFO - __main__ - Step 45806: {'lr': 0.00019909387494252974, 'samples': 1465792, 'steps': 2862, 'loss/train': 2.3900301456451416} -09/21/2021 00:24:34 - INFO - __main__ - Step 45807: {'lr': 0.00019909387494252974, 'samples': 1465824, 'steps': 2862, 'loss/train': 2.3239364624023438} -09/21/2021 00:24:34 - INFO - __main__ - Step 45808: {'lr': 0.00019909387494252974, 'samples': 1465856, 'steps': 2862, 'loss/train': 1.3705394268035889} -09/21/2021 00:24:35 - INFO - __main__ - Step 45809: {'lr': 0.00019909301796617652, 'samples': 1465888, 'steps': 2863, 'loss/train': 2.0300943851470947} -09/21/2021 00:24:36 - INFO - __main__ - Step 45810: {'lr': 0.00019909301796617652, 'samples': 1465920, 'steps': 2863, 'loss/train': 2.198356866836548} -09/21/2021 00:24:37 - INFO - __main__ - Step 45811: {'lr': 0.00019909301796617652, 'samples': 1465952, 'steps': 2863, 'loss/train': 2.8062679767608643} -09/21/2021 00:24:37 - INFO - __main__ - Step 45812: {'lr': 0.00019909301796617652, 'samples': 1465984, 'steps': 2863, 'loss/train': 1.8540834188461304} -09/21/2021 00:24:38 - INFO - __main__ - Step 45813: {'lr': 0.00019909301796617652, 'samples': 1466016, 'steps': 2863, 'loss/train': 2.381399631500244} -09/21/2021 00:24:39 - INFO - __main__ - Step 45814: {'lr': 0.00019909301796617652, 'samples': 1466048, 'steps': 2863, 'loss/train': 2.1890177726745605} -09/21/2021 00:24:40 - INFO - __main__ - Step 45815: {'lr': 0.00019909301796617652, 'samples': 1466080, 'steps': 2863, 'loss/train': 1.3946232795715332} -09/21/2021 00:24:40 - INFO - __main__ - Step 45816: {'lr': 0.00019909301796617652, 'samples': 1466112, 'steps': 2863, 'loss/train': 1.1472901105880737} -09/21/2021 00:24:41 - INFO - __main__ - Step 45817: {'lr': 0.00019909301796617652, 'samples': 1466144, 'steps': 2863, 'loss/train': 1.8620573282241821} -09/21/2021 00:24:42 - INFO - __main__ - Step 45818: {'lr': 0.00019909301796617652, 'samples': 1466176, 'steps': 2863, 'loss/train': 1.7137161493301392} -09/21/2021 00:24:43 - INFO - __main__ - Step 45819: {'lr': 0.00019909301796617652, 'samples': 1466208, 'steps': 2863, 'loss/train': 0.8060780167579651} -09/21/2021 00:24:43 - INFO - __main__ - Step 45820: {'lr': 0.00019909301796617652, 'samples': 1466240, 'steps': 2863, 'loss/train': 0.8829475045204163} -09/21/2021 00:24:44 - INFO - __main__ - Step 45821: {'lr': 0.00019909301796617652, 'samples': 1466272, 'steps': 2863, 'loss/train': 0.7351418137550354} -09/21/2021 00:24:45 - INFO - __main__ - Step 45822: {'lr': 0.00019909301796617652, 'samples': 1466304, 'steps': 2863, 'loss/train': 0.5423137545585632} -09/21/2021 00:24:46 - INFO - __main__ - Step 45823: {'lr': 0.00019909301796617652, 'samples': 1466336, 'steps': 2863, 'loss/train': 0.44547560811042786} -09/21/2021 00:24:46 - INFO - __main__ - Step 45824: {'lr': 0.00019909301796617652, 'samples': 1466368, 'steps': 2863, 'loss/train': 0.7454389929771423} -09/21/2021 00:24:47 - INFO - __main__ - Step 45825: {'lr': 0.00019909216058661418, 'samples': 1466400, 'steps': 2864, 'loss/train': 0.43643873929977417} -09/21/2021 00:24:48 - INFO - __main__ - Step 45826: {'lr': 0.00019909216058661418, 'samples': 1466432, 'steps': 2864, 'loss/train': 0.8283472657203674} -09/21/2021 00:24:49 - INFO - __main__ - Step 45827: {'lr': 0.00019909216058661418, 'samples': 1466464, 'steps': 2864, 'loss/train': 1.8289732933044434} -09/21/2021 00:24:50 - INFO - __main__ - Step 45828: {'lr': 0.00019909216058661418, 'samples': 1466496, 'steps': 2864, 'loss/train': 2.3662049770355225} -09/21/2021 00:24:50 - INFO - __main__ - Step 45829: {'lr': 0.00019909216058661418, 'samples': 1466528, 'steps': 2864, 'loss/train': 1.7150272130966187} -09/21/2021 00:24:51 - INFO - __main__ - Step 45830: {'lr': 0.00019909216058661418, 'samples': 1466560, 'steps': 2864, 'loss/train': 1.6200584173202515} -09/21/2021 00:24:52 - INFO - __main__ - Step 45831: {'lr': 0.00019909216058661418, 'samples': 1466592, 'steps': 2864, 'loss/train': 0.4455219507217407} -09/21/2021 00:24:53 - INFO - __main__ - Step 45832: {'lr': 0.00019909216058661418, 'samples': 1466624, 'steps': 2864, 'loss/train': 1.711608648300171} -09/21/2021 00:24:54 - INFO - __main__ - Step 45833: {'lr': 0.00019909216058661418, 'samples': 1466656, 'steps': 2864, 'loss/train': 1.4537155628204346} -09/21/2021 00:24:55 - INFO - __main__ - Step 45834: {'lr': 0.00019909216058661418, 'samples': 1466688, 'steps': 2864, 'loss/train': 2.5683796405792236} -09/21/2021 00:24:55 - INFO - __main__ - Step 45835: {'lr': 0.00019909216058661418, 'samples': 1466720, 'steps': 2864, 'loss/train': 2.163065195083618} -09/21/2021 00:24:56 - INFO - __main__ - Step 45836: {'lr': 0.00019909216058661418, 'samples': 1466752, 'steps': 2864, 'loss/train': 2.0495948791503906} -09/21/2021 00:24:57 - INFO - __main__ - Step 45837: {'lr': 0.00019909216058661418, 'samples': 1466784, 'steps': 2864, 'loss/train': 1.6863384246826172} -09/21/2021 00:24:58 - INFO - __main__ - Step 45838: {'lr': 0.00019909216058661418, 'samples': 1466816, 'steps': 2864, 'loss/train': 1.5717124938964844} -09/21/2021 00:24:58 - INFO - __main__ - Step 45839: {'lr': 0.00019909216058661418, 'samples': 1466848, 'steps': 2864, 'loss/train': 1.4699374437332153} -09/21/2021 00:24:59 - INFO - __main__ - Step 45840: {'lr': 0.00019909216058661418, 'samples': 1466880, 'steps': 2864, 'loss/train': 2.6660985946655273} -09/21/2021 00:25:00 - INFO - __main__ - Step 45841: {'lr': 0.00019909130280384621, 'samples': 1466912, 'steps': 2865, 'loss/train': 2.115370035171509} -09/21/2021 00:25:01 - INFO - __main__ - Step 45842: {'lr': 0.00019909130280384621, 'samples': 1466944, 'steps': 2865, 'loss/train': 2.6706788539886475} -09/21/2021 00:25:02 - INFO - __main__ - Step 45843: {'lr': 0.00019909130280384621, 'samples': 1466976, 'steps': 2865, 'loss/train': 1.1264572143554688} -09/21/2021 00:25:02 - INFO - __main__ - Step 45844: {'lr': 0.00019909130280384621, 'samples': 1467008, 'steps': 2865, 'loss/train': 0.4185682237148285} -09/21/2021 00:25:03 - INFO - __main__ - Step 45845: {'lr': 0.00019909130280384621, 'samples': 1467040, 'steps': 2865, 'loss/train': 2.206775426864624} -09/21/2021 00:25:04 - INFO - __main__ - Step 45846: {'lr': 0.00019909130280384621, 'samples': 1467072, 'steps': 2865, 'loss/train': 2.8241517543792725} -09/21/2021 00:25:05 - INFO - __main__ - Step 45847: {'lr': 0.00019909130280384621, 'samples': 1467104, 'steps': 2865, 'loss/train': 2.9785144329071045} -09/21/2021 00:25:05 - INFO - __main__ - Step 45848: {'lr': 0.00019909130280384621, 'samples': 1467136, 'steps': 2865, 'loss/train': 1.9381921291351318} -09/21/2021 00:25:06 - INFO - __main__ - Step 45849: {'lr': 0.00019909130280384621, 'samples': 1467168, 'steps': 2865, 'loss/train': 1.452839732170105} -09/21/2021 00:25:07 - INFO - __main__ - Step 45850: {'lr': 0.00019909130280384621, 'samples': 1467200, 'steps': 2865, 'loss/train': 1.7680375576019287} -09/21/2021 00:25:08 - INFO - __main__ - Step 45851: {'lr': 0.00019909130280384621, 'samples': 1467232, 'steps': 2865, 'loss/train': 2.0844268798828125} -09/21/2021 00:25:08 - INFO - __main__ - Step 45852: {'lr': 0.00019909130280384621, 'samples': 1467264, 'steps': 2865, 'loss/train': 2.4379701614379883} -09/21/2021 00:25:09 - INFO - __main__ - Step 45853: {'lr': 0.00019909130280384621, 'samples': 1467296, 'steps': 2865, 'loss/train': 2.1696479320526123} -09/21/2021 00:25:10 - INFO - __main__ - Step 45854: {'lr': 0.00019909130280384621, 'samples': 1467328, 'steps': 2865, 'loss/train': 1.003838300704956} -09/21/2021 00:25:11 - INFO - __main__ - Step 45855: {'lr': 0.00019909130280384621, 'samples': 1467360, 'steps': 2865, 'loss/train': 1.8239012956619263} -09/21/2021 00:25:11 - INFO - __main__ - Step 45856: {'lr': 0.00019909130280384621, 'samples': 1467392, 'steps': 2865, 'loss/train': 2.797192335128784} -09/21/2021 00:25:12 - INFO - __main__ - Step 45857: {'lr': 0.00019909044461787615, 'samples': 1467424, 'steps': 2866, 'loss/train': 2.0953891277313232} -09/21/2021 00:25:13 - INFO - __main__ - Step 45858: {'lr': 0.00019909044461787615, 'samples': 1467456, 'steps': 2866, 'loss/train': 1.6961586475372314} -09/21/2021 00:25:14 - INFO - __main__ - Step 45859: {'lr': 0.00019909044461787615, 'samples': 1467488, 'steps': 2866, 'loss/train': 1.6995846033096313} -09/21/2021 00:25:14 - INFO - __main__ - Step 45860: {'lr': 0.00019909044461787615, 'samples': 1467520, 'steps': 2866, 'loss/train': 2.0605857372283936} -09/21/2021 00:25:15 - INFO - __main__ - Step 45861: {'lr': 0.00019909044461787615, 'samples': 1467552, 'steps': 2866, 'loss/train': 1.5914487838745117} -09/21/2021 00:25:16 - INFO - __main__ - Step 45862: {'lr': 0.00019909044461787615, 'samples': 1467584, 'steps': 2866, 'loss/train': 2.0317399501800537} -09/21/2021 00:25:18 - INFO - __main__ - Step 45863: {'lr': 0.00019909044461787615, 'samples': 1467616, 'steps': 2866, 'loss/train': 1.8453601598739624} -09/21/2021 00:25:18 - INFO - __main__ - Step 45864: {'lr': 0.00019909044461787615, 'samples': 1467648, 'steps': 2866, 'loss/train': 2.4998416900634766} -09/21/2021 00:25:19 - INFO - __main__ - Step 45865: {'lr': 0.00019909044461787615, 'samples': 1467680, 'steps': 2866, 'loss/train': 1.5230497121810913} -09/21/2021 00:25:20 - INFO - __main__ - Step 45866: {'lr': 0.00019909044461787615, 'samples': 1467712, 'steps': 2866, 'loss/train': 2.5604851245880127} -09/21/2021 00:25:21 - INFO - __main__ - Step 45867: {'lr': 0.00019909044461787615, 'samples': 1467744, 'steps': 2866, 'loss/train': 2.4276602268218994} -09/21/2021 00:25:21 - INFO - __main__ - Step 45868: {'lr': 0.00019909044461787615, 'samples': 1467776, 'steps': 2866, 'loss/train': 2.096062421798706} -09/21/2021 00:25:22 - INFO - __main__ - Step 45869: {'lr': 0.00019909044461787615, 'samples': 1467808, 'steps': 2866, 'loss/train': 2.536816358566284} -09/21/2021 00:25:23 - INFO - __main__ - Step 45870: {'lr': 0.00019909044461787615, 'samples': 1467840, 'steps': 2866, 'loss/train': 2.4488353729248047} -09/21/2021 00:25:24 - INFO - __main__ - Step 45871: {'lr': 0.00019909044461787615, 'samples': 1467872, 'steps': 2866, 'loss/train': 1.7138645648956299} -09/21/2021 00:25:24 - INFO - __main__ - Step 45872: {'lr': 0.00019909044461787615, 'samples': 1467904, 'steps': 2866, 'loss/train': 2.194481134414673} -09/21/2021 00:25:25 - INFO - __main__ - Step 45873: {'lr': 0.00019908958602870742, 'samples': 1467936, 'steps': 2867, 'loss/train': 2.1512398719787598} -09/21/2021 00:25:26 - INFO - __main__ - Step 45874: {'lr': 0.00019908958602870742, 'samples': 1467968, 'steps': 2867, 'loss/train': 0.5838533043861389} -09/21/2021 00:25:27 - INFO - __main__ - Step 45875: {'lr': 0.00019908958602870742, 'samples': 1468000, 'steps': 2867, 'loss/train': 2.2872989177703857} -09/21/2021 00:25:28 - INFO - __main__ - Step 45876: {'lr': 0.00019908958602870742, 'samples': 1468032, 'steps': 2867, 'loss/train': 1.89433753490448} -09/21/2021 00:25:28 - INFO - __main__ - Step 45877: {'lr': 0.00019908958602870742, 'samples': 1468064, 'steps': 2867, 'loss/train': 2.113534927368164} -09/21/2021 00:25:29 - INFO - __main__ - Step 45878: {'lr': 0.00019908958602870742, 'samples': 1468096, 'steps': 2867, 'loss/train': 2.4304237365722656} -09/21/2021 00:25:30 - INFO - __main__ - Step 45879: {'lr': 0.00019908958602870742, 'samples': 1468128, 'steps': 2867, 'loss/train': 2.8606908321380615} -09/21/2021 00:25:31 - INFO - __main__ - Step 45880: {'lr': 0.00019908958602870742, 'samples': 1468160, 'steps': 2867, 'loss/train': 2.259021520614624} -09/21/2021 00:25:31 - INFO - __main__ - Step 45881: {'lr': 0.00019908958602870742, 'samples': 1468192, 'steps': 2867, 'loss/train': 0.9297533631324768} -09/21/2021 00:25:32 - INFO - __main__ - Step 45882: {'lr': 0.00019908958602870742, 'samples': 1468224, 'steps': 2867, 'loss/train': 2.972621440887451} -09/21/2021 00:25:33 - INFO - __main__ - Step 45883: {'lr': 0.00019908958602870742, 'samples': 1468256, 'steps': 2867, 'loss/train': 1.6836878061294556} -09/21/2021 00:25:34 - INFO - __main__ - Step 45884: {'lr': 0.00019908958602870742, 'samples': 1468288, 'steps': 2867, 'loss/train': 1.8478918075561523} -09/21/2021 00:25:34 - INFO - __main__ - Step 45885: {'lr': 0.00019908958602870742, 'samples': 1468320, 'steps': 2867, 'loss/train': 1.8533660173416138} -09/21/2021 00:25:35 - INFO - __main__ - Step 45886: {'lr': 0.00019908958602870742, 'samples': 1468352, 'steps': 2867, 'loss/train': 0.4072988033294678} -09/21/2021 00:25:36 - INFO - __main__ - Step 45887: {'lr': 0.00019908958602870742, 'samples': 1468384, 'steps': 2867, 'loss/train': 2.400796413421631} -09/21/2021 00:25:37 - INFO - __main__ - Step 45888: {'lr': 0.00019908958602870742, 'samples': 1468416, 'steps': 2867, 'loss/train': 3.4393227100372314} -09/21/2021 00:25:37 - INFO - __main__ - Step 45889: {'lr': 0.00019908872703634355, 'samples': 1468448, 'steps': 2868, 'loss/train': 1.2962491512298584} -09/21/2021 00:25:38 - INFO - __main__ - Step 45890: {'lr': 0.00019908872703634355, 'samples': 1468480, 'steps': 2868, 'loss/train': 1.6897298097610474} -09/21/2021 00:25:39 - INFO - __main__ - Step 45891: {'lr': 0.00019908872703634355, 'samples': 1468512, 'steps': 2868, 'loss/train': 1.605128526687622} -09/21/2021 00:25:40 - INFO - __main__ - Step 45892: {'lr': 0.00019908872703634355, 'samples': 1468544, 'steps': 2868, 'loss/train': 2.0684471130371094} -09/21/2021 00:25:41 - INFO - __main__ - Step 45893: {'lr': 0.00019908872703634355, 'samples': 1468576, 'steps': 2868, 'loss/train': 2.6135153770446777} -09/21/2021 00:25:42 - INFO - __main__ - Step 45894: {'lr': 0.00019908872703634355, 'samples': 1468608, 'steps': 2868, 'loss/train': 2.030635356903076} -09/21/2021 00:25:43 - INFO - __main__ - Step 45895: {'lr': 0.00019908872703634355, 'samples': 1468640, 'steps': 2868, 'loss/train': 1.688769817352295} -09/21/2021 00:25:43 - INFO - __main__ - Step 45896: {'lr': 0.00019908872703634355, 'samples': 1468672, 'steps': 2868, 'loss/train': 1.9472137689590454} -09/21/2021 00:25:44 - INFO - __main__ - Step 45897: {'lr': 0.00019908872703634355, 'samples': 1468704, 'steps': 2868, 'loss/train': 1.5205262899398804} -09/21/2021 00:25:45 - INFO - __main__ - Step 45898: {'lr': 0.00019908872703634355, 'samples': 1468736, 'steps': 2868, 'loss/train': 1.9297808408737183} -09/21/2021 00:25:46 - INFO - __main__ - Step 45899: {'lr': 0.00019908872703634355, 'samples': 1468768, 'steps': 2868, 'loss/train': 1.657785177230835} -09/21/2021 00:25:46 - INFO - __main__ - Step 45900: {'lr': 0.00019908872703634355, 'samples': 1468800, 'steps': 2868, 'loss/train': 1.9887118339538574} -09/21/2021 00:25:47 - INFO - __main__ - Step 45901: {'lr': 0.00019908872703634355, 'samples': 1468832, 'steps': 2868, 'loss/train': 1.6815510988235474} -09/21/2021 00:25:48 - INFO - __main__ - Step 45902: {'lr': 0.00019908872703634355, 'samples': 1468864, 'steps': 2868, 'loss/train': 1.9423164129257202} -09/21/2021 00:25:49 - INFO - __main__ - Step 45903: {'lr': 0.00019908872703634355, 'samples': 1468896, 'steps': 2868, 'loss/train': 1.2055671215057373} -09/21/2021 00:25:49 - INFO - __main__ - Step 45904: {'lr': 0.00019908872703634355, 'samples': 1468928, 'steps': 2868, 'loss/train': 1.5116046667099} -09/21/2021 00:25:50 - INFO - __main__ - Step 45905: {'lr': 0.00019908786764078807, 'samples': 1468960, 'steps': 2869, 'loss/train': 1.8966660499572754} -09/21/2021 00:25:51 - INFO - __main__ - Step 45906: {'lr': 0.00019908786764078807, 'samples': 1468992, 'steps': 2869, 'loss/train': 1.791579008102417} -09/21/2021 00:25:52 - INFO - __main__ - Step 45907: {'lr': 0.00019908786764078807, 'samples': 1469024, 'steps': 2869, 'loss/train': 1.8762450218200684} -09/21/2021 00:25:52 - INFO - __main__ - Step 45908: {'lr': 0.00019908786764078807, 'samples': 1469056, 'steps': 2869, 'loss/train': 1.817533254623413} -09/21/2021 00:25:53 - INFO - __main__ - Step 45909: {'lr': 0.00019908786764078807, 'samples': 1469088, 'steps': 2869, 'loss/train': 1.851840615272522} -09/21/2021 00:25:54 - INFO - __main__ - Step 45910: {'lr': 0.00019908786764078807, 'samples': 1469120, 'steps': 2869, 'loss/train': 0.42621394991874695} -09/21/2021 00:25:55 - INFO - __main__ - Step 45911: {'lr': 0.00019908786764078807, 'samples': 1469152, 'steps': 2869, 'loss/train': 1.5875873565673828} -09/21/2021 00:25:55 - INFO - __main__ - Step 45912: {'lr': 0.00019908786764078807, 'samples': 1469184, 'steps': 2869, 'loss/train': 1.653198480606079} -09/21/2021 00:25:56 - INFO - __main__ - Step 45913: {'lr': 0.00019908786764078807, 'samples': 1469216, 'steps': 2869, 'loss/train': 1.5063287019729614} -09/21/2021 00:25:57 - INFO - __main__ - Step 45914: {'lr': 0.00019908786764078807, 'samples': 1469248, 'steps': 2869, 'loss/train': 1.109242558479309} -09/21/2021 00:25:58 - INFO - __main__ - Step 45915: {'lr': 0.00019908786764078807, 'samples': 1469280, 'steps': 2869, 'loss/train': 2.585162878036499} -09/21/2021 00:25:58 - INFO - __main__ - Step 45916: {'lr': 0.00019908786764078807, 'samples': 1469312, 'steps': 2869, 'loss/train': 1.706016182899475} -09/21/2021 00:25:59 - INFO - __main__ - Step 45917: {'lr': 0.00019908786764078807, 'samples': 1469344, 'steps': 2869, 'loss/train': 2.446838617324829} -09/21/2021 00:26:00 - INFO - __main__ - Step 45918: {'lr': 0.00019908786764078807, 'samples': 1469376, 'steps': 2869, 'loss/train': 2.6968085765838623} -09/21/2021 00:26:01 - INFO - __main__ - Step 45919: {'lr': 0.00019908786764078807, 'samples': 1469408, 'steps': 2869, 'loss/train': 2.6286821365356445} -09/21/2021 00:26:01 - INFO - __main__ - Step 45920: {'lr': 0.00019908786764078807, 'samples': 1469440, 'steps': 2869, 'loss/train': 2.429131507873535} -09/21/2021 00:26:02 - INFO - __main__ - Step 45921: {'lr': 0.00019908700784204442, 'samples': 1469472, 'steps': 2870, 'loss/train': 0.6114750504493713} -09/21/2021 00:26:03 - INFO - __main__ - Step 45922: {'lr': 0.00019908700784204442, 'samples': 1469504, 'steps': 2870, 'loss/train': 0.7083702683448792} -09/21/2021 00:26:04 - INFO - __main__ - Step 45923: {'lr': 0.00019908700784204442, 'samples': 1469536, 'steps': 2870, 'loss/train': 0.8584249019622803} -09/21/2021 00:26:05 - INFO - __main__ - Step 45924: {'lr': 0.00019908700784204442, 'samples': 1469568, 'steps': 2870, 'loss/train': 2.7008113861083984} -09/21/2021 00:26:06 - INFO - __main__ - Step 45925: {'lr': 0.00019908700784204442, 'samples': 1469600, 'steps': 2870, 'loss/train': 3.4940831661224365} -09/21/2021 00:26:07 - INFO - __main__ - Step 45926: {'lr': 0.00019908700784204442, 'samples': 1469632, 'steps': 2870, 'loss/train': 2.406597852706909} -09/21/2021 00:26:08 - INFO - __main__ - Step 45927: {'lr': 0.00019908700784204442, 'samples': 1469664, 'steps': 2870, 'loss/train': 0.4576622247695923} -09/21/2021 00:26:08 - INFO - __main__ - Step 45928: {'lr': 0.00019908700784204442, 'samples': 1469696, 'steps': 2870, 'loss/train': 1.614443302154541} -09/21/2021 00:26:09 - INFO - __main__ - Step 45929: {'lr': 0.00019908700784204442, 'samples': 1469728, 'steps': 2870, 'loss/train': 1.640602946281433} -09/21/2021 00:26:10 - INFO - __main__ - Step 45930: {'lr': 0.00019908700784204442, 'samples': 1469760, 'steps': 2870, 'loss/train': 2.023484230041504} -09/21/2021 00:26:11 - INFO - __main__ - Step 45931: {'lr': 0.00019908700784204442, 'samples': 1469792, 'steps': 2870, 'loss/train': 0.9645005464553833} -09/21/2021 00:26:11 - INFO - __main__ - Step 45932: {'lr': 0.00019908700784204442, 'samples': 1469824, 'steps': 2870, 'loss/train': 1.2676736116409302} -09/21/2021 00:26:12 - INFO - __main__ - Step 45933: {'lr': 0.00019908700784204442, 'samples': 1469856, 'steps': 2870, 'loss/train': 2.337376832962036} -09/21/2021 00:26:13 - INFO - __main__ - Step 45934: {'lr': 0.00019908700784204442, 'samples': 1469888, 'steps': 2870, 'loss/train': 1.6844815015792847} -09/21/2021 00:26:14 - INFO - __main__ - Step 45935: {'lr': 0.00019908700784204442, 'samples': 1469920, 'steps': 2870, 'loss/train': 1.3871638774871826} -09/21/2021 00:26:14 - INFO - __main__ - Step 45936: {'lr': 0.00019908700784204442, 'samples': 1469952, 'steps': 2870, 'loss/train': 2.477769613265991} -09/21/2021 00:26:15 - INFO - __main__ - Step 45937: {'lr': 0.0001990861476401161, 'samples': 1469984, 'steps': 2871, 'loss/train': 1.7825175523757935} -09/21/2021 00:26:16 - INFO - __main__ - Step 45938: {'lr': 0.0001990861476401161, 'samples': 1470016, 'steps': 2871, 'loss/train': 1.6510179042816162} -09/21/2021 00:26:17 - INFO - __main__ - Step 45939: {'lr': 0.0001990861476401161, 'samples': 1470048, 'steps': 2871, 'loss/train': 1.8328044414520264} -09/21/2021 00:26:18 - INFO - __main__ - Step 45940: {'lr': 0.0001990861476401161, 'samples': 1470080, 'steps': 2871, 'loss/train': 1.5000520944595337} -09/21/2021 00:26:18 - INFO - __main__ - Step 45941: {'lr': 0.0001990861476401161, 'samples': 1470112, 'steps': 2871, 'loss/train': 1.270477294921875} -09/21/2021 00:26:19 - INFO - __main__ - Step 45942: {'lr': 0.0001990861476401161, 'samples': 1470144, 'steps': 2871, 'loss/train': 2.0989935398101807} -09/21/2021 00:26:20 - INFO - __main__ - Step 45943: {'lr': 0.0001990861476401161, 'samples': 1470176, 'steps': 2871, 'loss/train': 1.6721699237823486} -09/21/2021 00:26:21 - INFO - __main__ - Step 45944: {'lr': 0.0001990861476401161, 'samples': 1470208, 'steps': 2871, 'loss/train': 1.9985333681106567} -09/21/2021 00:26:21 - INFO - __main__ - Step 45945: {'lr': 0.0001990861476401161, 'samples': 1470240, 'steps': 2871, 'loss/train': 2.39442777633667} -09/21/2021 00:26:22 - INFO - __main__ - Step 45946: {'lr': 0.0001990861476401161, 'samples': 1470272, 'steps': 2871, 'loss/train': 1.9599286317825317} -09/21/2021 00:26:23 - INFO - __main__ - Step 45947: {'lr': 0.0001990861476401161, 'samples': 1470304, 'steps': 2871, 'loss/train': 2.0905048847198486} -09/21/2021 00:26:24 - INFO - __main__ - Step 45948: {'lr': 0.0001990861476401161, 'samples': 1470336, 'steps': 2871, 'loss/train': 2.3501436710357666} -09/21/2021 00:26:24 - INFO - __main__ - Step 45949: {'lr': 0.0001990861476401161, 'samples': 1470368, 'steps': 2871, 'loss/train': 0.9075565338134766} -09/21/2021 00:26:25 - INFO - __main__ - Step 45950: {'lr': 0.0001990861476401161, 'samples': 1470400, 'steps': 2871, 'loss/train': 0.32113227248191833} -09/21/2021 00:26:26 - INFO - __main__ - Step 45951: {'lr': 0.0001990861476401161, 'samples': 1470432, 'steps': 2871, 'loss/train': 0.5541273355484009} -09/21/2021 00:26:27 - INFO - __main__ - Step 45952: {'lr': 0.0001990861476401161, 'samples': 1470464, 'steps': 2871, 'loss/train': 0.5359486937522888} -09/21/2021 00:26:27 - INFO - __main__ - Step 45953: {'lr': 0.00019908528703500665, 'samples': 1470496, 'steps': 2872, 'loss/train': 0.3437764346599579} -09/21/2021 00:26:28 - INFO - __main__ - Step 45954: {'lr': 0.00019908528703500665, 'samples': 1470528, 'steps': 2872, 'loss/train': 0.1693950593471527} -09/21/2021 00:26:30 - INFO - __main__ - Step 45955: {'lr': 0.00019908528703500665, 'samples': 1470560, 'steps': 2872, 'loss/train': 0.5972825288772583} -09/21/2021 00:26:30 - INFO - __main__ - Step 45956: {'lr': 0.00019908528703500665, 'samples': 1470592, 'steps': 2872, 'loss/train': 2.4193522930145264} -09/21/2021 00:26:31 - INFO - __main__ - Step 45957: {'lr': 0.00019908528703500665, 'samples': 1470624, 'steps': 2872, 'loss/train': 1.7083433866500854} -09/21/2021 00:26:32 - INFO - __main__ - Step 45958: {'lr': 0.00019908528703500665, 'samples': 1470656, 'steps': 2872, 'loss/train': 1.30750572681427} -09/21/2021 00:26:33 - INFO - __main__ - Step 45959: {'lr': 0.00019908528703500665, 'samples': 1470688, 'steps': 2872, 'loss/train': 1.5389493703842163} -09/21/2021 00:26:33 - INFO - __main__ - Step 45960: {'lr': 0.00019908528703500665, 'samples': 1470720, 'steps': 2872, 'loss/train': 1.8229678869247437} -09/21/2021 00:26:34 - INFO - __main__ - Step 45961: {'lr': 0.00019908528703500665, 'samples': 1470752, 'steps': 2872, 'loss/train': 2.0928304195404053} -09/21/2021 00:26:35 - INFO - __main__ - Step 45962: {'lr': 0.00019908528703500665, 'samples': 1470784, 'steps': 2872, 'loss/train': 1.6989058256149292} -09/21/2021 00:26:36 - INFO - __main__ - Step 45963: {'lr': 0.00019908528703500665, 'samples': 1470816, 'steps': 2872, 'loss/train': 1.1978868246078491} -09/21/2021 00:26:36 - INFO - __main__ - Step 45964: {'lr': 0.00019908528703500665, 'samples': 1470848, 'steps': 2872, 'loss/train': 1.7441328763961792} -09/21/2021 00:26:37 - INFO - __main__ - Step 45965: {'lr': 0.00019908528703500665, 'samples': 1470880, 'steps': 2872, 'loss/train': 2.0978782176971436} -09/21/2021 00:26:38 - INFO - __main__ - Step 45966: {'lr': 0.00019908528703500665, 'samples': 1470912, 'steps': 2872, 'loss/train': 2.4511232376098633} -09/21/2021 00:26:39 - INFO - __main__ - Step 45967: {'lr': 0.00019908528703500665, 'samples': 1470944, 'steps': 2872, 'loss/train': 1.777850866317749} -09/21/2021 00:26:39 - INFO - __main__ - Step 45968: {'lr': 0.00019908528703500665, 'samples': 1470976, 'steps': 2872, 'loss/train': 4.46752405166626} -09/21/2021 00:26:40 - INFO - __main__ - Step 45969: {'lr': 0.00019908442602671955, 'samples': 1471008, 'steps': 2873, 'loss/train': 2.7378251552581787} -09/21/2021 00:26:41 - INFO - __main__ - Step 45970: {'lr': 0.00019908442602671955, 'samples': 1471040, 'steps': 2873, 'loss/train': 0.26284366846084595} -09/21/2021 00:26:42 - INFO - __main__ - Step 45971: {'lr': 0.00019908442602671955, 'samples': 1471072, 'steps': 2873, 'loss/train': 1.9116324186325073} -09/21/2021 00:26:42 - INFO - __main__ - Step 45972: {'lr': 0.00019908442602671955, 'samples': 1471104, 'steps': 2873, 'loss/train': 2.099248170852661} -09/21/2021 00:26:43 - INFO - __main__ - Step 45973: {'lr': 0.00019908442602671955, 'samples': 1471136, 'steps': 2873, 'loss/train': 2.194762945175171} -09/21/2021 00:26:44 - INFO - __main__ - Step 45974: {'lr': 0.00019908442602671955, 'samples': 1471168, 'steps': 2873, 'loss/train': 0.7198723554611206} -09/21/2021 00:26:45 - INFO - __main__ - Step 45975: {'lr': 0.00019908442602671955, 'samples': 1471200, 'steps': 2873, 'loss/train': 1.9572117328643799} -09/21/2021 00:26:45 - INFO - __main__ - Step 45976: {'lr': 0.00019908442602671955, 'samples': 1471232, 'steps': 2873, 'loss/train': 1.8902051448822021} -09/21/2021 00:26:46 - INFO - __main__ - Step 45977: {'lr': 0.00019908442602671955, 'samples': 1471264, 'steps': 2873, 'loss/train': 2.114464044570923} -09/21/2021 00:26:47 - INFO - __main__ - Step 45978: {'lr': 0.00019908442602671955, 'samples': 1471296, 'steps': 2873, 'loss/train': 1.4404411315917969} -09/21/2021 00:26:48 - INFO - __main__ - Step 45979: {'lr': 0.00019908442602671955, 'samples': 1471328, 'steps': 2873, 'loss/train': 1.461996078491211} -09/21/2021 00:26:48 - INFO - __main__ - Step 45980: {'lr': 0.00019908442602671955, 'samples': 1471360, 'steps': 2873, 'loss/train': 2.501534938812256} -09/21/2021 00:26:49 - INFO - __main__ - Step 45981: {'lr': 0.00019908442602671955, 'samples': 1471392, 'steps': 2873, 'loss/train': 2.179173231124878} -09/21/2021 00:26:50 - INFO - __main__ - Step 45982: {'lr': 0.00019908442602671955, 'samples': 1471424, 'steps': 2873, 'loss/train': 2.820246696472168} -09/21/2021 00:26:51 - INFO - __main__ - Step 45983: {'lr': 0.00019908442602671955, 'samples': 1471456, 'steps': 2873, 'loss/train': 0.39185699820518494} -09/21/2021 00:26:51 - INFO - __main__ - Step 45984: {'lr': 0.00019908442602671955, 'samples': 1471488, 'steps': 2873, 'loss/train': 1.3577910661697388} -09/21/2021 00:26:52 - INFO - __main__ - Step 45985: {'lr': 0.0001990835646152583, 'samples': 1471520, 'steps': 2874, 'loss/train': 2.637861490249634} -09/21/2021 00:26:54 - INFO - __main__ - Step 45986: {'lr': 0.0001990835646152583, 'samples': 1471552, 'steps': 2874, 'loss/train': 1.8410664796829224} -09/21/2021 00:26:55 - INFO - __main__ - Step 45987: {'lr': 0.0001990835646152583, 'samples': 1471584, 'steps': 2874, 'loss/train': 1.933434009552002} -09/21/2021 00:26:55 - INFO - __main__ - Step 45988: {'lr': 0.0001990835646152583, 'samples': 1471616, 'steps': 2874, 'loss/train': 2.430756092071533} -09/21/2021 00:26:56 - INFO - __main__ - Step 45989: {'lr': 0.0001990835646152583, 'samples': 1471648, 'steps': 2874, 'loss/train': 1.881068468093872} -09/21/2021 00:26:57 - INFO - __main__ - Step 45990: {'lr': 0.0001990835646152583, 'samples': 1471680, 'steps': 2874, 'loss/train': 1.7721974849700928} -09/21/2021 00:26:58 - INFO - __main__ - Step 45991: {'lr': 0.0001990835646152583, 'samples': 1471712, 'steps': 2874, 'loss/train': 1.363906979560852} -09/21/2021 00:26:58 - INFO - __main__ - Step 45992: {'lr': 0.0001990835646152583, 'samples': 1471744, 'steps': 2874, 'loss/train': 1.2239234447479248} -09/21/2021 00:26:59 - INFO - __main__ - Step 45993: {'lr': 0.0001990835646152583, 'samples': 1471776, 'steps': 2874, 'loss/train': 2.8841235637664795} -09/21/2021 00:27:00 - INFO - __main__ - Step 45994: {'lr': 0.0001990835646152583, 'samples': 1471808, 'steps': 2874, 'loss/train': 2.5368473529815674} -09/21/2021 00:27:01 - INFO - __main__ - Step 45995: {'lr': 0.0001990835646152583, 'samples': 1471840, 'steps': 2874, 'loss/train': 2.7132437229156494} -09/21/2021 00:27:01 - INFO - __main__ - Step 45996: {'lr': 0.0001990835646152583, 'samples': 1471872, 'steps': 2874, 'loss/train': 2.2219042778015137} -09/21/2021 00:27:02 - INFO - __main__ - Step 45997: {'lr': 0.0001990835646152583, 'samples': 1471904, 'steps': 2874, 'loss/train': 1.9340577125549316} -09/21/2021 00:27:03 - INFO - __main__ - Step 45998: {'lr': 0.0001990835646152583, 'samples': 1471936, 'steps': 2874, 'loss/train': 1.9065206050872803} -09/21/2021 00:27:04 - INFO - __main__ - Step 45999: {'lr': 0.0001990835646152583, 'samples': 1471968, 'steps': 2874, 'loss/train': 1.2760858535766602} -09/21/2021 00:27:04 - INFO - __main__ - Step 46000: {'lr': 0.0001990835646152583, 'samples': 1472000, 'steps': 2874, 'loss/train': 1.9356138706207275} -09/21/2021 00:27:05 - INFO - __main__ - Step 46001: {'lr': 0.00019908270280062643, 'samples': 1472032, 'steps': 2875, 'loss/train': 2.1732337474823} -09/21/2021 00:27:06 - INFO - __main__ - Step 46002: {'lr': 0.00019908270280062643, 'samples': 1472064, 'steps': 2875, 'loss/train': 1.0203310251235962} -09/21/2021 00:27:07 - INFO - __main__ - Step 46003: {'lr': 0.00019908270280062643, 'samples': 1472096, 'steps': 2875, 'loss/train': 2.2699146270751953} -09/21/2021 00:27:07 - INFO - __main__ - Step 46004: {'lr': 0.00019908270280062643, 'samples': 1472128, 'steps': 2875, 'loss/train': 1.9931546449661255} -09/21/2021 00:27:08 - INFO - __main__ - Step 46005: {'lr': 0.00019908270280062643, 'samples': 1472160, 'steps': 2875, 'loss/train': 1.9900859594345093} -09/21/2021 00:27:09 - INFO - __main__ - Step 46006: {'lr': 0.00019908270280062643, 'samples': 1472192, 'steps': 2875, 'loss/train': 2.463697910308838} -09/21/2021 00:27:10 - INFO - __main__ - Step 46007: {'lr': 0.00019908270280062643, 'samples': 1472224, 'steps': 2875, 'loss/train': 1.1568522453308105} -09/21/2021 00:27:10 - INFO - __main__ - Step 46008: {'lr': 0.00019908270280062643, 'samples': 1472256, 'steps': 2875, 'loss/train': 1.872584581375122} -09/21/2021 00:27:11 - INFO - __main__ - Step 46009: {'lr': 0.00019908270280062643, 'samples': 1472288, 'steps': 2875, 'loss/train': 2.56069278717041} -09/21/2021 00:27:12 - INFO - __main__ - Step 46010: {'lr': 0.00019908270280062643, 'samples': 1472320, 'steps': 2875, 'loss/train': 1.6402040719985962} -09/21/2021 00:27:13 - INFO - __main__ - Step 46011: {'lr': 0.00019908270280062643, 'samples': 1472352, 'steps': 2875, 'loss/train': 1.8629121780395508} -09/21/2021 00:27:13 - INFO - __main__ - Step 46012: {'lr': 0.00019908270280062643, 'samples': 1472384, 'steps': 2875, 'loss/train': 1.6560804843902588} -09/21/2021 00:27:14 - INFO - __main__ - Step 46013: {'lr': 0.00019908270280062643, 'samples': 1472416, 'steps': 2875, 'loss/train': 0.32706451416015625} -09/21/2021 00:27:15 - INFO - __main__ - Step 46014: {'lr': 0.00019908270280062643, 'samples': 1472448, 'steps': 2875, 'loss/train': 0.20226119458675385} -09/21/2021 00:27:16 - INFO - __main__ - Step 46015: {'lr': 0.00019908270280062643, 'samples': 1472480, 'steps': 2875, 'loss/train': 0.21203085780143738} -09/21/2021 00:27:16 - INFO - __main__ - Step 46016: {'lr': 0.00019908270280062643, 'samples': 1472512, 'steps': 2875, 'loss/train': 0.16608552634716034} -09/21/2021 00:27:18 - INFO - __main__ - Step 46017: {'lr': 0.0001990818405828274, 'samples': 1472544, 'steps': 2876, 'loss/train': 2.4005250930786133} -09/21/2021 00:27:19 - INFO - __main__ - Step 46018: {'lr': 0.0001990818405828274, 'samples': 1472576, 'steps': 2876, 'loss/train': 2.9514222145080566} -09/21/2021 00:27:20 - INFO - __main__ - Step 46019: {'lr': 0.0001990818405828274, 'samples': 1472608, 'steps': 2876, 'loss/train': 1.4151376485824585} -09/21/2021 00:27:20 - INFO - __main__ - Step 46020: {'lr': 0.0001990818405828274, 'samples': 1472640, 'steps': 2876, 'loss/train': 0.8193358182907104} -09/21/2021 00:27:21 - INFO - __main__ - Step 46021: {'lr': 0.0001990818405828274, 'samples': 1472672, 'steps': 2876, 'loss/train': 2.587520122528076} -09/21/2021 00:27:22 - INFO - __main__ - Step 46022: {'lr': 0.0001990818405828274, 'samples': 1472704, 'steps': 2876, 'loss/train': 2.315511703491211} -09/21/2021 00:27:23 - INFO - __main__ - Step 46023: {'lr': 0.0001990818405828274, 'samples': 1472736, 'steps': 2876, 'loss/train': 1.164864420890808} -09/21/2021 00:27:23 - INFO - __main__ - Step 46024: {'lr': 0.0001990818405828274, 'samples': 1472768, 'steps': 2876, 'loss/train': 1.798716425895691} -09/21/2021 00:27:24 - INFO - __main__ - Step 46025: {'lr': 0.0001990818405828274, 'samples': 1472800, 'steps': 2876, 'loss/train': 1.6370524168014526} -09/21/2021 00:27:25 - INFO - __main__ - Step 46026: {'lr': 0.0001990818405828274, 'samples': 1472832, 'steps': 2876, 'loss/train': 2.195945978164673} -09/21/2021 00:27:26 - INFO - __main__ - Step 46027: {'lr': 0.0001990818405828274, 'samples': 1472864, 'steps': 2876, 'loss/train': 1.8228366374969482} -09/21/2021 00:27:26 - INFO - __main__ - Step 46028: {'lr': 0.0001990818405828274, 'samples': 1472896, 'steps': 2876, 'loss/train': 2.4775185585021973} -09/21/2021 00:27:27 - INFO - __main__ - Step 46029: {'lr': 0.0001990818405828274, 'samples': 1472928, 'steps': 2876, 'loss/train': 0.8666069507598877} -09/21/2021 00:27:28 - INFO - __main__ - Step 46030: {'lr': 0.0001990818405828274, 'samples': 1472960, 'steps': 2876, 'loss/train': 2.690467596054077} -09/21/2021 00:27:29 - INFO - __main__ - Step 46031: {'lr': 0.0001990818405828274, 'samples': 1472992, 'steps': 2876, 'loss/train': 2.0161147117614746} -09/21/2021 00:27:29 - INFO - __main__ - Step 46032: {'lr': 0.0001990818405828274, 'samples': 1473024, 'steps': 2876, 'loss/train': 2.284468650817871} -09/21/2021 00:27:30 - INFO - __main__ - Step 46033: {'lr': 0.00019908097796186475, 'samples': 1473056, 'steps': 2877, 'loss/train': 2.4133355617523193} -09/21/2021 00:27:31 - INFO - __main__ - Step 46034: {'lr': 0.00019908097796186475, 'samples': 1473088, 'steps': 2877, 'loss/train': 2.449291229248047} -09/21/2021 00:27:32 - INFO - __main__ - Step 46035: {'lr': 0.00019908097796186475, 'samples': 1473120, 'steps': 2877, 'loss/train': 2.139940023422241} -09/21/2021 00:27:32 - INFO - __main__ - Step 46036: {'lr': 0.00019908097796186475, 'samples': 1473152, 'steps': 2877, 'loss/train': 2.2484917640686035} -09/21/2021 00:27:33 - INFO - __main__ - Step 46037: {'lr': 0.00019908097796186475, 'samples': 1473184, 'steps': 2877, 'loss/train': 2.2505438327789307} -09/21/2021 00:27:34 - INFO - __main__ - Step 46038: {'lr': 0.00019908097796186475, 'samples': 1473216, 'steps': 2877, 'loss/train': 0.09446787089109421} -09/21/2021 00:27:35 - INFO - __main__ - Step 46039: {'lr': 0.00019908097796186475, 'samples': 1473248, 'steps': 2877, 'loss/train': 0.1000669002532959} -09/21/2021 00:27:35 - INFO - __main__ - Step 46040: {'lr': 0.00019908097796186475, 'samples': 1473280, 'steps': 2877, 'loss/train': 0.9450580477714539} -09/21/2021 00:27:36 - INFO - __main__ - Step 46041: {'lr': 0.00019908097796186475, 'samples': 1473312, 'steps': 2877, 'loss/train': 3.7832367420196533} -09/21/2021 00:27:37 - INFO - __main__ - Step 46042: {'lr': 0.00019908097796186475, 'samples': 1473344, 'steps': 2877, 'loss/train': 2.2237558364868164} -09/21/2021 00:27:38 - INFO - __main__ - Step 46043: {'lr': 0.00019908097796186475, 'samples': 1473376, 'steps': 2877, 'loss/train': 2.235213279724121} -09/21/2021 00:27:38 - INFO - __main__ - Step 46044: {'lr': 0.00019908097796186475, 'samples': 1473408, 'steps': 2877, 'loss/train': 1.8450164794921875} -09/21/2021 00:27:39 - INFO - __main__ - Step 46045: {'lr': 0.00019908097796186475, 'samples': 1473440, 'steps': 2877, 'loss/train': 1.9753696918487549} -09/21/2021 00:27:40 - INFO - __main__ - Step 46046: {'lr': 0.00019908097796186475, 'samples': 1473472, 'steps': 2877, 'loss/train': 1.7271356582641602} -09/21/2021 00:27:41 - INFO - __main__ - Step 46047: {'lr': 0.00019908097796186475, 'samples': 1473504, 'steps': 2877, 'loss/train': 1.4916352033615112} -09/21/2021 00:27:42 - INFO - __main__ - Step 46048: {'lr': 0.00019908097796186475, 'samples': 1473536, 'steps': 2877, 'loss/train': 1.5630247592926025} -09/21/2021 00:27:43 - INFO - __main__ - Step 46049: {'lr': 0.000199080114937742, 'samples': 1473568, 'steps': 2878, 'loss/train': 1.4525021314620972} -09/21/2021 00:27:44 - INFO - __main__ - Step 46050: {'lr': 0.000199080114937742, 'samples': 1473600, 'steps': 2878, 'loss/train': 2.2281126976013184} -09/21/2021 00:27:44 - INFO - __main__ - Step 46051: {'lr': 0.000199080114937742, 'samples': 1473632, 'steps': 2878, 'loss/train': 1.9058674573898315} -09/21/2021 00:27:45 - INFO - __main__ - Step 46052: {'lr': 0.000199080114937742, 'samples': 1473664, 'steps': 2878, 'loss/train': 1.7523951530456543} -09/21/2021 00:27:46 - INFO - __main__ - Step 46053: {'lr': 0.000199080114937742, 'samples': 1473696, 'steps': 2878, 'loss/train': 0.7688280344009399} -09/21/2021 00:27:47 - INFO - __main__ - Step 46054: {'lr': 0.000199080114937742, 'samples': 1473728, 'steps': 2878, 'loss/train': 0.2151940017938614} -09/21/2021 00:27:47 - INFO - __main__ - Step 46055: {'lr': 0.000199080114937742, 'samples': 1473760, 'steps': 2878, 'loss/train': 1.8307056427001953} -09/21/2021 00:27:48 - INFO - __main__ - Step 46056: {'lr': 0.000199080114937742, 'samples': 1473792, 'steps': 2878, 'loss/train': 0.8420156836509705} -09/21/2021 00:27:49 - INFO - __main__ - Step 46057: {'lr': 0.000199080114937742, 'samples': 1473824, 'steps': 2878, 'loss/train': 2.656262159347534} -09/21/2021 00:27:50 - INFO - __main__ - Step 46058: {'lr': 0.000199080114937742, 'samples': 1473856, 'steps': 2878, 'loss/train': 2.1589443683624268} -09/21/2021 00:27:50 - INFO - __main__ - Step 46059: {'lr': 0.000199080114937742, 'samples': 1473888, 'steps': 2878, 'loss/train': 2.368467330932617} -09/21/2021 00:27:51 - INFO - __main__ - Step 46060: {'lr': 0.000199080114937742, 'samples': 1473920, 'steps': 2878, 'loss/train': 2.0752289295196533} -09/21/2021 00:27:52 - INFO - __main__ - Step 46061: {'lr': 0.000199080114937742, 'samples': 1473952, 'steps': 2878, 'loss/train': 1.8628658056259155} -09/21/2021 00:27:53 - INFO - __main__ - Step 46062: {'lr': 0.000199080114937742, 'samples': 1473984, 'steps': 2878, 'loss/train': 2.2965164184570312} -09/21/2021 00:27:53 - INFO - __main__ - Step 46063: {'lr': 0.000199080114937742, 'samples': 1474016, 'steps': 2878, 'loss/train': 2.026771306991577} -09/21/2021 00:27:54 - INFO - __main__ - Step 46064: {'lr': 0.000199080114937742, 'samples': 1474048, 'steps': 2878, 'loss/train': 0.8166279792785645} -09/21/2021 00:27:55 - INFO - __main__ - Step 46065: {'lr': 0.00019907925151046264, 'samples': 1474080, 'steps': 2879, 'loss/train': 2.238409996032715} -09/21/2021 00:27:56 - INFO - __main__ - Step 46066: {'lr': 0.00019907925151046264, 'samples': 1474112, 'steps': 2879, 'loss/train': 1.7294650077819824} -09/21/2021 00:27:57 - INFO - __main__ - Step 46067: {'lr': 0.00019907925151046264, 'samples': 1474144, 'steps': 2879, 'loss/train': 1.6704033613204956} -09/21/2021 00:27:57 - INFO - __main__ - Step 46068: {'lr': 0.00019907925151046264, 'samples': 1474176, 'steps': 2879, 'loss/train': 1.6908702850341797} -09/21/2021 00:27:58 - INFO - __main__ - Step 46069: {'lr': 0.00019907925151046264, 'samples': 1474208, 'steps': 2879, 'loss/train': 2.6096761226654053} -09/21/2021 00:27:59 - INFO - __main__ - Step 46070: {'lr': 0.00019907925151046264, 'samples': 1474240, 'steps': 2879, 'loss/train': 2.135305881500244} -09/21/2021 00:28:00 - INFO - __main__ - Step 46071: {'lr': 0.00019907925151046264, 'samples': 1474272, 'steps': 2879, 'loss/train': 1.8867367506027222} -09/21/2021 00:28:00 - INFO - __main__ - Step 46072: {'lr': 0.00019907925151046264, 'samples': 1474304, 'steps': 2879, 'loss/train': 2.5637967586517334} -09/21/2021 00:28:01 - INFO - __main__ - Step 46073: {'lr': 0.00019907925151046264, 'samples': 1474336, 'steps': 2879, 'loss/train': 2.3995132446289062} -09/21/2021 00:28:02 - INFO - __main__ - Step 46074: {'lr': 0.00019907925151046264, 'samples': 1474368, 'steps': 2879, 'loss/train': 2.2040255069732666} -09/21/2021 00:28:03 - INFO - __main__ - Step 46075: {'lr': 0.00019907925151046264, 'samples': 1474400, 'steps': 2879, 'loss/train': 2.310565710067749} -09/21/2021 00:28:03 - INFO - __main__ - Step 46076: {'lr': 0.00019907925151046264, 'samples': 1474432, 'steps': 2879, 'loss/train': 2.339792490005493} -09/21/2021 00:28:04 - INFO - __main__ - Step 46077: {'lr': 0.00019907925151046264, 'samples': 1474464, 'steps': 2879, 'loss/train': 1.2988091707229614} -09/21/2021 00:28:05 - INFO - __main__ - Step 46078: {'lr': 0.00019907925151046264, 'samples': 1474496, 'steps': 2879, 'loss/train': 2.5235235691070557} -09/21/2021 00:28:06 - INFO - __main__ - Step 46079: {'lr': 0.00019907925151046264, 'samples': 1474528, 'steps': 2879, 'loss/train': 2.041876792907715} -09/21/2021 00:28:07 - INFO - __main__ - Step 46080: {'lr': 0.00019907925151046264, 'samples': 1474560, 'steps': 2879, 'loss/train': 2.1229164600372314} -09/21/2021 00:28:08 - INFO - __main__ - Step 46081: {'lr': 0.0001990783876800302, 'samples': 1474592, 'steps': 2880, 'loss/train': 2.7056288719177246} -09/21/2021 00:28:08 - INFO - __main__ - Step 46082: {'lr': 0.0001990783876800302, 'samples': 1474624, 'steps': 2880, 'loss/train': 1.3184735774993896} -09/21/2021 00:28:09 - INFO - __main__ - Step 46083: {'lr': 0.0001990783876800302, 'samples': 1474656, 'steps': 2880, 'loss/train': 2.270493507385254} -09/21/2021 00:28:10 - INFO - __main__ - Step 46084: {'lr': 0.0001990783876800302, 'samples': 1474688, 'steps': 2880, 'loss/train': 2.142925977706909} -09/21/2021 00:28:11 - INFO - __main__ - Step 46085: {'lr': 0.0001990783876800302, 'samples': 1474720, 'steps': 2880, 'loss/train': 2.6747689247131348} -09/21/2021 00:28:11 - INFO - __main__ - Step 46086: {'lr': 0.0001990783876800302, 'samples': 1474752, 'steps': 2880, 'loss/train': 0.8327831029891968} -09/21/2021 00:28:12 - INFO - __main__ - Step 46087: {'lr': 0.0001990783876800302, 'samples': 1474784, 'steps': 2880, 'loss/train': 2.751131057739258} -09/21/2021 00:28:13 - INFO - __main__ - Step 46088: {'lr': 0.0001990783876800302, 'samples': 1474816, 'steps': 2880, 'loss/train': 1.201601505279541} -09/21/2021 00:28:14 - INFO - __main__ - Step 46089: {'lr': 0.0001990783876800302, 'samples': 1474848, 'steps': 2880, 'loss/train': 1.7932274341583252} -09/21/2021 00:28:14 - INFO - __main__ - Step 46090: {'lr': 0.0001990783876800302, 'samples': 1474880, 'steps': 2880, 'loss/train': 2.131359338760376} -09/21/2021 00:28:15 - INFO - __main__ - Step 46091: {'lr': 0.0001990783876800302, 'samples': 1474912, 'steps': 2880, 'loss/train': 1.8828572034835815} -09/21/2021 00:28:16 - INFO - __main__ - Step 46092: {'lr': 0.0001990783876800302, 'samples': 1474944, 'steps': 2880, 'loss/train': 2.594280958175659} -09/21/2021 00:28:17 - INFO - __main__ - Step 46093: {'lr': 0.0001990783876800302, 'samples': 1474976, 'steps': 2880, 'loss/train': 1.8241910934448242} -09/21/2021 00:28:17 - INFO - __main__ - Step 46094: {'lr': 0.0001990783876800302, 'samples': 1475008, 'steps': 2880, 'loss/train': 0.39705511927604675} -09/21/2021 00:28:18 - INFO - __main__ - Step 46095: {'lr': 0.0001990783876800302, 'samples': 1475040, 'steps': 2880, 'loss/train': 1.9589810371398926} -09/21/2021 00:28:19 - INFO - __main__ - Step 46096: {'lr': 0.0001990783876800302, 'samples': 1475072, 'steps': 2880, 'loss/train': 2.3920376300811768} -09/21/2021 00:28:20 - INFO - __main__ - Step 46097: {'lr': 0.00019907752344644814, 'samples': 1475104, 'steps': 2881, 'loss/train': 2.234644889831543} -09/21/2021 00:28:21 - INFO - __main__ - Step 46098: {'lr': 0.00019907752344644814, 'samples': 1475136, 'steps': 2881, 'loss/train': 2.2263269424438477} -09/21/2021 00:28:21 - INFO - __main__ - Step 46099: {'lr': 0.00019907752344644814, 'samples': 1475168, 'steps': 2881, 'loss/train': 5.417247772216797} -09/21/2021 00:28:22 - INFO - __main__ - Step 46100: {'lr': 0.00019907752344644814, 'samples': 1475200, 'steps': 2881, 'loss/train': 2.464146614074707} -09/21/2021 00:28:23 - INFO - __main__ - Step 46101: {'lr': 0.00019907752344644814, 'samples': 1475232, 'steps': 2881, 'loss/train': 1.578363299369812} -09/21/2021 00:28:24 - INFO - __main__ - Step 46102: {'lr': 0.00019907752344644814, 'samples': 1475264, 'steps': 2881, 'loss/train': 1.764485478401184} -09/21/2021 00:28:24 - INFO - __main__ - Step 46103: {'lr': 0.00019907752344644814, 'samples': 1475296, 'steps': 2881, 'loss/train': 1.4767695665359497} -09/21/2021 00:28:25 - INFO - __main__ - Step 46104: {'lr': 0.00019907752344644814, 'samples': 1475328, 'steps': 2881, 'loss/train': 2.078526496887207} -09/21/2021 00:28:26 - INFO - __main__ - Step 46105: {'lr': 0.00019907752344644814, 'samples': 1475360, 'steps': 2881, 'loss/train': 2.512197256088257} -09/21/2021 00:28:27 - INFO - __main__ - Step 46106: {'lr': 0.00019907752344644814, 'samples': 1475392, 'steps': 2881, 'loss/train': 2.038616180419922} -09/21/2021 00:28:27 - INFO - __main__ - Step 46107: {'lr': 0.00019907752344644814, 'samples': 1475424, 'steps': 2881, 'loss/train': 1.6593583822250366} -09/21/2021 00:28:28 - INFO - __main__ - Step 46108: {'lr': 0.00019907752344644814, 'samples': 1475456, 'steps': 2881, 'loss/train': 1.8920938968658447} -09/21/2021 00:28:29 - INFO - __main__ - Step 46109: {'lr': 0.00019907752344644814, 'samples': 1475488, 'steps': 2881, 'loss/train': 2.0703861713409424} -09/21/2021 00:28:30 - INFO - __main__ - Step 46110: {'lr': 0.00019907752344644814, 'samples': 1475520, 'steps': 2881, 'loss/train': 1.8485270738601685} -09/21/2021 00:28:31 - INFO - __main__ - Step 46111: {'lr': 0.00019907752344644814, 'samples': 1475552, 'steps': 2881, 'loss/train': 0.08713173121213913} -09/21/2021 00:28:32 - INFO - __main__ - Step 46112: {'lr': 0.00019907752344644814, 'samples': 1475584, 'steps': 2881, 'loss/train': 0.5171141028404236} -09/21/2021 00:28:33 - INFO - __main__ - Step 46113: {'lr': 0.00019907665880972006, 'samples': 1475616, 'steps': 2882, 'loss/train': 0.6615684032440186} -09/21/2021 00:28:33 - INFO - __main__ - Step 46114: {'lr': 0.00019907665880972006, 'samples': 1475648, 'steps': 2882, 'loss/train': 1.6229701042175293} -09/21/2021 00:28:34 - INFO - __main__ - Step 46115: {'lr': 0.00019907665880972006, 'samples': 1475680, 'steps': 2882, 'loss/train': 2.2370765209198} -09/21/2021 00:28:35 - INFO - __main__ - Step 46116: {'lr': 0.00019907665880972006, 'samples': 1475712, 'steps': 2882, 'loss/train': 1.7436556816101074} -09/21/2021 00:28:36 - INFO - __main__ - Step 46117: {'lr': 0.00019907665880972006, 'samples': 1475744, 'steps': 2882, 'loss/train': 1.7558751106262207} -09/21/2021 00:28:36 - INFO - __main__ - Step 46118: {'lr': 0.00019907665880972006, 'samples': 1475776, 'steps': 2882, 'loss/train': 2.33984112739563} -09/21/2021 00:28:37 - INFO - __main__ - Step 46119: {'lr': 0.00019907665880972006, 'samples': 1475808, 'steps': 2882, 'loss/train': 2.023829460144043} -09/21/2021 00:28:38 - INFO - __main__ - Step 46120: {'lr': 0.00019907665880972006, 'samples': 1475840, 'steps': 2882, 'loss/train': 1.3093925714492798} -09/21/2021 00:28:39 - INFO - __main__ - Step 46121: {'lr': 0.00019907665880972006, 'samples': 1475872, 'steps': 2882, 'loss/train': 0.41297444701194763} -09/21/2021 00:28:39 - INFO - __main__ - Step 46122: {'lr': 0.00019907665880972006, 'samples': 1475904, 'steps': 2882, 'loss/train': 1.987834095954895} -09/21/2021 00:28:40 - INFO - __main__ - Step 46123: {'lr': 0.00019907665880972006, 'samples': 1475936, 'steps': 2882, 'loss/train': 0.3409433960914612} -09/21/2021 00:28:41 - INFO - __main__ - Step 46124: {'lr': 0.00019907665880972006, 'samples': 1475968, 'steps': 2882, 'loss/train': 2.2810616493225098} -09/21/2021 00:28:42 - INFO - __main__ - Step 46125: {'lr': 0.00019907665880972006, 'samples': 1476000, 'steps': 2882, 'loss/train': 0.317908376455307} -09/21/2021 00:28:42 - INFO - __main__ - Step 46126: {'lr': 0.00019907665880972006, 'samples': 1476032, 'steps': 2882, 'loss/train': 2.3604700565338135} -09/21/2021 00:28:43 - INFO - __main__ - Step 46127: {'lr': 0.00019907665880972006, 'samples': 1476064, 'steps': 2882, 'loss/train': 1.8617444038391113} -09/21/2021 00:28:44 - INFO - __main__ - Step 46128: {'lr': 0.00019907665880972006, 'samples': 1476096, 'steps': 2882, 'loss/train': 2.2833364009857178} -09/21/2021 00:28:45 - INFO - __main__ - Step 46129: {'lr': 0.00019907579376984944, 'samples': 1476128, 'steps': 2883, 'loss/train': 1.153693675994873} -09/21/2021 00:28:45 - INFO - __main__ - Step 46130: {'lr': 0.00019907579376984944, 'samples': 1476160, 'steps': 2883, 'loss/train': 2.2568352222442627} -09/21/2021 00:28:46 - INFO - __main__ - Step 46131: {'lr': 0.00019907579376984944, 'samples': 1476192, 'steps': 2883, 'loss/train': 1.9185044765472412} -09/21/2021 00:28:47 - INFO - __main__ - Step 46132: {'lr': 0.00019907579376984944, 'samples': 1476224, 'steps': 2883, 'loss/train': 1.8298672437667847} -09/21/2021 00:28:48 - INFO - __main__ - Step 46133: {'lr': 0.00019907579376984944, 'samples': 1476256, 'steps': 2883, 'loss/train': 1.9969940185546875} -09/21/2021 00:28:48 - INFO - __main__ - Step 46134: {'lr': 0.00019907579376984944, 'samples': 1476288, 'steps': 2883, 'loss/train': 1.9768682718276978} -09/21/2021 00:28:49 - INFO - __main__ - Step 46135: {'lr': 0.00019907579376984944, 'samples': 1476320, 'steps': 2883, 'loss/train': 3.0069777965545654} -09/21/2021 00:28:50 - INFO - __main__ - Step 46136: {'lr': 0.00019907579376984944, 'samples': 1476352, 'steps': 2883, 'loss/train': 2.6712303161621094} -09/21/2021 00:28:51 - INFO - __main__ - Step 46137: {'lr': 0.00019907579376984944, 'samples': 1476384, 'steps': 2883, 'loss/train': 1.6044238805770874} -09/21/2021 00:28:51 - INFO - __main__ - Step 46138: {'lr': 0.00019907579376984944, 'samples': 1476416, 'steps': 2883, 'loss/train': 1.914957880973816} -09/21/2021 00:28:52 - INFO - __main__ - Step 46139: {'lr': 0.00019907579376984944, 'samples': 1476448, 'steps': 2883, 'loss/train': 1.2344187498092651} -09/21/2021 00:28:54 - INFO - __main__ - Step 46140: {'lr': 0.00019907579376984944, 'samples': 1476480, 'steps': 2883, 'loss/train': 2.1535091400146484} -09/21/2021 00:28:54 - INFO - __main__ - Step 46141: {'lr': 0.00019907579376984944, 'samples': 1476512, 'steps': 2883, 'loss/train': 1.5893441438674927} -09/21/2021 00:28:55 - INFO - __main__ - Step 46142: {'lr': 0.00019907579376984944, 'samples': 1476544, 'steps': 2883, 'loss/train': 1.9549446105957031} -09/21/2021 00:28:56 - INFO - __main__ - Step 46143: {'lr': 0.00019907579376984944, 'samples': 1476576, 'steps': 2883, 'loss/train': 2.1467738151550293} -09/21/2021 00:28:57 - INFO - __main__ - Step 46144: {'lr': 0.00019907579376984944, 'samples': 1476608, 'steps': 2883, 'loss/train': 2.39866042137146} -09/21/2021 00:28:57 - INFO - __main__ - Step 46145: {'lr': 0.0001990749283268398, 'samples': 1476640, 'steps': 2884, 'loss/train': 2.1391382217407227} -09/21/2021 00:28:58 - INFO - __main__ - Step 46146: {'lr': 0.0001990749283268398, 'samples': 1476672, 'steps': 2884, 'loss/train': 2.9323160648345947} -09/21/2021 00:28:59 - INFO - __main__ - Step 46147: {'lr': 0.0001990749283268398, 'samples': 1476704, 'steps': 2884, 'loss/train': 1.3248013257980347} -09/21/2021 00:29:00 - INFO - __main__ - Step 46148: {'lr': 0.0001990749283268398, 'samples': 1476736, 'steps': 2884, 'loss/train': 1.4950389862060547} -09/21/2021 00:29:00 - INFO - __main__ - Step 46149: {'lr': 0.0001990749283268398, 'samples': 1476768, 'steps': 2884, 'loss/train': 2.434744358062744} -09/21/2021 00:29:01 - INFO - __main__ - Step 46150: {'lr': 0.0001990749283268398, 'samples': 1476800, 'steps': 2884, 'loss/train': 1.6521767377853394} -09/21/2021 00:29:02 - INFO - __main__ - Step 46151: {'lr': 0.0001990749283268398, 'samples': 1476832, 'steps': 2884, 'loss/train': 2.015690803527832} -09/21/2021 00:29:03 - INFO - __main__ - Step 46152: {'lr': 0.0001990749283268398, 'samples': 1476864, 'steps': 2884, 'loss/train': 1.145490050315857} -09/21/2021 00:29:03 - INFO - __main__ - Step 46153: {'lr': 0.0001990749283268398, 'samples': 1476896, 'steps': 2884, 'loss/train': 1.9248625040054321} -09/21/2021 00:29:04 - INFO - __main__ - Step 46154: {'lr': 0.0001990749283268398, 'samples': 1476928, 'steps': 2884, 'loss/train': 2.4086549282073975} -09/21/2021 00:29:05 - INFO - __main__ - Step 46155: {'lr': 0.0001990749283268398, 'samples': 1476960, 'steps': 2884, 'loss/train': 2.035477638244629} -09/21/2021 00:29:06 - INFO - __main__ - Step 46156: {'lr': 0.0001990749283268398, 'samples': 1476992, 'steps': 2884, 'loss/train': 1.9868454933166504} -09/21/2021 00:29:06 - INFO - __main__ - Step 46157: {'lr': 0.0001990749283268398, 'samples': 1477024, 'steps': 2884, 'loss/train': 1.99833083152771} -09/21/2021 00:29:07 - INFO - __main__ - Step 46158: {'lr': 0.0001990749283268398, 'samples': 1477056, 'steps': 2884, 'loss/train': 2.8163185119628906} -09/21/2021 00:29:08 - INFO - __main__ - Step 46159: {'lr': 0.0001990749283268398, 'samples': 1477088, 'steps': 2884, 'loss/train': 2.870501756668091} -09/21/2021 00:29:09 - INFO - __main__ - Step 46160: {'lr': 0.0001990749283268398, 'samples': 1477120, 'steps': 2884, 'loss/train': 1.9673444032669067} -09/21/2021 00:29:10 - INFO - __main__ - Step 46161: {'lr': 0.00019907406248069465, 'samples': 1477152, 'steps': 2885, 'loss/train': 2.0552942752838135} -09/21/2021 00:29:10 - INFO - __main__ - Step 46162: {'lr': 0.00019907406248069465, 'samples': 1477184, 'steps': 2885, 'loss/train': 1.9511451721191406} -09/21/2021 00:29:11 - INFO - __main__ - Step 46163: {'lr': 0.00019907406248069465, 'samples': 1477216, 'steps': 2885, 'loss/train': 6.2317795753479} -09/21/2021 00:29:12 - INFO - __main__ - Step 46164: {'lr': 0.00019907406248069465, 'samples': 1477248, 'steps': 2885, 'loss/train': 5.636096477508545} -09/21/2021 00:29:13 - INFO - __main__ - Step 46165: {'lr': 0.00019907406248069465, 'samples': 1477280, 'steps': 2885, 'loss/train': 5.536646842956543} -09/21/2021 00:29:13 - INFO - __main__ - Step 46166: {'lr': 0.00019907406248069465, 'samples': 1477312, 'steps': 2885, 'loss/train': 6.0395188331604} -09/21/2021 00:29:14 - INFO - __main__ - Step 46167: {'lr': 0.00019907406248069465, 'samples': 1477344, 'steps': 2885, 'loss/train': 5.731837749481201} -09/21/2021 00:29:15 - INFO - __main__ - Step 46168: {'lr': 0.00019907406248069465, 'samples': 1477376, 'steps': 2885, 'loss/train': 1.2757234573364258} -09/21/2021 00:29:16 - INFO - __main__ - Step 46169: {'lr': 0.00019907406248069465, 'samples': 1477408, 'steps': 2885, 'loss/train': 2.8924412727355957} -09/21/2021 00:29:16 - INFO - __main__ - Step 46170: {'lr': 0.00019907406248069465, 'samples': 1477440, 'steps': 2885, 'loss/train': 2.1506998538970947} -09/21/2021 00:29:17 - INFO - __main__ - Step 46171: {'lr': 0.00019907406248069465, 'samples': 1477472, 'steps': 2885, 'loss/train': 1.89657461643219} -09/21/2021 00:29:18 - INFO - __main__ - Step 46172: {'lr': 0.00019907406248069465, 'samples': 1477504, 'steps': 2885, 'loss/train': 2.5413997173309326} -09/21/2021 00:29:19 - INFO - __main__ - Step 46173: {'lr': 0.00019907406248069465, 'samples': 1477536, 'steps': 2885, 'loss/train': 1.8444032669067383} -09/21/2021 00:29:21 - INFO - __main__ - Step 46174: {'lr': 0.00019907406248069465, 'samples': 1477568, 'steps': 2885, 'loss/train': 1.638607144355774} -09/21/2021 00:29:22 - INFO - __main__ - Step 46175: {'lr': 0.00019907406248069465, 'samples': 1477600, 'steps': 2885, 'loss/train': 1.9968947172164917} -09/21/2021 00:29:22 - INFO - __main__ - Step 46176: {'lr': 0.00019907406248069465, 'samples': 1477632, 'steps': 2885, 'loss/train': 1.9902229309082031} -09/21/2021 00:29:23 - INFO - __main__ - Step 46177: {'lr': 0.00019907319623141753, 'samples': 1477664, 'steps': 2886, 'loss/train': 2.2684547901153564} -09/21/2021 00:29:24 - INFO - __main__ - Step 46178: {'lr': 0.00019907319623141753, 'samples': 1477696, 'steps': 2886, 'loss/train': 2.782604217529297} -09/21/2021 00:29:25 - INFO - __main__ - Step 46179: {'lr': 0.00019907319623141753, 'samples': 1477728, 'steps': 2886, 'loss/train': 2.5069196224212646} -09/21/2021 00:29:26 - INFO - __main__ - Step 46180: {'lr': 0.00019907319623141753, 'samples': 1477760, 'steps': 2886, 'loss/train': 1.9027596712112427} -09/21/2021 00:29:26 - INFO - __main__ - Step 46181: {'lr': 0.00019907319623141753, 'samples': 1477792, 'steps': 2886, 'loss/train': 1.9087430238723755} -09/21/2021 00:29:27 - INFO - __main__ - Step 46182: {'lr': 0.00019907319623141753, 'samples': 1477824, 'steps': 2886, 'loss/train': 2.0567309856414795} -09/21/2021 00:29:28 - INFO - __main__ - Step 46183: {'lr': 0.00019907319623141753, 'samples': 1477856, 'steps': 2886, 'loss/train': 0.3817935287952423} -09/21/2021 00:29:29 - INFO - __main__ - Step 46184: {'lr': 0.00019907319623141753, 'samples': 1477888, 'steps': 2886, 'loss/train': 1.9513983726501465} -09/21/2021 00:29:29 - INFO - __main__ - Step 46185: {'lr': 0.00019907319623141753, 'samples': 1477920, 'steps': 2886, 'loss/train': 2.227454900741577} -09/21/2021 00:29:30 - INFO - __main__ - Step 46186: {'lr': 0.00019907319623141753, 'samples': 1477952, 'steps': 2886, 'loss/train': 1.5618500709533691} -09/21/2021 00:29:31 - INFO - __main__ - Step 46187: {'lr': 0.00019907319623141753, 'samples': 1477984, 'steps': 2886, 'loss/train': 0.36762577295303345} -09/21/2021 00:29:32 - INFO - __main__ - Step 46188: {'lr': 0.00019907319623141753, 'samples': 1478016, 'steps': 2886, 'loss/train': 2.197253942489624} -09/21/2021 00:29:32 - INFO - __main__ - Step 46189: {'lr': 0.00019907319623141753, 'samples': 1478048, 'steps': 2886, 'loss/train': 3.1642918586730957} -09/21/2021 00:29:33 - INFO - __main__ - Step 46190: {'lr': 0.00019907319623141753, 'samples': 1478080, 'steps': 2886, 'loss/train': 2.3393683433532715} -09/21/2021 00:29:34 - INFO - __main__ - Step 46191: {'lr': 0.00019907319623141753, 'samples': 1478112, 'steps': 2886, 'loss/train': 2.645780086517334} -09/21/2021 00:29:35 - INFO - __main__ - Step 46192: {'lr': 0.00019907319623141753, 'samples': 1478144, 'steps': 2886, 'loss/train': 2.6026060581207275} -09/21/2021 00:29:35 - INFO - __main__ - Step 46193: {'lr': 0.00019907232957901196, 'samples': 1478176, 'steps': 2887, 'loss/train': 3.596717357635498} -09/21/2021 00:29:36 - INFO - __main__ - Step 46194: {'lr': 0.00019907232957901196, 'samples': 1478208, 'steps': 2887, 'loss/train': 4.029306411743164} -09/21/2021 00:29:37 - INFO - __main__ - Step 46195: {'lr': 0.00019907232957901196, 'samples': 1478240, 'steps': 2887, 'loss/train': 3.972480297088623} -09/21/2021 00:29:38 - INFO - __main__ - Step 46196: {'lr': 0.00019907232957901196, 'samples': 1478272, 'steps': 2887, 'loss/train': 3.7111992835998535} -09/21/2021 00:29:38 - INFO - __main__ - Step 46197: {'lr': 0.00019907232957901196, 'samples': 1478304, 'steps': 2887, 'loss/train': 3.784451484680176} -09/21/2021 00:29:39 - INFO - __main__ - Step 46198: {'lr': 0.00019907232957901196, 'samples': 1478336, 'steps': 2887, 'loss/train': 1.8614146709442139} -09/21/2021 00:29:40 - INFO - __main__ - Step 46199: {'lr': 0.00019907232957901196, 'samples': 1478368, 'steps': 2887, 'loss/train': 1.8435461521148682} -09/21/2021 00:29:41 - INFO - __main__ - Step 46200: {'lr': 0.00019907232957901196, 'samples': 1478400, 'steps': 2887, 'loss/train': 1.9533157348632812} -09/21/2021 00:29:41 - INFO - __main__ - Step 46201: {'lr': 0.00019907232957901196, 'samples': 1478432, 'steps': 2887, 'loss/train': 2.656754732131958} -09/21/2021 00:29:42 - INFO - __main__ - Step 46202: {'lr': 0.00019907232957901196, 'samples': 1478464, 'steps': 2887, 'loss/train': 2.0703749656677246} -09/21/2021 00:29:43 - INFO - __main__ - Step 46203: {'lr': 0.00019907232957901196, 'samples': 1478496, 'steps': 2887, 'loss/train': 2.068018674850464} -09/21/2021 00:29:44 - INFO - __main__ - Step 46204: {'lr': 0.00019907232957901196, 'samples': 1478528, 'steps': 2887, 'loss/train': 2.228065013885498} -09/21/2021 00:29:44 - INFO - __main__ - Step 46205: {'lr': 0.00019907232957901196, 'samples': 1478560, 'steps': 2887, 'loss/train': 2.029522180557251} -09/21/2021 00:29:45 - INFO - __main__ - Step 46206: {'lr': 0.00019907232957901196, 'samples': 1478592, 'steps': 2887, 'loss/train': 1.8460863828659058} -09/21/2021 00:29:46 - INFO - __main__ - Step 46207: {'lr': 0.00019907232957901196, 'samples': 1478624, 'steps': 2887, 'loss/train': 0.8623737692832947} -09/21/2021 00:29:47 - INFO - __main__ - Step 46208: {'lr': 0.00019907232957901196, 'samples': 1478656, 'steps': 2887, 'loss/train': 2.0623936653137207} -09/21/2021 00:29:48 - INFO - __main__ - Step 46209: {'lr': 0.00019907146252348147, 'samples': 1478688, 'steps': 2888, 'loss/train': 1.7916195392608643} -09/21/2021 00:29:48 - INFO - __main__ - Step 46210: {'lr': 0.00019907146252348147, 'samples': 1478720, 'steps': 2888, 'loss/train': 2.000499725341797} -09/21/2021 00:29:50 - INFO - __main__ - Step 46211: {'lr': 0.00019907146252348147, 'samples': 1478752, 'steps': 2888, 'loss/train': 1.4454857110977173} -09/21/2021 00:29:50 - INFO - __main__ - Step 46212: {'lr': 0.00019907146252348147, 'samples': 1478784, 'steps': 2888, 'loss/train': 2.239408016204834} -09/21/2021 00:29:51 - INFO - __main__ - Step 46213: {'lr': 0.00019907146252348147, 'samples': 1478816, 'steps': 2888, 'loss/train': 2.457984685897827} -09/21/2021 00:29:52 - INFO - __main__ - Step 46214: {'lr': 0.00019907146252348147, 'samples': 1478848, 'steps': 2888, 'loss/train': 1.6968474388122559} -09/21/2021 00:29:53 - INFO - __main__ - Step 46215: {'lr': 0.00019907146252348147, 'samples': 1478880, 'steps': 2888, 'loss/train': 2.4378485679626465} -09/21/2021 00:29:53 - INFO - __main__ - Step 46216: {'lr': 0.00019907146252348147, 'samples': 1478912, 'steps': 2888, 'loss/train': 1.6405730247497559} -09/21/2021 00:29:54 - INFO - __main__ - Step 46217: {'lr': 0.00019907146252348147, 'samples': 1478944, 'steps': 2888, 'loss/train': 2.274541139602661} -09/21/2021 00:29:55 - INFO - __main__ - Step 46218: {'lr': 0.00019907146252348147, 'samples': 1478976, 'steps': 2888, 'loss/train': 1.5254039764404297} -09/21/2021 00:29:56 - INFO - __main__ - Step 46219: {'lr': 0.00019907146252348147, 'samples': 1479008, 'steps': 2888, 'loss/train': 1.3413033485412598} -09/21/2021 00:29:56 - INFO - __main__ - Step 46220: {'lr': 0.00019907146252348147, 'samples': 1479040, 'steps': 2888, 'loss/train': 1.7582857608795166} -09/21/2021 00:29:57 - INFO - __main__ - Step 46221: {'lr': 0.00019907146252348147, 'samples': 1479072, 'steps': 2888, 'loss/train': 1.658058762550354} -09/21/2021 00:29:58 - INFO - __main__ - Step 46222: {'lr': 0.00019907146252348147, 'samples': 1479104, 'steps': 2888, 'loss/train': 2.2237677574157715} -09/21/2021 00:29:59 - INFO - __main__ - Step 46223: {'lr': 0.00019907146252348147, 'samples': 1479136, 'steps': 2888, 'loss/train': 4.054081439971924} -09/21/2021 00:29:59 - INFO - __main__ - Step 46224: {'lr': 0.00019907146252348147, 'samples': 1479168, 'steps': 2888, 'loss/train': 1.8814575672149658} -09/21/2021 00:30:00 - INFO - __main__ - Step 46225: {'lr': 0.00019907059506482958, 'samples': 1479200, 'steps': 2889, 'loss/train': 1.6302692890167236} -09/21/2021 00:30:01 - INFO - __main__ - Step 46226: {'lr': 0.00019907059506482958, 'samples': 1479232, 'steps': 2889, 'loss/train': 1.2634433507919312} -09/21/2021 00:30:02 - INFO - __main__ - Step 46227: {'lr': 0.00019907059506482958, 'samples': 1479264, 'steps': 2889, 'loss/train': 1.7400777339935303} -09/21/2021 00:30:03 - INFO - __main__ - Step 46228: {'lr': 0.00019907059506482958, 'samples': 1479296, 'steps': 2889, 'loss/train': 2.1948578357696533} -09/21/2021 00:30:03 - INFO - __main__ - Step 46229: {'lr': 0.00019907059506482958, 'samples': 1479328, 'steps': 2889, 'loss/train': 2.606174945831299} -09/21/2021 00:30:04 - INFO - __main__ - Step 46230: {'lr': 0.00019907059506482958, 'samples': 1479360, 'steps': 2889, 'loss/train': 2.2432408332824707} -09/21/2021 00:30:05 - INFO - __main__ - Step 46231: {'lr': 0.00019907059506482958, 'samples': 1479392, 'steps': 2889, 'loss/train': 1.9049055576324463} -09/21/2021 00:30:06 - INFO - __main__ - Step 46232: {'lr': 0.00019907059506482958, 'samples': 1479424, 'steps': 2889, 'loss/train': 3.0201618671417236} -09/21/2021 00:30:06 - INFO - __main__ - Step 46233: {'lr': 0.00019907059506482958, 'samples': 1479456, 'steps': 2889, 'loss/train': 1.7516499757766724} -09/21/2021 00:30:07 - INFO - __main__ - Step 46234: {'lr': 0.00019907059506482958, 'samples': 1479488, 'steps': 2889, 'loss/train': 2.0079026222229004} -09/21/2021 00:30:08 - INFO - __main__ - Step 46235: {'lr': 0.00019907059506482958, 'samples': 1479520, 'steps': 2889, 'loss/train': 1.8955639600753784} -09/21/2021 00:30:09 - INFO - __main__ - Step 46236: {'lr': 0.00019907059506482958, 'samples': 1479552, 'steps': 2889, 'loss/train': 2.2014405727386475} -09/21/2021 00:30:09 - INFO - __main__ - Step 46237: {'lr': 0.00019907059506482958, 'samples': 1479584, 'steps': 2889, 'loss/train': 1.1551064252853394} -09/21/2021 00:30:10 - INFO - __main__ - Step 46238: {'lr': 0.00019907059506482958, 'samples': 1479616, 'steps': 2889, 'loss/train': 2.89863657951355} -09/21/2021 00:30:11 - INFO - __main__ - Step 46239: {'lr': 0.00019907059506482958, 'samples': 1479648, 'steps': 2889, 'loss/train': 1.9885140657424927} -09/21/2021 00:30:12 - INFO - __main__ - Step 46240: {'lr': 0.00019907059506482958, 'samples': 1479680, 'steps': 2889, 'loss/train': 2.320202350616455} -09/21/2021 00:30:13 - INFO - __main__ - Step 46241: {'lr': 0.0001990697272030598, 'samples': 1479712, 'steps': 2890, 'loss/train': 2.27742862701416} -09/21/2021 00:30:14 - INFO - __main__ - Step 46242: {'lr': 0.0001990697272030598, 'samples': 1479744, 'steps': 2890, 'loss/train': 1.6355054378509521} -09/21/2021 00:30:15 - INFO - __main__ - Step 46243: {'lr': 0.0001990697272030598, 'samples': 1479776, 'steps': 2890, 'loss/train': 2.496835470199585} -09/21/2021 00:30:15 - INFO - __main__ - Step 46244: {'lr': 0.0001990697272030598, 'samples': 1479808, 'steps': 2890, 'loss/train': 2.146204710006714} -09/21/2021 00:30:16 - INFO - __main__ - Step 46245: {'lr': 0.0001990697272030598, 'samples': 1479840, 'steps': 2890, 'loss/train': 2.1177992820739746} -09/21/2021 00:30:17 - INFO - __main__ - Step 46246: {'lr': 0.0001990697272030598, 'samples': 1479872, 'steps': 2890, 'loss/train': 2.1990532875061035} -09/21/2021 00:30:18 - INFO - __main__ - Step 46247: {'lr': 0.0001990697272030598, 'samples': 1479904, 'steps': 2890, 'loss/train': 1.462350845336914} -09/21/2021 00:30:18 - INFO - __main__ - Step 46248: {'lr': 0.0001990697272030598, 'samples': 1479936, 'steps': 2890, 'loss/train': 1.9537299871444702} -09/21/2021 00:30:19 - INFO - __main__ - Step 46249: {'lr': 0.0001990697272030598, 'samples': 1479968, 'steps': 2890, 'loss/train': 2.110459804534912} -09/21/2021 00:30:20 - INFO - __main__ - Step 46250: {'lr': 0.0001990697272030598, 'samples': 1480000, 'steps': 2890, 'loss/train': 1.4195650815963745} -09/21/2021 00:30:21 - INFO - __main__ - Step 46251: {'lr': 0.0001990697272030598, 'samples': 1480032, 'steps': 2890, 'loss/train': 1.3689758777618408} -09/21/2021 00:30:21 - INFO - __main__ - Step 46252: {'lr': 0.0001990697272030598, 'samples': 1480064, 'steps': 2890, 'loss/train': 0.9993861317634583} -09/21/2021 00:30:22 - INFO - __main__ - Step 46253: {'lr': 0.0001990697272030598, 'samples': 1480096, 'steps': 2890, 'loss/train': 2.0902411937713623} -09/21/2021 00:30:23 - INFO - __main__ - Step 46254: {'lr': 0.0001990697272030598, 'samples': 1480128, 'steps': 2890, 'loss/train': 1.0613532066345215} -09/21/2021 00:30:24 - INFO - __main__ - Step 46255: {'lr': 0.0001990697272030598, 'samples': 1480160, 'steps': 2890, 'loss/train': 1.9090851545333862} -09/21/2021 00:30:24 - INFO - __main__ - Step 46256: {'lr': 0.0001990697272030598, 'samples': 1480192, 'steps': 2890, 'loss/train': 1.642581820487976} -09/21/2021 00:30:25 - INFO - __main__ - Step 46257: {'lr': 0.00019906885893817574, 'samples': 1480224, 'steps': 2891, 'loss/train': 2.4968535900115967} -09/21/2021 00:30:26 - INFO - __main__ - Step 46258: {'lr': 0.00019906885893817574, 'samples': 1480256, 'steps': 2891, 'loss/train': 2.0507938861846924} -09/21/2021 00:30:27 - INFO - __main__ - Step 46259: {'lr': 0.00019906885893817574, 'samples': 1480288, 'steps': 2891, 'loss/train': 2.1952662467956543} -09/21/2021 00:30:27 - INFO - __main__ - Step 46260: {'lr': 0.00019906885893817574, 'samples': 1480320, 'steps': 2891, 'loss/train': 2.069493293762207} -09/21/2021 00:30:28 - INFO - __main__ - Step 46261: {'lr': 0.00019906885893817574, 'samples': 1480352, 'steps': 2891, 'loss/train': 2.146967649459839} -09/21/2021 00:30:29 - INFO - __main__ - Step 46262: {'lr': 0.00019906885893817574, 'samples': 1480384, 'steps': 2891, 'loss/train': 2.045233726501465} -09/21/2021 00:30:30 - INFO - __main__ - Step 46263: {'lr': 0.00019906885893817574, 'samples': 1480416, 'steps': 2891, 'loss/train': 1.720310091972351} -09/21/2021 00:30:30 - INFO - __main__ - Step 46264: {'lr': 0.00019906885893817574, 'samples': 1480448, 'steps': 2891, 'loss/train': 2.1823744773864746} -09/21/2021 00:30:31 - INFO - __main__ - Step 46265: {'lr': 0.00019906885893817574, 'samples': 1480480, 'steps': 2891, 'loss/train': 1.9860700368881226} -09/21/2021 00:30:32 - INFO - __main__ - Step 46266: {'lr': 0.00019906885893817574, 'samples': 1480512, 'steps': 2891, 'loss/train': 2.7106919288635254} -09/21/2021 00:30:33 - INFO - __main__ - Step 46267: {'lr': 0.00019906885893817574, 'samples': 1480544, 'steps': 2891, 'loss/train': 2.9356632232666016} -09/21/2021 00:30:33 - INFO - __main__ - Step 46268: {'lr': 0.00019906885893817574, 'samples': 1480576, 'steps': 2891, 'loss/train': 1.8239920139312744} -09/21/2021 00:30:34 - INFO - __main__ - Step 46269: {'lr': 0.00019906885893817574, 'samples': 1480608, 'steps': 2891, 'loss/train': 1.7240935564041138} -09/21/2021 00:30:35 - INFO - __main__ - Step 46270: {'lr': 0.00019906885893817574, 'samples': 1480640, 'steps': 2891, 'loss/train': 2.5138468742370605} -09/21/2021 00:30:36 - INFO - __main__ - Step 46271: {'lr': 0.00019906885893817574, 'samples': 1480672, 'steps': 2891, 'loss/train': 0.15593013167381287} -09/21/2021 00:30:38 - INFO - __main__ - Step 46272: {'lr': 0.00019906885893817574, 'samples': 1480704, 'steps': 2891, 'loss/train': 0.30344218015670776} -09/21/2021 00:30:39 - INFO - __main__ - Step 46273: {'lr': 0.00019906799027018083, 'samples': 1480736, 'steps': 2892, 'loss/train': 2.4434244632720947} -09/21/2021 00:30:39 - INFO - __main__ - Step 46274: {'lr': 0.00019906799027018083, 'samples': 1480768, 'steps': 2892, 'loss/train': 1.843263030052185} -09/21/2021 00:30:40 - INFO - __main__ - Step 46275: {'lr': 0.00019906799027018083, 'samples': 1480800, 'steps': 2892, 'loss/train': 1.9743068218231201} -09/21/2021 00:30:41 - INFO - __main__ - Step 46276: {'lr': 0.00019906799027018083, 'samples': 1480832, 'steps': 2892, 'loss/train': 0.1666393131017685} -09/21/2021 00:30:42 - INFO - __main__ - Step 46277: {'lr': 0.00019906799027018083, 'samples': 1480864, 'steps': 2892, 'loss/train': 0.1361285001039505} -09/21/2021 00:30:42 - INFO - __main__ - Step 46278: {'lr': 0.00019906799027018083, 'samples': 1480896, 'steps': 2892, 'loss/train': 0.19476185739040375} -09/21/2021 00:30:43 - INFO - __main__ - Step 46279: {'lr': 0.00019906799027018083, 'samples': 1480928, 'steps': 2892, 'loss/train': 1.902443528175354} -09/21/2021 00:30:44 - INFO - __main__ - Step 46280: {'lr': 0.00019906799027018083, 'samples': 1480960, 'steps': 2892, 'loss/train': 2.567096471786499} -09/21/2021 00:30:45 - INFO - __main__ - Step 46281: {'lr': 0.00019906799027018083, 'samples': 1480992, 'steps': 2892, 'loss/train': 1.4844361543655396} -09/21/2021 00:30:45 - INFO - __main__ - Step 46282: {'lr': 0.00019906799027018083, 'samples': 1481024, 'steps': 2892, 'loss/train': 2.1593472957611084} -09/21/2021 00:30:46 - INFO - __main__ - Step 46283: {'lr': 0.00019906799027018083, 'samples': 1481056, 'steps': 2892, 'loss/train': 2.4771077632904053} -09/21/2021 00:30:47 - INFO - __main__ - Step 46284: {'lr': 0.00019906799027018083, 'samples': 1481088, 'steps': 2892, 'loss/train': 0.7381072640419006} -09/21/2021 00:30:48 - INFO - __main__ - Step 46285: {'lr': 0.00019906799027018083, 'samples': 1481120, 'steps': 2892, 'loss/train': 2.2676212787628174} -09/21/2021 00:30:48 - INFO - __main__ - Step 46286: {'lr': 0.00019906799027018083, 'samples': 1481152, 'steps': 2892, 'loss/train': 0.29365548491477966} -09/21/2021 00:30:49 - INFO - __main__ - Step 46287: {'lr': 0.00019906799027018083, 'samples': 1481184, 'steps': 2892, 'loss/train': 1.456539511680603} -09/21/2021 00:30:50 - INFO - __main__ - Step 46288: {'lr': 0.00019906799027018083, 'samples': 1481216, 'steps': 2892, 'loss/train': 2.302482843399048} -09/21/2021 00:30:51 - INFO - __main__ - Step 46289: {'lr': 0.00019906712119907867, 'samples': 1481248, 'steps': 2893, 'loss/train': 1.8044648170471191} -09/21/2021 00:30:51 - INFO - __main__ - Step 46290: {'lr': 0.00019906712119907867, 'samples': 1481280, 'steps': 2893, 'loss/train': 2.0924360752105713} -09/21/2021 00:30:52 - INFO - __main__ - Step 46291: {'lr': 0.00019906712119907867, 'samples': 1481312, 'steps': 2893, 'loss/train': 1.471564769744873} -09/21/2021 00:30:53 - INFO - __main__ - Step 46292: {'lr': 0.00019906712119907867, 'samples': 1481344, 'steps': 2893, 'loss/train': 1.7439285516738892} -09/21/2021 00:30:54 - INFO - __main__ - Step 46293: {'lr': 0.00019906712119907867, 'samples': 1481376, 'steps': 2893, 'loss/train': 2.480935573577881} -09/21/2021 00:30:54 - INFO - __main__ - Step 46294: {'lr': 0.00019906712119907867, 'samples': 1481408, 'steps': 2893, 'loss/train': 2.747241258621216} -09/21/2021 00:30:55 - INFO - __main__ - Step 46295: {'lr': 0.00019906712119907867, 'samples': 1481440, 'steps': 2893, 'loss/train': 2.0851659774780273} -09/21/2021 00:30:56 - INFO - __main__ - Step 46296: {'lr': 0.00019906712119907867, 'samples': 1481472, 'steps': 2893, 'loss/train': 1.1876498460769653} -09/21/2021 00:30:57 - INFO - __main__ - Step 46297: {'lr': 0.00019906712119907867, 'samples': 1481504, 'steps': 2893, 'loss/train': 1.3502376079559326} -09/21/2021 00:30:57 - INFO - __main__ - Step 46298: {'lr': 0.00019906712119907867, 'samples': 1481536, 'steps': 2893, 'loss/train': 2.7947909832000732} -09/21/2021 00:30:58 - INFO - __main__ - Step 46299: {'lr': 0.00019906712119907867, 'samples': 1481568, 'steps': 2893, 'loss/train': 1.862676739692688} -09/21/2021 00:30:59 - INFO - __main__ - Step 46300: {'lr': 0.00019906712119907867, 'samples': 1481600, 'steps': 2893, 'loss/train': 1.8425847291946411} -09/21/2021 00:31:00 - INFO - __main__ - Step 46301: {'lr': 0.00019906712119907867, 'samples': 1481632, 'steps': 2893, 'loss/train': 0.5865341424942017} -09/21/2021 00:31:00 - INFO - __main__ - Step 46302: {'lr': 0.00019906712119907867, 'samples': 1481664, 'steps': 2893, 'loss/train': 0.30964264273643494} -09/21/2021 00:31:01 - INFO - __main__ - Step 46303: {'lr': 0.00019906712119907867, 'samples': 1481696, 'steps': 2893, 'loss/train': 0.14784324169158936} -09/21/2021 00:31:02 - INFO - __main__ - Step 46304: {'lr': 0.00019906712119907867, 'samples': 1481728, 'steps': 2893, 'loss/train': 0.24042177200317383} -09/21/2021 00:31:03 - INFO - __main__ - Step 46305: {'lr': 0.0001990662517248728, 'samples': 1481760, 'steps': 2894, 'loss/train': 0.2779507339000702} -09/21/2021 00:31:04 - INFO - __main__ - Step 46306: {'lr': 0.0001990662517248728, 'samples': 1481792, 'steps': 2894, 'loss/train': 0.4910758435726166} -09/21/2021 00:31:04 - INFO - __main__ - Step 46307: {'lr': 0.0001990662517248728, 'samples': 1481824, 'steps': 2894, 'loss/train': 0.19401399791240692} -09/21/2021 00:31:06 - INFO - __main__ - Step 46308: {'lr': 0.0001990662517248728, 'samples': 1481856, 'steps': 2894, 'loss/train': 0.12440718710422516} -09/21/2021 00:31:06 - INFO - __main__ - Step 46309: {'lr': 0.0001990662517248728, 'samples': 1481888, 'steps': 2894, 'loss/train': 1.1333460807800293} -09/21/2021 00:31:07 - INFO - __main__ - Step 46310: {'lr': 0.0001990662517248728, 'samples': 1481920, 'steps': 2894, 'loss/train': 2.5372350215911865} -09/21/2021 00:31:08 - INFO - __main__ - Step 46311: {'lr': 0.0001990662517248728, 'samples': 1481952, 'steps': 2894, 'loss/train': 1.873697280883789} -09/21/2021 00:31:09 - INFO - __main__ - Step 46312: {'lr': 0.0001990662517248728, 'samples': 1481984, 'steps': 2894, 'loss/train': 1.847948431968689} -09/21/2021 00:31:09 - INFO - __main__ - Step 46313: {'lr': 0.0001990662517248728, 'samples': 1482016, 'steps': 2894, 'loss/train': 1.4753912687301636} -09/21/2021 00:31:10 - INFO - __main__ - Step 46314: {'lr': 0.0001990662517248728, 'samples': 1482048, 'steps': 2894, 'loss/train': 1.9631648063659668} -09/21/2021 00:31:11 - INFO - __main__ - Step 46315: {'lr': 0.0001990662517248728, 'samples': 1482080, 'steps': 2894, 'loss/train': 2.1573801040649414} -09/21/2021 00:31:12 - INFO - __main__ - Step 46316: {'lr': 0.0001990662517248728, 'samples': 1482112, 'steps': 2894, 'loss/train': 1.914015531539917} -09/21/2021 00:31:12 - INFO - __main__ - Step 46317: {'lr': 0.0001990662517248728, 'samples': 1482144, 'steps': 2894, 'loss/train': 2.1932249069213867} -09/21/2021 00:31:13 - INFO - __main__ - Step 46318: {'lr': 0.0001990662517248728, 'samples': 1482176, 'steps': 2894, 'loss/train': 1.2837620973587036} -09/21/2021 00:31:14 - INFO - __main__ - Step 46319: {'lr': 0.0001990662517248728, 'samples': 1482208, 'steps': 2894, 'loss/train': 2.4894895553588867} -09/21/2021 00:31:15 - INFO - __main__ - Step 46320: {'lr': 0.0001990662517248728, 'samples': 1482240, 'steps': 2894, 'loss/train': 1.7249369621276855} -09/21/2021 00:31:16 - INFO - __main__ - Step 46321: {'lr': 0.0001990653818475667, 'samples': 1482272, 'steps': 2895, 'loss/train': 2.062739133834839} -09/21/2021 00:31:16 - INFO - __main__ - Step 46322: {'lr': 0.0001990653818475667, 'samples': 1482304, 'steps': 2895, 'loss/train': 2.3360724449157715} -09/21/2021 00:31:17 - INFO - __main__ - Step 46323: {'lr': 0.0001990653818475667, 'samples': 1482336, 'steps': 2895, 'loss/train': 2.440462589263916} -09/21/2021 00:31:18 - INFO - __main__ - Step 46324: {'lr': 0.0001990653818475667, 'samples': 1482368, 'steps': 2895, 'loss/train': 2.736450433731079} -09/21/2021 00:31:19 - INFO - __main__ - Step 46325: {'lr': 0.0001990653818475667, 'samples': 1482400, 'steps': 2895, 'loss/train': 1.2895838022232056} -09/21/2021 00:31:19 - INFO - __main__ - Step 46326: {'lr': 0.0001990653818475667, 'samples': 1482432, 'steps': 2895, 'loss/train': 1.5411947965621948} -09/21/2021 00:31:20 - INFO - __main__ - Step 46327: {'lr': 0.0001990653818475667, 'samples': 1482464, 'steps': 2895, 'loss/train': 2.662233591079712} -09/21/2021 00:31:21 - INFO - __main__ - Step 46328: {'lr': 0.0001990653818475667, 'samples': 1482496, 'steps': 2895, 'loss/train': 2.0694990158081055} -09/21/2021 00:31:22 - INFO - __main__ - Step 46329: {'lr': 0.0001990653818475667, 'samples': 1482528, 'steps': 2895, 'loss/train': 1.932116985321045} -09/21/2021 00:31:22 - INFO - __main__ - Step 46330: {'lr': 0.0001990653818475667, 'samples': 1482560, 'steps': 2895, 'loss/train': 0.990790843963623} -09/21/2021 00:31:23 - INFO - __main__ - Step 46331: {'lr': 0.0001990653818475667, 'samples': 1482592, 'steps': 2895, 'loss/train': 2.0343546867370605} -09/21/2021 00:31:24 - INFO - __main__ - Step 46332: {'lr': 0.0001990653818475667, 'samples': 1482624, 'steps': 2895, 'loss/train': 1.6456042528152466} -09/21/2021 00:31:25 - INFO - __main__ - Step 46333: {'lr': 0.0001990653818475667, 'samples': 1482656, 'steps': 2895, 'loss/train': 2.5772809982299805} -09/21/2021 00:31:25 - INFO - __main__ - Step 46334: {'lr': 0.0001990653818475667, 'samples': 1482688, 'steps': 2895, 'loss/train': 2.357844114303589} -09/21/2021 00:31:26 - INFO - __main__ - Step 46335: {'lr': 0.0001990653818475667, 'samples': 1482720, 'steps': 2895, 'loss/train': 1.1990082263946533} -09/21/2021 00:31:27 - INFO - __main__ - Step 46336: {'lr': 0.0001990653818475667, 'samples': 1482752, 'steps': 2895, 'loss/train': 3.1363508701324463} -09/21/2021 00:31:28 - INFO - __main__ - Step 46337: {'lr': 0.00019906451156716392, 'samples': 1482784, 'steps': 2896, 'loss/train': 2.572221279144287} -09/21/2021 00:31:28 - INFO - __main__ - Step 46338: {'lr': 0.00019906451156716392, 'samples': 1482816, 'steps': 2896, 'loss/train': 1.9598665237426758} -09/21/2021 00:31:30 - INFO - __main__ - Step 46339: {'lr': 0.00019906451156716392, 'samples': 1482848, 'steps': 2896, 'loss/train': 1.2301323413848877} -09/21/2021 00:31:30 - INFO - __main__ - Step 46340: {'lr': 0.00019906451156716392, 'samples': 1482880, 'steps': 2896, 'loss/train': 2.7541849613189697} -09/21/2021 00:31:31 - INFO - __main__ - Step 46341: {'lr': 0.00019906451156716392, 'samples': 1482912, 'steps': 2896, 'loss/train': 1.3096120357513428} -09/21/2021 00:31:32 - INFO - __main__ - Step 46342: {'lr': 0.00019906451156716392, 'samples': 1482944, 'steps': 2896, 'loss/train': 2.247819423675537} -09/21/2021 00:31:33 - INFO - __main__ - Step 46343: {'lr': 0.00019906451156716392, 'samples': 1482976, 'steps': 2896, 'loss/train': 2.4665024280548096} -09/21/2021 00:31:33 - INFO - __main__ - Step 46344: {'lr': 0.00019906451156716392, 'samples': 1483008, 'steps': 2896, 'loss/train': 1.8986057043075562} -09/21/2021 00:31:34 - INFO - __main__ - Step 46345: {'lr': 0.00019906451156716392, 'samples': 1483040, 'steps': 2896, 'loss/train': 1.6000115871429443} -09/21/2021 00:31:35 - INFO - __main__ - Step 46346: {'lr': 0.00019906451156716392, 'samples': 1483072, 'steps': 2896, 'loss/train': 1.99319326877594} -09/21/2021 00:31:36 - INFO - __main__ - Step 46347: {'lr': 0.00019906451156716392, 'samples': 1483104, 'steps': 2896, 'loss/train': 2.2320613861083984} -09/21/2021 00:31:36 - INFO - __main__ - Step 46348: {'lr': 0.00019906451156716392, 'samples': 1483136, 'steps': 2896, 'loss/train': 1.419907808303833} -09/21/2021 00:31:37 - INFO - __main__ - Step 46349: {'lr': 0.00019906451156716392, 'samples': 1483168, 'steps': 2896, 'loss/train': 0.7659675478935242} -09/21/2021 00:31:38 - INFO - __main__ - Step 46350: {'lr': 0.00019906451156716392, 'samples': 1483200, 'steps': 2896, 'loss/train': 2.3081042766571045} -09/21/2021 00:31:39 - INFO - __main__ - Step 46351: {'lr': 0.00019906451156716392, 'samples': 1483232, 'steps': 2896, 'loss/train': 1.6820616722106934} -09/21/2021 00:31:39 - INFO - __main__ - Step 46352: {'lr': 0.00019906451156716392, 'samples': 1483264, 'steps': 2896, 'loss/train': 2.7550976276397705} -09/21/2021 00:31:40 - INFO - __main__ - Step 46353: {'lr': 0.00019906364088366808, 'samples': 1483296, 'steps': 2897, 'loss/train': 1.8881365060806274} -09/21/2021 00:31:41 - INFO - __main__ - Step 46354: {'lr': 0.00019906364088366808, 'samples': 1483328, 'steps': 2897, 'loss/train': 1.9816489219665527} -09/21/2021 00:31:42 - INFO - __main__ - Step 46355: {'lr': 0.00019906364088366808, 'samples': 1483360, 'steps': 2897, 'loss/train': 0.3867141902446747} -09/21/2021 00:31:43 - INFO - __main__ - Step 46356: {'lr': 0.00019906364088366808, 'samples': 1483392, 'steps': 2897, 'loss/train': 1.4959083795547485} -09/21/2021 00:31:43 - INFO - __main__ - Step 46357: {'lr': 0.00019906364088366808, 'samples': 1483424, 'steps': 2897, 'loss/train': 2.1376967430114746} -09/21/2021 00:31:44 - INFO - __main__ - Step 46358: {'lr': 0.00019906364088366808, 'samples': 1483456, 'steps': 2897, 'loss/train': 1.4315046072006226} -09/21/2021 00:31:45 - INFO - __main__ - Step 46359: {'lr': 0.00019906364088366808, 'samples': 1483488, 'steps': 2897, 'loss/train': 2.9309020042419434} -09/21/2021 00:31:46 - INFO - __main__ - Step 46360: {'lr': 0.00019906364088366808, 'samples': 1483520, 'steps': 2897, 'loss/train': 2.6341934204101562} -09/21/2021 00:31:46 - INFO - __main__ - Step 46361: {'lr': 0.00019906364088366808, 'samples': 1483552, 'steps': 2897, 'loss/train': 2.04904842376709} -09/21/2021 00:31:47 - INFO - __main__ - Step 46362: {'lr': 0.00019906364088366808, 'samples': 1483584, 'steps': 2897, 'loss/train': 0.167317733168602} -09/21/2021 00:31:48 - INFO - __main__ - Step 46363: {'lr': 0.00019906364088366808, 'samples': 1483616, 'steps': 2897, 'loss/train': 2.3630690574645996} -09/21/2021 00:31:49 - INFO - __main__ - Step 46364: {'lr': 0.00019906364088366808, 'samples': 1483648, 'steps': 2897, 'loss/train': 2.3897695541381836} -09/21/2021 00:31:49 - INFO - __main__ - Step 46365: {'lr': 0.00019906364088366808, 'samples': 1483680, 'steps': 2897, 'loss/train': 2.5793673992156982} -09/21/2021 00:31:50 - INFO - __main__ - Step 46366: {'lr': 0.00019906364088366808, 'samples': 1483712, 'steps': 2897, 'loss/train': 2.0540263652801514} -09/21/2021 00:31:51 - INFO - __main__ - Step 46367: {'lr': 0.00019906364088366808, 'samples': 1483744, 'steps': 2897, 'loss/train': 1.8049824237823486} -09/21/2021 00:31:52 - INFO - __main__ - Step 46368: {'lr': 0.00019906364088366808, 'samples': 1483776, 'steps': 2897, 'loss/train': 1.9263163805007935} -09/21/2021 00:31:52 - INFO - __main__ - Step 46369: {'lr': 0.00019906276979708264, 'samples': 1483808, 'steps': 2898, 'loss/train': 0.6875824928283691} -09/21/2021 00:31:53 - INFO - __main__ - Step 46370: {'lr': 0.00019906276979708264, 'samples': 1483840, 'steps': 2898, 'loss/train': 2.669783115386963} -09/21/2021 00:31:54 - INFO - __main__ - Step 46371: {'lr': 0.00019906276979708264, 'samples': 1483872, 'steps': 2898, 'loss/train': 1.5493439435958862} -09/21/2021 00:31:55 - INFO - __main__ - Step 46372: {'lr': 0.00019906276979708264, 'samples': 1483904, 'steps': 2898, 'loss/train': 2.3059380054473877} -09/21/2021 00:31:56 - INFO - __main__ - Step 46373: {'lr': 0.00019906276979708264, 'samples': 1483936, 'steps': 2898, 'loss/train': 2.8447306156158447} -09/21/2021 00:31:57 - INFO - __main__ - Step 46374: {'lr': 0.00019906276979708264, 'samples': 1483968, 'steps': 2898, 'loss/train': 0.6355414390563965} -09/21/2021 00:31:57 - INFO - __main__ - Step 46375: {'lr': 0.00019906276979708264, 'samples': 1484000, 'steps': 2898, 'loss/train': 2.2535645961761475} -09/21/2021 00:31:58 - INFO - __main__ - Step 46376: {'lr': 0.00019906276979708264, 'samples': 1484032, 'steps': 2898, 'loss/train': 2.5815234184265137} -09/21/2021 00:31:59 - INFO - __main__ - Step 46377: {'lr': 0.00019906276979708264, 'samples': 1484064, 'steps': 2898, 'loss/train': 2.1962287425994873} -09/21/2021 00:32:00 - INFO - __main__ - Step 46378: {'lr': 0.00019906276979708264, 'samples': 1484096, 'steps': 2898, 'loss/train': 2.7434144020080566} -09/21/2021 00:32:00 - INFO - __main__ - Step 46379: {'lr': 0.00019906276979708264, 'samples': 1484128, 'steps': 2898, 'loss/train': 2.0158374309539795} -09/21/2021 00:32:01 - INFO - __main__ - Step 46380: {'lr': 0.00019906276979708264, 'samples': 1484160, 'steps': 2898, 'loss/train': 2.8649795055389404} -09/21/2021 00:32:02 - INFO - __main__ - Step 46381: {'lr': 0.00019906276979708264, 'samples': 1484192, 'steps': 2898, 'loss/train': 2.3284049034118652} -09/21/2021 00:32:03 - INFO - __main__ - Step 46382: {'lr': 0.00019906276979708264, 'samples': 1484224, 'steps': 2898, 'loss/train': 1.980966567993164} -09/21/2021 00:32:03 - INFO - __main__ - Step 46383: {'lr': 0.00019906276979708264, 'samples': 1484256, 'steps': 2898, 'loss/train': 2.4492974281311035} -09/21/2021 00:32:04 - INFO - __main__ - Step 46384: {'lr': 0.00019906276979708264, 'samples': 1484288, 'steps': 2898, 'loss/train': 1.6953234672546387} -09/21/2021 00:32:05 - INFO - __main__ - Step 46385: {'lr': 0.0001990618983074112, 'samples': 1484320, 'steps': 2899, 'loss/train': 1.647288203239441} -09/21/2021 00:32:06 - INFO - __main__ - Step 46386: {'lr': 0.0001990618983074112, 'samples': 1484352, 'steps': 2899, 'loss/train': 2.6346065998077393} -09/21/2021 00:32:07 - INFO - __main__ - Step 46387: {'lr': 0.0001990618983074112, 'samples': 1484384, 'steps': 2899, 'loss/train': 2.402153253555298} -09/21/2021 00:32:07 - INFO - __main__ - Step 46388: {'lr': 0.0001990618983074112, 'samples': 1484416, 'steps': 2899, 'loss/train': 2.284029245376587} -09/21/2021 00:32:08 - INFO - __main__ - Step 46389: {'lr': 0.0001990618983074112, 'samples': 1484448, 'steps': 2899, 'loss/train': 1.838434100151062} -09/21/2021 00:32:09 - INFO - __main__ - Step 46390: {'lr': 0.0001990618983074112, 'samples': 1484480, 'steps': 2899, 'loss/train': 4.400279998779297} -09/21/2021 00:32:10 - INFO - __main__ - Step 46391: {'lr': 0.0001990618983074112, 'samples': 1484512, 'steps': 2899, 'loss/train': 1.7703748941421509} -09/21/2021 00:32:10 - INFO - __main__ - Step 46392: {'lr': 0.0001990618983074112, 'samples': 1484544, 'steps': 2899, 'loss/train': 2.4017388820648193} -09/21/2021 00:32:11 - INFO - __main__ - Step 46393: {'lr': 0.0001990618983074112, 'samples': 1484576, 'steps': 2899, 'loss/train': 2.8849375247955322} -09/21/2021 00:32:12 - INFO - __main__ - Step 46394: {'lr': 0.0001990618983074112, 'samples': 1484608, 'steps': 2899, 'loss/train': 0.4242119789123535} -09/21/2021 00:32:13 - INFO - __main__ - Step 46395: {'lr': 0.0001990618983074112, 'samples': 1484640, 'steps': 2899, 'loss/train': 1.5239404439926147} -09/21/2021 00:32:13 - INFO - __main__ - Step 46396: {'lr': 0.0001990618983074112, 'samples': 1484672, 'steps': 2899, 'loss/train': 2.3107869625091553} -09/21/2021 00:32:14 - INFO - __main__ - Step 46397: {'lr': 0.0001990618983074112, 'samples': 1484704, 'steps': 2899, 'loss/train': 0.9914686679840088} -09/21/2021 00:32:15 - INFO - __main__ - Step 46398: {'lr': 0.0001990618983074112, 'samples': 1484736, 'steps': 2899, 'loss/train': 1.9782367944717407} -09/21/2021 00:32:16 - INFO - __main__ - Step 46399: {'lr': 0.0001990618983074112, 'samples': 1484768, 'steps': 2899, 'loss/train': 2.148738145828247} -09/21/2021 00:32:16 - INFO - __main__ - Step 46400: {'lr': 0.0001990618983074112, 'samples': 1484800, 'steps': 2899, 'loss/train': 1.898427963256836} -09/21/2021 00:32:18 - INFO - __main__ - Step 46401: {'lr': 0.00019906102641465727, 'samples': 1484832, 'steps': 2900, 'loss/train': 1.4177753925323486} -09/21/2021 00:32:19 - INFO - __main__ - Step 46402: {'lr': 0.00019906102641465727, 'samples': 1484864, 'steps': 2900, 'loss/train': 3.027782917022705} -09/21/2021 00:32:19 - INFO - __main__ - Step 46403: {'lr': 0.00019906102641465727, 'samples': 1484896, 'steps': 2900, 'loss/train': 0.7790743708610535} -09/21/2021 00:32:20 - INFO - __main__ - Step 46404: {'lr': 0.00019906102641465727, 'samples': 1484928, 'steps': 2900, 'loss/train': 1.9135215282440186} -09/21/2021 00:32:21 - INFO - __main__ - Step 46405: {'lr': 0.00019906102641465727, 'samples': 1484960, 'steps': 2900, 'loss/train': 2.1529464721679688} -09/21/2021 00:32:22 - INFO - __main__ - Step 46406: {'lr': 0.00019906102641465727, 'samples': 1484992, 'steps': 2900, 'loss/train': 1.9451522827148438} -09/21/2021 00:32:22 - INFO - __main__ - Step 46407: {'lr': 0.00019906102641465727, 'samples': 1485024, 'steps': 2900, 'loss/train': 1.3431812524795532} -09/21/2021 00:32:23 - INFO - __main__ - Step 46408: {'lr': 0.00019906102641465727, 'samples': 1485056, 'steps': 2900, 'loss/train': 3.1471316814422607} -09/21/2021 00:32:24 - INFO - __main__ - Step 46409: {'lr': 0.00019906102641465727, 'samples': 1485088, 'steps': 2900, 'loss/train': 2.364057779312134} -09/21/2021 00:32:25 - INFO - __main__ - Step 46410: {'lr': 0.00019906102641465727, 'samples': 1485120, 'steps': 2900, 'loss/train': 2.1713874340057373} -09/21/2021 00:32:25 - INFO - __main__ - Step 46411: {'lr': 0.00019906102641465727, 'samples': 1485152, 'steps': 2900, 'loss/train': 2.5929625034332275} -09/21/2021 00:32:26 - INFO - __main__ - Step 46412: {'lr': 0.00019906102641465727, 'samples': 1485184, 'steps': 2900, 'loss/train': 1.6815707683563232} -09/21/2021 00:32:27 - INFO - __main__ - Step 46413: {'lr': 0.00019906102641465727, 'samples': 1485216, 'steps': 2900, 'loss/train': 2.155405044555664} -09/21/2021 00:32:28 - INFO - __main__ - Step 46414: {'lr': 0.00019906102641465727, 'samples': 1485248, 'steps': 2900, 'loss/train': 0.5123428702354431} -09/21/2021 00:32:28 - INFO - __main__ - Step 46415: {'lr': 0.00019906102641465727, 'samples': 1485280, 'steps': 2900, 'loss/train': 2.0149128437042236} -09/21/2021 00:32:29 - INFO - __main__ - Step 46416: {'lr': 0.00019906102641465727, 'samples': 1485312, 'steps': 2900, 'loss/train': 1.928967833518982} -09/21/2021 00:32:30 - INFO - __main__ - Step 46417: {'lr': 0.0001990601541188244, 'samples': 1485344, 'steps': 2901, 'loss/train': 1.388916015625} -09/21/2021 00:32:31 - INFO - __main__ - Step 46418: {'lr': 0.0001990601541188244, 'samples': 1485376, 'steps': 2901, 'loss/train': 2.65164852142334} -09/21/2021 00:32:31 - INFO - __main__ - Step 46419: {'lr': 0.0001990601541188244, 'samples': 1485408, 'steps': 2901, 'loss/train': 1.7943828105926514} -09/21/2021 00:32:32 - INFO - __main__ - Step 46420: {'lr': 0.0001990601541188244, 'samples': 1485440, 'steps': 2901, 'loss/train': 2.495298147201538} -09/21/2021 00:32:33 - INFO - __main__ - Step 46421: {'lr': 0.0001990601541188244, 'samples': 1485472, 'steps': 2901, 'loss/train': 1.791210412979126} -09/21/2021 00:32:34 - INFO - __main__ - Step 46422: {'lr': 0.0001990601541188244, 'samples': 1485504, 'steps': 2901, 'loss/train': 1.500520944595337} -09/21/2021 00:32:34 - INFO - __main__ - Step 46423: {'lr': 0.0001990601541188244, 'samples': 1485536, 'steps': 2901, 'loss/train': 2.024857521057129} -09/21/2021 00:32:35 - INFO - __main__ - Step 46424: {'lr': 0.0001990601541188244, 'samples': 1485568, 'steps': 2901, 'loss/train': 2.3531577587127686} -09/21/2021 00:32:36 - INFO - __main__ - Step 46425: {'lr': 0.0001990601541188244, 'samples': 1485600, 'steps': 2901, 'loss/train': 1.5009266138076782} -09/21/2021 00:32:37 - INFO - __main__ - Step 46426: {'lr': 0.0001990601541188244, 'samples': 1485632, 'steps': 2901, 'loss/train': 1.440205454826355} -09/21/2021 00:32:37 - INFO - __main__ - Step 46427: {'lr': 0.0001990601541188244, 'samples': 1485664, 'steps': 2901, 'loss/train': 1.6748284101486206} -09/21/2021 00:32:38 - INFO - __main__ - Step 46428: {'lr': 0.0001990601541188244, 'samples': 1485696, 'steps': 2901, 'loss/train': 1.8795186281204224} -09/21/2021 00:32:39 - INFO - __main__ - Step 46429: {'lr': 0.0001990601541188244, 'samples': 1485728, 'steps': 2901, 'loss/train': 2.049044370651245} -09/21/2021 00:32:40 - INFO - __main__ - Step 46430: {'lr': 0.0001990601541188244, 'samples': 1485760, 'steps': 2901, 'loss/train': 2.2420995235443115} -09/21/2021 00:32:41 - INFO - __main__ - Step 46431: {'lr': 0.0001990601541188244, 'samples': 1485792, 'steps': 2901, 'loss/train': 1.4204498529434204} -09/21/2021 00:32:42 - INFO - __main__ - Step 46432: {'lr': 0.0001990601541188244, 'samples': 1485824, 'steps': 2901, 'loss/train': 1.6250312328338623} -09/21/2021 00:32:43 - INFO - __main__ - Step 46433: {'lr': 0.00019905928141991617, 'samples': 1485856, 'steps': 2902, 'loss/train': 2.2865803241729736} -09/21/2021 00:32:43 - INFO - __main__ - Step 46434: {'lr': 0.00019905928141991617, 'samples': 1485888, 'steps': 2902, 'loss/train': 1.7809771299362183} -09/21/2021 00:32:44 - INFO - __main__ - Step 46435: {'lr': 0.00019905928141991617, 'samples': 1485920, 'steps': 2902, 'loss/train': 2.5043866634368896} -09/21/2021 00:32:45 - INFO - __main__ - Step 46436: {'lr': 0.00019905928141991617, 'samples': 1485952, 'steps': 2902, 'loss/train': 1.559869647026062} -09/21/2021 00:32:46 - INFO - __main__ - Step 46437: {'lr': 0.00019905928141991617, 'samples': 1485984, 'steps': 2902, 'loss/train': 1.7020090818405151} -09/21/2021 00:32:46 - INFO - __main__ - Step 46438: {'lr': 0.00019905928141991617, 'samples': 1486016, 'steps': 2902, 'loss/train': 2.184321641921997} -09/21/2021 00:32:47 - INFO - __main__ - Step 46439: {'lr': 0.00019905928141991617, 'samples': 1486048, 'steps': 2902, 'loss/train': 1.9587944746017456} -09/21/2021 00:32:48 - INFO - __main__ - Step 46440: {'lr': 0.00019905928141991617, 'samples': 1486080, 'steps': 2902, 'loss/train': 1.9260215759277344} -09/21/2021 00:32:49 - INFO - __main__ - Step 46441: {'lr': 0.00019905928141991617, 'samples': 1486112, 'steps': 2902, 'loss/train': 2.335618019104004} -09/21/2021 00:32:49 - INFO - __main__ - Step 46442: {'lr': 0.00019905928141991617, 'samples': 1486144, 'steps': 2902, 'loss/train': 1.384529948234558} -09/21/2021 00:32:50 - INFO - __main__ - Step 46443: {'lr': 0.00019905928141991617, 'samples': 1486176, 'steps': 2902, 'loss/train': 2.5951666831970215} -09/21/2021 00:32:51 - INFO - __main__ - Step 46444: {'lr': 0.00019905928141991617, 'samples': 1486208, 'steps': 2902, 'loss/train': 1.441756010055542} -09/21/2021 00:32:52 - INFO - __main__ - Step 46445: {'lr': 0.00019905928141991617, 'samples': 1486240, 'steps': 2902, 'loss/train': 1.848877191543579} -09/21/2021 00:32:52 - INFO - __main__ - Step 46446: {'lr': 0.00019905928141991617, 'samples': 1486272, 'steps': 2902, 'loss/train': 1.534178614616394} -09/21/2021 00:32:53 - INFO - __main__ - Step 46447: {'lr': 0.00019905928141991617, 'samples': 1486304, 'steps': 2902, 'loss/train': 1.7294275760650635} -09/21/2021 00:32:54 - INFO - __main__ - Step 46448: {'lr': 0.00019905928141991617, 'samples': 1486336, 'steps': 2902, 'loss/train': 2.39986515045166} -09/21/2021 00:32:55 - INFO - __main__ - Step 46449: {'lr': 0.0001990584083179361, 'samples': 1486368, 'steps': 2903, 'loss/train': 1.4141950607299805} -09/21/2021 00:32:55 - INFO - __main__ - Step 46450: {'lr': 0.0001990584083179361, 'samples': 1486400, 'steps': 2903, 'loss/train': 2.4112844467163086} -09/21/2021 00:32:56 - INFO - __main__ - Step 46451: {'lr': 0.0001990584083179361, 'samples': 1486432, 'steps': 2903, 'loss/train': 1.5560954809188843} -09/21/2021 00:32:57 - INFO - __main__ - Step 46452: {'lr': 0.0001990584083179361, 'samples': 1486464, 'steps': 2903, 'loss/train': 2.715243101119995} -09/21/2021 00:32:58 - INFO - __main__ - Step 46453: {'lr': 0.0001990584083179361, 'samples': 1486496, 'steps': 2903, 'loss/train': 1.3293284177780151} -09/21/2021 00:32:58 - INFO - __main__ - Step 46454: {'lr': 0.0001990584083179361, 'samples': 1486528, 'steps': 2903, 'loss/train': 1.9811524152755737} -09/21/2021 00:32:59 - INFO - __main__ - Step 46455: {'lr': 0.0001990584083179361, 'samples': 1486560, 'steps': 2903, 'loss/train': 1.2505974769592285} -09/21/2021 00:33:00 - INFO - __main__ - Step 46456: {'lr': 0.0001990584083179361, 'samples': 1486592, 'steps': 2903, 'loss/train': 1.9488403797149658} -09/21/2021 00:33:01 - INFO - __main__ - Step 46457: {'lr': 0.0001990584083179361, 'samples': 1486624, 'steps': 2903, 'loss/train': 1.5669955015182495} -09/21/2021 00:33:01 - INFO - __main__ - Step 46458: {'lr': 0.0001990584083179361, 'samples': 1486656, 'steps': 2903, 'loss/train': 2.0697181224823} -09/21/2021 00:33:02 - INFO - __main__ - Step 46459: {'lr': 0.0001990584083179361, 'samples': 1486688, 'steps': 2903, 'loss/train': 1.8865488767623901} -09/21/2021 00:33:03 - INFO - __main__ - Step 46460: {'lr': 0.0001990584083179361, 'samples': 1486720, 'steps': 2903, 'loss/train': 1.6038806438446045} -09/21/2021 00:33:04 - INFO - __main__ - Step 46461: {'lr': 0.0001990584083179361, 'samples': 1486752, 'steps': 2903, 'loss/train': 2.025038480758667} -09/21/2021 00:33:05 - INFO - __main__ - Step 46462: {'lr': 0.0001990584083179361, 'samples': 1486784, 'steps': 2903, 'loss/train': 0.9937188029289246} -09/21/2021 00:33:06 - INFO - __main__ - Step 46463: {'lr': 0.0001990584083179361, 'samples': 1486816, 'steps': 2903, 'loss/train': 1.3963007926940918} -09/21/2021 00:33:07 - INFO - __main__ - Step 46464: {'lr': 0.0001990584083179361, 'samples': 1486848, 'steps': 2903, 'loss/train': 1.8426669836044312} -09/21/2021 00:33:07 - INFO - __main__ - Step 46465: {'lr': 0.0001990575348128877, 'samples': 1486880, 'steps': 2904, 'loss/train': 1.4485212564468384} -09/21/2021 00:33:08 - INFO - __main__ - Step 46466: {'lr': 0.0001990575348128877, 'samples': 1486912, 'steps': 2904, 'loss/train': 2.341087818145752} -09/21/2021 00:33:09 - INFO - __main__ - Step 46467: {'lr': 0.0001990575348128877, 'samples': 1486944, 'steps': 2904, 'loss/train': 1.6272588968276978} -09/21/2021 00:33:10 - INFO - __main__ - Step 46468: {'lr': 0.0001990575348128877, 'samples': 1486976, 'steps': 2904, 'loss/train': 3.4723479747772217} -09/21/2021 00:33:10 - INFO - __main__ - Step 46469: {'lr': 0.0001990575348128877, 'samples': 1487008, 'steps': 2904, 'loss/train': 1.6250940561294556} -09/21/2021 00:33:11 - INFO - __main__ - Step 46470: {'lr': 0.0001990575348128877, 'samples': 1487040, 'steps': 2904, 'loss/train': 3.0477495193481445} -09/21/2021 00:33:12 - INFO - __main__ - Step 46471: {'lr': 0.0001990575348128877, 'samples': 1487072, 'steps': 2904, 'loss/train': 1.535630226135254} -09/21/2021 00:33:13 - INFO - __main__ - Step 46472: {'lr': 0.0001990575348128877, 'samples': 1487104, 'steps': 2904, 'loss/train': 3.8664753437042236} -09/21/2021 00:33:13 - INFO - __main__ - Step 46473: {'lr': 0.0001990575348128877, 'samples': 1487136, 'steps': 2904, 'loss/train': 2.564959764480591} -09/21/2021 00:33:14 - INFO - __main__ - Step 46474: {'lr': 0.0001990575348128877, 'samples': 1487168, 'steps': 2904, 'loss/train': 1.8251734972000122} -09/21/2021 00:33:15 - INFO - __main__ - Step 46475: {'lr': 0.0001990575348128877, 'samples': 1487200, 'steps': 2904, 'loss/train': 1.8886889219284058} -09/21/2021 00:33:16 - INFO - __main__ - Step 46476: {'lr': 0.0001990575348128877, 'samples': 1487232, 'steps': 2904, 'loss/train': 2.588789939880371} -09/21/2021 00:33:16 - INFO - __main__ - Step 46477: {'lr': 0.0001990575348128877, 'samples': 1487264, 'steps': 2904, 'loss/train': 1.375630497932434} -09/21/2021 00:33:17 - INFO - __main__ - Step 46478: {'lr': 0.0001990575348128877, 'samples': 1487296, 'steps': 2904, 'loss/train': 1.470428228378296} -09/21/2021 00:33:18 - INFO - __main__ - Step 46479: {'lr': 0.0001990575348128877, 'samples': 1487328, 'steps': 2904, 'loss/train': 2.1933929920196533} -09/21/2021 00:33:19 - INFO - __main__ - Step 46480: {'lr': 0.0001990575348128877, 'samples': 1487360, 'steps': 2904, 'loss/train': 1.7227436304092407} -09/21/2021 00:33:20 - INFO - __main__ - Step 46481: {'lr': 0.00019905666090477465, 'samples': 1487392, 'steps': 2905, 'loss/train': 1.957100749015808} -09/21/2021 00:33:20 - INFO - __main__ - Step 46482: {'lr': 0.00019905666090477465, 'samples': 1487424, 'steps': 2905, 'loss/train': 2.1896145343780518} -09/21/2021 00:33:21 - INFO - __main__ - Step 46483: {'lr': 0.00019905666090477465, 'samples': 1487456, 'steps': 2905, 'loss/train': 2.2139854431152344} -09/21/2021 00:33:22 - INFO - __main__ - Step 46484: {'lr': 0.00019905666090477465, 'samples': 1487488, 'steps': 2905, 'loss/train': 1.8064956665039062} -09/21/2021 00:33:23 - INFO - __main__ - Step 46485: {'lr': 0.00019905666090477465, 'samples': 1487520, 'steps': 2905, 'loss/train': 2.1983063220977783} -09/21/2021 00:33:23 - INFO - __main__ - Step 46486: {'lr': 0.00019905666090477465, 'samples': 1487552, 'steps': 2905, 'loss/train': 1.8239208459854126} -09/21/2021 00:33:24 - INFO - __main__ - Step 46487: {'lr': 0.00019905666090477465, 'samples': 1487584, 'steps': 2905, 'loss/train': 1.509951114654541} -09/21/2021 00:33:25 - INFO - __main__ - Step 46488: {'lr': 0.00019905666090477465, 'samples': 1487616, 'steps': 2905, 'loss/train': 2.1427085399627686} -09/21/2021 00:33:26 - INFO - __main__ - Step 46489: {'lr': 0.00019905666090477465, 'samples': 1487648, 'steps': 2905, 'loss/train': 2.4936230182647705} -09/21/2021 00:33:26 - INFO - __main__ - Step 46490: {'lr': 0.00019905666090477465, 'samples': 1487680, 'steps': 2905, 'loss/train': 0.23275333642959595} -09/21/2021 00:33:27 - INFO - __main__ - Step 46491: {'lr': 0.00019905666090477465, 'samples': 1487712, 'steps': 2905, 'loss/train': 2.1006267070770264} -09/21/2021 00:33:28 - INFO - __main__ - Step 46492: {'lr': 0.00019905666090477465, 'samples': 1487744, 'steps': 2905, 'loss/train': 1.610943078994751} -09/21/2021 00:33:29 - INFO - __main__ - Step 46493: {'lr': 0.00019905666090477465, 'samples': 1487776, 'steps': 2905, 'loss/train': 2.4655749797821045} -09/21/2021 00:33:30 - INFO - __main__ - Step 46494: {'lr': 0.00019905666090477465, 'samples': 1487808, 'steps': 2905, 'loss/train': 1.7175421714782715} -09/21/2021 00:33:31 - INFO - __main__ - Step 46495: {'lr': 0.00019905666090477465, 'samples': 1487840, 'steps': 2905, 'loss/train': 1.991336703300476} -09/21/2021 00:33:31 - INFO - __main__ - Step 46496: {'lr': 0.00019905666090477465, 'samples': 1487872, 'steps': 2905, 'loss/train': 2.028578996658325} -09/21/2021 00:33:32 - INFO - __main__ - Step 46497: {'lr': 0.00019905578659360038, 'samples': 1487904, 'steps': 2906, 'loss/train': 1.8169455528259277} -09/21/2021 00:33:33 - INFO - __main__ - Step 46498: {'lr': 0.00019905578659360038, 'samples': 1487936, 'steps': 2906, 'loss/train': 1.2327884435653687} -09/21/2021 00:33:34 - INFO - __main__ - Step 46499: {'lr': 0.00019905578659360038, 'samples': 1487968, 'steps': 2906, 'loss/train': 2.561696767807007} -09/21/2021 00:33:34 - INFO - __main__ - Step 46500: {'lr': 0.00019905578659360038, 'samples': 1488000, 'steps': 2906, 'loss/train': 2.6808061599731445} -09/21/2021 00:33:35 - INFO - __main__ - Step 46501: {'lr': 0.00019905578659360038, 'samples': 1488032, 'steps': 2906, 'loss/train': 2.18434476852417} -09/21/2021 00:33:36 - INFO - __main__ - Step 46502: {'lr': 0.00019905578659360038, 'samples': 1488064, 'steps': 2906, 'loss/train': 1.9007542133331299} -09/21/2021 00:33:37 - INFO - __main__ - Step 46503: {'lr': 0.00019905578659360038, 'samples': 1488096, 'steps': 2906, 'loss/train': 2.11551570892334} -09/21/2021 00:33:37 - INFO - __main__ - Step 46504: {'lr': 0.00019905578659360038, 'samples': 1488128, 'steps': 2906, 'loss/train': 0.6226959228515625} -09/21/2021 00:33:38 - INFO - __main__ - Step 46505: {'lr': 0.00019905578659360038, 'samples': 1488160, 'steps': 2906, 'loss/train': 1.4431923627853394} -09/21/2021 00:33:39 - INFO - __main__ - Step 46506: {'lr': 0.00019905578659360038, 'samples': 1488192, 'steps': 2906, 'loss/train': 1.9235577583312988} -09/21/2021 00:33:40 - INFO - __main__ - Step 46507: {'lr': 0.00019905578659360038, 'samples': 1488224, 'steps': 2906, 'loss/train': 1.7338252067565918} -09/21/2021 00:33:40 - INFO - __main__ - Step 46508: {'lr': 0.00019905578659360038, 'samples': 1488256, 'steps': 2906, 'loss/train': 1.9543269872665405} -09/21/2021 00:33:41 - INFO - __main__ - Step 46509: {'lr': 0.00019905578659360038, 'samples': 1488288, 'steps': 2906, 'loss/train': 2.0303397178649902} -09/21/2021 00:33:42 - INFO - __main__ - Step 46510: {'lr': 0.00019905578659360038, 'samples': 1488320, 'steps': 2906, 'loss/train': 2.133892297744751} -09/21/2021 00:33:43 - INFO - __main__ - Step 46511: {'lr': 0.00019905578659360038, 'samples': 1488352, 'steps': 2906, 'loss/train': 1.8219679594039917} -09/21/2021 00:33:43 - INFO - __main__ - Step 46512: {'lr': 0.00019905578659360038, 'samples': 1488384, 'steps': 2906, 'loss/train': 2.1828718185424805} -09/21/2021 00:33:44 - INFO - __main__ - Step 46513: {'lr': 0.00019905491187936853, 'samples': 1488416, 'steps': 2907, 'loss/train': 2.0380377769470215} -09/21/2021 00:33:45 - INFO - __main__ - Step 46514: {'lr': 0.00019905491187936853, 'samples': 1488448, 'steps': 2907, 'loss/train': 2.247361660003662} -09/21/2021 00:33:46 - INFO - __main__ - Step 46515: {'lr': 0.00019905491187936853, 'samples': 1488480, 'steps': 2907, 'loss/train': 1.8427146673202515} -09/21/2021 00:33:47 - INFO - __main__ - Step 46516: {'lr': 0.00019905491187936853, 'samples': 1488512, 'steps': 2907, 'loss/train': 2.1628735065460205} -09/21/2021 00:33:47 - INFO - __main__ - Step 46517: {'lr': 0.00019905491187936853, 'samples': 1488544, 'steps': 2907, 'loss/train': 1.8115732669830322} -09/21/2021 00:33:48 - INFO - __main__ - Step 46518: {'lr': 0.00019905491187936853, 'samples': 1488576, 'steps': 2907, 'loss/train': 1.9031906127929688} -09/21/2021 00:33:49 - INFO - __main__ - Step 46519: {'lr': 0.00019905491187936853, 'samples': 1488608, 'steps': 2907, 'loss/train': 1.207897424697876} -09/21/2021 00:33:50 - INFO - __main__ - Step 46520: {'lr': 0.00019905491187936853, 'samples': 1488640, 'steps': 2907, 'loss/train': 2.1576085090637207} -09/21/2021 00:33:50 - INFO - __main__ - Step 46521: {'lr': 0.00019905491187936853, 'samples': 1488672, 'steps': 2907, 'loss/train': 1.8188387155532837} -09/21/2021 00:33:51 - INFO - __main__ - Step 46522: {'lr': 0.00019905491187936853, 'samples': 1488704, 'steps': 2907, 'loss/train': 2.2491350173950195} -09/21/2021 00:33:53 - INFO - __main__ - Step 46523: {'lr': 0.00019905491187936853, 'samples': 1488736, 'steps': 2907, 'loss/train': 2.5395781993865967} -09/21/2021 00:33:54 - INFO - __main__ - Step 46524: {'lr': 0.00019905491187936853, 'samples': 1488768, 'steps': 2907, 'loss/train': 2.339930534362793} -09/21/2021 00:33:54 - INFO - __main__ - Step 46525: {'lr': 0.00019905491187936853, 'samples': 1488800, 'steps': 2907, 'loss/train': 1.6560859680175781} -09/21/2021 00:33:55 - INFO - __main__ - Step 46526: {'lr': 0.00019905491187936853, 'samples': 1488832, 'steps': 2907, 'loss/train': 1.7178994417190552} -09/21/2021 00:33:56 - INFO - __main__ - Step 46527: {'lr': 0.00019905491187936853, 'samples': 1488864, 'steps': 2907, 'loss/train': 2.0460853576660156} -09/21/2021 00:33:57 - INFO - __main__ - Step 46528: {'lr': 0.00019905491187936853, 'samples': 1488896, 'steps': 2907, 'loss/train': 2.0936808586120605} -09/21/2021 00:33:58 - INFO - __main__ - Step 46529: {'lr': 0.0001990540367620826, 'samples': 1488928, 'steps': 2908, 'loss/train': 1.1099966764450073} -09/21/2021 00:33:58 - INFO - __main__ - Step 46530: {'lr': 0.0001990540367620826, 'samples': 1488960, 'steps': 2908, 'loss/train': 1.5190651416778564} -09/21/2021 00:33:59 - INFO - __main__ - Step 46531: {'lr': 0.0001990540367620826, 'samples': 1488992, 'steps': 2908, 'loss/train': 1.8941916227340698} -09/21/2021 00:34:00 - INFO - __main__ - Step 46532: {'lr': 0.0001990540367620826, 'samples': 1489024, 'steps': 2908, 'loss/train': 2.2692105770111084} -09/21/2021 00:34:01 - INFO - __main__ - Step 46533: {'lr': 0.0001990540367620826, 'samples': 1489056, 'steps': 2908, 'loss/train': 2.667929172515869} -09/21/2021 00:34:01 - INFO - __main__ - Step 46534: {'lr': 0.0001990540367620826, 'samples': 1489088, 'steps': 2908, 'loss/train': 2.0074851512908936} -09/21/2021 00:34:02 - INFO - __main__ - Step 46535: {'lr': 0.0001990540367620826, 'samples': 1489120, 'steps': 2908, 'loss/train': 1.9379143714904785} -09/21/2021 00:34:03 - INFO - __main__ - Step 46536: {'lr': 0.0001990540367620826, 'samples': 1489152, 'steps': 2908, 'loss/train': 2.0995733737945557} -09/21/2021 00:34:04 - INFO - __main__ - Step 46537: {'lr': 0.0001990540367620826, 'samples': 1489184, 'steps': 2908, 'loss/train': 2.121256113052368} -09/21/2021 00:34:04 - INFO - __main__ - Step 46538: {'lr': 0.0001990540367620826, 'samples': 1489216, 'steps': 2908, 'loss/train': 2.129246950149536} -09/21/2021 00:34:05 - INFO - __main__ - Step 46539: {'lr': 0.0001990540367620826, 'samples': 1489248, 'steps': 2908, 'loss/train': 1.0967249870300293} -09/21/2021 00:34:06 - INFO - __main__ - Step 46540: {'lr': 0.0001990540367620826, 'samples': 1489280, 'steps': 2908, 'loss/train': 1.837622880935669} -09/21/2021 00:34:07 - INFO - __main__ - Step 46541: {'lr': 0.0001990540367620826, 'samples': 1489312, 'steps': 2908, 'loss/train': 1.646382212638855} -09/21/2021 00:34:07 - INFO - __main__ - Step 46542: {'lr': 0.0001990540367620826, 'samples': 1489344, 'steps': 2908, 'loss/train': 2.052412271499634} -09/21/2021 00:34:08 - INFO - __main__ - Step 46543: {'lr': 0.0001990540367620826, 'samples': 1489376, 'steps': 2908, 'loss/train': 1.785012125968933} -09/21/2021 00:34:09 - INFO - __main__ - Step 46544: {'lr': 0.0001990540367620826, 'samples': 1489408, 'steps': 2908, 'loss/train': 2.244647741317749} -09/21/2021 00:34:10 - INFO - __main__ - Step 46545: {'lr': 0.0001990531612417462, 'samples': 1489440, 'steps': 2909, 'loss/train': 1.6904927492141724} -09/21/2021 00:34:10 - INFO - __main__ - Step 46546: {'lr': 0.0001990531612417462, 'samples': 1489472, 'steps': 2909, 'loss/train': 1.647207260131836} -09/21/2021 00:34:11 - INFO - __main__ - Step 46547: {'lr': 0.0001990531612417462, 'samples': 1489504, 'steps': 2909, 'loss/train': 2.143416404724121} -09/21/2021 00:34:12 - INFO - __main__ - Step 46548: {'lr': 0.0001990531612417462, 'samples': 1489536, 'steps': 2909, 'loss/train': 1.7017766237258911} -09/21/2021 00:34:13 - INFO - __main__ - Step 46549: {'lr': 0.0001990531612417462, 'samples': 1489568, 'steps': 2909, 'loss/train': 2.5499820709228516} -09/21/2021 00:34:13 - INFO - __main__ - Step 46550: {'lr': 0.0001990531612417462, 'samples': 1489600, 'steps': 2909, 'loss/train': 1.3681129217147827} -09/21/2021 00:34:14 - INFO - __main__ - Step 46551: {'lr': 0.0001990531612417462, 'samples': 1489632, 'steps': 2909, 'loss/train': 2.0733120441436768} -09/21/2021 00:34:15 - INFO - __main__ - Step 46552: {'lr': 0.0001990531612417462, 'samples': 1489664, 'steps': 2909, 'loss/train': 2.2235267162323} -09/21/2021 00:34:16 - INFO - __main__ - Step 46553: {'lr': 0.0001990531612417462, 'samples': 1489696, 'steps': 2909, 'loss/train': 1.8324986696243286} -09/21/2021 00:34:17 - INFO - __main__ - Step 46554: {'lr': 0.0001990531612417462, 'samples': 1489728, 'steps': 2909, 'loss/train': 1.7777235507965088} -09/21/2021 00:34:18 - INFO - __main__ - Step 46555: {'lr': 0.0001990531612417462, 'samples': 1489760, 'steps': 2909, 'loss/train': 2.3759119510650635} -09/21/2021 00:34:18 - INFO - __main__ - Step 46556: {'lr': 0.0001990531612417462, 'samples': 1489792, 'steps': 2909, 'loss/train': 2.5025928020477295} -09/21/2021 00:34:19 - INFO - __main__ - Step 46557: {'lr': 0.0001990531612417462, 'samples': 1489824, 'steps': 2909, 'loss/train': 1.684515357017517} -09/21/2021 00:34:20 - INFO - __main__ - Step 46558: {'lr': 0.0001990531612417462, 'samples': 1489856, 'steps': 2909, 'loss/train': 1.8894126415252686} -09/21/2021 00:34:21 - INFO - __main__ - Step 46559: {'lr': 0.0001990531612417462, 'samples': 1489888, 'steps': 2909, 'loss/train': 1.7367864847183228} -09/21/2021 00:34:21 - INFO - __main__ - Step 46560: {'lr': 0.0001990531612417462, 'samples': 1489920, 'steps': 2909, 'loss/train': 2.210571765899658} -09/21/2021 00:34:22 - INFO - __main__ - Step 46561: {'lr': 0.00019905228531836287, 'samples': 1489952, 'steps': 2910, 'loss/train': 1.0254676342010498} -09/21/2021 00:34:23 - INFO - __main__ - Step 46562: {'lr': 0.00019905228531836287, 'samples': 1489984, 'steps': 2910, 'loss/train': 2.0224385261535645} -09/21/2021 00:34:24 - INFO - __main__ - Step 46563: {'lr': 0.00019905228531836287, 'samples': 1490016, 'steps': 2910, 'loss/train': 1.492585301399231} -09/21/2021 00:34:25 - INFO - __main__ - Step 46564: {'lr': 0.00019905228531836287, 'samples': 1490048, 'steps': 2910, 'loss/train': 1.8972851037979126} -09/21/2021 00:34:25 - INFO - __main__ - Step 46565: {'lr': 0.00019905228531836287, 'samples': 1490080, 'steps': 2910, 'loss/train': 1.7846524715423584} -09/21/2021 00:34:26 - INFO - __main__ - Step 46566: {'lr': 0.00019905228531836287, 'samples': 1490112, 'steps': 2910, 'loss/train': 5.841304779052734} -09/21/2021 00:34:27 - INFO - __main__ - Step 46567: {'lr': 0.00019905228531836287, 'samples': 1490144, 'steps': 2910, 'loss/train': 1.9610236883163452} -09/21/2021 00:34:28 - INFO - __main__ - Step 46568: {'lr': 0.00019905228531836287, 'samples': 1490176, 'steps': 2910, 'loss/train': 2.568382740020752} -09/21/2021 00:34:28 - INFO - __main__ - Step 46569: {'lr': 0.00019905228531836287, 'samples': 1490208, 'steps': 2910, 'loss/train': 2.4523069858551025} -09/21/2021 00:34:29 - INFO - __main__ - Step 46570: {'lr': 0.00019905228531836287, 'samples': 1490240, 'steps': 2910, 'loss/train': 2.3856027126312256} -09/21/2021 00:34:30 - INFO - __main__ - Step 46571: {'lr': 0.00019905228531836287, 'samples': 1490272, 'steps': 2910, 'loss/train': 2.5740389823913574} -09/21/2021 00:34:31 - INFO - __main__ - Step 46572: {'lr': 0.00019905228531836287, 'samples': 1490304, 'steps': 2910, 'loss/train': 1.4594590663909912} -09/21/2021 00:34:31 - INFO - __main__ - Step 46573: {'lr': 0.00019905228531836287, 'samples': 1490336, 'steps': 2910, 'loss/train': 2.4588074684143066} -09/21/2021 00:34:32 - INFO - __main__ - Step 46574: {'lr': 0.00019905228531836287, 'samples': 1490368, 'steps': 2910, 'loss/train': 1.0213505029678345} -09/21/2021 00:34:33 - INFO - __main__ - Step 46575: {'lr': 0.00019905228531836287, 'samples': 1490400, 'steps': 2910, 'loss/train': 1.7302302122116089} -09/21/2021 00:34:34 - INFO - __main__ - Step 46576: {'lr': 0.00019905228531836287, 'samples': 1490432, 'steps': 2910, 'loss/train': 2.108368158340454} -09/21/2021 00:34:34 - INFO - __main__ - Step 46577: {'lr': 0.00019905140899193619, 'samples': 1490464, 'steps': 2911, 'loss/train': 2.3401331901550293} -09/21/2021 00:34:35 - INFO - __main__ - Step 46578: {'lr': 0.00019905140899193619, 'samples': 1490496, 'steps': 2911, 'loss/train': 1.5740965604782104} -09/21/2021 00:34:36 - INFO - __main__ - Step 46579: {'lr': 0.00019905140899193619, 'samples': 1490528, 'steps': 2911, 'loss/train': 2.1367180347442627} -09/21/2021 00:34:37 - INFO - __main__ - Step 46580: {'lr': 0.00019905140899193619, 'samples': 1490560, 'steps': 2911, 'loss/train': 2.3040435314178467} -09/21/2021 00:34:38 - INFO - __main__ - Step 46581: {'lr': 0.00019905140899193619, 'samples': 1490592, 'steps': 2911, 'loss/train': 1.0259495973587036} -09/21/2021 00:34:38 - INFO - __main__ - Step 46582: {'lr': 0.00019905140899193619, 'samples': 1490624, 'steps': 2911, 'loss/train': 2.8875465393066406} -09/21/2021 00:34:39 - INFO - __main__ - Step 46583: {'lr': 0.00019905140899193619, 'samples': 1490656, 'steps': 2911, 'loss/train': 2.2236862182617188} -09/21/2021 00:34:40 - INFO - __main__ - Step 46584: {'lr': 0.00019905140899193619, 'samples': 1490688, 'steps': 2911, 'loss/train': 0.41281434893608093} -09/21/2021 00:34:41 - INFO - __main__ - Step 46585: {'lr': 0.00019905140899193619, 'samples': 1490720, 'steps': 2911, 'loss/train': 2.4201064109802246} -09/21/2021 00:34:42 - INFO - __main__ - Step 46586: {'lr': 0.00019905140899193619, 'samples': 1490752, 'steps': 2911, 'loss/train': 1.8596595525741577} -09/21/2021 00:34:43 - INFO - __main__ - Step 46587: {'lr': 0.00019905140899193619, 'samples': 1490784, 'steps': 2911, 'loss/train': 1.2807700634002686} -09/21/2021 00:34:43 - INFO - __main__ - Step 46588: {'lr': 0.00019905140899193619, 'samples': 1490816, 'steps': 2911, 'loss/train': 1.6157574653625488} -09/21/2021 00:34:44 - INFO - __main__ - Step 46589: {'lr': 0.00019905140899193619, 'samples': 1490848, 'steps': 2911, 'loss/train': 0.18409988284111023} -09/21/2021 00:34:45 - INFO - __main__ - Step 46590: {'lr': 0.00019905140899193619, 'samples': 1490880, 'steps': 2911, 'loss/train': 2.3489866256713867} -09/21/2021 00:34:46 - INFO - __main__ - Step 46591: {'lr': 0.00019905140899193619, 'samples': 1490912, 'steps': 2911, 'loss/train': 1.6852045059204102} -09/21/2021 00:34:46 - INFO - __main__ - Step 46592: {'lr': 0.00019905140899193619, 'samples': 1490944, 'steps': 2911, 'loss/train': 3.612257719039917} -09/21/2021 00:34:47 - INFO - __main__ - Step 46593: {'lr': 0.00019905053226246968, 'samples': 1490976, 'steps': 2912, 'loss/train': 2.622605800628662} -09/21/2021 00:34:48 - INFO - __main__ - Step 46594: {'lr': 0.00019905053226246968, 'samples': 1491008, 'steps': 2912, 'loss/train': 1.6383275985717773} -09/21/2021 00:34:49 - INFO - __main__ - Step 46595: {'lr': 0.00019905053226246968, 'samples': 1491040, 'steps': 2912, 'loss/train': 1.9970569610595703} -09/21/2021 00:34:49 - INFO - __main__ - Step 46596: {'lr': 0.00019905053226246968, 'samples': 1491072, 'steps': 2912, 'loss/train': 1.4341105222702026} -09/21/2021 00:34:50 - INFO - __main__ - Step 46597: {'lr': 0.00019905053226246968, 'samples': 1491104, 'steps': 2912, 'loss/train': 0.924956738948822} -09/21/2021 00:34:51 - INFO - __main__ - Step 46598: {'lr': 0.00019905053226246968, 'samples': 1491136, 'steps': 2912, 'loss/train': 1.905301809310913} -09/21/2021 00:34:52 - INFO - __main__ - Step 46599: {'lr': 0.00019905053226246968, 'samples': 1491168, 'steps': 2912, 'loss/train': 1.8677499294281006} -09/21/2021 00:34:52 - INFO - __main__ - Step 46600: {'lr': 0.00019905053226246968, 'samples': 1491200, 'steps': 2912, 'loss/train': 2.2709057331085205} -09/21/2021 00:34:53 - INFO - __main__ - Step 46601: {'lr': 0.00019905053226246968, 'samples': 1491232, 'steps': 2912, 'loss/train': 2.0077590942382812} -09/21/2021 00:34:54 - INFO - __main__ - Step 46602: {'lr': 0.00019905053226246968, 'samples': 1491264, 'steps': 2912, 'loss/train': 1.7801696062088013} -09/21/2021 00:34:55 - INFO - __main__ - Step 46603: {'lr': 0.00019905053226246968, 'samples': 1491296, 'steps': 2912, 'loss/train': 2.5015599727630615} -09/21/2021 00:34:55 - INFO - __main__ - Step 46604: {'lr': 0.00019905053226246968, 'samples': 1491328, 'steps': 2912, 'loss/train': 2.994281053543091} -09/21/2021 00:34:56 - INFO - __main__ - Step 46605: {'lr': 0.00019905053226246968, 'samples': 1491360, 'steps': 2912, 'loss/train': 1.9807884693145752} -09/21/2021 00:34:57 - INFO - __main__ - Step 46606: {'lr': 0.00019905053226246968, 'samples': 1491392, 'steps': 2912, 'loss/train': 1.9550203084945679} -09/21/2021 00:34:58 - INFO - __main__ - Step 46607: {'lr': 0.00019905053226246968, 'samples': 1491424, 'steps': 2912, 'loss/train': 2.363243341445923} -09/21/2021 00:34:58 - INFO - __main__ - Step 46608: {'lr': 0.00019905053226246968, 'samples': 1491456, 'steps': 2912, 'loss/train': 2.169010639190674} -09/21/2021 00:34:59 - INFO - __main__ - Step 46609: {'lr': 0.00019904965512996693, 'samples': 1491488, 'steps': 2913, 'loss/train': 1.4203606843948364} -09/21/2021 00:35:00 - INFO - __main__ - Step 46610: {'lr': 0.00019904965512996693, 'samples': 1491520, 'steps': 2913, 'loss/train': 1.2470930814743042} -09/21/2021 00:35:01 - INFO - __main__ - Step 46611: {'lr': 0.00019904965512996693, 'samples': 1491552, 'steps': 2913, 'loss/train': 1.7928892374038696} -09/21/2021 00:35:02 - INFO - __main__ - Step 46612: {'lr': 0.00019904965512996693, 'samples': 1491584, 'steps': 2913, 'loss/train': 1.4467310905456543} -09/21/2021 00:35:02 - INFO - __main__ - Step 46613: {'lr': 0.00019904965512996693, 'samples': 1491616, 'steps': 2913, 'loss/train': 1.5386898517608643} -09/21/2021 00:35:03 - INFO - __main__ - Step 46614: {'lr': 0.00019904965512996693, 'samples': 1491648, 'steps': 2913, 'loss/train': 2.412181854248047} -09/21/2021 00:35:04 - INFO - __main__ - Step 46615: {'lr': 0.00019904965512996693, 'samples': 1491680, 'steps': 2913, 'loss/train': 1.443833351135254} -09/21/2021 00:35:05 - INFO - __main__ - Step 46616: {'lr': 0.00019904965512996693, 'samples': 1491712, 'steps': 2913, 'loss/train': 2.5168869495391846} -09/21/2021 00:35:06 - INFO - __main__ - Step 46617: {'lr': 0.00019904965512996693, 'samples': 1491744, 'steps': 2913, 'loss/train': 2.561588764190674} -09/21/2021 00:35:07 - INFO - __main__ - Step 46618: {'lr': 0.00019904965512996693, 'samples': 1491776, 'steps': 2913, 'loss/train': 2.5423107147216797} -09/21/2021 00:35:07 - INFO - __main__ - Step 46619: {'lr': 0.00019904965512996693, 'samples': 1491808, 'steps': 2913, 'loss/train': 1.1782528162002563} -09/21/2021 00:35:08 - INFO - __main__ - Step 46620: {'lr': 0.00019904965512996693, 'samples': 1491840, 'steps': 2913, 'loss/train': 1.472213625907898} -09/21/2021 00:35:09 - INFO - __main__ - Step 46621: {'lr': 0.00019904965512996693, 'samples': 1491872, 'steps': 2913, 'loss/train': 1.8133589029312134} -09/21/2021 00:35:10 - INFO - __main__ - Step 46622: {'lr': 0.00019904965512996693, 'samples': 1491904, 'steps': 2913, 'loss/train': 1.7567867040634155} -09/21/2021 00:35:10 - INFO - __main__ - Step 46623: {'lr': 0.00019904965512996693, 'samples': 1491936, 'steps': 2913, 'loss/train': 2.5647737979888916} -09/21/2021 00:35:11 - INFO - __main__ - Step 46624: {'lr': 0.00019904965512996693, 'samples': 1491968, 'steps': 2913, 'loss/train': 0.8795934319496155} -09/21/2021 00:35:12 - INFO - __main__ - Step 46625: {'lr': 0.00019904877759443154, 'samples': 1492000, 'steps': 2914, 'loss/train': 1.3606306314468384} -09/21/2021 00:35:13 - INFO - __main__ - Step 46626: {'lr': 0.00019904877759443154, 'samples': 1492032, 'steps': 2914, 'loss/train': 1.2061882019042969} -09/21/2021 00:35:13 - INFO - __main__ - Step 46627: {'lr': 0.00019904877759443154, 'samples': 1492064, 'steps': 2914, 'loss/train': 2.6534788608551025} -09/21/2021 00:35:14 - INFO - __main__ - Step 46628: {'lr': 0.00019904877759443154, 'samples': 1492096, 'steps': 2914, 'loss/train': 1.8490616083145142} -09/21/2021 00:35:15 - INFO - __main__ - Step 46629: {'lr': 0.00019904877759443154, 'samples': 1492128, 'steps': 2914, 'loss/train': 1.9190505743026733} -09/21/2021 00:35:16 - INFO - __main__ - Step 46630: {'lr': 0.00019904877759443154, 'samples': 1492160, 'steps': 2914, 'loss/train': 2.0462377071380615} -09/21/2021 00:35:16 - INFO - __main__ - Step 46631: {'lr': 0.00019904877759443154, 'samples': 1492192, 'steps': 2914, 'loss/train': 1.622776985168457} -09/21/2021 00:35:17 - INFO - __main__ - Step 46632: {'lr': 0.00019904877759443154, 'samples': 1492224, 'steps': 2914, 'loss/train': 1.4692504405975342} -09/21/2021 00:35:18 - INFO - __main__ - Step 46633: {'lr': 0.00019904877759443154, 'samples': 1492256, 'steps': 2914, 'loss/train': 2.2308239936828613} -09/21/2021 00:35:19 - INFO - __main__ - Step 46634: {'lr': 0.00019904877759443154, 'samples': 1492288, 'steps': 2914, 'loss/train': 0.7592671513557434} -09/21/2021 00:35:19 - INFO - __main__ - Step 46635: {'lr': 0.00019904877759443154, 'samples': 1492320, 'steps': 2914, 'loss/train': 1.431675672531128} -09/21/2021 00:35:20 - INFO - __main__ - Step 46636: {'lr': 0.00019904877759443154, 'samples': 1492352, 'steps': 2914, 'loss/train': 2.369152307510376} -09/21/2021 00:35:21 - INFO - __main__ - Step 46637: {'lr': 0.00019904877759443154, 'samples': 1492384, 'steps': 2914, 'loss/train': 0.6980656981468201} -09/21/2021 00:35:22 - INFO - __main__ - Step 46638: {'lr': 0.00019904877759443154, 'samples': 1492416, 'steps': 2914, 'loss/train': 1.2774461507797241} -09/21/2021 00:35:22 - INFO - __main__ - Step 46639: {'lr': 0.00019904877759443154, 'samples': 1492448, 'steps': 2914, 'loss/train': 2.1670174598693848} -09/21/2021 00:35:23 - INFO - __main__ - Step 46640: {'lr': 0.00019904877759443154, 'samples': 1492480, 'steps': 2914, 'loss/train': 0.6664710640907288} -09/21/2021 00:35:24 - INFO - __main__ - Step 46641: {'lr': 0.00019904789965586708, 'samples': 1492512, 'steps': 2915, 'loss/train': 1.2748662233352661} -09/21/2021 00:35:25 - INFO - __main__ - Step 46642: {'lr': 0.00019904789965586708, 'samples': 1492544, 'steps': 2915, 'loss/train': 0.17969505488872528} -09/21/2021 00:35:26 - INFO - __main__ - Step 46643: {'lr': 0.00019904789965586708, 'samples': 1492576, 'steps': 2915, 'loss/train': 0.5191158652305603} -09/21/2021 00:35:26 - INFO - __main__ - Step 46644: {'lr': 0.00019904789965586708, 'samples': 1492608, 'steps': 2915, 'loss/train': 2.305314779281616} -09/21/2021 00:35:27 - INFO - __main__ - Step 46645: {'lr': 0.00019904789965586708, 'samples': 1492640, 'steps': 2915, 'loss/train': 0.7368952035903931} -09/21/2021 00:35:28 - INFO - __main__ - Step 46646: {'lr': 0.00019904789965586708, 'samples': 1492672, 'steps': 2915, 'loss/train': 2.898477792739868} -09/21/2021 00:35:29 - INFO - __main__ - Step 46647: {'lr': 0.00019904789965586708, 'samples': 1492704, 'steps': 2915, 'loss/train': 1.4233145713806152} -09/21/2021 00:35:30 - INFO - __main__ - Step 46648: {'lr': 0.00019904789965586708, 'samples': 1492736, 'steps': 2915, 'loss/train': 2.675452947616577} -09/21/2021 00:35:31 - INFO - __main__ - Step 46649: {'lr': 0.00019904789965586708, 'samples': 1492768, 'steps': 2915, 'loss/train': 2.802180767059326} -09/21/2021 00:35:31 - INFO - __main__ - Step 46650: {'lr': 0.00019904789965586708, 'samples': 1492800, 'steps': 2915, 'loss/train': 2.574918270111084} -09/21/2021 00:35:32 - INFO - __main__ - Step 46651: {'lr': 0.00019904789965586708, 'samples': 1492832, 'steps': 2915, 'loss/train': 2.9622809886932373} -09/21/2021 00:35:33 - INFO - __main__ - Step 46652: {'lr': 0.00019904789965586708, 'samples': 1492864, 'steps': 2915, 'loss/train': 2.020366668701172} -09/21/2021 00:35:34 - INFO - __main__ - Step 46653: {'lr': 0.00019904789965586708, 'samples': 1492896, 'steps': 2915, 'loss/train': 1.8292715549468994} -09/21/2021 00:35:34 - INFO - __main__ - Step 46654: {'lr': 0.00019904789965586708, 'samples': 1492928, 'steps': 2915, 'loss/train': 2.640300989151001} -09/21/2021 00:35:35 - INFO - __main__ - Step 46655: {'lr': 0.00019904789965586708, 'samples': 1492960, 'steps': 2915, 'loss/train': 1.7923179864883423} -09/21/2021 00:35:36 - INFO - __main__ - Step 46656: {'lr': 0.00019904789965586708, 'samples': 1492992, 'steps': 2915, 'loss/train': 1.8959343433380127} -09/21/2021 00:35:37 - INFO - __main__ - Step 46657: {'lr': 0.00019904702131427708, 'samples': 1493024, 'steps': 2916, 'loss/train': 2.540726661682129} -09/21/2021 00:35:38 - INFO - __main__ - Step 46658: {'lr': 0.00019904702131427708, 'samples': 1493056, 'steps': 2916, 'loss/train': 0.5134089589118958} -09/21/2021 00:35:38 - INFO - __main__ - Step 46659: {'lr': 0.00019904702131427708, 'samples': 1493088, 'steps': 2916, 'loss/train': 2.2660574913024902} -09/21/2021 00:35:39 - INFO - __main__ - Step 46660: {'lr': 0.00019904702131427708, 'samples': 1493120, 'steps': 2916, 'loss/train': 1.6565673351287842} -09/21/2021 00:35:40 - INFO - __main__ - Step 46661: {'lr': 0.00019904702131427708, 'samples': 1493152, 'steps': 2916, 'loss/train': 0.3704785108566284} -09/21/2021 00:35:41 - INFO - __main__ - Step 46662: {'lr': 0.00019904702131427708, 'samples': 1493184, 'steps': 2916, 'loss/train': 2.542341947555542} -09/21/2021 00:35:41 - INFO - __main__ - Step 46663: {'lr': 0.00019904702131427708, 'samples': 1493216, 'steps': 2916, 'loss/train': 2.239956855773926} -09/21/2021 00:35:42 - INFO - __main__ - Step 46664: {'lr': 0.00019904702131427708, 'samples': 1493248, 'steps': 2916, 'loss/train': 2.457007646560669} -09/21/2021 00:35:43 - INFO - __main__ - Step 46665: {'lr': 0.00019904702131427708, 'samples': 1493280, 'steps': 2916, 'loss/train': 1.1007986068725586} -09/21/2021 00:35:44 - INFO - __main__ - Step 46666: {'lr': 0.00019904702131427708, 'samples': 1493312, 'steps': 2916, 'loss/train': 2.0329227447509766} -09/21/2021 00:35:44 - INFO - __main__ - Step 46667: {'lr': 0.00019904702131427708, 'samples': 1493344, 'steps': 2916, 'loss/train': 2.1730844974517822} -09/21/2021 00:35:45 - INFO - __main__ - Step 46668: {'lr': 0.00019904702131427708, 'samples': 1493376, 'steps': 2916, 'loss/train': 2.2049829959869385} -09/21/2021 00:35:46 - INFO - __main__ - Step 46669: {'lr': 0.00019904702131427708, 'samples': 1493408, 'steps': 2916, 'loss/train': 2.4923853874206543} -09/21/2021 00:35:47 - INFO - __main__ - Step 46670: {'lr': 0.00019904702131427708, 'samples': 1493440, 'steps': 2916, 'loss/train': 2.7685036659240723} -09/21/2021 00:35:47 - INFO - __main__ - Step 46671: {'lr': 0.00019904702131427708, 'samples': 1493472, 'steps': 2916, 'loss/train': 1.6374340057373047} -09/21/2021 00:35:48 - INFO - __main__ - Step 46672: {'lr': 0.00019904702131427708, 'samples': 1493504, 'steps': 2916, 'loss/train': 2.0071778297424316} -09/21/2021 00:35:49 - INFO - __main__ - Step 46673: {'lr': 0.00019904614256966512, 'samples': 1493536, 'steps': 2917, 'loss/train': 1.492138385772705} -09/21/2021 00:35:50 - INFO - __main__ - Step 46674: {'lr': 0.00019904614256966512, 'samples': 1493568, 'steps': 2917, 'loss/train': 2.179236650466919} -09/21/2021 00:35:50 - INFO - __main__ - Step 46675: {'lr': 0.00019904614256966512, 'samples': 1493600, 'steps': 2917, 'loss/train': 2.2628092765808105} -09/21/2021 00:35:51 - INFO - __main__ - Step 46676: {'lr': 0.00019904614256966512, 'samples': 1493632, 'steps': 2917, 'loss/train': 1.9108551740646362} -09/21/2021 00:35:52 - INFO - __main__ - Step 46677: {'lr': 0.00019904614256966512, 'samples': 1493664, 'steps': 2917, 'loss/train': 2.795076608657837} -09/21/2021 00:35:53 - INFO - __main__ - Step 46678: {'lr': 0.00019904614256966512, 'samples': 1493696, 'steps': 2917, 'loss/train': 1.2961527109146118} -09/21/2021 00:35:54 - INFO - __main__ - Step 46679: {'lr': 0.00019904614256966512, 'samples': 1493728, 'steps': 2917, 'loss/train': 1.3680294752120972} -09/21/2021 00:35:55 - INFO - __main__ - Step 46680: {'lr': 0.00019904614256966512, 'samples': 1493760, 'steps': 2917, 'loss/train': 1.5815467834472656} -09/21/2021 00:35:55 - INFO - __main__ - Step 46681: {'lr': 0.00019904614256966512, 'samples': 1493792, 'steps': 2917, 'loss/train': 2.4613208770751953} -09/21/2021 00:35:56 - INFO - __main__ - Step 46682: {'lr': 0.00019904614256966512, 'samples': 1493824, 'steps': 2917, 'loss/train': 1.9656494855880737} -09/21/2021 00:35:57 - INFO - __main__ - Step 46683: {'lr': 0.00019904614256966512, 'samples': 1493856, 'steps': 2917, 'loss/train': 2.0651144981384277} -09/21/2021 00:35:58 - INFO - __main__ - Step 46684: {'lr': 0.00019904614256966512, 'samples': 1493888, 'steps': 2917, 'loss/train': 1.8626056909561157} -09/21/2021 00:35:59 - INFO - __main__ - Step 46685: {'lr': 0.00019904614256966512, 'samples': 1493920, 'steps': 2917, 'loss/train': 2.121857166290283} -09/21/2021 00:35:59 - INFO - __main__ - Step 46686: {'lr': 0.00019904614256966512, 'samples': 1493952, 'steps': 2917, 'loss/train': 1.444138526916504} -09/21/2021 00:36:00 - INFO - __main__ - Step 46687: {'lr': 0.00019904614256966512, 'samples': 1493984, 'steps': 2917, 'loss/train': 2.486241102218628} -09/21/2021 00:36:01 - INFO - __main__ - Step 46688: {'lr': 0.00019904614256966512, 'samples': 1494016, 'steps': 2917, 'loss/train': 2.4554672241210938} -09/21/2021 00:36:02 - INFO - __main__ - Step 46689: {'lr': 0.00019904526342203483, 'samples': 1494048, 'steps': 2918, 'loss/train': 2.4408650398254395} -09/21/2021 00:36:02 - INFO - __main__ - Step 46690: {'lr': 0.00019904526342203483, 'samples': 1494080, 'steps': 2918, 'loss/train': 1.1899445056915283} -09/21/2021 00:36:03 - INFO - __main__ - Step 46691: {'lr': 0.00019904526342203483, 'samples': 1494112, 'steps': 2918, 'loss/train': 2.158426284790039} -09/21/2021 00:36:04 - INFO - __main__ - Step 46692: {'lr': 0.00019904526342203483, 'samples': 1494144, 'steps': 2918, 'loss/train': 2.7792744636535645} -09/21/2021 00:36:05 - INFO - __main__ - Step 46693: {'lr': 0.00019904526342203483, 'samples': 1494176, 'steps': 2918, 'loss/train': 2.5833611488342285} -09/21/2021 00:36:05 - INFO - __main__ - Step 46694: {'lr': 0.00019904526342203483, 'samples': 1494208, 'steps': 2918, 'loss/train': 2.4439611434936523} -09/21/2021 00:36:06 - INFO - __main__ - Step 46695: {'lr': 0.00019904526342203483, 'samples': 1494240, 'steps': 2918, 'loss/train': 0.7967913746833801} -09/21/2021 00:36:07 - INFO - __main__ - Step 46696: {'lr': 0.00019904526342203483, 'samples': 1494272, 'steps': 2918, 'loss/train': 1.946921467781067} -09/21/2021 00:36:08 - INFO - __main__ - Step 46697: {'lr': 0.00019904526342203483, 'samples': 1494304, 'steps': 2918, 'loss/train': 2.122776508331299} -09/21/2021 00:36:08 - INFO - __main__ - Step 46698: {'lr': 0.00019904526342203483, 'samples': 1494336, 'steps': 2918, 'loss/train': 1.6308969259262085} -09/21/2021 00:36:09 - INFO - __main__ - Step 46699: {'lr': 0.00019904526342203483, 'samples': 1494368, 'steps': 2918, 'loss/train': 2.5972745418548584} -09/21/2021 00:36:10 - INFO - __main__ - Step 46700: {'lr': 0.00019904526342203483, 'samples': 1494400, 'steps': 2918, 'loss/train': 1.1412826776504517} -09/21/2021 00:36:11 - INFO - __main__ - Step 46701: {'lr': 0.00019904526342203483, 'samples': 1494432, 'steps': 2918, 'loss/train': 0.20289668440818787} -09/21/2021 00:36:11 - INFO - __main__ - Step 46702: {'lr': 0.00019904526342203483, 'samples': 1494464, 'steps': 2918, 'loss/train': 0.09929156303405762} -09/21/2021 00:36:12 - INFO - __main__ - Step 46703: {'lr': 0.00019904526342203483, 'samples': 1494496, 'steps': 2918, 'loss/train': 0.16575179994106293} -09/21/2021 00:36:13 - INFO - __main__ - Step 46704: {'lr': 0.00019904526342203483, 'samples': 1494528, 'steps': 2918, 'loss/train': 2.650257110595703} -09/21/2021 00:36:14 - INFO - __main__ - Step 46705: {'lr': 0.0001990443838713897, 'samples': 1494560, 'steps': 2919, 'loss/train': 1.0376098155975342} -09/21/2021 00:36:15 - INFO - __main__ - Step 46706: {'lr': 0.0001990443838713897, 'samples': 1494592, 'steps': 2919, 'loss/train': 3.723788022994995} -09/21/2021 00:36:16 - INFO - __main__ - Step 46707: {'lr': 0.0001990443838713897, 'samples': 1494624, 'steps': 2919, 'loss/train': 3.0315840244293213} -09/21/2021 00:36:17 - INFO - __main__ - Step 46708: {'lr': 0.0001990443838713897, 'samples': 1494656, 'steps': 2919, 'loss/train': 1.7035564184188843} -09/21/2021 00:36:17 - INFO - __main__ - Step 46709: {'lr': 0.0001990443838713897, 'samples': 1494688, 'steps': 2919, 'loss/train': 1.417661190032959} -09/21/2021 00:36:18 - INFO - __main__ - Step 46710: {'lr': 0.0001990443838713897, 'samples': 1494720, 'steps': 2919, 'loss/train': 1.736388921737671} -09/21/2021 00:36:19 - INFO - __main__ - Step 46711: {'lr': 0.0001990443838713897, 'samples': 1494752, 'steps': 2919, 'loss/train': 6.915346622467041} -09/21/2021 00:36:20 - INFO - __main__ - Step 46712: {'lr': 0.0001990443838713897, 'samples': 1494784, 'steps': 2919, 'loss/train': 6.8104777336120605} -09/21/2021 00:36:20 - INFO - __main__ - Step 46713: {'lr': 0.0001990443838713897, 'samples': 1494816, 'steps': 2919, 'loss/train': 6.82589864730835} -09/21/2021 00:36:21 - INFO - __main__ - Step 46714: {'lr': 0.0001990443838713897, 'samples': 1494848, 'steps': 2919, 'loss/train': 6.940062522888184} -09/21/2021 00:36:22 - INFO - __main__ - Step 46715: {'lr': 0.0001990443838713897, 'samples': 1494880, 'steps': 2919, 'loss/train': 2.249760389328003} -09/21/2021 00:36:23 - INFO - __main__ - Step 46716: {'lr': 0.0001990443838713897, 'samples': 1494912, 'steps': 2919, 'loss/train': 1.8160526752471924} -09/21/2021 00:36:23 - INFO - __main__ - Step 46717: {'lr': 0.0001990443838713897, 'samples': 1494944, 'steps': 2919, 'loss/train': 1.7466182708740234} -09/21/2021 00:36:24 - INFO - __main__ - Step 46718: {'lr': 0.0001990443838713897, 'samples': 1494976, 'steps': 2919, 'loss/train': 2.0736887454986572} -09/21/2021 00:36:25 - INFO - __main__ - Step 46719: {'lr': 0.0001990443838713897, 'samples': 1495008, 'steps': 2919, 'loss/train': 2.0932071208953857} -09/21/2021 00:36:26 - INFO - __main__ - Step 46720: {'lr': 0.0001990443838713897, 'samples': 1495040, 'steps': 2919, 'loss/train': 1.3599467277526855} -09/21/2021 00:36:27 - INFO - __main__ - Step 46721: {'lr': 0.0001990435039177334, 'samples': 1495072, 'steps': 2920, 'loss/train': 1.9083784818649292} -09/21/2021 00:36:27 - INFO - __main__ - Step 46722: {'lr': 0.0001990435039177334, 'samples': 1495104, 'steps': 2920, 'loss/train': 2.7893214225769043} -09/21/2021 00:36:28 - INFO - __main__ - Step 46723: {'lr': 0.0001990435039177334, 'samples': 1495136, 'steps': 2920, 'loss/train': 1.9164360761642456} -09/21/2021 00:36:29 - INFO - __main__ - Step 46724: {'lr': 0.0001990435039177334, 'samples': 1495168, 'steps': 2920, 'loss/train': 1.6792303323745728} -09/21/2021 00:36:30 - INFO - __main__ - Step 46725: {'lr': 0.0001990435039177334, 'samples': 1495200, 'steps': 2920, 'loss/train': 2.8336517810821533} -09/21/2021 00:36:30 - INFO - __main__ - Step 46726: {'lr': 0.0001990435039177334, 'samples': 1495232, 'steps': 2920, 'loss/train': 1.6040623188018799} -09/21/2021 00:36:31 - INFO - __main__ - Step 46727: {'lr': 0.0001990435039177334, 'samples': 1495264, 'steps': 2920, 'loss/train': 3.3949058055877686} -09/21/2021 00:36:32 - INFO - __main__ - Step 46728: {'lr': 0.0001990435039177334, 'samples': 1495296, 'steps': 2920, 'loss/train': 2.503030300140381} -09/21/2021 00:36:33 - INFO - __main__ - Step 46729: {'lr': 0.0001990435039177334, 'samples': 1495328, 'steps': 2920, 'loss/train': 2.0801992416381836} -09/21/2021 00:36:33 - INFO - __main__ - Step 46730: {'lr': 0.0001990435039177334, 'samples': 1495360, 'steps': 2920, 'loss/train': 2.0832605361938477} -09/21/2021 00:36:34 - INFO - __main__ - Step 46731: {'lr': 0.0001990435039177334, 'samples': 1495392, 'steps': 2920, 'loss/train': 1.4093042612075806} -09/21/2021 00:36:35 - INFO - __main__ - Step 46732: {'lr': 0.0001990435039177334, 'samples': 1495424, 'steps': 2920, 'loss/train': 2.4793343544006348} -09/21/2021 00:36:36 - INFO - __main__ - Step 46733: {'lr': 0.0001990435039177334, 'samples': 1495456, 'steps': 2920, 'loss/train': 2.0984134674072266} -09/21/2021 00:36:36 - INFO - __main__ - Step 46734: {'lr': 0.0001990435039177334, 'samples': 1495488, 'steps': 2920, 'loss/train': 1.8697683811187744} -09/21/2021 00:36:37 - INFO - __main__ - Step 46735: {'lr': 0.0001990435039177334, 'samples': 1495520, 'steps': 2920, 'loss/train': 2.453402519226074} -09/21/2021 00:36:38 - INFO - __main__ - Step 46736: {'lr': 0.0001990435039177334, 'samples': 1495552, 'steps': 2920, 'loss/train': 2.5686230659484863} -09/21/2021 00:36:39 - INFO - __main__ - Step 46737: {'lr': 0.00019904262356106945, 'samples': 1495584, 'steps': 2921, 'loss/train': 1.7583881616592407} -09/21/2021 00:36:39 - INFO - __main__ - Step 46738: {'lr': 0.00019904262356106945, 'samples': 1495616, 'steps': 2921, 'loss/train': 1.7759445905685425} -09/21/2021 00:36:40 - INFO - __main__ - Step 46739: {'lr': 0.00019904262356106945, 'samples': 1495648, 'steps': 2921, 'loss/train': 2.0355324745178223} -09/21/2021 00:36:41 - INFO - __main__ - Step 46740: {'lr': 0.00019904262356106945, 'samples': 1495680, 'steps': 2921, 'loss/train': 1.8680905103683472} -09/21/2021 00:36:42 - INFO - __main__ - Step 46741: {'lr': 0.00019904262356106945, 'samples': 1495712, 'steps': 2921, 'loss/train': 1.7914299964904785} -09/21/2021 00:36:43 - INFO - __main__ - Step 46742: {'lr': 0.00019904262356106945, 'samples': 1495744, 'steps': 2921, 'loss/train': 2.546621799468994} -09/21/2021 00:36:44 - INFO - __main__ - Step 46743: {'lr': 0.00019904262356106945, 'samples': 1495776, 'steps': 2921, 'loss/train': 1.5734164714813232} -09/21/2021 00:36:44 - INFO - __main__ - Step 46744: {'lr': 0.00019904262356106945, 'samples': 1495808, 'steps': 2921, 'loss/train': 3.2262723445892334} -09/21/2021 00:36:45 - INFO - __main__ - Step 46745: {'lr': 0.00019904262356106945, 'samples': 1495840, 'steps': 2921, 'loss/train': 2.0401113033294678} -09/21/2021 00:36:46 - INFO - __main__ - Step 46746: {'lr': 0.00019904262356106945, 'samples': 1495872, 'steps': 2921, 'loss/train': 2.991109848022461} -09/21/2021 00:36:47 - INFO - __main__ - Step 46747: {'lr': 0.00019904262356106945, 'samples': 1495904, 'steps': 2921, 'loss/train': 1.6208537817001343} -09/21/2021 00:36:47 - INFO - __main__ - Step 46748: {'lr': 0.00019904262356106945, 'samples': 1495936, 'steps': 2921, 'loss/train': 1.3981716632843018} -09/21/2021 00:36:48 - INFO - __main__ - Step 46749: {'lr': 0.00019904262356106945, 'samples': 1495968, 'steps': 2921, 'loss/train': 2.3125505447387695} -09/21/2021 00:36:49 - INFO - __main__ - Step 46750: {'lr': 0.00019904262356106945, 'samples': 1496000, 'steps': 2921, 'loss/train': 1.5058847665786743} -09/21/2021 00:36:50 - INFO - __main__ - Step 46751: {'lr': 0.00019904262356106945, 'samples': 1496032, 'steps': 2921, 'loss/train': 2.3509979248046875} -09/21/2021 00:36:50 - INFO - __main__ - Step 46752: {'lr': 0.00019904262356106945, 'samples': 1496064, 'steps': 2921, 'loss/train': 2.207033395767212} -09/21/2021 00:36:51 - INFO - __main__ - Step 46753: {'lr': 0.00019904174280140142, 'samples': 1496096, 'steps': 2922, 'loss/train': 2.0799055099487305} -09/21/2021 00:36:52 - INFO - __main__ - Step 46754: {'lr': 0.00019904174280140142, 'samples': 1496128, 'steps': 2922, 'loss/train': 2.4075400829315186} -09/21/2021 00:36:53 - INFO - __main__ - Step 46755: {'lr': 0.00019904174280140142, 'samples': 1496160, 'steps': 2922, 'loss/train': 1.8247829675674438} -09/21/2021 00:36:54 - INFO - __main__ - Step 46756: {'lr': 0.00019904174280140142, 'samples': 1496192, 'steps': 2922, 'loss/train': 2.310854196548462} -09/21/2021 00:36:54 - INFO - __main__ - Step 46757: {'lr': 0.00019904174280140142, 'samples': 1496224, 'steps': 2922, 'loss/train': 1.2189878225326538} -09/21/2021 00:36:55 - INFO - __main__ - Step 46758: {'lr': 0.00019904174280140142, 'samples': 1496256, 'steps': 2922, 'loss/train': 1.5987375974655151} -09/21/2021 00:36:56 - INFO - __main__ - Step 46759: {'lr': 0.00019904174280140142, 'samples': 1496288, 'steps': 2922, 'loss/train': 1.263134241104126} -09/21/2021 00:36:57 - INFO - __main__ - Step 46760: {'lr': 0.00019904174280140142, 'samples': 1496320, 'steps': 2922, 'loss/train': 1.318840742111206} -09/21/2021 00:36:57 - INFO - __main__ - Step 46761: {'lr': 0.00019904174280140142, 'samples': 1496352, 'steps': 2922, 'loss/train': 2.760080099105835} -09/21/2021 00:36:58 - INFO - __main__ - Step 46762: {'lr': 0.00019904174280140142, 'samples': 1496384, 'steps': 2922, 'loss/train': 1.1360013484954834} -09/21/2021 00:36:59 - INFO - __main__ - Step 46763: {'lr': 0.00019904174280140142, 'samples': 1496416, 'steps': 2922, 'loss/train': 1.9569876194000244} -09/21/2021 00:37:00 - INFO - __main__ - Step 46764: {'lr': 0.00019904174280140142, 'samples': 1496448, 'steps': 2922, 'loss/train': 2.110231637954712} -09/21/2021 00:37:00 - INFO - __main__ - Step 46765: {'lr': 0.00019904174280140142, 'samples': 1496480, 'steps': 2922, 'loss/train': 2.176718235015869} -09/21/2021 00:37:01 - INFO - __main__ - Step 46766: {'lr': 0.00019904174280140142, 'samples': 1496512, 'steps': 2922, 'loss/train': 1.9948139190673828} -09/21/2021 00:37:02 - INFO - __main__ - Step 46767: {'lr': 0.00019904174280140142, 'samples': 1496544, 'steps': 2922, 'loss/train': 4.717682361602783} -09/21/2021 00:37:03 - INFO - __main__ - Step 46768: {'lr': 0.00019904174280140142, 'samples': 1496576, 'steps': 2922, 'loss/train': 1.968562364578247} -09/21/2021 00:37:04 - INFO - __main__ - Step 46769: {'lr': 0.00019904086163873296, 'samples': 1496608, 'steps': 2923, 'loss/train': 1.981000542640686} -09/21/2021 00:37:04 - INFO - __main__ - Step 46770: {'lr': 0.00019904086163873296, 'samples': 1496640, 'steps': 2923, 'loss/train': 2.21187686920166} -09/21/2021 00:37:05 - INFO - __main__ - Step 46771: {'lr': 0.00019904086163873296, 'samples': 1496672, 'steps': 2923, 'loss/train': 2.0808780193328857} -09/21/2021 00:37:06 - INFO - __main__ - Step 46772: {'lr': 0.00019904086163873296, 'samples': 1496704, 'steps': 2923, 'loss/train': 1.3876579999923706} -09/21/2021 00:37:07 - INFO - __main__ - Step 46773: {'lr': 0.00019904086163873296, 'samples': 1496736, 'steps': 2923, 'loss/train': 2.175147294998169} -09/21/2021 00:37:08 - INFO - __main__ - Step 46774: {'lr': 0.00019904086163873296, 'samples': 1496768, 'steps': 2923, 'loss/train': 2.6614487171173096} -09/21/2021 00:37:08 - INFO - __main__ - Step 46775: {'lr': 0.00019904086163873296, 'samples': 1496800, 'steps': 2923, 'loss/train': 2.2801434993743896} -09/21/2021 00:37:09 - INFO - __main__ - Step 46776: {'lr': 0.00019904086163873296, 'samples': 1496832, 'steps': 2923, 'loss/train': 1.5441540479660034} -09/21/2021 00:37:10 - INFO - __main__ - Step 46777: {'lr': 0.00019904086163873296, 'samples': 1496864, 'steps': 2923, 'loss/train': 2.6131277084350586} -09/21/2021 00:37:11 - INFO - __main__ - Step 46778: {'lr': 0.00019904086163873296, 'samples': 1496896, 'steps': 2923, 'loss/train': 2.161073684692383} -09/21/2021 00:37:11 - INFO - __main__ - Step 46779: {'lr': 0.00019904086163873296, 'samples': 1496928, 'steps': 2923, 'loss/train': 2.369255781173706} -09/21/2021 00:37:12 - INFO - __main__ - Step 46780: {'lr': 0.00019904086163873296, 'samples': 1496960, 'steps': 2923, 'loss/train': 2.4785659313201904} -09/21/2021 00:37:13 - INFO - __main__ - Step 46781: {'lr': 0.00019904086163873296, 'samples': 1496992, 'steps': 2923, 'loss/train': 2.285317897796631} -09/21/2021 00:37:14 - INFO - __main__ - Step 46782: {'lr': 0.00019904086163873296, 'samples': 1497024, 'steps': 2923, 'loss/train': 1.7622313499450684} -09/21/2021 00:37:14 - INFO - __main__ - Step 46783: {'lr': 0.00019904086163873296, 'samples': 1497056, 'steps': 2923, 'loss/train': 2.2716176509857178} -09/21/2021 00:37:15 - INFO - __main__ - Step 46784: {'lr': 0.00019904086163873296, 'samples': 1497088, 'steps': 2923, 'loss/train': 1.8215663433074951} -09/21/2021 00:37:16 - INFO - __main__ - Step 46785: {'lr': 0.0001990399800730676, 'samples': 1497120, 'steps': 2924, 'loss/train': 2.1778390407562256} -09/21/2021 00:37:17 - INFO - __main__ - Step 46786: {'lr': 0.0001990399800730676, 'samples': 1497152, 'steps': 2924, 'loss/train': 2.2514944076538086} -09/21/2021 00:37:18 - INFO - __main__ - Step 46787: {'lr': 0.0001990399800730676, 'samples': 1497184, 'steps': 2924, 'loss/train': 1.3520445823669434} -09/21/2021 00:37:18 - INFO - __main__ - Step 46788: {'lr': 0.0001990399800730676, 'samples': 1497216, 'steps': 2924, 'loss/train': 1.8334659337997437} -09/21/2021 00:37:19 - INFO - __main__ - Step 46789: {'lr': 0.0001990399800730676, 'samples': 1497248, 'steps': 2924, 'loss/train': 2.1955811977386475} -09/21/2021 00:37:20 - INFO - __main__ - Step 46790: {'lr': 0.0001990399800730676, 'samples': 1497280, 'steps': 2924, 'loss/train': 2.564107894897461} -09/21/2021 00:37:21 - INFO - __main__ - Step 46791: {'lr': 0.0001990399800730676, 'samples': 1497312, 'steps': 2924, 'loss/train': 2.494685173034668} -09/21/2021 00:37:21 - INFO - __main__ - Step 46792: {'lr': 0.0001990399800730676, 'samples': 1497344, 'steps': 2924, 'loss/train': 2.301537036895752} -09/21/2021 00:37:22 - INFO - __main__ - Step 46793: {'lr': 0.0001990399800730676, 'samples': 1497376, 'steps': 2924, 'loss/train': 0.1406632661819458} -09/21/2021 00:37:23 - INFO - __main__ - Step 46794: {'lr': 0.0001990399800730676, 'samples': 1497408, 'steps': 2924, 'loss/train': 2.196932792663574} -09/21/2021 00:37:24 - INFO - __main__ - Step 46795: {'lr': 0.0001990399800730676, 'samples': 1497440, 'steps': 2924, 'loss/train': 2.1251232624053955} -09/21/2021 00:37:24 - INFO - __main__ - Step 46796: {'lr': 0.0001990399800730676, 'samples': 1497472, 'steps': 2924, 'loss/train': 2.03252911567688} -09/21/2021 00:37:25 - INFO - __main__ - Step 46797: {'lr': 0.0001990399800730676, 'samples': 1497504, 'steps': 2924, 'loss/train': 1.6891350746154785} -09/21/2021 00:37:26 - INFO - __main__ - Step 46798: {'lr': 0.0001990399800730676, 'samples': 1497536, 'steps': 2924, 'loss/train': 1.942673683166504} -09/21/2021 00:37:27 - INFO - __main__ - Step 46799: {'lr': 0.0001990399800730676, 'samples': 1497568, 'steps': 2924, 'loss/train': 2.0613958835601807} -09/21/2021 00:37:27 - INFO - __main__ - Step 46800: {'lr': 0.0001990399800730676, 'samples': 1497600, 'steps': 2924, 'loss/train': 2.183068037033081} -09/21/2021 00:37:28 - INFO - __main__ - Step 46801: {'lr': 0.00019903909810440896, 'samples': 1497632, 'steps': 2925, 'loss/train': 1.335626482963562} -09/21/2021 00:37:30 - INFO - __main__ - Step 46802: {'lr': 0.00019903909810440896, 'samples': 1497664, 'steps': 2925, 'loss/train': 1.3903446197509766} -09/21/2021 00:37:30 - INFO - __main__ - Step 46803: {'lr': 0.00019903909810440896, 'samples': 1497696, 'steps': 2925, 'loss/train': 1.4824540615081787} -09/21/2021 00:37:31 - INFO - __main__ - Step 46804: {'lr': 0.00019903909810440896, 'samples': 1497728, 'steps': 2925, 'loss/train': 1.6988121271133423} -09/21/2021 00:37:32 - INFO - __main__ - Step 46805: {'lr': 0.00019903909810440896, 'samples': 1497760, 'steps': 2925, 'loss/train': 2.3290176391601562} -09/21/2021 00:37:33 - INFO - __main__ - Step 46806: {'lr': 0.00019903909810440896, 'samples': 1497792, 'steps': 2925, 'loss/train': 2.439647674560547} -09/21/2021 00:37:33 - INFO - __main__ - Step 46807: {'lr': 0.00019903909810440896, 'samples': 1497824, 'steps': 2925, 'loss/train': 3.3077616691589355} -09/21/2021 00:37:34 - INFO - __main__ - Step 46808: {'lr': 0.00019903909810440896, 'samples': 1497856, 'steps': 2925, 'loss/train': 1.9460023641586304} -09/21/2021 00:37:35 - INFO - __main__ - Step 46809: {'lr': 0.00019903909810440896, 'samples': 1497888, 'steps': 2925, 'loss/train': 1.074416995048523} -09/21/2021 00:37:36 - INFO - __main__ - Step 46810: {'lr': 0.00019903909810440896, 'samples': 1497920, 'steps': 2925, 'loss/train': 1.53316330909729} -09/21/2021 00:37:36 - INFO - __main__ - Step 46811: {'lr': 0.00019903909810440896, 'samples': 1497952, 'steps': 2925, 'loss/train': 0.8201570510864258} -09/21/2021 00:37:37 - INFO - __main__ - Step 46812: {'lr': 0.00019903909810440896, 'samples': 1497984, 'steps': 2925, 'loss/train': 3.1712286472320557} -09/21/2021 00:37:38 - INFO - __main__ - Step 46813: {'lr': 0.00019903909810440896, 'samples': 1498016, 'steps': 2925, 'loss/train': 2.9448776245117188} -09/21/2021 00:37:39 - INFO - __main__ - Step 46814: {'lr': 0.00019903909810440896, 'samples': 1498048, 'steps': 2925, 'loss/train': 1.620971918106079} -09/21/2021 00:37:39 - INFO - __main__ - Step 46815: {'lr': 0.00019903909810440896, 'samples': 1498080, 'steps': 2925, 'loss/train': 2.1618549823760986} -09/21/2021 00:37:40 - INFO - __main__ - Step 46816: {'lr': 0.00019903909810440896, 'samples': 1498112, 'steps': 2925, 'loss/train': 1.9594465494155884} -09/21/2021 00:37:41 - INFO - __main__ - Step 46817: {'lr': 0.0001990382157327606, 'samples': 1498144, 'steps': 2926, 'loss/train': 2.4552083015441895} -09/21/2021 00:37:42 - INFO - __main__ - Step 46818: {'lr': 0.0001990382157327606, 'samples': 1498176, 'steps': 2926, 'loss/train': 2.411716938018799} -09/21/2021 00:37:42 - INFO - __main__ - Step 46819: {'lr': 0.0001990382157327606, 'samples': 1498208, 'steps': 2926, 'loss/train': 2.2699544429779053} -09/21/2021 00:37:43 - INFO - __main__ - Step 46820: {'lr': 0.0001990382157327606, 'samples': 1498240, 'steps': 2926, 'loss/train': 2.329465389251709} -09/21/2021 00:37:44 - INFO - __main__ - Step 46821: {'lr': 0.0001990382157327606, 'samples': 1498272, 'steps': 2926, 'loss/train': 1.7220971584320068} -09/21/2021 00:37:45 - INFO - __main__ - Step 46822: {'lr': 0.0001990382157327606, 'samples': 1498304, 'steps': 2926, 'loss/train': 2.1761505603790283} -09/21/2021 00:37:45 - INFO - __main__ - Step 46823: {'lr': 0.0001990382157327606, 'samples': 1498336, 'steps': 2926, 'loss/train': 1.1157315969467163} -09/21/2021 00:37:46 - INFO - __main__ - Step 46824: {'lr': 0.0001990382157327606, 'samples': 1498368, 'steps': 2926, 'loss/train': 2.26737904548645} -09/21/2021 00:37:47 - INFO - __main__ - Step 46825: {'lr': 0.0001990382157327606, 'samples': 1498400, 'steps': 2926, 'loss/train': 1.7375677824020386} -09/21/2021 00:37:48 - INFO - __main__ - Step 46826: {'lr': 0.0001990382157327606, 'samples': 1498432, 'steps': 2926, 'loss/train': 0.41159647703170776} -09/21/2021 00:37:48 - INFO - __main__ - Step 46827: {'lr': 0.0001990382157327606, 'samples': 1498464, 'steps': 2926, 'loss/train': 2.6803953647613525} -09/21/2021 00:37:49 - INFO - __main__ - Step 46828: {'lr': 0.0001990382157327606, 'samples': 1498496, 'steps': 2926, 'loss/train': 2.169806718826294} -09/21/2021 00:37:50 - INFO - __main__ - Step 46829: {'lr': 0.0001990382157327606, 'samples': 1498528, 'steps': 2926, 'loss/train': 2.089235782623291} -09/21/2021 00:37:51 - INFO - __main__ - Step 46830: {'lr': 0.0001990382157327606, 'samples': 1498560, 'steps': 2926, 'loss/train': 2.8117475509643555} -09/21/2021 00:37:51 - INFO - __main__ - Step 46831: {'lr': 0.0001990382157327606, 'samples': 1498592, 'steps': 2926, 'loss/train': 2.0888679027557373} -09/21/2021 00:37:52 - INFO - __main__ - Step 46832: {'lr': 0.0001990382157327606, 'samples': 1498624, 'steps': 2926, 'loss/train': 1.9993492364883423} -09/21/2021 00:37:54 - INFO - __main__ - Step 46833: {'lr': 0.00019903733295812613, 'samples': 1498656, 'steps': 2927, 'loss/train': 2.3666608333587646} -09/21/2021 00:37:55 - INFO - __main__ - Step 46834: {'lr': 0.00019903733295812613, 'samples': 1498688, 'steps': 2927, 'loss/train': 1.954699158668518} -09/21/2021 00:37:56 - INFO - __main__ - Step 46835: {'lr': 0.00019903733295812613, 'samples': 1498720, 'steps': 2927, 'loss/train': 1.635940432548523} -09/21/2021 00:37:56 - INFO - __main__ - Step 46836: {'lr': 0.00019903733295812613, 'samples': 1498752, 'steps': 2927, 'loss/train': 1.6744340658187866} -09/21/2021 00:37:57 - INFO - __main__ - Step 46837: {'lr': 0.00019903733295812613, 'samples': 1498784, 'steps': 2927, 'loss/train': 1.7644237279891968} -09/21/2021 00:37:58 - INFO - __main__ - Step 46838: {'lr': 0.00019903733295812613, 'samples': 1498816, 'steps': 2927, 'loss/train': 1.0928651094436646} -09/21/2021 00:37:59 - INFO - __main__ - Step 46839: {'lr': 0.00019903733295812613, 'samples': 1498848, 'steps': 2927, 'loss/train': 2.672633171081543} -09/21/2021 00:37:59 - INFO - __main__ - Step 46840: {'lr': 0.00019903733295812613, 'samples': 1498880, 'steps': 2927, 'loss/train': 2.80694317817688} -09/21/2021 00:38:00 - INFO - __main__ - Step 46841: {'lr': 0.00019903733295812613, 'samples': 1498912, 'steps': 2927, 'loss/train': 1.9552139043807983} -09/21/2021 00:38:01 - INFO - __main__ - Step 46842: {'lr': 0.00019903733295812613, 'samples': 1498944, 'steps': 2927, 'loss/train': 2.248516082763672} -09/21/2021 00:38:02 - INFO - __main__ - Step 46843: {'lr': 0.00019903733295812613, 'samples': 1498976, 'steps': 2927, 'loss/train': 2.4197866916656494} -09/21/2021 00:38:02 - INFO - __main__ - Step 46844: {'lr': 0.00019903733295812613, 'samples': 1499008, 'steps': 2927, 'loss/train': 1.7531558275222778} -09/21/2021 00:38:03 - INFO - __main__ - Step 46845: {'lr': 0.00019903733295812613, 'samples': 1499040, 'steps': 2927, 'loss/train': 0.5876085758209229} -09/21/2021 00:38:04 - INFO - __main__ - Step 46846: {'lr': 0.00019903733295812613, 'samples': 1499072, 'steps': 2927, 'loss/train': 2.3228976726531982} -09/21/2021 00:38:05 - INFO - __main__ - Step 46847: {'lr': 0.00019903733295812613, 'samples': 1499104, 'steps': 2927, 'loss/train': 1.7638335227966309} -09/21/2021 00:38:05 - INFO - __main__ - Step 46848: {'lr': 0.00019903733295812613, 'samples': 1499136, 'steps': 2927, 'loss/train': 2.2116363048553467} -09/21/2021 00:38:06 - INFO - __main__ - Step 46849: {'lr': 0.00019903644978050913, 'samples': 1499168, 'steps': 2928, 'loss/train': 1.4709062576293945} -09/21/2021 00:38:07 - INFO - __main__ - Step 46850: {'lr': 0.00019903644978050913, 'samples': 1499200, 'steps': 2928, 'loss/train': 2.2282516956329346} -09/21/2021 00:38:08 - INFO - __main__ - Step 46851: {'lr': 0.00019903644978050913, 'samples': 1499232, 'steps': 2928, 'loss/train': 2.0197508335113525} -09/21/2021 00:38:09 - INFO - __main__ - Step 46852: {'lr': 0.00019903644978050913, 'samples': 1499264, 'steps': 2928, 'loss/train': 1.5700368881225586} -09/21/2021 00:38:09 - INFO - __main__ - Step 46853: {'lr': 0.00019903644978050913, 'samples': 1499296, 'steps': 2928, 'loss/train': 1.6158632040023804} -09/21/2021 00:38:10 - INFO - __main__ - Step 46854: {'lr': 0.00019903644978050913, 'samples': 1499328, 'steps': 2928, 'loss/train': 1.5926796197891235} -09/21/2021 00:38:11 - INFO - __main__ - Step 46855: {'lr': 0.00019903644978050913, 'samples': 1499360, 'steps': 2928, 'loss/train': 1.9709917306900024} -09/21/2021 00:38:12 - INFO - __main__ - Step 46856: {'lr': 0.00019903644978050913, 'samples': 1499392, 'steps': 2928, 'loss/train': 2.127140760421753} -09/21/2021 00:38:12 - INFO - __main__ - Step 46857: {'lr': 0.00019903644978050913, 'samples': 1499424, 'steps': 2928, 'loss/train': 1.8343449831008911} -09/21/2021 00:38:13 - INFO - __main__ - Step 46858: {'lr': 0.00019903644978050913, 'samples': 1499456, 'steps': 2928, 'loss/train': 1.3063936233520508} -09/21/2021 00:38:14 - INFO - __main__ - Step 46859: {'lr': 0.00019903644978050913, 'samples': 1499488, 'steps': 2928, 'loss/train': 1.8207180500030518} -09/21/2021 00:38:15 - INFO - __main__ - Step 46860: {'lr': 0.00019903644978050913, 'samples': 1499520, 'steps': 2928, 'loss/train': 2.652658224105835} -09/21/2021 00:38:15 - INFO - __main__ - Step 46861: {'lr': 0.00019903644978050913, 'samples': 1499552, 'steps': 2928, 'loss/train': 1.9860811233520508} -09/21/2021 00:38:16 - INFO - __main__ - Step 46862: {'lr': 0.00019903644978050913, 'samples': 1499584, 'steps': 2928, 'loss/train': 1.8670049905776978} -09/21/2021 00:38:17 - INFO - __main__ - Step 46863: {'lr': 0.00019903644978050913, 'samples': 1499616, 'steps': 2928, 'loss/train': 2.0534284114837646} -09/21/2021 00:38:18 - INFO - __main__ - Step 46864: {'lr': 0.00019903644978050913, 'samples': 1499648, 'steps': 2928, 'loss/train': 1.8961827754974365} -09/21/2021 00:38:19 - INFO - __main__ - Step 46865: {'lr': 0.0001990355661999132, 'samples': 1499680, 'steps': 2929, 'loss/train': 2.068887710571289} -09/21/2021 00:38:20 - INFO - __main__ - Step 46866: {'lr': 0.0001990355661999132, 'samples': 1499712, 'steps': 2929, 'loss/train': 1.2757539749145508} -09/21/2021 00:38:21 - INFO - __main__ - Step 46867: {'lr': 0.0001990355661999132, 'samples': 1499744, 'steps': 2929, 'loss/train': 1.7201915979385376} -09/21/2021 00:38:22 - INFO - __main__ - Step 46868: {'lr': 0.0001990355661999132, 'samples': 1499776, 'steps': 2929, 'loss/train': 1.9953094720840454} -09/21/2021 00:38:22 - INFO - __main__ - Step 46869: {'lr': 0.0001990355661999132, 'samples': 1499808, 'steps': 2929, 'loss/train': 1.6745301485061646} -09/21/2021 00:38:23 - INFO - __main__ - Step 46870: {'lr': 0.0001990355661999132, 'samples': 1499840, 'steps': 2929, 'loss/train': 2.1245477199554443} -09/21/2021 00:38:24 - INFO - __main__ - Step 46871: {'lr': 0.0001990355661999132, 'samples': 1499872, 'steps': 2929, 'loss/train': 2.1903305053710938} -09/21/2021 00:38:25 - INFO - __main__ - Step 46872: {'lr': 0.0001990355661999132, 'samples': 1499904, 'steps': 2929, 'loss/train': 0.4414110779762268} -09/21/2021 00:38:25 - INFO - __main__ - Step 46873: {'lr': 0.0001990355661999132, 'samples': 1499936, 'steps': 2929, 'loss/train': 2.293595552444458} -09/21/2021 00:38:26 - INFO - __main__ - Step 46874: {'lr': 0.0001990355661999132, 'samples': 1499968, 'steps': 2929, 'loss/train': 1.1347905397415161} -09/21/2021 00:38:27 - INFO - __main__ - Step 46875: {'lr': 0.0001990355661999132, 'samples': 1500000, 'steps': 2929, 'loss/train': 1.131959319114685} -09/21/2021 00:38:28 - INFO - __main__ - Step 46876: {'lr': 0.0001990355661999132, 'samples': 1500032, 'steps': 2929, 'loss/train': 1.5124907493591309} -09/21/2021 00:38:28 - INFO - __main__ - Step 46877: {'lr': 0.0001990355661999132, 'samples': 1500064, 'steps': 2929, 'loss/train': 1.994035243988037} -09/21/2021 00:38:29 - INFO - __main__ - Step 46878: {'lr': 0.0001990355661999132, 'samples': 1500096, 'steps': 2929, 'loss/train': 1.9765846729278564} -09/21/2021 00:38:30 - INFO - __main__ - Step 46879: {'lr': 0.0001990355661999132, 'samples': 1500128, 'steps': 2929, 'loss/train': 0.5136539340019226} -09/21/2021 00:38:31 - INFO - __main__ - Step 46880: {'lr': 0.0001990355661999132, 'samples': 1500160, 'steps': 2929, 'loss/train': 2.1932225227355957} -09/21/2021 00:38:31 - INFO - __main__ - Step 46881: {'lr': 0.00019903468221634194, 'samples': 1500192, 'steps': 2930, 'loss/train': 3.3394176959991455} -09/21/2021 00:38:32 - INFO - __main__ - Step 46882: {'lr': 0.00019903468221634194, 'samples': 1500224, 'steps': 2930, 'loss/train': 1.847679853439331} -09/21/2021 00:38:33 - INFO - __main__ - Step 46883: {'lr': 0.00019903468221634194, 'samples': 1500256, 'steps': 2930, 'loss/train': 2.625680923461914} -09/21/2021 00:38:34 - INFO - __main__ - Step 46884: {'lr': 0.00019903468221634194, 'samples': 1500288, 'steps': 2930, 'loss/train': 1.2030922174453735} -09/21/2021 00:38:34 - INFO - __main__ - Step 46885: {'lr': 0.00019903468221634194, 'samples': 1500320, 'steps': 2930, 'loss/train': 1.5851054191589355} -09/21/2021 00:38:35 - INFO - __main__ - Step 46886: {'lr': 0.00019903468221634194, 'samples': 1500352, 'steps': 2930, 'loss/train': 2.1628758907318115} -09/21/2021 00:38:36 - INFO - __main__ - Step 46887: {'lr': 0.00019903468221634194, 'samples': 1500384, 'steps': 2930, 'loss/train': 2.378836154937744} -09/21/2021 00:38:37 - INFO - __main__ - Step 46888: {'lr': 0.00019903468221634194, 'samples': 1500416, 'steps': 2930, 'loss/train': 2.5371458530426025} -09/21/2021 00:38:37 - INFO - __main__ - Step 46889: {'lr': 0.00019903468221634194, 'samples': 1500448, 'steps': 2930, 'loss/train': 1.5169981718063354} -09/21/2021 00:38:38 - INFO - __main__ - Step 46890: {'lr': 0.00019903468221634194, 'samples': 1500480, 'steps': 2930, 'loss/train': 1.2329157590866089} -09/21/2021 00:38:39 - INFO - __main__ - Step 46891: {'lr': 0.00019903468221634194, 'samples': 1500512, 'steps': 2930, 'loss/train': 1.341859221458435} -09/21/2021 00:38:40 - INFO - __main__ - Step 46892: {'lr': 0.00019903468221634194, 'samples': 1500544, 'steps': 2930, 'loss/train': 1.6984211206436157} -09/21/2021 00:38:40 - INFO - __main__ - Step 46893: {'lr': 0.00019903468221634194, 'samples': 1500576, 'steps': 2930, 'loss/train': 2.0833868980407715} -09/21/2021 00:38:41 - INFO - __main__ - Step 46894: {'lr': 0.00019903468221634194, 'samples': 1500608, 'steps': 2930, 'loss/train': 2.7493860721588135} -09/21/2021 00:38:42 - INFO - __main__ - Step 46895: {'lr': 0.00019903468221634194, 'samples': 1500640, 'steps': 2930, 'loss/train': 1.8145498037338257} -09/21/2021 00:38:43 - INFO - __main__ - Step 46896: {'lr': 0.00019903468221634194, 'samples': 1500672, 'steps': 2930, 'loss/train': 0.5034054517745972} -09/21/2021 00:38:44 - INFO - __main__ - Step 46897: {'lr': 0.00019903379782979896, 'samples': 1500704, 'steps': 2931, 'loss/train': 2.143277883529663} -09/21/2021 00:38:45 - INFO - __main__ - Step 46898: {'lr': 0.00019903379782979896, 'samples': 1500736, 'steps': 2931, 'loss/train': 0.27499333024024963} -09/21/2021 00:38:46 - INFO - __main__ - Step 46899: {'lr': 0.00019903379782979896, 'samples': 1500768, 'steps': 2931, 'loss/train': 2.3876852989196777} -09/21/2021 00:38:46 - INFO - __main__ - Step 46900: {'lr': 0.00019903379782979896, 'samples': 1500800, 'steps': 2931, 'loss/train': 1.811691403388977} -09/21/2021 00:38:47 - INFO - __main__ - Step 46901: {'lr': 0.00019903379782979896, 'samples': 1500832, 'steps': 2931, 'loss/train': 1.4076049327850342} -09/21/2021 00:38:48 - INFO - __main__ - Step 46902: {'lr': 0.00019903379782979896, 'samples': 1500864, 'steps': 2931, 'loss/train': 1.918138027191162} -09/21/2021 00:38:49 - INFO - __main__ - Step 46903: {'lr': 0.00019903379782979896, 'samples': 1500896, 'steps': 2931, 'loss/train': 1.5879992246627808} -09/21/2021 00:38:49 - INFO - __main__ - Step 46904: {'lr': 0.00019903379782979896, 'samples': 1500928, 'steps': 2931, 'loss/train': 1.9948941469192505} -09/21/2021 00:38:50 - INFO - __main__ - Step 46905: {'lr': 0.00019903379782979896, 'samples': 1500960, 'steps': 2931, 'loss/train': 1.7725433111190796} -09/21/2021 00:38:51 - INFO - __main__ - Step 46906: {'lr': 0.00019903379782979896, 'samples': 1500992, 'steps': 2931, 'loss/train': 1.5466279983520508} -09/21/2021 00:38:52 - INFO - __main__ - Step 46907: {'lr': 0.00019903379782979896, 'samples': 1501024, 'steps': 2931, 'loss/train': 1.5677030086517334} -09/21/2021 00:38:52 - INFO - __main__ - Step 46908: {'lr': 0.00019903379782979896, 'samples': 1501056, 'steps': 2931, 'loss/train': 2.028243064880371} -09/21/2021 00:38:53 - INFO - __main__ - Step 46909: {'lr': 0.00019903379782979896, 'samples': 1501088, 'steps': 2931, 'loss/train': 2.178537607192993} -09/21/2021 00:38:54 - INFO - __main__ - Step 46910: {'lr': 0.00019903379782979896, 'samples': 1501120, 'steps': 2931, 'loss/train': 2.1265859603881836} -09/21/2021 00:38:55 - INFO - __main__ - Step 46911: {'lr': 0.00019903379782979896, 'samples': 1501152, 'steps': 2931, 'loss/train': 1.3184419870376587} -09/21/2021 00:38:55 - INFO - __main__ - Step 46912: {'lr': 0.00019903379782979896, 'samples': 1501184, 'steps': 2931, 'loss/train': 2.399872303009033} -09/21/2021 00:38:56 - INFO - __main__ - Step 46913: {'lr': 0.00019903291304028783, 'samples': 1501216, 'steps': 2932, 'loss/train': 3.236097574234009} -09/21/2021 00:38:57 - INFO - __main__ - Step 46914: {'lr': 0.00019903291304028783, 'samples': 1501248, 'steps': 2932, 'loss/train': 1.8521510362625122} -09/21/2021 00:38:58 - INFO - __main__ - Step 46915: {'lr': 0.00019903291304028783, 'samples': 1501280, 'steps': 2932, 'loss/train': 1.7556827068328857} -09/21/2021 00:38:58 - INFO - __main__ - Step 46916: {'lr': 0.00019903291304028783, 'samples': 1501312, 'steps': 2932, 'loss/train': 2.699110507965088} -09/21/2021 00:38:59 - INFO - __main__ - Step 46917: {'lr': 0.00019903291304028783, 'samples': 1501344, 'steps': 2932, 'loss/train': 2.1122355461120605} -09/21/2021 00:39:00 - INFO - __main__ - Step 46918: {'lr': 0.00019903291304028783, 'samples': 1501376, 'steps': 2932, 'loss/train': 1.4243355989456177} -09/21/2021 00:39:01 - INFO - __main__ - Step 46919: {'lr': 0.00019903291304028783, 'samples': 1501408, 'steps': 2932, 'loss/train': 1.5379616022109985} -09/21/2021 00:39:01 - INFO - __main__ - Step 46920: {'lr': 0.00019903291304028783, 'samples': 1501440, 'steps': 2932, 'loss/train': 2.3583388328552246} -09/21/2021 00:39:02 - INFO - __main__ - Step 46921: {'lr': 0.00019903291304028783, 'samples': 1501472, 'steps': 2932, 'loss/train': 1.5830373764038086} -09/21/2021 00:39:03 - INFO - __main__ - Step 46922: {'lr': 0.00019903291304028783, 'samples': 1501504, 'steps': 2932, 'loss/train': 2.5507030487060547} -09/21/2021 00:39:04 - INFO - __main__ - Step 46923: {'lr': 0.00019903291304028783, 'samples': 1501536, 'steps': 2932, 'loss/train': 1.4656795263290405} -09/21/2021 00:39:04 - INFO - __main__ - Step 46924: {'lr': 0.00019903291304028783, 'samples': 1501568, 'steps': 2932, 'loss/train': 3.473677396774292} -09/21/2021 00:39:06 - INFO - __main__ - Step 46925: {'lr': 0.00019903291304028783, 'samples': 1501600, 'steps': 2932, 'loss/train': 2.0078155994415283} -09/21/2021 00:39:06 - INFO - __main__ - Step 46926: {'lr': 0.00019903291304028783, 'samples': 1501632, 'steps': 2932, 'loss/train': 2.1455862522125244} -09/21/2021 00:39:07 - INFO - __main__ - Step 46927: {'lr': 0.00019903291304028783, 'samples': 1501664, 'steps': 2932, 'loss/train': 1.207930326461792} -09/21/2021 00:39:08 - INFO - __main__ - Step 46928: {'lr': 0.00019903291304028783, 'samples': 1501696, 'steps': 2932, 'loss/train': 2.44724440574646} -09/21/2021 00:39:09 - INFO - __main__ - Step 46929: {'lr': 0.00019903202784781214, 'samples': 1501728, 'steps': 2933, 'loss/train': 2.007967233657837} -09/21/2021 00:39:10 - INFO - __main__ - Step 46930: {'lr': 0.00019903202784781214, 'samples': 1501760, 'steps': 2933, 'loss/train': 3.3649864196777344} -09/21/2021 00:39:10 - INFO - __main__ - Step 46931: {'lr': 0.00019903202784781214, 'samples': 1501792, 'steps': 2933, 'loss/train': 2.280723810195923} -09/21/2021 00:39:11 - INFO - __main__ - Step 46932: {'lr': 0.00019903202784781214, 'samples': 1501824, 'steps': 2933, 'loss/train': 1.5712844133377075} -09/21/2021 00:39:12 - INFO - __main__ - Step 46933: {'lr': 0.00019903202784781214, 'samples': 1501856, 'steps': 2933, 'loss/train': 1.9001140594482422} -09/21/2021 00:39:13 - INFO - __main__ - Step 46934: {'lr': 0.00019903202784781214, 'samples': 1501888, 'steps': 2933, 'loss/train': 2.040252685546875} -09/21/2021 00:39:13 - INFO - __main__ - Step 46935: {'lr': 0.00019903202784781214, 'samples': 1501920, 'steps': 2933, 'loss/train': 2.4271678924560547} -09/21/2021 00:39:14 - INFO - __main__ - Step 46936: {'lr': 0.00019903202784781214, 'samples': 1501952, 'steps': 2933, 'loss/train': 1.9284679889678955} -09/21/2021 00:39:15 - INFO - __main__ - Step 46937: {'lr': 0.00019903202784781214, 'samples': 1501984, 'steps': 2933, 'loss/train': 2.6034839153289795} -09/21/2021 00:39:16 - INFO - __main__ - Step 46938: {'lr': 0.00019903202784781214, 'samples': 1502016, 'steps': 2933, 'loss/train': 1.5266257524490356} -09/21/2021 00:39:16 - INFO - __main__ - Step 46939: {'lr': 0.00019903202784781214, 'samples': 1502048, 'steps': 2933, 'loss/train': 1.6178090572357178} -09/21/2021 00:39:17 - INFO - __main__ - Step 46940: {'lr': 0.00019903202784781214, 'samples': 1502080, 'steps': 2933, 'loss/train': 1.9759196043014526} -09/21/2021 00:39:18 - INFO - __main__ - Step 46941: {'lr': 0.00019903202784781214, 'samples': 1502112, 'steps': 2933, 'loss/train': 1.429943561553955} -09/21/2021 00:39:19 - INFO - __main__ - Step 46942: {'lr': 0.00019903202784781214, 'samples': 1502144, 'steps': 2933, 'loss/train': 2.6463541984558105} -09/21/2021 00:39:19 - INFO - __main__ - Step 46943: {'lr': 0.00019903202784781214, 'samples': 1502176, 'steps': 2933, 'loss/train': 1.9407380819320679} -09/21/2021 00:39:20 - INFO - __main__ - Step 46944: {'lr': 0.00019903202784781214, 'samples': 1502208, 'steps': 2933, 'loss/train': 1.5312230587005615} -09/21/2021 00:39:21 - INFO - __main__ - Step 46945: {'lr': 0.00019903114225237553, 'samples': 1502240, 'steps': 2934, 'loss/train': 2.4005956649780273} -09/21/2021 00:39:22 - INFO - __main__ - Step 46946: {'lr': 0.00019903114225237553, 'samples': 1502272, 'steps': 2934, 'loss/train': 0.3863717317581177} -09/21/2021 00:39:22 - INFO - __main__ - Step 46947: {'lr': 0.00019903114225237553, 'samples': 1502304, 'steps': 2934, 'loss/train': 1.2030599117279053} -09/21/2021 00:39:23 - INFO - __main__ - Step 46948: {'lr': 0.00019903114225237553, 'samples': 1502336, 'steps': 2934, 'loss/train': 1.3976305723190308} -09/21/2021 00:39:24 - INFO - __main__ - Step 46949: {'lr': 0.00019903114225237553, 'samples': 1502368, 'steps': 2934, 'loss/train': 2.6424148082733154} -09/21/2021 00:39:25 - INFO - __main__ - Step 46950: {'lr': 0.00019903114225237553, 'samples': 1502400, 'steps': 2934, 'loss/train': 2.093538999557495} -09/21/2021 00:39:25 - INFO - __main__ - Step 46951: {'lr': 0.00019903114225237553, 'samples': 1502432, 'steps': 2934, 'loss/train': 1.9712754487991333} -09/21/2021 00:39:26 - INFO - __main__ - Step 46952: {'lr': 0.00019903114225237553, 'samples': 1502464, 'steps': 2934, 'loss/train': 1.6477129459381104} -09/21/2021 00:39:27 - INFO - __main__ - Step 46953: {'lr': 0.00019903114225237553, 'samples': 1502496, 'steps': 2934, 'loss/train': 2.402604818344116} -09/21/2021 00:39:28 - INFO - __main__ - Step 46954: {'lr': 0.00019903114225237553, 'samples': 1502528, 'steps': 2934, 'loss/train': 1.8423306941986084} -09/21/2021 00:39:28 - INFO - __main__ - Step 46955: {'lr': 0.00019903114225237553, 'samples': 1502560, 'steps': 2934, 'loss/train': 1.9553111791610718} -09/21/2021 00:39:30 - INFO - __main__ - Step 46956: {'lr': 0.00019903114225237553, 'samples': 1502592, 'steps': 2934, 'loss/train': 1.751628041267395} -09/21/2021 00:39:30 - INFO - __main__ - Step 46957: {'lr': 0.00019903114225237553, 'samples': 1502624, 'steps': 2934, 'loss/train': 1.446574091911316} -09/21/2021 00:39:31 - INFO - __main__ - Step 46958: {'lr': 0.00019903114225237553, 'samples': 1502656, 'steps': 2934, 'loss/train': 1.4048100709915161} -09/21/2021 00:39:32 - INFO - __main__ - Step 46959: {'lr': 0.00019903114225237553, 'samples': 1502688, 'steps': 2934, 'loss/train': 1.8712698221206665} -09/21/2021 00:39:33 - INFO - __main__ - Step 46960: {'lr': 0.00019903114225237553, 'samples': 1502720, 'steps': 2934, 'loss/train': 1.399362564086914} -09/21/2021 00:39:34 - INFO - __main__ - Step 46961: {'lr': 0.0001990302562539816, 'samples': 1502752, 'steps': 2935, 'loss/train': 1.7336149215698242} -09/21/2021 00:39:34 - INFO - __main__ - Step 46962: {'lr': 0.0001990302562539816, 'samples': 1502784, 'steps': 2935, 'loss/train': 2.2018563747406006} -09/21/2021 00:39:35 - INFO - __main__ - Step 46963: {'lr': 0.0001990302562539816, 'samples': 1502816, 'steps': 2935, 'loss/train': 2.5812087059020996} -09/21/2021 00:39:36 - INFO - __main__ - Step 46964: {'lr': 0.0001990302562539816, 'samples': 1502848, 'steps': 2935, 'loss/train': 1.8008239269256592} -09/21/2021 00:39:37 - INFO - __main__ - Step 46965: {'lr': 0.0001990302562539816, 'samples': 1502880, 'steps': 2935, 'loss/train': 2.265439510345459} -09/21/2021 00:39:37 - INFO - __main__ - Step 46966: {'lr': 0.0001990302562539816, 'samples': 1502912, 'steps': 2935, 'loss/train': 1.3783656358718872} -09/21/2021 00:39:38 - INFO - __main__ - Step 46967: {'lr': 0.0001990302562539816, 'samples': 1502944, 'steps': 2935, 'loss/train': 1.3632428646087646} -09/21/2021 00:39:39 - INFO - __main__ - Step 46968: {'lr': 0.0001990302562539816, 'samples': 1502976, 'steps': 2935, 'loss/train': 1.7793207168579102} -09/21/2021 00:39:40 - INFO - __main__ - Step 46969: {'lr': 0.0001990302562539816, 'samples': 1503008, 'steps': 2935, 'loss/train': 2.4289369583129883} -09/21/2021 00:39:40 - INFO - __main__ - Step 46970: {'lr': 0.0001990302562539816, 'samples': 1503040, 'steps': 2935, 'loss/train': 2.3788869380950928} -09/21/2021 00:39:41 - INFO - __main__ - Step 46971: {'lr': 0.0001990302562539816, 'samples': 1503072, 'steps': 2935, 'loss/train': 1.723854422569275} -09/21/2021 00:39:42 - INFO - __main__ - Step 46972: {'lr': 0.0001990302562539816, 'samples': 1503104, 'steps': 2935, 'loss/train': 2.8078761100769043} -09/21/2021 00:39:43 - INFO - __main__ - Step 46973: {'lr': 0.0001990302562539816, 'samples': 1503136, 'steps': 2935, 'loss/train': 2.075284719467163} -09/21/2021 00:39:43 - INFO - __main__ - Step 46974: {'lr': 0.0001990302562539816, 'samples': 1503168, 'steps': 2935, 'loss/train': 1.545145034790039} -09/21/2021 00:39:44 - INFO - __main__ - Step 46975: {'lr': 0.0001990302562539816, 'samples': 1503200, 'steps': 2935, 'loss/train': 1.9541298151016235} -09/21/2021 00:39:45 - INFO - __main__ - Step 46976: {'lr': 0.0001990302562539816, 'samples': 1503232, 'steps': 2935, 'loss/train': 2.0695674419403076} -09/21/2021 00:39:46 - INFO - __main__ - Step 46977: {'lr': 0.0001990293698526339, 'samples': 1503264, 'steps': 2936, 'loss/train': 0.6341695785522461} -09/21/2021 00:39:47 - INFO - __main__ - Step 46978: {'lr': 0.0001990293698526339, 'samples': 1503296, 'steps': 2936, 'loss/train': 1.7948591709136963} -09/21/2021 00:39:47 - INFO - __main__ - Step 46979: {'lr': 0.0001990293698526339, 'samples': 1503328, 'steps': 2936, 'loss/train': 1.3167001008987427} -09/21/2021 00:39:48 - INFO - __main__ - Step 46980: {'lr': 0.0001990293698526339, 'samples': 1503360, 'steps': 2936, 'loss/train': 2.6936869621276855} -09/21/2021 00:39:49 - INFO - __main__ - Step 46981: {'lr': 0.0001990293698526339, 'samples': 1503392, 'steps': 2936, 'loss/train': 2.5324108600616455} -09/21/2021 00:39:50 - INFO - __main__ - Step 46982: {'lr': 0.0001990293698526339, 'samples': 1503424, 'steps': 2936, 'loss/train': 2.2375869750976562} -09/21/2021 00:39:50 - INFO - __main__ - Step 46983: {'lr': 0.0001990293698526339, 'samples': 1503456, 'steps': 2936, 'loss/train': 1.611738920211792} -09/21/2021 00:39:51 - INFO - __main__ - Step 46984: {'lr': 0.0001990293698526339, 'samples': 1503488, 'steps': 2936, 'loss/train': 1.8109099864959717} -09/21/2021 00:39:52 - INFO - __main__ - Step 46985: {'lr': 0.0001990293698526339, 'samples': 1503520, 'steps': 2936, 'loss/train': 2.2714436054229736} -09/21/2021 00:39:53 - INFO - __main__ - Step 46986: {'lr': 0.0001990293698526339, 'samples': 1503552, 'steps': 2936, 'loss/train': 1.8053427934646606} -09/21/2021 00:39:54 - INFO - __main__ - Step 46987: {'lr': 0.0001990293698526339, 'samples': 1503584, 'steps': 2936, 'loss/train': 2.167449474334717} -09/21/2021 00:39:55 - INFO - __main__ - Step 46988: {'lr': 0.0001990293698526339, 'samples': 1503616, 'steps': 2936, 'loss/train': 1.484005331993103} -09/21/2021 00:39:55 - INFO - __main__ - Step 46989: {'lr': 0.0001990293698526339, 'samples': 1503648, 'steps': 2936, 'loss/train': 2.4108762741088867} -09/21/2021 00:39:56 - INFO - __main__ - Step 46990: {'lr': 0.0001990293698526339, 'samples': 1503680, 'steps': 2936, 'loss/train': 2.750422477722168} -09/21/2021 00:39:57 - INFO - __main__ - Step 46991: {'lr': 0.0001990293698526339, 'samples': 1503712, 'steps': 2936, 'loss/train': 1.97174870967865} -09/21/2021 00:39:58 - INFO - __main__ - Step 46992: {'lr': 0.0001990293698526339, 'samples': 1503744, 'steps': 2936, 'loss/train': 2.3822813034057617} -09/21/2021 00:39:59 - INFO - __main__ - Step 46993: {'lr': 0.00019902848304833613, 'samples': 1503776, 'steps': 2937, 'loss/train': 2.6079230308532715} -09/21/2021 00:39:59 - INFO - __main__ - Step 46994: {'lr': 0.00019902848304833613, 'samples': 1503808, 'steps': 2937, 'loss/train': 2.0800106525421143} -09/21/2021 00:40:00 - INFO - __main__ - Step 46995: {'lr': 0.00019902848304833613, 'samples': 1503840, 'steps': 2937, 'loss/train': 2.041017532348633} -09/21/2021 00:40:01 - INFO - __main__ - Step 46996: {'lr': 0.00019902848304833613, 'samples': 1503872, 'steps': 2937, 'loss/train': 1.1240978240966797} -09/21/2021 00:40:02 - INFO - __main__ - Step 46997: {'lr': 0.00019902848304833613, 'samples': 1503904, 'steps': 2937, 'loss/train': 1.8809393644332886} -09/21/2021 00:40:02 - INFO - __main__ - Step 46998: {'lr': 0.00019902848304833613, 'samples': 1503936, 'steps': 2937, 'loss/train': 1.786623477935791} -09/21/2021 00:40:03 - INFO - __main__ - Step 46999: {'lr': 0.00019902848304833613, 'samples': 1503968, 'steps': 2937, 'loss/train': 2.028960943222046} -09/21/2021 00:40:04 - INFO - __main__ - Step 47000: {'lr': 0.00019902848304833613, 'samples': 1504000, 'steps': 2937, 'loss/train': 2.2156620025634766} -09/21/2021 00:40:05 - INFO - __main__ - Step 47001: {'lr': 0.00019902848304833613, 'samples': 1504032, 'steps': 2937, 'loss/train': 2.5898900032043457} -09/21/2021 00:40:05 - INFO - __main__ - Step 47002: {'lr': 0.00019902848304833613, 'samples': 1504064, 'steps': 2937, 'loss/train': 2.3599798679351807} -09/21/2021 00:40:06 - INFO - __main__ - Step 47003: {'lr': 0.00019902848304833613, 'samples': 1504096, 'steps': 2937, 'loss/train': 1.9338370561599731} -09/21/2021 00:40:07 - INFO - __main__ - Step 47004: {'lr': 0.00019902848304833613, 'samples': 1504128, 'steps': 2937, 'loss/train': 2.1964545249938965} -09/21/2021 00:40:08 - INFO - __main__ - Step 47005: {'lr': 0.00019902848304833613, 'samples': 1504160, 'steps': 2937, 'loss/train': 6.107872486114502} -09/21/2021 00:40:08 - INFO - __main__ - Step 47006: {'lr': 0.00019902848304833613, 'samples': 1504192, 'steps': 2937, 'loss/train': 6.389329433441162} -09/21/2021 00:40:09 - INFO - __main__ - Step 47007: {'lr': 0.00019902848304833613, 'samples': 1504224, 'steps': 2937, 'loss/train': 6.58701229095459} -09/21/2021 00:40:10 - INFO - __main__ - Step 47008: {'lr': 0.00019902848304833613, 'samples': 1504256, 'steps': 2937, 'loss/train': 5.872402667999268} -09/21/2021 00:40:11 - INFO - __main__ - Step 47009: {'lr': 0.00019902759584109183, 'samples': 1504288, 'steps': 2938, 'loss/train': 5.347360610961914} -09/21/2021 00:40:11 - INFO - __main__ - Step 47010: {'lr': 0.00019902759584109183, 'samples': 1504320, 'steps': 2938, 'loss/train': 6.798940181732178} -09/21/2021 00:40:12 - INFO - __main__ - Step 47011: {'lr': 0.00019902759584109183, 'samples': 1504352, 'steps': 2938, 'loss/train': 7.035219669342041} -09/21/2021 00:40:13 - INFO - __main__ - Step 47012: {'lr': 0.00019902759584109183, 'samples': 1504384, 'steps': 2938, 'loss/train': 6.893153667449951} -09/21/2021 00:40:14 - INFO - __main__ - Step 47013: {'lr': 0.00019902759584109183, 'samples': 1504416, 'steps': 2938, 'loss/train': 1.4025439023971558} -09/21/2021 00:40:14 - INFO - __main__ - Step 47014: {'lr': 0.00019902759584109183, 'samples': 1504448, 'steps': 2938, 'loss/train': 2.1816787719726562} -09/21/2021 00:40:15 - INFO - __main__ - Step 47015: {'lr': 0.00019902759584109183, 'samples': 1504480, 'steps': 2938, 'loss/train': 1.87334144115448} -09/21/2021 00:40:16 - INFO - __main__ - Step 47016: {'lr': 0.00019902759584109183, 'samples': 1504512, 'steps': 2938, 'loss/train': 2.019406318664551} -09/21/2021 00:40:17 - INFO - __main__ - Step 47017: {'lr': 0.00019902759584109183, 'samples': 1504544, 'steps': 2938, 'loss/train': 1.3522542715072632} -09/21/2021 00:40:17 - INFO - __main__ - Step 47018: {'lr': 0.00019902759584109183, 'samples': 1504576, 'steps': 2938, 'loss/train': 1.4387016296386719} -09/21/2021 00:40:18 - INFO - __main__ - Step 47019: {'lr': 0.00019902759584109183, 'samples': 1504608, 'steps': 2938, 'loss/train': 1.8835821151733398} -09/21/2021 00:40:19 - INFO - __main__ - Step 47020: {'lr': 0.00019902759584109183, 'samples': 1504640, 'steps': 2938, 'loss/train': 2.005626916885376} -09/21/2021 00:40:20 - INFO - __main__ - Step 47021: {'lr': 0.00019902759584109183, 'samples': 1504672, 'steps': 2938, 'loss/train': 1.8356765508651733} -09/21/2021 00:40:21 - INFO - __main__ - Step 47022: {'lr': 0.00019902759584109183, 'samples': 1504704, 'steps': 2938, 'loss/train': 1.9212086200714111} -09/21/2021 00:40:22 - INFO - __main__ - Step 47023: {'lr': 0.00019902759584109183, 'samples': 1504736, 'steps': 2938, 'loss/train': 2.3275201320648193} -09/21/2021 00:40:23 - INFO - __main__ - Step 47024: {'lr': 0.00019902759584109183, 'samples': 1504768, 'steps': 2938, 'loss/train': 1.628429651260376} -09/21/2021 00:40:24 - INFO - __main__ - Step 47025: {'lr': 0.0001990267082309046, 'samples': 1504800, 'steps': 2939, 'loss/train': 2.393688678741455} -09/21/2021 00:40:24 - INFO - __main__ - Step 47026: {'lr': 0.0001990267082309046, 'samples': 1504832, 'steps': 2939, 'loss/train': 2.198892831802368} -09/21/2021 00:40:25 - INFO - __main__ - Step 47027: {'lr': 0.0001990267082309046, 'samples': 1504864, 'steps': 2939, 'loss/train': 2.0304322242736816} -09/21/2021 00:40:26 - INFO - __main__ - Step 47028: {'lr': 0.0001990267082309046, 'samples': 1504896, 'steps': 2939, 'loss/train': 1.6153221130371094} -09/21/2021 00:40:27 - INFO - __main__ - Step 47029: {'lr': 0.0001990267082309046, 'samples': 1504928, 'steps': 2939, 'loss/train': 1.8421213626861572} -09/21/2021 00:40:27 - INFO - __main__ - Step 47030: {'lr': 0.0001990267082309046, 'samples': 1504960, 'steps': 2939, 'loss/train': 1.910522222518921} -09/21/2021 00:40:28 - INFO - __main__ - Step 47031: {'lr': 0.0001990267082309046, 'samples': 1504992, 'steps': 2939, 'loss/train': 2.5071914196014404} -09/21/2021 00:40:29 - INFO - __main__ - Step 47032: {'lr': 0.0001990267082309046, 'samples': 1505024, 'steps': 2939, 'loss/train': 2.0880961418151855} -09/21/2021 00:40:30 - INFO - __main__ - Step 47033: {'lr': 0.0001990267082309046, 'samples': 1505056, 'steps': 2939, 'loss/train': 2.876779079437256} -09/21/2021 00:40:30 - INFO - __main__ - Step 47034: {'lr': 0.0001990267082309046, 'samples': 1505088, 'steps': 2939, 'loss/train': 1.5212790966033936} -09/21/2021 00:40:31 - INFO - __main__ - Step 47035: {'lr': 0.0001990267082309046, 'samples': 1505120, 'steps': 2939, 'loss/train': 1.213167428970337} -09/21/2021 00:40:32 - INFO - __main__ - Step 47036: {'lr': 0.0001990267082309046, 'samples': 1505152, 'steps': 2939, 'loss/train': 1.1798028945922852} -09/21/2021 00:40:33 - INFO - __main__ - Step 47037: {'lr': 0.0001990267082309046, 'samples': 1505184, 'steps': 2939, 'loss/train': 1.245071291923523} -09/21/2021 00:40:33 - INFO - __main__ - Step 47038: {'lr': 0.0001990267082309046, 'samples': 1505216, 'steps': 2939, 'loss/train': 1.461234211921692} -09/21/2021 00:40:34 - INFO - __main__ - Step 47039: {'lr': 0.0001990267082309046, 'samples': 1505248, 'steps': 2939, 'loss/train': 1.1693114042282104} -09/21/2021 00:40:35 - INFO - __main__ - Step 47040: {'lr': 0.0001990267082309046, 'samples': 1505280, 'steps': 2939, 'loss/train': 1.375350832939148} -09/21/2021 00:40:36 - INFO - __main__ - Step 47041: {'lr': 0.0001990258202177781, 'samples': 1505312, 'steps': 2940, 'loss/train': 1.2077078819274902} -09/21/2021 00:40:37 - INFO - __main__ - Step 47042: {'lr': 0.0001990258202177781, 'samples': 1505344, 'steps': 2940, 'loss/train': 1.8811084032058716} -09/21/2021 00:40:37 - INFO - __main__ - Step 47043: {'lr': 0.0001990258202177781, 'samples': 1505376, 'steps': 2940, 'loss/train': 1.8957618474960327} -09/21/2021 00:40:38 - INFO - __main__ - Step 47044: {'lr': 0.0001990258202177781, 'samples': 1505408, 'steps': 2940, 'loss/train': 1.3808307647705078} -09/21/2021 00:40:39 - INFO - __main__ - Step 47045: {'lr': 0.0001990258202177781, 'samples': 1505440, 'steps': 2940, 'loss/train': 2.232832193374634} -09/21/2021 00:40:40 - INFO - __main__ - Step 47046: {'lr': 0.0001990258202177781, 'samples': 1505472, 'steps': 2940, 'loss/train': 0.9029306173324585} -09/21/2021 00:40:40 - INFO - __main__ - Step 47047: {'lr': 0.0001990258202177781, 'samples': 1505504, 'steps': 2940, 'loss/train': 3.628620147705078} -09/21/2021 00:40:41 - INFO - __main__ - Step 47048: {'lr': 0.0001990258202177781, 'samples': 1505536, 'steps': 2940, 'loss/train': 3.376516342163086} -09/21/2021 00:40:42 - INFO - __main__ - Step 47049: {'lr': 0.0001990258202177781, 'samples': 1505568, 'steps': 2940, 'loss/train': 2.7669501304626465} -09/21/2021 00:40:43 - INFO - __main__ - Step 47050: {'lr': 0.0001990258202177781, 'samples': 1505600, 'steps': 2940, 'loss/train': 1.6459625959396362} -09/21/2021 00:40:43 - INFO - __main__ - Step 47051: {'lr': 0.0001990258202177781, 'samples': 1505632, 'steps': 2940, 'loss/train': 2.7263081073760986} -09/21/2021 00:40:44 - INFO - __main__ - Step 47052: {'lr': 0.0001990258202177781, 'samples': 1505664, 'steps': 2940, 'loss/train': 2.720940351486206} -09/21/2021 00:40:45 - INFO - __main__ - Step 47053: {'lr': 0.0001990258202177781, 'samples': 1505696, 'steps': 2940, 'loss/train': 1.663432240486145} -09/21/2021 00:40:46 - INFO - __main__ - Step 47054: {'lr': 0.0001990258202177781, 'samples': 1505728, 'steps': 2940, 'loss/train': 0.9920403957366943} -09/21/2021 00:40:47 - INFO - __main__ - Step 47055: {'lr': 0.0001990258202177781, 'samples': 1505760, 'steps': 2940, 'loss/train': 2.213654041290283} -09/21/2021 00:40:48 - INFO - __main__ - Step 47056: {'lr': 0.0001990258202177781, 'samples': 1505792, 'steps': 2940, 'loss/train': 1.7924613952636719} -09/21/2021 00:40:48 - INFO - __main__ - Step 47057: {'lr': 0.00019902493180171593, 'samples': 1505824, 'steps': 2941, 'loss/train': 1.4994744062423706} -09/21/2021 00:40:49 - INFO - __main__ - Step 47058: {'lr': 0.00019902493180171593, 'samples': 1505856, 'steps': 2941, 'loss/train': 1.8580973148345947} -09/21/2021 00:40:50 - INFO - __main__ - Step 47059: {'lr': 0.00019902493180171593, 'samples': 1505888, 'steps': 2941, 'loss/train': 1.8114337921142578} -09/21/2021 00:40:51 - INFO - __main__ - Step 47060: {'lr': 0.00019902493180171593, 'samples': 1505920, 'steps': 2941, 'loss/train': 2.30473256111145} -09/21/2021 00:40:51 - INFO - __main__ - Step 47061: {'lr': 0.00019902493180171593, 'samples': 1505952, 'steps': 2941, 'loss/train': 2.608057975769043} -09/21/2021 00:40:52 - INFO - __main__ - Step 47062: {'lr': 0.00019902493180171593, 'samples': 1505984, 'steps': 2941, 'loss/train': 2.599714994430542} -09/21/2021 00:40:53 - INFO - __main__ - Step 47063: {'lr': 0.00019902493180171593, 'samples': 1506016, 'steps': 2941, 'loss/train': 2.2771995067596436} -09/21/2021 00:40:54 - INFO - __main__ - Step 47064: {'lr': 0.00019902493180171593, 'samples': 1506048, 'steps': 2941, 'loss/train': 2.8398425579071045} -09/21/2021 00:40:54 - INFO - __main__ - Step 47065: {'lr': 0.00019902493180171593, 'samples': 1506080, 'steps': 2941, 'loss/train': 1.8307691812515259} -09/21/2021 00:40:55 - INFO - __main__ - Step 47066: {'lr': 0.00019902493180171593, 'samples': 1506112, 'steps': 2941, 'loss/train': 1.6162934303283691} -09/21/2021 00:40:56 - INFO - __main__ - Step 47067: {'lr': 0.00019902493180171593, 'samples': 1506144, 'steps': 2941, 'loss/train': 2.775672435760498} -09/21/2021 00:40:57 - INFO - __main__ - Step 47068: {'lr': 0.00019902493180171593, 'samples': 1506176, 'steps': 2941, 'loss/train': 1.7761108875274658} -09/21/2021 00:40:57 - INFO - __main__ - Step 47069: {'lr': 0.00019902493180171593, 'samples': 1506208, 'steps': 2941, 'loss/train': 2.3602147102355957} -09/21/2021 00:40:58 - INFO - __main__ - Step 47070: {'lr': 0.00019902493180171593, 'samples': 1506240, 'steps': 2941, 'loss/train': 2.544544219970703} -09/21/2021 00:40:59 - INFO - __main__ - Step 47071: {'lr': 0.00019902493180171593, 'samples': 1506272, 'steps': 2941, 'loss/train': 2.136715888977051} -09/21/2021 00:41:00 - INFO - __main__ - Step 47072: {'lr': 0.00019902493180171593, 'samples': 1506304, 'steps': 2941, 'loss/train': 2.0194671154022217} -09/21/2021 00:41:01 - INFO - __main__ - Step 47073: {'lr': 0.00019902404298272167, 'samples': 1506336, 'steps': 2942, 'loss/train': 1.5350748300552368} -09/21/2021 00:41:01 - INFO - __main__ - Step 47074: {'lr': 0.00019902404298272167, 'samples': 1506368, 'steps': 2942, 'loss/train': 2.173473596572876} -09/21/2021 00:41:02 - INFO - __main__ - Step 47075: {'lr': 0.00019902404298272167, 'samples': 1506400, 'steps': 2942, 'loss/train': 2.3918392658233643} -09/21/2021 00:41:03 - INFO - __main__ - Step 47076: {'lr': 0.00019902404298272167, 'samples': 1506432, 'steps': 2942, 'loss/train': 2.6789207458496094} -09/21/2021 00:41:04 - INFO - __main__ - Step 47077: {'lr': 0.00019902404298272167, 'samples': 1506464, 'steps': 2942, 'loss/train': 2.3238143920898438} -09/21/2021 00:41:04 - INFO - __main__ - Step 47078: {'lr': 0.00019902404298272167, 'samples': 1506496, 'steps': 2942, 'loss/train': 2.129852771759033} -09/21/2021 00:41:05 - INFO - __main__ - Step 47079: {'lr': 0.00019902404298272167, 'samples': 1506528, 'steps': 2942, 'loss/train': 3.121058702468872} -09/21/2021 00:41:06 - INFO - __main__ - Step 47080: {'lr': 0.00019902404298272167, 'samples': 1506560, 'steps': 2942, 'loss/train': 1.8887182474136353} -09/21/2021 00:41:07 - INFO - __main__ - Step 47081: {'lr': 0.00019902404298272167, 'samples': 1506592, 'steps': 2942, 'loss/train': 2.077576160430908} -09/21/2021 00:41:07 - INFO - __main__ - Step 47082: {'lr': 0.00019902404298272167, 'samples': 1506624, 'steps': 2942, 'loss/train': 1.3692361116409302} -09/21/2021 00:41:08 - INFO - __main__ - Step 47083: {'lr': 0.00019902404298272167, 'samples': 1506656, 'steps': 2942, 'loss/train': 1.0064142942428589} -09/21/2021 00:41:09 - INFO - __main__ - Step 47084: {'lr': 0.00019902404298272167, 'samples': 1506688, 'steps': 2942, 'loss/train': 1.8731271028518677} -09/21/2021 00:41:10 - INFO - __main__ - Step 47085: {'lr': 0.00019902404298272167, 'samples': 1506720, 'steps': 2942, 'loss/train': 1.2765114307403564} -09/21/2021 00:41:11 - INFO - __main__ - Step 47086: {'lr': 0.00019902404298272167, 'samples': 1506752, 'steps': 2942, 'loss/train': 2.0660390853881836} -09/21/2021 00:41:12 - INFO - __main__ - Step 47087: {'lr': 0.00019902404298272167, 'samples': 1506784, 'steps': 2942, 'loss/train': 2.415384531021118} -09/21/2021 00:41:13 - INFO - __main__ - Step 47088: {'lr': 0.00019902404298272167, 'samples': 1506816, 'steps': 2942, 'loss/train': 2.0349555015563965} -09/21/2021 00:41:13 - INFO - __main__ - Step 47089: {'lr': 0.00019902315376079898, 'samples': 1506848, 'steps': 2943, 'loss/train': 2.3536863327026367} -09/21/2021 00:41:14 - INFO - __main__ - Step 47090: {'lr': 0.00019902315376079898, 'samples': 1506880, 'steps': 2943, 'loss/train': 2.0340867042541504} -09/21/2021 00:41:15 - INFO - __main__ - Step 47091: {'lr': 0.00019902315376079898, 'samples': 1506912, 'steps': 2943, 'loss/train': 1.476188063621521} -09/21/2021 00:41:16 - INFO - __main__ - Step 47092: {'lr': 0.00019902315376079898, 'samples': 1506944, 'steps': 2943, 'loss/train': 3.136798858642578} -09/21/2021 00:41:16 - INFO - __main__ - Step 47093: {'lr': 0.00019902315376079898, 'samples': 1506976, 'steps': 2943, 'loss/train': 1.7261128425598145} -09/21/2021 00:41:17 - INFO - __main__ - Step 47094: {'lr': 0.00019902315376079898, 'samples': 1507008, 'steps': 2943, 'loss/train': 1.7929574251174927} -09/21/2021 00:41:18 - INFO - __main__ - Step 47095: {'lr': 0.00019902315376079898, 'samples': 1507040, 'steps': 2943, 'loss/train': 2.6544854640960693} -09/21/2021 00:41:19 - INFO - __main__ - Step 47096: {'lr': 0.00019902315376079898, 'samples': 1507072, 'steps': 2943, 'loss/train': 2.501385450363159} -09/21/2021 00:41:19 - INFO - __main__ - Step 47097: {'lr': 0.00019902315376079898, 'samples': 1507104, 'steps': 2943, 'loss/train': 1.9666513204574585} -09/21/2021 00:41:20 - INFO - __main__ - Step 47098: {'lr': 0.00019902315376079898, 'samples': 1507136, 'steps': 2943, 'loss/train': 2.1449639797210693} -09/21/2021 00:41:21 - INFO - __main__ - Step 47099: {'lr': 0.00019902315376079898, 'samples': 1507168, 'steps': 2943, 'loss/train': 1.4993418455123901} -09/21/2021 00:41:22 - INFO - __main__ - Step 47100: {'lr': 0.00019902315376079898, 'samples': 1507200, 'steps': 2943, 'loss/train': 1.9522302150726318} -09/21/2021 00:41:22 - INFO - __main__ - Step 47101: {'lr': 0.00019902315376079898, 'samples': 1507232, 'steps': 2943, 'loss/train': 1.7746717929840088} -09/21/2021 00:41:23 - INFO - __main__ - Step 47102: {'lr': 0.00019902315376079898, 'samples': 1507264, 'steps': 2943, 'loss/train': 2.142430305480957} -09/21/2021 00:41:24 - INFO - __main__ - Step 47103: {'lr': 0.00019902315376079898, 'samples': 1507296, 'steps': 2943, 'loss/train': 2.225064277648926} -09/21/2021 00:41:25 - INFO - __main__ - Step 47104: {'lr': 0.00019902315376079898, 'samples': 1507328, 'steps': 2943, 'loss/train': 2.2274365425109863} -09/21/2021 00:41:26 - INFO - __main__ - Step 47105: {'lr': 0.00019902226413595145, 'samples': 1507360, 'steps': 2944, 'loss/train': 1.409112811088562} -09/21/2021 00:41:26 - INFO - __main__ - Step 47106: {'lr': 0.00019902226413595145, 'samples': 1507392, 'steps': 2944, 'loss/train': 2.0152578353881836} -09/21/2021 00:41:27 - INFO - __main__ - Step 47107: {'lr': 0.00019902226413595145, 'samples': 1507424, 'steps': 2944, 'loss/train': 0.7965605854988098} -09/21/2021 00:41:28 - INFO - __main__ - Step 47108: {'lr': 0.00019902226413595145, 'samples': 1507456, 'steps': 2944, 'loss/train': 2.2846710681915283} -09/21/2021 00:41:29 - INFO - __main__ - Step 47109: {'lr': 0.00019902226413595145, 'samples': 1507488, 'steps': 2944, 'loss/train': 2.7724196910858154} -09/21/2021 00:41:29 - INFO - __main__ - Step 47110: {'lr': 0.00019902226413595145, 'samples': 1507520, 'steps': 2944, 'loss/train': 2.494328737258911} -09/21/2021 00:41:30 - INFO - __main__ - Step 47111: {'lr': 0.00019902226413595145, 'samples': 1507552, 'steps': 2944, 'loss/train': 1.8740602731704712} -09/21/2021 00:41:31 - INFO - __main__ - Step 47112: {'lr': 0.00019902226413595145, 'samples': 1507584, 'steps': 2944, 'loss/train': 0.09373138844966888} -09/21/2021 00:41:32 - INFO - __main__ - Step 47113: {'lr': 0.00019902226413595145, 'samples': 1507616, 'steps': 2944, 'loss/train': 0.613251268863678} -09/21/2021 00:41:32 - INFO - __main__ - Step 47114: {'lr': 0.00019902226413595145, 'samples': 1507648, 'steps': 2944, 'loss/train': 0.16167022287845612} -09/21/2021 00:41:33 - INFO - __main__ - Step 47115: {'lr': 0.00019902226413595145, 'samples': 1507680, 'steps': 2944, 'loss/train': 1.7589964866638184} -09/21/2021 00:41:34 - INFO - __main__ - Step 47116: {'lr': 0.00019902226413595145, 'samples': 1507712, 'steps': 2944, 'loss/train': 2.0725934505462646} -09/21/2021 00:41:35 - INFO - __main__ - Step 47117: {'lr': 0.00019902226413595145, 'samples': 1507744, 'steps': 2944, 'loss/train': 1.4454904794692993} -09/21/2021 00:41:36 - INFO - __main__ - Step 47118: {'lr': 0.00019902226413595145, 'samples': 1507776, 'steps': 2944, 'loss/train': 2.3096563816070557} -09/21/2021 00:41:37 - INFO - __main__ - Step 47119: {'lr': 0.00019902226413595145, 'samples': 1507808, 'steps': 2944, 'loss/train': 1.226181149482727} -09/21/2021 00:41:37 - INFO - __main__ - Step 47120: {'lr': 0.00019902226413595145, 'samples': 1507840, 'steps': 2944, 'loss/train': 1.8831697702407837} -09/21/2021 00:41:38 - INFO - __main__ - Step 47121: {'lr': 0.00019902137410818274, 'samples': 1507872, 'steps': 2945, 'loss/train': 2.7577967643737793} -09/21/2021 00:41:39 - INFO - __main__ - Step 47122: {'lr': 0.00019902137410818274, 'samples': 1507904, 'steps': 2945, 'loss/train': 2.1054444313049316} -09/21/2021 00:41:40 - INFO - __main__ - Step 47123: {'lr': 0.00019902137410818274, 'samples': 1507936, 'steps': 2945, 'loss/train': 2.591282606124878} -09/21/2021 00:41:41 - INFO - __main__ - Step 47124: {'lr': 0.00019902137410818274, 'samples': 1507968, 'steps': 2945, 'loss/train': 1.6770209074020386} -09/21/2021 00:41:41 - INFO - __main__ - Step 47125: {'lr': 0.00019902137410818274, 'samples': 1508000, 'steps': 2945, 'loss/train': 2.1749608516693115} -09/21/2021 00:41:42 - INFO - __main__ - Step 47126: {'lr': 0.00019902137410818274, 'samples': 1508032, 'steps': 2945, 'loss/train': 2.7092125415802} -09/21/2021 00:41:43 - INFO - __main__ - Step 47127: {'lr': 0.00019902137410818274, 'samples': 1508064, 'steps': 2945, 'loss/train': 3.1784517765045166} -09/21/2021 00:41:44 - INFO - __main__ - Step 47128: {'lr': 0.00019902137410818274, 'samples': 1508096, 'steps': 2945, 'loss/train': 2.2368178367614746} -09/21/2021 00:41:44 - INFO - __main__ - Step 47129: {'lr': 0.00019902137410818274, 'samples': 1508128, 'steps': 2945, 'loss/train': 2.4205362796783447} -09/21/2021 00:41:45 - INFO - __main__ - Step 47130: {'lr': 0.00019902137410818274, 'samples': 1508160, 'steps': 2945, 'loss/train': 2.9608452320098877} -09/21/2021 00:41:46 - INFO - __main__ - Step 47131: {'lr': 0.00019902137410818274, 'samples': 1508192, 'steps': 2945, 'loss/train': 1.4105716943740845} -09/21/2021 00:41:47 - INFO - __main__ - Step 47132: {'lr': 0.00019902137410818274, 'samples': 1508224, 'steps': 2945, 'loss/train': 1.715279221534729} -09/21/2021 00:41:47 - INFO - __main__ - Step 47133: {'lr': 0.00019902137410818274, 'samples': 1508256, 'steps': 2945, 'loss/train': 1.2942149639129639} -09/21/2021 00:41:48 - INFO - __main__ - Step 47134: {'lr': 0.00019902137410818274, 'samples': 1508288, 'steps': 2945, 'loss/train': 2.508545160293579} -09/21/2021 00:41:49 - INFO - __main__ - Step 47135: {'lr': 0.00019902137410818274, 'samples': 1508320, 'steps': 2945, 'loss/train': 1.464614987373352} -09/21/2021 00:41:50 - INFO - __main__ - Step 47136: {'lr': 0.00019902137410818274, 'samples': 1508352, 'steps': 2945, 'loss/train': 2.1271660327911377} -09/21/2021 00:41:50 - INFO - __main__ - Step 47137: {'lr': 0.00019902048367749644, 'samples': 1508384, 'steps': 2946, 'loss/train': 1.6440765857696533} -09/21/2021 00:41:51 - INFO - __main__ - Step 47138: {'lr': 0.00019902048367749644, 'samples': 1508416, 'steps': 2946, 'loss/train': 1.523179531097412} -09/21/2021 00:41:52 - INFO - __main__ - Step 47139: {'lr': 0.00019902048367749644, 'samples': 1508448, 'steps': 2946, 'loss/train': 1.6507103443145752} -09/21/2021 00:41:53 - INFO - __main__ - Step 47140: {'lr': 0.00019902048367749644, 'samples': 1508480, 'steps': 2946, 'loss/train': 1.7600325345993042} -09/21/2021 00:41:53 - INFO - __main__ - Step 47141: {'lr': 0.00019902048367749644, 'samples': 1508512, 'steps': 2946, 'loss/train': 2.3924994468688965} -09/21/2021 00:41:54 - INFO - __main__ - Step 47142: {'lr': 0.00019902048367749644, 'samples': 1508544, 'steps': 2946, 'loss/train': 2.222524881362915} -09/21/2021 00:41:55 - INFO - __main__ - Step 47143: {'lr': 0.00019902048367749644, 'samples': 1508576, 'steps': 2946, 'loss/train': 3.005173921585083} -09/21/2021 00:41:56 - INFO - __main__ - Step 47144: {'lr': 0.00019902048367749644, 'samples': 1508608, 'steps': 2946, 'loss/train': 1.6934705972671509} -09/21/2021 00:41:56 - INFO - __main__ - Step 47145: {'lr': 0.00019902048367749644, 'samples': 1508640, 'steps': 2946, 'loss/train': 1.6273772716522217} -09/21/2021 00:41:57 - INFO - __main__ - Step 47146: {'lr': 0.00019902048367749644, 'samples': 1508672, 'steps': 2946, 'loss/train': 2.017395496368408} -09/21/2021 00:41:59 - INFO - __main__ - Step 47147: {'lr': 0.00019902048367749644, 'samples': 1508704, 'steps': 2946, 'loss/train': 1.4723368883132935} -09/21/2021 00:42:00 - INFO - __main__ - Step 47148: {'lr': 0.00019902048367749644, 'samples': 1508736, 'steps': 2946, 'loss/train': 2.3606648445129395} -09/21/2021 00:42:01 - INFO - __main__ - Step 47149: {'lr': 0.00019902048367749644, 'samples': 1508768, 'steps': 2946, 'loss/train': 2.18290114402771} -09/21/2021 00:42:01 - INFO - __main__ - Step 47150: {'lr': 0.00019902048367749644, 'samples': 1508800, 'steps': 2946, 'loss/train': 2.009434938430786} -09/21/2021 00:42:02 - INFO - __main__ - Step 47151: {'lr': 0.00019902048367749644, 'samples': 1508832, 'steps': 2946, 'loss/train': 2.5942628383636475} -09/21/2021 00:42:03 - INFO - __main__ - Step 47152: {'lr': 0.00019902048367749644, 'samples': 1508864, 'steps': 2946, 'loss/train': 2.7556848526000977} -09/21/2021 00:42:04 - INFO - __main__ - Step 47153: {'lr': 0.00019901959284389617, 'samples': 1508896, 'steps': 2947, 'loss/train': 1.9575562477111816} -09/21/2021 00:42:05 - INFO - __main__ - Step 47154: {'lr': 0.00019901959284389617, 'samples': 1508928, 'steps': 2947, 'loss/train': 1.5856226682662964} -09/21/2021 00:42:05 - INFO - __main__ - Step 47155: {'lr': 0.00019901959284389617, 'samples': 1508960, 'steps': 2947, 'loss/train': 1.467397689819336} -09/21/2021 00:42:06 - INFO - __main__ - Step 47156: {'lr': 0.00019901959284389617, 'samples': 1508992, 'steps': 2947, 'loss/train': 1.3899039030075073} -09/21/2021 00:42:07 - INFO - __main__ - Step 47157: {'lr': 0.00019901959284389617, 'samples': 1509024, 'steps': 2947, 'loss/train': 1.8836621046066284} -09/21/2021 00:42:08 - INFO - __main__ - Step 47158: {'lr': 0.00019901959284389617, 'samples': 1509056, 'steps': 2947, 'loss/train': 1.470566749572754} -09/21/2021 00:42:08 - INFO - __main__ - Step 47159: {'lr': 0.00019901959284389617, 'samples': 1509088, 'steps': 2947, 'loss/train': 2.8094613552093506} -09/21/2021 00:42:09 - INFO - __main__ - Step 47160: {'lr': 0.00019901959284389617, 'samples': 1509120, 'steps': 2947, 'loss/train': 2.2182626724243164} -09/21/2021 00:42:10 - INFO - __main__ - Step 47161: {'lr': 0.00019901959284389617, 'samples': 1509152, 'steps': 2947, 'loss/train': 1.5187187194824219} -09/21/2021 00:42:11 - INFO - __main__ - Step 47162: {'lr': 0.00019901959284389617, 'samples': 1509184, 'steps': 2947, 'loss/train': 2.473640203475952} -09/21/2021 00:42:11 - INFO - __main__ - Step 47163: {'lr': 0.00019901959284389617, 'samples': 1509216, 'steps': 2947, 'loss/train': 1.8578404188156128} -09/21/2021 00:42:12 - INFO - __main__ - Step 47164: {'lr': 0.00019901959284389617, 'samples': 1509248, 'steps': 2947, 'loss/train': 1.5924111604690552} -09/21/2021 00:42:13 - INFO - __main__ - Step 47165: {'lr': 0.00019901959284389617, 'samples': 1509280, 'steps': 2947, 'loss/train': 0.2829611599445343} -09/21/2021 00:42:14 - INFO - __main__ - Step 47166: {'lr': 0.00019901959284389617, 'samples': 1509312, 'steps': 2947, 'loss/train': 0.11989884078502655} -09/21/2021 00:42:14 - INFO - __main__ - Step 47167: {'lr': 0.00019901959284389617, 'samples': 1509344, 'steps': 2947, 'loss/train': 0.10861940681934357} -09/21/2021 00:42:15 - INFO - __main__ - Step 47168: {'lr': 0.00019901959284389617, 'samples': 1509376, 'steps': 2947, 'loss/train': 0.13272568583488464} -09/21/2021 00:42:16 - INFO - __main__ - Step 47169: {'lr': 0.00019901870160738555, 'samples': 1509408, 'steps': 2948, 'loss/train': 1.0956445932388306} -09/21/2021 00:42:17 - INFO - __main__ - Step 47170: {'lr': 0.00019901870160738555, 'samples': 1509440, 'steps': 2948, 'loss/train': 2.850445032119751} -09/21/2021 00:42:18 - INFO - __main__ - Step 47171: {'lr': 0.00019901870160738555, 'samples': 1509472, 'steps': 2948, 'loss/train': 1.9710313081741333} -09/21/2021 00:42:18 - INFO - __main__ - Step 47172: {'lr': 0.00019901870160738555, 'samples': 1509504, 'steps': 2948, 'loss/train': 2.005557060241699} -09/21/2021 00:42:19 - INFO - __main__ - Step 47173: {'lr': 0.00019901870160738555, 'samples': 1509536, 'steps': 2948, 'loss/train': 1.8836989402770996} -09/21/2021 00:42:20 - INFO - __main__ - Step 47174: {'lr': 0.00019901870160738555, 'samples': 1509568, 'steps': 2948, 'loss/train': 2.5525403022766113} -09/21/2021 00:42:21 - INFO - __main__ - Step 47175: {'lr': 0.00019901870160738555, 'samples': 1509600, 'steps': 2948, 'loss/train': 3.128007411956787} -09/21/2021 00:42:21 - INFO - __main__ - Step 47176: {'lr': 0.00019901870160738555, 'samples': 1509632, 'steps': 2948, 'loss/train': 2.5239856243133545} -09/21/2021 00:42:22 - INFO - __main__ - Step 47177: {'lr': 0.00019901870160738555, 'samples': 1509664, 'steps': 2948, 'loss/train': 2.1635029315948486} -09/21/2021 00:42:23 - INFO - __main__ - Step 47178: {'lr': 0.00019901870160738555, 'samples': 1509696, 'steps': 2948, 'loss/train': 2.056551694869995} -09/21/2021 00:42:24 - INFO - __main__ - Step 47179: {'lr': 0.00019901870160738555, 'samples': 1509728, 'steps': 2948, 'loss/train': 2.364290237426758} -09/21/2021 00:42:25 - INFO - __main__ - Step 47180: {'lr': 0.00019901870160738555, 'samples': 1509760, 'steps': 2948, 'loss/train': 1.7497119903564453} -09/21/2021 00:42:26 - INFO - __main__ - Step 47181: {'lr': 0.00019901870160738555, 'samples': 1509792, 'steps': 2948, 'loss/train': 1.6360418796539307} -09/21/2021 00:42:26 - INFO - __main__ - Step 47182: {'lr': 0.00019901870160738555, 'samples': 1509824, 'steps': 2948, 'loss/train': 2.205120086669922} -09/21/2021 00:42:27 - INFO - __main__ - Step 47183: {'lr': 0.00019901870160738555, 'samples': 1509856, 'steps': 2948, 'loss/train': 1.2903145551681519} -09/21/2021 00:42:28 - INFO - __main__ - Step 47184: {'lr': 0.00019901870160738555, 'samples': 1509888, 'steps': 2948, 'loss/train': 1.6897571086883545} -09/21/2021 00:42:29 - INFO - __main__ - Step 47185: {'lr': 0.00019901780996796822, 'samples': 1509920, 'steps': 2949, 'loss/train': 1.5186288356781006} -09/21/2021 00:42:30 - INFO - __main__ - Step 47186: {'lr': 0.00019901780996796822, 'samples': 1509952, 'steps': 2949, 'loss/train': 0.1949584186077118} -09/21/2021 00:42:30 - INFO - __main__ - Step 47187: {'lr': 0.00019901780996796822, 'samples': 1509984, 'steps': 2949, 'loss/train': 1.9473661184310913} -09/21/2021 00:42:31 - INFO - __main__ - Step 47188: {'lr': 0.00019901780996796822, 'samples': 1510016, 'steps': 2949, 'loss/train': 0.13864222168922424} -09/21/2021 00:42:32 - INFO - __main__ - Step 47189: {'lr': 0.00019901780996796822, 'samples': 1510048, 'steps': 2949, 'loss/train': 0.1499001830816269} -09/21/2021 00:42:33 - INFO - __main__ - Step 47190: {'lr': 0.00019901780996796822, 'samples': 1510080, 'steps': 2949, 'loss/train': 0.1830003708600998} -09/21/2021 00:42:33 - INFO - __main__ - Step 47191: {'lr': 0.00019901780996796822, 'samples': 1510112, 'steps': 2949, 'loss/train': 2.4451334476470947} -09/21/2021 00:42:34 - INFO - __main__ - Step 47192: {'lr': 0.00019901780996796822, 'samples': 1510144, 'steps': 2949, 'loss/train': 0.3464387357234955} -09/21/2021 00:42:35 - INFO - __main__ - Step 47193: {'lr': 0.00019901780996796822, 'samples': 1510176, 'steps': 2949, 'loss/train': 2.9290273189544678} -09/21/2021 00:42:36 - INFO - __main__ - Step 47194: {'lr': 0.00019901780996796822, 'samples': 1510208, 'steps': 2949, 'loss/train': 1.905508279800415} -09/21/2021 00:42:36 - INFO - __main__ - Step 47195: {'lr': 0.00019901780996796822, 'samples': 1510240, 'steps': 2949, 'loss/train': 1.788344383239746} -09/21/2021 00:42:37 - INFO - __main__ - Step 47196: {'lr': 0.00019901780996796822, 'samples': 1510272, 'steps': 2949, 'loss/train': 1.9649357795715332} -09/21/2021 00:42:38 - INFO - __main__ - Step 47197: {'lr': 0.00019901780996796822, 'samples': 1510304, 'steps': 2949, 'loss/train': 2.947392702102661} -09/21/2021 00:42:39 - INFO - __main__ - Step 47198: {'lr': 0.00019901780996796822, 'samples': 1510336, 'steps': 2949, 'loss/train': 1.3718855381011963} -09/21/2021 00:42:39 - INFO - __main__ - Step 47199: {'lr': 0.00019901780996796822, 'samples': 1510368, 'steps': 2949, 'loss/train': 2.16823148727417} -09/21/2021 00:42:40 - INFO - __main__ - Step 47200: {'lr': 0.00019901780996796822, 'samples': 1510400, 'steps': 2949, 'loss/train': 2.017179012298584} -09/21/2021 00:42:41 - INFO - __main__ - Step 47201: {'lr': 0.0001990169179256478, 'samples': 1510432, 'steps': 2950, 'loss/train': 2.5057003498077393} -09/21/2021 00:42:42 - INFO - __main__ - Step 47202: {'lr': 0.0001990169179256478, 'samples': 1510464, 'steps': 2950, 'loss/train': 2.029738664627075} -09/21/2021 00:42:42 - INFO - __main__ - Step 47203: {'lr': 0.0001990169179256478, 'samples': 1510496, 'steps': 2950, 'loss/train': 2.0360047817230225} -09/21/2021 00:42:43 - INFO - __main__ - Step 47204: {'lr': 0.0001990169179256478, 'samples': 1510528, 'steps': 2950, 'loss/train': 2.1416404247283936} -09/21/2021 00:42:44 - INFO - __main__ - Step 47205: {'lr': 0.0001990169179256478, 'samples': 1510560, 'steps': 2950, 'loss/train': 1.630330204963684} -09/21/2021 00:42:45 - INFO - __main__ - Step 47206: {'lr': 0.0001990169179256478, 'samples': 1510592, 'steps': 2950, 'loss/train': 0.9925554990768433} -09/21/2021 00:42:45 - INFO - __main__ - Step 47207: {'lr': 0.0001990169179256478, 'samples': 1510624, 'steps': 2950, 'loss/train': 2.3816936016082764} -09/21/2021 00:42:46 - INFO - __main__ - Step 47208: {'lr': 0.0001990169179256478, 'samples': 1510656, 'steps': 2950, 'loss/train': 1.4450606107711792} -09/21/2021 00:42:47 - INFO - __main__ - Step 47209: {'lr': 0.0001990169179256478, 'samples': 1510688, 'steps': 2950, 'loss/train': 1.6544541120529175} -09/21/2021 00:42:48 - INFO - __main__ - Step 47210: {'lr': 0.0001990169179256478, 'samples': 1510720, 'steps': 2950, 'loss/train': 1.8987666368484497} -09/21/2021 00:42:49 - INFO - __main__ - Step 47211: {'lr': 0.0001990169179256478, 'samples': 1510752, 'steps': 2950, 'loss/train': 2.0677077770233154} -09/21/2021 00:42:50 - INFO - __main__ - Step 47212: {'lr': 0.0001990169179256478, 'samples': 1510784, 'steps': 2950, 'loss/train': 1.985939621925354} -09/21/2021 00:42:51 - INFO - __main__ - Step 47213: {'lr': 0.0001990169179256478, 'samples': 1510816, 'steps': 2950, 'loss/train': 1.4974499940872192} -09/21/2021 00:42:51 - INFO - __main__ - Step 47214: {'lr': 0.0001990169179256478, 'samples': 1510848, 'steps': 2950, 'loss/train': 1.577189564704895} -09/21/2021 00:42:52 - INFO - __main__ - Step 47215: {'lr': 0.0001990169179256478, 'samples': 1510880, 'steps': 2950, 'loss/train': 2.595546007156372} -09/21/2021 00:42:53 - INFO - __main__ - Step 47216: {'lr': 0.0001990169179256478, 'samples': 1510912, 'steps': 2950, 'loss/train': 2.6584503650665283} -09/21/2021 00:42:54 - INFO - __main__ - Step 47217: {'lr': 0.00019901602548042796, 'samples': 1510944, 'steps': 2951, 'loss/train': 1.7644460201263428} -09/21/2021 00:42:54 - INFO - __main__ - Step 47218: {'lr': 0.00019901602548042796, 'samples': 1510976, 'steps': 2951, 'loss/train': 2.5862627029418945} -09/21/2021 00:42:55 - INFO - __main__ - Step 47219: {'lr': 0.00019901602548042796, 'samples': 1511008, 'steps': 2951, 'loss/train': 2.1666715145111084} -09/21/2021 00:42:56 - INFO - __main__ - Step 47220: {'lr': 0.00019901602548042796, 'samples': 1511040, 'steps': 2951, 'loss/train': 1.8261868953704834} -09/21/2021 00:42:57 - INFO - __main__ - Step 47221: {'lr': 0.00019901602548042796, 'samples': 1511072, 'steps': 2951, 'loss/train': 1.7245327234268188} -09/21/2021 00:42:57 - INFO - __main__ - Step 47222: {'lr': 0.00019901602548042796, 'samples': 1511104, 'steps': 2951, 'loss/train': 1.7344293594360352} -09/21/2021 00:42:58 - INFO - __main__ - Step 47223: {'lr': 0.00019901602548042796, 'samples': 1511136, 'steps': 2951, 'loss/train': 2.0154809951782227} -09/21/2021 00:42:59 - INFO - __main__ - Step 47224: {'lr': 0.00019901602548042796, 'samples': 1511168, 'steps': 2951, 'loss/train': 1.834092378616333} -09/21/2021 00:43:00 - INFO - __main__ - Step 47225: {'lr': 0.00019901602548042796, 'samples': 1511200, 'steps': 2951, 'loss/train': 2.6817617416381836} -09/21/2021 00:43:00 - INFO - __main__ - Step 47226: {'lr': 0.00019901602548042796, 'samples': 1511232, 'steps': 2951, 'loss/train': 2.4643969535827637} -09/21/2021 00:43:01 - INFO - __main__ - Step 47227: {'lr': 0.00019901602548042796, 'samples': 1511264, 'steps': 2951, 'loss/train': 1.6717379093170166} -09/21/2021 00:43:02 - INFO - __main__ - Step 47228: {'lr': 0.00019901602548042796, 'samples': 1511296, 'steps': 2951, 'loss/train': 3.4402270317077637} -09/21/2021 00:43:03 - INFO - __main__ - Step 47229: {'lr': 0.00019901602548042796, 'samples': 1511328, 'steps': 2951, 'loss/train': 2.2359747886657715} -09/21/2021 00:43:03 - INFO - __main__ - Step 47230: {'lr': 0.00019901602548042796, 'samples': 1511360, 'steps': 2951, 'loss/train': 2.586732864379883} -09/21/2021 00:43:04 - INFO - __main__ - Step 47231: {'lr': 0.00019901602548042796, 'samples': 1511392, 'steps': 2951, 'loss/train': 1.6837869882583618} -09/21/2021 00:43:05 - INFO - __main__ - Step 47232: {'lr': 0.00019901602548042796, 'samples': 1511424, 'steps': 2951, 'loss/train': 1.9502394199371338} -09/21/2021 00:43:06 - INFO - __main__ - Step 47233: {'lr': 0.00019901513263231223, 'samples': 1511456, 'steps': 2952, 'loss/train': 0.4546533524990082} -09/21/2021 00:43:07 - INFO - __main__ - Step 47234: {'lr': 0.00019901513263231223, 'samples': 1511488, 'steps': 2952, 'loss/train': 1.654339075088501} -09/21/2021 00:43:07 - INFO - __main__ - Step 47235: {'lr': 0.00019901513263231223, 'samples': 1511520, 'steps': 2952, 'loss/train': 1.3739408254623413} -09/21/2021 00:43:08 - INFO - __main__ - Step 47236: {'lr': 0.00019901513263231223, 'samples': 1511552, 'steps': 2952, 'loss/train': 2.780060052871704} -09/21/2021 00:43:09 - INFO - __main__ - Step 47237: {'lr': 0.00019901513263231223, 'samples': 1511584, 'steps': 2952, 'loss/train': 1.9525495767593384} -09/21/2021 00:43:10 - INFO - __main__ - Step 47238: {'lr': 0.00019901513263231223, 'samples': 1511616, 'steps': 2952, 'loss/train': 1.848156213760376} -09/21/2021 00:43:10 - INFO - __main__ - Step 47239: {'lr': 0.00019901513263231223, 'samples': 1511648, 'steps': 2952, 'loss/train': 2.784449815750122} -09/21/2021 00:43:11 - INFO - __main__ - Step 47240: {'lr': 0.00019901513263231223, 'samples': 1511680, 'steps': 2952, 'loss/train': 2.303420305252075} -09/21/2021 00:43:12 - INFO - __main__ - Step 47241: {'lr': 0.00019901513263231223, 'samples': 1511712, 'steps': 2952, 'loss/train': 1.9718655347824097} -09/21/2021 00:43:13 - INFO - __main__ - Step 47242: {'lr': 0.00019901513263231223, 'samples': 1511744, 'steps': 2952, 'loss/train': 2.6304471492767334} -09/21/2021 00:43:14 - INFO - __main__ - Step 47243: {'lr': 0.00019901513263231223, 'samples': 1511776, 'steps': 2952, 'loss/train': 1.6063681840896606} -09/21/2021 00:43:15 - INFO - __main__ - Step 47244: {'lr': 0.00019901513263231223, 'samples': 1511808, 'steps': 2952, 'loss/train': 2.5254464149475098} -09/21/2021 00:43:15 - INFO - __main__ - Step 47245: {'lr': 0.00019901513263231223, 'samples': 1511840, 'steps': 2952, 'loss/train': 2.3465025424957275} -09/21/2021 00:43:16 - INFO - __main__ - Step 47246: {'lr': 0.00019901513263231223, 'samples': 1511872, 'steps': 2952, 'loss/train': 1.70975923538208} -09/21/2021 00:43:17 - INFO - __main__ - Step 47247: {'lr': 0.00019901513263231223, 'samples': 1511904, 'steps': 2952, 'loss/train': 2.63116455078125} -09/21/2021 00:43:18 - INFO - __main__ - Step 47248: {'lr': 0.00019901513263231223, 'samples': 1511936, 'steps': 2952, 'loss/train': 1.786953091621399} -09/21/2021 00:43:18 - INFO - __main__ - Step 47249: {'lr': 0.00019901423938130437, 'samples': 1511968, 'steps': 2953, 'loss/train': 3.2384488582611084} -09/21/2021 00:43:19 - INFO - __main__ - Step 47250: {'lr': 0.00019901423938130437, 'samples': 1512000, 'steps': 2953, 'loss/train': 3.572550058364868} -09/21/2021 00:43:20 - INFO - __main__ - Step 47251: {'lr': 0.00019901423938130437, 'samples': 1512032, 'steps': 2953, 'loss/train': 2.6126129627227783} -09/21/2021 00:43:21 - INFO - __main__ - Step 47252: {'lr': 0.00019901423938130437, 'samples': 1512064, 'steps': 2953, 'loss/train': 1.5652973651885986} -09/21/2021 00:43:21 - INFO - __main__ - Step 47253: {'lr': 0.00019901423938130437, 'samples': 1512096, 'steps': 2953, 'loss/train': 1.1443161964416504} -09/21/2021 00:43:22 - INFO - __main__ - Step 47254: {'lr': 0.00019901423938130437, 'samples': 1512128, 'steps': 2953, 'loss/train': 1.6137923002243042} -09/21/2021 00:43:23 - INFO - __main__ - Step 47255: {'lr': 0.00019901423938130437, 'samples': 1512160, 'steps': 2953, 'loss/train': 1.5056641101837158} -09/21/2021 00:43:24 - INFO - __main__ - Step 47256: {'lr': 0.00019901423938130437, 'samples': 1512192, 'steps': 2953, 'loss/train': 1.9331244230270386} -09/21/2021 00:43:24 - INFO - __main__ - Step 47257: {'lr': 0.00019901423938130437, 'samples': 1512224, 'steps': 2953, 'loss/train': 2.2425193786621094} -09/21/2021 00:43:25 - INFO - __main__ - Step 47258: {'lr': 0.00019901423938130437, 'samples': 1512256, 'steps': 2953, 'loss/train': 1.6132655143737793} -09/21/2021 00:43:26 - INFO - __main__ - Step 47259: {'lr': 0.00019901423938130437, 'samples': 1512288, 'steps': 2953, 'loss/train': 1.7745615243911743} -09/21/2021 00:43:27 - INFO - __main__ - Step 47260: {'lr': 0.00019901423938130437, 'samples': 1512320, 'steps': 2953, 'loss/train': 1.5058627128601074} -09/21/2021 00:43:27 - INFO - __main__ - Step 47261: {'lr': 0.00019901423938130437, 'samples': 1512352, 'steps': 2953, 'loss/train': 2.229902505874634} -09/21/2021 00:43:28 - INFO - __main__ - Step 47262: {'lr': 0.00019901423938130437, 'samples': 1512384, 'steps': 2953, 'loss/train': 1.6349011659622192} -09/21/2021 00:43:29 - INFO - __main__ - Step 47263: {'lr': 0.00019901423938130437, 'samples': 1512416, 'steps': 2953, 'loss/train': 2.14534592628479} -09/21/2021 00:43:30 - INFO - __main__ - Step 47264: {'lr': 0.00019901423938130437, 'samples': 1512448, 'steps': 2953, 'loss/train': 2.993485450744629} -09/21/2021 00:43:31 - INFO - __main__ - Step 47265: {'lr': 0.00019901334572740794, 'samples': 1512480, 'steps': 2954, 'loss/train': 2.350803852081299} -09/21/2021 00:43:31 - INFO - __main__ - Step 47266: {'lr': 0.00019901334572740794, 'samples': 1512512, 'steps': 2954, 'loss/train': 2.001260280609131} -09/21/2021 00:43:32 - INFO - __main__ - Step 47267: {'lr': 0.00019901334572740794, 'samples': 1512544, 'steps': 2954, 'loss/train': 1.3876789808273315} -09/21/2021 00:43:33 - INFO - __main__ - Step 47268: {'lr': 0.00019901334572740794, 'samples': 1512576, 'steps': 2954, 'loss/train': 1.7027543783187866} -09/21/2021 00:43:34 - INFO - __main__ - Step 47269: {'lr': 0.00019901334572740794, 'samples': 1512608, 'steps': 2954, 'loss/train': 2.0432426929473877} -09/21/2021 00:43:34 - INFO - __main__ - Step 47270: {'lr': 0.00019901334572740794, 'samples': 1512640, 'steps': 2954, 'loss/train': 2.0140621662139893} -09/21/2021 00:43:35 - INFO - __main__ - Step 47271: {'lr': 0.00019901334572740794, 'samples': 1512672, 'steps': 2954, 'loss/train': 2.0212349891662598} -09/21/2021 00:43:37 - INFO - __main__ - Step 47272: {'lr': 0.00019901334572740794, 'samples': 1512704, 'steps': 2954, 'loss/train': 1.9268863201141357} -09/21/2021 00:43:37 - INFO - __main__ - Step 47273: {'lr': 0.00019901334572740794, 'samples': 1512736, 'steps': 2954, 'loss/train': 2.5246543884277344} -09/21/2021 00:43:38 - INFO - __main__ - Step 47274: {'lr': 0.00019901334572740794, 'samples': 1512768, 'steps': 2954, 'loss/train': 2.5513360500335693} -09/21/2021 00:43:39 - INFO - __main__ - Step 47275: {'lr': 0.00019901334572740794, 'samples': 1512800, 'steps': 2954, 'loss/train': 1.6029541492462158} -09/21/2021 00:43:40 - INFO - __main__ - Step 47276: {'lr': 0.00019901334572740794, 'samples': 1512832, 'steps': 2954, 'loss/train': 2.2609848976135254} -09/21/2021 00:43:40 - INFO - __main__ - Step 47277: {'lr': 0.00019901334572740794, 'samples': 1512864, 'steps': 2954, 'loss/train': 1.6357805728912354} -09/21/2021 00:43:41 - INFO - __main__ - Step 47278: {'lr': 0.00019901334572740794, 'samples': 1512896, 'steps': 2954, 'loss/train': 1.7656093835830688} -09/21/2021 00:43:42 - INFO - __main__ - Step 47279: {'lr': 0.00019901334572740794, 'samples': 1512928, 'steps': 2954, 'loss/train': 1.6959187984466553} -09/21/2021 00:43:43 - INFO - __main__ - Step 47280: {'lr': 0.00019901334572740794, 'samples': 1512960, 'steps': 2954, 'loss/train': 3.2444567680358887} -09/21/2021 00:43:44 - INFO - __main__ - Step 47281: {'lr': 0.00019901245167062656, 'samples': 1512992, 'steps': 2955, 'loss/train': 2.505533456802368} -09/21/2021 00:43:44 - INFO - __main__ - Step 47282: {'lr': 0.00019901245167062656, 'samples': 1513024, 'steps': 2955, 'loss/train': 1.9155653715133667} -09/21/2021 00:43:45 - INFO - __main__ - Step 47283: {'lr': 0.00019901245167062656, 'samples': 1513056, 'steps': 2955, 'loss/train': 1.9170749187469482} -09/21/2021 00:43:46 - INFO - __main__ - Step 47284: {'lr': 0.00019901245167062656, 'samples': 1513088, 'steps': 2955, 'loss/train': 2.093660354614258} -09/21/2021 00:43:47 - INFO - __main__ - Step 47285: {'lr': 0.00019901245167062656, 'samples': 1513120, 'steps': 2955, 'loss/train': 2.015974521636963} -09/21/2021 00:43:47 - INFO - __main__ - Step 47286: {'lr': 0.00019901245167062656, 'samples': 1513152, 'steps': 2955, 'loss/train': 1.5235055685043335} -09/21/2021 00:43:48 - INFO - __main__ - Step 47287: {'lr': 0.00019901245167062656, 'samples': 1513184, 'steps': 2955, 'loss/train': 1.8767614364624023} -09/21/2021 00:43:49 - INFO - __main__ - Step 47288: {'lr': 0.00019901245167062656, 'samples': 1513216, 'steps': 2955, 'loss/train': 2.751702308654785} -09/21/2021 00:43:50 - INFO - __main__ - Step 47289: {'lr': 0.00019901245167062656, 'samples': 1513248, 'steps': 2955, 'loss/train': 2.8395140171051025} -09/21/2021 00:43:50 - INFO - __main__ - Step 47290: {'lr': 0.00019901245167062656, 'samples': 1513280, 'steps': 2955, 'loss/train': 1.7987862825393677} -09/21/2021 00:43:51 - INFO - __main__ - Step 47291: {'lr': 0.00019901245167062656, 'samples': 1513312, 'steps': 2955, 'loss/train': 2.706139087677002} -09/21/2021 00:43:52 - INFO - __main__ - Step 47292: {'lr': 0.00019901245167062656, 'samples': 1513344, 'steps': 2955, 'loss/train': 0.7977263331413269} -09/21/2021 00:43:53 - INFO - __main__ - Step 47293: {'lr': 0.00019901245167062656, 'samples': 1513376, 'steps': 2955, 'loss/train': 2.5522055625915527} -09/21/2021 00:43:53 - INFO - __main__ - Step 47294: {'lr': 0.00019901245167062656, 'samples': 1513408, 'steps': 2955, 'loss/train': 1.758811116218567} -09/21/2021 00:43:54 - INFO - __main__ - Step 47295: {'lr': 0.00019901245167062656, 'samples': 1513440, 'steps': 2955, 'loss/train': 1.9586994647979736} -09/21/2021 00:43:55 - INFO - __main__ - Step 47296: {'lr': 0.00019901245167062656, 'samples': 1513472, 'steps': 2955, 'loss/train': 0.15939445793628693} -09/21/2021 00:43:56 - INFO - __main__ - Step 47297: {'lr': 0.00019901155721096394, 'samples': 1513504, 'steps': 2956, 'loss/train': 0.16857488453388214} -09/21/2021 00:43:56 - INFO - __main__ - Step 47298: {'lr': 0.00019901155721096394, 'samples': 1513536, 'steps': 2956, 'loss/train': 0.21420514583587646} -09/21/2021 00:43:57 - INFO - __main__ - Step 47299: {'lr': 0.00019901155721096394, 'samples': 1513568, 'steps': 2956, 'loss/train': 0.6881736516952515} -09/21/2021 00:43:58 - INFO - __main__ - Step 47300: {'lr': 0.00019901155721096394, 'samples': 1513600, 'steps': 2956, 'loss/train': 3.111623764038086} -09/21/2021 00:43:59 - INFO - __main__ - Step 47301: {'lr': 0.00019901155721096394, 'samples': 1513632, 'steps': 2956, 'loss/train': 2.3630526065826416} -09/21/2021 00:44:00 - INFO - __main__ - Step 47302: {'lr': 0.00019901155721096394, 'samples': 1513664, 'steps': 2956, 'loss/train': 1.8829426765441895} -09/21/2021 00:44:01 - INFO - __main__ - Step 47303: {'lr': 0.00019901155721096394, 'samples': 1513696, 'steps': 2956, 'loss/train': 1.964246153831482} -09/21/2021 00:44:02 - INFO - __main__ - Step 47304: {'lr': 0.00019901155721096394, 'samples': 1513728, 'steps': 2956, 'loss/train': 1.9015462398529053} -09/21/2021 00:44:02 - INFO - __main__ - Step 47305: {'lr': 0.00019901155721096394, 'samples': 1513760, 'steps': 2956, 'loss/train': 1.2446553707122803} -09/21/2021 00:44:03 - INFO - __main__ - Step 47306: {'lr': 0.00019901155721096394, 'samples': 1513792, 'steps': 2956, 'loss/train': 2.836879253387451} -09/21/2021 00:44:04 - INFO - __main__ - Step 47307: {'lr': 0.00019901155721096394, 'samples': 1513824, 'steps': 2956, 'loss/train': 5.183773517608643} -09/21/2021 00:44:05 - INFO - __main__ - Step 47308: {'lr': 0.00019901155721096394, 'samples': 1513856, 'steps': 2956, 'loss/train': 1.5696823596954346} -09/21/2021 00:44:05 - INFO - __main__ - Step 47309: {'lr': 0.00019901155721096394, 'samples': 1513888, 'steps': 2956, 'loss/train': 2.447193145751953} -09/21/2021 00:44:06 - INFO - __main__ - Step 47310: {'lr': 0.00019901155721096394, 'samples': 1513920, 'steps': 2956, 'loss/train': 2.3978543281555176} -09/21/2021 00:44:07 - INFO - __main__ - Step 47311: {'lr': 0.00019901155721096394, 'samples': 1513952, 'steps': 2956, 'loss/train': 1.5156394243240356} -09/21/2021 00:44:08 - INFO - __main__ - Step 47312: {'lr': 0.00019901155721096394, 'samples': 1513984, 'steps': 2956, 'loss/train': 2.267864942550659} -09/21/2021 00:44:08 - INFO - __main__ - Step 47313: {'lr': 0.00019901066234842367, 'samples': 1514016, 'steps': 2957, 'loss/train': 1.1310515403747559} -09/21/2021 00:44:09 - INFO - __main__ - Step 47314: {'lr': 0.00019901066234842367, 'samples': 1514048, 'steps': 2957, 'loss/train': 1.8805774450302124} -09/21/2021 00:44:10 - INFO - __main__ - Step 47315: {'lr': 0.00019901066234842367, 'samples': 1514080, 'steps': 2957, 'loss/train': 2.272730588912964} -09/21/2021 00:44:11 - INFO - __main__ - Step 47316: {'lr': 0.00019901066234842367, 'samples': 1514112, 'steps': 2957, 'loss/train': 0.23395316302776337} -09/21/2021 00:44:11 - INFO - __main__ - Step 47317: {'lr': 0.00019901066234842367, 'samples': 1514144, 'steps': 2957, 'loss/train': 1.8501360416412354} -09/21/2021 00:44:12 - INFO - __main__ - Step 47318: {'lr': 0.00019901066234842367, 'samples': 1514176, 'steps': 2957, 'loss/train': 1.7367241382598877} -09/21/2021 00:44:13 - INFO - __main__ - Step 47319: {'lr': 0.00019901066234842367, 'samples': 1514208, 'steps': 2957, 'loss/train': 2.831197738647461} -09/21/2021 00:44:14 - INFO - __main__ - Step 47320: {'lr': 0.00019901066234842367, 'samples': 1514240, 'steps': 2957, 'loss/train': 1.7253355979919434} -09/21/2021 00:44:14 - INFO - __main__ - Step 47321: {'lr': 0.00019901066234842367, 'samples': 1514272, 'steps': 2957, 'loss/train': 1.8883719444274902} -09/21/2021 00:44:15 - INFO - __main__ - Step 47322: {'lr': 0.00019901066234842367, 'samples': 1514304, 'steps': 2957, 'loss/train': 2.549250841140747} -09/21/2021 00:44:16 - INFO - __main__ - Step 47323: {'lr': 0.00019901066234842367, 'samples': 1514336, 'steps': 2957, 'loss/train': 2.706815004348755} -09/21/2021 00:44:17 - INFO - __main__ - Step 47324: {'lr': 0.00019901066234842367, 'samples': 1514368, 'steps': 2957, 'loss/train': 2.3056821823120117} -09/21/2021 00:44:17 - INFO - __main__ - Step 47325: {'lr': 0.00019901066234842367, 'samples': 1514400, 'steps': 2957, 'loss/train': 2.848412275314331} -09/21/2021 00:44:18 - INFO - __main__ - Step 47326: {'lr': 0.00019901066234842367, 'samples': 1514432, 'steps': 2957, 'loss/train': 1.8718258142471313} -09/21/2021 00:44:19 - INFO - __main__ - Step 47327: {'lr': 0.00019901066234842367, 'samples': 1514464, 'steps': 2957, 'loss/train': 1.814307689666748} -09/21/2021 00:44:20 - INFO - __main__ - Step 47328: {'lr': 0.00019901066234842367, 'samples': 1514496, 'steps': 2957, 'loss/train': 1.459342360496521} -09/21/2021 00:44:21 - INFO - __main__ - Step 47329: {'lr': 0.00019900976708300938, 'samples': 1514528, 'steps': 2958, 'loss/train': 2.118506669998169} -09/21/2021 00:44:21 - INFO - __main__ - Step 47330: {'lr': 0.00019900976708300938, 'samples': 1514560, 'steps': 2958, 'loss/train': 1.6086615324020386} -09/21/2021 00:44:22 - INFO - __main__ - Step 47331: {'lr': 0.00019900976708300938, 'samples': 1514592, 'steps': 2958, 'loss/train': 2.004303216934204} -09/21/2021 00:44:23 - INFO - __main__ - Step 47332: {'lr': 0.00019900976708300938, 'samples': 1514624, 'steps': 2958, 'loss/train': 1.0389958620071411} -09/21/2021 00:44:24 - INFO - __main__ - Step 47333: {'lr': 0.00019900976708300938, 'samples': 1514656, 'steps': 2958, 'loss/train': 0.23499220609664917} -09/21/2021 00:44:25 - INFO - __main__ - Step 47334: {'lr': 0.00019900976708300938, 'samples': 1514688, 'steps': 2958, 'loss/train': 1.8469574451446533} -09/21/2021 00:44:26 - INFO - __main__ - Step 47335: {'lr': 0.00019900976708300938, 'samples': 1514720, 'steps': 2958, 'loss/train': 2.3980536460876465} -09/21/2021 00:44:26 - INFO - __main__ - Step 47336: {'lr': 0.00019900976708300938, 'samples': 1514752, 'steps': 2958, 'loss/train': 2.2190184593200684} -09/21/2021 00:44:27 - INFO - __main__ - Step 47337: {'lr': 0.00019900976708300938, 'samples': 1514784, 'steps': 2958, 'loss/train': 0.6810067296028137} -09/21/2021 00:44:28 - INFO - __main__ - Step 47338: {'lr': 0.00019900976708300938, 'samples': 1514816, 'steps': 2958, 'loss/train': 1.4806785583496094} -09/21/2021 00:44:29 - INFO - __main__ - Step 47339: {'lr': 0.00019900976708300938, 'samples': 1514848, 'steps': 2958, 'loss/train': 2.1241812705993652} -09/21/2021 00:44:29 - INFO - __main__ - Step 47340: {'lr': 0.00019900976708300938, 'samples': 1514880, 'steps': 2958, 'loss/train': 1.9435830116271973} -09/21/2021 00:44:30 - INFO - __main__ - Step 47341: {'lr': 0.00019900976708300938, 'samples': 1514912, 'steps': 2958, 'loss/train': 2.788588047027588} -09/21/2021 00:44:31 - INFO - __main__ - Step 47342: {'lr': 0.00019900976708300938, 'samples': 1514944, 'steps': 2958, 'loss/train': 1.9042019844055176} -09/21/2021 00:44:32 - INFO - __main__ - Step 47343: {'lr': 0.00019900976708300938, 'samples': 1514976, 'steps': 2958, 'loss/train': 1.2679849863052368} -09/21/2021 00:44:32 - INFO - __main__ - Step 47344: {'lr': 0.00019900976708300938, 'samples': 1515008, 'steps': 2958, 'loss/train': 2.1264970302581787} -09/21/2021 00:44:33 - INFO - __main__ - Step 47345: {'lr': 0.00019900887141472472, 'samples': 1515040, 'steps': 2959, 'loss/train': 2.613037109375} -09/21/2021 00:44:34 - INFO - __main__ - Step 47346: {'lr': 0.00019900887141472472, 'samples': 1515072, 'steps': 2959, 'loss/train': 2.0608742237091064} -09/21/2021 00:44:35 - INFO - __main__ - Step 47347: {'lr': 0.00019900887141472472, 'samples': 1515104, 'steps': 2959, 'loss/train': 2.873811721801758} -09/21/2021 00:44:36 - INFO - __main__ - Step 47348: {'lr': 0.00019900887141472472, 'samples': 1515136, 'steps': 2959, 'loss/train': 1.810903787612915} -09/21/2021 00:44:36 - INFO - __main__ - Step 47349: {'lr': 0.00019900887141472472, 'samples': 1515168, 'steps': 2959, 'loss/train': 2.314885139465332} -09/21/2021 00:44:37 - INFO - __main__ - Step 47350: {'lr': 0.00019900887141472472, 'samples': 1515200, 'steps': 2959, 'loss/train': 2.3126306533813477} -09/21/2021 00:44:38 - INFO - __main__ - Step 47351: {'lr': 0.00019900887141472472, 'samples': 1515232, 'steps': 2959, 'loss/train': 1.7723487615585327} -09/21/2021 00:44:39 - INFO - __main__ - Step 47352: {'lr': 0.00019900887141472472, 'samples': 1515264, 'steps': 2959, 'loss/train': 2.10868239402771} -09/21/2021 00:44:39 - INFO - __main__ - Step 47353: {'lr': 0.00019900887141472472, 'samples': 1515296, 'steps': 2959, 'loss/train': 2.2685587406158447} -09/21/2021 00:44:40 - INFO - __main__ - Step 47354: {'lr': 0.00019900887141472472, 'samples': 1515328, 'steps': 2959, 'loss/train': 1.2307206392288208} -09/21/2021 00:44:41 - INFO - __main__ - Step 47355: {'lr': 0.00019900887141472472, 'samples': 1515360, 'steps': 2959, 'loss/train': 2.470241069793701} -09/21/2021 00:44:42 - INFO - __main__ - Step 47356: {'lr': 0.00019900887141472472, 'samples': 1515392, 'steps': 2959, 'loss/train': 0.24761585891246796} -09/21/2021 00:44:42 - INFO - __main__ - Step 47357: {'lr': 0.00019900887141472472, 'samples': 1515424, 'steps': 2959, 'loss/train': 0.18455269932746887} -09/21/2021 00:44:43 - INFO - __main__ - Step 47358: {'lr': 0.00019900887141472472, 'samples': 1515456, 'steps': 2959, 'loss/train': 0.5372511744499207} -09/21/2021 00:44:44 - INFO - __main__ - Step 47359: {'lr': 0.00019900887141472472, 'samples': 1515488, 'steps': 2959, 'loss/train': 1.0865769386291504} -09/21/2021 00:44:45 - INFO - __main__ - Step 47360: {'lr': 0.00019900887141472472, 'samples': 1515520, 'steps': 2959, 'loss/train': 1.346346378326416} -09/21/2021 00:44:45 - INFO - __main__ - Step 47361: {'lr': 0.0001990079753435734, 'samples': 1515552, 'steps': 2960, 'loss/train': 2.8556196689605713} -09/21/2021 00:44:46 - INFO - __main__ - Step 47362: {'lr': 0.0001990079753435734, 'samples': 1515584, 'steps': 2960, 'loss/train': 2.05595064163208} -09/21/2021 00:44:47 - INFO - __main__ - Step 47363: {'lr': 0.0001990079753435734, 'samples': 1515616, 'steps': 2960, 'loss/train': 2.317718744277954} -09/21/2021 00:44:48 - INFO - __main__ - Step 47364: {'lr': 0.0001990079753435734, 'samples': 1515648, 'steps': 2960, 'loss/train': 2.5351932048797607} -09/21/2021 00:44:49 - INFO - __main__ - Step 47365: {'lr': 0.0001990079753435734, 'samples': 1515680, 'steps': 2960, 'loss/train': 2.074495315551758} -09/21/2021 00:44:50 - INFO - __main__ - Step 47366: {'lr': 0.0001990079753435734, 'samples': 1515712, 'steps': 2960, 'loss/train': 0.9007338881492615} -09/21/2021 00:44:50 - INFO - __main__ - Step 47367: {'lr': 0.0001990079753435734, 'samples': 1515744, 'steps': 2960, 'loss/train': 2.0612645149230957} -09/21/2021 00:44:51 - INFO - __main__ - Step 47368: {'lr': 0.0001990079753435734, 'samples': 1515776, 'steps': 2960, 'loss/train': 2.085789918899536} -09/21/2021 00:44:52 - INFO - __main__ - Step 47369: {'lr': 0.0001990079753435734, 'samples': 1515808, 'steps': 2960, 'loss/train': 1.3979640007019043} -09/21/2021 00:44:53 - INFO - __main__ - Step 47370: {'lr': 0.0001990079753435734, 'samples': 1515840, 'steps': 2960, 'loss/train': 2.7677371501922607} -09/21/2021 00:44:53 - INFO - __main__ - Step 47371: {'lr': 0.0001990079753435734, 'samples': 1515872, 'steps': 2960, 'loss/train': 1.3867950439453125} -09/21/2021 00:44:54 - INFO - __main__ - Step 47372: {'lr': 0.0001990079753435734, 'samples': 1515904, 'steps': 2960, 'loss/train': 1.6867402791976929} -09/21/2021 00:44:55 - INFO - __main__ - Step 47373: {'lr': 0.0001990079753435734, 'samples': 1515936, 'steps': 2960, 'loss/train': 3.189445734024048} -09/21/2021 00:44:56 - INFO - __main__ - Step 47374: {'lr': 0.0001990079753435734, 'samples': 1515968, 'steps': 2960, 'loss/train': 2.560595989227295} -09/21/2021 00:44:57 - INFO - __main__ - Step 47375: {'lr': 0.0001990079753435734, 'samples': 1516000, 'steps': 2960, 'loss/train': 1.8573014736175537} -09/21/2021 00:44:57 - INFO - __main__ - Step 47376: {'lr': 0.0001990079753435734, 'samples': 1516032, 'steps': 2960, 'loss/train': 1.5654215812683105} -09/21/2021 00:44:58 - INFO - __main__ - Step 47377: {'lr': 0.00019900707886955896, 'samples': 1516064, 'steps': 2961, 'loss/train': 1.2208226919174194} -09/21/2021 00:44:59 - INFO - __main__ - Step 47378: {'lr': 0.00019900707886955896, 'samples': 1516096, 'steps': 2961, 'loss/train': 2.380617380142212} -09/21/2021 00:45:00 - INFO - __main__ - Step 47379: {'lr': 0.00019900707886955896, 'samples': 1516128, 'steps': 2961, 'loss/train': 2.1510791778564453} -09/21/2021 00:45:00 - INFO - __main__ - Step 47380: {'lr': 0.00019900707886955896, 'samples': 1516160, 'steps': 2961, 'loss/train': 0.37279313802719116} -09/21/2021 00:45:01 - INFO - __main__ - Step 47381: {'lr': 0.00019900707886955896, 'samples': 1516192, 'steps': 2961, 'loss/train': 1.8291186094284058} -09/21/2021 00:45:02 - INFO - __main__ - Step 47382: {'lr': 0.00019900707886955896, 'samples': 1516224, 'steps': 2961, 'loss/train': 2.503829002380371} -09/21/2021 00:45:03 - INFO - __main__ - Step 47383: {'lr': 0.00019900707886955896, 'samples': 1516256, 'steps': 2961, 'loss/train': 1.200003743171692} -09/21/2021 00:45:03 - INFO - __main__ - Step 47384: {'lr': 0.00019900707886955896, 'samples': 1516288, 'steps': 2961, 'loss/train': 1.5429457426071167} -09/21/2021 00:45:04 - INFO - __main__ - Step 47385: {'lr': 0.00019900707886955896, 'samples': 1516320, 'steps': 2961, 'loss/train': 1.5347487926483154} -09/21/2021 00:45:05 - INFO - __main__ - Step 47386: {'lr': 0.00019900707886955896, 'samples': 1516352, 'steps': 2961, 'loss/train': 1.4148699045181274} -09/21/2021 00:45:06 - INFO - __main__ - Step 47387: {'lr': 0.00019900707886955896, 'samples': 1516384, 'steps': 2961, 'loss/train': 1.5916717052459717} -09/21/2021 00:45:06 - INFO - __main__ - Step 47388: {'lr': 0.00019900707886955896, 'samples': 1516416, 'steps': 2961, 'loss/train': 1.6264278888702393} -09/21/2021 00:45:07 - INFO - __main__ - Step 47389: {'lr': 0.00019900707886955896, 'samples': 1516448, 'steps': 2961, 'loss/train': 1.5818811655044556} -09/21/2021 00:45:08 - INFO - __main__ - Step 47390: {'lr': 0.00019900707886955896, 'samples': 1516480, 'steps': 2961, 'loss/train': 2.134915828704834} -09/21/2021 00:45:09 - INFO - __main__ - Step 47391: {'lr': 0.00019900707886955896, 'samples': 1516512, 'steps': 2961, 'loss/train': 1.382529616355896} -09/21/2021 00:45:09 - INFO - __main__ - Step 47392: {'lr': 0.00019900707886955896, 'samples': 1516544, 'steps': 2961, 'loss/train': 0.5097174644470215} -09/21/2021 00:45:10 - INFO - __main__ - Step 47393: {'lr': 0.00019900618199268513, 'samples': 1516576, 'steps': 2962, 'loss/train': 0.7792540788650513} -09/21/2021 00:45:11 - INFO - __main__ - Step 47394: {'lr': 0.00019900618199268513, 'samples': 1516608, 'steps': 2962, 'loss/train': 1.6933165788650513} -09/21/2021 00:45:12 - INFO - __main__ - Step 47395: {'lr': 0.00019900618199268513, 'samples': 1516640, 'steps': 2962, 'loss/train': 2.4568984508514404} -09/21/2021 00:45:13 - INFO - __main__ - Step 47396: {'lr': 0.00019900618199268513, 'samples': 1516672, 'steps': 2962, 'loss/train': 1.8931232690811157} -09/21/2021 00:45:14 - INFO - __main__ - Step 47397: {'lr': 0.00019900618199268513, 'samples': 1516704, 'steps': 2962, 'loss/train': 0.3669250011444092} -09/21/2021 00:45:15 - INFO - __main__ - Step 47398: {'lr': 0.00019900618199268513, 'samples': 1516736, 'steps': 2962, 'loss/train': 0.9448419213294983} -09/21/2021 00:45:15 - INFO - __main__ - Step 47399: {'lr': 0.00019900618199268513, 'samples': 1516768, 'steps': 2962, 'loss/train': 1.6995673179626465} -09/21/2021 00:45:16 - INFO - __main__ - Step 47400: {'lr': 0.00019900618199268513, 'samples': 1516800, 'steps': 2962, 'loss/train': 2.950409412384033} -09/21/2021 00:45:17 - INFO - __main__ - Step 47401: {'lr': 0.00019900618199268513, 'samples': 1516832, 'steps': 2962, 'loss/train': 1.6222807168960571} -09/21/2021 00:45:18 - INFO - __main__ - Step 47402: {'lr': 0.00019900618199268513, 'samples': 1516864, 'steps': 2962, 'loss/train': 1.9378405809402466} -09/21/2021 00:45:18 - INFO - __main__ - Step 47403: {'lr': 0.00019900618199268513, 'samples': 1516896, 'steps': 2962, 'loss/train': 0.9639261960983276} -09/21/2021 00:45:19 - INFO - __main__ - Step 47404: {'lr': 0.00019900618199268513, 'samples': 1516928, 'steps': 2962, 'loss/train': 1.962049126625061} -09/21/2021 00:45:20 - INFO - __main__ - Step 47405: {'lr': 0.00019900618199268513, 'samples': 1516960, 'steps': 2962, 'loss/train': 1.8429648876190186} -09/21/2021 00:45:21 - INFO - __main__ - Step 47406: {'lr': 0.00019900618199268513, 'samples': 1516992, 'steps': 2962, 'loss/train': 1.516194462776184} -09/21/2021 00:45:21 - INFO - __main__ - Step 47407: {'lr': 0.00019900618199268513, 'samples': 1517024, 'steps': 2962, 'loss/train': 2.20550537109375} -09/21/2021 00:45:22 - INFO - __main__ - Step 47408: {'lr': 0.00019900618199268513, 'samples': 1517056, 'steps': 2962, 'loss/train': 1.6752947568893433} -09/21/2021 00:45:23 - INFO - __main__ - Step 47409: {'lr': 0.00019900528471295553, 'samples': 1517088, 'steps': 2963, 'loss/train': 1.765307903289795} -09/21/2021 00:45:24 - INFO - __main__ - Step 47410: {'lr': 0.00019900528471295553, 'samples': 1517120, 'steps': 2963, 'loss/train': 2.062788724899292} -09/21/2021 00:45:24 - INFO - __main__ - Step 47411: {'lr': 0.00019900528471295553, 'samples': 1517152, 'steps': 2963, 'loss/train': 1.407131552696228} -09/21/2021 00:45:25 - INFO - __main__ - Step 47412: {'lr': 0.00019900528471295553, 'samples': 1517184, 'steps': 2963, 'loss/train': 2.4310309886932373} -09/21/2021 00:45:26 - INFO - __main__ - Step 47413: {'lr': 0.00019900528471295553, 'samples': 1517216, 'steps': 2963, 'loss/train': 2.3116466999053955} -09/21/2021 00:45:27 - INFO - __main__ - Step 47414: {'lr': 0.00019900528471295553, 'samples': 1517248, 'steps': 2963, 'loss/train': 2.140029191970825} -09/21/2021 00:45:27 - INFO - __main__ - Step 47415: {'lr': 0.00019900528471295553, 'samples': 1517280, 'steps': 2963, 'loss/train': 1.7553296089172363} -09/21/2021 00:45:28 - INFO - __main__ - Step 47416: {'lr': 0.00019900528471295553, 'samples': 1517312, 'steps': 2963, 'loss/train': 1.9892628192901611} -09/21/2021 00:45:29 - INFO - __main__ - Step 47417: {'lr': 0.00019900528471295553, 'samples': 1517344, 'steps': 2963, 'loss/train': 1.6191282272338867} -09/21/2021 00:45:30 - INFO - __main__ - Step 47418: {'lr': 0.00019900528471295553, 'samples': 1517376, 'steps': 2963, 'loss/train': 2.7448415756225586} -09/21/2021 00:45:30 - INFO - __main__ - Step 47419: {'lr': 0.00019900528471295553, 'samples': 1517408, 'steps': 2963, 'loss/train': 1.5181219577789307} -09/21/2021 00:45:31 - INFO - __main__ - Step 47420: {'lr': 0.00019900528471295553, 'samples': 1517440, 'steps': 2963, 'loss/train': 3.1678144931793213} -09/21/2021 00:45:32 - INFO - __main__ - Step 47421: {'lr': 0.00019900528471295553, 'samples': 1517472, 'steps': 2963, 'loss/train': 3.6421892642974854} -09/21/2021 00:45:33 - INFO - __main__ - Step 47422: {'lr': 0.00019900528471295553, 'samples': 1517504, 'steps': 2963, 'loss/train': 1.8569484949111938} -09/21/2021 00:45:33 - INFO - __main__ - Step 47423: {'lr': 0.00019900528471295553, 'samples': 1517536, 'steps': 2963, 'loss/train': 1.9573888778686523} -09/21/2021 00:45:34 - INFO - __main__ - Step 47424: {'lr': 0.00019900528471295553, 'samples': 1517568, 'steps': 2963, 'loss/train': 1.9414888620376587} -09/21/2021 00:45:35 - INFO - __main__ - Step 47425: {'lr': 0.0001990043870303738, 'samples': 1517600, 'steps': 2964, 'loss/train': 2.7841861248016357} -09/21/2021 00:45:36 - INFO - __main__ - Step 47426: {'lr': 0.0001990043870303738, 'samples': 1517632, 'steps': 2964, 'loss/train': 1.3455885648727417} -09/21/2021 00:45:37 - INFO - __main__ - Step 47427: {'lr': 0.0001990043870303738, 'samples': 1517664, 'steps': 2964, 'loss/train': 1.8547582626342773} -09/21/2021 00:45:38 - INFO - __main__ - Step 47428: {'lr': 0.0001990043870303738, 'samples': 1517696, 'steps': 2964, 'loss/train': 3.6002721786499023} -09/21/2021 00:45:39 - INFO - __main__ - Step 47429: {'lr': 0.0001990043870303738, 'samples': 1517728, 'steps': 2964, 'loss/train': 1.9999346733093262} -09/21/2021 00:45:39 - INFO - __main__ - Step 47430: {'lr': 0.0001990043870303738, 'samples': 1517760, 'steps': 2964, 'loss/train': 2.4482924938201904} -09/21/2021 00:45:40 - INFO - __main__ - Step 47431: {'lr': 0.0001990043870303738, 'samples': 1517792, 'steps': 2964, 'loss/train': 1.9216821193695068} -09/21/2021 00:45:41 - INFO - __main__ - Step 47432: {'lr': 0.0001990043870303738, 'samples': 1517824, 'steps': 2964, 'loss/train': 2.1202738285064697} -09/21/2021 00:45:42 - INFO - __main__ - Step 47433: {'lr': 0.0001990043870303738, 'samples': 1517856, 'steps': 2964, 'loss/train': 2.295447587966919} -09/21/2021 00:45:42 - INFO - __main__ - Step 47434: {'lr': 0.0001990043870303738, 'samples': 1517888, 'steps': 2964, 'loss/train': 1.9644138813018799} -09/21/2021 00:45:43 - INFO - __main__ - Step 47435: {'lr': 0.0001990043870303738, 'samples': 1517920, 'steps': 2964, 'loss/train': 1.1603789329528809} -09/21/2021 00:45:44 - INFO - __main__ - Step 47436: {'lr': 0.0001990043870303738, 'samples': 1517952, 'steps': 2964, 'loss/train': 2.710317850112915} -09/21/2021 00:45:45 - INFO - __main__ - Step 47437: {'lr': 0.0001990043870303738, 'samples': 1517984, 'steps': 2964, 'loss/train': 2.3996615409851074} -09/21/2021 00:45:45 - INFO - __main__ - Step 47438: {'lr': 0.0001990043870303738, 'samples': 1518016, 'steps': 2964, 'loss/train': 2.480041265487671} -09/21/2021 00:45:46 - INFO - __main__ - Step 47439: {'lr': 0.0001990043870303738, 'samples': 1518048, 'steps': 2964, 'loss/train': 1.5280487537384033} -09/21/2021 00:45:47 - INFO - __main__ - Step 47440: {'lr': 0.0001990043870303738, 'samples': 1518080, 'steps': 2964, 'loss/train': 1.314839482307434} -09/21/2021 00:45:48 - INFO - __main__ - Step 47441: {'lr': 0.0001990034889449436, 'samples': 1518112, 'steps': 2965, 'loss/train': 2.5090510845184326} -09/21/2021 00:45:49 - INFO - __main__ - Step 47442: {'lr': 0.0001990034889449436, 'samples': 1518144, 'steps': 2965, 'loss/train': 1.0852137804031372} -09/21/2021 00:45:49 - INFO - __main__ - Step 47443: {'lr': 0.0001990034889449436, 'samples': 1518176, 'steps': 2965, 'loss/train': 1.8397912979125977} -09/21/2021 00:45:50 - INFO - __main__ - Step 47444: {'lr': 0.0001990034889449436, 'samples': 1518208, 'steps': 2965, 'loss/train': 2.6104609966278076} -09/21/2021 00:45:51 - INFO - __main__ - Step 47445: {'lr': 0.0001990034889449436, 'samples': 1518240, 'steps': 2965, 'loss/train': 1.6911182403564453} -09/21/2021 00:45:52 - INFO - __main__ - Step 47446: {'lr': 0.0001990034889449436, 'samples': 1518272, 'steps': 2965, 'loss/train': 2.8276185989379883} -09/21/2021 00:45:52 - INFO - __main__ - Step 47447: {'lr': 0.0001990034889449436, 'samples': 1518304, 'steps': 2965, 'loss/train': 1.639336109161377} -09/21/2021 00:45:53 - INFO - __main__ - Step 47448: {'lr': 0.0001990034889449436, 'samples': 1518336, 'steps': 2965, 'loss/train': 2.605053186416626} -09/21/2021 00:45:54 - INFO - __main__ - Step 47449: {'lr': 0.0001990034889449436, 'samples': 1518368, 'steps': 2965, 'loss/train': 1.3552316427230835} -09/21/2021 00:45:55 - INFO - __main__ - Step 47450: {'lr': 0.0001990034889449436, 'samples': 1518400, 'steps': 2965, 'loss/train': 2.3757851123809814} -09/21/2021 00:45:55 - INFO - __main__ - Step 47451: {'lr': 0.0001990034889449436, 'samples': 1518432, 'steps': 2965, 'loss/train': 2.1293795108795166} -09/21/2021 00:45:56 - INFO - __main__ - Step 47452: {'lr': 0.0001990034889449436, 'samples': 1518464, 'steps': 2965, 'loss/train': 1.1950143575668335} -09/21/2021 00:45:57 - INFO - __main__ - Step 47453: {'lr': 0.0001990034889449436, 'samples': 1518496, 'steps': 2965, 'loss/train': 1.981127142906189} -09/21/2021 00:45:58 - INFO - __main__ - Step 47454: {'lr': 0.0001990034889449436, 'samples': 1518528, 'steps': 2965, 'loss/train': 0.9941156506538391} -09/21/2021 00:45:58 - INFO - __main__ - Step 47455: {'lr': 0.0001990034889449436, 'samples': 1518560, 'steps': 2965, 'loss/train': 2.41789174079895} -09/21/2021 00:45:59 - INFO - __main__ - Step 47456: {'lr': 0.0001990034889449436, 'samples': 1518592, 'steps': 2965, 'loss/train': 3.009579658508301} -09/21/2021 00:46:00 - INFO - __main__ - Step 47457: {'lr': 0.00019900259045666857, 'samples': 1518624, 'steps': 2966, 'loss/train': 1.647295355796814} -09/21/2021 00:46:01 - INFO - __main__ - Step 47458: {'lr': 0.00019900259045666857, 'samples': 1518656, 'steps': 2966, 'loss/train': 0.4776059091091156} -09/21/2021 00:46:02 - INFO - __main__ - Step 47459: {'lr': 0.00019900259045666857, 'samples': 1518688, 'steps': 2966, 'loss/train': 2.0136892795562744} -09/21/2021 00:46:03 - INFO - __main__ - Step 47460: {'lr': 0.00019900259045666857, 'samples': 1518720, 'steps': 2966, 'loss/train': 2.079298973083496} -09/21/2021 00:46:04 - INFO - __main__ - Step 47461: {'lr': 0.00019900259045666857, 'samples': 1518752, 'steps': 2966, 'loss/train': 2.5122804641723633} -09/21/2021 00:46:04 - INFO - __main__ - Step 47462: {'lr': 0.00019900259045666857, 'samples': 1518784, 'steps': 2966, 'loss/train': 2.1572136878967285} -09/21/2021 00:46:05 - INFO - __main__ - Step 47463: {'lr': 0.00019900259045666857, 'samples': 1518816, 'steps': 2966, 'loss/train': 2.2732388973236084} -09/21/2021 00:46:06 - INFO - __main__ - Step 47464: {'lr': 0.00019900259045666857, 'samples': 1518848, 'steps': 2966, 'loss/train': 2.260392665863037} -09/21/2021 00:46:07 - INFO - __main__ - Step 47465: {'lr': 0.00019900259045666857, 'samples': 1518880, 'steps': 2966, 'loss/train': 1.7388700246810913} -09/21/2021 00:46:07 - INFO - __main__ - Step 47466: {'lr': 0.00019900259045666857, 'samples': 1518912, 'steps': 2966, 'loss/train': 2.9294207096099854} -09/21/2021 00:46:08 - INFO - __main__ - Step 47467: {'lr': 0.00019900259045666857, 'samples': 1518944, 'steps': 2966, 'loss/train': 1.3016051054000854} -09/21/2021 00:46:09 - INFO - __main__ - Step 47468: {'lr': 0.00019900259045666857, 'samples': 1518976, 'steps': 2966, 'loss/train': 2.4788424968719482} -09/21/2021 00:46:10 - INFO - __main__ - Step 47469: {'lr': 0.00019900259045666857, 'samples': 1519008, 'steps': 2966, 'loss/train': 2.069591999053955} -09/21/2021 00:46:10 - INFO - __main__ - Step 47470: {'lr': 0.00019900259045666857, 'samples': 1519040, 'steps': 2966, 'loss/train': 1.4989993572235107} -09/21/2021 00:46:11 - INFO - __main__ - Step 47471: {'lr': 0.00019900259045666857, 'samples': 1519072, 'steps': 2966, 'loss/train': 1.8840758800506592} -09/21/2021 00:46:12 - INFO - __main__ - Step 47472: {'lr': 0.00019900259045666857, 'samples': 1519104, 'steps': 2966, 'loss/train': 2.527099370956421} -09/21/2021 00:46:13 - INFO - __main__ - Step 47473: {'lr': 0.0001990016915655524, 'samples': 1519136, 'steps': 2967, 'loss/train': 2.492769718170166} -09/21/2021 00:46:14 - INFO - __main__ - Step 47474: {'lr': 0.0001990016915655524, 'samples': 1519168, 'steps': 2967, 'loss/train': 1.168404221534729} -09/21/2021 00:46:14 - INFO - __main__ - Step 47475: {'lr': 0.0001990016915655524, 'samples': 1519200, 'steps': 2967, 'loss/train': 1.937880516052246} -09/21/2021 00:46:15 - INFO - __main__ - Step 47476: {'lr': 0.0001990016915655524, 'samples': 1519232, 'steps': 2967, 'loss/train': 1.8562294244766235} -09/21/2021 00:46:16 - INFO - __main__ - Step 47477: {'lr': 0.0001990016915655524, 'samples': 1519264, 'steps': 2967, 'loss/train': 0.6448002457618713} -09/21/2021 00:46:17 - INFO - __main__ - Step 47478: {'lr': 0.0001990016915655524, 'samples': 1519296, 'steps': 2967, 'loss/train': 2.433587074279785} -09/21/2021 00:46:17 - INFO - __main__ - Step 47479: {'lr': 0.0001990016915655524, 'samples': 1519328, 'steps': 2967, 'loss/train': 3.1107370853424072} -09/21/2021 00:46:18 - INFO - __main__ - Step 47480: {'lr': 0.0001990016915655524, 'samples': 1519360, 'steps': 2967, 'loss/train': 3.1720807552337646} -09/21/2021 00:46:19 - INFO - __main__ - Step 47481: {'lr': 0.0001990016915655524, 'samples': 1519392, 'steps': 2967, 'loss/train': 3.046483039855957} -09/21/2021 00:46:20 - INFO - __main__ - Step 47482: {'lr': 0.0001990016915655524, 'samples': 1519424, 'steps': 2967, 'loss/train': 3.009309768676758} -09/21/2021 00:46:20 - INFO - __main__ - Step 47483: {'lr': 0.0001990016915655524, 'samples': 1519456, 'steps': 2967, 'loss/train': 3.059307098388672} -09/21/2021 00:46:21 - INFO - __main__ - Step 47484: {'lr': 0.0001990016915655524, 'samples': 1519488, 'steps': 2967, 'loss/train': 2.964587688446045} -09/21/2021 00:46:22 - INFO - __main__ - Step 47485: {'lr': 0.0001990016915655524, 'samples': 1519520, 'steps': 2967, 'loss/train': 3.0316410064697266} -09/21/2021 00:46:23 - INFO - __main__ - Step 47486: {'lr': 0.0001990016915655524, 'samples': 1519552, 'steps': 2967, 'loss/train': 2.9928183555603027} -09/21/2021 00:46:23 - INFO - __main__ - Step 47487: {'lr': 0.0001990016915655524, 'samples': 1519584, 'steps': 2967, 'loss/train': 1.50137197971344} -09/21/2021 00:46:24 - INFO - __main__ - Step 47488: {'lr': 0.0001990016915655524, 'samples': 1519616, 'steps': 2967, 'loss/train': 1.769900918006897} -09/21/2021 00:46:25 - INFO - __main__ - Step 47489: {'lr': 0.00019900079227159876, 'samples': 1519648, 'steps': 2968, 'loss/train': 2.033804416656494} -09/21/2021 00:46:26 - INFO - __main__ - Step 47490: {'lr': 0.00019900079227159876, 'samples': 1519680, 'steps': 2968, 'loss/train': 2.1585488319396973} -09/21/2021 00:46:27 - INFO - __main__ - Step 47491: {'lr': 0.00019900079227159876, 'samples': 1519712, 'steps': 2968, 'loss/train': 1.784374475479126} -09/21/2021 00:46:27 - INFO - __main__ - Step 47492: {'lr': 0.00019900079227159876, 'samples': 1519744, 'steps': 2968, 'loss/train': 1.3571683168411255} -09/21/2021 00:46:28 - INFO - __main__ - Step 47493: {'lr': 0.00019900079227159876, 'samples': 1519776, 'steps': 2968, 'loss/train': 1.8919519186019897} -09/21/2021 00:46:29 - INFO - __main__ - Step 47494: {'lr': 0.00019900079227159876, 'samples': 1519808, 'steps': 2968, 'loss/train': 1.8212270736694336} -09/21/2021 00:46:31 - INFO - __main__ - Step 47495: {'lr': 0.00019900079227159876, 'samples': 1519840, 'steps': 2968, 'loss/train': 2.047123908996582} -09/21/2021 00:46:32 - INFO - __main__ - Step 47496: {'lr': 0.00019900079227159876, 'samples': 1519872, 'steps': 2968, 'loss/train': 2.9465584754943848} -09/21/2021 00:46:33 - INFO - __main__ - Step 47497: {'lr': 0.00019900079227159876, 'samples': 1519904, 'steps': 2968, 'loss/train': 2.0455362796783447} -09/21/2021 00:46:34 - INFO - __main__ - Step 47498: {'lr': 0.00019900079227159876, 'samples': 1519936, 'steps': 2968, 'loss/train': 2.0942955017089844} -09/21/2021 00:46:34 - INFO - __main__ - Step 47499: {'lr': 0.00019900079227159876, 'samples': 1519968, 'steps': 2968, 'loss/train': 1.4678748846054077} -09/21/2021 00:46:35 - INFO - __main__ - Step 47500: {'lr': 0.00019900079227159876, 'samples': 1520000, 'steps': 2968, 'loss/train': 2.0285837650299072} -09/21/2021 00:46:36 - INFO - __main__ - Step 47501: {'lr': 0.00019900079227159876, 'samples': 1520032, 'steps': 2968, 'loss/train': 1.1454973220825195} -09/21/2021 00:46:37 - INFO - __main__ - Step 47502: {'lr': 0.00019900079227159876, 'samples': 1520064, 'steps': 2968, 'loss/train': 2.148775339126587} -09/21/2021 00:46:37 - INFO - __main__ - Step 47503: {'lr': 0.00019900079227159876, 'samples': 1520096, 'steps': 2968, 'loss/train': 2.7201952934265137} -09/21/2021 00:46:38 - INFO - __main__ - Step 47504: {'lr': 0.00019900079227159876, 'samples': 1520128, 'steps': 2968, 'loss/train': 1.9810914993286133} -09/21/2021 00:46:39 - INFO - __main__ - Step 47505: {'lr': 0.00019899989257481126, 'samples': 1520160, 'steps': 2969, 'loss/train': 1.495179533958435} -09/21/2021 00:46:40 - INFO - __main__ - Step 47506: {'lr': 0.00019899989257481126, 'samples': 1520192, 'steps': 2969, 'loss/train': 0.2554008960723877} -09/21/2021 00:46:40 - INFO - __main__ - Step 47507: {'lr': 0.00019899989257481126, 'samples': 1520224, 'steps': 2969, 'loss/train': 0.9516690373420715} -09/21/2021 00:46:41 - INFO - __main__ - Step 47508: {'lr': 0.00019899989257481126, 'samples': 1520256, 'steps': 2969, 'loss/train': 1.8562546968460083} -09/21/2021 00:46:42 - INFO - __main__ - Step 47509: {'lr': 0.00019899989257481126, 'samples': 1520288, 'steps': 2969, 'loss/train': 3.162456750869751} -09/21/2021 00:46:43 - INFO - __main__ - Step 47510: {'lr': 0.00019899989257481126, 'samples': 1520320, 'steps': 2969, 'loss/train': 3.0962977409362793} -09/21/2021 00:46:43 - INFO - __main__ - Step 47511: {'lr': 0.00019899989257481126, 'samples': 1520352, 'steps': 2969, 'loss/train': 3.1217398643493652} -09/21/2021 00:46:44 - INFO - __main__ - Step 47512: {'lr': 0.00019899989257481126, 'samples': 1520384, 'steps': 2969, 'loss/train': 2.2000625133514404} -09/21/2021 00:46:45 - INFO - __main__ - Step 47513: {'lr': 0.00019899989257481126, 'samples': 1520416, 'steps': 2969, 'loss/train': 2.4900760650634766} -09/21/2021 00:46:46 - INFO - __main__ - Step 47514: {'lr': 0.00019899989257481126, 'samples': 1520448, 'steps': 2969, 'loss/train': 1.8674510717391968} -09/21/2021 00:46:46 - INFO - __main__ - Step 47515: {'lr': 0.00019899989257481126, 'samples': 1520480, 'steps': 2969, 'loss/train': 1.704099416732788} -09/21/2021 00:46:47 - INFO - __main__ - Step 47516: {'lr': 0.00019899989257481126, 'samples': 1520512, 'steps': 2969, 'loss/train': 1.616206169128418} -09/21/2021 00:46:48 - INFO - __main__ - Step 47517: {'lr': 0.00019899989257481126, 'samples': 1520544, 'steps': 2969, 'loss/train': 2.1401150226593018} -09/21/2021 00:46:49 - INFO - __main__ - Step 47518: {'lr': 0.00019899989257481126, 'samples': 1520576, 'steps': 2969, 'loss/train': 0.5586042404174805} -09/21/2021 00:46:49 - INFO - __main__ - Step 47519: {'lr': 0.00019899989257481126, 'samples': 1520608, 'steps': 2969, 'loss/train': 0.7298814058303833} -09/21/2021 00:46:50 - INFO - __main__ - Step 47520: {'lr': 0.00019899989257481126, 'samples': 1520640, 'steps': 2969, 'loss/train': 0.2485809326171875} -09/21/2021 00:46:51 - INFO - __main__ - Step 47521: {'lr': 0.0001989989924751936, 'samples': 1520672, 'steps': 2970, 'loss/train': 0.3085592985153198} -09/21/2021 00:46:52 - INFO - __main__ - Step 47522: {'lr': 0.0001989989924751936, 'samples': 1520704, 'steps': 2970, 'loss/train': 0.39277857542037964} -09/21/2021 00:46:53 - INFO - __main__ - Step 47523: {'lr': 0.0001989989924751936, 'samples': 1520736, 'steps': 2970, 'loss/train': 0.31334617733955383} -09/21/2021 00:46:53 - INFO - __main__ - Step 47524: {'lr': 0.0001989989924751936, 'samples': 1520768, 'steps': 2970, 'loss/train': 0.35054051876068115} -09/21/2021 00:46:54 - INFO - __main__ - Step 47525: {'lr': 0.0001989989924751936, 'samples': 1520800, 'steps': 2970, 'loss/train': 1.9456181526184082} -09/21/2021 00:46:55 - INFO - __main__ - Step 47526: {'lr': 0.0001989989924751936, 'samples': 1520832, 'steps': 2970, 'loss/train': 3.2549407482147217} -09/21/2021 00:46:56 - INFO - __main__ - Step 47527: {'lr': 0.0001989989924751936, 'samples': 1520864, 'steps': 2970, 'loss/train': 0.3140055537223816} -09/21/2021 00:46:56 - INFO - __main__ - Step 47528: {'lr': 0.0001989989924751936, 'samples': 1520896, 'steps': 2970, 'loss/train': 0.26874879002571106} -09/21/2021 00:46:57 - INFO - __main__ - Step 47529: {'lr': 0.0001989989924751936, 'samples': 1520928, 'steps': 2970, 'loss/train': 0.25679612159729004} -09/21/2021 00:46:58 - INFO - __main__ - Step 47530: {'lr': 0.0001989989924751936, 'samples': 1520960, 'steps': 2970, 'loss/train': 0.2735253870487213} -09/21/2021 00:46:59 - INFO - __main__ - Step 47531: {'lr': 0.0001989989924751936, 'samples': 1520992, 'steps': 2970, 'loss/train': 0.30772867798805237} -09/21/2021 00:46:59 - INFO - __main__ - Step 47532: {'lr': 0.0001989989924751936, 'samples': 1521024, 'steps': 2970, 'loss/train': 0.31603336334228516} -09/21/2021 00:47:00 - INFO - __main__ - Step 47533: {'lr': 0.0001989989924751936, 'samples': 1521056, 'steps': 2970, 'loss/train': 0.2913142144680023} -09/21/2021 00:47:01 - INFO - __main__ - Step 47534: {'lr': 0.0001989989924751936, 'samples': 1521088, 'steps': 2970, 'loss/train': 0.3913862109184265} -09/21/2021 00:47:02 - INFO - __main__ - Step 47535: {'lr': 0.0001989989924751936, 'samples': 1521120, 'steps': 2970, 'loss/train': 0.20686876773834229} -09/21/2021 00:47:02 - INFO - __main__ - Step 47536: {'lr': 0.0001989989924751936, 'samples': 1521152, 'steps': 2970, 'loss/train': 0.23918534815311432} -09/21/2021 00:47:03 - INFO - __main__ - Step 47537: {'lr': 0.00019899809197274938, 'samples': 1521184, 'steps': 2971, 'loss/train': 0.30136144161224365} -09/21/2021 00:47:04 - INFO - __main__ - Step 47538: {'lr': 0.00019899809197274938, 'samples': 1521216, 'steps': 2971, 'loss/train': 0.2780826687812805} -09/21/2021 00:47:05 - INFO - __main__ - Step 47539: {'lr': 0.00019899809197274938, 'samples': 1521248, 'steps': 2971, 'loss/train': 0.32186535000801086} -09/21/2021 00:47:06 - INFO - __main__ - Step 47540: {'lr': 0.00019899809197274938, 'samples': 1521280, 'steps': 2971, 'loss/train': 1.939125895500183} -09/21/2021 00:47:07 - INFO - __main__ - Step 47541: {'lr': 0.00019899809197274938, 'samples': 1521312, 'steps': 2971, 'loss/train': 2.1931204795837402} -09/21/2021 00:47:07 - INFO - __main__ - Step 47542: {'lr': 0.00019899809197274938, 'samples': 1521344, 'steps': 2971, 'loss/train': 2.5628256797790527} -09/21/2021 00:47:08 - INFO - __main__ - Step 47543: {'lr': 0.00019899809197274938, 'samples': 1521376, 'steps': 2971, 'loss/train': 2.168332815170288} -09/21/2021 00:47:09 - INFO - __main__ - Step 47544: {'lr': 0.00019899809197274938, 'samples': 1521408, 'steps': 2971, 'loss/train': 2.489786148071289} -09/21/2021 00:47:10 - INFO - __main__ - Step 47545: {'lr': 0.00019899809197274938, 'samples': 1521440, 'steps': 2971, 'loss/train': 0.6306990385055542} -09/21/2021 00:47:10 - INFO - __main__ - Step 47546: {'lr': 0.00019899809197274938, 'samples': 1521472, 'steps': 2971, 'loss/train': 1.5130021572113037} -09/21/2021 00:47:11 - INFO - __main__ - Step 47547: {'lr': 0.00019899809197274938, 'samples': 1521504, 'steps': 2971, 'loss/train': 2.609220266342163} -09/21/2021 00:47:12 - INFO - __main__ - Step 47548: {'lr': 0.00019899809197274938, 'samples': 1521536, 'steps': 2971, 'loss/train': 1.9249963760375977} -09/21/2021 00:47:13 - INFO - __main__ - Step 47549: {'lr': 0.00019899809197274938, 'samples': 1521568, 'steps': 2971, 'loss/train': 1.952984094619751} -09/21/2021 00:47:13 - INFO - __main__ - Step 47550: {'lr': 0.00019899809197274938, 'samples': 1521600, 'steps': 2971, 'loss/train': 2.288367509841919} -09/21/2021 00:47:14 - INFO - __main__ - Step 47551: {'lr': 0.00019899809197274938, 'samples': 1521632, 'steps': 2971, 'loss/train': 1.3525006771087646} -09/21/2021 00:47:15 - INFO - __main__ - Step 47552: {'lr': 0.00019899809197274938, 'samples': 1521664, 'steps': 2971, 'loss/train': 1.760063886642456} -09/21/2021 00:47:16 - INFO - __main__ - Step 47553: {'lr': 0.00019899719106748233, 'samples': 1521696, 'steps': 2972, 'loss/train': 1.6694538593292236} -09/21/2021 00:47:17 - INFO - __main__ - Step 47554: {'lr': 0.00019899719106748233, 'samples': 1521728, 'steps': 2972, 'loss/train': 1.0370806455612183} -09/21/2021 00:47:17 - INFO - __main__ - Step 47555: {'lr': 0.00019899719106748233, 'samples': 1521760, 'steps': 2972, 'loss/train': 1.8342688083648682} -09/21/2021 00:47:18 - INFO - __main__ - Step 47556: {'lr': 0.00019899719106748233, 'samples': 1521792, 'steps': 2972, 'loss/train': 0.4400070011615753} -09/21/2021 00:47:19 - INFO - __main__ - Step 47557: {'lr': 0.00019899719106748233, 'samples': 1521824, 'steps': 2972, 'loss/train': 2.9299633502960205} -09/21/2021 00:47:20 - INFO - __main__ - Step 47558: {'lr': 0.00019899719106748233, 'samples': 1521856, 'steps': 2972, 'loss/train': 4.1828107833862305} -09/21/2021 00:47:20 - INFO - __main__ - Step 47559: {'lr': 0.00019899719106748233, 'samples': 1521888, 'steps': 2972, 'loss/train': 1.4536101818084717} -09/21/2021 00:47:21 - INFO - __main__ - Step 47560: {'lr': 0.00019899719106748233, 'samples': 1521920, 'steps': 2972, 'loss/train': 1.5210875272750854} -09/21/2021 00:47:22 - INFO - __main__ - Step 47561: {'lr': 0.00019899719106748233, 'samples': 1521952, 'steps': 2972, 'loss/train': 1.9451695680618286} -09/21/2021 00:47:23 - INFO - __main__ - Step 47562: {'lr': 0.00019899719106748233, 'samples': 1521984, 'steps': 2972, 'loss/train': 1.9319732189178467} -09/21/2021 00:47:23 - INFO - __main__ - Step 47563: {'lr': 0.00019899719106748233, 'samples': 1522016, 'steps': 2972, 'loss/train': 0.7156324982643127} -09/21/2021 00:47:24 - INFO - __main__ - Step 47564: {'lr': 0.00019899719106748233, 'samples': 1522048, 'steps': 2972, 'loss/train': 2.382133960723877} -09/21/2021 00:47:25 - INFO - __main__ - Step 47565: {'lr': 0.00019899719106748233, 'samples': 1522080, 'steps': 2972, 'loss/train': 1.7742024660110474} -09/21/2021 00:47:26 - INFO - __main__ - Step 47566: {'lr': 0.00019899719106748233, 'samples': 1522112, 'steps': 2972, 'loss/train': 2.0042901039123535} -09/21/2021 00:47:26 - INFO - __main__ - Step 47567: {'lr': 0.00019899719106748233, 'samples': 1522144, 'steps': 2972, 'loss/train': 3.2319514751434326} -09/21/2021 00:47:27 - INFO - __main__ - Step 47568: {'lr': 0.00019899719106748233, 'samples': 1522176, 'steps': 2972, 'loss/train': 1.7219791412353516} -09/21/2021 00:47:28 - INFO - __main__ - Step 47569: {'lr': 0.00019899628975939611, 'samples': 1522208, 'steps': 2973, 'loss/train': 1.4108668565750122} -09/21/2021 00:47:29 - INFO - __main__ - Step 47570: {'lr': 0.00019899628975939611, 'samples': 1522240, 'steps': 2973, 'loss/train': 1.8654309511184692} -09/21/2021 00:47:30 - INFO - __main__ - Step 47571: {'lr': 0.00019899628975939611, 'samples': 1522272, 'steps': 2973, 'loss/train': 2.7840991020202637} -09/21/2021 00:47:31 - INFO - __main__ - Step 47572: {'lr': 0.00019899628975939611, 'samples': 1522304, 'steps': 2973, 'loss/train': 1.0175780057907104} -09/21/2021 00:47:31 - INFO - __main__ - Step 47573: {'lr': 0.00019899628975939611, 'samples': 1522336, 'steps': 2973, 'loss/train': 1.8950233459472656} -09/21/2021 00:47:32 - INFO - __main__ - Step 47574: {'lr': 0.00019899628975939611, 'samples': 1522368, 'steps': 2973, 'loss/train': 2.011956214904785} -09/21/2021 00:47:33 - INFO - __main__ - Step 47575: {'lr': 0.00019899628975939611, 'samples': 1522400, 'steps': 2973, 'loss/train': 2.274712562561035} -09/21/2021 00:47:34 - INFO - __main__ - Step 47576: {'lr': 0.00019899628975939611, 'samples': 1522432, 'steps': 2973, 'loss/train': 1.5912569761276245} -09/21/2021 00:47:34 - INFO - __main__ - Step 47577: {'lr': 0.00019899628975939611, 'samples': 1522464, 'steps': 2973, 'loss/train': 1.9806737899780273} -09/21/2021 00:47:35 - INFO - __main__ - Step 47578: {'lr': 0.00019899628975939611, 'samples': 1522496, 'steps': 2973, 'loss/train': 2.3615949153900146} -09/21/2021 00:47:36 - INFO - __main__ - Step 47579: {'lr': 0.00019899628975939611, 'samples': 1522528, 'steps': 2973, 'loss/train': 2.087825059890747} -09/21/2021 00:47:37 - INFO - __main__ - Step 47580: {'lr': 0.00019899628975939611, 'samples': 1522560, 'steps': 2973, 'loss/train': 2.044822931289673} -09/21/2021 00:47:37 - INFO - __main__ - Step 47581: {'lr': 0.00019899628975939611, 'samples': 1522592, 'steps': 2973, 'loss/train': 1.5129468441009521} -09/21/2021 00:47:38 - INFO - __main__ - Step 47582: {'lr': 0.00019899628975939611, 'samples': 1522624, 'steps': 2973, 'loss/train': 1.7301324605941772} -09/21/2021 00:47:39 - INFO - __main__ - Step 47583: {'lr': 0.00019899628975939611, 'samples': 1522656, 'steps': 2973, 'loss/train': 2.4691052436828613} -09/21/2021 00:47:40 - INFO - __main__ - Step 47584: {'lr': 0.00019899628975939611, 'samples': 1522688, 'steps': 2973, 'loss/train': 3.4483633041381836} -09/21/2021 00:47:41 - INFO - __main__ - Step 47585: {'lr': 0.00019899538804849437, 'samples': 1522720, 'steps': 2974, 'loss/train': 1.8272145986557007} -09/21/2021 00:47:41 - INFO - __main__ - Step 47586: {'lr': 0.00019899538804849437, 'samples': 1522752, 'steps': 2974, 'loss/train': 1.5206595659255981} -09/21/2021 00:47:42 - INFO - __main__ - Step 47587: {'lr': 0.00019899538804849437, 'samples': 1522784, 'steps': 2974, 'loss/train': 2.4118340015411377} -09/21/2021 00:47:43 - INFO - __main__ - Step 47588: {'lr': 0.00019899538804849437, 'samples': 1522816, 'steps': 2974, 'loss/train': 1.9734845161437988} -09/21/2021 00:47:44 - INFO - __main__ - Step 47589: {'lr': 0.00019899538804849437, 'samples': 1522848, 'steps': 2974, 'loss/train': 1.783262848854065} -09/21/2021 00:47:44 - INFO - __main__ - Step 47590: {'lr': 0.00019899538804849437, 'samples': 1522880, 'steps': 2974, 'loss/train': 1.8438830375671387} -09/21/2021 00:47:45 - INFO - __main__ - Step 47591: {'lr': 0.00019899538804849437, 'samples': 1522912, 'steps': 2974, 'loss/train': 2.1024138927459717} -09/21/2021 00:47:46 - INFO - __main__ - Step 47592: {'lr': 0.00019899538804849437, 'samples': 1522944, 'steps': 2974, 'loss/train': 1.8426008224487305} -09/21/2021 00:47:47 - INFO - __main__ - Step 47593: {'lr': 0.00019899538804849437, 'samples': 1522976, 'steps': 2974, 'loss/train': 1.8488694429397583} -09/21/2021 00:47:47 - INFO - __main__ - Step 47594: {'lr': 0.00019899538804849437, 'samples': 1523008, 'steps': 2974, 'loss/train': 1.8929975032806396} -09/21/2021 00:47:48 - INFO - __main__ - Step 47595: {'lr': 0.00019899538804849437, 'samples': 1523040, 'steps': 2974, 'loss/train': 2.144890785217285} -09/21/2021 00:47:49 - INFO - __main__ - Step 47596: {'lr': 0.00019899538804849437, 'samples': 1523072, 'steps': 2974, 'loss/train': 1.1145349740982056} -09/21/2021 00:47:50 - INFO - __main__ - Step 47597: {'lr': 0.00019899538804849437, 'samples': 1523104, 'steps': 2974, 'loss/train': 2.4347424507141113} -09/21/2021 00:47:50 - INFO - __main__ - Step 47598: {'lr': 0.00019899538804849437, 'samples': 1523136, 'steps': 2974, 'loss/train': 1.4067217111587524} -09/21/2021 00:47:51 - INFO - __main__ - Step 47599: {'lr': 0.00019899538804849437, 'samples': 1523168, 'steps': 2974, 'loss/train': 2.6412582397460938} -09/21/2021 00:47:52 - INFO - __main__ - Step 47600: {'lr': 0.00019899538804849437, 'samples': 1523200, 'steps': 2974, 'loss/train': 2.918243408203125} -09/21/2021 00:47:53 - INFO - __main__ - Step 47601: {'lr': 0.00019899448593478075, 'samples': 1523232, 'steps': 2975, 'loss/train': 1.9417405128479004} -09/21/2021 00:47:54 - INFO - __main__ - Step 47602: {'lr': 0.00019899448593478075, 'samples': 1523264, 'steps': 2975, 'loss/train': 1.9963685274124146} -09/21/2021 00:47:55 - INFO - __main__ - Step 47603: {'lr': 0.00019899448593478075, 'samples': 1523296, 'steps': 2975, 'loss/train': 1.9578380584716797} -09/21/2021 00:47:56 - INFO - __main__ - Step 47604: {'lr': 0.00019899448593478075, 'samples': 1523328, 'steps': 2975, 'loss/train': 1.505102515220642} -09/21/2021 00:47:56 - INFO - __main__ - Step 47605: {'lr': 0.00019899448593478075, 'samples': 1523360, 'steps': 2975, 'loss/train': 2.3921196460723877} -09/21/2021 00:47:57 - INFO - __main__ - Step 47606: {'lr': 0.00019899448593478075, 'samples': 1523392, 'steps': 2975, 'loss/train': 2.176208972930908} -09/21/2021 00:47:58 - INFO - __main__ - Step 47607: {'lr': 0.00019899448593478075, 'samples': 1523424, 'steps': 2975, 'loss/train': 1.9762037992477417} -09/21/2021 00:47:59 - INFO - __main__ - Step 47608: {'lr': 0.00019899448593478075, 'samples': 1523456, 'steps': 2975, 'loss/train': 1.7003297805786133} -09/21/2021 00:47:59 - INFO - __main__ - Step 47609: {'lr': 0.00019899448593478075, 'samples': 1523488, 'steps': 2975, 'loss/train': 1.7053414583206177} -09/21/2021 00:48:00 - INFO - __main__ - Step 47610: {'lr': 0.00019899448593478075, 'samples': 1523520, 'steps': 2975, 'loss/train': 2.077996253967285} -09/21/2021 00:48:01 - INFO - __main__ - Step 47611: {'lr': 0.00019899448593478075, 'samples': 1523552, 'steps': 2975, 'loss/train': 2.0728886127471924} -09/21/2021 00:48:02 - INFO - __main__ - Step 47612: {'lr': 0.00019899448593478075, 'samples': 1523584, 'steps': 2975, 'loss/train': 2.5781164169311523} -09/21/2021 00:48:02 - INFO - __main__ - Step 47613: {'lr': 0.00019899448593478075, 'samples': 1523616, 'steps': 2975, 'loss/train': 1.2344653606414795} -09/21/2021 00:48:03 - INFO - __main__ - Step 47614: {'lr': 0.00019899448593478075, 'samples': 1523648, 'steps': 2975, 'loss/train': 2.0072460174560547} -09/21/2021 00:48:04 - INFO - __main__ - Step 47615: {'lr': 0.00019899448593478075, 'samples': 1523680, 'steps': 2975, 'loss/train': 1.5949501991271973} -09/21/2021 00:48:05 - INFO - __main__ - Step 47616: {'lr': 0.00019899448593478075, 'samples': 1523712, 'steps': 2975, 'loss/train': 1.3847014904022217} -09/21/2021 00:48:05 - INFO - __main__ - Step 47617: {'lr': 0.00019899358341825897, 'samples': 1523744, 'steps': 2976, 'loss/train': 0.17175602912902832} -09/21/2021 00:48:06 - INFO - __main__ - Step 47618: {'lr': 0.00019899358341825897, 'samples': 1523776, 'steps': 2976, 'loss/train': 2.0225865840911865} -09/21/2021 00:48:07 - INFO - __main__ - Step 47619: {'lr': 0.00019899358341825897, 'samples': 1523808, 'steps': 2976, 'loss/train': 2.936857223510742} -09/21/2021 00:48:08 - INFO - __main__ - Step 47620: {'lr': 0.00019899358341825897, 'samples': 1523840, 'steps': 2976, 'loss/train': 1.6415948867797852} -09/21/2021 00:48:08 - INFO - __main__ - Step 47621: {'lr': 0.00019899358341825897, 'samples': 1523872, 'steps': 2976, 'loss/train': 2.5968990325927734} -09/21/2021 00:48:09 - INFO - __main__ - Step 47622: {'lr': 0.00019899358341825897, 'samples': 1523904, 'steps': 2976, 'loss/train': 0.9863175749778748} -09/21/2021 00:48:10 - INFO - __main__ - Step 47623: {'lr': 0.00019899358341825897, 'samples': 1523936, 'steps': 2976, 'loss/train': 2.7846944332122803} -09/21/2021 00:48:11 - INFO - __main__ - Step 47624: {'lr': 0.00019899358341825897, 'samples': 1523968, 'steps': 2976, 'loss/train': 1.738077998161316} -09/21/2021 00:48:11 - INFO - __main__ - Step 47625: {'lr': 0.00019899358341825897, 'samples': 1524000, 'steps': 2976, 'loss/train': 1.5680458545684814} -09/21/2021 00:48:12 - INFO - __main__ - Step 47626: {'lr': 0.00019899358341825897, 'samples': 1524032, 'steps': 2976, 'loss/train': 1.491241216659546} -09/21/2021 00:48:13 - INFO - __main__ - Step 47627: {'lr': 0.00019899358341825897, 'samples': 1524064, 'steps': 2976, 'loss/train': 1.6786339282989502} -09/21/2021 00:48:14 - INFO - __main__ - Step 47628: {'lr': 0.00019899358341825897, 'samples': 1524096, 'steps': 2976, 'loss/train': 3.219653844833374} -09/21/2021 00:48:14 - INFO - __main__ - Step 47629: {'lr': 0.00019899358341825897, 'samples': 1524128, 'steps': 2976, 'loss/train': 2.026679039001465} -09/21/2021 00:48:16 - INFO - __main__ - Step 47630: {'lr': 0.00019899358341825897, 'samples': 1524160, 'steps': 2976, 'loss/train': 2.108185291290283} -09/21/2021 00:48:16 - INFO - __main__ - Step 47631: {'lr': 0.00019899358341825897, 'samples': 1524192, 'steps': 2976, 'loss/train': 2.3219497203826904} -09/21/2021 00:48:17 - INFO - __main__ - Step 47632: {'lr': 0.00019899358341825897, 'samples': 1524224, 'steps': 2976, 'loss/train': 2.862936496734619} -09/21/2021 00:48:18 - INFO - __main__ - Step 47633: {'lr': 0.0001989926804989327, 'samples': 1524256, 'steps': 2977, 'loss/train': 2.4236936569213867} -09/21/2021 00:48:19 - INFO - __main__ - Step 47634: {'lr': 0.0001989926804989327, 'samples': 1524288, 'steps': 2977, 'loss/train': 1.4195499420166016} -09/21/2021 00:48:20 - INFO - __main__ - Step 47635: {'lr': 0.0001989926804989327, 'samples': 1524320, 'steps': 2977, 'loss/train': 1.7831430435180664} -09/21/2021 00:48:20 - INFO - __main__ - Step 47636: {'lr': 0.0001989926804989327, 'samples': 1524352, 'steps': 2977, 'loss/train': 1.945225477218628} -09/21/2021 00:48:21 - INFO - __main__ - Step 47637: {'lr': 0.0001989926804989327, 'samples': 1524384, 'steps': 2977, 'loss/train': 1.7469488382339478} -09/21/2021 00:48:22 - INFO - __main__ - Step 47638: {'lr': 0.0001989926804989327, 'samples': 1524416, 'steps': 2977, 'loss/train': 0.27475595474243164} -09/21/2021 00:48:23 - INFO - __main__ - Step 47639: {'lr': 0.0001989926804989327, 'samples': 1524448, 'steps': 2977, 'loss/train': 2.294283628463745} -09/21/2021 00:48:23 - INFO - __main__ - Step 47640: {'lr': 0.0001989926804989327, 'samples': 1524480, 'steps': 2977, 'loss/train': 1.6059354543685913} -09/21/2021 00:48:24 - INFO - __main__ - Step 47641: {'lr': 0.0001989926804989327, 'samples': 1524512, 'steps': 2977, 'loss/train': 2.4723267555236816} -09/21/2021 00:48:25 - INFO - __main__ - Step 47642: {'lr': 0.0001989926804989327, 'samples': 1524544, 'steps': 2977, 'loss/train': 1.9977481365203857} -09/21/2021 00:48:26 - INFO - __main__ - Step 47643: {'lr': 0.0001989926804989327, 'samples': 1524576, 'steps': 2977, 'loss/train': 1.7048254013061523} -09/21/2021 00:48:26 - INFO - __main__ - Step 47644: {'lr': 0.0001989926804989327, 'samples': 1524608, 'steps': 2977, 'loss/train': 2.3177027702331543} -09/21/2021 00:48:27 - INFO - __main__ - Step 47645: {'lr': 0.0001989926804989327, 'samples': 1524640, 'steps': 2977, 'loss/train': 1.6364039182662964} -09/21/2021 00:48:28 - INFO - __main__ - Step 47646: {'lr': 0.0001989926804989327, 'samples': 1524672, 'steps': 2977, 'loss/train': 1.8390650749206543} -09/21/2021 00:48:29 - INFO - __main__ - Step 47647: {'lr': 0.0001989926804989327, 'samples': 1524704, 'steps': 2977, 'loss/train': 2.2539892196655273} -09/21/2021 00:48:29 - INFO - __main__ - Step 47648: {'lr': 0.0001989926804989327, 'samples': 1524736, 'steps': 2977, 'loss/train': 1.8463561534881592} -09/21/2021 00:48:30 - INFO - __main__ - Step 47649: {'lr': 0.00019899177717680556, 'samples': 1524768, 'steps': 2978, 'loss/train': 1.4628866910934448} -09/21/2021 00:48:31 - INFO - __main__ - Step 47650: {'lr': 0.00019899177717680556, 'samples': 1524800, 'steps': 2978, 'loss/train': 2.256222724914551} -09/21/2021 00:48:32 - INFO - __main__ - Step 47651: {'lr': 0.00019899177717680556, 'samples': 1524832, 'steps': 2978, 'loss/train': 1.638253927230835} -09/21/2021 00:48:32 - INFO - __main__ - Step 47652: {'lr': 0.00019899177717680556, 'samples': 1524864, 'steps': 2978, 'loss/train': 2.4528489112854004} -09/21/2021 00:48:33 - INFO - __main__ - Step 47653: {'lr': 0.00019899177717680556, 'samples': 1524896, 'steps': 2978, 'loss/train': 1.891048789024353} -09/21/2021 00:48:34 - INFO - __main__ - Step 47654: {'lr': 0.00019899177717680556, 'samples': 1524928, 'steps': 2978, 'loss/train': 2.369269371032715} -09/21/2021 00:48:35 - INFO - __main__ - Step 47655: {'lr': 0.00019899177717680556, 'samples': 1524960, 'steps': 2978, 'loss/train': 1.9293936491012573} -09/21/2021 00:48:35 - INFO - __main__ - Step 47656: {'lr': 0.00019899177717680556, 'samples': 1524992, 'steps': 2978, 'loss/train': 2.3064587116241455} -09/21/2021 00:48:36 - INFO - __main__ - Step 47657: {'lr': 0.00019899177717680556, 'samples': 1525024, 'steps': 2978, 'loss/train': 2.0655643939971924} -09/21/2021 00:48:37 - INFO - __main__ - Step 47658: {'lr': 0.00019899177717680556, 'samples': 1525056, 'steps': 2978, 'loss/train': 1.940982699394226} -09/21/2021 00:48:38 - INFO - __main__ - Step 47659: {'lr': 0.00019899177717680556, 'samples': 1525088, 'steps': 2978, 'loss/train': 2.750758647918701} -09/21/2021 00:48:38 - INFO - __main__ - Step 47660: {'lr': 0.00019899177717680556, 'samples': 1525120, 'steps': 2978, 'loss/train': 2.1413559913635254} -09/21/2021 00:48:40 - INFO - __main__ - Step 47661: {'lr': 0.00019899177717680556, 'samples': 1525152, 'steps': 2978, 'loss/train': 2.688939094543457} -09/21/2021 00:48:41 - INFO - __main__ - Step 47662: {'lr': 0.00019899177717680556, 'samples': 1525184, 'steps': 2978, 'loss/train': 1.580490231513977} -09/21/2021 00:48:41 - INFO - __main__ - Step 47663: {'lr': 0.00019899177717680556, 'samples': 1525216, 'steps': 2978, 'loss/train': 1.2816100120544434} -09/21/2021 00:48:42 - INFO - __main__ - Step 47664: {'lr': 0.00019899177717680556, 'samples': 1525248, 'steps': 2978, 'loss/train': 2.7202117443084717} -09/21/2021 00:48:43 - INFO - __main__ - Step 47665: {'lr': 0.0001989908734518813, 'samples': 1525280, 'steps': 2979, 'loss/train': 1.9405409097671509} -09/21/2021 00:48:44 - INFO - __main__ - Step 47666: {'lr': 0.0001989908734518813, 'samples': 1525312, 'steps': 2979, 'loss/train': 2.5350770950317383} -09/21/2021 00:48:44 - INFO - __main__ - Step 47667: {'lr': 0.0001989908734518813, 'samples': 1525344, 'steps': 2979, 'loss/train': 2.1414361000061035} -09/21/2021 00:48:45 - INFO - __main__ - Step 47668: {'lr': 0.0001989908734518813, 'samples': 1525376, 'steps': 2979, 'loss/train': 1.7978081703186035} -09/21/2021 00:48:46 - INFO - __main__ - Step 47669: {'lr': 0.0001989908734518813, 'samples': 1525408, 'steps': 2979, 'loss/train': 1.88201105594635} -09/21/2021 00:48:47 - INFO - __main__ - Step 47670: {'lr': 0.0001989908734518813, 'samples': 1525440, 'steps': 2979, 'loss/train': 2.1803619861602783} -09/21/2021 00:48:47 - INFO - __main__ - Step 47671: {'lr': 0.0001989908734518813, 'samples': 1525472, 'steps': 2979, 'loss/train': 0.1948980689048767} -09/21/2021 00:48:48 - INFO - __main__ - Step 47672: {'lr': 0.0001989908734518813, 'samples': 1525504, 'steps': 2979, 'loss/train': 1.2341750860214233} -09/21/2021 00:48:49 - INFO - __main__ - Step 47673: {'lr': 0.0001989908734518813, 'samples': 1525536, 'steps': 2979, 'loss/train': 2.4578495025634766} -09/21/2021 00:48:50 - INFO - __main__ - Step 47674: {'lr': 0.0001989908734518813, 'samples': 1525568, 'steps': 2979, 'loss/train': 1.4991710186004639} -09/21/2021 00:48:50 - INFO - __main__ - Step 47675: {'lr': 0.0001989908734518813, 'samples': 1525600, 'steps': 2979, 'loss/train': 2.368344783782959} -09/21/2021 00:48:51 - INFO - __main__ - Step 47676: {'lr': 0.0001989908734518813, 'samples': 1525632, 'steps': 2979, 'loss/train': 2.3018805980682373} -09/21/2021 00:48:52 - INFO - __main__ - Step 47677: {'lr': 0.0001989908734518813, 'samples': 1525664, 'steps': 2979, 'loss/train': 1.7085461616516113} -09/21/2021 00:48:53 - INFO - __main__ - Step 47678: {'lr': 0.0001989908734518813, 'samples': 1525696, 'steps': 2979, 'loss/train': 2.4789395332336426} -09/21/2021 00:48:53 - INFO - __main__ - Step 47679: {'lr': 0.0001989908734518813, 'samples': 1525728, 'steps': 2979, 'loss/train': 1.5041382312774658} -09/21/2021 00:48:54 - INFO - __main__ - Step 47680: {'lr': 0.0001989908734518813, 'samples': 1525760, 'steps': 2979, 'loss/train': 1.3856011629104614} -09/21/2021 00:48:55 - INFO - __main__ - Step 47681: {'lr': 0.00019898996932416353, 'samples': 1525792, 'steps': 2980, 'loss/train': 1.6246877908706665} -09/21/2021 00:48:56 - INFO - __main__ - Step 47682: {'lr': 0.00019898996932416353, 'samples': 1525824, 'steps': 2980, 'loss/train': 2.0673322677612305} -09/21/2021 00:48:57 - INFO - __main__ - Step 47683: {'lr': 0.00019898996932416353, 'samples': 1525856, 'steps': 2980, 'loss/train': 3.227644205093384} -09/21/2021 00:48:57 - INFO - __main__ - Step 47684: {'lr': 0.00019898996932416353, 'samples': 1525888, 'steps': 2980, 'loss/train': 2.172231912612915} -09/21/2021 00:48:58 - INFO - __main__ - Step 47685: {'lr': 0.00019898996932416353, 'samples': 1525920, 'steps': 2980, 'loss/train': 1.815452218055725} -09/21/2021 00:48:59 - INFO - __main__ - Step 47686: {'lr': 0.00019898996932416353, 'samples': 1525952, 'steps': 2980, 'loss/train': 1.7623745203018188} -09/21/2021 00:49:00 - INFO - __main__ - Step 47687: {'lr': 0.00019898996932416353, 'samples': 1525984, 'steps': 2980, 'loss/train': 1.8213871717453003} -09/21/2021 00:49:00 - INFO - __main__ - Step 47688: {'lr': 0.00019898996932416353, 'samples': 1526016, 'steps': 2980, 'loss/train': 1.0326138734817505} -09/21/2021 00:49:01 - INFO - __main__ - Step 47689: {'lr': 0.00019898996932416353, 'samples': 1526048, 'steps': 2980, 'loss/train': 1.4343644380569458} -09/21/2021 00:49:02 - INFO - __main__ - Step 47690: {'lr': 0.00019898996932416353, 'samples': 1526080, 'steps': 2980, 'loss/train': 1.5059345960617065} -09/21/2021 00:49:03 - INFO - __main__ - Step 47691: {'lr': 0.00019898996932416353, 'samples': 1526112, 'steps': 2980, 'loss/train': 2.0269436836242676} -09/21/2021 00:49:03 - INFO - __main__ - Step 47692: {'lr': 0.00019898996932416353, 'samples': 1526144, 'steps': 2980, 'loss/train': 2.4856784343719482} -09/21/2021 00:49:05 - INFO - __main__ - Step 47693: {'lr': 0.00019898996932416353, 'samples': 1526176, 'steps': 2980, 'loss/train': 1.394347071647644} -09/21/2021 00:49:06 - INFO - __main__ - Step 47694: {'lr': 0.00019898996932416353, 'samples': 1526208, 'steps': 2980, 'loss/train': 1.9991387128829956} -09/21/2021 00:49:06 - INFO - __main__ - Step 47695: {'lr': 0.00019898996932416353, 'samples': 1526240, 'steps': 2980, 'loss/train': 2.3125996589660645} -09/21/2021 00:49:07 - INFO - __main__ - Step 47696: {'lr': 0.00019898996932416353, 'samples': 1526272, 'steps': 2980, 'loss/train': 1.4879779815673828} -09/21/2021 00:49:08 - INFO - __main__ - Step 47697: {'lr': 0.00019898906479365596, 'samples': 1526304, 'steps': 2981, 'loss/train': 2.0053117275238037} -09/21/2021 00:49:09 - INFO - __main__ - Step 47698: {'lr': 0.00019898906479365596, 'samples': 1526336, 'steps': 2981, 'loss/train': 0.2561191916465759} -09/21/2021 00:49:09 - INFO - __main__ - Step 47699: {'lr': 0.00019898906479365596, 'samples': 1526368, 'steps': 2981, 'loss/train': 0.19145166873931885} -09/21/2021 00:49:10 - INFO - __main__ - Step 47700: {'lr': 0.00019898906479365596, 'samples': 1526400, 'steps': 2981, 'loss/train': 0.18234208226203918} -09/21/2021 00:49:11 - INFO - __main__ - Step 47701: {'lr': 0.00019898906479365596, 'samples': 1526432, 'steps': 2981, 'loss/train': 0.18670812249183655} -09/21/2021 00:49:12 - INFO - __main__ - Step 47702: {'lr': 0.00019898906479365596, 'samples': 1526464, 'steps': 2981, 'loss/train': 0.9369500279426575} -09/21/2021 00:49:12 - INFO - __main__ - Step 47703: {'lr': 0.00019898906479365596, 'samples': 1526496, 'steps': 2981, 'loss/train': 1.3140418529510498} -09/21/2021 00:49:13 - INFO - __main__ - Step 47704: {'lr': 0.00019898906479365596, 'samples': 1526528, 'steps': 2981, 'loss/train': 1.0435236692428589} -09/21/2021 00:49:14 - INFO - __main__ - Step 47705: {'lr': 0.00019898906479365596, 'samples': 1526560, 'steps': 2981, 'loss/train': 1.055740475654602} -09/21/2021 00:49:15 - INFO - __main__ - Step 47706: {'lr': 0.00019898906479365596, 'samples': 1526592, 'steps': 2981, 'loss/train': 1.4580637216567993} -09/21/2021 00:49:15 - INFO - __main__ - Step 47707: {'lr': 0.00019898906479365596, 'samples': 1526624, 'steps': 2981, 'loss/train': 1.4515572786331177} -09/21/2021 00:49:16 - INFO - __main__ - Step 47708: {'lr': 0.00019898906479365596, 'samples': 1526656, 'steps': 2981, 'loss/train': 2.1500134468078613} -09/21/2021 00:49:17 - INFO - __main__ - Step 47709: {'lr': 0.00019898906479365596, 'samples': 1526688, 'steps': 2981, 'loss/train': 1.2864989042282104} -09/21/2021 00:49:18 - INFO - __main__ - Step 47710: {'lr': 0.00019898906479365596, 'samples': 1526720, 'steps': 2981, 'loss/train': 2.359065532684326} -09/21/2021 00:49:18 - INFO - __main__ - Step 47711: {'lr': 0.00019898906479365596, 'samples': 1526752, 'steps': 2981, 'loss/train': 1.6201781034469604} -09/21/2021 00:49:19 - INFO - __main__ - Step 47712: {'lr': 0.00019898906479365596, 'samples': 1526784, 'steps': 2981, 'loss/train': 1.7129364013671875} -09/21/2021 00:49:20 - INFO - __main__ - Step 47713: {'lr': 0.00019898815986036227, 'samples': 1526816, 'steps': 2982, 'loss/train': 1.851499080657959} -09/21/2021 00:49:21 - INFO - __main__ - Step 47714: {'lr': 0.00019898815986036227, 'samples': 1526848, 'steps': 2982, 'loss/train': 2.575604200363159} -09/21/2021 00:49:22 - INFO - __main__ - Step 47715: {'lr': 0.00019898815986036227, 'samples': 1526880, 'steps': 2982, 'loss/train': 2.1703686714172363} -09/21/2021 00:49:22 - INFO - __main__ - Step 47716: {'lr': 0.00019898815986036227, 'samples': 1526912, 'steps': 2982, 'loss/train': 0.7880554795265198} -09/21/2021 00:49:23 - INFO - __main__ - Step 47717: {'lr': 0.00019898815986036227, 'samples': 1526944, 'steps': 2982, 'loss/train': 1.7184693813323975} -09/21/2021 00:49:24 - INFO - __main__ - Step 47718: {'lr': 0.00019898815986036227, 'samples': 1526976, 'steps': 2982, 'loss/train': 1.8925987482070923} -09/21/2021 00:49:25 - INFO - __main__ - Step 47719: {'lr': 0.00019898815986036227, 'samples': 1527008, 'steps': 2982, 'loss/train': 2.306300640106201} -09/21/2021 00:49:25 - INFO - __main__ - Step 47720: {'lr': 0.00019898815986036227, 'samples': 1527040, 'steps': 2982, 'loss/train': 1.8077478408813477} -09/21/2021 00:49:26 - INFO - __main__ - Step 47721: {'lr': 0.00019898815986036227, 'samples': 1527072, 'steps': 2982, 'loss/train': 1.9962188005447388} -09/21/2021 00:49:27 - INFO - __main__ - Step 47722: {'lr': 0.00019898815986036227, 'samples': 1527104, 'steps': 2982, 'loss/train': 1.9917042255401611} -09/21/2021 00:49:28 - INFO - __main__ - Step 47723: {'lr': 0.00019898815986036227, 'samples': 1527136, 'steps': 2982, 'loss/train': 2.0815296173095703} -09/21/2021 00:49:29 - INFO - __main__ - Step 47724: {'lr': 0.00019898815986036227, 'samples': 1527168, 'steps': 2982, 'loss/train': 2.6775667667388916} -09/21/2021 00:49:30 - INFO - __main__ - Step 47725: {'lr': 0.00019898815986036227, 'samples': 1527200, 'steps': 2982, 'loss/train': 2.233212471008301} -09/21/2021 00:49:30 - INFO - __main__ - Step 47726: {'lr': 0.00019898815986036227, 'samples': 1527232, 'steps': 2982, 'loss/train': 0.15134617686271667} -09/21/2021 00:49:31 - INFO - __main__ - Step 47727: {'lr': 0.00019898815986036227, 'samples': 1527264, 'steps': 2982, 'loss/train': 2.1036436557769775} -09/21/2021 00:49:32 - INFO - __main__ - Step 47728: {'lr': 0.00019898815986036227, 'samples': 1527296, 'steps': 2982, 'loss/train': 1.6574474573135376} -09/21/2021 00:49:33 - INFO - __main__ - Step 47729: {'lr': 0.00019898725452428617, 'samples': 1527328, 'steps': 2983, 'loss/train': 2.19228196144104} -09/21/2021 00:49:34 - INFO - __main__ - Step 47730: {'lr': 0.00019898725452428617, 'samples': 1527360, 'steps': 2983, 'loss/train': 1.9641523361206055} -09/21/2021 00:49:34 - INFO - __main__ - Step 47731: {'lr': 0.00019898725452428617, 'samples': 1527392, 'steps': 2983, 'loss/train': 1.1313430070877075} -09/21/2021 00:49:35 - INFO - __main__ - Step 47732: {'lr': 0.00019898725452428617, 'samples': 1527424, 'steps': 2983, 'loss/train': 1.6675199270248413} -09/21/2021 00:49:36 - INFO - __main__ - Step 47733: {'lr': 0.00019898725452428617, 'samples': 1527456, 'steps': 2983, 'loss/train': 2.031463861465454} -09/21/2021 00:49:37 - INFO - __main__ - Step 47734: {'lr': 0.00019898725452428617, 'samples': 1527488, 'steps': 2983, 'loss/train': 1.2979998588562012} -09/21/2021 00:49:37 - INFO - __main__ - Step 47735: {'lr': 0.00019898725452428617, 'samples': 1527520, 'steps': 2983, 'loss/train': 2.432386636734009} -09/21/2021 00:49:38 - INFO - __main__ - Step 47736: {'lr': 0.00019898725452428617, 'samples': 1527552, 'steps': 2983, 'loss/train': 0.10735492408275604} -09/21/2021 00:49:39 - INFO - __main__ - Step 47737: {'lr': 0.00019898725452428617, 'samples': 1527584, 'steps': 2983, 'loss/train': 0.13495270907878876} -09/21/2021 00:49:40 - INFO - __main__ - Step 47738: {'lr': 0.00019898725452428617, 'samples': 1527616, 'steps': 2983, 'loss/train': 2.4238059520721436} -09/21/2021 00:49:40 - INFO - __main__ - Step 47739: {'lr': 0.00019898725452428617, 'samples': 1527648, 'steps': 2983, 'loss/train': 2.958627700805664} -09/21/2021 00:49:41 - INFO - __main__ - Step 47740: {'lr': 0.00019898725452428617, 'samples': 1527680, 'steps': 2983, 'loss/train': 6.047813415527344} -09/21/2021 00:49:42 - INFO - __main__ - Step 47741: {'lr': 0.00019898725452428617, 'samples': 1527712, 'steps': 2983, 'loss/train': 2.4574668407440186} -09/21/2021 00:49:43 - INFO - __main__ - Step 47742: {'lr': 0.00019898725452428617, 'samples': 1527744, 'steps': 2983, 'loss/train': 2.016153573989868} -09/21/2021 00:49:43 - INFO - __main__ - Step 47743: {'lr': 0.00019898725452428617, 'samples': 1527776, 'steps': 2983, 'loss/train': 1.906623363494873} -09/21/2021 00:49:44 - INFO - __main__ - Step 47744: {'lr': 0.00019898725452428617, 'samples': 1527808, 'steps': 2983, 'loss/train': 1.5785009860992432} -09/21/2021 00:49:45 - INFO - __main__ - Step 47745: {'lr': 0.0001989863487854313, 'samples': 1527840, 'steps': 2984, 'loss/train': 2.1227028369903564} -09/21/2021 00:49:46 - INFO - __main__ - Step 47746: {'lr': 0.0001989863487854313, 'samples': 1527872, 'steps': 2984, 'loss/train': 1.2979058027267456} -09/21/2021 00:49:46 - INFO - __main__ - Step 47747: {'lr': 0.0001989863487854313, 'samples': 1527904, 'steps': 2984, 'loss/train': 1.9750888347625732} -09/21/2021 00:49:47 - INFO - __main__ - Step 47748: {'lr': 0.0001989863487854313, 'samples': 1527936, 'steps': 2984, 'loss/train': 1.548478364944458} -09/21/2021 00:49:48 - INFO - __main__ - Step 47749: {'lr': 0.0001989863487854313, 'samples': 1527968, 'steps': 2984, 'loss/train': 1.7076936960220337} -09/21/2021 00:49:49 - INFO - __main__ - Step 47750: {'lr': 0.0001989863487854313, 'samples': 1528000, 'steps': 2984, 'loss/train': 1.753491759300232} -09/21/2021 00:49:49 - INFO - __main__ - Step 47751: {'lr': 0.0001989863487854313, 'samples': 1528032, 'steps': 2984, 'loss/train': 2.424191474914551} -09/21/2021 00:49:50 - INFO - __main__ - Step 47752: {'lr': 0.0001989863487854313, 'samples': 1528064, 'steps': 2984, 'loss/train': 1.9527443647384644} -09/21/2021 00:49:51 - INFO - __main__ - Step 47753: {'lr': 0.0001989863487854313, 'samples': 1528096, 'steps': 2984, 'loss/train': 2.7109532356262207} -09/21/2021 00:49:52 - INFO - __main__ - Step 47754: {'lr': 0.0001989863487854313, 'samples': 1528128, 'steps': 2984, 'loss/train': 1.906927227973938} -09/21/2021 00:49:53 - INFO - __main__ - Step 47755: {'lr': 0.0001989863487854313, 'samples': 1528160, 'steps': 2984, 'loss/train': 0.46803542971611023} -09/21/2021 00:49:54 - INFO - __main__ - Step 47756: {'lr': 0.0001989863487854313, 'samples': 1528192, 'steps': 2984, 'loss/train': 1.7970826625823975} -09/21/2021 00:49:55 - INFO - __main__ - Step 47757: {'lr': 0.0001989863487854313, 'samples': 1528224, 'steps': 2984, 'loss/train': 2.0721004009246826} -09/21/2021 00:49:55 - INFO - __main__ - Step 47758: {'lr': 0.0001989863487854313, 'samples': 1528256, 'steps': 2984, 'loss/train': 2.330174684524536} -09/21/2021 00:49:56 - INFO - __main__ - Step 47759: {'lr': 0.0001989863487854313, 'samples': 1528288, 'steps': 2984, 'loss/train': 1.6785091161727905} -09/21/2021 00:49:57 - INFO - __main__ - Step 47760: {'lr': 0.0001989863487854313, 'samples': 1528320, 'steps': 2984, 'loss/train': 3.2416186332702637} -09/21/2021 00:49:58 - INFO - __main__ - Step 47761: {'lr': 0.00019898544264380138, 'samples': 1528352, 'steps': 2985, 'loss/train': 3.233661651611328} -09/21/2021 00:49:59 - INFO - __main__ - Step 47762: {'lr': 0.00019898544264380138, 'samples': 1528384, 'steps': 2985, 'loss/train': 3.260305166244507} -09/21/2021 00:49:59 - INFO - __main__ - Step 47763: {'lr': 0.00019898544264380138, 'samples': 1528416, 'steps': 2985, 'loss/train': 1.8429149389266968} -09/21/2021 00:50:00 - INFO - __main__ - Step 47764: {'lr': 0.00019898544264380138, 'samples': 1528448, 'steps': 2985, 'loss/train': 2.1841681003570557} -09/21/2021 00:50:01 - INFO - __main__ - Step 47765: {'lr': 0.00019898544264380138, 'samples': 1528480, 'steps': 2985, 'loss/train': 1.4140279293060303} -09/21/2021 00:50:02 - INFO - __main__ - Step 47766: {'lr': 0.00019898544264380138, 'samples': 1528512, 'steps': 2985, 'loss/train': 1.0751869678497314} -09/21/2021 00:50:02 - INFO - __main__ - Step 47767: {'lr': 0.00019898544264380138, 'samples': 1528544, 'steps': 2985, 'loss/train': 1.239052653312683} -09/21/2021 00:50:03 - INFO - __main__ - Step 47768: {'lr': 0.00019898544264380138, 'samples': 1528576, 'steps': 2985, 'loss/train': 2.338221311569214} -09/21/2021 00:50:04 - INFO - __main__ - Step 47769: {'lr': 0.00019898544264380138, 'samples': 1528608, 'steps': 2985, 'loss/train': 2.4189279079437256} -09/21/2021 00:50:05 - INFO - __main__ - Step 47770: {'lr': 0.00019898544264380138, 'samples': 1528640, 'steps': 2985, 'loss/train': 1.8058233261108398} -09/21/2021 00:50:05 - INFO - __main__ - Step 47771: {'lr': 0.00019898544264380138, 'samples': 1528672, 'steps': 2985, 'loss/train': 2.2360105514526367} -09/21/2021 00:50:06 - INFO - __main__ - Step 47772: {'lr': 0.00019898544264380138, 'samples': 1528704, 'steps': 2985, 'loss/train': 2.030900716781616} -09/21/2021 00:50:07 - INFO - __main__ - Step 47773: {'lr': 0.00019898544264380138, 'samples': 1528736, 'steps': 2985, 'loss/train': 2.613173723220825} -09/21/2021 00:50:08 - INFO - __main__ - Step 47774: {'lr': 0.00019898544264380138, 'samples': 1528768, 'steps': 2985, 'loss/train': 2.1962263584136963} -09/21/2021 00:50:08 - INFO - __main__ - Step 47775: {'lr': 0.00019898544264380138, 'samples': 1528800, 'steps': 2985, 'loss/train': 1.3547749519348145} -09/21/2021 00:50:09 - INFO - __main__ - Step 47776: {'lr': 0.00019898544264380138, 'samples': 1528832, 'steps': 2985, 'loss/train': 2.308586359024048} -09/21/2021 00:50:10 - INFO - __main__ - Step 47777: {'lr': 0.00019898453609940004, 'samples': 1528864, 'steps': 2986, 'loss/train': 2.6774587631225586} -09/21/2021 00:50:11 - INFO - __main__ - Step 47778: {'lr': 0.00019898453609940004, 'samples': 1528896, 'steps': 2986, 'loss/train': 1.7453978061676025} -09/21/2021 00:50:11 - INFO - __main__ - Step 47779: {'lr': 0.00019898453609940004, 'samples': 1528928, 'steps': 2986, 'loss/train': 3.0416364669799805} -09/21/2021 00:50:12 - INFO - __main__ - Step 47780: {'lr': 0.00019898453609940004, 'samples': 1528960, 'steps': 2986, 'loss/train': 1.9704017639160156} -09/21/2021 00:50:13 - INFO - __main__ - Step 47781: {'lr': 0.00019898453609940004, 'samples': 1528992, 'steps': 2986, 'loss/train': 2.7739148139953613} -09/21/2021 00:50:14 - INFO - __main__ - Step 47782: {'lr': 0.00019898453609940004, 'samples': 1529024, 'steps': 2986, 'loss/train': 2.060582399368286} -09/21/2021 00:50:14 - INFO - __main__ - Step 47783: {'lr': 0.00019898453609940004, 'samples': 1529056, 'steps': 2986, 'loss/train': 1.156686782836914} -09/21/2021 00:50:15 - INFO - __main__ - Step 47784: {'lr': 0.00019898453609940004, 'samples': 1529088, 'steps': 2986, 'loss/train': 2.484607219696045} -09/21/2021 00:50:16 - INFO - __main__ - Step 47785: {'lr': 0.00019898453609940004, 'samples': 1529120, 'steps': 2986, 'loss/train': 1.9399526119232178} -09/21/2021 00:50:17 - INFO - __main__ - Step 47786: {'lr': 0.00019898453609940004, 'samples': 1529152, 'steps': 2986, 'loss/train': 2.438861846923828} -09/21/2021 00:50:17 - INFO - __main__ - Step 47787: {'lr': 0.00019898453609940004, 'samples': 1529184, 'steps': 2986, 'loss/train': 2.766789674758911} -09/21/2021 00:50:19 - INFO - __main__ - Step 47788: {'lr': 0.00019898453609940004, 'samples': 1529216, 'steps': 2986, 'loss/train': 2.7149362564086914} -09/21/2021 00:50:20 - INFO - __main__ - Step 47789: {'lr': 0.00019898453609940004, 'samples': 1529248, 'steps': 2986, 'loss/train': 2.596813678741455} -09/21/2021 00:50:20 - INFO - __main__ - Step 47790: {'lr': 0.00019898453609940004, 'samples': 1529280, 'steps': 2986, 'loss/train': 2.602895975112915} -09/21/2021 00:50:21 - INFO - __main__ - Step 47791: {'lr': 0.00019898453609940004, 'samples': 1529312, 'steps': 2986, 'loss/train': 1.2501388788223267} -09/21/2021 00:50:22 - INFO - __main__ - Step 47792: {'lr': 0.00019898453609940004, 'samples': 1529344, 'steps': 2986, 'loss/train': 2.2953295707702637} -09/21/2021 00:50:23 - INFO - __main__ - Step 47793: {'lr': 0.000198983629152231, 'samples': 1529376, 'steps': 2987, 'loss/train': 2.3970813751220703} -09/21/2021 00:50:23 - INFO - __main__ - Step 47794: {'lr': 0.000198983629152231, 'samples': 1529408, 'steps': 2987, 'loss/train': 2.314366102218628} -09/21/2021 00:50:24 - INFO - __main__ - Step 47795: {'lr': 0.000198983629152231, 'samples': 1529440, 'steps': 2987, 'loss/train': 1.892500400543213} -09/21/2021 00:50:25 - INFO - __main__ - Step 47796: {'lr': 0.000198983629152231, 'samples': 1529472, 'steps': 2987, 'loss/train': 1.995005488395691} -09/21/2021 00:50:26 - INFO - __main__ - Step 47797: {'lr': 0.000198983629152231, 'samples': 1529504, 'steps': 2987, 'loss/train': 2.1031999588012695} -09/21/2021 00:50:26 - INFO - __main__ - Step 47798: {'lr': 0.000198983629152231, 'samples': 1529536, 'steps': 2987, 'loss/train': 2.1545329093933105} -09/21/2021 00:50:27 - INFO - __main__ - Step 47799: {'lr': 0.000198983629152231, 'samples': 1529568, 'steps': 2987, 'loss/train': 2.2883458137512207} -09/21/2021 00:50:28 - INFO - __main__ - Step 47800: {'lr': 0.000198983629152231, 'samples': 1529600, 'steps': 2987, 'loss/train': 2.367236852645874} -09/21/2021 00:50:29 - INFO - __main__ - Step 47801: {'lr': 0.000198983629152231, 'samples': 1529632, 'steps': 2987, 'loss/train': 1.352218747138977} -09/21/2021 00:50:29 - INFO - __main__ - Step 47802: {'lr': 0.000198983629152231, 'samples': 1529664, 'steps': 2987, 'loss/train': 2.3499531745910645} -09/21/2021 00:50:30 - INFO - __main__ - Step 47803: {'lr': 0.000198983629152231, 'samples': 1529696, 'steps': 2987, 'loss/train': 1.5928072929382324} -09/21/2021 00:50:31 - INFO - __main__ - Step 47804: {'lr': 0.000198983629152231, 'samples': 1529728, 'steps': 2987, 'loss/train': 1.6110179424285889} -09/21/2021 00:50:32 - INFO - __main__ - Step 47805: {'lr': 0.000198983629152231, 'samples': 1529760, 'steps': 2987, 'loss/train': 1.886863350868225} -09/21/2021 00:50:32 - INFO - __main__ - Step 47806: {'lr': 0.000198983629152231, 'samples': 1529792, 'steps': 2987, 'loss/train': 1.727237343788147} -09/21/2021 00:50:33 - INFO - __main__ - Step 47807: {'lr': 0.000198983629152231, 'samples': 1529824, 'steps': 2987, 'loss/train': 1.4562557935714722} -09/21/2021 00:50:34 - INFO - __main__ - Step 47808: {'lr': 0.000198983629152231, 'samples': 1529856, 'steps': 2987, 'loss/train': 2.3248138427734375} -09/21/2021 00:50:35 - INFO - __main__ - Step 47809: {'lr': 0.000198982721802298, 'samples': 1529888, 'steps': 2988, 'loss/train': 1.6715905666351318} -09/21/2021 00:50:36 - INFO - __main__ - Step 47810: {'lr': 0.000198982721802298, 'samples': 1529920, 'steps': 2988, 'loss/train': 1.8224629163742065} -09/21/2021 00:50:36 - INFO - __main__ - Step 47811: {'lr': 0.000198982721802298, 'samples': 1529952, 'steps': 2988, 'loss/train': 1.750709891319275} -09/21/2021 00:50:37 - INFO - __main__ - Step 47812: {'lr': 0.000198982721802298, 'samples': 1529984, 'steps': 2988, 'loss/train': 2.0149567127227783} -09/21/2021 00:50:38 - INFO - __main__ - Step 47813: {'lr': 0.000198982721802298, 'samples': 1530016, 'steps': 2988, 'loss/train': 2.1940689086914062} -09/21/2021 00:50:39 - INFO - __main__ - Step 47814: {'lr': 0.000198982721802298, 'samples': 1530048, 'steps': 2988, 'loss/train': 1.6486108303070068} -09/21/2021 00:50:39 - INFO - __main__ - Step 47815: {'lr': 0.000198982721802298, 'samples': 1530080, 'steps': 2988, 'loss/train': 1.4218205213546753} -09/21/2021 00:50:40 - INFO - __main__ - Step 47816: {'lr': 0.000198982721802298, 'samples': 1530112, 'steps': 2988, 'loss/train': 2.0522377490997314} -09/21/2021 00:50:41 - INFO - __main__ - Step 47817: {'lr': 0.000198982721802298, 'samples': 1530144, 'steps': 2988, 'loss/train': 1.3532384634017944} -09/21/2021 00:50:43 - INFO - __main__ - Step 47818: {'lr': 0.000198982721802298, 'samples': 1530176, 'steps': 2988, 'loss/train': 1.4346920251846313} -09/21/2021 00:50:43 - INFO - __main__ - Step 47819: {'lr': 0.000198982721802298, 'samples': 1530208, 'steps': 2988, 'loss/train': 2.1485466957092285} -09/21/2021 00:50:44 - INFO - __main__ - Step 47820: {'lr': 0.000198982721802298, 'samples': 1530240, 'steps': 2988, 'loss/train': 2.2836039066314697} -09/21/2021 00:50:45 - INFO - __main__ - Step 47821: {'lr': 0.000198982721802298, 'samples': 1530272, 'steps': 2988, 'loss/train': 2.5149896144866943} -09/21/2021 00:50:46 - INFO - __main__ - Step 47822: {'lr': 0.000198982721802298, 'samples': 1530304, 'steps': 2988, 'loss/train': 1.5082457065582275} -09/21/2021 00:50:46 - INFO - __main__ - Step 47823: {'lr': 0.000198982721802298, 'samples': 1530336, 'steps': 2988, 'loss/train': 0.8343294262886047} -09/21/2021 00:50:47 - INFO - __main__ - Step 47824: {'lr': 0.000198982721802298, 'samples': 1530368, 'steps': 2988, 'loss/train': 2.2667479515075684} -09/21/2021 00:50:48 - INFO - __main__ - Step 47825: {'lr': 0.00019898181404960465, 'samples': 1530400, 'steps': 2989, 'loss/train': 1.9371074438095093} -09/21/2021 00:50:49 - INFO - __main__ - Step 47826: {'lr': 0.00019898181404960465, 'samples': 1530432, 'steps': 2989, 'loss/train': 1.9092614650726318} -09/21/2021 00:50:50 - INFO - __main__ - Step 47827: {'lr': 0.00019898181404960465, 'samples': 1530464, 'steps': 2989, 'loss/train': 1.7062052488327026} -09/21/2021 00:50:50 - INFO - __main__ - Step 47828: {'lr': 0.00019898181404960465, 'samples': 1530496, 'steps': 2989, 'loss/train': 2.511453866958618} -09/21/2021 00:50:51 - INFO - __main__ - Step 47829: {'lr': 0.00019898181404960465, 'samples': 1530528, 'steps': 2989, 'loss/train': 1.7432606220245361} -09/21/2021 00:50:52 - INFO - __main__ - Step 47830: {'lr': 0.00019898181404960465, 'samples': 1530560, 'steps': 2989, 'loss/train': 2.127687454223633} -09/21/2021 00:50:53 - INFO - __main__ - Step 47831: {'lr': 0.00019898181404960465, 'samples': 1530592, 'steps': 2989, 'loss/train': 1.97892165184021} -09/21/2021 00:50:53 - INFO - __main__ - Step 47832: {'lr': 0.00019898181404960465, 'samples': 1530624, 'steps': 2989, 'loss/train': 1.360654354095459} -09/21/2021 00:50:54 - INFO - __main__ - Step 47833: {'lr': 0.00019898181404960465, 'samples': 1530656, 'steps': 2989, 'loss/train': 0.8566622734069824} -09/21/2021 00:50:55 - INFO - __main__ - Step 47834: {'lr': 0.00019898181404960465, 'samples': 1530688, 'steps': 2989, 'loss/train': 1.4526625871658325} -09/21/2021 00:50:56 - INFO - __main__ - Step 47835: {'lr': 0.00019898181404960465, 'samples': 1530720, 'steps': 2989, 'loss/train': 2.4636106491088867} -09/21/2021 00:50:56 - INFO - __main__ - Step 47836: {'lr': 0.00019898181404960465, 'samples': 1530752, 'steps': 2989, 'loss/train': 2.768192768096924} -09/21/2021 00:50:57 - INFO - __main__ - Step 47837: {'lr': 0.00019898181404960465, 'samples': 1530784, 'steps': 2989, 'loss/train': 2.0077555179595947} -09/21/2021 00:50:58 - INFO - __main__ - Step 47838: {'lr': 0.00019898181404960465, 'samples': 1530816, 'steps': 2989, 'loss/train': 2.1790337562561035} -09/21/2021 00:50:59 - INFO - __main__ - Step 47839: {'lr': 0.00019898181404960465, 'samples': 1530848, 'steps': 2989, 'loss/train': 2.49088454246521} -09/21/2021 00:50:59 - INFO - __main__ - Step 47840: {'lr': 0.00019898181404960465, 'samples': 1530880, 'steps': 2989, 'loss/train': 3.5175106525421143} -09/21/2021 00:51:00 - INFO - __main__ - Step 47841: {'lr': 0.00019898090589415472, 'samples': 1530912, 'steps': 2990, 'loss/train': 1.6092137098312378} -09/21/2021 00:51:01 - INFO - __main__ - Step 47842: {'lr': 0.00019898090589415472, 'samples': 1530944, 'steps': 2990, 'loss/train': 0.37356483936309814} -09/21/2021 00:51:02 - INFO - __main__ - Step 47843: {'lr': 0.00019898090589415472, 'samples': 1530976, 'steps': 2990, 'loss/train': 1.9619272947311401} -09/21/2021 00:51:02 - INFO - __main__ - Step 47844: {'lr': 0.00019898090589415472, 'samples': 1531008, 'steps': 2990, 'loss/train': 2.5579302310943604} -09/21/2021 00:51:03 - INFO - __main__ - Step 47845: {'lr': 0.00019898090589415472, 'samples': 1531040, 'steps': 2990, 'loss/train': 2.3968005180358887} -09/21/2021 00:51:04 - INFO - __main__ - Step 47846: {'lr': 0.00019898090589415472, 'samples': 1531072, 'steps': 2990, 'loss/train': 2.1159067153930664} -09/21/2021 00:51:05 - INFO - __main__ - Step 47847: {'lr': 0.00019898090589415472, 'samples': 1531104, 'steps': 2990, 'loss/train': 1.5851850509643555} -09/21/2021 00:51:05 - INFO - __main__ - Step 47848: {'lr': 0.00019898090589415472, 'samples': 1531136, 'steps': 2990, 'loss/train': 2.3742337226867676} -09/21/2021 00:51:07 - INFO - __main__ - Step 47849: {'lr': 0.00019898090589415472, 'samples': 1531168, 'steps': 2990, 'loss/train': 1.4497051239013672} -09/21/2021 00:51:07 - INFO - __main__ - Step 47850: {'lr': 0.00019898090589415472, 'samples': 1531200, 'steps': 2990, 'loss/train': 0.22297482192516327} -09/21/2021 00:51:08 - INFO - __main__ - Step 47851: {'lr': 0.00019898090589415472, 'samples': 1531232, 'steps': 2990, 'loss/train': 2.352304458618164} -09/21/2021 00:51:09 - INFO - __main__ - Step 47852: {'lr': 0.00019898090589415472, 'samples': 1531264, 'steps': 2990, 'loss/train': 2.1734845638275146} -09/21/2021 00:51:10 - INFO - __main__ - Step 47853: {'lr': 0.00019898090589415472, 'samples': 1531296, 'steps': 2990, 'loss/train': 2.170323371887207} -09/21/2021 00:51:10 - INFO - __main__ - Step 47854: {'lr': 0.00019898090589415472, 'samples': 1531328, 'steps': 2990, 'loss/train': 1.9828405380249023} -09/21/2021 00:51:11 - INFO - __main__ - Step 47855: {'lr': 0.00019898090589415472, 'samples': 1531360, 'steps': 2990, 'loss/train': 1.9474185705184937} -09/21/2021 00:51:12 - INFO - __main__ - Step 47856: {'lr': 0.00019898090589415472, 'samples': 1531392, 'steps': 2990, 'loss/train': 1.7438108921051025} -09/21/2021 00:51:13 - INFO - __main__ - Step 47857: {'lr': 0.00019897999733595184, 'samples': 1531424, 'steps': 2991, 'loss/train': 2.196789264678955} -09/21/2021 00:51:14 - INFO - __main__ - Step 47858: {'lr': 0.00019897999733595184, 'samples': 1531456, 'steps': 2991, 'loss/train': 1.5258177518844604} -09/21/2021 00:51:14 - INFO - __main__ - Step 47859: {'lr': 0.00019897999733595184, 'samples': 1531488, 'steps': 2991, 'loss/train': 2.257906675338745} -09/21/2021 00:51:15 - INFO - __main__ - Step 47860: {'lr': 0.00019897999733595184, 'samples': 1531520, 'steps': 2991, 'loss/train': 1.680313229560852} -09/21/2021 00:51:16 - INFO - __main__ - Step 47861: {'lr': 0.00019897999733595184, 'samples': 1531552, 'steps': 2991, 'loss/train': 1.6964958906173706} -09/21/2021 00:51:17 - INFO - __main__ - Step 47862: {'lr': 0.00019897999733595184, 'samples': 1531584, 'steps': 2991, 'loss/train': 2.3866233825683594} -09/21/2021 00:51:17 - INFO - __main__ - Step 47863: {'lr': 0.00019897999733595184, 'samples': 1531616, 'steps': 2991, 'loss/train': 1.6911824941635132} -09/21/2021 00:51:18 - INFO - __main__ - Step 47864: {'lr': 0.00019897999733595184, 'samples': 1531648, 'steps': 2991, 'loss/train': 2.2423126697540283} -09/21/2021 00:51:19 - INFO - __main__ - Step 47865: {'lr': 0.00019897999733595184, 'samples': 1531680, 'steps': 2991, 'loss/train': 1.3883198499679565} -09/21/2021 00:51:20 - INFO - __main__ - Step 47866: {'lr': 0.00019897999733595184, 'samples': 1531712, 'steps': 2991, 'loss/train': 1.749175786972046} -09/21/2021 00:51:20 - INFO - __main__ - Step 47867: {'lr': 0.00019897999733595184, 'samples': 1531744, 'steps': 2991, 'loss/train': 0.16664676368236542} -09/21/2021 00:51:21 - INFO - __main__ - Step 47868: {'lr': 0.00019897999733595184, 'samples': 1531776, 'steps': 2991, 'loss/train': 2.393000364303589} -09/21/2021 00:51:22 - INFO - __main__ - Step 47869: {'lr': 0.00019897999733595184, 'samples': 1531808, 'steps': 2991, 'loss/train': 2.0078392028808594} -09/21/2021 00:51:23 - INFO - __main__ - Step 47870: {'lr': 0.00019897999733595184, 'samples': 1531840, 'steps': 2991, 'loss/train': 1.7613886594772339} -09/21/2021 00:51:23 - INFO - __main__ - Step 47871: {'lr': 0.00019897999733595184, 'samples': 1531872, 'steps': 2991, 'loss/train': 2.8069632053375244} -09/21/2021 00:51:24 - INFO - __main__ - Step 47872: {'lr': 0.00019897999733595184, 'samples': 1531904, 'steps': 2991, 'loss/train': 1.7313748598098755} -09/21/2021 00:51:25 - INFO - __main__ - Step 47873: {'lr': 0.00019897908837499974, 'samples': 1531936, 'steps': 2992, 'loss/train': 1.6854342222213745} -09/21/2021 00:51:26 - INFO - __main__ - Step 47874: {'lr': 0.00019897908837499974, 'samples': 1531968, 'steps': 2992, 'loss/train': 2.6548173427581787} -09/21/2021 00:51:26 - INFO - __main__ - Step 47875: {'lr': 0.00019897908837499974, 'samples': 1532000, 'steps': 2992, 'loss/train': 1.9458413124084473} -09/21/2021 00:51:27 - INFO - __main__ - Step 47876: {'lr': 0.00019897908837499974, 'samples': 1532032, 'steps': 2992, 'loss/train': 2.9107606410980225} -09/21/2021 00:51:28 - INFO - __main__ - Step 47877: {'lr': 0.00019897908837499974, 'samples': 1532064, 'steps': 2992, 'loss/train': 2.9074151515960693} -09/21/2021 00:51:29 - INFO - __main__ - Step 47878: {'lr': 0.00019897908837499974, 'samples': 1532096, 'steps': 2992, 'loss/train': 2.8702268600463867} -09/21/2021 00:51:29 - INFO - __main__ - Step 47879: {'lr': 0.00019897908837499974, 'samples': 1532128, 'steps': 2992, 'loss/train': 1.7777862548828125} -09/21/2021 00:51:31 - INFO - __main__ - Step 47880: {'lr': 0.00019897908837499974, 'samples': 1532160, 'steps': 2992, 'loss/train': 2.401850700378418} -09/21/2021 00:51:32 - INFO - __main__ - Step 47881: {'lr': 0.00019897908837499974, 'samples': 1532192, 'steps': 2992, 'loss/train': 2.1423754692077637} -09/21/2021 00:51:33 - INFO - __main__ - Step 47882: {'lr': 0.00019897908837499974, 'samples': 1532224, 'steps': 2992, 'loss/train': 2.2835934162139893} -09/21/2021 00:51:33 - INFO - __main__ - Step 47883: {'lr': 0.00019897908837499974, 'samples': 1532256, 'steps': 2992, 'loss/train': 2.0227348804473877} -09/21/2021 00:51:34 - INFO - __main__ - Step 47884: {'lr': 0.00019897908837499974, 'samples': 1532288, 'steps': 2992, 'loss/train': 2.032904624938965} -09/21/2021 00:51:35 - INFO - __main__ - Step 47885: {'lr': 0.00019897908837499974, 'samples': 1532320, 'steps': 2992, 'loss/train': 1.5995872020721436} -09/21/2021 00:51:36 - INFO - __main__ - Step 47886: {'lr': 0.00019897908837499974, 'samples': 1532352, 'steps': 2992, 'loss/train': 1.9200903177261353} -09/21/2021 00:51:36 - INFO - __main__ - Step 47887: {'lr': 0.00019897908837499974, 'samples': 1532384, 'steps': 2992, 'loss/train': 1.674941062927246} -09/21/2021 00:51:37 - INFO - __main__ - Step 47888: {'lr': 0.00019897908837499974, 'samples': 1532416, 'steps': 2992, 'loss/train': 1.4614336490631104} -09/21/2021 00:51:38 - INFO - __main__ - Step 47889: {'lr': 0.00019897817901130214, 'samples': 1532448, 'steps': 2993, 'loss/train': 2.285065174102783} -09/21/2021 00:51:39 - INFO - __main__ - Step 47890: {'lr': 0.00019897817901130214, 'samples': 1532480, 'steps': 2993, 'loss/train': 2.2305006980895996} -09/21/2021 00:51:39 - INFO - __main__ - Step 47891: {'lr': 0.00019897817901130214, 'samples': 1532512, 'steps': 2993, 'loss/train': 0.3459385931491852} -09/21/2021 00:51:40 - INFO - __main__ - Step 47892: {'lr': 0.00019897817901130214, 'samples': 1532544, 'steps': 2993, 'loss/train': 2.187897205352783} -09/21/2021 00:51:41 - INFO - __main__ - Step 47893: {'lr': 0.00019897817901130214, 'samples': 1532576, 'steps': 2993, 'loss/train': 2.150719165802002} -09/21/2021 00:51:42 - INFO - __main__ - Step 47894: {'lr': 0.00019897817901130214, 'samples': 1532608, 'steps': 2993, 'loss/train': 1.4307187795639038} -09/21/2021 00:51:42 - INFO - __main__ - Step 47895: {'lr': 0.00019897817901130214, 'samples': 1532640, 'steps': 2993, 'loss/train': 5.489540100097656} -09/21/2021 00:51:43 - INFO - __main__ - Step 47896: {'lr': 0.00019897817901130214, 'samples': 1532672, 'steps': 2993, 'loss/train': 1.3722796440124512} -09/21/2021 00:51:44 - INFO - __main__ - Step 47897: {'lr': 0.00019897817901130214, 'samples': 1532704, 'steps': 2993, 'loss/train': 2.626114845275879} -09/21/2021 00:51:45 - INFO - __main__ - Step 47898: {'lr': 0.00019897817901130214, 'samples': 1532736, 'steps': 2993, 'loss/train': 1.7428745031356812} -09/21/2021 00:51:45 - INFO - __main__ - Step 47899: {'lr': 0.00019897817901130214, 'samples': 1532768, 'steps': 2993, 'loss/train': 0.2532684803009033} -09/21/2021 00:51:46 - INFO - __main__ - Step 47900: {'lr': 0.00019897817901130214, 'samples': 1532800, 'steps': 2993, 'loss/train': 1.4643136262893677} -09/21/2021 00:51:47 - INFO - __main__ - Step 47901: {'lr': 0.00019897817901130214, 'samples': 1532832, 'steps': 2993, 'loss/train': 2.4139721393585205} -09/21/2021 00:51:48 - INFO - __main__ - Step 47902: {'lr': 0.00019897817901130214, 'samples': 1532864, 'steps': 2993, 'loss/train': 2.697753667831421} -09/21/2021 00:51:48 - INFO - __main__ - Step 47903: {'lr': 0.00019897817901130214, 'samples': 1532896, 'steps': 2993, 'loss/train': 1.9758734703063965} -09/21/2021 00:51:49 - INFO - __main__ - Step 47904: {'lr': 0.00019897817901130214, 'samples': 1532928, 'steps': 2993, 'loss/train': 2.331604480743408} -09/21/2021 00:51:50 - INFO - __main__ - Step 47905: {'lr': 0.00019897726924486268, 'samples': 1532960, 'steps': 2994, 'loss/train': 1.4415762424468994} -09/21/2021 00:51:51 - INFO - __main__ - Step 47906: {'lr': 0.00019897726924486268, 'samples': 1532992, 'steps': 2994, 'loss/train': 1.5528347492218018} -09/21/2021 00:51:52 - INFO - __main__ - Step 47907: {'lr': 0.00019897726924486268, 'samples': 1533024, 'steps': 2994, 'loss/train': 2.0059738159179688} -09/21/2021 00:51:52 - INFO - __main__ - Step 47908: {'lr': 0.00019897726924486268, 'samples': 1533056, 'steps': 2994, 'loss/train': 2.7754218578338623} -09/21/2021 00:51:53 - INFO - __main__ - Step 47909: {'lr': 0.00019897726924486268, 'samples': 1533088, 'steps': 2994, 'loss/train': 3.0096800327301025} -09/21/2021 00:51:54 - INFO - __main__ - Step 47910: {'lr': 0.00019897726924486268, 'samples': 1533120, 'steps': 2994, 'loss/train': 1.3636749982833862} -09/21/2021 00:51:55 - INFO - __main__ - Step 47911: {'lr': 0.00019897726924486268, 'samples': 1533152, 'steps': 2994, 'loss/train': 2.3016908168792725} -09/21/2021 00:51:55 - INFO - __main__ - Step 47912: {'lr': 0.00019897726924486268, 'samples': 1533184, 'steps': 2994, 'loss/train': 1.5245453119277954} -09/21/2021 00:51:56 - INFO - __main__ - Step 47913: {'lr': 0.00019897726924486268, 'samples': 1533216, 'steps': 2994, 'loss/train': 1.8899034261703491} -09/21/2021 00:51:57 - INFO - __main__ - Step 47914: {'lr': 0.00019897726924486268, 'samples': 1533248, 'steps': 2994, 'loss/train': 1.8233230113983154} -09/21/2021 00:51:58 - INFO - __main__ - Step 47915: {'lr': 0.00019897726924486268, 'samples': 1533280, 'steps': 2994, 'loss/train': 1.5363237857818604} -09/21/2021 00:51:59 - INFO - __main__ - Step 47916: {'lr': 0.00019897726924486268, 'samples': 1533312, 'steps': 2994, 'loss/train': 2.4588639736175537} -09/21/2021 00:52:00 - INFO - __main__ - Step 47917: {'lr': 0.00019897726924486268, 'samples': 1533344, 'steps': 2994, 'loss/train': 3.3617210388183594} -09/21/2021 00:52:00 - INFO - __main__ - Step 47918: {'lr': 0.00019897726924486268, 'samples': 1533376, 'steps': 2994, 'loss/train': 2.0690910816192627} -09/21/2021 00:52:01 - INFO - __main__ - Step 47919: {'lr': 0.00019897726924486268, 'samples': 1533408, 'steps': 2994, 'loss/train': 2.4620654582977295} -09/21/2021 00:52:02 - INFO - __main__ - Step 47920: {'lr': 0.00019897726924486268, 'samples': 1533440, 'steps': 2994, 'loss/train': 1.7074832916259766} -09/21/2021 00:52:03 - INFO - __main__ - Step 47921: {'lr': 0.0001989763590756851, 'samples': 1533472, 'steps': 2995, 'loss/train': 2.590388536453247} -09/21/2021 00:52:03 - INFO - __main__ - Step 47922: {'lr': 0.0001989763590756851, 'samples': 1533504, 'steps': 2995, 'loss/train': 1.0995126962661743} -09/21/2021 00:52:04 - INFO - __main__ - Step 47923: {'lr': 0.0001989763590756851, 'samples': 1533536, 'steps': 2995, 'loss/train': 1.3191367387771606} -09/21/2021 00:52:05 - INFO - __main__ - Step 47924: {'lr': 0.0001989763590756851, 'samples': 1533568, 'steps': 2995, 'loss/train': 1.9736841917037964} -09/21/2021 00:52:06 - INFO - __main__ - Step 47925: {'lr': 0.0001989763590756851, 'samples': 1533600, 'steps': 2995, 'loss/train': 2.009824752807617} -09/21/2021 00:52:06 - INFO - __main__ - Step 47926: {'lr': 0.0001989763590756851, 'samples': 1533632, 'steps': 2995, 'loss/train': 2.244602918624878} -09/21/2021 00:52:07 - INFO - __main__ - Step 47927: {'lr': 0.0001989763590756851, 'samples': 1533664, 'steps': 2995, 'loss/train': 1.6828560829162598} -09/21/2021 00:52:08 - INFO - __main__ - Step 47928: {'lr': 0.0001989763590756851, 'samples': 1533696, 'steps': 2995, 'loss/train': 1.5194600820541382} -09/21/2021 00:52:09 - INFO - __main__ - Step 47929: {'lr': 0.0001989763590756851, 'samples': 1533728, 'steps': 2995, 'loss/train': 1.0729002952575684} -09/21/2021 00:52:09 - INFO - __main__ - Step 47930: {'lr': 0.0001989763590756851, 'samples': 1533760, 'steps': 2995, 'loss/train': 1.9322408437728882} -09/21/2021 00:52:10 - INFO - __main__ - Step 47931: {'lr': 0.0001989763590756851, 'samples': 1533792, 'steps': 2995, 'loss/train': 2.0571563243865967} -09/21/2021 00:52:11 - INFO - __main__ - Step 47932: {'lr': 0.0001989763590756851, 'samples': 1533824, 'steps': 2995, 'loss/train': 0.8992849588394165} -09/21/2021 00:52:12 - INFO - __main__ - Step 47933: {'lr': 0.0001989763590756851, 'samples': 1533856, 'steps': 2995, 'loss/train': 2.5152368545532227} -09/21/2021 00:52:12 - INFO - __main__ - Step 47934: {'lr': 0.0001989763590756851, 'samples': 1533888, 'steps': 2995, 'loss/train': 2.0775063037872314} -09/21/2021 00:52:13 - INFO - __main__ - Step 47935: {'lr': 0.0001989763590756851, 'samples': 1533920, 'steps': 2995, 'loss/train': 1.5511246919631958} -09/21/2021 00:52:14 - INFO - __main__ - Step 47936: {'lr': 0.0001989763590756851, 'samples': 1533952, 'steps': 2995, 'loss/train': 2.6171228885650635} -09/21/2021 00:52:15 - INFO - __main__ - Step 47937: {'lr': 0.00019897544850377313, 'samples': 1533984, 'steps': 2996, 'loss/train': 1.960740089416504} -09/21/2021 00:52:16 - INFO - __main__ - Step 47938: {'lr': 0.00019897544850377313, 'samples': 1534016, 'steps': 2996, 'loss/train': 1.6907676458358765} -09/21/2021 00:52:16 - INFO - __main__ - Step 47939: {'lr': 0.00019897544850377313, 'samples': 1534048, 'steps': 2996, 'loss/train': 2.958409309387207} -09/21/2021 00:52:17 - INFO - __main__ - Step 47940: {'lr': 0.00019897544850377313, 'samples': 1534080, 'steps': 2996, 'loss/train': 2.328892707824707} -09/21/2021 00:52:18 - INFO - __main__ - Step 47941: {'lr': 0.00019897544850377313, 'samples': 1534112, 'steps': 2996, 'loss/train': 1.2543704509735107} -09/21/2021 00:52:19 - INFO - __main__ - Step 47942: {'lr': 0.00019897544850377313, 'samples': 1534144, 'steps': 2996, 'loss/train': 2.3298416137695312} -09/21/2021 00:52:19 - INFO - __main__ - Step 47943: {'lr': 0.00019897544850377313, 'samples': 1534176, 'steps': 2996, 'loss/train': 1.9401469230651855} -09/21/2021 00:52:20 - INFO - __main__ - Step 47944: {'lr': 0.00019897544850377313, 'samples': 1534208, 'steps': 2996, 'loss/train': 1.9153698682785034} -09/21/2021 00:52:21 - INFO - __main__ - Step 47945: {'lr': 0.00019897544850377313, 'samples': 1534240, 'steps': 2996, 'loss/train': 1.7281335592269897} -09/21/2021 00:52:22 - INFO - __main__ - Step 47946: {'lr': 0.00019897544850377313, 'samples': 1534272, 'steps': 2996, 'loss/train': 0.8027008175849915} -09/21/2021 00:52:23 - INFO - __main__ - Step 47947: {'lr': 0.00019897544850377313, 'samples': 1534304, 'steps': 2996, 'loss/train': 2.193479537963867} -09/21/2021 00:52:24 - INFO - __main__ - Step 47948: {'lr': 0.00019897544850377313, 'samples': 1534336, 'steps': 2996, 'loss/train': 2.504112482070923} -09/21/2021 00:52:24 - INFO - __main__ - Step 47949: {'lr': 0.00019897544850377313, 'samples': 1534368, 'steps': 2996, 'loss/train': 2.3121578693389893} -09/21/2021 00:52:25 - INFO - __main__ - Step 47950: {'lr': 0.00019897544850377313, 'samples': 1534400, 'steps': 2996, 'loss/train': 1.6413705348968506} -09/21/2021 00:52:26 - INFO - __main__ - Step 47951: {'lr': 0.00019897544850377313, 'samples': 1534432, 'steps': 2996, 'loss/train': 2.6202352046966553} -09/21/2021 00:52:27 - INFO - __main__ - Step 47952: {'lr': 0.00019897544850377313, 'samples': 1534464, 'steps': 2996, 'loss/train': 2.572628974914551} -09/21/2021 00:52:28 - INFO - __main__ - Step 47953: {'lr': 0.00019897453752913043, 'samples': 1534496, 'steps': 2997, 'loss/train': 1.4644044637680054} -09/21/2021 00:52:28 - INFO - __main__ - Step 47954: {'lr': 0.00019897453752913043, 'samples': 1534528, 'steps': 2997, 'loss/train': 2.352266550064087} -09/21/2021 00:52:29 - INFO - __main__ - Step 47955: {'lr': 0.00019897453752913043, 'samples': 1534560, 'steps': 2997, 'loss/train': 1.1813056468963623} -09/21/2021 00:52:30 - INFO - __main__ - Step 47956: {'lr': 0.00019897453752913043, 'samples': 1534592, 'steps': 2997, 'loss/train': 1.6438014507293701} -09/21/2021 00:52:31 - INFO - __main__ - Step 47957: {'lr': 0.00019897453752913043, 'samples': 1534624, 'steps': 2997, 'loss/train': 1.1668559312820435} -09/21/2021 00:52:31 - INFO - __main__ - Step 47958: {'lr': 0.00019897453752913043, 'samples': 1534656, 'steps': 2997, 'loss/train': 2.305696487426758} -09/21/2021 00:52:32 - INFO - __main__ - Step 47959: {'lr': 0.00019897453752913043, 'samples': 1534688, 'steps': 2997, 'loss/train': 2.433021068572998} -09/21/2021 00:52:33 - INFO - __main__ - Step 47960: {'lr': 0.00019897453752913043, 'samples': 1534720, 'steps': 2997, 'loss/train': 2.5742645263671875} -09/21/2021 00:52:34 - INFO - __main__ - Step 47961: {'lr': 0.00019897453752913043, 'samples': 1534752, 'steps': 2997, 'loss/train': 1.1156519651412964} -09/21/2021 00:52:34 - INFO - __main__ - Step 47962: {'lr': 0.00019897453752913043, 'samples': 1534784, 'steps': 2997, 'loss/train': 2.2941787242889404} -09/21/2021 00:52:35 - INFO - __main__ - Step 47963: {'lr': 0.00019897453752913043, 'samples': 1534816, 'steps': 2997, 'loss/train': 1.6802747249603271} -09/21/2021 00:52:36 - INFO - __main__ - Step 47964: {'lr': 0.00019897453752913043, 'samples': 1534848, 'steps': 2997, 'loss/train': 1.8225350379943848} -09/21/2021 00:52:37 - INFO - __main__ - Step 47965: {'lr': 0.00019897453752913043, 'samples': 1534880, 'steps': 2997, 'loss/train': 1.2054264545440674} -09/21/2021 00:52:37 - INFO - __main__ - Step 47966: {'lr': 0.00019897453752913043, 'samples': 1534912, 'steps': 2997, 'loss/train': 2.8723690509796143} -09/21/2021 00:52:38 - INFO - __main__ - Step 47967: {'lr': 0.00019897453752913043, 'samples': 1534944, 'steps': 2997, 'loss/train': 2.65592360496521} -09/21/2021 00:52:39 - INFO - __main__ - Step 47968: {'lr': 0.00019897453752913043, 'samples': 1534976, 'steps': 2997, 'loss/train': 1.737557291984558} -09/21/2021 00:52:40 - INFO - __main__ - Step 47969: {'lr': 0.0001989736261517607, 'samples': 1535008, 'steps': 2998, 'loss/train': 1.3114744424819946} -09/21/2021 00:52:40 - INFO - __main__ - Step 47970: {'lr': 0.0001989736261517607, 'samples': 1535040, 'steps': 2998, 'loss/train': 2.064547300338745} -09/21/2021 00:52:41 - INFO - __main__ - Step 47971: {'lr': 0.0001989736261517607, 'samples': 1535072, 'steps': 2998, 'loss/train': 1.850056767463684} -09/21/2021 00:52:42 - INFO - __main__ - Step 47972: {'lr': 0.0001989736261517607, 'samples': 1535104, 'steps': 2998, 'loss/train': 1.9517918825149536} -09/21/2021 00:52:43 - INFO - __main__ - Step 47973: {'lr': 0.0001989736261517607, 'samples': 1535136, 'steps': 2998, 'loss/train': 2.2883753776550293} -09/21/2021 00:52:43 - INFO - __main__ - Step 47974: {'lr': 0.0001989736261517607, 'samples': 1535168, 'steps': 2998, 'loss/train': 2.071599245071411} -09/21/2021 00:52:44 - INFO - __main__ - Step 47975: {'lr': 0.0001989736261517607, 'samples': 1535200, 'steps': 2998, 'loss/train': 2.221402645111084} -09/21/2021 00:52:46 - INFO - __main__ - Step 47976: {'lr': 0.0001989736261517607, 'samples': 1535232, 'steps': 2998, 'loss/train': 1.4765219688415527} -09/21/2021 00:52:47 - INFO - __main__ - Step 47977: {'lr': 0.0001989736261517607, 'samples': 1535264, 'steps': 2998, 'loss/train': 2.0940895080566406} -09/21/2021 00:52:47 - INFO - __main__ - Step 47978: {'lr': 0.0001989736261517607, 'samples': 1535296, 'steps': 2998, 'loss/train': 1.6435290575027466} -09/21/2021 00:52:48 - INFO - __main__ - Step 47979: {'lr': 0.0001989736261517607, 'samples': 1535328, 'steps': 2998, 'loss/train': 2.4097652435302734} -09/21/2021 00:52:49 - INFO - __main__ - Step 47980: {'lr': 0.0001989736261517607, 'samples': 1535360, 'steps': 2998, 'loss/train': 2.083270788192749} -09/21/2021 00:52:50 - INFO - __main__ - Step 47981: {'lr': 0.0001989736261517607, 'samples': 1535392, 'steps': 2998, 'loss/train': 1.868908166885376} -09/21/2021 00:52:50 - INFO - __main__ - Step 47982: {'lr': 0.0001989736261517607, 'samples': 1535424, 'steps': 2998, 'loss/train': 0.3586216866970062} -09/21/2021 00:52:51 - INFO - __main__ - Step 47983: {'lr': 0.0001989736261517607, 'samples': 1535456, 'steps': 2998, 'loss/train': 0.3880453109741211} -09/21/2021 00:52:52 - INFO - __main__ - Step 47984: {'lr': 0.0001989736261517607, 'samples': 1535488, 'steps': 2998, 'loss/train': 0.4242120385169983} -09/21/2021 00:52:53 - INFO - __main__ - Step 47985: {'lr': 0.0001989727143716677, 'samples': 1535520, 'steps': 2999, 'loss/train': 0.35471975803375244} -09/21/2021 00:52:53 - INFO - __main__ - Step 47986: {'lr': 0.0001989727143716677, 'samples': 1535552, 'steps': 2999, 'loss/train': 0.3190806806087494} -09/21/2021 00:52:54 - INFO - __main__ - Step 47987: {'lr': 0.0001989727143716677, 'samples': 1535584, 'steps': 2999, 'loss/train': 0.4404963254928589} -09/21/2021 00:52:55 - INFO - __main__ - Step 47988: {'lr': 0.0001989727143716677, 'samples': 1535616, 'steps': 2999, 'loss/train': 1.9539295434951782} -09/21/2021 00:52:56 - INFO - __main__ - Step 47989: {'lr': 0.0001989727143716677, 'samples': 1535648, 'steps': 2999, 'loss/train': 2.020026445388794} -09/21/2021 00:52:56 - INFO - __main__ - Step 47990: {'lr': 0.0001989727143716677, 'samples': 1535680, 'steps': 2999, 'loss/train': 2.860234260559082} -09/21/2021 00:52:57 - INFO - __main__ - Step 47991: {'lr': 0.0001989727143716677, 'samples': 1535712, 'steps': 2999, 'loss/train': 1.7176268100738525} -09/21/2021 00:52:58 - INFO - __main__ - Step 47992: {'lr': 0.0001989727143716677, 'samples': 1535744, 'steps': 2999, 'loss/train': 1.7598427534103394} -09/21/2021 00:52:59 - INFO - __main__ - Step 47993: {'lr': 0.0001989727143716677, 'samples': 1535776, 'steps': 2999, 'loss/train': 1.9255423545837402} -09/21/2021 00:52:59 - INFO - __main__ - Step 47994: {'lr': 0.0001989727143716677, 'samples': 1535808, 'steps': 2999, 'loss/train': 1.5750088691711426} -09/21/2021 00:53:00 - INFO - __main__ - Step 47995: {'lr': 0.0001989727143716677, 'samples': 1535840, 'steps': 2999, 'loss/train': 4.5909423828125} -09/21/2021 00:53:01 - INFO - __main__ - Step 47996: {'lr': 0.0001989727143716677, 'samples': 1535872, 'steps': 2999, 'loss/train': 2.0132319927215576} -09/21/2021 00:53:02 - INFO - __main__ - Step 47997: {'lr': 0.0001989727143716677, 'samples': 1535904, 'steps': 2999, 'loss/train': 2.2429332733154297} -09/21/2021 00:53:02 - INFO - __main__ - Step 47998: {'lr': 0.0001989727143716677, 'samples': 1535936, 'steps': 2999, 'loss/train': 2.4358959197998047} -09/21/2021 00:53:03 - INFO - __main__ - Step 47999: {'lr': 0.0001989727143716677, 'samples': 1535968, 'steps': 2999, 'loss/train': 1.6224005222320557} -09/21/2021 00:53:04 - INFO - __main__ - Step 48000: {'lr': 0.0001989727143716677, 'samples': 1536000, 'steps': 2999, 'loss/train': 1.7987626791000366} -09/21/2021 00:53:05 - INFO - __main__ - Step 48001: {'lr': 0.00019897180218885507, 'samples': 1536032, 'steps': 3000, 'loss/train': 1.5152450799942017} -09/21/2021 00:53:06 - INFO - __main__ - Step 48002: {'lr': 0.00019897180218885507, 'samples': 1536064, 'steps': 3000, 'loss/train': 2.4367384910583496} -09/21/2021 00:53:06 - INFO - __main__ - Step 48003: {'lr': 0.00019897180218885507, 'samples': 1536096, 'steps': 3000, 'loss/train': 2.611804962158203} -09/21/2021 00:53:07 - INFO - __main__ - Step 48004: {'lr': 0.00019897180218885507, 'samples': 1536128, 'steps': 3000, 'loss/train': 1.9873838424682617} -09/21/2021 00:53:08 - INFO - __main__ - Step 48005: {'lr': 0.00019897180218885507, 'samples': 1536160, 'steps': 3000, 'loss/train': 1.6324621438980103} -09/21/2021 00:53:09 - INFO - __main__ - Step 48006: {'lr': 0.00019897180218885507, 'samples': 1536192, 'steps': 3000, 'loss/train': 2.367278575897217} -09/21/2021 00:53:09 - INFO - __main__ - Step 48007: {'lr': 0.00019897180218885507, 'samples': 1536224, 'steps': 3000, 'loss/train': 3.5234076976776123} -09/21/2021 00:53:11 - INFO - __main__ - Step 48008: {'lr': 0.00019897180218885507, 'samples': 1536256, 'steps': 3000, 'loss/train': 1.9459272623062134} -09/21/2021 00:53:11 - INFO - __main__ - Step 48009: {'lr': 0.00019897180218885507, 'samples': 1536288, 'steps': 3000, 'loss/train': 0.149081289768219} -09/21/2021 00:53:12 - INFO - __main__ - Step 48010: {'lr': 0.00019897180218885507, 'samples': 1536320, 'steps': 3000, 'loss/train': 2.3573927879333496} -09/21/2021 00:53:13 - INFO - __main__ - Step 48011: {'lr': 0.00019897180218885507, 'samples': 1536352, 'steps': 3000, 'loss/train': 2.4931371212005615} -09/21/2021 00:53:14 - INFO - __main__ - Step 48012: {'lr': 0.00019897180218885507, 'samples': 1536384, 'steps': 3000, 'loss/train': 1.5165901184082031} -09/21/2021 00:53:14 - INFO - __main__ - Step 48013: {'lr': 0.00019897180218885507, 'samples': 1536416, 'steps': 3000, 'loss/train': 1.4534755945205688} -09/21/2021 00:53:15 - INFO - __main__ - Step 48014: {'lr': 0.00019897180218885507, 'samples': 1536448, 'steps': 3000, 'loss/train': 1.9187270402908325} -09/21/2021 00:53:16 - INFO - __main__ - Step 48015: {'lr': 0.00019897180218885507, 'samples': 1536480, 'steps': 3000, 'loss/train': 1.6311383247375488} -09/21/2021 00:53:17 - INFO - __main__ - Step 48016: {'lr': 0.00019897180218885507, 'samples': 1536512, 'steps': 3000, 'loss/train': 1.8317131996154785} -09/21/2021 00:53:17 - INFO - __main__ - Step 48017: {'lr': 0.0001989708896033266, 'samples': 1536544, 'steps': 3001, 'loss/train': 1.9009618759155273} -09/21/2021 00:53:18 - INFO - __main__ - Step 48018: {'lr': 0.0001989708896033266, 'samples': 1536576, 'steps': 3001, 'loss/train': 2.0461575984954834} -09/21/2021 00:53:19 - INFO - __main__ - Step 48019: {'lr': 0.0001989708896033266, 'samples': 1536608, 'steps': 3001, 'loss/train': 1.897226333618164} -09/21/2021 00:53:20 - INFO - __main__ - Step 48020: {'lr': 0.0001989708896033266, 'samples': 1536640, 'steps': 3001, 'loss/train': 1.7034978866577148} -09/21/2021 00:53:20 - INFO - __main__ - Step 48021: {'lr': 0.0001989708896033266, 'samples': 1536672, 'steps': 3001, 'loss/train': 1.9390357732772827} -09/21/2021 00:53:21 - INFO - __main__ - Step 48022: {'lr': 0.0001989708896033266, 'samples': 1536704, 'steps': 3001, 'loss/train': 2.3213250637054443} -09/21/2021 00:53:22 - INFO - __main__ - Step 48023: {'lr': 0.0001989708896033266, 'samples': 1536736, 'steps': 3001, 'loss/train': 2.1548879146575928} -09/21/2021 00:53:23 - INFO - __main__ - Step 48024: {'lr': 0.0001989708896033266, 'samples': 1536768, 'steps': 3001, 'loss/train': 2.009880304336548} -09/21/2021 00:53:23 - INFO - __main__ - Step 48025: {'lr': 0.0001989708896033266, 'samples': 1536800, 'steps': 3001, 'loss/train': 2.341525077819824} -09/21/2021 00:53:24 - INFO - __main__ - Step 48026: {'lr': 0.0001989708896033266, 'samples': 1536832, 'steps': 3001, 'loss/train': 2.5807864665985107} -09/21/2021 00:53:25 - INFO - __main__ - Step 48027: {'lr': 0.0001989708896033266, 'samples': 1536864, 'steps': 3001, 'loss/train': 2.1053481101989746} -09/21/2021 00:53:26 - INFO - __main__ - Step 48028: {'lr': 0.0001989708896033266, 'samples': 1536896, 'steps': 3001, 'loss/train': 1.539388656616211} -09/21/2021 00:53:26 - INFO - __main__ - Step 48029: {'lr': 0.0001989708896033266, 'samples': 1536928, 'steps': 3001, 'loss/train': 2.7234013080596924} -09/21/2021 00:53:27 - INFO - __main__ - Step 48030: {'lr': 0.0001989708896033266, 'samples': 1536960, 'steps': 3001, 'loss/train': 2.426219940185547} -09/21/2021 00:53:28 - INFO - __main__ - Step 48031: {'lr': 0.0001989708896033266, 'samples': 1536992, 'steps': 3001, 'loss/train': 1.9469629526138306} -09/21/2021 00:53:29 - INFO - __main__ - Step 48032: {'lr': 0.0001989708896033266, 'samples': 1537024, 'steps': 3001, 'loss/train': 2.121788263320923} -09/21/2021 00:53:30 - INFO - __main__ - Step 48033: {'lr': 0.00019896997661508593, 'samples': 1537056, 'steps': 3002, 'loss/train': 1.8695721626281738} -09/21/2021 00:53:30 - INFO - __main__ - Step 48034: {'lr': 0.00019896997661508593, 'samples': 1537088, 'steps': 3002, 'loss/train': 2.4423468112945557} -09/21/2021 00:53:31 - INFO - __main__ - Step 48035: {'lr': 0.00019896997661508593, 'samples': 1537120, 'steps': 3002, 'loss/train': 1.8610529899597168} -09/21/2021 00:53:32 - INFO - __main__ - Step 48036: {'lr': 0.00019896997661508593, 'samples': 1537152, 'steps': 3002, 'loss/train': 2.5052618980407715} -09/21/2021 00:53:33 - INFO - __main__ - Step 48037: {'lr': 0.00019896997661508593, 'samples': 1537184, 'steps': 3002, 'loss/train': 2.617469072341919} -09/21/2021 00:53:34 - INFO - __main__ - Step 48038: {'lr': 0.00019896997661508593, 'samples': 1537216, 'steps': 3002, 'loss/train': 0.3969762921333313} -09/21/2021 00:53:35 - INFO - __main__ - Step 48039: {'lr': 0.00019896997661508593, 'samples': 1537248, 'steps': 3002, 'loss/train': 2.4155092239379883} -09/21/2021 00:53:35 - INFO - __main__ - Step 48040: {'lr': 0.00019896997661508593, 'samples': 1537280, 'steps': 3002, 'loss/train': 1.5825481414794922} -09/21/2021 00:53:36 - INFO - __main__ - Step 48041: {'lr': 0.00019896997661508593, 'samples': 1537312, 'steps': 3002, 'loss/train': 2.140528678894043} -09/21/2021 00:53:37 - INFO - __main__ - Step 48042: {'lr': 0.00019896997661508593, 'samples': 1537344, 'steps': 3002, 'loss/train': 2.347140312194824} -09/21/2021 00:53:38 - INFO - __main__ - Step 48043: {'lr': 0.00019896997661508593, 'samples': 1537376, 'steps': 3002, 'loss/train': 0.19382672011852264} -09/21/2021 00:53:38 - INFO - __main__ - Step 48044: {'lr': 0.00019896997661508593, 'samples': 1537408, 'steps': 3002, 'loss/train': 1.7814364433288574} -09/21/2021 00:53:39 - INFO - __main__ - Step 48045: {'lr': 0.00019896997661508593, 'samples': 1537440, 'steps': 3002, 'loss/train': 2.2306065559387207} -09/21/2021 00:53:40 - INFO - __main__ - Step 48046: {'lr': 0.00019896997661508593, 'samples': 1537472, 'steps': 3002, 'loss/train': 1.9204806089401245} -09/21/2021 00:53:41 - INFO - __main__ - Step 48047: {'lr': 0.00019896997661508593, 'samples': 1537504, 'steps': 3002, 'loss/train': 1.7356507778167725} -09/21/2021 00:53:41 - INFO - __main__ - Step 48048: {'lr': 0.00019896997661508593, 'samples': 1537536, 'steps': 3002, 'loss/train': 2.338463068008423} -09/21/2021 00:53:42 - INFO - __main__ - Step 48049: {'lr': 0.00019896906322413682, 'samples': 1537568, 'steps': 3003, 'loss/train': 1.8972985744476318} -09/21/2021 00:53:43 - INFO - __main__ - Step 48050: {'lr': 0.00019896906322413682, 'samples': 1537600, 'steps': 3003, 'loss/train': 1.517460584640503} -09/21/2021 00:53:44 - INFO - __main__ - Step 48051: {'lr': 0.00019896906322413682, 'samples': 1537632, 'steps': 3003, 'loss/train': 1.782105803489685} -09/21/2021 00:53:45 - INFO - __main__ - Step 48052: {'lr': 0.00019896906322413682, 'samples': 1537664, 'steps': 3003, 'loss/train': 1.4236171245574951} -09/21/2021 00:53:45 - INFO - __main__ - Step 48053: {'lr': 0.00019896906322413682, 'samples': 1537696, 'steps': 3003, 'loss/train': 1.9915697574615479} -09/21/2021 00:53:46 - INFO - __main__ - Step 48054: {'lr': 0.00019896906322413682, 'samples': 1537728, 'steps': 3003, 'loss/train': 2.2256486415863037} -09/21/2021 00:53:47 - INFO - __main__ - Step 48055: {'lr': 0.00019896906322413682, 'samples': 1537760, 'steps': 3003, 'loss/train': 1.3921780586242676} -09/21/2021 00:53:48 - INFO - __main__ - Step 48056: {'lr': 0.00019896906322413682, 'samples': 1537792, 'steps': 3003, 'loss/train': 1.794731855392456} -09/21/2021 00:53:48 - INFO - __main__ - Step 48057: {'lr': 0.00019896906322413682, 'samples': 1537824, 'steps': 3003, 'loss/train': 1.8521034717559814} -09/21/2021 00:53:49 - INFO - __main__ - Step 48058: {'lr': 0.00019896906322413682, 'samples': 1537856, 'steps': 3003, 'loss/train': 2.501422882080078} -09/21/2021 00:53:50 - INFO - __main__ - Step 48059: {'lr': 0.00019896906322413682, 'samples': 1537888, 'steps': 3003, 'loss/train': 2.2759878635406494} -09/21/2021 00:53:51 - INFO - __main__ - Step 48060: {'lr': 0.00019896906322413682, 'samples': 1537920, 'steps': 3003, 'loss/train': 2.093964099884033} -09/21/2021 00:53:51 - INFO - __main__ - Step 48061: {'lr': 0.00019896906322413682, 'samples': 1537952, 'steps': 3003, 'loss/train': 2.4359538555145264} -09/21/2021 00:53:52 - INFO - __main__ - Step 48062: {'lr': 0.00019896906322413682, 'samples': 1537984, 'steps': 3003, 'loss/train': 2.04884672164917} -09/21/2021 00:53:53 - INFO - __main__ - Step 48063: {'lr': 0.00019896906322413682, 'samples': 1538016, 'steps': 3003, 'loss/train': 2.5695948600769043} -09/21/2021 00:53:54 - INFO - __main__ - Step 48064: {'lr': 0.00019896906322413682, 'samples': 1538048, 'steps': 3003, 'loss/train': 1.8289146423339844} -09/21/2021 00:53:54 - INFO - __main__ - Step 48065: {'lr': 0.000198968149430483, 'samples': 1538080, 'steps': 3004, 'loss/train': 2.2159945964813232} -09/21/2021 00:53:55 - INFO - __main__ - Step 48066: {'lr': 0.000198968149430483, 'samples': 1538112, 'steps': 3004, 'loss/train': 1.730291485786438} -09/21/2021 00:53:56 - INFO - __main__ - Step 48067: {'lr': 0.000198968149430483, 'samples': 1538144, 'steps': 3004, 'loss/train': 2.314105749130249} -09/21/2021 00:53:57 - INFO - __main__ - Step 48068: {'lr': 0.000198968149430483, 'samples': 1538176, 'steps': 3004, 'loss/train': 1.5222041606903076} -09/21/2021 00:53:58 - INFO - __main__ - Step 48069: {'lr': 0.000198968149430483, 'samples': 1538208, 'steps': 3004, 'loss/train': 1.894098162651062} -09/21/2021 00:53:59 - INFO - __main__ - Step 48070: {'lr': 0.000198968149430483, 'samples': 1538240, 'steps': 3004, 'loss/train': 1.8577535152435303} -09/21/2021 00:54:00 - INFO - __main__ - Step 48071: {'lr': 0.000198968149430483, 'samples': 1538272, 'steps': 3004, 'loss/train': 1.3158456087112427} -09/21/2021 00:54:00 - INFO - __main__ - Step 48072: {'lr': 0.000198968149430483, 'samples': 1538304, 'steps': 3004, 'loss/train': 1.9295941591262817} -09/21/2021 00:54:01 - INFO - __main__ - Step 48073: {'lr': 0.000198968149430483, 'samples': 1538336, 'steps': 3004, 'loss/train': 1.5448496341705322} -09/21/2021 00:54:02 - INFO - __main__ - Step 48074: {'lr': 0.000198968149430483, 'samples': 1538368, 'steps': 3004, 'loss/train': 1.6385467052459717} -09/21/2021 00:54:03 - INFO - __main__ - Step 48075: {'lr': 0.000198968149430483, 'samples': 1538400, 'steps': 3004, 'loss/train': 2.121063470840454} -09/21/2021 00:54:03 - INFO - __main__ - Step 48076: {'lr': 0.000198968149430483, 'samples': 1538432, 'steps': 3004, 'loss/train': 1.4960553646087646} -09/21/2021 00:54:04 - INFO - __main__ - Step 48077: {'lr': 0.000198968149430483, 'samples': 1538464, 'steps': 3004, 'loss/train': 1.9585344791412354} -09/21/2021 00:54:05 - INFO - __main__ - Step 48078: {'lr': 0.000198968149430483, 'samples': 1538496, 'steps': 3004, 'loss/train': 1.5997374057769775} -09/21/2021 00:54:06 - INFO - __main__ - Step 48079: {'lr': 0.000198968149430483, 'samples': 1538528, 'steps': 3004, 'loss/train': 1.7237610816955566} -09/21/2021 00:54:06 - INFO - __main__ - Step 48080: {'lr': 0.000198968149430483, 'samples': 1538560, 'steps': 3004, 'loss/train': 2.4906318187713623} -09/21/2021 00:54:07 - INFO - __main__ - Step 48081: {'lr': 0.00019896723523412814, 'samples': 1538592, 'steps': 3005, 'loss/train': 1.2129368782043457} -09/21/2021 00:54:08 - INFO - __main__ - Step 48082: {'lr': 0.00019896723523412814, 'samples': 1538624, 'steps': 3005, 'loss/train': 2.183342933654785} -09/21/2021 00:54:09 - INFO - __main__ - Step 48083: {'lr': 0.00019896723523412814, 'samples': 1538656, 'steps': 3005, 'loss/train': 2.3717219829559326} -09/21/2021 00:54:10 - INFO - __main__ - Step 48084: {'lr': 0.00019896723523412814, 'samples': 1538688, 'steps': 3005, 'loss/train': 1.0537025928497314} -09/21/2021 00:54:10 - INFO - __main__ - Step 48085: {'lr': 0.00019896723523412814, 'samples': 1538720, 'steps': 3005, 'loss/train': 2.360910415649414} -09/21/2021 00:54:11 - INFO - __main__ - Step 48086: {'lr': 0.00019896723523412814, 'samples': 1538752, 'steps': 3005, 'loss/train': 2.321281671524048} -09/21/2021 00:54:12 - INFO - __main__ - Step 48087: {'lr': 0.00019896723523412814, 'samples': 1538784, 'steps': 3005, 'loss/train': 1.690127968788147} -09/21/2021 00:54:13 - INFO - __main__ - Step 48088: {'lr': 0.00019896723523412814, 'samples': 1538816, 'steps': 3005, 'loss/train': 1.078078269958496} -09/21/2021 00:54:13 - INFO - __main__ - Step 48089: {'lr': 0.00019896723523412814, 'samples': 1538848, 'steps': 3005, 'loss/train': 2.445185661315918} -09/21/2021 00:54:14 - INFO - __main__ - Step 48090: {'lr': 0.00019896723523412814, 'samples': 1538880, 'steps': 3005, 'loss/train': 2.5022635459899902} -09/21/2021 00:54:15 - INFO - __main__ - Step 48091: {'lr': 0.00019896723523412814, 'samples': 1538912, 'steps': 3005, 'loss/train': 4.293898582458496} -09/21/2021 00:54:16 - INFO - __main__ - Step 48092: {'lr': 0.00019896723523412814, 'samples': 1538944, 'steps': 3005, 'loss/train': 2.645897626876831} -09/21/2021 00:54:16 - INFO - __main__ - Step 48093: {'lr': 0.00019896723523412814, 'samples': 1538976, 'steps': 3005, 'loss/train': 1.134460210800171} -09/21/2021 00:54:17 - INFO - __main__ - Step 48094: {'lr': 0.00019896723523412814, 'samples': 1539008, 'steps': 3005, 'loss/train': 1.4294265508651733} -09/21/2021 00:54:18 - INFO - __main__ - Step 48095: {'lr': 0.00019896723523412814, 'samples': 1539040, 'steps': 3005, 'loss/train': 2.841585874557495} -09/21/2021 00:54:19 - INFO - __main__ - Step 48096: {'lr': 0.00019896723523412814, 'samples': 1539072, 'steps': 3005, 'loss/train': 1.7175323963165283} -09/21/2021 00:54:19 - INFO - __main__ - Step 48097: {'lr': 0.000198966320635076, 'samples': 1539104, 'steps': 3006, 'loss/train': 2.1206510066986084} -09/21/2021 00:54:20 - INFO - __main__ - Step 48098: {'lr': 0.000198966320635076, 'samples': 1539136, 'steps': 3006, 'loss/train': 1.9871163368225098} -09/21/2021 00:54:21 - INFO - __main__ - Step 48099: {'lr': 0.000198966320635076, 'samples': 1539168, 'steps': 3006, 'loss/train': 1.1879029273986816} -09/21/2021 00:54:22 - INFO - __main__ - Step 48100: {'lr': 0.000198966320635076, 'samples': 1539200, 'steps': 3006, 'loss/train': 2.4170949459075928} -09/21/2021 00:54:23 - INFO - __main__ - Step 48101: {'lr': 0.000198966320635076, 'samples': 1539232, 'steps': 3006, 'loss/train': 2.0315115451812744} -09/21/2021 00:54:24 - INFO - __main__ - Step 48102: {'lr': 0.000198966320635076, 'samples': 1539264, 'steps': 3006, 'loss/train': 0.34479954838752747} -09/21/2021 00:54:24 - INFO - __main__ - Step 48103: {'lr': 0.000198966320635076, 'samples': 1539296, 'steps': 3006, 'loss/train': 2.132293701171875} -09/21/2021 00:54:25 - INFO - __main__ - Step 48104: {'lr': 0.000198966320635076, 'samples': 1539328, 'steps': 3006, 'loss/train': 2.4259660243988037} -09/21/2021 00:54:26 - INFO - __main__ - Step 48105: {'lr': 0.000198966320635076, 'samples': 1539360, 'steps': 3006, 'loss/train': 2.2984797954559326} -09/21/2021 00:54:27 - INFO - __main__ - Step 48106: {'lr': 0.000198966320635076, 'samples': 1539392, 'steps': 3006, 'loss/train': 2.3941683769226074} -09/21/2021 00:54:28 - INFO - __main__ - Step 48107: {'lr': 0.000198966320635076, 'samples': 1539424, 'steps': 3006, 'loss/train': 2.1520135402679443} -09/21/2021 00:54:28 - INFO - __main__ - Step 48108: {'lr': 0.000198966320635076, 'samples': 1539456, 'steps': 3006, 'loss/train': 1.385896921157837} -09/21/2021 00:54:29 - INFO - __main__ - Step 48109: {'lr': 0.000198966320635076, 'samples': 1539488, 'steps': 3006, 'loss/train': 1.5409687757492065} -09/21/2021 00:54:30 - INFO - __main__ - Step 48110: {'lr': 0.000198966320635076, 'samples': 1539520, 'steps': 3006, 'loss/train': 2.317502737045288} -09/21/2021 00:54:31 - INFO - __main__ - Step 48111: {'lr': 0.000198966320635076, 'samples': 1539552, 'steps': 3006, 'loss/train': 2.5256850719451904} -09/21/2021 00:54:31 - INFO - __main__ - Step 48112: {'lr': 0.000198966320635076, 'samples': 1539584, 'steps': 3006, 'loss/train': 0.5161177515983582} -09/21/2021 00:54:32 - INFO - __main__ - Step 48113: {'lr': 0.0001989654056333303, 'samples': 1539616, 'steps': 3007, 'loss/train': 1.5937857627868652} -09/21/2021 00:54:33 - INFO - __main__ - Step 48114: {'lr': 0.0001989654056333303, 'samples': 1539648, 'steps': 3007, 'loss/train': 2.1749448776245117} -09/21/2021 00:54:34 - INFO - __main__ - Step 48115: {'lr': 0.0001989654056333303, 'samples': 1539680, 'steps': 3007, 'loss/train': 1.9780195951461792} -09/21/2021 00:54:34 - INFO - __main__ - Step 48116: {'lr': 0.0001989654056333303, 'samples': 1539712, 'steps': 3007, 'loss/train': 1.172688603401184} -09/21/2021 00:54:35 - INFO - __main__ - Step 48117: {'lr': 0.0001989654056333303, 'samples': 1539744, 'steps': 3007, 'loss/train': 1.7960420846939087} -09/21/2021 00:54:36 - INFO - __main__ - Step 48118: {'lr': 0.0001989654056333303, 'samples': 1539776, 'steps': 3007, 'loss/train': 1.1636428833007812} -09/21/2021 00:54:37 - INFO - __main__ - Step 48119: {'lr': 0.0001989654056333303, 'samples': 1539808, 'steps': 3007, 'loss/train': 2.4562466144561768} -09/21/2021 00:54:37 - INFO - __main__ - Step 48120: {'lr': 0.0001989654056333303, 'samples': 1539840, 'steps': 3007, 'loss/train': 0.8377649188041687} -09/21/2021 00:54:38 - INFO - __main__ - Step 48121: {'lr': 0.0001989654056333303, 'samples': 1539872, 'steps': 3007, 'loss/train': 1.7370282411575317} -09/21/2021 00:54:39 - INFO - __main__ - Step 48122: {'lr': 0.0001989654056333303, 'samples': 1539904, 'steps': 3007, 'loss/train': 2.042917013168335} -09/21/2021 00:54:40 - INFO - __main__ - Step 48123: {'lr': 0.0001989654056333303, 'samples': 1539936, 'steps': 3007, 'loss/train': 2.8122737407684326} -09/21/2021 00:54:40 - INFO - __main__ - Step 48124: {'lr': 0.0001989654056333303, 'samples': 1539968, 'steps': 3007, 'loss/train': 2.3434154987335205} -09/21/2021 00:54:41 - INFO - __main__ - Step 48125: {'lr': 0.0001989654056333303, 'samples': 1540000, 'steps': 3007, 'loss/train': 2.335238218307495} -09/21/2021 00:54:42 - INFO - __main__ - Step 48126: {'lr': 0.0001989654056333303, 'samples': 1540032, 'steps': 3007, 'loss/train': 2.523768424987793} -09/21/2021 00:54:43 - INFO - __main__ - Step 48127: {'lr': 0.0001989654056333303, 'samples': 1540064, 'steps': 3007, 'loss/train': 0.8348320722579956} -09/21/2021 00:54:43 - INFO - __main__ - Step 48128: {'lr': 0.0001989654056333303, 'samples': 1540096, 'steps': 3007, 'loss/train': 1.846529483795166} -09/21/2021 00:54:44 - INFO - __main__ - Step 48129: {'lr': 0.00019896449022889468, 'samples': 1540128, 'steps': 3008, 'loss/train': 2.614609479904175} -09/21/2021 00:54:45 - INFO - __main__ - Step 48130: {'lr': 0.00019896449022889468, 'samples': 1540160, 'steps': 3008, 'loss/train': 2.96237850189209} -09/21/2021 00:54:47 - INFO - __main__ - Step 48131: {'lr': 0.00019896449022889468, 'samples': 1540192, 'steps': 3008, 'loss/train': 2.620410680770874} -09/21/2021 00:54:48 - INFO - __main__ - Step 48132: {'lr': 0.00019896449022889468, 'samples': 1540224, 'steps': 3008, 'loss/train': 2.0085339546203613} -09/21/2021 00:54:48 - INFO - __main__ - Step 48133: {'lr': 0.00019896449022889468, 'samples': 1540256, 'steps': 3008, 'loss/train': 0.7725510597229004} -09/21/2021 00:54:49 - INFO - __main__ - Step 48134: {'lr': 0.00019896449022889468, 'samples': 1540288, 'steps': 3008, 'loss/train': 2.4131085872650146} -09/21/2021 00:54:50 - INFO - __main__ - Step 48135: {'lr': 0.00019896449022889468, 'samples': 1540320, 'steps': 3008, 'loss/train': 1.915623664855957} -09/21/2021 00:54:51 - INFO - __main__ - Step 48136: {'lr': 0.00019896449022889468, 'samples': 1540352, 'steps': 3008, 'loss/train': 1.8718889951705933} -09/21/2021 00:54:51 - INFO - __main__ - Step 48137: {'lr': 0.00019896449022889468, 'samples': 1540384, 'steps': 3008, 'loss/train': 1.9368401765823364} -09/21/2021 00:54:52 - INFO - __main__ - Step 48138: {'lr': 0.00019896449022889468, 'samples': 1540416, 'steps': 3008, 'loss/train': 1.9729244709014893} -09/21/2021 00:54:53 - INFO - __main__ - Step 48139: {'lr': 0.00019896449022889468, 'samples': 1540448, 'steps': 3008, 'loss/train': 2.049654245376587} -09/21/2021 00:54:54 - INFO - __main__ - Step 48140: {'lr': 0.00019896449022889468, 'samples': 1540480, 'steps': 3008, 'loss/train': 2.191298007965088} -09/21/2021 00:54:54 - INFO - __main__ - Step 48141: {'lr': 0.00019896449022889468, 'samples': 1540512, 'steps': 3008, 'loss/train': 1.8465441465377808} -09/21/2021 00:54:55 - INFO - __main__ - Step 48142: {'lr': 0.00019896449022889468, 'samples': 1540544, 'steps': 3008, 'loss/train': 1.9343743324279785} -09/21/2021 00:54:56 - INFO - __main__ - Step 48143: {'lr': 0.00019896449022889468, 'samples': 1540576, 'steps': 3008, 'loss/train': 2.6145401000976562} -09/21/2021 00:54:57 - INFO - __main__ - Step 48144: {'lr': 0.00019896449022889468, 'samples': 1540608, 'steps': 3008, 'loss/train': 3.523590564727783} -09/21/2021 00:54:58 - INFO - __main__ - Step 48145: {'lr': 0.000198963574421773, 'samples': 1540640, 'steps': 3009, 'loss/train': 3.8001914024353027} -09/21/2021 00:54:58 - INFO - __main__ - Step 48146: {'lr': 0.000198963574421773, 'samples': 1540672, 'steps': 3009, 'loss/train': 3.60898494720459} -09/21/2021 00:54:59 - INFO - __main__ - Step 48147: {'lr': 0.000198963574421773, 'samples': 1540704, 'steps': 3009, 'loss/train': 2.287268877029419} -09/21/2021 00:55:00 - INFO - __main__ - Step 48148: {'lr': 0.000198963574421773, 'samples': 1540736, 'steps': 3009, 'loss/train': 2.1090214252471924} -09/21/2021 00:55:01 - INFO - __main__ - Step 48149: {'lr': 0.000198963574421773, 'samples': 1540768, 'steps': 3009, 'loss/train': 2.2845826148986816} -09/21/2021 00:55:01 - INFO - __main__ - Step 48150: {'lr': 0.000198963574421773, 'samples': 1540800, 'steps': 3009, 'loss/train': 1.842115879058838} -09/21/2021 00:55:02 - INFO - __main__ - Step 48151: {'lr': 0.000198963574421773, 'samples': 1540832, 'steps': 3009, 'loss/train': 2.8006484508514404} -09/21/2021 00:55:03 - INFO - __main__ - Step 48152: {'lr': 0.000198963574421773, 'samples': 1540864, 'steps': 3009, 'loss/train': 1.684345006942749} -09/21/2021 00:55:04 - INFO - __main__ - Step 48153: {'lr': 0.000198963574421773, 'samples': 1540896, 'steps': 3009, 'loss/train': 1.486064076423645} -09/21/2021 00:55:04 - INFO - __main__ - Step 48154: {'lr': 0.000198963574421773, 'samples': 1540928, 'steps': 3009, 'loss/train': 0.8986934423446655} -09/21/2021 00:55:05 - INFO - __main__ - Step 48155: {'lr': 0.000198963574421773, 'samples': 1540960, 'steps': 3009, 'loss/train': 3.0807225704193115} -09/21/2021 00:55:06 - INFO - __main__ - Step 48156: {'lr': 0.000198963574421773, 'samples': 1540992, 'steps': 3009, 'loss/train': 0.8781543374061584} -09/21/2021 00:55:07 - INFO - __main__ - Step 48157: {'lr': 0.000198963574421773, 'samples': 1541024, 'steps': 3009, 'loss/train': 1.7969543933868408} -09/21/2021 00:55:07 - INFO - __main__ - Step 48158: {'lr': 0.000198963574421773, 'samples': 1541056, 'steps': 3009, 'loss/train': 1.8891010284423828} -09/21/2021 00:55:08 - INFO - __main__ - Step 48159: {'lr': 0.000198963574421773, 'samples': 1541088, 'steps': 3009, 'loss/train': 2.040226459503174} -09/21/2021 00:55:09 - INFO - __main__ - Step 48160: {'lr': 0.000198963574421773, 'samples': 1541120, 'steps': 3009, 'loss/train': 2.4069011211395264} -09/21/2021 00:55:10 - INFO - __main__ - Step 48161: {'lr': 0.00019896265821196888, 'samples': 1541152, 'steps': 3010, 'loss/train': 1.7514469623565674} -09/21/2021 00:55:11 - INFO - __main__ - Step 48162: {'lr': 0.00019896265821196888, 'samples': 1541184, 'steps': 3010, 'loss/train': 1.6211518049240112} -09/21/2021 00:55:12 - INFO - __main__ - Step 48163: {'lr': 0.00019896265821196888, 'samples': 1541216, 'steps': 3010, 'loss/train': 2.8894615173339844} -09/21/2021 00:55:13 - INFO - __main__ - Step 48164: {'lr': 0.00019896265821196888, 'samples': 1541248, 'steps': 3010, 'loss/train': 2.784428358078003} -09/21/2021 00:55:13 - INFO - __main__ - Step 48165: {'lr': 0.00019896265821196888, 'samples': 1541280, 'steps': 3010, 'loss/train': 1.3489177227020264} -09/21/2021 00:55:14 - INFO - __main__ - Step 48166: {'lr': 0.00019896265821196888, 'samples': 1541312, 'steps': 3010, 'loss/train': 1.6035865545272827} -09/21/2021 00:55:15 - INFO - __main__ - Step 48167: {'lr': 0.00019896265821196888, 'samples': 1541344, 'steps': 3010, 'loss/train': 1.8842462301254272} -09/21/2021 00:55:16 - INFO - __main__ - Step 48168: {'lr': 0.00019896265821196888, 'samples': 1541376, 'steps': 3010, 'loss/train': 2.4977028369903564} -09/21/2021 00:55:16 - INFO - __main__ - Step 48169: {'lr': 0.00019896265821196888, 'samples': 1541408, 'steps': 3010, 'loss/train': 1.6446905136108398} -09/21/2021 00:55:17 - INFO - __main__ - Step 48170: {'lr': 0.00019896265821196888, 'samples': 1541440, 'steps': 3010, 'loss/train': 2.2854254245758057} -09/21/2021 00:55:18 - INFO - __main__ - Step 48171: {'lr': 0.00019896265821196888, 'samples': 1541472, 'steps': 3010, 'loss/train': 1.6151466369628906} -09/21/2021 00:55:19 - INFO - __main__ - Step 48172: {'lr': 0.00019896265821196888, 'samples': 1541504, 'steps': 3010, 'loss/train': 2.296172618865967} -09/21/2021 00:55:19 - INFO - __main__ - Step 48173: {'lr': 0.00019896265821196888, 'samples': 1541536, 'steps': 3010, 'loss/train': 0.24732287228107452} -09/21/2021 00:55:20 - INFO - __main__ - Step 48174: {'lr': 0.00019896265821196888, 'samples': 1541568, 'steps': 3010, 'loss/train': 1.49711012840271} -09/21/2021 00:55:21 - INFO - __main__ - Step 48175: {'lr': 0.00019896265821196888, 'samples': 1541600, 'steps': 3010, 'loss/train': 1.6970691680908203} -09/21/2021 00:55:22 - INFO - __main__ - Step 48176: {'lr': 0.00019896265821196888, 'samples': 1541632, 'steps': 3010, 'loss/train': 0.22516438364982605} -09/21/2021 00:55:22 - INFO - __main__ - Step 48177: {'lr': 0.00019896174159948613, 'samples': 1541664, 'steps': 3011, 'loss/train': 2.1556782722473145} -09/21/2021 00:55:23 - INFO - __main__ - Step 48178: {'lr': 0.00019896174159948613, 'samples': 1541696, 'steps': 3011, 'loss/train': 1.6170144081115723} -09/21/2021 00:55:24 - INFO - __main__ - Step 48179: {'lr': 0.00019896174159948613, 'samples': 1541728, 'steps': 3011, 'loss/train': 1.4410438537597656} -09/21/2021 00:55:25 - INFO - __main__ - Step 48180: {'lr': 0.00019896174159948613, 'samples': 1541760, 'steps': 3011, 'loss/train': 2.8310723304748535} -09/21/2021 00:55:25 - INFO - __main__ - Step 48181: {'lr': 0.00019896174159948613, 'samples': 1541792, 'steps': 3011, 'loss/train': 2.5824484825134277} -09/21/2021 00:55:26 - INFO - __main__ - Step 48182: {'lr': 0.00019896174159948613, 'samples': 1541824, 'steps': 3011, 'loss/train': 2.5619008541107178} -09/21/2021 00:55:27 - INFO - __main__ - Step 48183: {'lr': 0.00019896174159948613, 'samples': 1541856, 'steps': 3011, 'loss/train': 2.312094211578369} -09/21/2021 00:55:28 - INFO - __main__ - Step 48184: {'lr': 0.00019896174159948613, 'samples': 1541888, 'steps': 3011, 'loss/train': 0.6962572336196899} -09/21/2021 00:55:28 - INFO - __main__ - Step 48185: {'lr': 0.00019896174159948613, 'samples': 1541920, 'steps': 3011, 'loss/train': 2.068047523498535} -09/21/2021 00:55:29 - INFO - __main__ - Step 48186: {'lr': 0.00019896174159948613, 'samples': 1541952, 'steps': 3011, 'loss/train': 1.808139681816101} -09/21/2021 00:55:30 - INFO - __main__ - Step 48187: {'lr': 0.00019896174159948613, 'samples': 1541984, 'steps': 3011, 'loss/train': 1.385222315788269} -09/21/2021 00:55:31 - INFO - __main__ - Step 48188: {'lr': 0.00019896174159948613, 'samples': 1542016, 'steps': 3011, 'loss/train': 2.320824146270752} -09/21/2021 00:55:31 - INFO - __main__ - Step 48189: {'lr': 0.00019896174159948613, 'samples': 1542048, 'steps': 3011, 'loss/train': 2.2612357139587402} -09/21/2021 00:55:32 - INFO - __main__ - Step 48190: {'lr': 0.00019896174159948613, 'samples': 1542080, 'steps': 3011, 'loss/train': 1.8416707515716553} -09/21/2021 00:55:33 - INFO - __main__ - Step 48191: {'lr': 0.00019896174159948613, 'samples': 1542112, 'steps': 3011, 'loss/train': 0.8063122034072876} -09/21/2021 00:55:34 - INFO - __main__ - Step 48192: {'lr': 0.00019896174159948613, 'samples': 1542144, 'steps': 3011, 'loss/train': 1.453691840171814} -09/21/2021 00:55:35 - INFO - __main__ - Step 48193: {'lr': 0.0001989608245843284, 'samples': 1542176, 'steps': 3012, 'loss/train': 1.9827111959457397} -09/21/2021 00:55:36 - INFO - __main__ - Step 48194: {'lr': 0.0001989608245843284, 'samples': 1542208, 'steps': 3012, 'loss/train': 1.5224125385284424} -09/21/2021 00:55:37 - INFO - __main__ - Step 48195: {'lr': 0.0001989608245843284, 'samples': 1542240, 'steps': 3012, 'loss/train': 2.556685447692871} -09/21/2021 00:55:37 - INFO - __main__ - Step 48196: {'lr': 0.0001989608245843284, 'samples': 1542272, 'steps': 3012, 'loss/train': 1.361507773399353} -09/21/2021 00:55:38 - INFO - __main__ - Step 48197: {'lr': 0.0001989608245843284, 'samples': 1542304, 'steps': 3012, 'loss/train': 2.0972390174865723} -09/21/2021 00:55:39 - INFO - __main__ - Step 48198: {'lr': 0.0001989608245843284, 'samples': 1542336, 'steps': 3012, 'loss/train': 2.431065320968628} -09/21/2021 00:55:40 - INFO - __main__ - Step 48199: {'lr': 0.0001989608245843284, 'samples': 1542368, 'steps': 3012, 'loss/train': 1.672208309173584} -09/21/2021 00:55:40 - INFO - __main__ - Step 48200: {'lr': 0.0001989608245843284, 'samples': 1542400, 'steps': 3012, 'loss/train': 1.9331976175308228} -09/21/2021 00:55:41 - INFO - __main__ - Step 48201: {'lr': 0.0001989608245843284, 'samples': 1542432, 'steps': 3012, 'loss/train': 2.516317129135132} -09/21/2021 00:55:42 - INFO - __main__ - Step 48202: {'lr': 0.0001989608245843284, 'samples': 1542464, 'steps': 3012, 'loss/train': 2.2856898307800293} -09/21/2021 00:55:43 - INFO - __main__ - Step 48203: {'lr': 0.0001989608245843284, 'samples': 1542496, 'steps': 3012, 'loss/train': 1.5699353218078613} -09/21/2021 00:55:43 - INFO - __main__ - Step 48204: {'lr': 0.0001989608245843284, 'samples': 1542528, 'steps': 3012, 'loss/train': 2.160383462905884} -09/21/2021 00:55:44 - INFO - __main__ - Step 48205: {'lr': 0.0001989608245843284, 'samples': 1542560, 'steps': 3012, 'loss/train': 1.423164963722229} -09/21/2021 00:55:45 - INFO - __main__ - Step 48206: {'lr': 0.0001989608245843284, 'samples': 1542592, 'steps': 3012, 'loss/train': 1.464738130569458} -09/21/2021 00:55:46 - INFO - __main__ - Step 48207: {'lr': 0.0001989608245843284, 'samples': 1542624, 'steps': 3012, 'loss/train': 2.1679275035858154} -09/21/2021 00:55:46 - INFO - __main__ - Step 48208: {'lr': 0.0001989608245843284, 'samples': 1542656, 'steps': 3012, 'loss/train': 1.9096988439559937} -09/21/2021 00:55:47 - INFO - __main__ - Step 48209: {'lr': 0.00019895990716649946, 'samples': 1542688, 'steps': 3013, 'loss/train': 1.8054084777832031} -09/21/2021 00:55:48 - INFO - __main__ - Step 48210: {'lr': 0.00019895990716649946, 'samples': 1542720, 'steps': 3013, 'loss/train': 0.9440960884094238} -09/21/2021 00:55:49 - INFO - __main__ - Step 48211: {'lr': 0.00019895990716649946, 'samples': 1542752, 'steps': 3013, 'loss/train': 2.278555393218994} -09/21/2021 00:55:49 - INFO - __main__ - Step 48212: {'lr': 0.00019895990716649946, 'samples': 1542784, 'steps': 3013, 'loss/train': 2.541151762008667} -09/21/2021 00:55:50 - INFO - __main__ - Step 48213: {'lr': 0.00019895990716649946, 'samples': 1542816, 'steps': 3013, 'loss/train': 2.105685234069824} -09/21/2021 00:55:51 - INFO - __main__ - Step 48214: {'lr': 0.00019895990716649946, 'samples': 1542848, 'steps': 3013, 'loss/train': 2.1324658393859863} -09/21/2021 00:55:52 - INFO - __main__ - Step 48215: {'lr': 0.00019895990716649946, 'samples': 1542880, 'steps': 3013, 'loss/train': 2.3526718616485596} -09/21/2021 00:55:52 - INFO - __main__ - Step 48216: {'lr': 0.00019895990716649946, 'samples': 1542912, 'steps': 3013, 'loss/train': 2.849120616912842} -09/21/2021 00:55:53 - INFO - __main__ - Step 48217: {'lr': 0.00019895990716649946, 'samples': 1542944, 'steps': 3013, 'loss/train': 2.4690101146698} -09/21/2021 00:55:54 - INFO - __main__ - Step 48218: {'lr': 0.00019895990716649946, 'samples': 1542976, 'steps': 3013, 'loss/train': 2.178825855255127} -09/21/2021 00:55:55 - INFO - __main__ - Step 48219: {'lr': 0.00019895990716649946, 'samples': 1543008, 'steps': 3013, 'loss/train': 2.012251615524292} -09/21/2021 00:55:55 - INFO - __main__ - Step 48220: {'lr': 0.00019895990716649946, 'samples': 1543040, 'steps': 3013, 'loss/train': 1.8644800186157227} -09/21/2021 00:55:56 - INFO - __main__ - Step 48221: {'lr': 0.00019895990716649946, 'samples': 1543072, 'steps': 3013, 'loss/train': 2.3005430698394775} -09/21/2021 00:55:57 - INFO - __main__ - Step 48222: {'lr': 0.00019895990716649946, 'samples': 1543104, 'steps': 3013, 'loss/train': 1.6838382482528687} -09/21/2021 00:55:58 - INFO - __main__ - Step 48223: {'lr': 0.00019895990716649946, 'samples': 1543136, 'steps': 3013, 'loss/train': 1.4868468046188354} -09/21/2021 00:55:59 - INFO - __main__ - Step 48224: {'lr': 0.00019895990716649946, 'samples': 1543168, 'steps': 3013, 'loss/train': 2.280785322189331} -09/21/2021 00:56:00 - INFO - __main__ - Step 48225: {'lr': 0.00019895898934600305, 'samples': 1543200, 'steps': 3014, 'loss/train': 1.9822947978973389} -09/21/2021 00:56:01 - INFO - __main__ - Step 48226: {'lr': 0.00019895898934600305, 'samples': 1543232, 'steps': 3014, 'loss/train': 1.5368276834487915} -09/21/2021 00:56:01 - INFO - __main__ - Step 48227: {'lr': 0.00019895898934600305, 'samples': 1543264, 'steps': 3014, 'loss/train': 1.7971097230911255} -09/21/2021 00:56:02 - INFO - __main__ - Step 48228: {'lr': 0.00019895898934600305, 'samples': 1543296, 'steps': 3014, 'loss/train': 2.6010093688964844} -09/21/2021 00:56:03 - INFO - __main__ - Step 48229: {'lr': 0.00019895898934600305, 'samples': 1543328, 'steps': 3014, 'loss/train': 1.7535712718963623} -09/21/2021 00:56:04 - INFO - __main__ - Step 48230: {'lr': 0.00019895898934600305, 'samples': 1543360, 'steps': 3014, 'loss/train': 1.7454845905303955} -09/21/2021 00:56:04 - INFO - __main__ - Step 48231: {'lr': 0.00019895898934600305, 'samples': 1543392, 'steps': 3014, 'loss/train': 2.5294876098632812} -09/21/2021 00:56:05 - INFO - __main__ - Step 48232: {'lr': 0.00019895898934600305, 'samples': 1543424, 'steps': 3014, 'loss/train': 1.9099111557006836} -09/21/2021 00:56:06 - INFO - __main__ - Step 48233: {'lr': 0.00019895898934600305, 'samples': 1543456, 'steps': 3014, 'loss/train': 2.10585618019104} -09/21/2021 00:56:07 - INFO - __main__ - Step 48234: {'lr': 0.00019895898934600305, 'samples': 1543488, 'steps': 3014, 'loss/train': 1.5772608518600464} -09/21/2021 00:56:07 - INFO - __main__ - Step 48235: {'lr': 0.00019895898934600305, 'samples': 1543520, 'steps': 3014, 'loss/train': 2.214728355407715} -09/21/2021 00:56:08 - INFO - __main__ - Step 48236: {'lr': 0.00019895898934600305, 'samples': 1543552, 'steps': 3014, 'loss/train': 1.9999507665634155} -09/21/2021 00:56:09 - INFO - __main__ - Step 48237: {'lr': 0.00019895898934600305, 'samples': 1543584, 'steps': 3014, 'loss/train': 1.6059842109680176} -09/21/2021 00:56:10 - INFO - __main__ - Step 48238: {'lr': 0.00019895898934600305, 'samples': 1543616, 'steps': 3014, 'loss/train': 1.216603398323059} -09/21/2021 00:56:10 - INFO - __main__ - Step 48239: {'lr': 0.00019895898934600305, 'samples': 1543648, 'steps': 3014, 'loss/train': 2.2183597087860107} -09/21/2021 00:56:11 - INFO - __main__ - Step 48240: {'lr': 0.00019895898934600305, 'samples': 1543680, 'steps': 3014, 'loss/train': 2.6781702041625977} -09/21/2021 00:56:12 - INFO - __main__ - Step 48241: {'lr': 0.00019895807112284291, 'samples': 1543712, 'steps': 3015, 'loss/train': 1.1736122369766235} -09/21/2021 00:56:13 - INFO - __main__ - Step 48242: {'lr': 0.00019895807112284291, 'samples': 1543744, 'steps': 3015, 'loss/train': 2.9675936698913574} -09/21/2021 00:56:13 - INFO - __main__ - Step 48243: {'lr': 0.00019895807112284291, 'samples': 1543776, 'steps': 3015, 'loss/train': 2.1897101402282715} -09/21/2021 00:56:14 - INFO - __main__ - Step 48244: {'lr': 0.00019895807112284291, 'samples': 1543808, 'steps': 3015, 'loss/train': 2.8666694164276123} -09/21/2021 00:56:15 - INFO - __main__ - Step 48245: {'lr': 0.00019895807112284291, 'samples': 1543840, 'steps': 3015, 'loss/train': 1.2659786939620972} -09/21/2021 00:56:16 - INFO - __main__ - Step 48246: {'lr': 0.00019895807112284291, 'samples': 1543872, 'steps': 3015, 'loss/train': 1.8291490077972412} -09/21/2021 00:56:16 - INFO - __main__ - Step 48247: {'lr': 0.00019895807112284291, 'samples': 1543904, 'steps': 3015, 'loss/train': 1.5691859722137451} -09/21/2021 00:56:17 - INFO - __main__ - Step 48248: {'lr': 0.00019895807112284291, 'samples': 1543936, 'steps': 3015, 'loss/train': 1.919341802597046} -09/21/2021 00:56:18 - INFO - __main__ - Step 48249: {'lr': 0.00019895807112284291, 'samples': 1543968, 'steps': 3015, 'loss/train': 2.251854658126831} -09/21/2021 00:56:19 - INFO - __main__ - Step 48250: {'lr': 0.00019895807112284291, 'samples': 1544000, 'steps': 3015, 'loss/train': 1.7435890436172485} -09/21/2021 00:56:19 - INFO - __main__ - Step 48251: {'lr': 0.00019895807112284291, 'samples': 1544032, 'steps': 3015, 'loss/train': 2.755061626434326} -09/21/2021 00:56:20 - INFO - __main__ - Step 48252: {'lr': 0.00019895807112284291, 'samples': 1544064, 'steps': 3015, 'loss/train': 1.321824312210083} -09/21/2021 00:56:21 - INFO - __main__ - Step 48253: {'lr': 0.00019895807112284291, 'samples': 1544096, 'steps': 3015, 'loss/train': 2.3525266647338867} -09/21/2021 00:56:22 - INFO - __main__ - Step 48254: {'lr': 0.00019895807112284291, 'samples': 1544128, 'steps': 3015, 'loss/train': 2.04685640335083} -09/21/2021 00:56:23 - INFO - __main__ - Step 48255: {'lr': 0.00019895807112284291, 'samples': 1544160, 'steps': 3015, 'loss/train': 3.2424111366271973} -09/21/2021 00:56:24 - INFO - __main__ - Step 48256: {'lr': 0.00019895807112284291, 'samples': 1544192, 'steps': 3015, 'loss/train': 2.364567518234253} -09/21/2021 00:56:25 - INFO - __main__ - Step 48257: {'lr': 0.00019895715249702275, 'samples': 1544224, 'steps': 3016, 'loss/train': 1.681967854499817} -09/21/2021 00:56:26 - INFO - __main__ - Step 48258: {'lr': 0.00019895715249702275, 'samples': 1544256, 'steps': 3016, 'loss/train': 2.0673398971557617} -09/21/2021 00:56:26 - INFO - __main__ - Step 48259: {'lr': 0.00019895715249702275, 'samples': 1544288, 'steps': 3016, 'loss/train': 2.8323280811309814} -09/21/2021 00:56:27 - INFO - __main__ - Step 48260: {'lr': 0.00019895715249702275, 'samples': 1544320, 'steps': 3016, 'loss/train': 1.5804394483566284} -09/21/2021 00:56:28 - INFO - __main__ - Step 48261: {'lr': 0.00019895715249702275, 'samples': 1544352, 'steps': 3016, 'loss/train': 1.807645559310913} -09/21/2021 00:56:29 - INFO - __main__ - Step 48262: {'lr': 0.00019895715249702275, 'samples': 1544384, 'steps': 3016, 'loss/train': 2.082005023956299} -09/21/2021 00:56:29 - INFO - __main__ - Step 48263: {'lr': 0.00019895715249702275, 'samples': 1544416, 'steps': 3016, 'loss/train': 2.028932809829712} -09/21/2021 00:56:30 - INFO - __main__ - Step 48264: {'lr': 0.00019895715249702275, 'samples': 1544448, 'steps': 3016, 'loss/train': 2.41587233543396} -09/21/2021 00:56:31 - INFO - __main__ - Step 48265: {'lr': 0.00019895715249702275, 'samples': 1544480, 'steps': 3016, 'loss/train': 2.7697160243988037} -09/21/2021 00:56:31 - INFO - __main__ - Step 48266: {'lr': 0.00019895715249702275, 'samples': 1544512, 'steps': 3016, 'loss/train': 2.0949063301086426} -09/21/2021 00:56:32 - INFO - __main__ - Step 48267: {'lr': 0.00019895715249702275, 'samples': 1544544, 'steps': 3016, 'loss/train': 2.1516244411468506} -09/21/2021 00:56:33 - INFO - __main__ - Step 48268: {'lr': 0.00019895715249702275, 'samples': 1544576, 'steps': 3016, 'loss/train': 1.3082367181777954} -09/21/2021 00:56:34 - INFO - __main__ - Step 48269: {'lr': 0.00019895715249702275, 'samples': 1544608, 'steps': 3016, 'loss/train': 2.2442312240600586} -09/21/2021 00:56:34 - INFO - __main__ - Step 48270: {'lr': 0.00019895715249702275, 'samples': 1544640, 'steps': 3016, 'loss/train': 2.0711050033569336} -09/21/2021 00:56:35 - INFO - __main__ - Step 48271: {'lr': 0.00019895715249702275, 'samples': 1544672, 'steps': 3016, 'loss/train': 2.0081820487976074} -09/21/2021 00:56:36 - INFO - __main__ - Step 48272: {'lr': 0.00019895715249702275, 'samples': 1544704, 'steps': 3016, 'loss/train': 2.06424617767334} -09/21/2021 00:56:37 - INFO - __main__ - Step 48273: {'lr': 0.00019895623346854633, 'samples': 1544736, 'steps': 3017, 'loss/train': 1.50603187084198} -09/21/2021 00:56:38 - INFO - __main__ - Step 48274: {'lr': 0.00019895623346854633, 'samples': 1544768, 'steps': 3017, 'loss/train': 1.8659402132034302} -09/21/2021 00:56:38 - INFO - __main__ - Step 48275: {'lr': 0.00019895623346854633, 'samples': 1544800, 'steps': 3017, 'loss/train': 1.6469544172286987} -09/21/2021 00:56:39 - INFO - __main__ - Step 48276: {'lr': 0.00019895623346854633, 'samples': 1544832, 'steps': 3017, 'loss/train': 1.1201729774475098} -09/21/2021 00:56:40 - INFO - __main__ - Step 48277: {'lr': 0.00019895623346854633, 'samples': 1544864, 'steps': 3017, 'loss/train': 1.6358433961868286} -09/21/2021 00:56:41 - INFO - __main__ - Step 48278: {'lr': 0.00019895623346854633, 'samples': 1544896, 'steps': 3017, 'loss/train': 2.4364941120147705} -09/21/2021 00:56:41 - INFO - __main__ - Step 48279: {'lr': 0.00019895623346854633, 'samples': 1544928, 'steps': 3017, 'loss/train': 1.9334980249404907} -09/21/2021 00:56:42 - INFO - __main__ - Step 48280: {'lr': 0.00019895623346854633, 'samples': 1544960, 'steps': 3017, 'loss/train': 2.1246204376220703} -09/21/2021 00:56:43 - INFO - __main__ - Step 48281: {'lr': 0.00019895623346854633, 'samples': 1544992, 'steps': 3017, 'loss/train': 2.474400043487549} -09/21/2021 00:56:44 - INFO - __main__ - Step 48282: {'lr': 0.00019895623346854633, 'samples': 1545024, 'steps': 3017, 'loss/train': 2.7620866298675537} -09/21/2021 00:56:44 - INFO - __main__ - Step 48283: {'lr': 0.00019895623346854633, 'samples': 1545056, 'steps': 3017, 'loss/train': 1.4859668016433716} -09/21/2021 00:56:45 - INFO - __main__ - Step 48284: {'lr': 0.00019895623346854633, 'samples': 1545088, 'steps': 3017, 'loss/train': 1.982683539390564} -09/21/2021 00:56:47 - INFO - __main__ - Step 48285: {'lr': 0.00019895623346854633, 'samples': 1545120, 'steps': 3017, 'loss/train': 2.6752870082855225} -09/21/2021 00:56:48 - INFO - __main__ - Step 48286: {'lr': 0.00019895623346854633, 'samples': 1545152, 'steps': 3017, 'loss/train': 1.8989664316177368} -09/21/2021 00:56:48 - INFO - __main__ - Step 48287: {'lr': 0.00019895623346854633, 'samples': 1545184, 'steps': 3017, 'loss/train': 2.123704671859741} -09/21/2021 00:56:49 - INFO - __main__ - Step 48288: {'lr': 0.00019895623346854633, 'samples': 1545216, 'steps': 3017, 'loss/train': 1.5253245830535889} -09/21/2021 00:56:50 - INFO - __main__ - Step 48289: {'lr': 0.0001989553140374174, 'samples': 1545248, 'steps': 3018, 'loss/train': 2.35017991065979} -09/21/2021 00:56:51 - INFO - __main__ - Step 48290: {'lr': 0.0001989553140374174, 'samples': 1545280, 'steps': 3018, 'loss/train': 1.5984970331192017} -09/21/2021 00:56:52 - INFO - __main__ - Step 48291: {'lr': 0.0001989553140374174, 'samples': 1545312, 'steps': 3018, 'loss/train': 2.191962718963623} -09/21/2021 00:56:52 - INFO - __main__ - Step 48292: {'lr': 0.0001989553140374174, 'samples': 1545344, 'steps': 3018, 'loss/train': 1.7524774074554443} -09/21/2021 00:56:53 - INFO - __main__ - Step 48293: {'lr': 0.0001989553140374174, 'samples': 1545376, 'steps': 3018, 'loss/train': 2.351806163787842} -09/21/2021 00:56:54 - INFO - __main__ - Step 48294: {'lr': 0.0001989553140374174, 'samples': 1545408, 'steps': 3018, 'loss/train': 1.1342756748199463} -09/21/2021 00:56:55 - INFO - __main__ - Step 48295: {'lr': 0.0001989553140374174, 'samples': 1545440, 'steps': 3018, 'loss/train': 2.104457139968872} -09/21/2021 00:56:55 - INFO - __main__ - Step 48296: {'lr': 0.0001989553140374174, 'samples': 1545472, 'steps': 3018, 'loss/train': 0.47904300689697266} -09/21/2021 00:56:56 - INFO - __main__ - Step 48297: {'lr': 0.0001989553140374174, 'samples': 1545504, 'steps': 3018, 'loss/train': 0.21226036548614502} -09/21/2021 00:56:57 - INFO - __main__ - Step 48298: {'lr': 0.0001989553140374174, 'samples': 1545536, 'steps': 3018, 'loss/train': 0.24035774171352386} -09/21/2021 00:56:58 - INFO - __main__ - Step 48299: {'lr': 0.0001989553140374174, 'samples': 1545568, 'steps': 3018, 'loss/train': 0.319898396730423} -09/21/2021 00:56:58 - INFO - __main__ - Step 48300: {'lr': 0.0001989553140374174, 'samples': 1545600, 'steps': 3018, 'loss/train': 0.37408798933029175} -09/21/2021 00:56:59 - INFO - __main__ - Step 48301: {'lr': 0.0001989553140374174, 'samples': 1545632, 'steps': 3018, 'loss/train': 0.2555217444896698} -09/21/2021 00:57:00 - INFO - __main__ - Step 48302: {'lr': 0.0001989553140374174, 'samples': 1545664, 'steps': 3018, 'loss/train': 0.23137077689170837} -09/21/2021 00:57:01 - INFO - __main__ - Step 48303: {'lr': 0.0001989553140374174, 'samples': 1545696, 'steps': 3018, 'loss/train': 2.3566205501556396} -09/21/2021 00:57:01 - INFO - __main__ - Step 48304: {'lr': 0.0001989553140374174, 'samples': 1545728, 'steps': 3018, 'loss/train': 1.8480713367462158} -09/21/2021 00:57:02 - INFO - __main__ - Step 48305: {'lr': 0.00019895439420363964, 'samples': 1545760, 'steps': 3019, 'loss/train': 0.25128862261772156} -09/21/2021 00:57:03 - INFO - __main__ - Step 48306: {'lr': 0.00019895439420363964, 'samples': 1545792, 'steps': 3019, 'loss/train': 0.8297259211540222} -09/21/2021 00:57:04 - INFO - __main__ - Step 48307: {'lr': 0.00019895439420363964, 'samples': 1545824, 'steps': 3019, 'loss/train': 2.256276845932007} -09/21/2021 00:57:04 - INFO - __main__ - Step 48308: {'lr': 0.00019895439420363964, 'samples': 1545856, 'steps': 3019, 'loss/train': 1.941171407699585} -09/21/2021 00:57:05 - INFO - __main__ - Step 48309: {'lr': 0.00019895439420363964, 'samples': 1545888, 'steps': 3019, 'loss/train': 1.4441102743148804} -09/21/2021 00:57:06 - INFO - __main__ - Step 48310: {'lr': 0.00019895439420363964, 'samples': 1545920, 'steps': 3019, 'loss/train': 1.4922276735305786} -09/21/2021 00:57:07 - INFO - __main__ - Step 48311: {'lr': 0.00019895439420363964, 'samples': 1545952, 'steps': 3019, 'loss/train': 1.5349085330963135} -09/21/2021 00:57:07 - INFO - __main__ - Step 48312: {'lr': 0.00019895439420363964, 'samples': 1545984, 'steps': 3019, 'loss/train': 1.5072658061981201} -09/21/2021 00:57:08 - INFO - __main__ - Step 48313: {'lr': 0.00019895439420363964, 'samples': 1546016, 'steps': 3019, 'loss/train': 1.6099597215652466} -09/21/2021 00:57:09 - INFO - __main__ - Step 48314: {'lr': 0.00019895439420363964, 'samples': 1546048, 'steps': 3019, 'loss/train': 2.579958200454712} -09/21/2021 00:57:10 - INFO - __main__ - Step 48315: {'lr': 0.00019895439420363964, 'samples': 1546080, 'steps': 3019, 'loss/train': 1.6352349519729614} -09/21/2021 00:57:11 - INFO - __main__ - Step 48316: {'lr': 0.00019895439420363964, 'samples': 1546112, 'steps': 3019, 'loss/train': 1.0777456760406494} -09/21/2021 00:57:12 - INFO - __main__ - Step 48317: {'lr': 0.00019895439420363964, 'samples': 1546144, 'steps': 3019, 'loss/train': 1.6113346815109253} -09/21/2021 00:57:13 - INFO - __main__ - Step 48318: {'lr': 0.00019895439420363964, 'samples': 1546176, 'steps': 3019, 'loss/train': 2.2886643409729004} -09/21/2021 00:57:13 - INFO - __main__ - Step 48319: {'lr': 0.00019895439420363964, 'samples': 1546208, 'steps': 3019, 'loss/train': 2.1524953842163086} -09/21/2021 00:57:14 - INFO - __main__ - Step 48320: {'lr': 0.00019895439420363964, 'samples': 1546240, 'steps': 3019, 'loss/train': 1.9031168222427368} -09/21/2021 00:57:15 - INFO - __main__ - Step 48321: {'lr': 0.00019895347396721685, 'samples': 1546272, 'steps': 3020, 'loss/train': 1.9967336654663086} -09/21/2021 00:57:16 - INFO - __main__ - Step 48322: {'lr': 0.00019895347396721685, 'samples': 1546304, 'steps': 3020, 'loss/train': 1.8021024465560913} -09/21/2021 00:57:16 - INFO - __main__ - Step 48323: {'lr': 0.00019895347396721685, 'samples': 1546336, 'steps': 3020, 'loss/train': 1.718738317489624} -09/21/2021 00:57:17 - INFO - __main__ - Step 48324: {'lr': 0.00019895347396721685, 'samples': 1546368, 'steps': 3020, 'loss/train': 2.101491689682007} -09/21/2021 00:57:18 - INFO - __main__ - Step 48325: {'lr': 0.00019895347396721685, 'samples': 1546400, 'steps': 3020, 'loss/train': 1.1111708879470825} -09/21/2021 00:57:19 - INFO - __main__ - Step 48326: {'lr': 0.00019895347396721685, 'samples': 1546432, 'steps': 3020, 'loss/train': 2.083744525909424} -09/21/2021 00:57:19 - INFO - __main__ - Step 48327: {'lr': 0.00019895347396721685, 'samples': 1546464, 'steps': 3020, 'loss/train': 2.1537797451019287} -09/21/2021 00:57:20 - INFO - __main__ - Step 48328: {'lr': 0.00019895347396721685, 'samples': 1546496, 'steps': 3020, 'loss/train': 1.767717957496643} -09/21/2021 00:57:21 - INFO - __main__ - Step 48329: {'lr': 0.00019895347396721685, 'samples': 1546528, 'steps': 3020, 'loss/train': 2.463179588317871} -09/21/2021 00:57:22 - INFO - __main__ - Step 48330: {'lr': 0.00019895347396721685, 'samples': 1546560, 'steps': 3020, 'loss/train': 1.733313798904419} -09/21/2021 00:57:22 - INFO - __main__ - Step 48331: {'lr': 0.00019895347396721685, 'samples': 1546592, 'steps': 3020, 'loss/train': 2.0158286094665527} -09/21/2021 00:57:23 - INFO - __main__ - Step 48332: {'lr': 0.00019895347396721685, 'samples': 1546624, 'steps': 3020, 'loss/train': 1.6354326009750366} -09/21/2021 00:57:24 - INFO - __main__ - Step 48333: {'lr': 0.00019895347396721685, 'samples': 1546656, 'steps': 3020, 'loss/train': 0.29494884610176086} -09/21/2021 00:57:25 - INFO - __main__ - Step 48334: {'lr': 0.00019895347396721685, 'samples': 1546688, 'steps': 3020, 'loss/train': 1.8042112588882446} -09/21/2021 00:57:25 - INFO - __main__ - Step 48335: {'lr': 0.00019895347396721685, 'samples': 1546720, 'steps': 3020, 'loss/train': 1.6313385963439941} -09/21/2021 00:57:26 - INFO - __main__ - Step 48336: {'lr': 0.00019895347396721685, 'samples': 1546752, 'steps': 3020, 'loss/train': 1.7920130491256714} -09/21/2021 00:57:27 - INFO - __main__ - Step 48337: {'lr': 0.00019895255332815274, 'samples': 1546784, 'steps': 3021, 'loss/train': 2.072493314743042} -09/21/2021 00:57:28 - INFO - __main__ - Step 48338: {'lr': 0.00019895255332815274, 'samples': 1546816, 'steps': 3021, 'loss/train': 1.900696039199829} -09/21/2021 00:57:29 - INFO - __main__ - Step 48339: {'lr': 0.00019895255332815274, 'samples': 1546848, 'steps': 3021, 'loss/train': 2.4063234329223633} -09/21/2021 00:57:29 - INFO - __main__ - Step 48340: {'lr': 0.00019895255332815274, 'samples': 1546880, 'steps': 3021, 'loss/train': 1.7873640060424805} -09/21/2021 00:57:30 - INFO - __main__ - Step 48341: {'lr': 0.00019895255332815274, 'samples': 1546912, 'steps': 3021, 'loss/train': 1.5041651725769043} -09/21/2021 00:57:31 - INFO - __main__ - Step 48342: {'lr': 0.00019895255332815274, 'samples': 1546944, 'steps': 3021, 'loss/train': 1.820707082748413} -09/21/2021 00:57:32 - INFO - __main__ - Step 48343: {'lr': 0.00019895255332815274, 'samples': 1546976, 'steps': 3021, 'loss/train': 0.6305542588233948} -09/21/2021 00:57:32 - INFO - __main__ - Step 48344: {'lr': 0.00019895255332815274, 'samples': 1547008, 'steps': 3021, 'loss/train': 1.8031545877456665} -09/21/2021 00:57:33 - INFO - __main__ - Step 48345: {'lr': 0.00019895255332815274, 'samples': 1547040, 'steps': 3021, 'loss/train': 1.826785922050476} -09/21/2021 00:57:34 - INFO - __main__ - Step 48346: {'lr': 0.00019895255332815274, 'samples': 1547072, 'steps': 3021, 'loss/train': 6.137558937072754} -09/21/2021 00:57:35 - INFO - __main__ - Step 48347: {'lr': 0.00019895255332815274, 'samples': 1547104, 'steps': 3021, 'loss/train': 5.3959808349609375} -09/21/2021 00:57:35 - INFO - __main__ - Step 48348: {'lr': 0.00019895255332815274, 'samples': 1547136, 'steps': 3021, 'loss/train': 5.534483909606934} -09/21/2021 00:57:37 - INFO - __main__ - Step 48349: {'lr': 0.00019895255332815274, 'samples': 1547168, 'steps': 3021, 'loss/train': 2.859023332595825} -09/21/2021 00:57:37 - INFO - __main__ - Step 48350: {'lr': 0.00019895255332815274, 'samples': 1547200, 'steps': 3021, 'loss/train': 1.876248836517334} -09/21/2021 00:57:38 - INFO - __main__ - Step 48351: {'lr': 0.00019895255332815274, 'samples': 1547232, 'steps': 3021, 'loss/train': 2.0234262943267822} -09/21/2021 00:57:39 - INFO - __main__ - Step 48352: {'lr': 0.00019895255332815274, 'samples': 1547264, 'steps': 3021, 'loss/train': 4.860368728637695} -09/21/2021 00:57:40 - INFO - __main__ - Step 48353: {'lr': 0.00019895163228645112, 'samples': 1547296, 'steps': 3022, 'loss/train': 2.754121780395508} -09/21/2021 00:57:41 - INFO - __main__ - Step 48354: {'lr': 0.00019895163228645112, 'samples': 1547328, 'steps': 3022, 'loss/train': 1.7236285209655762} -09/21/2021 00:57:41 - INFO - __main__ - Step 48355: {'lr': 0.00019895163228645112, 'samples': 1547360, 'steps': 3022, 'loss/train': 1.9985941648483276} -09/21/2021 00:57:42 - INFO - __main__ - Step 48356: {'lr': 0.00019895163228645112, 'samples': 1547392, 'steps': 3022, 'loss/train': 1.6528589725494385} -09/21/2021 00:57:43 - INFO - __main__ - Step 48357: {'lr': 0.00019895163228645112, 'samples': 1547424, 'steps': 3022, 'loss/train': 1.9755818843841553} -09/21/2021 00:57:44 - INFO - __main__ - Step 48358: {'lr': 0.00019895163228645112, 'samples': 1547456, 'steps': 3022, 'loss/train': 1.641339898109436} -09/21/2021 00:57:44 - INFO - __main__ - Step 48359: {'lr': 0.00019895163228645112, 'samples': 1547488, 'steps': 3022, 'loss/train': 1.872385859489441} -09/21/2021 00:57:45 - INFO - __main__ - Step 48360: {'lr': 0.00019895163228645112, 'samples': 1547520, 'steps': 3022, 'loss/train': 2.9414570331573486} -09/21/2021 00:57:46 - INFO - __main__ - Step 48361: {'lr': 0.00019895163228645112, 'samples': 1547552, 'steps': 3022, 'loss/train': 1.1872105598449707} -09/21/2021 00:57:47 - INFO - __main__ - Step 48362: {'lr': 0.00019895163228645112, 'samples': 1547584, 'steps': 3022, 'loss/train': 1.230660080909729} -09/21/2021 00:57:47 - INFO - __main__ - Step 48363: {'lr': 0.00019895163228645112, 'samples': 1547616, 'steps': 3022, 'loss/train': 1.6527258157730103} -09/21/2021 00:57:48 - INFO - __main__ - Step 48364: {'lr': 0.00019895163228645112, 'samples': 1547648, 'steps': 3022, 'loss/train': 1.656637191772461} -09/21/2021 00:57:49 - INFO - __main__ - Step 48365: {'lr': 0.00019895163228645112, 'samples': 1547680, 'steps': 3022, 'loss/train': 2.370710849761963} -09/21/2021 00:57:50 - INFO - __main__ - Step 48366: {'lr': 0.00019895163228645112, 'samples': 1547712, 'steps': 3022, 'loss/train': 0.5667145252227783} -09/21/2021 00:57:50 - INFO - __main__ - Step 48367: {'lr': 0.00019895163228645112, 'samples': 1547744, 'steps': 3022, 'loss/train': 1.9549674987792969} -09/21/2021 00:57:51 - INFO - __main__ - Step 48368: {'lr': 0.00019895163228645112, 'samples': 1547776, 'steps': 3022, 'loss/train': 1.5752462148666382} -09/21/2021 00:57:52 - INFO - __main__ - Step 48369: {'lr': 0.00019895071084211565, 'samples': 1547808, 'steps': 3023, 'loss/train': 2.3583545684814453} -09/21/2021 00:57:53 - INFO - __main__ - Step 48370: {'lr': 0.00019895071084211565, 'samples': 1547840, 'steps': 3023, 'loss/train': 1.7242752313613892} -09/21/2021 00:57:53 - INFO - __main__ - Step 48371: {'lr': 0.00019895071084211565, 'samples': 1547872, 'steps': 3023, 'loss/train': 2.088421106338501} -09/21/2021 00:57:54 - INFO - __main__ - Step 48372: {'lr': 0.00019895071084211565, 'samples': 1547904, 'steps': 3023, 'loss/train': 1.0644375085830688} -09/21/2021 00:57:55 - INFO - __main__ - Step 48373: {'lr': 0.00019895071084211565, 'samples': 1547936, 'steps': 3023, 'loss/train': 1.436227798461914} -09/21/2021 00:57:56 - INFO - __main__ - Step 48374: {'lr': 0.00019895071084211565, 'samples': 1547968, 'steps': 3023, 'loss/train': 2.0848894119262695} -09/21/2021 00:57:56 - INFO - __main__ - Step 48375: {'lr': 0.00019895071084211565, 'samples': 1548000, 'steps': 3023, 'loss/train': 1.6468771696090698} -09/21/2021 00:57:57 - INFO - __main__ - Step 48376: {'lr': 0.00019895071084211565, 'samples': 1548032, 'steps': 3023, 'loss/train': 1.183835506439209} -09/21/2021 00:57:58 - INFO - __main__ - Step 48377: {'lr': 0.00019895071084211565, 'samples': 1548064, 'steps': 3023, 'loss/train': 1.6845663785934448} -09/21/2021 00:57:59 - INFO - __main__ - Step 48378: {'lr': 0.00019895071084211565, 'samples': 1548096, 'steps': 3023, 'loss/train': 1.6292980909347534} -09/21/2021 00:57:59 - INFO - __main__ - Step 48379: {'lr': 0.00019895071084211565, 'samples': 1548128, 'steps': 3023, 'loss/train': 2.4698338508605957} -09/21/2021 00:58:01 - INFO - __main__ - Step 48380: {'lr': 0.00019895071084211565, 'samples': 1548160, 'steps': 3023, 'loss/train': 2.22800874710083} -09/21/2021 00:58:01 - INFO - __main__ - Step 48381: {'lr': 0.00019895071084211565, 'samples': 1548192, 'steps': 3023, 'loss/train': 1.8301764726638794} -09/21/2021 00:58:02 - INFO - __main__ - Step 48382: {'lr': 0.00019895071084211565, 'samples': 1548224, 'steps': 3023, 'loss/train': 1.7328661680221558} -09/21/2021 00:58:03 - INFO - __main__ - Step 48383: {'lr': 0.00019895071084211565, 'samples': 1548256, 'steps': 3023, 'loss/train': 3.425797939300537} -09/21/2021 00:58:04 - INFO - __main__ - Step 48384: {'lr': 0.00019895071084211565, 'samples': 1548288, 'steps': 3023, 'loss/train': 2.2691197395324707} -09/21/2021 00:58:05 - INFO - __main__ - Step 48385: {'lr': 0.00019894978899515013, 'samples': 1548320, 'steps': 3024, 'loss/train': 1.7683030366897583} -09/21/2021 00:58:05 - INFO - __main__ - Step 48386: {'lr': 0.00019894978899515013, 'samples': 1548352, 'steps': 3024, 'loss/train': 1.4081552028656006} -09/21/2021 00:58:06 - INFO - __main__ - Step 48387: {'lr': 0.00019894978899515013, 'samples': 1548384, 'steps': 3024, 'loss/train': 1.0700387954711914} -09/21/2021 00:58:07 - INFO - __main__ - Step 48388: {'lr': 0.00019894978899515013, 'samples': 1548416, 'steps': 3024, 'loss/train': 1.5084704160690308} -09/21/2021 00:58:08 - INFO - __main__ - Step 48389: {'lr': 0.00019894978899515013, 'samples': 1548448, 'steps': 3024, 'loss/train': 2.403172254562378} -09/21/2021 00:58:08 - INFO - __main__ - Step 48390: {'lr': 0.00019894978899515013, 'samples': 1548480, 'steps': 3024, 'loss/train': 2.0332436561584473} -09/21/2021 00:58:09 - INFO - __main__ - Step 48391: {'lr': 0.00019894978899515013, 'samples': 1548512, 'steps': 3024, 'loss/train': 2.0188543796539307} -09/21/2021 00:58:10 - INFO - __main__ - Step 48392: {'lr': 0.00019894978899515013, 'samples': 1548544, 'steps': 3024, 'loss/train': 1.3037596940994263} -09/21/2021 00:58:11 - INFO - __main__ - Step 48393: {'lr': 0.00019894978899515013, 'samples': 1548576, 'steps': 3024, 'loss/train': 4.0880866050720215} -09/21/2021 00:58:11 - INFO - __main__ - Step 48394: {'lr': 0.00019894978899515013, 'samples': 1548608, 'steps': 3024, 'loss/train': 1.8237922191619873} -09/21/2021 00:58:12 - INFO - __main__ - Step 48395: {'lr': 0.00019894978899515013, 'samples': 1548640, 'steps': 3024, 'loss/train': 1.7529428005218506} -09/21/2021 00:58:13 - INFO - __main__ - Step 48396: {'lr': 0.00019894978899515013, 'samples': 1548672, 'steps': 3024, 'loss/train': 1.8269000053405762} -09/21/2021 00:58:14 - INFO - __main__ - Step 48397: {'lr': 0.00019894978899515013, 'samples': 1548704, 'steps': 3024, 'loss/train': 1.907530665397644} -09/21/2021 00:58:14 - INFO - __main__ - Step 48398: {'lr': 0.00019894978899515013, 'samples': 1548736, 'steps': 3024, 'loss/train': 2.0198428630828857} -09/21/2021 00:58:15 - INFO - __main__ - Step 48399: {'lr': 0.00019894978899515013, 'samples': 1548768, 'steps': 3024, 'loss/train': 2.36257004737854} -09/21/2021 00:58:16 - INFO - __main__ - Step 48400: {'lr': 0.00019894978899515013, 'samples': 1548800, 'steps': 3024, 'loss/train': 0.757607638835907} -09/21/2021 00:58:17 - INFO - __main__ - Step 48401: {'lr': 0.0001989488667455583, 'samples': 1548832, 'steps': 3025, 'loss/train': 1.9329646825790405} -09/21/2021 00:58:18 - INFO - __main__ - Step 48402: {'lr': 0.0001989488667455583, 'samples': 1548864, 'steps': 3025, 'loss/train': 1.5690393447875977} -09/21/2021 00:58:18 - INFO - __main__ - Step 48403: {'lr': 0.0001989488667455583, 'samples': 1548896, 'steps': 3025, 'loss/train': 1.4926272630691528} -09/21/2021 00:58:19 - INFO - __main__ - Step 48404: {'lr': 0.0001989488667455583, 'samples': 1548928, 'steps': 3025, 'loss/train': 1.6996933221817017} -09/21/2021 00:58:20 - INFO - __main__ - Step 48405: {'lr': 0.0001989488667455583, 'samples': 1548960, 'steps': 3025, 'loss/train': 0.4404924511909485} -09/21/2021 00:58:21 - INFO - __main__ - Step 48406: {'lr': 0.0001989488667455583, 'samples': 1548992, 'steps': 3025, 'loss/train': 1.3866991996765137} -09/21/2021 00:58:21 - INFO - __main__ - Step 48407: {'lr': 0.0001989488667455583, 'samples': 1549024, 'steps': 3025, 'loss/train': 1.9697387218475342} -09/21/2021 00:58:22 - INFO - __main__ - Step 48408: {'lr': 0.0001989488667455583, 'samples': 1549056, 'steps': 3025, 'loss/train': 2.52284836769104} -09/21/2021 00:58:23 - INFO - __main__ - Step 48409: {'lr': 0.0001989488667455583, 'samples': 1549088, 'steps': 3025, 'loss/train': 2.2295467853546143} -09/21/2021 00:58:24 - INFO - __main__ - Step 48410: {'lr': 0.0001989488667455583, 'samples': 1549120, 'steps': 3025, 'loss/train': 2.0020456314086914} -09/21/2021 00:58:24 - INFO - __main__ - Step 48411: {'lr': 0.0001989488667455583, 'samples': 1549152, 'steps': 3025, 'loss/train': 2.328589677810669} -09/21/2021 00:58:26 - INFO - __main__ - Step 48412: {'lr': 0.0001989488667455583, 'samples': 1549184, 'steps': 3025, 'loss/train': 1.7411729097366333} -09/21/2021 00:58:26 - INFO - __main__ - Step 48413: {'lr': 0.0001989488667455583, 'samples': 1549216, 'steps': 3025, 'loss/train': 1.8077336549758911} -09/21/2021 00:58:27 - INFO - __main__ - Step 48414: {'lr': 0.0001989488667455583, 'samples': 1549248, 'steps': 3025, 'loss/train': 4.000767707824707} -09/21/2021 00:58:28 - INFO - __main__ - Step 48415: {'lr': 0.0001989488667455583, 'samples': 1549280, 'steps': 3025, 'loss/train': 1.8161516189575195} -09/21/2021 00:58:29 - INFO - __main__ - Step 48416: {'lr': 0.0001989488667455583, 'samples': 1549312, 'steps': 3025, 'loss/train': 1.3967970609664917} -09/21/2021 00:58:30 - INFO - __main__ - Step 48417: {'lr': 0.00019894794409334394, 'samples': 1549344, 'steps': 3026, 'loss/train': 1.8118577003479004} -09/21/2021 00:58:30 - INFO - __main__ - Step 48418: {'lr': 0.00019894794409334394, 'samples': 1549376, 'steps': 3026, 'loss/train': 2.6066181659698486} -09/21/2021 00:58:31 - INFO - __main__ - Step 48419: {'lr': 0.00019894794409334394, 'samples': 1549408, 'steps': 3026, 'loss/train': 0.2892991006374359} -09/21/2021 00:58:32 - INFO - __main__ - Step 48420: {'lr': 0.00019894794409334394, 'samples': 1549440, 'steps': 3026, 'loss/train': 2.5369110107421875} -09/21/2021 00:58:33 - INFO - __main__ - Step 48421: {'lr': 0.00019894794409334394, 'samples': 1549472, 'steps': 3026, 'loss/train': 2.5930075645446777} -09/21/2021 00:58:33 - INFO - __main__ - Step 48422: {'lr': 0.00019894794409334394, 'samples': 1549504, 'steps': 3026, 'loss/train': 2.192422389984131} -09/21/2021 00:58:34 - INFO - __main__ - Step 48423: {'lr': 0.00019894794409334394, 'samples': 1549536, 'steps': 3026, 'loss/train': 1.4965554475784302} -09/21/2021 00:58:35 - INFO - __main__ - Step 48424: {'lr': 0.00019894794409334394, 'samples': 1549568, 'steps': 3026, 'loss/train': 1.5720497369766235} -09/21/2021 00:58:36 - INFO - __main__ - Step 48425: {'lr': 0.00019894794409334394, 'samples': 1549600, 'steps': 3026, 'loss/train': 2.37249493598938} -09/21/2021 00:58:36 - INFO - __main__ - Step 48426: {'lr': 0.00019894794409334394, 'samples': 1549632, 'steps': 3026, 'loss/train': 2.0653913021087646} -09/21/2021 00:58:37 - INFO - __main__ - Step 48427: {'lr': 0.00019894794409334394, 'samples': 1549664, 'steps': 3026, 'loss/train': 1.0543079376220703} -09/21/2021 00:58:38 - INFO - __main__ - Step 48428: {'lr': 0.00019894794409334394, 'samples': 1549696, 'steps': 3026, 'loss/train': 2.334886074066162} -09/21/2021 00:58:39 - INFO - __main__ - Step 48429: {'lr': 0.00019894794409334394, 'samples': 1549728, 'steps': 3026, 'loss/train': 1.9479076862335205} -09/21/2021 00:58:39 - INFO - __main__ - Step 48430: {'lr': 0.00019894794409334394, 'samples': 1549760, 'steps': 3026, 'loss/train': 2.0710103511810303} -09/21/2021 00:58:40 - INFO - __main__ - Step 48431: {'lr': 0.00019894794409334394, 'samples': 1549792, 'steps': 3026, 'loss/train': 1.4011647701263428} -09/21/2021 00:58:41 - INFO - __main__ - Step 48432: {'lr': 0.00019894794409334394, 'samples': 1549824, 'steps': 3026, 'loss/train': 1.5732156038284302} -09/21/2021 00:58:42 - INFO - __main__ - Step 48433: {'lr': 0.00019894702103851074, 'samples': 1549856, 'steps': 3027, 'loss/train': 2.553797721862793} -09/21/2021 00:58:42 - INFO - __main__ - Step 48434: {'lr': 0.00019894702103851074, 'samples': 1549888, 'steps': 3027, 'loss/train': 1.3340039253234863} -09/21/2021 00:58:43 - INFO - __main__ - Step 48435: {'lr': 0.00019894702103851074, 'samples': 1549920, 'steps': 3027, 'loss/train': 1.1674003601074219} -09/21/2021 00:58:44 - INFO - __main__ - Step 48436: {'lr': 0.00019894702103851074, 'samples': 1549952, 'steps': 3027, 'loss/train': 1.8817551136016846} -09/21/2021 00:58:45 - INFO - __main__ - Step 48437: {'lr': 0.00019894702103851074, 'samples': 1549984, 'steps': 3027, 'loss/train': 1.9271026849746704} -09/21/2021 00:58:45 - INFO - __main__ - Step 48438: {'lr': 0.00019894702103851074, 'samples': 1550016, 'steps': 3027, 'loss/train': 2.07820987701416} -09/21/2021 00:58:46 - INFO - __main__ - Step 48439: {'lr': 0.00019894702103851074, 'samples': 1550048, 'steps': 3027, 'loss/train': 1.5876160860061646} -09/21/2021 00:58:47 - INFO - __main__ - Step 48440: {'lr': 0.00019894702103851074, 'samples': 1550080, 'steps': 3027, 'loss/train': 1.4359805583953857} -09/21/2021 00:58:48 - INFO - __main__ - Step 48441: {'lr': 0.00019894702103851074, 'samples': 1550112, 'steps': 3027, 'loss/train': 2.3712828159332275} -09/21/2021 00:58:48 - INFO - __main__ - Step 48442: {'lr': 0.00019894702103851074, 'samples': 1550144, 'steps': 3027, 'loss/train': 1.2416775226593018} -09/21/2021 00:58:50 - INFO - __main__ - Step 48443: {'lr': 0.00019894702103851074, 'samples': 1550176, 'steps': 3027, 'loss/train': 1.812482237815857} -09/21/2021 00:58:51 - INFO - __main__ - Step 48444: {'lr': 0.00019894702103851074, 'samples': 1550208, 'steps': 3027, 'loss/train': 0.7429904341697693} -09/21/2021 00:58:51 - INFO - __main__ - Step 48445: {'lr': 0.00019894702103851074, 'samples': 1550240, 'steps': 3027, 'loss/train': 3.0746068954467773} -09/21/2021 00:58:52 - INFO - __main__ - Step 48446: {'lr': 0.00019894702103851074, 'samples': 1550272, 'steps': 3027, 'loss/train': 1.3912698030471802} -09/21/2021 00:58:53 - INFO - __main__ - Step 48447: {'lr': 0.00019894702103851074, 'samples': 1550304, 'steps': 3027, 'loss/train': 2.0063042640686035} -09/21/2021 00:58:54 - INFO - __main__ - Step 48448: {'lr': 0.00019894702103851074, 'samples': 1550336, 'steps': 3027, 'loss/train': 1.2223206758499146} -09/21/2021 00:58:55 - INFO - __main__ - Step 48449: {'lr': 0.00019894609758106256, 'samples': 1550368, 'steps': 3028, 'loss/train': 2.0777316093444824} -09/21/2021 00:58:55 - INFO - __main__ - Step 48450: {'lr': 0.00019894609758106256, 'samples': 1550400, 'steps': 3028, 'loss/train': 2.582146644592285} -09/21/2021 00:58:56 - INFO - __main__ - Step 48451: {'lr': 0.00019894609758106256, 'samples': 1550432, 'steps': 3028, 'loss/train': 1.5379045009613037} -09/21/2021 00:58:57 - INFO - __main__ - Step 48452: {'lr': 0.00019894609758106256, 'samples': 1550464, 'steps': 3028, 'loss/train': 2.3880696296691895} -09/21/2021 00:58:58 - INFO - __main__ - Step 48453: {'lr': 0.00019894609758106256, 'samples': 1550496, 'steps': 3028, 'loss/train': 2.557917594909668} -09/21/2021 00:58:58 - INFO - __main__ - Step 48454: {'lr': 0.00019894609758106256, 'samples': 1550528, 'steps': 3028, 'loss/train': 2.253455638885498} -09/21/2021 00:58:59 - INFO - __main__ - Step 48455: {'lr': 0.00019894609758106256, 'samples': 1550560, 'steps': 3028, 'loss/train': 0.5872236490249634} -09/21/2021 00:59:00 - INFO - __main__ - Step 48456: {'lr': 0.00019894609758106256, 'samples': 1550592, 'steps': 3028, 'loss/train': 0.33965131640434265} -09/21/2021 00:59:01 - INFO - __main__ - Step 48457: {'lr': 0.00019894609758106256, 'samples': 1550624, 'steps': 3028, 'loss/train': 0.4210735261440277} -09/21/2021 00:59:01 - INFO - __main__ - Step 48458: {'lr': 0.00019894609758106256, 'samples': 1550656, 'steps': 3028, 'loss/train': 0.5287995934486389} -09/21/2021 00:59:02 - INFO - __main__ - Step 48459: {'lr': 0.00019894609758106256, 'samples': 1550688, 'steps': 3028, 'loss/train': 0.47330421209335327} -09/21/2021 00:59:03 - INFO - __main__ - Step 48460: {'lr': 0.00019894609758106256, 'samples': 1550720, 'steps': 3028, 'loss/train': 1.9418593645095825} -09/21/2021 00:59:04 - INFO - __main__ - Step 48461: {'lr': 0.00019894609758106256, 'samples': 1550752, 'steps': 3028, 'loss/train': 2.8458380699157715} -09/21/2021 00:59:04 - INFO - __main__ - Step 48462: {'lr': 0.00019894609758106256, 'samples': 1550784, 'steps': 3028, 'loss/train': 1.4898767471313477} -09/21/2021 00:59:05 - INFO - __main__ - Step 48463: {'lr': 0.00019894609758106256, 'samples': 1550816, 'steps': 3028, 'loss/train': 1.9010769128799438} -09/21/2021 00:59:06 - INFO - __main__ - Step 48464: {'lr': 0.00019894609758106256, 'samples': 1550848, 'steps': 3028, 'loss/train': 3.1413419246673584} -09/21/2021 00:59:07 - INFO - __main__ - Step 48465: {'lr': 0.00019894517372100304, 'samples': 1550880, 'steps': 3029, 'loss/train': 1.5961252450942993} -09/21/2021 00:59:07 - INFO - __main__ - Step 48466: {'lr': 0.00019894517372100304, 'samples': 1550912, 'steps': 3029, 'loss/train': 1.7477525472640991} -09/21/2021 00:59:08 - INFO - __main__ - Step 48467: {'lr': 0.00019894517372100304, 'samples': 1550944, 'steps': 3029, 'loss/train': 0.18716642260551453} -09/21/2021 00:59:09 - INFO - __main__ - Step 48468: {'lr': 0.00019894517372100304, 'samples': 1550976, 'steps': 3029, 'loss/train': 2.5783886909484863} -09/21/2021 00:59:10 - INFO - __main__ - Step 48469: {'lr': 0.00019894517372100304, 'samples': 1551008, 'steps': 3029, 'loss/train': 2.7669196128845215} -09/21/2021 00:59:11 - INFO - __main__ - Step 48470: {'lr': 0.00019894517372100304, 'samples': 1551040, 'steps': 3029, 'loss/train': 1.9596537351608276} -09/21/2021 00:59:11 - INFO - __main__ - Step 48471: {'lr': 0.00019894517372100304, 'samples': 1551072, 'steps': 3029, 'loss/train': 0.15221546590328217} -09/21/2021 00:59:12 - INFO - __main__ - Step 48472: {'lr': 0.00019894517372100304, 'samples': 1551104, 'steps': 3029, 'loss/train': 1.4313298463821411} -09/21/2021 00:59:13 - INFO - __main__ - Step 48473: {'lr': 0.00019894517372100304, 'samples': 1551136, 'steps': 3029, 'loss/train': 2.0547146797180176} -09/21/2021 00:59:14 - INFO - __main__ - Step 48474: {'lr': 0.00019894517372100304, 'samples': 1551168, 'steps': 3029, 'loss/train': 1.9593268632888794} -09/21/2021 00:59:15 - INFO - __main__ - Step 48475: {'lr': 0.00019894517372100304, 'samples': 1551200, 'steps': 3029, 'loss/train': 2.207981586456299} -09/21/2021 00:59:16 - INFO - __main__ - Step 48476: {'lr': 0.00019894517372100304, 'samples': 1551232, 'steps': 3029, 'loss/train': 2.654851198196411} -09/21/2021 00:59:17 - INFO - __main__ - Step 48477: {'lr': 0.00019894517372100304, 'samples': 1551264, 'steps': 3029, 'loss/train': 1.366787314414978} -09/21/2021 00:59:18 - INFO - __main__ - Step 48478: {'lr': 0.00019894517372100304, 'samples': 1551296, 'steps': 3029, 'loss/train': 2.1542437076568604} -09/21/2021 00:59:18 - INFO - __main__ - Step 48479: {'lr': 0.00019894517372100304, 'samples': 1551328, 'steps': 3029, 'loss/train': 2.3309953212738037} -09/21/2021 00:59:19 - INFO - __main__ - Step 48480: {'lr': 0.00019894517372100304, 'samples': 1551360, 'steps': 3029, 'loss/train': 1.5746694803237915} -09/21/2021 00:59:20 - INFO - __main__ - Step 48481: {'lr': 0.000198944249458336, 'samples': 1551392, 'steps': 3030, 'loss/train': 0.7381595969200134} -09/21/2021 00:59:21 - INFO - __main__ - Step 48482: {'lr': 0.000198944249458336, 'samples': 1551424, 'steps': 3030, 'loss/train': 0.15574029088020325} -09/21/2021 00:59:21 - INFO - __main__ - Step 48483: {'lr': 0.000198944249458336, 'samples': 1551456, 'steps': 3030, 'loss/train': 0.22372567653656006} -09/21/2021 00:59:22 - INFO - __main__ - Step 48484: {'lr': 0.000198944249458336, 'samples': 1551488, 'steps': 3030, 'loss/train': 0.1580425202846527} -09/21/2021 00:59:23 - INFO - __main__ - Step 48485: {'lr': 0.000198944249458336, 'samples': 1551520, 'steps': 3030, 'loss/train': 1.1128895282745361} -09/21/2021 00:59:24 - INFO - __main__ - Step 48486: {'lr': 0.000198944249458336, 'samples': 1551552, 'steps': 3030, 'loss/train': 2.692230463027954} -09/21/2021 00:59:24 - INFO - __main__ - Step 48487: {'lr': 0.000198944249458336, 'samples': 1551584, 'steps': 3030, 'loss/train': 2.011613607406616} -09/21/2021 00:59:25 - INFO - __main__ - Step 48488: {'lr': 0.000198944249458336, 'samples': 1551616, 'steps': 3030, 'loss/train': 2.1696865558624268} -09/21/2021 00:59:26 - INFO - __main__ - Step 48489: {'lr': 0.000198944249458336, 'samples': 1551648, 'steps': 3030, 'loss/train': 0.18723735213279724} -09/21/2021 00:59:27 - INFO - __main__ - Step 48490: {'lr': 0.000198944249458336, 'samples': 1551680, 'steps': 3030, 'loss/train': 1.5586730241775513} -09/21/2021 00:59:27 - INFO - __main__ - Step 48491: {'lr': 0.000198944249458336, 'samples': 1551712, 'steps': 3030, 'loss/train': 2.4651899337768555} -09/21/2021 00:59:28 - INFO - __main__ - Step 48492: {'lr': 0.000198944249458336, 'samples': 1551744, 'steps': 3030, 'loss/train': 2.020817279815674} -09/21/2021 00:59:29 - INFO - __main__ - Step 48493: {'lr': 0.000198944249458336, 'samples': 1551776, 'steps': 3030, 'loss/train': 2.3092448711395264} -09/21/2021 00:59:30 - INFO - __main__ - Step 48494: {'lr': 0.000198944249458336, 'samples': 1551808, 'steps': 3030, 'loss/train': 1.4935038089752197} -09/21/2021 00:59:30 - INFO - __main__ - Step 48495: {'lr': 0.000198944249458336, 'samples': 1551840, 'steps': 3030, 'loss/train': 2.962407350540161} -09/21/2021 00:59:31 - INFO - __main__ - Step 48496: {'lr': 0.000198944249458336, 'samples': 1551872, 'steps': 3030, 'loss/train': 2.1105704307556152} -09/21/2021 00:59:32 - INFO - __main__ - Step 48497: {'lr': 0.0001989433247930652, 'samples': 1551904, 'steps': 3031, 'loss/train': 0.3171529471874237} -09/21/2021 00:59:33 - INFO - __main__ - Step 48498: {'lr': 0.0001989433247930652, 'samples': 1551936, 'steps': 3031, 'loss/train': 2.0033881664276123} -09/21/2021 00:59:34 - INFO - __main__ - Step 48499: {'lr': 0.0001989433247930652, 'samples': 1551968, 'steps': 3031, 'loss/train': 1.670362949371338} -09/21/2021 00:59:34 - INFO - __main__ - Step 48500: {'lr': 0.0001989433247930652, 'samples': 1552000, 'steps': 3031, 'loss/train': 1.6944785118103027} -09/21/2021 00:59:35 - INFO - __main__ - Step 48501: {'lr': 0.0001989433247930652, 'samples': 1552032, 'steps': 3031, 'loss/train': 2.3753318786621094} -09/21/2021 00:59:36 - INFO - __main__ - Step 48502: {'lr': 0.0001989433247930652, 'samples': 1552064, 'steps': 3031, 'loss/train': 0.9661498665809631} -09/21/2021 00:59:37 - INFO - __main__ - Step 48503: {'lr': 0.0001989433247930652, 'samples': 1552096, 'steps': 3031, 'loss/train': 1.6339136362075806} -09/21/2021 00:59:37 - INFO - __main__ - Step 48504: {'lr': 0.0001989433247930652, 'samples': 1552128, 'steps': 3031, 'loss/train': 0.9005047082901001} -09/21/2021 00:59:38 - INFO - __main__ - Step 48505: {'lr': 0.0001989433247930652, 'samples': 1552160, 'steps': 3031, 'loss/train': 2.325873851776123} -09/21/2021 00:59:39 - INFO - __main__ - Step 48506: {'lr': 0.0001989433247930652, 'samples': 1552192, 'steps': 3031, 'loss/train': 2.3292489051818848} -09/21/2021 00:59:40 - INFO - __main__ - Step 48507: {'lr': 0.0001989433247930652, 'samples': 1552224, 'steps': 3031, 'loss/train': 2.4282045364379883} -09/21/2021 00:59:41 - INFO - __main__ - Step 48508: {'lr': 0.0001989433247930652, 'samples': 1552256, 'steps': 3031, 'loss/train': 2.6921486854553223} -09/21/2021 00:59:42 - INFO - __main__ - Step 48509: {'lr': 0.0001989433247930652, 'samples': 1552288, 'steps': 3031, 'loss/train': 1.4019140005111694} -09/21/2021 00:59:42 - INFO - __main__ - Step 48510: {'lr': 0.0001989433247930652, 'samples': 1552320, 'steps': 3031, 'loss/train': 1.652304768562317} -09/21/2021 00:59:43 - INFO - __main__ - Step 48511: {'lr': 0.0001989433247930652, 'samples': 1552352, 'steps': 3031, 'loss/train': 1.9575265645980835} -09/21/2021 00:59:44 - INFO - __main__ - Step 48512: {'lr': 0.0001989433247930652, 'samples': 1552384, 'steps': 3031, 'loss/train': 2.931790590286255} -09/21/2021 00:59:45 - INFO - __main__ - Step 48513: {'lr': 0.00019894239972519437, 'samples': 1552416, 'steps': 3032, 'loss/train': 1.752094030380249} -09/21/2021 00:59:46 - INFO - __main__ - Step 48514: {'lr': 0.00019894239972519437, 'samples': 1552448, 'steps': 3032, 'loss/train': 2.022880792617798} -09/21/2021 00:59:46 - INFO - __main__ - Step 48515: {'lr': 0.00019894239972519437, 'samples': 1552480, 'steps': 3032, 'loss/train': 2.3562538623809814} -09/21/2021 00:59:47 - INFO - __main__ - Step 48516: {'lr': 0.00019894239972519437, 'samples': 1552512, 'steps': 3032, 'loss/train': 2.1775362491607666} -09/21/2021 00:59:48 - INFO - __main__ - Step 48517: {'lr': 0.00019894239972519437, 'samples': 1552544, 'steps': 3032, 'loss/train': 2.5058257579803467} -09/21/2021 00:59:49 - INFO - __main__ - Step 48518: {'lr': 0.00019894239972519437, 'samples': 1552576, 'steps': 3032, 'loss/train': 1.437996745109558} -09/21/2021 00:59:49 - INFO - __main__ - Step 48519: {'lr': 0.00019894239972519437, 'samples': 1552608, 'steps': 3032, 'loss/train': 2.0504722595214844} -09/21/2021 00:59:50 - INFO - __main__ - Step 48520: {'lr': 0.00019894239972519437, 'samples': 1552640, 'steps': 3032, 'loss/train': 0.9236171841621399} -09/21/2021 00:59:51 - INFO - __main__ - Step 48521: {'lr': 0.00019894239972519437, 'samples': 1552672, 'steps': 3032, 'loss/train': 1.480849266052246} -09/21/2021 00:59:52 - INFO - __main__ - Step 48522: {'lr': 0.00019894239972519437, 'samples': 1552704, 'steps': 3032, 'loss/train': 1.2037795782089233} -09/21/2021 00:59:52 - INFO - __main__ - Step 48523: {'lr': 0.00019894239972519437, 'samples': 1552736, 'steps': 3032, 'loss/train': 1.9167572259902954} -09/21/2021 00:59:53 - INFO - __main__ - Step 48524: {'lr': 0.00019894239972519437, 'samples': 1552768, 'steps': 3032, 'loss/train': 1.8949155807495117} -09/21/2021 00:59:54 - INFO - __main__ - Step 48525: {'lr': 0.00019894239972519437, 'samples': 1552800, 'steps': 3032, 'loss/train': 2.0493907928466797} -09/21/2021 00:59:55 - INFO - __main__ - Step 48526: {'lr': 0.00019894239972519437, 'samples': 1552832, 'steps': 3032, 'loss/train': 1.5878194570541382} -09/21/2021 00:59:55 - INFO - __main__ - Step 48527: {'lr': 0.00019894239972519437, 'samples': 1552864, 'steps': 3032, 'loss/train': 1.8472479581832886} -09/21/2021 00:59:56 - INFO - __main__ - Step 48528: {'lr': 0.00019894239972519437, 'samples': 1552896, 'steps': 3032, 'loss/train': 1.4248363971710205} -09/21/2021 00:59:57 - INFO - __main__ - Step 48529: {'lr': 0.00019894147425472735, 'samples': 1552928, 'steps': 3033, 'loss/train': 1.873091459274292} -09/21/2021 00:59:58 - INFO - __main__ - Step 48530: {'lr': 0.00019894147425472735, 'samples': 1552960, 'steps': 3033, 'loss/train': 1.8448550701141357} -09/21/2021 00:59:58 - INFO - __main__ - Step 48531: {'lr': 0.00019894147425472735, 'samples': 1552992, 'steps': 3033, 'loss/train': 2.0527751445770264} -09/21/2021 00:59:59 - INFO - __main__ - Step 48532: {'lr': 0.00019894147425472735, 'samples': 1553024, 'steps': 3033, 'loss/train': 1.7948329448699951} -09/21/2021 01:00:00 - INFO - __main__ - Step 48533: {'lr': 0.00019894147425472735, 'samples': 1553056, 'steps': 3033, 'loss/train': 2.2147724628448486} -09/21/2021 01:00:01 - INFO - __main__ - Step 48534: {'lr': 0.00019894147425472735, 'samples': 1553088, 'steps': 3033, 'loss/train': 2.4072694778442383} -09/21/2021 01:00:01 - INFO - __main__ - Step 48535: {'lr': 0.00019894147425472735, 'samples': 1553120, 'steps': 3033, 'loss/train': 2.3933775424957275} -09/21/2021 01:00:03 - INFO - __main__ - Step 48536: {'lr': 0.00019894147425472735, 'samples': 1553152, 'steps': 3033, 'loss/train': 1.7444626092910767} -09/21/2021 01:00:03 - INFO - __main__ - Step 48537: {'lr': 0.00019894147425472735, 'samples': 1553184, 'steps': 3033, 'loss/train': 2.252714157104492} -09/21/2021 01:00:04 - INFO - __main__ - Step 48538: {'lr': 0.00019894147425472735, 'samples': 1553216, 'steps': 3033, 'loss/train': 1.7440522909164429} -09/21/2021 01:00:05 - INFO - __main__ - Step 48539: {'lr': 0.00019894147425472735, 'samples': 1553248, 'steps': 3033, 'loss/train': 2.196058988571167} -09/21/2021 01:00:06 - INFO - __main__ - Step 48540: {'lr': 0.00019894147425472735, 'samples': 1553280, 'steps': 3033, 'loss/train': 1.9431517124176025} -09/21/2021 01:00:06 - INFO - __main__ - Step 48541: {'lr': 0.00019894147425472735, 'samples': 1553312, 'steps': 3033, 'loss/train': 2.077641010284424} -09/21/2021 01:00:07 - INFO - __main__ - Step 48542: {'lr': 0.00019894147425472735, 'samples': 1553344, 'steps': 3033, 'loss/train': 2.420219898223877} -09/21/2021 01:00:08 - INFO - __main__ - Step 48543: {'lr': 0.00019894147425472735, 'samples': 1553376, 'steps': 3033, 'loss/train': 1.5861141681671143} -09/21/2021 01:00:09 - INFO - __main__ - Step 48544: {'lr': 0.00019894147425472735, 'samples': 1553408, 'steps': 3033, 'loss/train': 2.2249913215637207} -09/21/2021 01:00:10 - INFO - __main__ - Step 48545: {'lr': 0.00019894054838166784, 'samples': 1553440, 'steps': 3034, 'loss/train': 1.167159914970398} -09/21/2021 01:00:10 - INFO - __main__ - Step 48546: {'lr': 0.00019894054838166784, 'samples': 1553472, 'steps': 3034, 'loss/train': 1.0805355310440063} -09/21/2021 01:00:11 - INFO - __main__ - Step 48547: {'lr': 0.00019894054838166784, 'samples': 1553504, 'steps': 3034, 'loss/train': 1.6624219417572021} -09/21/2021 01:00:12 - INFO - __main__ - Step 48548: {'lr': 0.00019894054838166784, 'samples': 1553536, 'steps': 3034, 'loss/train': 1.5563560724258423} -09/21/2021 01:00:13 - INFO - __main__ - Step 48549: {'lr': 0.00019894054838166784, 'samples': 1553568, 'steps': 3034, 'loss/train': 2.7019541263580322} -09/21/2021 01:00:13 - INFO - __main__ - Step 48550: {'lr': 0.00019894054838166784, 'samples': 1553600, 'steps': 3034, 'loss/train': 1.8123363256454468} -09/21/2021 01:00:14 - INFO - __main__ - Step 48551: {'lr': 0.00019894054838166784, 'samples': 1553632, 'steps': 3034, 'loss/train': 1.8804035186767578} -09/21/2021 01:00:15 - INFO - __main__ - Step 48552: {'lr': 0.00019894054838166784, 'samples': 1553664, 'steps': 3034, 'loss/train': 2.4818973541259766} -09/21/2021 01:00:16 - INFO - __main__ - Step 48553: {'lr': 0.00019894054838166784, 'samples': 1553696, 'steps': 3034, 'loss/train': 1.1134036779403687} -09/21/2021 01:00:16 - INFO - __main__ - Step 48554: {'lr': 0.00019894054838166784, 'samples': 1553728, 'steps': 3034, 'loss/train': 1.7792407274246216} -09/21/2021 01:00:17 - INFO - __main__ - Step 48555: {'lr': 0.00019894054838166784, 'samples': 1553760, 'steps': 3034, 'loss/train': 2.479767084121704} -09/21/2021 01:00:18 - INFO - __main__ - Step 48556: {'lr': 0.00019894054838166784, 'samples': 1553792, 'steps': 3034, 'loss/train': 1.6679385900497437} -09/21/2021 01:00:19 - INFO - __main__ - Step 48557: {'lr': 0.00019894054838166784, 'samples': 1553824, 'steps': 3034, 'loss/train': 1.6140249967575073} -09/21/2021 01:00:19 - INFO - __main__ - Step 48558: {'lr': 0.00019894054838166784, 'samples': 1553856, 'steps': 3034, 'loss/train': 2.211857318878174} -09/21/2021 01:00:20 - INFO - __main__ - Step 48559: {'lr': 0.00019894054838166784, 'samples': 1553888, 'steps': 3034, 'loss/train': 1.285366415977478} -09/21/2021 01:00:21 - INFO - __main__ - Step 48560: {'lr': 0.00019894054838166784, 'samples': 1553920, 'steps': 3034, 'loss/train': 1.8189183473587036} -09/21/2021 01:00:22 - INFO - __main__ - Step 48561: {'lr': 0.00019893962210601959, 'samples': 1553952, 'steps': 3035, 'loss/train': 1.9490364789962769} -09/21/2021 01:00:22 - INFO - __main__ - Step 48562: {'lr': 0.00019893962210601959, 'samples': 1553984, 'steps': 3035, 'loss/train': 1.1591627597808838} -09/21/2021 01:00:23 - INFO - __main__ - Step 48563: {'lr': 0.00019893962210601959, 'samples': 1554016, 'steps': 3035, 'loss/train': 1.6322517395019531} -09/21/2021 01:00:24 - INFO - __main__ - Step 48564: {'lr': 0.00019893962210601959, 'samples': 1554048, 'steps': 3035, 'loss/train': 1.7413818836212158} -09/21/2021 01:00:25 - INFO - __main__ - Step 48565: {'lr': 0.00019893962210601959, 'samples': 1554080, 'steps': 3035, 'loss/train': 1.1154597997665405} -09/21/2021 01:00:25 - INFO - __main__ - Step 48566: {'lr': 0.00019893962210601959, 'samples': 1554112, 'steps': 3035, 'loss/train': 2.404027223587036} -09/21/2021 01:00:26 - INFO - __main__ - Step 48567: {'lr': 0.00019893962210601959, 'samples': 1554144, 'steps': 3035, 'loss/train': 1.882049798965454} -09/21/2021 01:00:28 - INFO - __main__ - Step 48568: {'lr': 0.00019893962210601959, 'samples': 1554176, 'steps': 3035, 'loss/train': 2.065519094467163} -09/21/2021 01:00:29 - INFO - __main__ - Step 48569: {'lr': 0.00019893962210601959, 'samples': 1554208, 'steps': 3035, 'loss/train': 2.408118963241577} -09/21/2021 01:00:29 - INFO - __main__ - Step 48570: {'lr': 0.00019893962210601959, 'samples': 1554240, 'steps': 3035, 'loss/train': 2.0323991775512695} -09/21/2021 01:00:30 - INFO - __main__ - Step 48571: {'lr': 0.00019893962210601959, 'samples': 1554272, 'steps': 3035, 'loss/train': 1.6828347444534302} -09/21/2021 01:00:31 - INFO - __main__ - Step 48572: {'lr': 0.00019893962210601959, 'samples': 1554304, 'steps': 3035, 'loss/train': 2.845942735671997} -09/21/2021 01:00:32 - INFO - __main__ - Step 48573: {'lr': 0.00019893962210601959, 'samples': 1554336, 'steps': 3035, 'loss/train': 2.039524793624878} -09/21/2021 01:00:32 - INFO - __main__ - Step 48574: {'lr': 0.00019893962210601959, 'samples': 1554368, 'steps': 3035, 'loss/train': 1.6376959085464478} -09/21/2021 01:00:33 - INFO - __main__ - Step 48575: {'lr': 0.00019893962210601959, 'samples': 1554400, 'steps': 3035, 'loss/train': 2.3461503982543945} -09/21/2021 01:00:34 - INFO - __main__ - Step 48576: {'lr': 0.00019893962210601959, 'samples': 1554432, 'steps': 3035, 'loss/train': 2.387542486190796} -09/21/2021 01:00:35 - INFO - __main__ - Step 48577: {'lr': 0.00019893869542778641, 'samples': 1554464, 'steps': 3036, 'loss/train': 2.584155321121216} -09/21/2021 01:00:35 - INFO - __main__ - Step 48578: {'lr': 0.00019893869542778641, 'samples': 1554496, 'steps': 3036, 'loss/train': 2.5999274253845215} -09/21/2021 01:00:36 - INFO - __main__ - Step 48579: {'lr': 0.00019893869542778641, 'samples': 1554528, 'steps': 3036, 'loss/train': 2.561964273452759} -09/21/2021 01:00:37 - INFO - __main__ - Step 48580: {'lr': 0.00019893869542778641, 'samples': 1554560, 'steps': 3036, 'loss/train': 2.5843396186828613} -09/21/2021 01:00:38 - INFO - __main__ - Step 48581: {'lr': 0.00019893869542778641, 'samples': 1554592, 'steps': 3036, 'loss/train': 1.9008947610855103} -09/21/2021 01:00:38 - INFO - __main__ - Step 48582: {'lr': 0.00019893869542778641, 'samples': 1554624, 'steps': 3036, 'loss/train': 2.5328750610351562} -09/21/2021 01:00:39 - INFO - __main__ - Step 48583: {'lr': 0.00019893869542778641, 'samples': 1554656, 'steps': 3036, 'loss/train': 2.464214563369751} -09/21/2021 01:00:40 - INFO - __main__ - Step 48584: {'lr': 0.00019893869542778641, 'samples': 1554688, 'steps': 3036, 'loss/train': 0.21363866329193115} -09/21/2021 01:00:41 - INFO - __main__ - Step 48585: {'lr': 0.00019893869542778641, 'samples': 1554720, 'steps': 3036, 'loss/train': 0.5169707536697388} -09/21/2021 01:00:41 - INFO - __main__ - Step 48586: {'lr': 0.00019893869542778641, 'samples': 1554752, 'steps': 3036, 'loss/train': 0.5401352643966675} -09/21/2021 01:00:42 - INFO - __main__ - Step 48587: {'lr': 0.00019893869542778641, 'samples': 1554784, 'steps': 3036, 'loss/train': 0.44846564531326294} -09/21/2021 01:00:43 - INFO - __main__ - Step 48588: {'lr': 0.00019893869542778641, 'samples': 1554816, 'steps': 3036, 'loss/train': 0.37262052297592163} -09/21/2021 01:00:44 - INFO - __main__ - Step 48589: {'lr': 0.00019893869542778641, 'samples': 1554848, 'steps': 3036, 'loss/train': 2.018113136291504} -09/21/2021 01:00:44 - INFO - __main__ - Step 48590: {'lr': 0.00019893869542778641, 'samples': 1554880, 'steps': 3036, 'loss/train': 1.4417548179626465} -09/21/2021 01:00:45 - INFO - __main__ - Step 48591: {'lr': 0.00019893869542778641, 'samples': 1554912, 'steps': 3036, 'loss/train': 2.3021984100341797} -09/21/2021 01:00:46 - INFO - __main__ - Step 48592: {'lr': 0.00019893869542778641, 'samples': 1554944, 'steps': 3036, 'loss/train': 2.4809045791625977} -09/21/2021 01:00:47 - INFO - __main__ - Step 48593: {'lr': 0.0001989377683469721, 'samples': 1554976, 'steps': 3037, 'loss/train': 1.2545745372772217} -09/21/2021 01:00:48 - INFO - __main__ - Step 48594: {'lr': 0.0001989377683469721, 'samples': 1555008, 'steps': 3037, 'loss/train': 1.894775152206421} -09/21/2021 01:00:48 - INFO - __main__ - Step 48595: {'lr': 0.0001989377683469721, 'samples': 1555040, 'steps': 3037, 'loss/train': 1.9113290309906006} -09/21/2021 01:00:49 - INFO - __main__ - Step 48596: {'lr': 0.0001989377683469721, 'samples': 1555072, 'steps': 3037, 'loss/train': 2.0724241733551025} -09/21/2021 01:00:50 - INFO - __main__ - Step 48597: {'lr': 0.0001989377683469721, 'samples': 1555104, 'steps': 3037, 'loss/train': 2.0462450981140137} -09/21/2021 01:00:51 - INFO - __main__ - Step 48598: {'lr': 0.0001989377683469721, 'samples': 1555136, 'steps': 3037, 'loss/train': 0.40150028467178345} -09/21/2021 01:00:51 - INFO - __main__ - Step 48599: {'lr': 0.0001989377683469721, 'samples': 1555168, 'steps': 3037, 'loss/train': 2.141383171081543} -09/21/2021 01:00:52 - INFO - __main__ - Step 48600: {'lr': 0.0001989377683469721, 'samples': 1555200, 'steps': 3037, 'loss/train': 2.5275356769561768} -09/21/2021 01:00:53 - INFO - __main__ - Step 48601: {'lr': 0.0001989377683469721, 'samples': 1555232, 'steps': 3037, 'loss/train': 1.5030555725097656} -09/21/2021 01:00:54 - INFO - __main__ - Step 48602: {'lr': 0.0001989377683469721, 'samples': 1555264, 'steps': 3037, 'loss/train': 2.2892568111419678} -09/21/2021 01:00:54 - INFO - __main__ - Step 48603: {'lr': 0.0001989377683469721, 'samples': 1555296, 'steps': 3037, 'loss/train': 1.162206768989563} -09/21/2021 01:00:56 - INFO - __main__ - Step 48604: {'lr': 0.0001989377683469721, 'samples': 1555328, 'steps': 3037, 'loss/train': 1.7689040899276733} -09/21/2021 01:00:56 - INFO - __main__ - Step 48605: {'lr': 0.0001989377683469721, 'samples': 1555360, 'steps': 3037, 'loss/train': 1.1291751861572266} -09/21/2021 01:00:57 - INFO - __main__ - Step 48606: {'lr': 0.0001989377683469721, 'samples': 1555392, 'steps': 3037, 'loss/train': 1.9658225774765015} -09/21/2021 01:00:58 - INFO - __main__ - Step 48607: {'lr': 0.0001989377683469721, 'samples': 1555424, 'steps': 3037, 'loss/train': 1.841536283493042} -09/21/2021 01:00:59 - INFO - __main__ - Step 48608: {'lr': 0.0001989377683469721, 'samples': 1555456, 'steps': 3037, 'loss/train': 2.870750904083252} -09/21/2021 01:00:59 - INFO - __main__ - Step 48609: {'lr': 0.00019893684086358035, 'samples': 1555488, 'steps': 3038, 'loss/train': 1.5401068925857544} -09/21/2021 01:01:00 - INFO - __main__ - Step 48610: {'lr': 0.00019893684086358035, 'samples': 1555520, 'steps': 3038, 'loss/train': 2.5353291034698486} -09/21/2021 01:01:01 - INFO - __main__ - Step 48611: {'lr': 0.00019893684086358035, 'samples': 1555552, 'steps': 3038, 'loss/train': 1.897597074508667} -09/21/2021 01:01:02 - INFO - __main__ - Step 48612: {'lr': 0.00019893684086358035, 'samples': 1555584, 'steps': 3038, 'loss/train': 1.792630910873413} -09/21/2021 01:01:02 - INFO - __main__ - Step 48613: {'lr': 0.00019893684086358035, 'samples': 1555616, 'steps': 3038, 'loss/train': 1.9454365968704224} -09/21/2021 01:01:03 - INFO - __main__ - Step 48614: {'lr': 0.00019893684086358035, 'samples': 1555648, 'steps': 3038, 'loss/train': 1.975321650505066} -09/21/2021 01:01:04 - INFO - __main__ - Step 48615: {'lr': 0.00019893684086358035, 'samples': 1555680, 'steps': 3038, 'loss/train': 1.9900977611541748} -09/21/2021 01:01:05 - INFO - __main__ - Step 48616: {'lr': 0.00019893684086358035, 'samples': 1555712, 'steps': 3038, 'loss/train': 2.968933343887329} -09/21/2021 01:01:05 - INFO - __main__ - Step 48617: {'lr': 0.00019893684086358035, 'samples': 1555744, 'steps': 3038, 'loss/train': 1.9010303020477295} -09/21/2021 01:01:06 - INFO - __main__ - Step 48618: {'lr': 0.00019893684086358035, 'samples': 1555776, 'steps': 3038, 'loss/train': 0.2652278244495392} -09/21/2021 01:01:07 - INFO - __main__ - Step 48619: {'lr': 0.00019893684086358035, 'samples': 1555808, 'steps': 3038, 'loss/train': 2.6177878379821777} -09/21/2021 01:01:08 - INFO - __main__ - Step 48620: {'lr': 0.00019893684086358035, 'samples': 1555840, 'steps': 3038, 'loss/train': 2.1273958683013916} -09/21/2021 01:01:08 - INFO - __main__ - Step 48621: {'lr': 0.00019893684086358035, 'samples': 1555872, 'steps': 3038, 'loss/train': 0.8767625689506531} -09/21/2021 01:01:09 - INFO - __main__ - Step 48622: {'lr': 0.00019893684086358035, 'samples': 1555904, 'steps': 3038, 'loss/train': 2.2041447162628174} -09/21/2021 01:01:10 - INFO - __main__ - Step 48623: {'lr': 0.00019893684086358035, 'samples': 1555936, 'steps': 3038, 'loss/train': 1.7259721755981445} -09/21/2021 01:01:11 - INFO - __main__ - Step 48624: {'lr': 0.00019893684086358035, 'samples': 1555968, 'steps': 3038, 'loss/train': 2.1887362003326416} -09/21/2021 01:01:12 - INFO - __main__ - Step 48625: {'lr': 0.000198935912977615, 'samples': 1556000, 'steps': 3039, 'loss/train': 2.651552677154541} -09/21/2021 01:01:12 - INFO - __main__ - Step 48626: {'lr': 0.000198935912977615, 'samples': 1556032, 'steps': 3039, 'loss/train': 1.1606398820877075} -09/21/2021 01:01:13 - INFO - __main__ - Step 48627: {'lr': 0.000198935912977615, 'samples': 1556064, 'steps': 3039, 'loss/train': 2.102973222732544} -09/21/2021 01:01:14 - INFO - __main__ - Step 48628: {'lr': 0.000198935912977615, 'samples': 1556096, 'steps': 3039, 'loss/train': 2.4369466304779053} -09/21/2021 01:01:15 - INFO - __main__ - Step 48629: {'lr': 0.000198935912977615, 'samples': 1556128, 'steps': 3039, 'loss/train': 0.6424685120582581} -09/21/2021 01:01:15 - INFO - __main__ - Step 48630: {'lr': 0.000198935912977615, 'samples': 1556160, 'steps': 3039, 'loss/train': 1.145905613899231} -09/21/2021 01:01:16 - INFO - __main__ - Step 48631: {'lr': 0.000198935912977615, 'samples': 1556192, 'steps': 3039, 'loss/train': 2.3071837425231934} -09/21/2021 01:01:17 - INFO - __main__ - Step 48632: {'lr': 0.000198935912977615, 'samples': 1556224, 'steps': 3039, 'loss/train': 2.5816903114318848} -09/21/2021 01:01:18 - INFO - __main__ - Step 48633: {'lr': 0.000198935912977615, 'samples': 1556256, 'steps': 3039, 'loss/train': 1.0793014764785767} -09/21/2021 01:01:18 - INFO - __main__ - Step 48634: {'lr': 0.000198935912977615, 'samples': 1556288, 'steps': 3039, 'loss/train': 1.9646456241607666} -09/21/2021 01:01:19 - INFO - __main__ - Step 48635: {'lr': 0.000198935912977615, 'samples': 1556320, 'steps': 3039, 'loss/train': 2.1269121170043945} -09/21/2021 01:01:20 - INFO - __main__ - Step 48636: {'lr': 0.000198935912977615, 'samples': 1556352, 'steps': 3039, 'loss/train': 0.5349811315536499} -09/21/2021 01:01:21 - INFO - __main__ - Step 48637: {'lr': 0.000198935912977615, 'samples': 1556384, 'steps': 3039, 'loss/train': 1.549668312072754} -09/21/2021 01:01:22 - INFO - __main__ - Step 48638: {'lr': 0.000198935912977615, 'samples': 1556416, 'steps': 3039, 'loss/train': 1.8441355228424072} -09/21/2021 01:01:23 - INFO - __main__ - Step 48639: {'lr': 0.000198935912977615, 'samples': 1556448, 'steps': 3039, 'loss/train': 1.5451810359954834} -09/21/2021 01:01:23 - INFO - __main__ - Step 48640: {'lr': 0.000198935912977615, 'samples': 1556480, 'steps': 3039, 'loss/train': 2.144073486328125} -09/21/2021 01:01:24 - INFO - __main__ - Step 48641: {'lr': 0.00019893498468907982, 'samples': 1556512, 'steps': 3040, 'loss/train': 2.005173444747925} -09/21/2021 01:01:25 - INFO - __main__ - Step 48642: {'lr': 0.00019893498468907982, 'samples': 1556544, 'steps': 3040, 'loss/train': 2.0644192695617676} -09/21/2021 01:01:26 - INFO - __main__ - Step 48643: {'lr': 0.00019893498468907982, 'samples': 1556576, 'steps': 3040, 'loss/train': 2.71623158454895} -09/21/2021 01:01:27 - INFO - __main__ - Step 48644: {'lr': 0.00019893498468907982, 'samples': 1556608, 'steps': 3040, 'loss/train': 2.0808463096618652} -09/21/2021 01:01:27 - INFO - __main__ - Step 48645: {'lr': 0.00019893498468907982, 'samples': 1556640, 'steps': 3040, 'loss/train': 2.8384292125701904} -09/21/2021 01:01:28 - INFO - __main__ - Step 48646: {'lr': 0.00019893498468907982, 'samples': 1556672, 'steps': 3040, 'loss/train': 2.921929121017456} -09/21/2021 01:01:29 - INFO - __main__ - Step 48647: {'lr': 0.00019893498468907982, 'samples': 1556704, 'steps': 3040, 'loss/train': 2.3344883918762207} -09/21/2021 01:01:30 - INFO - __main__ - Step 48648: {'lr': 0.00019893498468907982, 'samples': 1556736, 'steps': 3040, 'loss/train': 2.0513646602630615} -09/21/2021 01:01:30 - INFO - __main__ - Step 48649: {'lr': 0.00019893498468907982, 'samples': 1556768, 'steps': 3040, 'loss/train': 6.73105525970459} -09/21/2021 01:01:31 - INFO - __main__ - Step 48650: {'lr': 0.00019893498468907982, 'samples': 1556800, 'steps': 3040, 'loss/train': 6.543516159057617} -09/21/2021 01:01:32 - INFO - __main__ - Step 48651: {'lr': 0.00019893498468907982, 'samples': 1556832, 'steps': 3040, 'loss/train': 2.3225927352905273} -09/21/2021 01:01:33 - INFO - __main__ - Step 48652: {'lr': 0.00019893498468907982, 'samples': 1556864, 'steps': 3040, 'loss/train': 2.0917394161224365} -09/21/2021 01:01:33 - INFO - __main__ - Step 48653: {'lr': 0.00019893498468907982, 'samples': 1556896, 'steps': 3040, 'loss/train': 1.5052809715270996} -09/21/2021 01:01:34 - INFO - __main__ - Step 48654: {'lr': 0.00019893498468907982, 'samples': 1556928, 'steps': 3040, 'loss/train': 1.846877932548523} -09/21/2021 01:01:35 - INFO - __main__ - Step 48655: {'lr': 0.00019893498468907982, 'samples': 1556960, 'steps': 3040, 'loss/train': 1.4563788175582886} -09/21/2021 01:01:36 - INFO - __main__ - Step 48656: {'lr': 0.00019893498468907982, 'samples': 1556992, 'steps': 3040, 'loss/train': 2.4952585697174072} -09/21/2021 01:01:36 - INFO - __main__ - Step 48657: {'lr': 0.00019893405599797853, 'samples': 1557024, 'steps': 3041, 'loss/train': 1.8948081731796265} -09/21/2021 01:01:37 - INFO - __main__ - Step 48658: {'lr': 0.00019893405599797853, 'samples': 1557056, 'steps': 3041, 'loss/train': 2.8673927783966064} -09/21/2021 01:01:38 - INFO - __main__ - Step 48659: {'lr': 0.00019893405599797853, 'samples': 1557088, 'steps': 3041, 'loss/train': 1.9249191284179688} -09/21/2021 01:01:39 - INFO - __main__ - Step 48660: {'lr': 0.00019893405599797853, 'samples': 1557120, 'steps': 3041, 'loss/train': 1.92599356174469} -09/21/2021 01:01:39 - INFO - __main__ - Step 48661: {'lr': 0.00019893405599797853, 'samples': 1557152, 'steps': 3041, 'loss/train': 1.9131885766983032} -09/21/2021 01:01:40 - INFO - __main__ - Step 48662: {'lr': 0.00019893405599797853, 'samples': 1557184, 'steps': 3041, 'loss/train': 1.746200680732727} -09/21/2021 01:01:41 - INFO - __main__ - Step 48663: {'lr': 0.00019893405599797853, 'samples': 1557216, 'steps': 3041, 'loss/train': 2.3539884090423584} -09/21/2021 01:01:42 - INFO - __main__ - Step 48664: {'lr': 0.00019893405599797853, 'samples': 1557248, 'steps': 3041, 'loss/train': 1.1640704870224} -09/21/2021 01:01:42 - INFO - __main__ - Step 48665: {'lr': 0.00019893405599797853, 'samples': 1557280, 'steps': 3041, 'loss/train': 2.4965243339538574} -09/21/2021 01:01:43 - INFO - __main__ - Step 48666: {'lr': 0.00019893405599797853, 'samples': 1557312, 'steps': 3041, 'loss/train': 1.8368167877197266} -09/21/2021 01:01:45 - INFO - __main__ - Step 48667: {'lr': 0.00019893405599797853, 'samples': 1557344, 'steps': 3041, 'loss/train': 1.2217813730239868} -09/21/2021 01:01:45 - INFO - __main__ - Step 48668: {'lr': 0.00019893405599797853, 'samples': 1557376, 'steps': 3041, 'loss/train': 2.1615583896636963} -09/21/2021 01:01:46 - INFO - __main__ - Step 48669: {'lr': 0.00019893405599797853, 'samples': 1557408, 'steps': 3041, 'loss/train': 1.5140981674194336} -09/21/2021 01:01:47 - INFO - __main__ - Step 48670: {'lr': 0.00019893405599797853, 'samples': 1557440, 'steps': 3041, 'loss/train': 3.36679744720459} -09/21/2021 01:01:48 - INFO - __main__ - Step 48671: {'lr': 0.00019893405599797853, 'samples': 1557472, 'steps': 3041, 'loss/train': 3.3945248126983643} -09/21/2021 01:01:48 - INFO - __main__ - Step 48672: {'lr': 0.00019893405599797853, 'samples': 1557504, 'steps': 3041, 'loss/train': 3.908125400543213} -09/21/2021 01:01:49 - INFO - __main__ - Step 48673: {'lr': 0.00019893312690431498, 'samples': 1557536, 'steps': 3042, 'loss/train': 0.9720869064331055} -09/21/2021 01:01:50 - INFO - __main__ - Step 48674: {'lr': 0.00019893312690431498, 'samples': 1557568, 'steps': 3042, 'loss/train': 2.491391658782959} -09/21/2021 01:01:51 - INFO - __main__ - Step 48675: {'lr': 0.00019893312690431498, 'samples': 1557600, 'steps': 3042, 'loss/train': 2.366501808166504} -09/21/2021 01:01:51 - INFO - __main__ - Step 48676: {'lr': 0.00019893312690431498, 'samples': 1557632, 'steps': 3042, 'loss/train': 1.6670429706573486} -09/21/2021 01:01:52 - INFO - __main__ - Step 48677: {'lr': 0.00019893312690431498, 'samples': 1557664, 'steps': 3042, 'loss/train': 2.1633830070495605} -09/21/2021 01:01:53 - INFO - __main__ - Step 48678: {'lr': 0.00019893312690431498, 'samples': 1557696, 'steps': 3042, 'loss/train': 2.1109163761138916} -09/21/2021 01:01:54 - INFO - __main__ - Step 48679: {'lr': 0.00019893312690431498, 'samples': 1557728, 'steps': 3042, 'loss/train': 2.1319358348846436} -09/21/2021 01:01:54 - INFO - __main__ - Step 48680: {'lr': 0.00019893312690431498, 'samples': 1557760, 'steps': 3042, 'loss/train': 2.455261468887329} -09/21/2021 01:01:55 - INFO - __main__ - Step 48681: {'lr': 0.00019893312690431498, 'samples': 1557792, 'steps': 3042, 'loss/train': 1.6882332563400269} -09/21/2021 01:01:56 - INFO - __main__ - Step 48682: {'lr': 0.00019893312690431498, 'samples': 1557824, 'steps': 3042, 'loss/train': 2.1333091259002686} -09/21/2021 01:01:57 - INFO - __main__ - Step 48683: {'lr': 0.00019893312690431498, 'samples': 1557856, 'steps': 3042, 'loss/train': 2.5688185691833496} -09/21/2021 01:01:57 - INFO - __main__ - Step 48684: {'lr': 0.00019893312690431498, 'samples': 1557888, 'steps': 3042, 'loss/train': 0.754177451133728} -09/21/2021 01:01:58 - INFO - __main__ - Step 48685: {'lr': 0.00019893312690431498, 'samples': 1557920, 'steps': 3042, 'loss/train': 2.2623989582061768} -09/21/2021 01:01:59 - INFO - __main__ - Step 48686: {'lr': 0.00019893312690431498, 'samples': 1557952, 'steps': 3042, 'loss/train': 1.1903252601623535} -09/21/2021 01:02:00 - INFO - __main__ - Step 48687: {'lr': 0.00019893312690431498, 'samples': 1557984, 'steps': 3042, 'loss/train': 2.085639476776123} -09/21/2021 01:02:00 - INFO - __main__ - Step 48688: {'lr': 0.00019893312690431498, 'samples': 1558016, 'steps': 3042, 'loss/train': 2.8511877059936523} -09/21/2021 01:02:01 - INFO - __main__ - Step 48689: {'lr': 0.00019893219740809294, 'samples': 1558048, 'steps': 3043, 'loss/train': 1.8600928783416748} -09/21/2021 01:02:02 - INFO - __main__ - Step 48690: {'lr': 0.00019893219740809294, 'samples': 1558080, 'steps': 3043, 'loss/train': 2.01574444770813} -09/21/2021 01:02:03 - INFO - __main__ - Step 48691: {'lr': 0.00019893219740809294, 'samples': 1558112, 'steps': 3043, 'loss/train': 4.273563861846924} -09/21/2021 01:02:04 - INFO - __main__ - Step 48692: {'lr': 0.00019893219740809294, 'samples': 1558144, 'steps': 3043, 'loss/train': 2.0528597831726074} -09/21/2021 01:02:04 - INFO - __main__ - Step 48693: {'lr': 0.00019893219740809294, 'samples': 1558176, 'steps': 3043, 'loss/train': 2.0559587478637695} -09/21/2021 01:02:05 - INFO - __main__ - Step 48694: {'lr': 0.00019893219740809294, 'samples': 1558208, 'steps': 3043, 'loss/train': 1.9421014785766602} -09/21/2021 01:02:06 - INFO - __main__ - Step 48695: {'lr': 0.00019893219740809294, 'samples': 1558240, 'steps': 3043, 'loss/train': 1.9244853258132935} -09/21/2021 01:02:07 - INFO - __main__ - Step 48696: {'lr': 0.00019893219740809294, 'samples': 1558272, 'steps': 3043, 'loss/train': 2.7511351108551025} -09/21/2021 01:02:07 - INFO - __main__ - Step 48697: {'lr': 0.00019893219740809294, 'samples': 1558304, 'steps': 3043, 'loss/train': 2.1058924198150635} -09/21/2021 01:02:08 - INFO - __main__ - Step 48698: {'lr': 0.00019893219740809294, 'samples': 1558336, 'steps': 3043, 'loss/train': 2.0751793384552} -09/21/2021 01:02:10 - INFO - __main__ - Step 48699: {'lr': 0.00019893219740809294, 'samples': 1558368, 'steps': 3043, 'loss/train': 2.0239226818084717} -09/21/2021 01:02:10 - INFO - __main__ - Step 48700: {'lr': 0.00019893219740809294, 'samples': 1558400, 'steps': 3043, 'loss/train': 0.9836754202842712} -09/21/2021 01:02:11 - INFO - __main__ - Step 48701: {'lr': 0.00019893219740809294, 'samples': 1558432, 'steps': 3043, 'loss/train': 2.70293927192688} -09/21/2021 01:02:12 - INFO - __main__ - Step 48702: {'lr': 0.00019893219740809294, 'samples': 1558464, 'steps': 3043, 'loss/train': 1.0569523572921753} -09/21/2021 01:02:13 - INFO - __main__ - Step 48703: {'lr': 0.00019893219740809294, 'samples': 1558496, 'steps': 3043, 'loss/train': 1.835891842842102} -09/21/2021 01:02:13 - INFO - __main__ - Step 48704: {'lr': 0.00019893219740809294, 'samples': 1558528, 'steps': 3043, 'loss/train': 1.6794127225875854} -09/21/2021 01:02:14 - INFO - __main__ - Step 48705: {'lr': 0.00019893126750931611, 'samples': 1558560, 'steps': 3044, 'loss/train': 2.7132742404937744} -09/21/2021 01:02:15 - INFO - __main__ - Step 48706: {'lr': 0.00019893126750931611, 'samples': 1558592, 'steps': 3044, 'loss/train': 2.0645315647125244} -09/21/2021 01:02:16 - INFO - __main__ - Step 48707: {'lr': 0.00019893126750931611, 'samples': 1558624, 'steps': 3044, 'loss/train': 2.1049139499664307} -09/21/2021 01:02:16 - INFO - __main__ - Step 48708: {'lr': 0.00019893126750931611, 'samples': 1558656, 'steps': 3044, 'loss/train': 2.5637502670288086} -09/21/2021 01:02:17 - INFO - __main__ - Step 48709: {'lr': 0.00019893126750931611, 'samples': 1558688, 'steps': 3044, 'loss/train': 1.2747604846954346} -09/21/2021 01:02:18 - INFO - __main__ - Step 48710: {'lr': 0.00019893126750931611, 'samples': 1558720, 'steps': 3044, 'loss/train': 2.3752083778381348} -09/21/2021 01:02:19 - INFO - __main__ - Step 48711: {'lr': 0.00019893126750931611, 'samples': 1558752, 'steps': 3044, 'loss/train': 2.5343973636627197} -09/21/2021 01:02:19 - INFO - __main__ - Step 48712: {'lr': 0.00019893126750931611, 'samples': 1558784, 'steps': 3044, 'loss/train': 1.3230654001235962} -09/21/2021 01:02:20 - INFO - __main__ - Step 48713: {'lr': 0.00019893126750931611, 'samples': 1558816, 'steps': 3044, 'loss/train': 2.1315433979034424} -09/21/2021 01:02:21 - INFO - __main__ - Step 48714: {'lr': 0.00019893126750931611, 'samples': 1558848, 'steps': 3044, 'loss/train': 1.541298508644104} -09/21/2021 01:02:22 - INFO - __main__ - Step 48715: {'lr': 0.00019893126750931611, 'samples': 1558880, 'steps': 3044, 'loss/train': 1.7149629592895508} -09/21/2021 01:02:22 - INFO - __main__ - Step 48716: {'lr': 0.00019893126750931611, 'samples': 1558912, 'steps': 3044, 'loss/train': 1.7911713123321533} -09/21/2021 01:02:23 - INFO - __main__ - Step 48717: {'lr': 0.00019893126750931611, 'samples': 1558944, 'steps': 3044, 'loss/train': 1.3982048034667969} -09/21/2021 01:02:24 - INFO - __main__ - Step 48718: {'lr': 0.00019893126750931611, 'samples': 1558976, 'steps': 3044, 'loss/train': 3.007437229156494} -09/21/2021 01:02:25 - INFO - __main__ - Step 48719: {'lr': 0.00019893126750931611, 'samples': 1559008, 'steps': 3044, 'loss/train': 3.015185594558716} -09/21/2021 01:02:25 - INFO - __main__ - Step 48720: {'lr': 0.00019893126750931611, 'samples': 1559040, 'steps': 3044, 'loss/train': 2.140284538269043} -09/21/2021 01:02:26 - INFO - __main__ - Step 48721: {'lr': 0.0001989303372079884, 'samples': 1559072, 'steps': 3045, 'loss/train': 2.0133161544799805} -09/21/2021 01:02:27 - INFO - __main__ - Step 48722: {'lr': 0.0001989303372079884, 'samples': 1559104, 'steps': 3045, 'loss/train': 2.361029863357544} -09/21/2021 01:02:28 - INFO - __main__ - Step 48723: {'lr': 0.0001989303372079884, 'samples': 1559136, 'steps': 3045, 'loss/train': 1.5048191547393799} -09/21/2021 01:02:29 - INFO - __main__ - Step 48724: {'lr': 0.0001989303372079884, 'samples': 1559168, 'steps': 3045, 'loss/train': 2.1240334510803223} -09/21/2021 01:02:29 - INFO - __main__ - Step 48725: {'lr': 0.0001989303372079884, 'samples': 1559200, 'steps': 3045, 'loss/train': 2.0467214584350586} -09/21/2021 01:02:30 - INFO - __main__ - Step 48726: {'lr': 0.0001989303372079884, 'samples': 1559232, 'steps': 3045, 'loss/train': 1.6569348573684692} -09/21/2021 01:02:31 - INFO - __main__ - Step 48727: {'lr': 0.0001989303372079884, 'samples': 1559264, 'steps': 3045, 'loss/train': 2.241140127182007} -09/21/2021 01:02:32 - INFO - __main__ - Step 48728: {'lr': 0.0001989303372079884, 'samples': 1559296, 'steps': 3045, 'loss/train': 2.270930767059326} -09/21/2021 01:02:33 - INFO - __main__ - Step 48729: {'lr': 0.0001989303372079884, 'samples': 1559328, 'steps': 3045, 'loss/train': 2.1728851795196533} -09/21/2021 01:02:34 - INFO - __main__ - Step 48730: {'lr': 0.0001989303372079884, 'samples': 1559360, 'steps': 3045, 'loss/train': 1.424780249595642} -09/21/2021 01:02:34 - INFO - __main__ - Step 48731: {'lr': 0.0001989303372079884, 'samples': 1559392, 'steps': 3045, 'loss/train': 1.5490343570709229} -09/21/2021 01:02:35 - INFO - __main__ - Step 48732: {'lr': 0.0001989303372079884, 'samples': 1559424, 'steps': 3045, 'loss/train': 2.4459400177001953} -09/21/2021 01:02:36 - INFO - __main__ - Step 48733: {'lr': 0.0001989303372079884, 'samples': 1559456, 'steps': 3045, 'loss/train': 2.0111324787139893} -09/21/2021 01:02:37 - INFO - __main__ - Step 48734: {'lr': 0.0001989303372079884, 'samples': 1559488, 'steps': 3045, 'loss/train': 2.6944847106933594} -09/21/2021 01:02:37 - INFO - __main__ - Step 48735: {'lr': 0.0001989303372079884, 'samples': 1559520, 'steps': 3045, 'loss/train': 2.1938247680664062} -09/21/2021 01:02:38 - INFO - __main__ - Step 48736: {'lr': 0.0001989303372079884, 'samples': 1559552, 'steps': 3045, 'loss/train': 1.6596794128417969} -09/21/2021 01:02:39 - INFO - __main__ - Step 48737: {'lr': 0.0001989294065041135, 'samples': 1559584, 'steps': 3046, 'loss/train': 1.3265749216079712} -09/21/2021 01:02:40 - INFO - __main__ - Step 48738: {'lr': 0.0001989294065041135, 'samples': 1559616, 'steps': 3046, 'loss/train': 1.529876470565796} -09/21/2021 01:02:41 - INFO - __main__ - Step 48739: {'lr': 0.0001989294065041135, 'samples': 1559648, 'steps': 3046, 'loss/train': 1.880266785621643} -09/21/2021 01:02:41 - INFO - __main__ - Step 48740: {'lr': 0.0001989294065041135, 'samples': 1559680, 'steps': 3046, 'loss/train': 0.9158751964569092} -09/21/2021 01:02:42 - INFO - __main__ - Step 48741: {'lr': 0.0001989294065041135, 'samples': 1559712, 'steps': 3046, 'loss/train': 1.5760513544082642} -09/21/2021 01:02:43 - INFO - __main__ - Step 48742: {'lr': 0.0001989294065041135, 'samples': 1559744, 'steps': 3046, 'loss/train': 2.7920002937316895} -09/21/2021 01:02:44 - INFO - __main__ - Step 48743: {'lr': 0.0001989294065041135, 'samples': 1559776, 'steps': 3046, 'loss/train': 1.5351756811141968} -09/21/2021 01:02:44 - INFO - __main__ - Step 48744: {'lr': 0.0001989294065041135, 'samples': 1559808, 'steps': 3046, 'loss/train': 1.692601203918457} -09/21/2021 01:02:45 - INFO - __main__ - Step 48745: {'lr': 0.0001989294065041135, 'samples': 1559840, 'steps': 3046, 'loss/train': 2.1738667488098145} -09/21/2021 01:02:46 - INFO - __main__ - Step 48746: {'lr': 0.0001989294065041135, 'samples': 1559872, 'steps': 3046, 'loss/train': 2.13238525390625} -09/21/2021 01:02:47 - INFO - __main__ - Step 48747: {'lr': 0.0001989294065041135, 'samples': 1559904, 'steps': 3046, 'loss/train': 0.9778468012809753} -09/21/2021 01:02:47 - INFO - __main__ - Step 48748: {'lr': 0.0001989294065041135, 'samples': 1559936, 'steps': 3046, 'loss/train': 2.6572155952453613} -09/21/2021 01:02:48 - INFO - __main__ - Step 48749: {'lr': 0.0001989294065041135, 'samples': 1559968, 'steps': 3046, 'loss/train': 1.9222711324691772} -09/21/2021 01:02:49 - INFO - __main__ - Step 48750: {'lr': 0.0001989294065041135, 'samples': 1560000, 'steps': 3046, 'loss/train': 2.1776978969573975} -09/21/2021 01:02:50 - INFO - __main__ - Step 48751: {'lr': 0.0001989294065041135, 'samples': 1560032, 'steps': 3046, 'loss/train': 0.12898468971252441} -09/21/2021 01:02:50 - INFO - __main__ - Step 48752: {'lr': 0.0001989294065041135, 'samples': 1560064, 'steps': 3046, 'loss/train': 2.6326985359191895} -09/21/2021 01:02:51 - INFO - __main__ - Step 48753: {'lr': 0.0001989284753976952, 'samples': 1560096, 'steps': 3047, 'loss/train': 2.292509078979492} -09/21/2021 01:02:52 - INFO - __main__ - Step 48754: {'lr': 0.0001989284753976952, 'samples': 1560128, 'steps': 3047, 'loss/train': 1.4901117086410522} -09/21/2021 01:02:53 - INFO - __main__ - Step 48755: {'lr': 0.0001989284753976952, 'samples': 1560160, 'steps': 3047, 'loss/train': 1.598055124282837} -09/21/2021 01:02:53 - INFO - __main__ - Step 48756: {'lr': 0.0001989284753976952, 'samples': 1560192, 'steps': 3047, 'loss/train': 1.9142757654190063} -09/21/2021 01:02:54 - INFO - __main__ - Step 48757: {'lr': 0.0001989284753976952, 'samples': 1560224, 'steps': 3047, 'loss/train': 1.6714560985565186} -09/21/2021 01:02:55 - INFO - __main__ - Step 48758: {'lr': 0.0001989284753976952, 'samples': 1560256, 'steps': 3047, 'loss/train': 3.191103219985962} -09/21/2021 01:02:56 - INFO - __main__ - Step 48759: {'lr': 0.0001989284753976952, 'samples': 1560288, 'steps': 3047, 'loss/train': 1.6442315578460693} -09/21/2021 01:02:56 - INFO - __main__ - Step 48760: {'lr': 0.0001989284753976952, 'samples': 1560320, 'steps': 3047, 'loss/train': 0.8739123940467834} -09/21/2021 01:02:58 - INFO - __main__ - Step 48761: {'lr': 0.0001989284753976952, 'samples': 1560352, 'steps': 3047, 'loss/train': 0.5467358231544495} -09/21/2021 01:02:58 - INFO - __main__ - Step 48762: {'lr': 0.0001989284753976952, 'samples': 1560384, 'steps': 3047, 'loss/train': 2.426499366760254} -09/21/2021 01:02:59 - INFO - __main__ - Step 48763: {'lr': 0.0001989284753976952, 'samples': 1560416, 'steps': 3047, 'loss/train': 1.9543049335479736} -09/21/2021 01:03:00 - INFO - __main__ - Step 48764: {'lr': 0.0001989284753976952, 'samples': 1560448, 'steps': 3047, 'loss/train': 2.5114119052886963} -09/21/2021 01:03:01 - INFO - __main__ - Step 48765: {'lr': 0.0001989284753976952, 'samples': 1560480, 'steps': 3047, 'loss/train': 2.2905311584472656} -09/21/2021 01:03:01 - INFO - __main__ - Step 48766: {'lr': 0.0001989284753976952, 'samples': 1560512, 'steps': 3047, 'loss/train': 1.6862421035766602} -09/21/2021 01:03:02 - INFO - __main__ - Step 48767: {'lr': 0.0001989284753976952, 'samples': 1560544, 'steps': 3047, 'loss/train': 2.2870452404022217} -09/21/2021 01:03:03 - INFO - __main__ - Step 48768: {'lr': 0.0001989284753976952, 'samples': 1560576, 'steps': 3047, 'loss/train': 2.020915985107422} -09/21/2021 01:03:04 - INFO - __main__ - Step 48769: {'lr': 0.00019892754388873738, 'samples': 1560608, 'steps': 3048, 'loss/train': 1.5980814695358276} -09/21/2021 01:03:05 - INFO - __main__ - Step 48770: {'lr': 0.00019892754388873738, 'samples': 1560640, 'steps': 3048, 'loss/train': 2.2737019062042236} -09/21/2021 01:03:05 - INFO - __main__ - Step 48771: {'lr': 0.00019892754388873738, 'samples': 1560672, 'steps': 3048, 'loss/train': 2.181469678878784} -09/21/2021 01:03:06 - INFO - __main__ - Step 48772: {'lr': 0.00019892754388873738, 'samples': 1560704, 'steps': 3048, 'loss/train': 1.612792730331421} -09/21/2021 01:03:07 - INFO - __main__ - Step 48773: {'lr': 0.00019892754388873738, 'samples': 1560736, 'steps': 3048, 'loss/train': 1.7085916996002197} -09/21/2021 01:03:08 - INFO - __main__ - Step 48774: {'lr': 0.00019892754388873738, 'samples': 1560768, 'steps': 3048, 'loss/train': 2.229694128036499} -09/21/2021 01:03:08 - INFO - __main__ - Step 48775: {'lr': 0.00019892754388873738, 'samples': 1560800, 'steps': 3048, 'loss/train': 1.0608450174331665} -09/21/2021 01:03:09 - INFO - __main__ - Step 48776: {'lr': 0.00019892754388873738, 'samples': 1560832, 'steps': 3048, 'loss/train': 1.5602598190307617} -09/21/2021 01:03:10 - INFO - __main__ - Step 48777: {'lr': 0.00019892754388873738, 'samples': 1560864, 'steps': 3048, 'loss/train': 2.6591289043426514} -09/21/2021 01:03:11 - INFO - __main__ - Step 48778: {'lr': 0.00019892754388873738, 'samples': 1560896, 'steps': 3048, 'loss/train': 2.2528419494628906} -09/21/2021 01:03:11 - INFO - __main__ - Step 48779: {'lr': 0.00019892754388873738, 'samples': 1560928, 'steps': 3048, 'loss/train': 1.776077389717102} -09/21/2021 01:03:12 - INFO - __main__ - Step 48780: {'lr': 0.00019892754388873738, 'samples': 1560960, 'steps': 3048, 'loss/train': 1.7259868383407593} -09/21/2021 01:03:13 - INFO - __main__ - Step 48781: {'lr': 0.00019892754388873738, 'samples': 1560992, 'steps': 3048, 'loss/train': 1.5590206384658813} -09/21/2021 01:03:14 - INFO - __main__ - Step 48782: {'lr': 0.00019892754388873738, 'samples': 1561024, 'steps': 3048, 'loss/train': 1.6343586444854736} -09/21/2021 01:03:14 - INFO - __main__ - Step 48783: {'lr': 0.00019892754388873738, 'samples': 1561056, 'steps': 3048, 'loss/train': 1.8451218605041504} -09/21/2021 01:03:15 - INFO - __main__ - Step 48784: {'lr': 0.00019892754388873738, 'samples': 1561088, 'steps': 3048, 'loss/train': 1.495078206062317} -09/21/2021 01:03:16 - INFO - __main__ - Step 48785: {'lr': 0.00019892661197724374, 'samples': 1561120, 'steps': 3049, 'loss/train': 2.1236164569854736} -09/21/2021 01:03:17 - INFO - __main__ - Step 48786: {'lr': 0.00019892661197724374, 'samples': 1561152, 'steps': 3049, 'loss/train': 2.1324775218963623} -09/21/2021 01:03:17 - INFO - __main__ - Step 48787: {'lr': 0.00019892661197724374, 'samples': 1561184, 'steps': 3049, 'loss/train': 0.658184826374054} -09/21/2021 01:03:18 - INFO - __main__ - Step 48788: {'lr': 0.00019892661197724374, 'samples': 1561216, 'steps': 3049, 'loss/train': 0.12383240461349487} -09/21/2021 01:03:19 - INFO - __main__ - Step 48789: {'lr': 0.00019892661197724374, 'samples': 1561248, 'steps': 3049, 'loss/train': 2.2066292762756348} -09/21/2021 01:03:20 - INFO - __main__ - Step 48790: {'lr': 0.00019892661197724374, 'samples': 1561280, 'steps': 3049, 'loss/train': 1.5618561506271362} -09/21/2021 01:03:20 - INFO - __main__ - Step 48791: {'lr': 0.00019892661197724374, 'samples': 1561312, 'steps': 3049, 'loss/train': 1.4327069520950317} -09/21/2021 01:03:22 - INFO - __main__ - Step 48792: {'lr': 0.00019892661197724374, 'samples': 1561344, 'steps': 3049, 'loss/train': 1.8229374885559082} -09/21/2021 01:03:23 - INFO - __main__ - Step 48793: {'lr': 0.00019892661197724374, 'samples': 1561376, 'steps': 3049, 'loss/train': 0.8578436970710754} -09/21/2021 01:03:24 - INFO - __main__ - Step 48794: {'lr': 0.00019892661197724374, 'samples': 1561408, 'steps': 3049, 'loss/train': 2.3783884048461914} -09/21/2021 01:03:24 - INFO - __main__ - Step 48795: {'lr': 0.00019892661197724374, 'samples': 1561440, 'steps': 3049, 'loss/train': 1.9671157598495483} -09/21/2021 01:03:25 - INFO - __main__ - Step 48796: {'lr': 0.00019892661197724374, 'samples': 1561472, 'steps': 3049, 'loss/train': 2.0538907051086426} -09/21/2021 01:03:26 - INFO - __main__ - Step 48797: {'lr': 0.00019892661197724374, 'samples': 1561504, 'steps': 3049, 'loss/train': 2.0580313205718994} -09/21/2021 01:03:27 - INFO - __main__ - Step 48798: {'lr': 0.00019892661197724374, 'samples': 1561536, 'steps': 3049, 'loss/train': 1.7957316637039185} -09/21/2021 01:03:27 - INFO - __main__ - Step 48799: {'lr': 0.00019892661197724374, 'samples': 1561568, 'steps': 3049, 'loss/train': 1.7560709714889526} -09/21/2021 01:03:28 - INFO - __main__ - Step 48800: {'lr': 0.00019892661197724374, 'samples': 1561600, 'steps': 3049, 'loss/train': 1.0789201259613037} -09/21/2021 01:03:29 - INFO - __main__ - Step 48801: {'lr': 0.0001989256796632181, 'samples': 1561632, 'steps': 3050, 'loss/train': 1.92118501663208} -09/21/2021 01:03:30 - INFO - __main__ - Step 48802: {'lr': 0.0001989256796632181, 'samples': 1561664, 'steps': 3050, 'loss/train': 1.7364341020584106} -09/21/2021 01:03:31 - INFO - __main__ - Step 48803: {'lr': 0.0001989256796632181, 'samples': 1561696, 'steps': 3050, 'loss/train': 1.6940864324569702} -09/21/2021 01:03:31 - INFO - __main__ - Step 48804: {'lr': 0.0001989256796632181, 'samples': 1561728, 'steps': 3050, 'loss/train': 2.0547821521759033} -09/21/2021 01:03:32 - INFO - __main__ - Step 48805: {'lr': 0.0001989256796632181, 'samples': 1561760, 'steps': 3050, 'loss/train': 1.4630377292633057} -09/21/2021 01:03:33 - INFO - __main__ - Step 48806: {'lr': 0.0001989256796632181, 'samples': 1561792, 'steps': 3050, 'loss/train': 2.4832074642181396} -09/21/2021 01:03:34 - INFO - __main__ - Step 48807: {'lr': 0.0001989256796632181, 'samples': 1561824, 'steps': 3050, 'loss/train': 2.3034560680389404} -09/21/2021 01:03:34 - INFO - __main__ - Step 48808: {'lr': 0.0001989256796632181, 'samples': 1561856, 'steps': 3050, 'loss/train': 2.1239848136901855} -09/21/2021 01:03:35 - INFO - __main__ - Step 48809: {'lr': 0.0001989256796632181, 'samples': 1561888, 'steps': 3050, 'loss/train': 1.7355434894561768} -09/21/2021 01:03:36 - INFO - __main__ - Step 48810: {'lr': 0.0001989256796632181, 'samples': 1561920, 'steps': 3050, 'loss/train': 2.362391710281372} -09/21/2021 01:03:37 - INFO - __main__ - Step 48811: {'lr': 0.0001989256796632181, 'samples': 1561952, 'steps': 3050, 'loss/train': 1.69521164894104} -09/21/2021 01:03:37 - INFO - __main__ - Step 48812: {'lr': 0.0001989256796632181, 'samples': 1561984, 'steps': 3050, 'loss/train': 1.2226979732513428} -09/21/2021 01:03:38 - INFO - __main__ - Step 48813: {'lr': 0.0001989256796632181, 'samples': 1562016, 'steps': 3050, 'loss/train': 1.6748679876327515} -09/21/2021 01:03:39 - INFO - __main__ - Step 48814: {'lr': 0.0001989256796632181, 'samples': 1562048, 'steps': 3050, 'loss/train': 1.4971743822097778} -09/21/2021 01:03:40 - INFO - __main__ - Step 48815: {'lr': 0.0001989256796632181, 'samples': 1562080, 'steps': 3050, 'loss/train': 2.230731964111328} -09/21/2021 01:03:40 - INFO - __main__ - Step 48816: {'lr': 0.0001989256796632181, 'samples': 1562112, 'steps': 3050, 'loss/train': 2.917020797729492} -09/21/2021 01:03:41 - INFO - __main__ - Step 48817: {'lr': 0.00019892474694666425, 'samples': 1562144, 'steps': 3051, 'loss/train': 2.4166340827941895} -09/21/2021 01:03:42 - INFO - __main__ - Step 48818: {'lr': 0.00019892474694666425, 'samples': 1562176, 'steps': 3051, 'loss/train': 1.8553636074066162} -09/21/2021 01:03:43 - INFO - __main__ - Step 48819: {'lr': 0.00019892474694666425, 'samples': 1562208, 'steps': 3051, 'loss/train': 2.428142547607422} -09/21/2021 01:03:43 - INFO - __main__ - Step 48820: {'lr': 0.00019892474694666425, 'samples': 1562240, 'steps': 3051, 'loss/train': 0.9574191570281982} -09/21/2021 01:03:44 - INFO - __main__ - Step 48821: {'lr': 0.00019892474694666425, 'samples': 1562272, 'steps': 3051, 'loss/train': 1.5273547172546387} -09/21/2021 01:03:45 - INFO - __main__ - Step 48822: {'lr': 0.00019892474694666425, 'samples': 1562304, 'steps': 3051, 'loss/train': 2.0410995483398438} -09/21/2021 01:03:46 - INFO - __main__ - Step 48823: {'lr': 0.00019892474694666425, 'samples': 1562336, 'steps': 3051, 'loss/train': 1.7173116207122803} -09/21/2021 01:03:47 - INFO - __main__ - Step 48824: {'lr': 0.00019892474694666425, 'samples': 1562368, 'steps': 3051, 'loss/train': 1.3601064682006836} -09/21/2021 01:03:48 - INFO - __main__ - Step 48825: {'lr': 0.00019892474694666425, 'samples': 1562400, 'steps': 3051, 'loss/train': 1.659468412399292} -09/21/2021 01:03:48 - INFO - __main__ - Step 48826: {'lr': 0.00019892474694666425, 'samples': 1562432, 'steps': 3051, 'loss/train': 1.8023312091827393} -09/21/2021 01:03:49 - INFO - __main__ - Step 48827: {'lr': 0.00019892474694666425, 'samples': 1562464, 'steps': 3051, 'loss/train': 1.913959264755249} -09/21/2021 01:03:50 - INFO - __main__ - Step 48828: {'lr': 0.00019892474694666425, 'samples': 1562496, 'steps': 3051, 'loss/train': 1.1116623878479004} -09/21/2021 01:03:51 - INFO - __main__ - Step 48829: {'lr': 0.00019892474694666425, 'samples': 1562528, 'steps': 3051, 'loss/train': 2.264708995819092} -09/21/2021 01:03:51 - INFO - __main__ - Step 48830: {'lr': 0.00019892474694666425, 'samples': 1562560, 'steps': 3051, 'loss/train': 2.2054316997528076} -09/21/2021 01:03:52 - INFO - __main__ - Step 48831: {'lr': 0.00019892474694666425, 'samples': 1562592, 'steps': 3051, 'loss/train': 1.9947125911712646} -09/21/2021 01:03:53 - INFO - __main__ - Step 48832: {'lr': 0.00019892474694666425, 'samples': 1562624, 'steps': 3051, 'loss/train': 2.020432472229004} -09/21/2021 01:03:54 - INFO - __main__ - Step 48833: {'lr': 0.00019892381382758602, 'samples': 1562656, 'steps': 3052, 'loss/train': 1.673569679260254} -09/21/2021 01:03:55 - INFO - __main__ - Step 48834: {'lr': 0.00019892381382758602, 'samples': 1562688, 'steps': 3052, 'loss/train': 2.1223201751708984} -09/21/2021 01:03:55 - INFO - __main__ - Step 48835: {'lr': 0.00019892381382758602, 'samples': 1562720, 'steps': 3052, 'loss/train': 1.9432021379470825} -09/21/2021 01:03:56 - INFO - __main__ - Step 48836: {'lr': 0.00019892381382758602, 'samples': 1562752, 'steps': 3052, 'loss/train': 2.2042980194091797} -09/21/2021 01:03:57 - INFO - __main__ - Step 48837: {'lr': 0.00019892381382758602, 'samples': 1562784, 'steps': 3052, 'loss/train': 1.4624172449111938} -09/21/2021 01:03:58 - INFO - __main__ - Step 48838: {'lr': 0.00019892381382758602, 'samples': 1562816, 'steps': 3052, 'loss/train': 1.5618246793746948} -09/21/2021 01:03:58 - INFO - __main__ - Step 48839: {'lr': 0.00019892381382758602, 'samples': 1562848, 'steps': 3052, 'loss/train': 1.847083568572998} -09/21/2021 01:03:59 - INFO - __main__ - Step 48840: {'lr': 0.00019892381382758602, 'samples': 1562880, 'steps': 3052, 'loss/train': 1.2189686298370361} -09/21/2021 01:04:00 - INFO - __main__ - Step 48841: {'lr': 0.00019892381382758602, 'samples': 1562912, 'steps': 3052, 'loss/train': 1.6631155014038086} -09/21/2021 01:04:01 - INFO - __main__ - Step 48842: {'lr': 0.00019892381382758602, 'samples': 1562944, 'steps': 3052, 'loss/train': 1.8816750049591064} -09/21/2021 01:04:01 - INFO - __main__ - Step 48843: {'lr': 0.00019892381382758602, 'samples': 1562976, 'steps': 3052, 'loss/train': 2.6553876399993896} -09/21/2021 01:04:02 - INFO - __main__ - Step 48844: {'lr': 0.00019892381382758602, 'samples': 1563008, 'steps': 3052, 'loss/train': 1.5021955966949463} -09/21/2021 01:04:03 - INFO - __main__ - Step 48845: {'lr': 0.00019892381382758602, 'samples': 1563040, 'steps': 3052, 'loss/train': 2.160024642944336} -09/21/2021 01:04:04 - INFO - __main__ - Step 48846: {'lr': 0.00019892381382758602, 'samples': 1563072, 'steps': 3052, 'loss/train': 0.6267435550689697} -09/21/2021 01:04:04 - INFO - __main__ - Step 48847: {'lr': 0.00019892381382758602, 'samples': 1563104, 'steps': 3052, 'loss/train': 2.256807804107666} -09/21/2021 01:04:05 - INFO - __main__ - Step 48848: {'lr': 0.00019892381382758602, 'samples': 1563136, 'steps': 3052, 'loss/train': 2.1734676361083984} -09/21/2021 01:04:06 - INFO - __main__ - Step 48849: {'lr': 0.00019892288030598713, 'samples': 1563168, 'steps': 3053, 'loss/train': 0.7246280312538147} -09/21/2021 01:04:07 - INFO - __main__ - Step 48850: {'lr': 0.00019892288030598713, 'samples': 1563200, 'steps': 3053, 'loss/train': 2.5133144855499268} -09/21/2021 01:04:07 - INFO - __main__ - Step 48851: {'lr': 0.00019892288030598713, 'samples': 1563232, 'steps': 3053, 'loss/train': 1.7461693286895752} -09/21/2021 01:04:08 - INFO - __main__ - Step 48852: {'lr': 0.00019892288030598713, 'samples': 1563264, 'steps': 3053, 'loss/train': 1.1926932334899902} -09/21/2021 01:04:10 - INFO - __main__ - Step 48853: {'lr': 0.00019892288030598713, 'samples': 1563296, 'steps': 3053, 'loss/train': 0.6218677759170532} -09/21/2021 01:04:10 - INFO - __main__ - Step 48854: {'lr': 0.00019892288030598713, 'samples': 1563328, 'steps': 3053, 'loss/train': 2.833838701248169} -09/21/2021 01:04:11 - INFO - __main__ - Step 48855: {'lr': 0.00019892288030598713, 'samples': 1563360, 'steps': 3053, 'loss/train': 2.118884801864624} -09/21/2021 01:04:12 - INFO - __main__ - Step 48856: {'lr': 0.00019892288030598713, 'samples': 1563392, 'steps': 3053, 'loss/train': 1.3516992330551147} -09/21/2021 01:04:13 - INFO - __main__ - Step 48857: {'lr': 0.00019892288030598713, 'samples': 1563424, 'steps': 3053, 'loss/train': 2.5372729301452637} -09/21/2021 01:04:13 - INFO - __main__ - Step 48858: {'lr': 0.00019892288030598713, 'samples': 1563456, 'steps': 3053, 'loss/train': 1.9904760122299194} -09/21/2021 01:04:14 - INFO - __main__ - Step 48859: {'lr': 0.00019892288030598713, 'samples': 1563488, 'steps': 3053, 'loss/train': 2.197918176651001} -09/21/2021 01:04:15 - INFO - __main__ - Step 48860: {'lr': 0.00019892288030598713, 'samples': 1563520, 'steps': 3053, 'loss/train': 1.6289939880371094} -09/21/2021 01:04:16 - INFO - __main__ - Step 48861: {'lr': 0.00019892288030598713, 'samples': 1563552, 'steps': 3053, 'loss/train': 2.5783421993255615} -09/21/2021 01:04:16 - INFO - __main__ - Step 48862: {'lr': 0.00019892288030598713, 'samples': 1563584, 'steps': 3053, 'loss/train': 1.8648459911346436} -09/21/2021 01:04:17 - INFO - __main__ - Step 48863: {'lr': 0.00019892288030598713, 'samples': 1563616, 'steps': 3053, 'loss/train': 2.5904107093811035} -09/21/2021 01:04:18 - INFO - __main__ - Step 48864: {'lr': 0.00019892288030598713, 'samples': 1563648, 'steps': 3053, 'loss/train': 2.9065029621124268} -09/21/2021 01:04:19 - INFO - __main__ - Step 48865: {'lr': 0.00019892194638187143, 'samples': 1563680, 'steps': 3054, 'loss/train': 3.4614577293395996} -09/21/2021 01:04:19 - INFO - __main__ - Step 48866: {'lr': 0.00019892194638187143, 'samples': 1563712, 'steps': 3054, 'loss/train': 3.356931447982788} -09/21/2021 01:04:20 - INFO - __main__ - Step 48867: {'lr': 0.00019892194638187143, 'samples': 1563744, 'steps': 3054, 'loss/train': 3.4315881729125977} -09/21/2021 01:04:21 - INFO - __main__ - Step 48868: {'lr': 0.00019892194638187143, 'samples': 1563776, 'steps': 3054, 'loss/train': 1.8597699403762817} -09/21/2021 01:04:22 - INFO - __main__ - Step 48869: {'lr': 0.00019892194638187143, 'samples': 1563808, 'steps': 3054, 'loss/train': 1.4794777631759644} -09/21/2021 01:04:22 - INFO - __main__ - Step 48870: {'lr': 0.00019892194638187143, 'samples': 1563840, 'steps': 3054, 'loss/train': 2.215402603149414} -09/21/2021 01:04:23 - INFO - __main__ - Step 48871: {'lr': 0.00019892194638187143, 'samples': 1563872, 'steps': 3054, 'loss/train': 1.163529396057129} -09/21/2021 01:04:24 - INFO - __main__ - Step 48872: {'lr': 0.00019892194638187143, 'samples': 1563904, 'steps': 3054, 'loss/train': 1.8836097717285156} -09/21/2021 01:04:25 - INFO - __main__ - Step 48873: {'lr': 0.00019892194638187143, 'samples': 1563936, 'steps': 3054, 'loss/train': 1.4970287084579468} -09/21/2021 01:04:25 - INFO - __main__ - Step 48874: {'lr': 0.00019892194638187143, 'samples': 1563968, 'steps': 3054, 'loss/train': 2.294368028640747} -09/21/2021 01:04:26 - INFO - __main__ - Step 48875: {'lr': 0.00019892194638187143, 'samples': 1564000, 'steps': 3054, 'loss/train': 2.44543194770813} -09/21/2021 01:04:27 - INFO - __main__ - Step 48876: {'lr': 0.00019892194638187143, 'samples': 1564032, 'steps': 3054, 'loss/train': 2.5683417320251465} -09/21/2021 01:04:28 - INFO - __main__ - Step 48877: {'lr': 0.00019892194638187143, 'samples': 1564064, 'steps': 3054, 'loss/train': 2.449814796447754} -09/21/2021 01:04:28 - INFO - __main__ - Step 48878: {'lr': 0.00019892194638187143, 'samples': 1564096, 'steps': 3054, 'loss/train': 1.757702350616455} -09/21/2021 01:04:29 - INFO - __main__ - Step 48879: {'lr': 0.00019892194638187143, 'samples': 1564128, 'steps': 3054, 'loss/train': 1.4961854219436646} -09/21/2021 01:04:30 - INFO - __main__ - Step 48880: {'lr': 0.00019892194638187143, 'samples': 1564160, 'steps': 3054, 'loss/train': 3.2120542526245117} -09/21/2021 01:04:31 - INFO - __main__ - Step 48881: {'lr': 0.00019892101205524272, 'samples': 1564192, 'steps': 3055, 'loss/train': 2.038051128387451} -09/21/2021 01:04:32 - INFO - __main__ - Step 48882: {'lr': 0.00019892101205524272, 'samples': 1564224, 'steps': 3055, 'loss/train': 2.360346794128418} -09/21/2021 01:04:32 - INFO - __main__ - Step 48883: {'lr': 0.00019892101205524272, 'samples': 1564256, 'steps': 3055, 'loss/train': 1.9909768104553223} -09/21/2021 01:04:34 - INFO - __main__ - Step 48884: {'lr': 0.00019892101205524272, 'samples': 1564288, 'steps': 3055, 'loss/train': 2.22552227973938} -09/21/2021 01:04:34 - INFO - __main__ - Step 48885: {'lr': 0.00019892101205524272, 'samples': 1564320, 'steps': 3055, 'loss/train': 2.9902868270874023} -09/21/2021 01:04:35 - INFO - __main__ - Step 48886: {'lr': 0.00019892101205524272, 'samples': 1564352, 'steps': 3055, 'loss/train': 1.7083300352096558} -09/21/2021 01:04:36 - INFO - __main__ - Step 48887: {'lr': 0.00019892101205524272, 'samples': 1564384, 'steps': 3055, 'loss/train': 2.309823751449585} -09/21/2021 01:04:37 - INFO - __main__ - Step 48888: {'lr': 0.00019892101205524272, 'samples': 1564416, 'steps': 3055, 'loss/train': 2.0765628814697266} -09/21/2021 01:04:37 - INFO - __main__ - Step 48889: {'lr': 0.00019892101205524272, 'samples': 1564448, 'steps': 3055, 'loss/train': 2.48213267326355} -09/21/2021 01:04:38 - INFO - __main__ - Step 48890: {'lr': 0.00019892101205524272, 'samples': 1564480, 'steps': 3055, 'loss/train': 4.639780521392822} -09/21/2021 01:04:39 - INFO - __main__ - Step 48891: {'lr': 0.00019892101205524272, 'samples': 1564512, 'steps': 3055, 'loss/train': 2.2810802459716797} -09/21/2021 01:04:40 - INFO - __main__ - Step 48892: {'lr': 0.00019892101205524272, 'samples': 1564544, 'steps': 3055, 'loss/train': 2.190709352493286} -09/21/2021 01:04:40 - INFO - __main__ - Step 48893: {'lr': 0.00019892101205524272, 'samples': 1564576, 'steps': 3055, 'loss/train': 1.863652229309082} -09/21/2021 01:04:41 - INFO - __main__ - Step 48894: {'lr': 0.00019892101205524272, 'samples': 1564608, 'steps': 3055, 'loss/train': 2.3566372394561768} -09/21/2021 01:04:42 - INFO - __main__ - Step 48895: {'lr': 0.00019892101205524272, 'samples': 1564640, 'steps': 3055, 'loss/train': 2.0739924907684326} -09/21/2021 01:04:43 - INFO - __main__ - Step 48896: {'lr': 0.00019892101205524272, 'samples': 1564672, 'steps': 3055, 'loss/train': 1.5924232006072998} -09/21/2021 01:04:44 - INFO - __main__ - Step 48897: {'lr': 0.0001989200773261048, 'samples': 1564704, 'steps': 3056, 'loss/train': 1.3119134902954102} -09/21/2021 01:04:44 - INFO - __main__ - Step 48898: {'lr': 0.0001989200773261048, 'samples': 1564736, 'steps': 3056, 'loss/train': 2.178676128387451} -09/21/2021 01:04:45 - INFO - __main__ - Step 48899: {'lr': 0.0001989200773261048, 'samples': 1564768, 'steps': 3056, 'loss/train': 2.1555213928222656} -09/21/2021 01:04:46 - INFO - __main__ - Step 48900: {'lr': 0.0001989200773261048, 'samples': 1564800, 'steps': 3056, 'loss/train': 1.715532898902893} -09/21/2021 01:04:47 - INFO - __main__ - Step 48901: {'lr': 0.0001989200773261048, 'samples': 1564832, 'steps': 3056, 'loss/train': 1.2051771879196167} -09/21/2021 01:04:47 - INFO - __main__ - Step 48902: {'lr': 0.0001989200773261048, 'samples': 1564864, 'steps': 3056, 'loss/train': 2.313002109527588} -09/21/2021 01:04:48 - INFO - __main__ - Step 48903: {'lr': 0.0001989200773261048, 'samples': 1564896, 'steps': 3056, 'loss/train': 2.2204577922821045} -09/21/2021 01:04:49 - INFO - __main__ - Step 48904: {'lr': 0.0001989200773261048, 'samples': 1564928, 'steps': 3056, 'loss/train': 2.0807337760925293} -09/21/2021 01:04:50 - INFO - __main__ - Step 48905: {'lr': 0.0001989200773261048, 'samples': 1564960, 'steps': 3056, 'loss/train': 1.901159405708313} -09/21/2021 01:04:50 - INFO - __main__ - Step 48906: {'lr': 0.0001989200773261048, 'samples': 1564992, 'steps': 3056, 'loss/train': 3.438167095184326} -09/21/2021 01:04:51 - INFO - __main__ - Step 48907: {'lr': 0.0001989200773261048, 'samples': 1565024, 'steps': 3056, 'loss/train': 2.839850425720215} -09/21/2021 01:04:52 - INFO - __main__ - Step 48908: {'lr': 0.0001989200773261048, 'samples': 1565056, 'steps': 3056, 'loss/train': 1.990059494972229} -09/21/2021 01:04:53 - INFO - __main__ - Step 48909: {'lr': 0.0001989200773261048, 'samples': 1565088, 'steps': 3056, 'loss/train': 2.0174989700317383} -09/21/2021 01:04:53 - INFO - __main__ - Step 48910: {'lr': 0.0001989200773261048, 'samples': 1565120, 'steps': 3056, 'loss/train': 1.6048941612243652} -09/21/2021 01:04:54 - INFO - __main__ - Step 48911: {'lr': 0.0001989200773261048, 'samples': 1565152, 'steps': 3056, 'loss/train': 2.0932371616363525} -09/21/2021 01:04:55 - INFO - __main__ - Step 48912: {'lr': 0.0001989200773261048, 'samples': 1565184, 'steps': 3056, 'loss/train': 2.54207181930542} -09/21/2021 01:04:56 - INFO - __main__ - Step 48913: {'lr': 0.00019891914219446148, 'samples': 1565216, 'steps': 3057, 'loss/train': 1.6324573755264282} -09/21/2021 01:04:56 - INFO - __main__ - Step 48914: {'lr': 0.00019891914219446148, 'samples': 1565248, 'steps': 3057, 'loss/train': 1.785766363143921} -09/21/2021 01:04:58 - INFO - __main__ - Step 48915: {'lr': 0.00019891914219446148, 'samples': 1565280, 'steps': 3057, 'loss/train': 1.8792824745178223} -09/21/2021 01:04:58 - INFO - __main__ - Step 48916: {'lr': 0.00019891914219446148, 'samples': 1565312, 'steps': 3057, 'loss/train': 0.12770460546016693} -09/21/2021 01:04:59 - INFO - __main__ - Step 48917: {'lr': 0.00019891914219446148, 'samples': 1565344, 'steps': 3057, 'loss/train': 1.7466305494308472} -09/21/2021 01:05:00 - INFO - __main__ - Step 48918: {'lr': 0.00019891914219446148, 'samples': 1565376, 'steps': 3057, 'loss/train': 2.387587547302246} -09/21/2021 01:05:01 - INFO - __main__ - Step 48919: {'lr': 0.00019891914219446148, 'samples': 1565408, 'steps': 3057, 'loss/train': 1.2674717903137207} -09/21/2021 01:05:01 - INFO - __main__ - Step 48920: {'lr': 0.00019891914219446148, 'samples': 1565440, 'steps': 3057, 'loss/train': 2.095233678817749} -09/21/2021 01:05:02 - INFO - __main__ - Step 48921: {'lr': 0.00019891914219446148, 'samples': 1565472, 'steps': 3057, 'loss/train': 1.291335105895996} -09/21/2021 01:05:03 - INFO - __main__ - Step 48922: {'lr': 0.00019891914219446148, 'samples': 1565504, 'steps': 3057, 'loss/train': 2.132087230682373} -09/21/2021 01:05:04 - INFO - __main__ - Step 48923: {'lr': 0.00019891914219446148, 'samples': 1565536, 'steps': 3057, 'loss/train': 2.4184725284576416} -09/21/2021 01:05:04 - INFO - __main__ - Step 48924: {'lr': 0.00019891914219446148, 'samples': 1565568, 'steps': 3057, 'loss/train': 2.2100841999053955} -09/21/2021 01:05:05 - INFO - __main__ - Step 48925: {'lr': 0.00019891914219446148, 'samples': 1565600, 'steps': 3057, 'loss/train': 1.951420545578003} -09/21/2021 01:05:06 - INFO - __main__ - Step 48926: {'lr': 0.00019891914219446148, 'samples': 1565632, 'steps': 3057, 'loss/train': 1.5630178451538086} -09/21/2021 01:05:07 - INFO - __main__ - Step 48927: {'lr': 0.00019891914219446148, 'samples': 1565664, 'steps': 3057, 'loss/train': 1.7345362901687622} -09/21/2021 01:05:07 - INFO - __main__ - Step 48928: {'lr': 0.00019891914219446148, 'samples': 1565696, 'steps': 3057, 'loss/train': 1.946605920791626} -09/21/2021 01:05:08 - INFO - __main__ - Step 48929: {'lr': 0.00019891820666031654, 'samples': 1565728, 'steps': 3058, 'loss/train': 2.2440686225891113} -09/21/2021 01:05:09 - INFO - __main__ - Step 48930: {'lr': 0.00019891820666031654, 'samples': 1565760, 'steps': 3058, 'loss/train': 1.0854763984680176} -09/21/2021 01:05:10 - INFO - __main__ - Step 48931: {'lr': 0.00019891820666031654, 'samples': 1565792, 'steps': 3058, 'loss/train': 2.5726704597473145} -09/21/2021 01:05:11 - INFO - __main__ - Step 48932: {'lr': 0.00019891820666031654, 'samples': 1565824, 'steps': 3058, 'loss/train': 1.4986990690231323} -09/21/2021 01:05:11 - INFO - __main__ - Step 48933: {'lr': 0.00019891820666031654, 'samples': 1565856, 'steps': 3058, 'loss/train': 2.0364890098571777} -09/21/2021 01:05:12 - INFO - __main__ - Step 48934: {'lr': 0.00019891820666031654, 'samples': 1565888, 'steps': 3058, 'loss/train': 1.6934489011764526} -09/21/2021 01:05:13 - INFO - __main__ - Step 48935: {'lr': 0.00019891820666031654, 'samples': 1565920, 'steps': 3058, 'loss/train': 1.719884991645813} -09/21/2021 01:05:14 - INFO - __main__ - Step 48936: {'lr': 0.00019891820666031654, 'samples': 1565952, 'steps': 3058, 'loss/train': 4.137562274932861} -09/21/2021 01:05:14 - INFO - __main__ - Step 48937: {'lr': 0.00019891820666031654, 'samples': 1565984, 'steps': 3058, 'loss/train': 1.5770543813705444} -09/21/2021 01:05:15 - INFO - __main__ - Step 48938: {'lr': 0.00019891820666031654, 'samples': 1566016, 'steps': 3058, 'loss/train': 2.248425006866455} -09/21/2021 01:05:16 - INFO - __main__ - Step 48939: {'lr': 0.00019891820666031654, 'samples': 1566048, 'steps': 3058, 'loss/train': 1.9215171337127686} -09/21/2021 01:05:17 - INFO - __main__ - Step 48940: {'lr': 0.00019891820666031654, 'samples': 1566080, 'steps': 3058, 'loss/train': 1.2115707397460938} -09/21/2021 01:05:17 - INFO - __main__ - Step 48941: {'lr': 0.00019891820666031654, 'samples': 1566112, 'steps': 3058, 'loss/train': 1.6610252857208252} -09/21/2021 01:05:18 - INFO - __main__ - Step 48942: {'lr': 0.00019891820666031654, 'samples': 1566144, 'steps': 3058, 'loss/train': 3.1765646934509277} -09/21/2021 01:05:19 - INFO - __main__ - Step 48943: {'lr': 0.00019891820666031654, 'samples': 1566176, 'steps': 3058, 'loss/train': 1.8580787181854248} -09/21/2021 01:05:20 - INFO - __main__ - Step 48944: {'lr': 0.00019891820666031654, 'samples': 1566208, 'steps': 3058, 'loss/train': 1.6689280271530151} -09/21/2021 01:05:20 - INFO - __main__ - Step 48945: {'lr': 0.00019891727072367382, 'samples': 1566240, 'steps': 3059, 'loss/train': 1.5475552082061768} -09/21/2021 01:05:22 - INFO - __main__ - Step 48946: {'lr': 0.00019891727072367382, 'samples': 1566272, 'steps': 3059, 'loss/train': 2.009572982788086} -09/21/2021 01:05:23 - INFO - __main__ - Step 48947: {'lr': 0.00019891727072367382, 'samples': 1566304, 'steps': 3059, 'loss/train': 2.1382837295532227} -09/21/2021 01:05:23 - INFO - __main__ - Step 48948: {'lr': 0.00019891727072367382, 'samples': 1566336, 'steps': 3059, 'loss/train': 2.4917359352111816} -09/21/2021 01:05:24 - INFO - __main__ - Step 48949: {'lr': 0.00019891727072367382, 'samples': 1566368, 'steps': 3059, 'loss/train': 1.6064379215240479} -09/21/2021 01:05:25 - INFO - __main__ - Step 48950: {'lr': 0.00019891727072367382, 'samples': 1566400, 'steps': 3059, 'loss/train': 0.31757205724716187} -09/21/2021 01:05:26 - INFO - __main__ - Step 48951: {'lr': 0.00019891727072367382, 'samples': 1566432, 'steps': 3059, 'loss/train': 0.37073996663093567} -09/21/2021 01:05:26 - INFO - __main__ - Step 48952: {'lr': 0.00019891727072367382, 'samples': 1566464, 'steps': 3059, 'loss/train': 0.3149455189704895} -09/21/2021 01:05:27 - INFO - __main__ - Step 48953: {'lr': 0.00019891727072367382, 'samples': 1566496, 'steps': 3059, 'loss/train': 0.37268319725990295} -09/21/2021 01:05:28 - INFO - __main__ - Step 48954: {'lr': 0.00019891727072367382, 'samples': 1566528, 'steps': 3059, 'loss/train': 0.8807190656661987} -09/21/2021 01:05:29 - INFO - __main__ - Step 48955: {'lr': 0.00019891727072367382, 'samples': 1566560, 'steps': 3059, 'loss/train': 0.3595525026321411} -09/21/2021 01:05:29 - INFO - __main__ - Step 48956: {'lr': 0.00019891727072367382, 'samples': 1566592, 'steps': 3059, 'loss/train': 0.17159105837345123} -09/21/2021 01:05:30 - INFO - __main__ - Step 48957: {'lr': 0.00019891727072367382, 'samples': 1566624, 'steps': 3059, 'loss/train': 0.5235256552696228} -09/21/2021 01:05:31 - INFO - __main__ - Step 48958: {'lr': 0.00019891727072367382, 'samples': 1566656, 'steps': 3059, 'loss/train': 2.832101821899414} -09/21/2021 01:05:32 - INFO - __main__ - Step 48959: {'lr': 0.00019891727072367382, 'samples': 1566688, 'steps': 3059, 'loss/train': 1.6292608976364136} -09/21/2021 01:05:32 - INFO - __main__ - Step 48960: {'lr': 0.00019891727072367382, 'samples': 1566720, 'steps': 3059, 'loss/train': 2.2424347400665283} -09/21/2021 01:05:33 - INFO - __main__ - Step 48961: {'lr': 0.00019891633438453709, 'samples': 1566752, 'steps': 3060, 'loss/train': 1.5392473936080933} -09/21/2021 01:05:34 - INFO - __main__ - Step 48962: {'lr': 0.00019891633438453709, 'samples': 1566784, 'steps': 3060, 'loss/train': 1.7042601108551025} -09/21/2021 01:05:35 - INFO - __main__ - Step 48963: {'lr': 0.00019891633438453709, 'samples': 1566816, 'steps': 3060, 'loss/train': 0.7872536182403564} -09/21/2021 01:05:36 - INFO - __main__ - Step 48964: {'lr': 0.00019891633438453709, 'samples': 1566848, 'steps': 3060, 'loss/train': 1.9363203048706055} -09/21/2021 01:05:36 - INFO - __main__ - Step 48965: {'lr': 0.00019891633438453709, 'samples': 1566880, 'steps': 3060, 'loss/train': 1.7288849353790283} -09/21/2021 01:05:37 - INFO - __main__ - Step 48966: {'lr': 0.00019891633438453709, 'samples': 1566912, 'steps': 3060, 'loss/train': 1.2739264965057373} -09/21/2021 01:05:38 - INFO - __main__ - Step 48967: {'lr': 0.00019891633438453709, 'samples': 1566944, 'steps': 3060, 'loss/train': 2.564870595932007} -09/21/2021 01:05:39 - INFO - __main__ - Step 48968: {'lr': 0.00019891633438453709, 'samples': 1566976, 'steps': 3060, 'loss/train': 2.187971830368042} -09/21/2021 01:05:39 - INFO - __main__ - Step 48969: {'lr': 0.00019891633438453709, 'samples': 1567008, 'steps': 3060, 'loss/train': 2.262310266494751} -09/21/2021 01:05:40 - INFO - __main__ - Step 48970: {'lr': 0.00019891633438453709, 'samples': 1567040, 'steps': 3060, 'loss/train': 1.6042674779891968} -09/21/2021 01:05:41 - INFO - __main__ - Step 48971: {'lr': 0.00019891633438453709, 'samples': 1567072, 'steps': 3060, 'loss/train': 1.7145425081253052} -09/21/2021 01:05:42 - INFO - __main__ - Step 48972: {'lr': 0.00019891633438453709, 'samples': 1567104, 'steps': 3060, 'loss/train': 2.202697277069092} -09/21/2021 01:05:42 - INFO - __main__ - Step 48973: {'lr': 0.00019891633438453709, 'samples': 1567136, 'steps': 3060, 'loss/train': 1.640343427658081} -09/21/2021 01:05:43 - INFO - __main__ - Step 48974: {'lr': 0.00019891633438453709, 'samples': 1567168, 'steps': 3060, 'loss/train': 0.3495367765426636} -09/21/2021 01:05:44 - INFO - __main__ - Step 48975: {'lr': 0.00019891633438453709, 'samples': 1567200, 'steps': 3060, 'loss/train': 0.1084466278553009} -09/21/2021 01:05:45 - INFO - __main__ - Step 48976: {'lr': 0.00019891633438453709, 'samples': 1567232, 'steps': 3060, 'loss/train': 0.4425932466983795} -09/21/2021 01:05:47 - INFO - __main__ - Step 48977: {'lr': 0.00019891539764291017, 'samples': 1567264, 'steps': 3061, 'loss/train': 1.2071717977523804} -09/21/2021 01:05:48 - INFO - __main__ - Step 48978: {'lr': 0.00019891539764291017, 'samples': 1567296, 'steps': 3061, 'loss/train': 2.333458423614502} -09/21/2021 01:05:48 - INFO - __main__ - Step 48979: {'lr': 0.00019891539764291017, 'samples': 1567328, 'steps': 3061, 'loss/train': 1.5089147090911865} -09/21/2021 01:05:49 - INFO - __main__ - Step 48980: {'lr': 0.00019891539764291017, 'samples': 1567360, 'steps': 3061, 'loss/train': 2.171314001083374} -09/21/2021 01:05:50 - INFO - __main__ - Step 48981: {'lr': 0.00019891539764291017, 'samples': 1567392, 'steps': 3061, 'loss/train': 1.893828272819519} -09/21/2021 01:05:51 - INFO - __main__ - Step 48982: {'lr': 0.00019891539764291017, 'samples': 1567424, 'steps': 3061, 'loss/train': 1.7899394035339355} -09/21/2021 01:05:51 - INFO - __main__ - Step 48983: {'lr': 0.00019891539764291017, 'samples': 1567456, 'steps': 3061, 'loss/train': 2.273898124694824} -09/21/2021 01:05:52 - INFO - __main__ - Step 48984: {'lr': 0.00019891539764291017, 'samples': 1567488, 'steps': 3061, 'loss/train': 1.0856478214263916} -09/21/2021 01:05:53 - INFO - __main__ - Step 48985: {'lr': 0.00019891539764291017, 'samples': 1567520, 'steps': 3061, 'loss/train': 2.6231541633605957} -09/21/2021 01:05:54 - INFO - __main__ - Step 48986: {'lr': 0.00019891539764291017, 'samples': 1567552, 'steps': 3061, 'loss/train': 1.7042548656463623} -09/21/2021 01:05:54 - INFO - __main__ - Step 48987: {'lr': 0.00019891539764291017, 'samples': 1567584, 'steps': 3061, 'loss/train': 1.1873080730438232} -09/21/2021 01:05:55 - INFO - __main__ - Step 48988: {'lr': 0.00019891539764291017, 'samples': 1567616, 'steps': 3061, 'loss/train': 1.646767258644104} -09/21/2021 01:05:56 - INFO - __main__ - Step 48989: {'lr': 0.00019891539764291017, 'samples': 1567648, 'steps': 3061, 'loss/train': 2.0009288787841797} -09/21/2021 01:05:57 - INFO - __main__ - Step 48990: {'lr': 0.00019891539764291017, 'samples': 1567680, 'steps': 3061, 'loss/train': 1.905615210533142} -09/21/2021 01:05:57 - INFO - __main__ - Step 48991: {'lr': 0.00019891539764291017, 'samples': 1567712, 'steps': 3061, 'loss/train': 2.6579270362854004} -09/21/2021 01:05:58 - INFO - __main__ - Step 48992: {'lr': 0.00019891539764291017, 'samples': 1567744, 'steps': 3061, 'loss/train': 2.265653610229492} -09/21/2021 01:05:59 - INFO - __main__ - Step 48993: {'lr': 0.0001989144604987969, 'samples': 1567776, 'steps': 3062, 'loss/train': 1.0275987386703491} -09/21/2021 01:06:00 - INFO - __main__ - Step 48994: {'lr': 0.0001989144604987969, 'samples': 1567808, 'steps': 3062, 'loss/train': 1.8347738981246948} -09/21/2021 01:06:01 - INFO - __main__ - Step 48995: {'lr': 0.0001989144604987969, 'samples': 1567840, 'steps': 3062, 'loss/train': 2.288846015930176} -09/21/2021 01:06:01 - INFO - __main__ - Step 48996: {'lr': 0.0001989144604987969, 'samples': 1567872, 'steps': 3062, 'loss/train': 1.503806233406067} -09/21/2021 01:06:02 - INFO - __main__ - Step 48997: {'lr': 0.0001989144604987969, 'samples': 1567904, 'steps': 3062, 'loss/train': 1.9752801656723022} -09/21/2021 01:06:03 - INFO - __main__ - Step 48998: {'lr': 0.0001989144604987969, 'samples': 1567936, 'steps': 3062, 'loss/train': 0.8024198412895203} -09/21/2021 01:06:04 - INFO - __main__ - Step 48999: {'lr': 0.0001989144604987969, 'samples': 1567968, 'steps': 3062, 'loss/train': 0.7012138962745667} -09/21/2021 01:06:04 - INFO - __main__ - Step 49000: {'lr': 0.0001989144604987969, 'samples': 1568000, 'steps': 3062, 'loss/train': 0.7556707262992859} -09/21/2021 01:06:05 - INFO - __main__ - Step 49001: {'lr': 0.0001989144604987969, 'samples': 1568032, 'steps': 3062, 'loss/train': 1.019164800643921} -09/21/2021 01:06:06 - INFO - __main__ - Step 49002: {'lr': 0.0001989144604987969, 'samples': 1568064, 'steps': 3062, 'loss/train': 1.1696743965148926} -09/21/2021 01:06:07 - INFO - __main__ - Step 49003: {'lr': 0.0001989144604987969, 'samples': 1568096, 'steps': 3062, 'loss/train': 1.1065834760665894} -09/21/2021 01:06:07 - INFO - __main__ - Step 49004: {'lr': 0.0001989144604987969, 'samples': 1568128, 'steps': 3062, 'loss/train': 0.7522376775741577} -09/21/2021 01:06:08 - INFO - __main__ - Step 49005: {'lr': 0.0001989144604987969, 'samples': 1568160, 'steps': 3062, 'loss/train': 0.882611095905304} -09/21/2021 01:06:09 - INFO - __main__ - Step 49006: {'lr': 0.0001989144604987969, 'samples': 1568192, 'steps': 3062, 'loss/train': 0.8760629892349243} -09/21/2021 01:06:10 - INFO - __main__ - Step 49007: {'lr': 0.0001989144604987969, 'samples': 1568224, 'steps': 3062, 'loss/train': 0.87737637758255} -09/21/2021 01:06:10 - INFO - __main__ - Step 49008: {'lr': 0.0001989144604987969, 'samples': 1568256, 'steps': 3062, 'loss/train': 0.9076058864593506} -09/21/2021 01:06:11 - INFO - __main__ - Step 49009: {'lr': 0.00019891352295220107, 'samples': 1568288, 'steps': 3063, 'loss/train': 0.9057530164718628} -09/21/2021 01:06:12 - INFO - __main__ - Step 49010: {'lr': 0.00019891352295220107, 'samples': 1568320, 'steps': 3063, 'loss/train': 0.9077416658401489} -09/21/2021 01:06:13 - INFO - __main__ - Step 49011: {'lr': 0.00019891352295220107, 'samples': 1568352, 'steps': 3063, 'loss/train': 0.7794804573059082} -09/21/2021 01:06:13 - INFO - __main__ - Step 49012: {'lr': 0.00019891352295220107, 'samples': 1568384, 'steps': 3063, 'loss/train': 0.8001611232757568} -09/21/2021 01:06:14 - INFO - __main__ - Step 49013: {'lr': 0.00019891352295220107, 'samples': 1568416, 'steps': 3063, 'loss/train': 0.7793707847595215} -09/21/2021 01:06:15 - INFO - __main__ - Step 49014: {'lr': 0.00019891352295220107, 'samples': 1568448, 'steps': 3063, 'loss/train': 2.748622179031372} -09/21/2021 01:06:16 - INFO - __main__ - Step 49015: {'lr': 0.00019891352295220107, 'samples': 1568480, 'steps': 3063, 'loss/train': 1.6629048585891724} -09/21/2021 01:06:17 - INFO - __main__ - Step 49016: {'lr': 0.00019891352295220107, 'samples': 1568512, 'steps': 3063, 'loss/train': 0.9343594312667847} -09/21/2021 01:06:18 - INFO - __main__ - Step 49017: {'lr': 0.00019891352295220107, 'samples': 1568544, 'steps': 3063, 'loss/train': 0.3604404032230377} -09/21/2021 01:06:19 - INFO - __main__ - Step 49018: {'lr': 0.00019891352295220107, 'samples': 1568576, 'steps': 3063, 'loss/train': 0.41759926080703735} -09/21/2021 01:06:19 - INFO - __main__ - Step 49019: {'lr': 0.00019891352295220107, 'samples': 1568608, 'steps': 3063, 'loss/train': 1.734925389289856} -09/21/2021 01:06:20 - INFO - __main__ - Step 49020: {'lr': 0.00019891352295220107, 'samples': 1568640, 'steps': 3063, 'loss/train': 1.7193771600723267} -09/21/2021 01:06:21 - INFO - __main__ - Step 49021: {'lr': 0.00019891352295220107, 'samples': 1568672, 'steps': 3063, 'loss/train': 1.6984878778457642} -09/21/2021 01:06:22 - INFO - __main__ - Step 49022: {'lr': 0.00019891352295220107, 'samples': 1568704, 'steps': 3063, 'loss/train': 1.3748706579208374} -09/21/2021 01:06:22 - INFO - __main__ - Step 49023: {'lr': 0.00019891352295220107, 'samples': 1568736, 'steps': 3063, 'loss/train': 1.6848030090332031} -09/21/2021 01:06:23 - INFO - __main__ - Step 49024: {'lr': 0.00019891352295220107, 'samples': 1568768, 'steps': 3063, 'loss/train': 2.0939316749572754} -09/21/2021 01:06:24 - INFO - __main__ - Step 49025: {'lr': 0.00019891258500312652, 'samples': 1568800, 'steps': 3064, 'loss/train': 2.461850166320801} -09/21/2021 01:06:25 - INFO - __main__ - Step 49026: {'lr': 0.00019891258500312652, 'samples': 1568832, 'steps': 3064, 'loss/train': 2.032210111618042} -09/21/2021 01:06:25 - INFO - __main__ - Step 49027: {'lr': 0.00019891258500312652, 'samples': 1568864, 'steps': 3064, 'loss/train': 2.0711781978607178} -09/21/2021 01:06:26 - INFO - __main__ - Step 49028: {'lr': 0.00019891258500312652, 'samples': 1568896, 'steps': 3064, 'loss/train': 1.5677460432052612} -09/21/2021 01:06:27 - INFO - __main__ - Step 49029: {'lr': 0.00019891258500312652, 'samples': 1568928, 'steps': 3064, 'loss/train': 1.8372622728347778} -09/21/2021 01:06:28 - INFO - __main__ - Step 49030: {'lr': 0.00019891258500312652, 'samples': 1568960, 'steps': 3064, 'loss/train': 2.0244193077087402} -09/21/2021 01:06:28 - INFO - __main__ - Step 49031: {'lr': 0.00019891258500312652, 'samples': 1568992, 'steps': 3064, 'loss/train': 2.1619644165039062} -09/21/2021 01:06:29 - INFO - __main__ - Step 49032: {'lr': 0.00019891258500312652, 'samples': 1569024, 'steps': 3064, 'loss/train': 1.967665672302246} -09/21/2021 01:06:30 - INFO - __main__ - Step 49033: {'lr': 0.00019891258500312652, 'samples': 1569056, 'steps': 3064, 'loss/train': 2.478607177734375} -09/21/2021 01:06:31 - INFO - __main__ - Step 49034: {'lr': 0.00019891258500312652, 'samples': 1569088, 'steps': 3064, 'loss/train': 3.8798937797546387} -09/21/2021 01:06:31 - INFO - __main__ - Step 49035: {'lr': 0.00019891258500312652, 'samples': 1569120, 'steps': 3064, 'loss/train': 1.669839859008789} -09/21/2021 01:06:32 - INFO - __main__ - Step 49036: {'lr': 0.00019891258500312652, 'samples': 1569152, 'steps': 3064, 'loss/train': 1.2773748636245728} -09/21/2021 01:06:33 - INFO - __main__ - Step 49037: {'lr': 0.00019891258500312652, 'samples': 1569184, 'steps': 3064, 'loss/train': 1.7013026475906372} -09/21/2021 01:06:34 - INFO - __main__ - Step 49038: {'lr': 0.00019891258500312652, 'samples': 1569216, 'steps': 3064, 'loss/train': 2.436063289642334} -09/21/2021 01:06:34 - INFO - __main__ - Step 49039: {'lr': 0.00019891258500312652, 'samples': 1569248, 'steps': 3064, 'loss/train': 2.7247071266174316} -09/21/2021 01:06:35 - INFO - __main__ - Step 49040: {'lr': 0.00019891258500312652, 'samples': 1569280, 'steps': 3064, 'loss/train': 1.9358892440795898} -09/21/2021 01:06:36 - INFO - __main__ - Step 49041: {'lr': 0.000198911646651577, 'samples': 1569312, 'steps': 3065, 'loss/train': 1.4666069746017456} -09/21/2021 01:06:37 - INFO - __main__ - Step 49042: {'lr': 0.000198911646651577, 'samples': 1569344, 'steps': 3065, 'loss/train': 1.458714485168457} -09/21/2021 01:06:38 - INFO - __main__ - Step 49043: {'lr': 0.000198911646651577, 'samples': 1569376, 'steps': 3065, 'loss/train': 2.104417324066162} -09/21/2021 01:06:38 - INFO - __main__ - Step 49044: {'lr': 0.000198911646651577, 'samples': 1569408, 'steps': 3065, 'loss/train': 1.5302491188049316} -09/21/2021 01:06:39 - INFO - __main__ - Step 49045: {'lr': 0.000198911646651577, 'samples': 1569440, 'steps': 3065, 'loss/train': 0.8637925982475281} -09/21/2021 01:06:40 - INFO - __main__ - Step 49046: {'lr': 0.000198911646651577, 'samples': 1569472, 'steps': 3065, 'loss/train': 0.9794675707817078} -09/21/2021 01:06:41 - INFO - __main__ - Step 49047: {'lr': 0.000198911646651577, 'samples': 1569504, 'steps': 3065, 'loss/train': 0.9109435081481934} -09/21/2021 01:06:42 - INFO - __main__ - Step 49048: {'lr': 0.000198911646651577, 'samples': 1569536, 'steps': 3065, 'loss/train': 0.6719691157341003} -09/21/2021 01:06:43 - INFO - __main__ - Step 49049: {'lr': 0.000198911646651577, 'samples': 1569568, 'steps': 3065, 'loss/train': 2.1477770805358887} -09/21/2021 01:06:43 - INFO - __main__ - Step 49050: {'lr': 0.000198911646651577, 'samples': 1569600, 'steps': 3065, 'loss/train': 0.7649105191230774} -09/21/2021 01:06:44 - INFO - __main__ - Step 49051: {'lr': 0.000198911646651577, 'samples': 1569632, 'steps': 3065, 'loss/train': 2.470005750656128} -09/21/2021 01:06:45 - INFO - __main__ - Step 49052: {'lr': 0.000198911646651577, 'samples': 1569664, 'steps': 3065, 'loss/train': 1.1042466163635254} -09/21/2021 01:06:46 - INFO - __main__ - Step 49053: {'lr': 0.000198911646651577, 'samples': 1569696, 'steps': 3065, 'loss/train': 0.38913625478744507} -09/21/2021 01:06:46 - INFO - __main__ - Step 49054: {'lr': 0.000198911646651577, 'samples': 1569728, 'steps': 3065, 'loss/train': 2.0670359134674072} -09/21/2021 01:06:47 - INFO - __main__ - Step 49055: {'lr': 0.000198911646651577, 'samples': 1569760, 'steps': 3065, 'loss/train': 2.168814182281494} -09/21/2021 01:06:48 - INFO - __main__ - Step 49056: {'lr': 0.000198911646651577, 'samples': 1569792, 'steps': 3065, 'loss/train': 1.207951545715332} -09/21/2021 01:06:49 - INFO - __main__ - Step 49057: {'lr': 0.00019891070789755641, 'samples': 1569824, 'steps': 3066, 'loss/train': 1.0664386749267578} -09/21/2021 01:06:50 - INFO - __main__ - Step 49058: {'lr': 0.00019891070789755641, 'samples': 1569856, 'steps': 3066, 'loss/train': 2.265211820602417} -09/21/2021 01:06:50 - INFO - __main__ - Step 49059: {'lr': 0.00019891070789755641, 'samples': 1569888, 'steps': 3066, 'loss/train': 2.406946897506714} -09/21/2021 01:06:51 - INFO - __main__ - Step 49060: {'lr': 0.00019891070789755641, 'samples': 1569920, 'steps': 3066, 'loss/train': 2.1085240840911865} -09/21/2021 01:06:52 - INFO - __main__ - Step 49061: {'lr': 0.00019891070789755641, 'samples': 1569952, 'steps': 3066, 'loss/train': 1.452200174331665} -09/21/2021 01:06:53 - INFO - __main__ - Step 49062: {'lr': 0.00019891070789755641, 'samples': 1569984, 'steps': 3066, 'loss/train': 1.6669868230819702} -09/21/2021 01:06:53 - INFO - __main__ - Step 49063: {'lr': 0.00019891070789755641, 'samples': 1570016, 'steps': 3066, 'loss/train': 2.0544936656951904} -09/21/2021 01:06:54 - INFO - __main__ - Step 49064: {'lr': 0.00019891070789755641, 'samples': 1570048, 'steps': 3066, 'loss/train': 1.3863046169281006} -09/21/2021 01:06:55 - INFO - __main__ - Step 49065: {'lr': 0.00019891070789755641, 'samples': 1570080, 'steps': 3066, 'loss/train': 1.6680357456207275} -09/21/2021 01:06:56 - INFO - __main__ - Step 49066: {'lr': 0.00019891070789755641, 'samples': 1570112, 'steps': 3066, 'loss/train': 1.8715323209762573} -09/21/2021 01:06:56 - INFO - __main__ - Step 49067: {'lr': 0.00019891070789755641, 'samples': 1570144, 'steps': 3066, 'loss/train': 1.3336673974990845} -09/21/2021 01:06:57 - INFO - __main__ - Step 49068: {'lr': 0.00019891070789755641, 'samples': 1570176, 'steps': 3066, 'loss/train': 1.5865530967712402} -09/21/2021 01:06:58 - INFO - __main__ - Step 49069: {'lr': 0.00019891070789755641, 'samples': 1570208, 'steps': 3066, 'loss/train': 1.6453619003295898} -09/21/2021 01:06:59 - INFO - __main__ - Step 49070: {'lr': 0.00019891070789755641, 'samples': 1570240, 'steps': 3066, 'loss/train': 2.6759934425354004} -09/21/2021 01:06:59 - INFO - __main__ - Step 49071: {'lr': 0.00019891070789755641, 'samples': 1570272, 'steps': 3066, 'loss/train': 1.407789945602417} -09/21/2021 01:07:00 - INFO - __main__ - Step 49072: {'lr': 0.00019891070789755641, 'samples': 1570304, 'steps': 3066, 'loss/train': 1.0540146827697754} -09/21/2021 01:07:01 - INFO - __main__ - Step 49073: {'lr': 0.0001989097687410685, 'samples': 1570336, 'steps': 3067, 'loss/train': 1.546940565109253} -09/21/2021 01:07:02 - INFO - __main__ - Step 49074: {'lr': 0.0001989097687410685, 'samples': 1570368, 'steps': 3067, 'loss/train': 2.0503897666931152} -09/21/2021 01:07:02 - INFO - __main__ - Step 49075: {'lr': 0.0001989097687410685, 'samples': 1570400, 'steps': 3067, 'loss/train': 1.345644474029541} -09/21/2021 01:07:03 - INFO - __main__ - Step 49076: {'lr': 0.0001989097687410685, 'samples': 1570432, 'steps': 3067, 'loss/train': 2.814913272857666} -09/21/2021 01:07:04 - INFO - __main__ - Step 49077: {'lr': 0.0001989097687410685, 'samples': 1570464, 'steps': 3067, 'loss/train': 2.6912031173706055} -09/21/2021 01:07:05 - INFO - __main__ - Step 49078: {'lr': 0.0001989097687410685, 'samples': 1570496, 'steps': 3067, 'loss/train': 1.9026850461959839} -09/21/2021 01:07:06 - INFO - __main__ - Step 49079: {'lr': 0.0001989097687410685, 'samples': 1570528, 'steps': 3067, 'loss/train': 1.6774564981460571} -09/21/2021 01:07:07 - INFO - __main__ - Step 49080: {'lr': 0.0001989097687410685, 'samples': 1570560, 'steps': 3067, 'loss/train': 2.344212532043457} -09/21/2021 01:07:07 - INFO - __main__ - Step 49081: {'lr': 0.0001989097687410685, 'samples': 1570592, 'steps': 3067, 'loss/train': 2.4086012840270996} -09/21/2021 01:07:08 - INFO - __main__ - Step 49082: {'lr': 0.0001989097687410685, 'samples': 1570624, 'steps': 3067, 'loss/train': 1.7805876731872559} -09/21/2021 01:07:09 - INFO - __main__ - Step 49083: {'lr': 0.0001989097687410685, 'samples': 1570656, 'steps': 3067, 'loss/train': 1.7380791902542114} -09/21/2021 01:07:10 - INFO - __main__ - Step 49084: {'lr': 0.0001989097687410685, 'samples': 1570688, 'steps': 3067, 'loss/train': 1.5141973495483398} -09/21/2021 01:07:10 - INFO - __main__ - Step 49085: {'lr': 0.0001989097687410685, 'samples': 1570720, 'steps': 3067, 'loss/train': 2.298165798187256} -09/21/2021 01:07:11 - INFO - __main__ - Step 49086: {'lr': 0.0001989097687410685, 'samples': 1570752, 'steps': 3067, 'loss/train': 1.564387321472168} -09/21/2021 01:07:12 - INFO - __main__ - Step 49087: {'lr': 0.0001989097687410685, 'samples': 1570784, 'steps': 3067, 'loss/train': 1.8330270051956177} -09/21/2021 01:07:13 - INFO - __main__ - Step 49088: {'lr': 0.0001989097687410685, 'samples': 1570816, 'steps': 3067, 'loss/train': 3.0807411670684814} -09/21/2021 01:07:14 - INFO - __main__ - Step 49089: {'lr': 0.00019890882918211715, 'samples': 1570848, 'steps': 3068, 'loss/train': 2.0864858627319336} -09/21/2021 01:07:14 - INFO - __main__ - Step 49090: {'lr': 0.00019890882918211715, 'samples': 1570880, 'steps': 3068, 'loss/train': 0.46861040592193604} -09/21/2021 01:07:15 - INFO - __main__ - Step 49091: {'lr': 0.00019890882918211715, 'samples': 1570912, 'steps': 3068, 'loss/train': 2.701913356781006} -09/21/2021 01:07:16 - INFO - __main__ - Step 49092: {'lr': 0.00019890882918211715, 'samples': 1570944, 'steps': 3068, 'loss/train': 2.3432981967926025} -09/21/2021 01:07:17 - INFO - __main__ - Step 49093: {'lr': 0.00019890882918211715, 'samples': 1570976, 'steps': 3068, 'loss/train': 0.4124363958835602} -09/21/2021 01:07:17 - INFO - __main__ - Step 49094: {'lr': 0.00019890882918211715, 'samples': 1571008, 'steps': 3068, 'loss/train': 2.549635648727417} -09/21/2021 01:07:18 - INFO - __main__ - Step 49095: {'lr': 0.00019890882918211715, 'samples': 1571040, 'steps': 3068, 'loss/train': 2.0715017318725586} -09/21/2021 01:07:19 - INFO - __main__ - Step 49096: {'lr': 0.00019890882918211715, 'samples': 1571072, 'steps': 3068, 'loss/train': 3.182750701904297} -09/21/2021 01:07:20 - INFO - __main__ - Step 49097: {'lr': 0.00019890882918211715, 'samples': 1571104, 'steps': 3068, 'loss/train': 1.8437151908874512} -09/21/2021 01:07:20 - INFO - __main__ - Step 49098: {'lr': 0.00019890882918211715, 'samples': 1571136, 'steps': 3068, 'loss/train': 2.1985719203948975} -09/21/2021 01:07:21 - INFO - __main__ - Step 49099: {'lr': 0.00019890882918211715, 'samples': 1571168, 'steps': 3068, 'loss/train': 1.447354793548584} -09/21/2021 01:07:22 - INFO - __main__ - Step 49100: {'lr': 0.00019890882918211715, 'samples': 1571200, 'steps': 3068, 'loss/train': 2.4804422855377197} -09/21/2021 01:07:23 - INFO - __main__ - Step 49101: {'lr': 0.00019890882918211715, 'samples': 1571232, 'steps': 3068, 'loss/train': 2.3856654167175293} -09/21/2021 01:07:23 - INFO - __main__ - Step 49102: {'lr': 0.00019890882918211715, 'samples': 1571264, 'steps': 3068, 'loss/train': 2.991438865661621} -09/21/2021 01:07:24 - INFO - __main__ - Step 49103: {'lr': 0.00019890882918211715, 'samples': 1571296, 'steps': 3068, 'loss/train': 1.8713202476501465} -09/21/2021 01:07:25 - INFO - __main__ - Step 49104: {'lr': 0.00019890882918211715, 'samples': 1571328, 'steps': 3068, 'loss/train': 1.3500211238861084} -09/21/2021 01:07:26 - INFO - __main__ - Step 49105: {'lr': 0.00019890788922070617, 'samples': 1571360, 'steps': 3069, 'loss/train': 1.6824814081192017} -09/21/2021 01:07:26 - INFO - __main__ - Step 49106: {'lr': 0.00019890788922070617, 'samples': 1571392, 'steps': 3069, 'loss/train': 0.6808580756187439} -09/21/2021 01:07:27 - INFO - __main__ - Step 49107: {'lr': 0.00019890788922070617, 'samples': 1571424, 'steps': 3069, 'loss/train': 1.8452131748199463} -09/21/2021 01:07:28 - INFO - __main__ - Step 49108: {'lr': 0.00019890788922070617, 'samples': 1571456, 'steps': 3069, 'loss/train': 1.534619927406311} -09/21/2021 01:07:29 - INFO - __main__ - Step 49109: {'lr': 0.00019890788922070617, 'samples': 1571488, 'steps': 3069, 'loss/train': 1.596219539642334} -09/21/2021 01:07:31 - INFO - __main__ - Step 49110: {'lr': 0.00019890788922070617, 'samples': 1571520, 'steps': 3069, 'loss/train': 1.6344172954559326} -09/21/2021 01:07:31 - INFO - __main__ - Step 49111: {'lr': 0.00019890788922070617, 'samples': 1571552, 'steps': 3069, 'loss/train': 0.89619380235672} -09/21/2021 01:07:32 - INFO - __main__ - Step 49112: {'lr': 0.00019890788922070617, 'samples': 1571584, 'steps': 3069, 'loss/train': 1.2585793733596802} -09/21/2021 01:07:33 - INFO - __main__ - Step 49113: {'lr': 0.00019890788922070617, 'samples': 1571616, 'steps': 3069, 'loss/train': 2.0027787685394287} -09/21/2021 01:07:34 - INFO - __main__ - Step 49114: {'lr': 0.00019890788922070617, 'samples': 1571648, 'steps': 3069, 'loss/train': 1.971976399421692} -09/21/2021 01:07:34 - INFO - __main__ - Step 49115: {'lr': 0.00019890788922070617, 'samples': 1571680, 'steps': 3069, 'loss/train': 2.272075653076172} -09/21/2021 01:07:35 - INFO - __main__ - Step 49116: {'lr': 0.00019890788922070617, 'samples': 1571712, 'steps': 3069, 'loss/train': 2.7485835552215576} -09/21/2021 01:07:36 - INFO - __main__ - Step 49117: {'lr': 0.00019890788922070617, 'samples': 1571744, 'steps': 3069, 'loss/train': 2.2696807384490967} -09/21/2021 01:07:37 - INFO - __main__ - Step 49118: {'lr': 0.00019890788922070617, 'samples': 1571776, 'steps': 3069, 'loss/train': 2.100651979446411} -09/21/2021 01:07:37 - INFO - __main__ - Step 49119: {'lr': 0.00019890788922070617, 'samples': 1571808, 'steps': 3069, 'loss/train': 0.9634273052215576} -09/21/2021 01:07:38 - INFO - __main__ - Step 49120: {'lr': 0.00019890788922070617, 'samples': 1571840, 'steps': 3069, 'loss/train': 2.108553409576416} -09/21/2021 01:07:39 - INFO - __main__ - Step 49121: {'lr': 0.00019890694885683937, 'samples': 1571872, 'steps': 3070, 'loss/train': 1.7264105081558228} -09/21/2021 01:07:40 - INFO - __main__ - Step 49122: {'lr': 0.00019890694885683937, 'samples': 1571904, 'steps': 3070, 'loss/train': 2.1581943035125732} -09/21/2021 01:07:40 - INFO - __main__ - Step 49123: {'lr': 0.00019890694885683937, 'samples': 1571936, 'steps': 3070, 'loss/train': 1.4095255136489868} -09/21/2021 01:07:41 - INFO - __main__ - Step 49124: {'lr': 0.00019890694885683937, 'samples': 1571968, 'steps': 3070, 'loss/train': 0.40183043479919434} -09/21/2021 01:07:42 - INFO - __main__ - Step 49125: {'lr': 0.00019890694885683937, 'samples': 1572000, 'steps': 3070, 'loss/train': 1.9926671981811523} -09/21/2021 01:07:43 - INFO - __main__ - Step 49126: {'lr': 0.00019890694885683937, 'samples': 1572032, 'steps': 3070, 'loss/train': 1.6962049007415771} -09/21/2021 01:07:43 - INFO - __main__ - Step 49127: {'lr': 0.00019890694885683937, 'samples': 1572064, 'steps': 3070, 'loss/train': 1.8696534633636475} -09/21/2021 01:07:44 - INFO - __main__ - Step 49128: {'lr': 0.00019890694885683937, 'samples': 1572096, 'steps': 3070, 'loss/train': 1.094985008239746} -09/21/2021 01:07:45 - INFO - __main__ - Step 49129: {'lr': 0.00019890694885683937, 'samples': 1572128, 'steps': 3070, 'loss/train': 2.264446973800659} -09/21/2021 01:07:46 - INFO - __main__ - Step 49130: {'lr': 0.00019890694885683937, 'samples': 1572160, 'steps': 3070, 'loss/train': 2.6161632537841797} -09/21/2021 01:07:46 - INFO - __main__ - Step 49131: {'lr': 0.00019890694885683937, 'samples': 1572192, 'steps': 3070, 'loss/train': 1.8653210401535034} -09/21/2021 01:07:47 - INFO - __main__ - Step 49132: {'lr': 0.00019890694885683937, 'samples': 1572224, 'steps': 3070, 'loss/train': 1.2936797142028809} -09/21/2021 01:07:48 - INFO - __main__ - Step 49133: {'lr': 0.00019890694885683937, 'samples': 1572256, 'steps': 3070, 'loss/train': 2.528961181640625} -09/21/2021 01:07:49 - INFO - __main__ - Step 49134: {'lr': 0.00019890694885683937, 'samples': 1572288, 'steps': 3070, 'loss/train': 2.6918294429779053} -09/21/2021 01:07:49 - INFO - __main__ - Step 49135: {'lr': 0.00019890694885683937, 'samples': 1572320, 'steps': 3070, 'loss/train': 2.3341569900512695} -09/21/2021 01:07:50 - INFO - __main__ - Step 49136: {'lr': 0.00019890694885683937, 'samples': 1572352, 'steps': 3070, 'loss/train': 1.5282628536224365} -09/21/2021 01:07:51 - INFO - __main__ - Step 49137: {'lr': 0.00019890600809052055, 'samples': 1572384, 'steps': 3071, 'loss/train': 2.119361162185669} -09/21/2021 01:07:52 - INFO - __main__ - Step 49138: {'lr': 0.00019890600809052055, 'samples': 1572416, 'steps': 3071, 'loss/train': 2.7856171131134033} -09/21/2021 01:07:53 - INFO - __main__ - Step 49139: {'lr': 0.00019890600809052055, 'samples': 1572448, 'steps': 3071, 'loss/train': 1.4294657707214355} -09/21/2021 01:07:53 - INFO - __main__ - Step 49140: {'lr': 0.00019890600809052055, 'samples': 1572480, 'steps': 3071, 'loss/train': 1.8163374662399292} -09/21/2021 01:07:55 - INFO - __main__ - Step 49141: {'lr': 0.00019890600809052055, 'samples': 1572512, 'steps': 3071, 'loss/train': 1.9530999660491943} -09/21/2021 01:07:55 - INFO - __main__ - Step 49142: {'lr': 0.00019890600809052055, 'samples': 1572544, 'steps': 3071, 'loss/train': 1.7711601257324219} -09/21/2021 01:07:56 - INFO - __main__ - Step 49143: {'lr': 0.00019890600809052055, 'samples': 1572576, 'steps': 3071, 'loss/train': 1.5904099941253662} -09/21/2021 01:07:57 - INFO - __main__ - Step 49144: {'lr': 0.00019890600809052055, 'samples': 1572608, 'steps': 3071, 'loss/train': 3.1259303092956543} -09/21/2021 01:07:58 - INFO - __main__ - Step 49145: {'lr': 0.00019890600809052055, 'samples': 1572640, 'steps': 3071, 'loss/train': 1.5026731491088867} -09/21/2021 01:07:58 - INFO - __main__ - Step 49146: {'lr': 0.00019890600809052055, 'samples': 1572672, 'steps': 3071, 'loss/train': 1.1229870319366455} -09/21/2021 01:07:59 - INFO - __main__ - Step 49147: {'lr': 0.00019890600809052055, 'samples': 1572704, 'steps': 3071, 'loss/train': 1.268630027770996} -09/21/2021 01:08:00 - INFO - __main__ - Step 49148: {'lr': 0.00019890600809052055, 'samples': 1572736, 'steps': 3071, 'loss/train': 1.794726848602295} -09/21/2021 01:08:01 - INFO - __main__ - Step 49149: {'lr': 0.00019890600809052055, 'samples': 1572768, 'steps': 3071, 'loss/train': 1.6815059185028076} -09/21/2021 01:08:01 - INFO - __main__ - Step 49150: {'lr': 0.00019890600809052055, 'samples': 1572800, 'steps': 3071, 'loss/train': 1.3053213357925415} -09/21/2021 01:08:02 - INFO - __main__ - Step 49151: {'lr': 0.00019890600809052055, 'samples': 1572832, 'steps': 3071, 'loss/train': 2.233527660369873} -09/21/2021 01:08:03 - INFO - __main__ - Step 49152: {'lr': 0.00019890600809052055, 'samples': 1572864, 'steps': 3071, 'loss/train': 2.8356235027313232} -09/21/2021 01:08:04 - INFO - __main__ - Step 49153: {'lr': 0.0001989050669217536, 'samples': 1572896, 'steps': 3072, 'loss/train': 1.6114264726638794} -09/21/2021 01:08:04 - INFO - __main__ - Step 49154: {'lr': 0.0001989050669217536, 'samples': 1572928, 'steps': 3072, 'loss/train': 1.9972532987594604} -09/21/2021 01:08:05 - INFO - __main__ - Step 49155: {'lr': 0.0001989050669217536, 'samples': 1572960, 'steps': 3072, 'loss/train': 2.70499587059021} -09/21/2021 01:08:06 - INFO - __main__ - Step 49156: {'lr': 0.0001989050669217536, 'samples': 1572992, 'steps': 3072, 'loss/train': 1.7062064409255981} -09/21/2021 01:08:07 - INFO - __main__ - Step 49157: {'lr': 0.0001989050669217536, 'samples': 1573024, 'steps': 3072, 'loss/train': 2.134737491607666} -09/21/2021 01:08:07 - INFO - __main__ - Step 49158: {'lr': 0.0001989050669217536, 'samples': 1573056, 'steps': 3072, 'loss/train': 0.33406373858451843} -09/21/2021 01:08:08 - INFO - __main__ - Step 49159: {'lr': 0.0001989050669217536, 'samples': 1573088, 'steps': 3072, 'loss/train': 2.302217483520508} -09/21/2021 01:08:09 - INFO - __main__ - Step 49160: {'lr': 0.0001989050669217536, 'samples': 1573120, 'steps': 3072, 'loss/train': 2.771975517272949} -09/21/2021 01:08:10 - INFO - __main__ - Step 49161: {'lr': 0.0001989050669217536, 'samples': 1573152, 'steps': 3072, 'loss/train': 1.4345945119857788} -09/21/2021 01:08:10 - INFO - __main__ - Step 49162: {'lr': 0.0001989050669217536, 'samples': 1573184, 'steps': 3072, 'loss/train': 1.8726357221603394} -09/21/2021 01:08:11 - INFO - __main__ - Step 49163: {'lr': 0.0001989050669217536, 'samples': 1573216, 'steps': 3072, 'loss/train': 2.561286211013794} -09/21/2021 01:08:12 - INFO - __main__ - Step 49164: {'lr': 0.0001989050669217536, 'samples': 1573248, 'steps': 3072, 'loss/train': 0.30670639872550964} -09/21/2021 01:08:13 - INFO - __main__ - Step 49165: {'lr': 0.0001989050669217536, 'samples': 1573280, 'steps': 3072, 'loss/train': 2.0526959896087646} -09/21/2021 01:08:13 - INFO - __main__ - Step 49166: {'lr': 0.0001989050669217536, 'samples': 1573312, 'steps': 3072, 'loss/train': 2.3882253170013428} -09/21/2021 01:08:14 - INFO - __main__ - Step 49167: {'lr': 0.0001989050669217536, 'samples': 1573344, 'steps': 3072, 'loss/train': 1.679928183555603} -09/21/2021 01:08:15 - INFO - __main__ - Step 49168: {'lr': 0.0001989050669217536, 'samples': 1573376, 'steps': 3072, 'loss/train': 2.229161024093628} -09/21/2021 01:08:16 - INFO - __main__ - Step 49169: {'lr': 0.00019890412535054227, 'samples': 1573408, 'steps': 3073, 'loss/train': 1.4060624837875366} -09/21/2021 01:08:17 - INFO - __main__ - Step 49170: {'lr': 0.00019890412535054227, 'samples': 1573440, 'steps': 3073, 'loss/train': 2.290374279022217} -09/21/2021 01:08:18 - INFO - __main__ - Step 49171: {'lr': 0.00019890412535054227, 'samples': 1573472, 'steps': 3073, 'loss/train': 1.274185061454773} -09/21/2021 01:08:19 - INFO - __main__ - Step 49172: {'lr': 0.00019890412535054227, 'samples': 1573504, 'steps': 3073, 'loss/train': 1.7829262018203735} -09/21/2021 01:08:19 - INFO - __main__ - Step 49173: {'lr': 0.00019890412535054227, 'samples': 1573536, 'steps': 3073, 'loss/train': 1.8883216381072998} -09/21/2021 01:08:20 - INFO - __main__ - Step 49174: {'lr': 0.00019890412535054227, 'samples': 1573568, 'steps': 3073, 'loss/train': 2.692335844039917} -09/21/2021 01:08:21 - INFO - __main__ - Step 49175: {'lr': 0.00019890412535054227, 'samples': 1573600, 'steps': 3073, 'loss/train': 2.9344658851623535} -09/21/2021 01:08:22 - INFO - __main__ - Step 49176: {'lr': 0.00019890412535054227, 'samples': 1573632, 'steps': 3073, 'loss/train': 2.0414435863494873} -09/21/2021 01:08:22 - INFO - __main__ - Step 49177: {'lr': 0.00019890412535054227, 'samples': 1573664, 'steps': 3073, 'loss/train': 0.2751642167568207} -09/21/2021 01:08:23 - INFO - __main__ - Step 49178: {'lr': 0.00019890412535054227, 'samples': 1573696, 'steps': 3073, 'loss/train': 1.9896959066390991} -09/21/2021 01:08:24 - INFO - __main__ - Step 49179: {'lr': 0.00019890412535054227, 'samples': 1573728, 'steps': 3073, 'loss/train': 1.851013422012329} -09/21/2021 01:08:25 - INFO - __main__ - Step 49180: {'lr': 0.00019890412535054227, 'samples': 1573760, 'steps': 3073, 'loss/train': 2.582336664199829} -09/21/2021 01:08:25 - INFO - __main__ - Step 49181: {'lr': 0.00019890412535054227, 'samples': 1573792, 'steps': 3073, 'loss/train': 1.6228346824645996} -09/21/2021 01:08:26 - INFO - __main__ - Step 49182: {'lr': 0.00019890412535054227, 'samples': 1573824, 'steps': 3073, 'loss/train': 0.9985591173171997} -09/21/2021 01:08:27 - INFO - __main__ - Step 49183: {'lr': 0.00019890412535054227, 'samples': 1573856, 'steps': 3073, 'loss/train': 1.1229314804077148} -09/21/2021 01:08:28 - INFO - __main__ - Step 49184: {'lr': 0.00019890412535054227, 'samples': 1573888, 'steps': 3073, 'loss/train': 2.025038242340088} -09/21/2021 01:08:28 - INFO - __main__ - Step 49185: {'lr': 0.00019890318337689047, 'samples': 1573920, 'steps': 3074, 'loss/train': 2.016986608505249} -09/21/2021 01:08:29 - INFO - __main__ - Step 49186: {'lr': 0.00019890318337689047, 'samples': 1573952, 'steps': 3074, 'loss/train': 1.5715551376342773} -09/21/2021 01:08:30 - INFO - __main__ - Step 49187: {'lr': 0.00019890318337689047, 'samples': 1573984, 'steps': 3074, 'loss/train': 1.7391328811645508} -09/21/2021 01:08:31 - INFO - __main__ - Step 49188: {'lr': 0.00019890318337689047, 'samples': 1574016, 'steps': 3074, 'loss/train': 1.7889000177383423} -09/21/2021 01:08:31 - INFO - __main__ - Step 49189: {'lr': 0.00019890318337689047, 'samples': 1574048, 'steps': 3074, 'loss/train': 2.166377544403076} -09/21/2021 01:08:32 - INFO - __main__ - Step 49190: {'lr': 0.00019890318337689047, 'samples': 1574080, 'steps': 3074, 'loss/train': 2.6206045150756836} -09/21/2021 01:08:33 - INFO - __main__ - Step 49191: {'lr': 0.00019890318337689047, 'samples': 1574112, 'steps': 3074, 'loss/train': 1.6866241693496704} -09/21/2021 01:08:34 - INFO - __main__ - Step 49192: {'lr': 0.00019890318337689047, 'samples': 1574144, 'steps': 3074, 'loss/train': 1.8419239521026611} -09/21/2021 01:08:34 - INFO - __main__ - Step 49193: {'lr': 0.00019890318337689047, 'samples': 1574176, 'steps': 3074, 'loss/train': 1.4971997737884521} -09/21/2021 01:08:35 - INFO - __main__ - Step 49194: {'lr': 0.00019890318337689047, 'samples': 1574208, 'steps': 3074, 'loss/train': 2.542888641357422} -09/21/2021 01:08:36 - INFO - __main__ - Step 49195: {'lr': 0.00019890318337689047, 'samples': 1574240, 'steps': 3074, 'loss/train': 2.2982888221740723} -09/21/2021 01:08:37 - INFO - __main__ - Step 49196: {'lr': 0.00019890318337689047, 'samples': 1574272, 'steps': 3074, 'loss/train': 1.866031289100647} -09/21/2021 01:08:37 - INFO - __main__ - Step 49197: {'lr': 0.00019890318337689047, 'samples': 1574304, 'steps': 3074, 'loss/train': 1.6665116548538208} -09/21/2021 01:08:38 - INFO - __main__ - Step 49198: {'lr': 0.00019890318337689047, 'samples': 1574336, 'steps': 3074, 'loss/train': 2.4890365600585938} -09/21/2021 01:08:39 - INFO - __main__ - Step 49199: {'lr': 0.00019890318337689047, 'samples': 1574368, 'steps': 3074, 'loss/train': 1.7071387767791748} -09/21/2021 01:08:40 - INFO - __main__ - Step 49200: {'lr': 0.00019890318337689047, 'samples': 1574400, 'steps': 3074, 'loss/train': 0.5964953899383545} -09/21/2021 01:08:41 - INFO - __main__ - Step 49201: {'lr': 0.00019890224100080198, 'samples': 1574432, 'steps': 3075, 'loss/train': 1.596996784210205} -09/21/2021 01:08:42 - INFO - __main__ - Step 49202: {'lr': 0.00019890224100080198, 'samples': 1574464, 'steps': 3075, 'loss/train': 2.218547821044922} -09/21/2021 01:08:43 - INFO - __main__ - Step 49203: {'lr': 0.00019890224100080198, 'samples': 1574496, 'steps': 3075, 'loss/train': 2.188422679901123} -09/21/2021 01:08:43 - INFO - __main__ - Step 49204: {'lr': 0.00019890224100080198, 'samples': 1574528, 'steps': 3075, 'loss/train': 2.5133838653564453} -09/21/2021 01:08:44 - INFO - __main__ - Step 49205: {'lr': 0.00019890224100080198, 'samples': 1574560, 'steps': 3075, 'loss/train': 1.0500203371047974} -09/21/2021 01:08:45 - INFO - __main__ - Step 49206: {'lr': 0.00019890224100080198, 'samples': 1574592, 'steps': 3075, 'loss/train': 1.2251105308532715} -09/21/2021 01:08:46 - INFO - __main__ - Step 49207: {'lr': 0.00019890224100080198, 'samples': 1574624, 'steps': 3075, 'loss/train': 2.7581992149353027} -09/21/2021 01:08:46 - INFO - __main__ - Step 49208: {'lr': 0.00019890224100080198, 'samples': 1574656, 'steps': 3075, 'loss/train': 2.6644976139068604} -09/21/2021 01:08:47 - INFO - __main__ - Step 49209: {'lr': 0.00019890224100080198, 'samples': 1574688, 'steps': 3075, 'loss/train': 2.170027494430542} -09/21/2021 01:08:48 - INFO - __main__ - Step 49210: {'lr': 0.00019890224100080198, 'samples': 1574720, 'steps': 3075, 'loss/train': 1.4006086587905884} -09/21/2021 01:08:49 - INFO - __main__ - Step 49211: {'lr': 0.00019890224100080198, 'samples': 1574752, 'steps': 3075, 'loss/train': 2.334583044052124} -09/21/2021 01:08:49 - INFO - __main__ - Step 49212: {'lr': 0.00019890224100080198, 'samples': 1574784, 'steps': 3075, 'loss/train': 1.922035813331604} -09/21/2021 01:08:50 - INFO - __main__ - Step 49213: {'lr': 0.00019890224100080198, 'samples': 1574816, 'steps': 3075, 'loss/train': 1.5475425720214844} -09/21/2021 01:08:51 - INFO - __main__ - Step 49214: {'lr': 0.00019890224100080198, 'samples': 1574848, 'steps': 3075, 'loss/train': 1.120805025100708} -09/21/2021 01:08:52 - INFO - __main__ - Step 49215: {'lr': 0.00019890224100080198, 'samples': 1574880, 'steps': 3075, 'loss/train': 2.6764976978302} -09/21/2021 01:08:52 - INFO - __main__ - Step 49216: {'lr': 0.00019890224100080198, 'samples': 1574912, 'steps': 3075, 'loss/train': 2.6497740745544434} -09/21/2021 01:08:53 - INFO - __main__ - Step 49217: {'lr': 0.0001989012982222807, 'samples': 1574944, 'steps': 3076, 'loss/train': 2.7652835845947266} -09/21/2021 01:08:54 - INFO - __main__ - Step 49218: {'lr': 0.0001989012982222807, 'samples': 1574976, 'steps': 3076, 'loss/train': 2.682170867919922} -09/21/2021 01:08:55 - INFO - __main__ - Step 49219: {'lr': 0.0001989012982222807, 'samples': 1575008, 'steps': 3076, 'loss/train': 2.797546625137329} -09/21/2021 01:08:56 - INFO - __main__ - Step 49220: {'lr': 0.0001989012982222807, 'samples': 1575040, 'steps': 3076, 'loss/train': 2.2378036975860596} -09/21/2021 01:08:56 - INFO - __main__ - Step 49221: {'lr': 0.0001989012982222807, 'samples': 1575072, 'steps': 3076, 'loss/train': 2.84684157371521} -09/21/2021 01:08:57 - INFO - __main__ - Step 49222: {'lr': 0.0001989012982222807, 'samples': 1575104, 'steps': 3076, 'loss/train': 2.547701597213745} -09/21/2021 01:08:58 - INFO - __main__ - Step 49223: {'lr': 0.0001989012982222807, 'samples': 1575136, 'steps': 3076, 'loss/train': 1.7820545434951782} -09/21/2021 01:08:59 - INFO - __main__ - Step 49224: {'lr': 0.0001989012982222807, 'samples': 1575168, 'steps': 3076, 'loss/train': 1.34065842628479} -09/21/2021 01:08:59 - INFO - __main__ - Step 49225: {'lr': 0.0001989012982222807, 'samples': 1575200, 'steps': 3076, 'loss/train': 1.6148152351379395} -09/21/2021 01:09:00 - INFO - __main__ - Step 49226: {'lr': 0.0001989012982222807, 'samples': 1575232, 'steps': 3076, 'loss/train': 2.293854236602783} -09/21/2021 01:09:01 - INFO - __main__ - Step 49227: {'lr': 0.0001989012982222807, 'samples': 1575264, 'steps': 3076, 'loss/train': 2.221907377243042} -09/21/2021 01:09:02 - INFO - __main__ - Step 49228: {'lr': 0.0001989012982222807, 'samples': 1575296, 'steps': 3076, 'loss/train': 1.9426794052124023} -09/21/2021 01:09:02 - INFO - __main__ - Step 49229: {'lr': 0.0001989012982222807, 'samples': 1575328, 'steps': 3076, 'loss/train': 1.5517055988311768} -09/21/2021 01:09:03 - INFO - __main__ - Step 49230: {'lr': 0.0001989012982222807, 'samples': 1575360, 'steps': 3076, 'loss/train': 1.2316900491714478} -09/21/2021 01:09:04 - INFO - __main__ - Step 49231: {'lr': 0.0001989012982222807, 'samples': 1575392, 'steps': 3076, 'loss/train': 1.921964168548584} -09/21/2021 01:09:05 - INFO - __main__ - Step 49232: {'lr': 0.0001989012982222807, 'samples': 1575424, 'steps': 3076, 'loss/train': 2.009887456893921} -09/21/2021 01:09:06 - INFO - __main__ - Step 49233: {'lr': 0.00019890035504133038, 'samples': 1575456, 'steps': 3077, 'loss/train': 2.246720790863037} -09/21/2021 01:09:07 - INFO - __main__ - Step 49234: {'lr': 0.00019890035504133038, 'samples': 1575488, 'steps': 3077, 'loss/train': 1.3333345651626587} -09/21/2021 01:09:07 - INFO - __main__ - Step 49235: {'lr': 0.00019890035504133038, 'samples': 1575520, 'steps': 3077, 'loss/train': 1.6022884845733643} -09/21/2021 01:09:08 - INFO - __main__ - Step 49236: {'lr': 0.00019890035504133038, 'samples': 1575552, 'steps': 3077, 'loss/train': 2.219236373901367} -09/21/2021 01:09:09 - INFO - __main__ - Step 49237: {'lr': 0.00019890035504133038, 'samples': 1575584, 'steps': 3077, 'loss/train': 2.4290740489959717} -09/21/2021 01:09:10 - INFO - __main__ - Step 49238: {'lr': 0.00019890035504133038, 'samples': 1575616, 'steps': 3077, 'loss/train': 1.4845850467681885} -09/21/2021 01:09:10 - INFO - __main__ - Step 49239: {'lr': 0.00019890035504133038, 'samples': 1575648, 'steps': 3077, 'loss/train': 2.7311525344848633} -09/21/2021 01:09:11 - INFO - __main__ - Step 49240: {'lr': 0.00019890035504133038, 'samples': 1575680, 'steps': 3077, 'loss/train': 2.776212453842163} -09/21/2021 01:09:12 - INFO - __main__ - Step 49241: {'lr': 0.00019890035504133038, 'samples': 1575712, 'steps': 3077, 'loss/train': 1.6355040073394775} -09/21/2021 01:09:13 - INFO - __main__ - Step 49242: {'lr': 0.00019890035504133038, 'samples': 1575744, 'steps': 3077, 'loss/train': 1.8035776615142822} -09/21/2021 01:09:13 - INFO - __main__ - Step 49243: {'lr': 0.00019890035504133038, 'samples': 1575776, 'steps': 3077, 'loss/train': 1.9634106159210205} -09/21/2021 01:09:14 - INFO - __main__ - Step 49244: {'lr': 0.00019890035504133038, 'samples': 1575808, 'steps': 3077, 'loss/train': 1.9353986978530884} -09/21/2021 01:09:15 - INFO - __main__ - Step 49245: {'lr': 0.00019890035504133038, 'samples': 1575840, 'steps': 3077, 'loss/train': 2.0717966556549072} -09/21/2021 01:09:16 - INFO - __main__ - Step 49246: {'lr': 0.00019890035504133038, 'samples': 1575872, 'steps': 3077, 'loss/train': 2.4311556816101074} -09/21/2021 01:09:16 - INFO - __main__ - Step 49247: {'lr': 0.00019890035504133038, 'samples': 1575904, 'steps': 3077, 'loss/train': 1.495231032371521} -09/21/2021 01:09:17 - INFO - __main__ - Step 49248: {'lr': 0.00019890035504133038, 'samples': 1575936, 'steps': 3077, 'loss/train': 1.6219373941421509} -09/21/2021 01:09:18 - INFO - __main__ - Step 49249: {'lr': 0.00019889941145795491, 'samples': 1575968, 'steps': 3078, 'loss/train': 0.8825077414512634} -09/21/2021 01:09:19 - INFO - __main__ - Step 49250: {'lr': 0.00019889941145795491, 'samples': 1576000, 'steps': 3078, 'loss/train': 2.3081772327423096} -09/21/2021 01:09:20 - INFO - __main__ - Step 49251: {'lr': 0.00019889941145795491, 'samples': 1576032, 'steps': 3078, 'loss/train': 0.9842280149459839} -09/21/2021 01:09:20 - INFO - __main__ - Step 49252: {'lr': 0.00019889941145795491, 'samples': 1576064, 'steps': 3078, 'loss/train': 2.1553354263305664} -09/21/2021 01:09:21 - INFO - __main__ - Step 49253: {'lr': 0.00019889941145795491, 'samples': 1576096, 'steps': 3078, 'loss/train': 1.2236963510513306} -09/21/2021 01:09:22 - INFO - __main__ - Step 49254: {'lr': 0.00019889941145795491, 'samples': 1576128, 'steps': 3078, 'loss/train': 2.9056403636932373} -09/21/2021 01:09:23 - INFO - __main__ - Step 49255: {'lr': 0.00019889941145795491, 'samples': 1576160, 'steps': 3078, 'loss/train': 2.209434986114502} -09/21/2021 01:09:23 - INFO - __main__ - Step 49256: {'lr': 0.00019889941145795491, 'samples': 1576192, 'steps': 3078, 'loss/train': 2.8319621086120605} -09/21/2021 01:09:24 - INFO - __main__ - Step 49257: {'lr': 0.00019889941145795491, 'samples': 1576224, 'steps': 3078, 'loss/train': 1.7277787923812866} -09/21/2021 01:09:25 - INFO - __main__ - Step 49258: {'lr': 0.00019889941145795491, 'samples': 1576256, 'steps': 3078, 'loss/train': 1.5136975049972534} -09/21/2021 01:09:26 - INFO - __main__ - Step 49259: {'lr': 0.00019889941145795491, 'samples': 1576288, 'steps': 3078, 'loss/train': 1.5249792337417603} -09/21/2021 01:09:26 - INFO - __main__ - Step 49260: {'lr': 0.00019889941145795491, 'samples': 1576320, 'steps': 3078, 'loss/train': 1.0988191366195679} -09/21/2021 01:09:27 - INFO - __main__ - Step 49261: {'lr': 0.00019889941145795491, 'samples': 1576352, 'steps': 3078, 'loss/train': 1.3299918174743652} -09/21/2021 01:09:29 - INFO - __main__ - Step 49262: {'lr': 0.00019889941145795491, 'samples': 1576384, 'steps': 3078, 'loss/train': 1.0853360891342163} -09/21/2021 01:09:29 - INFO - __main__ - Step 49263: {'lr': 0.00019889941145795491, 'samples': 1576416, 'steps': 3078, 'loss/train': 1.8436288833618164} -09/21/2021 01:09:30 - INFO - __main__ - Step 49264: {'lr': 0.00019889941145795491, 'samples': 1576448, 'steps': 3078, 'loss/train': 1.9753773212432861} -09/21/2021 01:09:31 - INFO - __main__ - Step 49265: {'lr': 0.00019889846747215813, 'samples': 1576480, 'steps': 3079, 'loss/train': 1.9683198928833008} -09/21/2021 01:09:32 - INFO - __main__ - Step 49266: {'lr': 0.00019889846747215813, 'samples': 1576512, 'steps': 3079, 'loss/train': 1.9101749658584595} -09/21/2021 01:09:32 - INFO - __main__ - Step 49267: {'lr': 0.00019889846747215813, 'samples': 1576544, 'steps': 3079, 'loss/train': 1.6507973670959473} -09/21/2021 01:09:33 - INFO - __main__ - Step 49268: {'lr': 0.00019889846747215813, 'samples': 1576576, 'steps': 3079, 'loss/train': 1.7734241485595703} -09/21/2021 01:09:34 - INFO - __main__ - Step 49269: {'lr': 0.00019889846747215813, 'samples': 1576608, 'steps': 3079, 'loss/train': 1.199483871459961} -09/21/2021 01:09:35 - INFO - __main__ - Step 49270: {'lr': 0.00019889846747215813, 'samples': 1576640, 'steps': 3079, 'loss/train': 0.9636411070823669} -09/21/2021 01:09:35 - INFO - __main__ - Step 49271: {'lr': 0.00019889846747215813, 'samples': 1576672, 'steps': 3079, 'loss/train': 2.1074726581573486} -09/21/2021 01:09:36 - INFO - __main__ - Step 49272: {'lr': 0.00019889846747215813, 'samples': 1576704, 'steps': 3079, 'loss/train': 3.3542935848236084} -09/21/2021 01:09:37 - INFO - __main__ - Step 49273: {'lr': 0.00019889846747215813, 'samples': 1576736, 'steps': 3079, 'loss/train': 1.7591246366500854} -09/21/2021 01:09:38 - INFO - __main__ - Step 49274: {'lr': 0.00019889846747215813, 'samples': 1576768, 'steps': 3079, 'loss/train': 3.780189275741577} -09/21/2021 01:09:38 - INFO - __main__ - Step 49275: {'lr': 0.00019889846747215813, 'samples': 1576800, 'steps': 3079, 'loss/train': 0.8341909646987915} -09/21/2021 01:09:39 - INFO - __main__ - Step 49276: {'lr': 0.00019889846747215813, 'samples': 1576832, 'steps': 3079, 'loss/train': 2.160505771636963} -09/21/2021 01:09:40 - INFO - __main__ - Step 49277: {'lr': 0.00019889846747215813, 'samples': 1576864, 'steps': 3079, 'loss/train': 2.1612958908081055} -09/21/2021 01:09:41 - INFO - __main__ - Step 49278: {'lr': 0.00019889846747215813, 'samples': 1576896, 'steps': 3079, 'loss/train': 2.038630962371826} -09/21/2021 01:09:41 - INFO - __main__ - Step 49279: {'lr': 0.00019889846747215813, 'samples': 1576928, 'steps': 3079, 'loss/train': 1.7096432447433472} -09/21/2021 01:09:42 - INFO - __main__ - Step 49280: {'lr': 0.00019889846747215813, 'samples': 1576960, 'steps': 3079, 'loss/train': 1.786086916923523} -09/21/2021 01:09:43 - INFO - __main__ - Step 49281: {'lr': 0.00019889752308394388, 'samples': 1576992, 'steps': 3080, 'loss/train': 1.957078456878662} -09/21/2021 01:09:44 - INFO - __main__ - Step 49282: {'lr': 0.00019889752308394388, 'samples': 1577024, 'steps': 3080, 'loss/train': 2.360809087753296} -09/21/2021 01:09:45 - INFO - __main__ - Step 49283: {'lr': 0.00019889752308394388, 'samples': 1577056, 'steps': 3080, 'loss/train': 2.26033091545105} -09/21/2021 01:09:45 - INFO - __main__ - Step 49284: {'lr': 0.00019889752308394388, 'samples': 1577088, 'steps': 3080, 'loss/train': 2.711683750152588} -09/21/2021 01:09:46 - INFO - __main__ - Step 49285: {'lr': 0.00019889752308394388, 'samples': 1577120, 'steps': 3080, 'loss/train': 2.5370826721191406} -09/21/2021 01:09:47 - INFO - __main__ - Step 49286: {'lr': 0.00019889752308394388, 'samples': 1577152, 'steps': 3080, 'loss/train': 1.5920573472976685} -09/21/2021 01:09:48 - INFO - __main__ - Step 49287: {'lr': 0.00019889752308394388, 'samples': 1577184, 'steps': 3080, 'loss/train': 1.9975643157958984} -09/21/2021 01:09:48 - INFO - __main__ - Step 49288: {'lr': 0.00019889752308394388, 'samples': 1577216, 'steps': 3080, 'loss/train': 2.307727336883545} -09/21/2021 01:09:49 - INFO - __main__ - Step 49289: {'lr': 0.00019889752308394388, 'samples': 1577248, 'steps': 3080, 'loss/train': 1.7394278049468994} -09/21/2021 01:09:50 - INFO - __main__ - Step 49290: {'lr': 0.00019889752308394388, 'samples': 1577280, 'steps': 3080, 'loss/train': 2.1757090091705322} -09/21/2021 01:09:51 - INFO - __main__ - Step 49291: {'lr': 0.00019889752308394388, 'samples': 1577312, 'steps': 3080, 'loss/train': 1.3506672382354736} -09/21/2021 01:09:51 - INFO - __main__ - Step 49292: {'lr': 0.00019889752308394388, 'samples': 1577344, 'steps': 3080, 'loss/train': 2.575955629348755} -09/21/2021 01:09:52 - INFO - __main__ - Step 49293: {'lr': 0.00019889752308394388, 'samples': 1577376, 'steps': 3080, 'loss/train': 1.305206298828125} -09/21/2021 01:09:53 - INFO - __main__ - Step 49294: {'lr': 0.00019889752308394388, 'samples': 1577408, 'steps': 3080, 'loss/train': 1.9265800714492798} -09/21/2021 01:09:54 - INFO - __main__ - Step 49295: {'lr': 0.00019889752308394388, 'samples': 1577440, 'steps': 3080, 'loss/train': 2.110795736312866} -09/21/2021 01:09:55 - INFO - __main__ - Step 49296: {'lr': 0.00019889752308394388, 'samples': 1577472, 'steps': 3080, 'loss/train': 1.8188395500183105} -09/21/2021 01:09:56 - INFO - __main__ - Step 49297: {'lr': 0.00019889657829331596, 'samples': 1577504, 'steps': 3081, 'loss/train': 1.466071367263794} -09/21/2021 01:09:57 - INFO - __main__ - Step 49298: {'lr': 0.00019889657829331596, 'samples': 1577536, 'steps': 3081, 'loss/train': 1.9451035261154175} -09/21/2021 01:09:57 - INFO - __main__ - Step 49299: {'lr': 0.00019889657829331596, 'samples': 1577568, 'steps': 3081, 'loss/train': 1.2812752723693848} -09/21/2021 01:09:58 - INFO - __main__ - Step 49300: {'lr': 0.00019889657829331596, 'samples': 1577600, 'steps': 3081, 'loss/train': 1.9848130941390991} -09/21/2021 01:09:59 - INFO - __main__ - Step 49301: {'lr': 0.00019889657829331596, 'samples': 1577632, 'steps': 3081, 'loss/train': 1.5742100477218628} -09/21/2021 01:10:00 - INFO - __main__ - Step 49302: {'lr': 0.00019889657829331596, 'samples': 1577664, 'steps': 3081, 'loss/train': 0.2255462259054184} -09/21/2021 01:10:00 - INFO - __main__ - Step 49303: {'lr': 0.00019889657829331596, 'samples': 1577696, 'steps': 3081, 'loss/train': 1.365713119506836} -09/21/2021 01:10:01 - INFO - __main__ - Step 49304: {'lr': 0.00019889657829331596, 'samples': 1577728, 'steps': 3081, 'loss/train': 1.706861972808838} -09/21/2021 01:10:02 - INFO - __main__ - Step 49305: {'lr': 0.00019889657829331596, 'samples': 1577760, 'steps': 3081, 'loss/train': 2.0545268058776855} -09/21/2021 01:10:03 - INFO - __main__ - Step 49306: {'lr': 0.00019889657829331596, 'samples': 1577792, 'steps': 3081, 'loss/train': 1.9003056287765503} -09/21/2021 01:10:03 - INFO - __main__ - Step 49307: {'lr': 0.00019889657829331596, 'samples': 1577824, 'steps': 3081, 'loss/train': 2.6686789989471436} -09/21/2021 01:10:04 - INFO - __main__ - Step 49308: {'lr': 0.00019889657829331596, 'samples': 1577856, 'steps': 3081, 'loss/train': 2.3595187664031982} -09/21/2021 01:10:05 - INFO - __main__ - Step 49309: {'lr': 0.00019889657829331596, 'samples': 1577888, 'steps': 3081, 'loss/train': 2.3639333248138428} -09/21/2021 01:10:06 - INFO - __main__ - Step 49310: {'lr': 0.00019889657829331596, 'samples': 1577920, 'steps': 3081, 'loss/train': 2.457929849624634} -09/21/2021 01:10:06 - INFO - __main__ - Step 49311: {'lr': 0.00019889657829331596, 'samples': 1577952, 'steps': 3081, 'loss/train': 2.2993087768554688} -09/21/2021 01:10:07 - INFO - __main__ - Step 49312: {'lr': 0.00019889657829331596, 'samples': 1577984, 'steps': 3081, 'loss/train': 2.415113687515259} -09/21/2021 01:10:08 - INFO - __main__ - Step 49313: {'lr': 0.00019889563310027824, 'samples': 1578016, 'steps': 3082, 'loss/train': 2.3964481353759766} -09/21/2021 01:10:09 - INFO - __main__ - Step 49314: {'lr': 0.00019889563310027824, 'samples': 1578048, 'steps': 3082, 'loss/train': 1.8132386207580566} -09/21/2021 01:10:10 - INFO - __main__ - Step 49315: {'lr': 0.00019889563310027824, 'samples': 1578080, 'steps': 3082, 'loss/train': 5.674674987792969} -09/21/2021 01:10:10 - INFO - __main__ - Step 49316: {'lr': 0.00019889563310027824, 'samples': 1578112, 'steps': 3082, 'loss/train': 6.424833297729492} -09/21/2021 01:10:11 - INFO - __main__ - Step 49317: {'lr': 0.00019889563310027824, 'samples': 1578144, 'steps': 3082, 'loss/train': 5.9293084144592285} -09/21/2021 01:10:12 - INFO - __main__ - Step 49318: {'lr': 0.00019889563310027824, 'samples': 1578176, 'steps': 3082, 'loss/train': 1.350334644317627} -09/21/2021 01:10:13 - INFO - __main__ - Step 49319: {'lr': 0.00019889563310027824, 'samples': 1578208, 'steps': 3082, 'loss/train': 1.4503694772720337} -09/21/2021 01:10:13 - INFO - __main__ - Step 49320: {'lr': 0.00019889563310027824, 'samples': 1578240, 'steps': 3082, 'loss/train': 1.6992257833480835} -09/21/2021 01:10:14 - INFO - __main__ - Step 49321: {'lr': 0.00019889563310027824, 'samples': 1578272, 'steps': 3082, 'loss/train': 2.041773796081543} -09/21/2021 01:10:15 - INFO - __main__ - Step 49322: {'lr': 0.00019889563310027824, 'samples': 1578304, 'steps': 3082, 'loss/train': 2.2144711017608643} -09/21/2021 01:10:16 - INFO - __main__ - Step 49323: {'lr': 0.00019889563310027824, 'samples': 1578336, 'steps': 3082, 'loss/train': 1.6501312255859375} -09/21/2021 01:10:16 - INFO - __main__ - Step 49324: {'lr': 0.00019889563310027824, 'samples': 1578368, 'steps': 3082, 'loss/train': 1.0779085159301758} -09/21/2021 01:10:17 - INFO - __main__ - Step 49325: {'lr': 0.00019889563310027824, 'samples': 1578400, 'steps': 3082, 'loss/train': 2.451056957244873} -09/21/2021 01:10:18 - INFO - __main__ - Step 49326: {'lr': 0.00019889563310027824, 'samples': 1578432, 'steps': 3082, 'loss/train': 2.4317235946655273} -09/21/2021 01:10:19 - INFO - __main__ - Step 49327: {'lr': 0.00019889563310027824, 'samples': 1578464, 'steps': 3082, 'loss/train': 0.24686303734779358} -09/21/2021 01:10:19 - INFO - __main__ - Step 49328: {'lr': 0.00019889563310027824, 'samples': 1578496, 'steps': 3082, 'loss/train': 0.1381988376379013} -09/21/2021 01:10:20 - INFO - __main__ - Step 49329: {'lr': 0.0001988946875048346, 'samples': 1578528, 'steps': 3083, 'loss/train': 1.6061995029449463} -09/21/2021 01:10:21 - INFO - __main__ - Step 49330: {'lr': 0.0001988946875048346, 'samples': 1578560, 'steps': 3083, 'loss/train': 1.81635320186615} -09/21/2021 01:10:22 - INFO - __main__ - Step 49331: {'lr': 0.0001988946875048346, 'samples': 1578592, 'steps': 3083, 'loss/train': 2.002774715423584} -09/21/2021 01:10:23 - INFO - __main__ - Step 49332: {'lr': 0.0001988946875048346, 'samples': 1578624, 'steps': 3083, 'loss/train': 2.2107527256011963} -09/21/2021 01:10:24 - INFO - __main__ - Step 49333: {'lr': 0.0001988946875048346, 'samples': 1578656, 'steps': 3083, 'loss/train': 2.619629383087158} -09/21/2021 01:10:24 - INFO - __main__ - Step 49334: {'lr': 0.0001988946875048346, 'samples': 1578688, 'steps': 3083, 'loss/train': 2.007615804672241} -09/21/2021 01:10:25 - INFO - __main__ - Step 49335: {'lr': 0.0001988946875048346, 'samples': 1578720, 'steps': 3083, 'loss/train': 1.2664705514907837} -09/21/2021 01:10:26 - INFO - __main__ - Step 49336: {'lr': 0.0001988946875048346, 'samples': 1578752, 'steps': 3083, 'loss/train': 2.237229108810425} -09/21/2021 01:10:27 - INFO - __main__ - Step 49337: {'lr': 0.0001988946875048346, 'samples': 1578784, 'steps': 3083, 'loss/train': 2.0878748893737793} -09/21/2021 01:10:27 - INFO - __main__ - Step 49338: {'lr': 0.0001988946875048346, 'samples': 1578816, 'steps': 3083, 'loss/train': 2.589385509490967} -09/21/2021 01:10:28 - INFO - __main__ - Step 49339: {'lr': 0.0001988946875048346, 'samples': 1578848, 'steps': 3083, 'loss/train': 0.9619991183280945} -09/21/2021 01:10:29 - INFO - __main__ - Step 49340: {'lr': 0.0001988946875048346, 'samples': 1578880, 'steps': 3083, 'loss/train': 1.6025049686431885} -09/21/2021 01:10:30 - INFO - __main__ - Step 49341: {'lr': 0.0001988946875048346, 'samples': 1578912, 'steps': 3083, 'loss/train': 2.291613817214966} -09/21/2021 01:10:30 - INFO - __main__ - Step 49342: {'lr': 0.0001988946875048346, 'samples': 1578944, 'steps': 3083, 'loss/train': 1.4724266529083252} -09/21/2021 01:10:31 - INFO - __main__ - Step 49343: {'lr': 0.0001988946875048346, 'samples': 1578976, 'steps': 3083, 'loss/train': 0.9927313923835754} -09/21/2021 01:10:32 - INFO - __main__ - Step 49344: {'lr': 0.0001988946875048346, 'samples': 1579008, 'steps': 3083, 'loss/train': 2.1479849815368652} -09/21/2021 01:10:33 - INFO - __main__ - Step 49345: {'lr': 0.00019889374150698888, 'samples': 1579040, 'steps': 3084, 'loss/train': 2.6711175441741943} -09/21/2021 01:10:34 - INFO - __main__ - Step 49346: {'lr': 0.00019889374150698888, 'samples': 1579072, 'steps': 3084, 'loss/train': 1.8437381982803345} -09/21/2021 01:10:34 - INFO - __main__ - Step 49347: {'lr': 0.00019889374150698888, 'samples': 1579104, 'steps': 3084, 'loss/train': 1.4109243154525757} -09/21/2021 01:10:35 - INFO - __main__ - Step 49348: {'lr': 0.00019889374150698888, 'samples': 1579136, 'steps': 3084, 'loss/train': 2.3726067543029785} -09/21/2021 01:10:36 - INFO - __main__ - Step 49349: {'lr': 0.00019889374150698888, 'samples': 1579168, 'steps': 3084, 'loss/train': 2.4595141410827637} -09/21/2021 01:10:37 - INFO - __main__ - Step 49350: {'lr': 0.00019889374150698888, 'samples': 1579200, 'steps': 3084, 'loss/train': 1.7122937440872192} -09/21/2021 01:10:37 - INFO - __main__ - Step 49351: {'lr': 0.00019889374150698888, 'samples': 1579232, 'steps': 3084, 'loss/train': 1.8912009000778198} -09/21/2021 01:10:38 - INFO - __main__ - Step 49352: {'lr': 0.00019889374150698888, 'samples': 1579264, 'steps': 3084, 'loss/train': 1.3072915077209473} -09/21/2021 01:10:39 - INFO - __main__ - Step 49353: {'lr': 0.00019889374150698888, 'samples': 1579296, 'steps': 3084, 'loss/train': 2.3398795127868652} -09/21/2021 01:10:40 - INFO - __main__ - Step 49354: {'lr': 0.00019889374150698888, 'samples': 1579328, 'steps': 3084, 'loss/train': 2.666757822036743} -09/21/2021 01:10:40 - INFO - __main__ - Step 49355: {'lr': 0.00019889374150698888, 'samples': 1579360, 'steps': 3084, 'loss/train': 2.524256706237793} -09/21/2021 01:10:41 - INFO - __main__ - Step 49356: {'lr': 0.00019889374150698888, 'samples': 1579392, 'steps': 3084, 'loss/train': 2.4145939350128174} -09/21/2021 01:10:42 - INFO - __main__ - Step 49357: {'lr': 0.00019889374150698888, 'samples': 1579424, 'steps': 3084, 'loss/train': 0.9652106761932373} -09/21/2021 01:10:43 - INFO - __main__ - Step 49358: {'lr': 0.00019889374150698888, 'samples': 1579456, 'steps': 3084, 'loss/train': 2.063075304031372} -09/21/2021 01:10:43 - INFO - __main__ - Step 49359: {'lr': 0.00019889374150698888, 'samples': 1579488, 'steps': 3084, 'loss/train': 1.569044828414917} -09/21/2021 01:10:44 - INFO - __main__ - Step 49360: {'lr': 0.00019889374150698888, 'samples': 1579520, 'steps': 3084, 'loss/train': 1.9834946393966675} -09/21/2021 01:10:45 - INFO - __main__ - Step 49361: {'lr': 0.00019889279510674487, 'samples': 1579552, 'steps': 3085, 'loss/train': 1.8395459651947021} -09/21/2021 01:10:46 - INFO - __main__ - Step 49362: {'lr': 0.00019889279510674487, 'samples': 1579584, 'steps': 3085, 'loss/train': 2.1909477710723877} -09/21/2021 01:10:47 - INFO - __main__ - Step 49363: {'lr': 0.00019889279510674487, 'samples': 1579616, 'steps': 3085, 'loss/train': 2.00498104095459} -09/21/2021 01:10:48 - INFO - __main__ - Step 49364: {'lr': 0.00019889279510674487, 'samples': 1579648, 'steps': 3085, 'loss/train': 2.218674421310425} -09/21/2021 01:10:48 - INFO - __main__ - Step 49365: {'lr': 0.00019889279510674487, 'samples': 1579680, 'steps': 3085, 'loss/train': 1.6416330337524414} -09/21/2021 01:10:49 - INFO - __main__ - Step 49366: {'lr': 0.00019889279510674487, 'samples': 1579712, 'steps': 3085, 'loss/train': 2.1812326908111572} -09/21/2021 01:10:50 - INFO - __main__ - Step 49367: {'lr': 0.00019889279510674487, 'samples': 1579744, 'steps': 3085, 'loss/train': 2.1425740718841553} -09/21/2021 01:10:51 - INFO - __main__ - Step 49368: {'lr': 0.00019889279510674487, 'samples': 1579776, 'steps': 3085, 'loss/train': 1.2633541822433472} -09/21/2021 01:10:51 - INFO - __main__ - Step 49369: {'lr': 0.00019889279510674487, 'samples': 1579808, 'steps': 3085, 'loss/train': 1.478402853012085} -09/21/2021 01:10:52 - INFO - __main__ - Step 49370: {'lr': 0.00019889279510674487, 'samples': 1579840, 'steps': 3085, 'loss/train': 2.3949904441833496} -09/21/2021 01:10:53 - INFO - __main__ - Step 49371: {'lr': 0.00019889279510674487, 'samples': 1579872, 'steps': 3085, 'loss/train': 2.1815237998962402} -09/21/2021 01:10:54 - INFO - __main__ - Step 49372: {'lr': 0.00019889279510674487, 'samples': 1579904, 'steps': 3085, 'loss/train': 2.3038361072540283} -09/21/2021 01:10:55 - INFO - __main__ - Step 49373: {'lr': 0.00019889279510674487, 'samples': 1579936, 'steps': 3085, 'loss/train': 2.649238109588623} -09/21/2021 01:10:55 - INFO - __main__ - Step 49374: {'lr': 0.00019889279510674487, 'samples': 1579968, 'steps': 3085, 'loss/train': 2.00512433052063} -09/21/2021 01:10:56 - INFO - __main__ - Step 49375: {'lr': 0.00019889279510674487, 'samples': 1580000, 'steps': 3085, 'loss/train': 2.6271309852600098} -09/21/2021 01:10:57 - INFO - __main__ - Step 49376: {'lr': 0.00019889279510674487, 'samples': 1580032, 'steps': 3085, 'loss/train': 2.094625949859619} -09/21/2021 01:10:58 - INFO - __main__ - Step 49377: {'lr': 0.0001988918483041065, 'samples': 1580064, 'steps': 3086, 'loss/train': 2.7195241451263428} -09/21/2021 01:10:58 - INFO - __main__ - Step 49378: {'lr': 0.0001988918483041065, 'samples': 1580096, 'steps': 3086, 'loss/train': 1.6030552387237549} -09/21/2021 01:10:59 - INFO - __main__ - Step 49379: {'lr': 0.0001988918483041065, 'samples': 1580128, 'steps': 3086, 'loss/train': 2.608790636062622} -09/21/2021 01:11:00 - INFO - __main__ - Step 49380: {'lr': 0.0001988918483041065, 'samples': 1580160, 'steps': 3086, 'loss/train': 1.8404070138931274} -09/21/2021 01:11:01 - INFO - __main__ - Step 49381: {'lr': 0.0001988918483041065, 'samples': 1580192, 'steps': 3086, 'loss/train': 1.345123291015625} -09/21/2021 01:11:01 - INFO - __main__ - Step 49382: {'lr': 0.0001988918483041065, 'samples': 1580224, 'steps': 3086, 'loss/train': 2.1813066005706787} -09/21/2021 01:11:02 - INFO - __main__ - Step 49383: {'lr': 0.0001988918483041065, 'samples': 1580256, 'steps': 3086, 'loss/train': 1.6681276559829712} -09/21/2021 01:11:03 - INFO - __main__ - Step 49384: {'lr': 0.0001988918483041065, 'samples': 1580288, 'steps': 3086, 'loss/train': 1.3289146423339844} -09/21/2021 01:11:04 - INFO - __main__ - Step 49385: {'lr': 0.0001988918483041065, 'samples': 1580320, 'steps': 3086, 'loss/train': 2.528324604034424} -09/21/2021 01:11:04 - INFO - __main__ - Step 49386: {'lr': 0.0001988918483041065, 'samples': 1580352, 'steps': 3086, 'loss/train': 1.9777007102966309} -09/21/2021 01:11:05 - INFO - __main__ - Step 49387: {'lr': 0.0001988918483041065, 'samples': 1580384, 'steps': 3086, 'loss/train': 2.797043561935425} -09/21/2021 01:11:06 - INFO - __main__ - Step 49388: {'lr': 0.0001988918483041065, 'samples': 1580416, 'steps': 3086, 'loss/train': 2.582612991333008} -09/21/2021 01:11:07 - INFO - __main__ - Step 49389: {'lr': 0.0001988918483041065, 'samples': 1580448, 'steps': 3086, 'loss/train': 1.9943639039993286} -09/21/2021 01:11:07 - INFO - __main__ - Step 49390: {'lr': 0.0001988918483041065, 'samples': 1580480, 'steps': 3086, 'loss/train': 2.482306718826294} -09/21/2021 01:11:08 - INFO - __main__ - Step 49391: {'lr': 0.0001988918483041065, 'samples': 1580512, 'steps': 3086, 'loss/train': 1.6209585666656494} -09/21/2021 01:11:10 - INFO - __main__ - Step 49392: {'lr': 0.0001988918483041065, 'samples': 1580544, 'steps': 3086, 'loss/train': 2.2112159729003906} -09/21/2021 01:11:10 - INFO - __main__ - Step 49393: {'lr': 0.00019889090109907756, 'samples': 1580576, 'steps': 3087, 'loss/train': 2.293592929840088} -09/21/2021 01:11:11 - INFO - __main__ - Step 49394: {'lr': 0.00019889090109907756, 'samples': 1580608, 'steps': 3087, 'loss/train': 2.0843167304992676} -09/21/2021 01:11:12 - INFO - __main__ - Step 49395: {'lr': 0.00019889090109907756, 'samples': 1580640, 'steps': 3087, 'loss/train': 1.433410406112671} -09/21/2021 01:11:13 - INFO - __main__ - Step 49396: {'lr': 0.00019889090109907756, 'samples': 1580672, 'steps': 3087, 'loss/train': 1.7863199710845947} -09/21/2021 01:11:13 - INFO - __main__ - Step 49397: {'lr': 0.00019889090109907756, 'samples': 1580704, 'steps': 3087, 'loss/train': 1.667680025100708} -09/21/2021 01:11:14 - INFO - __main__ - Step 49398: {'lr': 0.00019889090109907756, 'samples': 1580736, 'steps': 3087, 'loss/train': 2.3878493309020996} -09/21/2021 01:11:15 - INFO - __main__ - Step 49399: {'lr': 0.00019889090109907756, 'samples': 1580768, 'steps': 3087, 'loss/train': 1.9545633792877197} -09/21/2021 01:11:16 - INFO - __main__ - Step 49400: {'lr': 0.00019889090109907756, 'samples': 1580800, 'steps': 3087, 'loss/train': 1.896144986152649} -09/21/2021 01:11:16 - INFO - __main__ - Step 49401: {'lr': 0.00019889090109907756, 'samples': 1580832, 'steps': 3087, 'loss/train': 2.081819772720337} -09/21/2021 01:11:17 - INFO - __main__ - Step 49402: {'lr': 0.00019889090109907756, 'samples': 1580864, 'steps': 3087, 'loss/train': 1.604534387588501} -09/21/2021 01:11:18 - INFO - __main__ - Step 49403: {'lr': 0.00019889090109907756, 'samples': 1580896, 'steps': 3087, 'loss/train': 2.0536019802093506} -09/21/2021 01:11:19 - INFO - __main__ - Step 49404: {'lr': 0.00019889090109907756, 'samples': 1580928, 'steps': 3087, 'loss/train': 1.9148964881896973} -09/21/2021 01:11:19 - INFO - __main__ - Step 49405: {'lr': 0.00019889090109907756, 'samples': 1580960, 'steps': 3087, 'loss/train': 1.5812840461730957} -09/21/2021 01:11:20 - INFO - __main__ - Step 49406: {'lr': 0.00019889090109907756, 'samples': 1580992, 'steps': 3087, 'loss/train': 1.6057076454162598} -09/21/2021 01:11:21 - INFO - __main__ - Step 49407: {'lr': 0.00019889090109907756, 'samples': 1581024, 'steps': 3087, 'loss/train': 1.4692879915237427} -09/21/2021 01:11:22 - INFO - __main__ - Step 49408: {'lr': 0.00019889090109907756, 'samples': 1581056, 'steps': 3087, 'loss/train': 0.5333183407783508} -09/21/2021 01:11:23 - INFO - __main__ - Step 49409: {'lr': 0.0001988899534916619, 'samples': 1581088, 'steps': 3088, 'loss/train': 0.659551203250885} -09/21/2021 01:11:23 - INFO - __main__ - Step 49410: {'lr': 0.0001988899534916619, 'samples': 1581120, 'steps': 3088, 'loss/train': 2.1582915782928467} -09/21/2021 01:11:24 - INFO - __main__ - Step 49411: {'lr': 0.0001988899534916619, 'samples': 1581152, 'steps': 3088, 'loss/train': 2.8702731132507324} -09/21/2021 01:11:25 - INFO - __main__ - Step 49412: {'lr': 0.0001988899534916619, 'samples': 1581184, 'steps': 3088, 'loss/train': 1.130096673965454} -09/21/2021 01:11:26 - INFO - __main__ - Step 49413: {'lr': 0.0001988899534916619, 'samples': 1581216, 'steps': 3088, 'loss/train': 1.3252837657928467} -09/21/2021 01:11:26 - INFO - __main__ - Step 49414: {'lr': 0.0001988899534916619, 'samples': 1581248, 'steps': 3088, 'loss/train': 2.533903121948242} -09/21/2021 01:11:27 - INFO - __main__ - Step 49415: {'lr': 0.0001988899534916619, 'samples': 1581280, 'steps': 3088, 'loss/train': 2.681276798248291} -09/21/2021 01:11:28 - INFO - __main__ - Step 49416: {'lr': 0.0001988899534916619, 'samples': 1581312, 'steps': 3088, 'loss/train': 1.88289475440979} -09/21/2021 01:11:29 - INFO - __main__ - Step 49417: {'lr': 0.0001988899534916619, 'samples': 1581344, 'steps': 3088, 'loss/train': 3.287078857421875} -09/21/2021 01:11:29 - INFO - __main__ - Step 49418: {'lr': 0.0001988899534916619, 'samples': 1581376, 'steps': 3088, 'loss/train': 3.371675968170166} -09/21/2021 01:11:30 - INFO - __main__ - Step 49419: {'lr': 0.0001988899534916619, 'samples': 1581408, 'steps': 3088, 'loss/train': 3.1528542041778564} -09/21/2021 01:11:31 - INFO - __main__ - Step 49420: {'lr': 0.0001988899534916619, 'samples': 1581440, 'steps': 3088, 'loss/train': 2.3733763694763184} -09/21/2021 01:11:32 - INFO - __main__ - Step 49421: {'lr': 0.0001988899534916619, 'samples': 1581472, 'steps': 3088, 'loss/train': 1.7861971855163574} -09/21/2021 01:11:33 - INFO - __main__ - Step 49422: {'lr': 0.0001988899534916619, 'samples': 1581504, 'steps': 3088, 'loss/train': 2.3863184452056885} -09/21/2021 01:11:34 - INFO - __main__ - Step 49423: {'lr': 0.0001988899534916619, 'samples': 1581536, 'steps': 3088, 'loss/train': 1.8772306442260742} -09/21/2021 01:11:35 - INFO - __main__ - Step 49424: {'lr': 0.0001988899534916619, 'samples': 1581568, 'steps': 3088, 'loss/train': 1.3547132015228271} -09/21/2021 01:11:35 - INFO - __main__ - Step 49425: {'lr': 0.00019888900548186342, 'samples': 1581600, 'steps': 3089, 'loss/train': 2.7014570236206055} -09/21/2021 01:11:36 - INFO - __main__ - Step 49426: {'lr': 0.00019888900548186342, 'samples': 1581632, 'steps': 3089, 'loss/train': 2.333411455154419} -09/21/2021 01:11:37 - INFO - __main__ - Step 49427: {'lr': 0.00019888900548186342, 'samples': 1581664, 'steps': 3089, 'loss/train': 2.279599905014038} -09/21/2021 01:11:38 - INFO - __main__ - Step 49428: {'lr': 0.00019888900548186342, 'samples': 1581696, 'steps': 3089, 'loss/train': 2.0040700435638428} -09/21/2021 01:11:38 - INFO - __main__ - Step 49429: {'lr': 0.00019888900548186342, 'samples': 1581728, 'steps': 3089, 'loss/train': 2.0366456508636475} -09/21/2021 01:11:39 - INFO - __main__ - Step 49430: {'lr': 0.00019888900548186342, 'samples': 1581760, 'steps': 3089, 'loss/train': 2.9639718532562256} -09/21/2021 01:11:40 - INFO - __main__ - Step 49431: {'lr': 0.00019888900548186342, 'samples': 1581792, 'steps': 3089, 'loss/train': 1.8515795469284058} -09/21/2021 01:11:41 - INFO - __main__ - Step 49432: {'lr': 0.00019888900548186342, 'samples': 1581824, 'steps': 3089, 'loss/train': 2.153804063796997} -09/21/2021 01:11:41 - INFO - __main__ - Step 49433: {'lr': 0.00019888900548186342, 'samples': 1581856, 'steps': 3089, 'loss/train': 1.9980134963989258} -09/21/2021 01:11:42 - INFO - __main__ - Step 49434: {'lr': 0.00019888900548186342, 'samples': 1581888, 'steps': 3089, 'loss/train': 1.7776243686676025} -09/21/2021 01:11:43 - INFO - __main__ - Step 49435: {'lr': 0.00019888900548186342, 'samples': 1581920, 'steps': 3089, 'loss/train': 1.968940258026123} -09/21/2021 01:11:44 - INFO - __main__ - Step 49436: {'lr': 0.00019888900548186342, 'samples': 1581952, 'steps': 3089, 'loss/train': 1.8812706470489502} -09/21/2021 01:11:44 - INFO - __main__ - Step 49437: {'lr': 0.00019888900548186342, 'samples': 1581984, 'steps': 3089, 'loss/train': 1.4812952280044556} -09/21/2021 01:11:45 - INFO - __main__ - Step 49438: {'lr': 0.00019888900548186342, 'samples': 1582016, 'steps': 3089, 'loss/train': 0.34822046756744385} -09/21/2021 01:11:46 - INFO - __main__ - Step 49439: {'lr': 0.00019888900548186342, 'samples': 1582048, 'steps': 3089, 'loss/train': 2.338916540145874} -09/21/2021 01:11:47 - INFO - __main__ - Step 49440: {'lr': 0.00019888900548186342, 'samples': 1582080, 'steps': 3089, 'loss/train': 2.3444886207580566} -09/21/2021 01:11:48 - INFO - __main__ - Step 49441: {'lr': 0.00019888805706968598, 'samples': 1582112, 'steps': 3090, 'loss/train': 1.5367835760116577} -09/21/2021 01:11:48 - INFO - __main__ - Step 49442: {'lr': 0.00019888805706968598, 'samples': 1582144, 'steps': 3090, 'loss/train': 0.11083826422691345} -09/21/2021 01:11:49 - INFO - __main__ - Step 49443: {'lr': 0.00019888805706968598, 'samples': 1582176, 'steps': 3090, 'loss/train': 0.07839226722717285} -09/21/2021 01:11:50 - INFO - __main__ - Step 49444: {'lr': 0.00019888805706968598, 'samples': 1582208, 'steps': 3090, 'loss/train': 2.9833900928497314} -09/21/2021 01:11:51 - INFO - __main__ - Step 49445: {'lr': 0.00019888805706968598, 'samples': 1582240, 'steps': 3090, 'loss/train': 2.720038890838623} -09/21/2021 01:11:51 - INFO - __main__ - Step 49446: {'lr': 0.00019888805706968598, 'samples': 1582272, 'steps': 3090, 'loss/train': 2.6888184547424316} -09/21/2021 01:11:52 - INFO - __main__ - Step 49447: {'lr': 0.00019888805706968598, 'samples': 1582304, 'steps': 3090, 'loss/train': 3.7633328437805176} -09/21/2021 01:11:53 - INFO - __main__ - Step 49448: {'lr': 0.00019888805706968598, 'samples': 1582336, 'steps': 3090, 'loss/train': 1.7563778162002563} -09/21/2021 01:11:54 - INFO - __main__ - Step 49449: {'lr': 0.00019888805706968598, 'samples': 1582368, 'steps': 3090, 'loss/train': 2.129030466079712} -09/21/2021 01:11:54 - INFO - __main__ - Step 49450: {'lr': 0.00019888805706968598, 'samples': 1582400, 'steps': 3090, 'loss/train': 1.6542112827301025} -09/21/2021 01:11:55 - INFO - __main__ - Step 49451: {'lr': 0.00019888805706968598, 'samples': 1582432, 'steps': 3090, 'loss/train': 2.226012945175171} -09/21/2021 01:11:56 - INFO - __main__ - Step 49452: {'lr': 0.00019888805706968598, 'samples': 1582464, 'steps': 3090, 'loss/train': 2.7690775394439697} -09/21/2021 01:11:58 - INFO - __main__ - Step 49453: {'lr': 0.00019888805706968598, 'samples': 1582496, 'steps': 3090, 'loss/train': 1.0300230979919434} -09/21/2021 01:11:58 - INFO - __main__ - Step 49454: {'lr': 0.00019888805706968598, 'samples': 1582528, 'steps': 3090, 'loss/train': 2.311075448989868} -09/21/2021 01:11:59 - INFO - __main__ - Step 49455: {'lr': 0.00019888805706968598, 'samples': 1582560, 'steps': 3090, 'loss/train': 1.818976879119873} -09/21/2021 01:12:00 - INFO - __main__ - Step 49456: {'lr': 0.00019888805706968598, 'samples': 1582592, 'steps': 3090, 'loss/train': 1.5498464107513428} -09/21/2021 01:12:01 - INFO - __main__ - Step 49457: {'lr': 0.00019888710825513342, 'samples': 1582624, 'steps': 3091, 'loss/train': 1.3563834428787231} -09/21/2021 01:12:02 - INFO - __main__ - Step 49458: {'lr': 0.00019888710825513342, 'samples': 1582656, 'steps': 3091, 'loss/train': 1.9607641696929932} -09/21/2021 01:12:02 - INFO - __main__ - Step 49459: {'lr': 0.00019888710825513342, 'samples': 1582688, 'steps': 3091, 'loss/train': 2.006941080093384} -09/21/2021 01:12:03 - INFO - __main__ - Step 49460: {'lr': 0.00019888710825513342, 'samples': 1582720, 'steps': 3091, 'loss/train': 2.6715147495269775} -09/21/2021 01:12:04 - INFO - __main__ - Step 49461: {'lr': 0.00019888710825513342, 'samples': 1582752, 'steps': 3091, 'loss/train': 3.0686445236206055} -09/21/2021 01:12:05 - INFO - __main__ - Step 49462: {'lr': 0.00019888710825513342, 'samples': 1582784, 'steps': 3091, 'loss/train': 2.272603988647461} -09/21/2021 01:12:05 - INFO - __main__ - Step 49463: {'lr': 0.00019888710825513342, 'samples': 1582816, 'steps': 3091, 'loss/train': 1.8183538913726807} -09/21/2021 01:12:06 - INFO - __main__ - Step 49464: {'lr': 0.00019888710825513342, 'samples': 1582848, 'steps': 3091, 'loss/train': 2.0238242149353027} -09/21/2021 01:12:07 - INFO - __main__ - Step 49465: {'lr': 0.00019888710825513342, 'samples': 1582880, 'steps': 3091, 'loss/train': 1.3374855518341064} -09/21/2021 01:12:08 - INFO - __main__ - Step 49466: {'lr': 0.00019888710825513342, 'samples': 1582912, 'steps': 3091, 'loss/train': 1.832165002822876} -09/21/2021 01:12:08 - INFO - __main__ - Step 49467: {'lr': 0.00019888710825513342, 'samples': 1582944, 'steps': 3091, 'loss/train': 2.2693004608154297} -09/21/2021 01:12:09 - INFO - __main__ - Step 49468: {'lr': 0.00019888710825513342, 'samples': 1582976, 'steps': 3091, 'loss/train': 1.9795626401901245} -09/21/2021 01:12:10 - INFO - __main__ - Step 49469: {'lr': 0.00019888710825513342, 'samples': 1583008, 'steps': 3091, 'loss/train': 0.6208407878875732} -09/21/2021 01:12:11 - INFO - __main__ - Step 49470: {'lr': 0.00019888710825513342, 'samples': 1583040, 'steps': 3091, 'loss/train': 2.386125087738037} -09/21/2021 01:12:11 - INFO - __main__ - Step 49471: {'lr': 0.00019888710825513342, 'samples': 1583072, 'steps': 3091, 'loss/train': 1.7159944772720337} -09/21/2021 01:12:12 - INFO - __main__ - Step 49472: {'lr': 0.00019888710825513342, 'samples': 1583104, 'steps': 3091, 'loss/train': 1.096803069114685} -09/21/2021 01:12:13 - INFO - __main__ - Step 49473: {'lr': 0.00019888615903820958, 'samples': 1583136, 'steps': 3092, 'loss/train': 0.13838998973369598} -09/21/2021 01:12:14 - INFO - __main__ - Step 49474: {'lr': 0.00019888615903820958, 'samples': 1583168, 'steps': 3092, 'loss/train': 0.5160745978355408} -09/21/2021 01:12:14 - INFO - __main__ - Step 49475: {'lr': 0.00019888615903820958, 'samples': 1583200, 'steps': 3092, 'loss/train': 1.619842529296875} -09/21/2021 01:12:15 - INFO - __main__ - Step 49476: {'lr': 0.00019888615903820958, 'samples': 1583232, 'steps': 3092, 'loss/train': 1.7570006847381592} -09/21/2021 01:12:16 - INFO - __main__ - Step 49477: {'lr': 0.00019888615903820958, 'samples': 1583264, 'steps': 3092, 'loss/train': 2.0674638748168945} -09/21/2021 01:12:17 - INFO - __main__ - Step 49478: {'lr': 0.00019888615903820958, 'samples': 1583296, 'steps': 3092, 'loss/train': 1.9021869897842407} -09/21/2021 01:12:17 - INFO - __main__ - Step 49479: {'lr': 0.00019888615903820958, 'samples': 1583328, 'steps': 3092, 'loss/train': 0.45674172043800354} -09/21/2021 01:12:18 - INFO - __main__ - Step 49480: {'lr': 0.00019888615903820958, 'samples': 1583360, 'steps': 3092, 'loss/train': 0.32210981845855713} -09/21/2021 01:12:19 - INFO - __main__ - Step 49481: {'lr': 0.00019888615903820958, 'samples': 1583392, 'steps': 3092, 'loss/train': 2.6193079948425293} -09/21/2021 01:12:20 - INFO - __main__ - Step 49482: {'lr': 0.00019888615903820958, 'samples': 1583424, 'steps': 3092, 'loss/train': 2.6939196586608887} -09/21/2021 01:12:20 - INFO - __main__ - Step 49483: {'lr': 0.00019888615903820958, 'samples': 1583456, 'steps': 3092, 'loss/train': 1.631636381149292} -09/21/2021 01:12:22 - INFO - __main__ - Step 49484: {'lr': 0.00019888615903820958, 'samples': 1583488, 'steps': 3092, 'loss/train': 1.82465660572052} -09/21/2021 01:12:23 - INFO - __main__ - Step 49485: {'lr': 0.00019888615903820958, 'samples': 1583520, 'steps': 3092, 'loss/train': 1.1641966104507446} -09/21/2021 01:12:23 - INFO - __main__ - Step 49486: {'lr': 0.00019888615903820958, 'samples': 1583552, 'steps': 3092, 'loss/train': 1.0567160844802856} -09/21/2021 01:12:24 - INFO - __main__ - Step 49487: {'lr': 0.00019888615903820958, 'samples': 1583584, 'steps': 3092, 'loss/train': 0.6060000658035278} -09/21/2021 01:12:25 - INFO - __main__ - Step 49488: {'lr': 0.00019888615903820958, 'samples': 1583616, 'steps': 3092, 'loss/train': 0.7881088256835938} -09/21/2021 01:12:26 - INFO - __main__ - Step 49489: {'lr': 0.00019888520941891834, 'samples': 1583648, 'steps': 3093, 'loss/train': 1.9151039123535156} -09/21/2021 01:12:26 - INFO - __main__ - Step 49490: {'lr': 0.00019888520941891834, 'samples': 1583680, 'steps': 3093, 'loss/train': 1.4392930269241333} -09/21/2021 01:12:27 - INFO - __main__ - Step 49491: {'lr': 0.00019888520941891834, 'samples': 1583712, 'steps': 3093, 'loss/train': 2.795886516571045} -09/21/2021 01:12:28 - INFO - __main__ - Step 49492: {'lr': 0.00019888520941891834, 'samples': 1583744, 'steps': 3093, 'loss/train': 1.8641127347946167} -09/21/2021 01:12:29 - INFO - __main__ - Step 49493: {'lr': 0.00019888520941891834, 'samples': 1583776, 'steps': 3093, 'loss/train': 1.1531282663345337} -09/21/2021 01:12:29 - INFO - __main__ - Step 49494: {'lr': 0.00019888520941891834, 'samples': 1583808, 'steps': 3093, 'loss/train': 1.002015233039856} -09/21/2021 01:12:30 - INFO - __main__ - Step 49495: {'lr': 0.00019888520941891834, 'samples': 1583840, 'steps': 3093, 'loss/train': 2.4692161083221436} -09/21/2021 01:12:31 - INFO - __main__ - Step 49496: {'lr': 0.00019888520941891834, 'samples': 1583872, 'steps': 3093, 'loss/train': 2.6815030574798584} -09/21/2021 01:12:32 - INFO - __main__ - Step 49497: {'lr': 0.00019888520941891834, 'samples': 1583904, 'steps': 3093, 'loss/train': 2.068108320236206} -09/21/2021 01:12:32 - INFO - __main__ - Step 49498: {'lr': 0.00019888520941891834, 'samples': 1583936, 'steps': 3093, 'loss/train': 1.3784414529800415} -09/21/2021 01:12:33 - INFO - __main__ - Step 49499: {'lr': 0.00019888520941891834, 'samples': 1583968, 'steps': 3093, 'loss/train': 2.0946404933929443} -09/21/2021 01:12:34 - INFO - __main__ - Step 49500: {'lr': 0.00019888520941891834, 'samples': 1584000, 'steps': 3093, 'loss/train': 0.4763233959674835} -09/21/2021 01:12:35 - INFO - __main__ - Step 49501: {'lr': 0.00019888520941891834, 'samples': 1584032, 'steps': 3093, 'loss/train': 1.8566899299621582} -09/21/2021 01:12:35 - INFO - __main__ - Step 49502: {'lr': 0.00019888520941891834, 'samples': 1584064, 'steps': 3093, 'loss/train': 2.0227339267730713} -09/21/2021 01:12:36 - INFO - __main__ - Step 49503: {'lr': 0.00019888520941891834, 'samples': 1584096, 'steps': 3093, 'loss/train': 1.1642018556594849} -09/21/2021 01:12:37 - INFO - __main__ - Step 49504: {'lr': 0.00019888520941891834, 'samples': 1584128, 'steps': 3093, 'loss/train': 2.064680576324463} -09/21/2021 01:12:38 - INFO - __main__ - Step 49505: {'lr': 0.00019888425939726357, 'samples': 1584160, 'steps': 3094, 'loss/train': 2.1874947547912598} -09/21/2021 01:12:39 - INFO - __main__ - Step 49506: {'lr': 0.00019888425939726357, 'samples': 1584192, 'steps': 3094, 'loss/train': 1.3569711446762085} -09/21/2021 01:12:39 - INFO - __main__ - Step 49507: {'lr': 0.00019888425939726357, 'samples': 1584224, 'steps': 3094, 'loss/train': 0.3617711067199707} -09/21/2021 01:12:40 - INFO - __main__ - Step 49508: {'lr': 0.00019888425939726357, 'samples': 1584256, 'steps': 3094, 'loss/train': 0.35582172870635986} -09/21/2021 01:12:41 - INFO - __main__ - Step 49509: {'lr': 0.00019888425939726357, 'samples': 1584288, 'steps': 3094, 'loss/train': 0.18531282246112823} -09/21/2021 01:12:42 - INFO - __main__ - Step 49510: {'lr': 0.00019888425939726357, 'samples': 1584320, 'steps': 3094, 'loss/train': 3.1793360710144043} -09/21/2021 01:12:42 - INFO - __main__ - Step 49511: {'lr': 0.00019888425939726357, 'samples': 1584352, 'steps': 3094, 'loss/train': 1.4292488098144531} -09/21/2021 01:12:43 - INFO - __main__ - Step 49512: {'lr': 0.00019888425939726357, 'samples': 1584384, 'steps': 3094, 'loss/train': 2.398315191268921} -09/21/2021 01:12:44 - INFO - __main__ - Step 49513: {'lr': 0.00019888425939726357, 'samples': 1584416, 'steps': 3094, 'loss/train': 1.5679572820663452} -09/21/2021 01:12:45 - INFO - __main__ - Step 49514: {'lr': 0.00019888425939726357, 'samples': 1584448, 'steps': 3094, 'loss/train': 2.5775949954986572} -09/21/2021 01:12:46 - INFO - __main__ - Step 49515: {'lr': 0.00019888425939726357, 'samples': 1584480, 'steps': 3094, 'loss/train': 2.394287109375} -09/21/2021 01:12:47 - INFO - __main__ - Step 49516: {'lr': 0.00019888425939726357, 'samples': 1584512, 'steps': 3094, 'loss/train': 2.541801691055298} -09/21/2021 01:12:47 - INFO - __main__ - Step 49517: {'lr': 0.00019888425939726357, 'samples': 1584544, 'steps': 3094, 'loss/train': 2.1385557651519775} -09/21/2021 01:12:48 - INFO - __main__ - Step 49518: {'lr': 0.00019888425939726357, 'samples': 1584576, 'steps': 3094, 'loss/train': 2.4549481868743896} -09/21/2021 01:12:49 - INFO - __main__ - Step 49519: {'lr': 0.00019888425939726357, 'samples': 1584608, 'steps': 3094, 'loss/train': 2.1070923805236816} -09/21/2021 01:12:50 - INFO - __main__ - Step 49520: {'lr': 0.00019888425939726357, 'samples': 1584640, 'steps': 3094, 'loss/train': 0.8722805380821228} -09/21/2021 01:12:51 - INFO - __main__ - Step 49521: {'lr': 0.00019888330897324915, 'samples': 1584672, 'steps': 3095, 'loss/train': 0.3429686427116394} -09/21/2021 01:12:51 - INFO - __main__ - Step 49522: {'lr': 0.00019888330897324915, 'samples': 1584704, 'steps': 3095, 'loss/train': 0.17498624324798584} -09/21/2021 01:12:52 - INFO - __main__ - Step 49523: {'lr': 0.00019888330897324915, 'samples': 1584736, 'steps': 3095, 'loss/train': 0.1894054114818573} -09/21/2021 01:12:53 - INFO - __main__ - Step 49524: {'lr': 0.00019888330897324915, 'samples': 1584768, 'steps': 3095, 'loss/train': 0.9818824529647827} -09/21/2021 01:12:54 - INFO - __main__ - Step 49525: {'lr': 0.00019888330897324915, 'samples': 1584800, 'steps': 3095, 'loss/train': 1.8724403381347656} -09/21/2021 01:12:54 - INFO - __main__ - Step 49526: {'lr': 0.00019888330897324915, 'samples': 1584832, 'steps': 3095, 'loss/train': 2.144005060195923} -09/21/2021 01:12:55 - INFO - __main__ - Step 49527: {'lr': 0.00019888330897324915, 'samples': 1584864, 'steps': 3095, 'loss/train': 1.791505217552185} -09/21/2021 01:12:56 - INFO - __main__ - Step 49528: {'lr': 0.00019888330897324915, 'samples': 1584896, 'steps': 3095, 'loss/train': 2.193394184112549} -09/21/2021 01:12:57 - INFO - __main__ - Step 49529: {'lr': 0.00019888330897324915, 'samples': 1584928, 'steps': 3095, 'loss/train': 2.1363487243652344} -09/21/2021 01:12:57 - INFO - __main__ - Step 49530: {'lr': 0.00019888330897324915, 'samples': 1584960, 'steps': 3095, 'loss/train': 2.357496738433838} -09/21/2021 01:12:58 - INFO - __main__ - Step 49531: {'lr': 0.00019888330897324915, 'samples': 1584992, 'steps': 3095, 'loss/train': 1.6517304182052612} -09/21/2021 01:12:59 - INFO - __main__ - Step 49532: {'lr': 0.00019888330897324915, 'samples': 1585024, 'steps': 3095, 'loss/train': 1.7309962511062622} -09/21/2021 01:13:00 - INFO - __main__ - Step 49533: {'lr': 0.00019888330897324915, 'samples': 1585056, 'steps': 3095, 'loss/train': 3.2005348205566406} -09/21/2021 01:13:00 - INFO - __main__ - Step 49534: {'lr': 0.00019888330897324915, 'samples': 1585088, 'steps': 3095, 'loss/train': 2.1294126510620117} -09/21/2021 01:13:01 - INFO - __main__ - Step 49535: {'lr': 0.00019888330897324915, 'samples': 1585120, 'steps': 3095, 'loss/train': 2.2275333404541016} -09/21/2021 01:13:02 - INFO - __main__ - Step 49536: {'lr': 0.00019888330897324915, 'samples': 1585152, 'steps': 3095, 'loss/train': 2.522775411605835} -09/21/2021 01:13:03 - INFO - __main__ - Step 49537: {'lr': 0.00019888235814687893, 'samples': 1585184, 'steps': 3096, 'loss/train': 2.4841859340667725} -09/21/2021 01:13:04 - INFO - __main__ - Step 49538: {'lr': 0.00019888235814687893, 'samples': 1585216, 'steps': 3096, 'loss/train': 1.5037708282470703} -09/21/2021 01:13:04 - INFO - __main__ - Step 49539: {'lr': 0.00019888235814687893, 'samples': 1585248, 'steps': 3096, 'loss/train': 1.707245945930481} -09/21/2021 01:13:05 - INFO - __main__ - Step 49540: {'lr': 0.00019888235814687893, 'samples': 1585280, 'steps': 3096, 'loss/train': 1.2355948686599731} -09/21/2021 01:13:06 - INFO - __main__ - Step 49541: {'lr': 0.00019888235814687893, 'samples': 1585312, 'steps': 3096, 'loss/train': 2.1640961170196533} -09/21/2021 01:13:07 - INFO - __main__ - Step 49542: {'lr': 0.00019888235814687893, 'samples': 1585344, 'steps': 3096, 'loss/train': 1.8162506818771362} -09/21/2021 01:13:07 - INFO - __main__ - Step 49543: {'lr': 0.00019888235814687893, 'samples': 1585376, 'steps': 3096, 'loss/train': 1.8017604351043701} -09/21/2021 01:13:08 - INFO - __main__ - Step 49544: {'lr': 0.00019888235814687893, 'samples': 1585408, 'steps': 3096, 'loss/train': 0.4665776491165161} -09/21/2021 01:13:09 - INFO - __main__ - Step 49545: {'lr': 0.00019888235814687893, 'samples': 1585440, 'steps': 3096, 'loss/train': 2.6306445598602295} -09/21/2021 01:13:10 - INFO - __main__ - Step 49546: {'lr': 0.00019888235814687893, 'samples': 1585472, 'steps': 3096, 'loss/train': 1.7018768787384033} -09/21/2021 01:13:11 - INFO - __main__ - Step 49547: {'lr': 0.00019888235814687893, 'samples': 1585504, 'steps': 3096, 'loss/train': 1.9373201131820679} -09/21/2021 01:13:12 - INFO - __main__ - Step 49548: {'lr': 0.00019888235814687893, 'samples': 1585536, 'steps': 3096, 'loss/train': 2.0105154514312744} -09/21/2021 01:13:12 - INFO - __main__ - Step 49549: {'lr': 0.00019888235814687893, 'samples': 1585568, 'steps': 3096, 'loss/train': 2.350900888442993} -09/21/2021 01:13:13 - INFO - __main__ - Step 49550: {'lr': 0.00019888235814687893, 'samples': 1585600, 'steps': 3096, 'loss/train': 1.589539885520935} -09/21/2021 01:13:14 - INFO - __main__ - Step 49551: {'lr': 0.00019888235814687893, 'samples': 1585632, 'steps': 3096, 'loss/train': 1.6044659614562988} -09/21/2021 01:13:14 - INFO - __main__ - Step 49552: {'lr': 0.00019888235814687893, 'samples': 1585664, 'steps': 3096, 'loss/train': 1.9155676364898682} -09/21/2021 01:13:15 - INFO - __main__ - Step 49553: {'lr': 0.00019888140691815679, 'samples': 1585696, 'steps': 3097, 'loss/train': 1.6305650472640991} -09/21/2021 01:13:16 - INFO - __main__ - Step 49554: {'lr': 0.00019888140691815679, 'samples': 1585728, 'steps': 3097, 'loss/train': 0.25186675786972046} -09/21/2021 01:13:17 - INFO - __main__ - Step 49555: {'lr': 0.00019888140691815679, 'samples': 1585760, 'steps': 3097, 'loss/train': 2.7404608726501465} -09/21/2021 01:13:18 - INFO - __main__ - Step 49556: {'lr': 0.00019888140691815679, 'samples': 1585792, 'steps': 3097, 'loss/train': 1.6344212293624878} -09/21/2021 01:13:18 - INFO - __main__ - Step 49557: {'lr': 0.00019888140691815679, 'samples': 1585824, 'steps': 3097, 'loss/train': 1.7670491933822632} -09/21/2021 01:13:19 - INFO - __main__ - Step 49558: {'lr': 0.00019888140691815679, 'samples': 1585856, 'steps': 3097, 'loss/train': 2.235403537750244} -09/21/2021 01:13:20 - INFO - __main__ - Step 49559: {'lr': 0.00019888140691815679, 'samples': 1585888, 'steps': 3097, 'loss/train': 1.5303316116333008} -09/21/2021 01:13:21 - INFO - __main__ - Step 49560: {'lr': 0.00019888140691815679, 'samples': 1585920, 'steps': 3097, 'loss/train': 2.9283623695373535} -09/21/2021 01:13:21 - INFO - __main__ - Step 49561: {'lr': 0.00019888140691815679, 'samples': 1585952, 'steps': 3097, 'loss/train': 1.6081851720809937} -09/21/2021 01:13:22 - INFO - __main__ - Step 49562: {'lr': 0.00019888140691815679, 'samples': 1585984, 'steps': 3097, 'loss/train': 1.9611716270446777} -09/21/2021 01:13:23 - INFO - __main__ - Step 49563: {'lr': 0.00019888140691815679, 'samples': 1586016, 'steps': 3097, 'loss/train': 2.2052555084228516} -09/21/2021 01:13:24 - INFO - __main__ - Step 49564: {'lr': 0.00019888140691815679, 'samples': 1586048, 'steps': 3097, 'loss/train': 1.2886608839035034} -09/21/2021 01:13:24 - INFO - __main__ - Step 49565: {'lr': 0.00019888140691815679, 'samples': 1586080, 'steps': 3097, 'loss/train': 2.264979600906372} -09/21/2021 01:13:25 - INFO - __main__ - Step 49566: {'lr': 0.00019888140691815679, 'samples': 1586112, 'steps': 3097, 'loss/train': 2.4579670429229736} -09/21/2021 01:13:26 - INFO - __main__ - Step 49567: {'lr': 0.00019888140691815679, 'samples': 1586144, 'steps': 3097, 'loss/train': 1.9005558490753174} -09/21/2021 01:13:27 - INFO - __main__ - Step 49568: {'lr': 0.00019888140691815679, 'samples': 1586176, 'steps': 3097, 'loss/train': 1.8081327676773071} -09/21/2021 01:13:28 - INFO - __main__ - Step 49569: {'lr': 0.00019888045528708653, 'samples': 1586208, 'steps': 3098, 'loss/train': 1.832432746887207} -09/21/2021 01:13:28 - INFO - __main__ - Step 49570: {'lr': 0.00019888045528708653, 'samples': 1586240, 'steps': 3098, 'loss/train': 0.23542185127735138} -09/21/2021 01:13:29 - INFO - __main__ - Step 49571: {'lr': 0.00019888045528708653, 'samples': 1586272, 'steps': 3098, 'loss/train': 2.2666471004486084} -09/21/2021 01:13:30 - INFO - __main__ - Step 49572: {'lr': 0.00019888045528708653, 'samples': 1586304, 'steps': 3098, 'loss/train': 2.6314475536346436} -09/21/2021 01:13:31 - INFO - __main__ - Step 49573: {'lr': 0.00019888045528708653, 'samples': 1586336, 'steps': 3098, 'loss/train': 2.2284038066864014} -09/21/2021 01:13:31 - INFO - __main__ - Step 49574: {'lr': 0.00019888045528708653, 'samples': 1586368, 'steps': 3098, 'loss/train': 1.726871132850647} -09/21/2021 01:13:32 - INFO - __main__ - Step 49575: {'lr': 0.00019888045528708653, 'samples': 1586400, 'steps': 3098, 'loss/train': 1.2340563535690308} -09/21/2021 01:13:33 - INFO - __main__ - Step 49576: {'lr': 0.00019888045528708653, 'samples': 1586432, 'steps': 3098, 'loss/train': 1.2008775472640991} -09/21/2021 01:13:34 - INFO - __main__ - Step 49577: {'lr': 0.00019888045528708653, 'samples': 1586464, 'steps': 3098, 'loss/train': 2.708897829055786} -09/21/2021 01:13:35 - INFO - __main__ - Step 49578: {'lr': 0.00019888045528708653, 'samples': 1586496, 'steps': 3098, 'loss/train': 2.5213780403137207} -09/21/2021 01:13:36 - INFO - __main__ - Step 49579: {'lr': 0.00019888045528708653, 'samples': 1586528, 'steps': 3098, 'loss/train': 2.633230686187744} -09/21/2021 01:13:36 - INFO - __main__ - Step 49580: {'lr': 0.00019888045528708653, 'samples': 1586560, 'steps': 3098, 'loss/train': 1.7336790561676025} -09/21/2021 01:13:37 - INFO - __main__ - Step 49581: {'lr': 0.00019888045528708653, 'samples': 1586592, 'steps': 3098, 'loss/train': 1.512362003326416} -09/21/2021 01:13:38 - INFO - __main__ - Step 49582: {'lr': 0.00019888045528708653, 'samples': 1586624, 'steps': 3098, 'loss/train': 2.9864256381988525} -09/21/2021 01:13:39 - INFO - __main__ - Step 49583: {'lr': 0.00019888045528708653, 'samples': 1586656, 'steps': 3098, 'loss/train': 2.1766393184661865} -09/21/2021 01:13:40 - INFO - __main__ - Step 49584: {'lr': 0.00019888045528708653, 'samples': 1586688, 'steps': 3098, 'loss/train': 2.9532556533813477} -09/21/2021 01:13:40 - INFO - __main__ - Step 49585: {'lr': 0.00019887950325367214, 'samples': 1586720, 'steps': 3099, 'loss/train': 1.5641686916351318} -09/21/2021 01:13:41 - INFO - __main__ - Step 49586: {'lr': 0.00019887950325367214, 'samples': 1586752, 'steps': 3099, 'loss/train': 2.078918695449829} -09/21/2021 01:13:42 - INFO - __main__ - Step 49587: {'lr': 0.00019887950325367214, 'samples': 1586784, 'steps': 3099, 'loss/train': 1.8290365934371948} -09/21/2021 01:13:43 - INFO - __main__ - Step 49588: {'lr': 0.00019887950325367214, 'samples': 1586816, 'steps': 3099, 'loss/train': 1.6340914964675903} -09/21/2021 01:13:43 - INFO - __main__ - Step 49589: {'lr': 0.00019887950325367214, 'samples': 1586848, 'steps': 3099, 'loss/train': 1.7815730571746826} -09/21/2021 01:13:44 - INFO - __main__ - Step 49590: {'lr': 0.00019887950325367214, 'samples': 1586880, 'steps': 3099, 'loss/train': 0.20633357763290405} -09/21/2021 01:13:45 - INFO - __main__ - Step 49591: {'lr': 0.00019887950325367214, 'samples': 1586912, 'steps': 3099, 'loss/train': 2.55545973777771} -09/21/2021 01:13:46 - INFO - __main__ - Step 49592: {'lr': 0.00019887950325367214, 'samples': 1586944, 'steps': 3099, 'loss/train': 2.324096202850342} -09/21/2021 01:13:46 - INFO - __main__ - Step 49593: {'lr': 0.00019887950325367214, 'samples': 1586976, 'steps': 3099, 'loss/train': 1.7980270385742188} -09/21/2021 01:13:47 - INFO - __main__ - Step 49594: {'lr': 0.00019887950325367214, 'samples': 1587008, 'steps': 3099, 'loss/train': 1.5669684410095215} -09/21/2021 01:13:48 - INFO - __main__ - Step 49595: {'lr': 0.00019887950325367214, 'samples': 1587040, 'steps': 3099, 'loss/train': 1.8468893766403198} -09/21/2021 01:13:49 - INFO - __main__ - Step 49596: {'lr': 0.00019887950325367214, 'samples': 1587072, 'steps': 3099, 'loss/train': 2.1621625423431396} -09/21/2021 01:13:49 - INFO - __main__ - Step 49597: {'lr': 0.00019887950325367214, 'samples': 1587104, 'steps': 3099, 'loss/train': 1.176213026046753} -09/21/2021 01:13:50 - INFO - __main__ - Step 49598: {'lr': 0.00019887950325367214, 'samples': 1587136, 'steps': 3099, 'loss/train': 1.884447693824768} -09/21/2021 01:13:51 - INFO - __main__ - Step 49599: {'lr': 0.00019887950325367214, 'samples': 1587168, 'steps': 3099, 'loss/train': 1.7948172092437744} -09/21/2021 01:13:52 - INFO - __main__ - Step 49600: {'lr': 0.00019887950325367214, 'samples': 1587200, 'steps': 3099, 'loss/train': 3.05122709274292} -09/21/2021 01:13:53 - INFO - __main__ - Step 49601: {'lr': 0.0001988785508179174, 'samples': 1587232, 'steps': 3100, 'loss/train': 1.961228609085083} -09/21/2021 01:13:53 - INFO - __main__ - Step 49602: {'lr': 0.0001988785508179174, 'samples': 1587264, 'steps': 3100, 'loss/train': 0.15400326251983643} -09/21/2021 01:13:54 - INFO - __main__ - Step 49603: {'lr': 0.0001988785508179174, 'samples': 1587296, 'steps': 3100, 'loss/train': 2.311605215072632} -09/21/2021 01:13:55 - INFO - __main__ - Step 49604: {'lr': 0.0001988785508179174, 'samples': 1587328, 'steps': 3100, 'loss/train': 1.8708876371383667} -09/21/2021 01:13:56 - INFO - __main__ - Step 49605: {'lr': 0.0001988785508179174, 'samples': 1587360, 'steps': 3100, 'loss/train': 1.9954859018325806} -09/21/2021 01:13:56 - INFO - __main__ - Step 49606: {'lr': 0.0001988785508179174, 'samples': 1587392, 'steps': 3100, 'loss/train': 1.0251399278640747} -09/21/2021 01:13:57 - INFO - __main__ - Step 49607: {'lr': 0.0001988785508179174, 'samples': 1587424, 'steps': 3100, 'loss/train': 2.1888105869293213} -09/21/2021 01:13:58 - INFO - __main__ - Step 49608: {'lr': 0.0001988785508179174, 'samples': 1587456, 'steps': 3100, 'loss/train': 2.7616524696350098} -09/21/2021 01:13:59 - INFO - __main__ - Step 49609: {'lr': 0.0001988785508179174, 'samples': 1587488, 'steps': 3100, 'loss/train': 0.07502207905054092} -09/21/2021 01:13:59 - INFO - __main__ - Step 49610: {'lr': 0.0001988785508179174, 'samples': 1587520, 'steps': 3100, 'loss/train': 0.3042876720428467} -09/21/2021 01:14:01 - INFO - __main__ - Step 49611: {'lr': 0.0001988785508179174, 'samples': 1587552, 'steps': 3100, 'loss/train': 0.5407207012176514} -09/21/2021 01:14:01 - INFO - __main__ - Step 49612: {'lr': 0.0001988785508179174, 'samples': 1587584, 'steps': 3100, 'loss/train': 1.5398441553115845} -09/21/2021 01:14:02 - INFO - __main__ - Step 49613: {'lr': 0.0001988785508179174, 'samples': 1587616, 'steps': 3100, 'loss/train': 2.2843570709228516} -09/21/2021 01:14:03 - INFO - __main__ - Step 49614: {'lr': 0.0001988785508179174, 'samples': 1587648, 'steps': 3100, 'loss/train': 1.5444564819335938} -09/21/2021 01:14:04 - INFO - __main__ - Step 49615: {'lr': 0.0001988785508179174, 'samples': 1587680, 'steps': 3100, 'loss/train': 1.292847752571106} -09/21/2021 01:14:04 - INFO - __main__ - Step 49616: {'lr': 0.0001988785508179174, 'samples': 1587712, 'steps': 3100, 'loss/train': 2.671098232269287} -09/21/2021 01:14:05 - INFO - __main__ - Step 49617: {'lr': 0.00019887759797982625, 'samples': 1587744, 'steps': 3101, 'loss/train': 2.4561569690704346} -09/21/2021 01:14:06 - INFO - __main__ - Step 49618: {'lr': 0.00019887759797982625, 'samples': 1587776, 'steps': 3101, 'loss/train': 2.0411810874938965} -09/21/2021 01:14:07 - INFO - __main__ - Step 49619: {'lr': 0.00019887759797982625, 'samples': 1587808, 'steps': 3101, 'loss/train': 2.5693650245666504} -09/21/2021 01:14:07 - INFO - __main__ - Step 49620: {'lr': 0.00019887759797982625, 'samples': 1587840, 'steps': 3101, 'loss/train': 1.85087251663208} -09/21/2021 01:14:08 - INFO - __main__ - Step 49621: {'lr': 0.00019887759797982625, 'samples': 1587872, 'steps': 3101, 'loss/train': 1.9146888256072998} -09/21/2021 01:14:09 - INFO - __main__ - Step 49622: {'lr': 0.00019887759797982625, 'samples': 1587904, 'steps': 3101, 'loss/train': 1.685804843902588} -09/21/2021 01:14:10 - INFO - __main__ - Step 49623: {'lr': 0.00019887759797982625, 'samples': 1587936, 'steps': 3101, 'loss/train': 1.419175386428833} -09/21/2021 01:14:10 - INFO - __main__ - Step 49624: {'lr': 0.00019887759797982625, 'samples': 1587968, 'steps': 3101, 'loss/train': 1.8267337083816528} -09/21/2021 01:14:11 - INFO - __main__ - Step 49625: {'lr': 0.00019887759797982625, 'samples': 1588000, 'steps': 3101, 'loss/train': 2.9567317962646484} -09/21/2021 01:14:12 - INFO - __main__ - Step 49626: {'lr': 0.00019887759797982625, 'samples': 1588032, 'steps': 3101, 'loss/train': 1.9864983558654785} -09/21/2021 01:14:13 - INFO - __main__ - Step 49627: {'lr': 0.00019887759797982625, 'samples': 1588064, 'steps': 3101, 'loss/train': 1.4083844423294067} -09/21/2021 01:14:13 - INFO - __main__ - Step 49628: {'lr': 0.00019887759797982625, 'samples': 1588096, 'steps': 3101, 'loss/train': 1.7076081037521362} -09/21/2021 01:14:14 - INFO - __main__ - Step 49629: {'lr': 0.00019887759797982625, 'samples': 1588128, 'steps': 3101, 'loss/train': 1.7330412864685059} -09/21/2021 01:14:15 - INFO - __main__ - Step 49630: {'lr': 0.00019887759797982625, 'samples': 1588160, 'steps': 3101, 'loss/train': 2.086709499359131} -09/21/2021 01:14:16 - INFO - __main__ - Step 49631: {'lr': 0.00019887759797982625, 'samples': 1588192, 'steps': 3101, 'loss/train': 1.289830207824707} -09/21/2021 01:14:16 - INFO - __main__ - Step 49632: {'lr': 0.00019887759797982625, 'samples': 1588224, 'steps': 3101, 'loss/train': 1.6780564785003662} -09/21/2021 01:14:17 - INFO - __main__ - Step 49633: {'lr': 0.0001988766447394025, 'samples': 1588256, 'steps': 3102, 'loss/train': 2.072535276412964} -09/21/2021 01:14:18 - INFO - __main__ - Step 49634: {'lr': 0.0001988766447394025, 'samples': 1588288, 'steps': 3102, 'loss/train': 2.0314621925354004} -09/21/2021 01:14:19 - INFO - __main__ - Step 49635: {'lr': 0.0001988766447394025, 'samples': 1588320, 'steps': 3102, 'loss/train': 1.9170504808425903} -09/21/2021 01:14:20 - INFO - __main__ - Step 49636: {'lr': 0.0001988766447394025, 'samples': 1588352, 'steps': 3102, 'loss/train': 1.1709024906158447} -09/21/2021 01:14:20 - INFO - __main__ - Step 49637: {'lr': 0.0001988766447394025, 'samples': 1588384, 'steps': 3102, 'loss/train': 2.477620840072632} -09/21/2021 01:14:21 - INFO - __main__ - Step 49638: {'lr': 0.0001988766447394025, 'samples': 1588416, 'steps': 3102, 'loss/train': 1.7552480697631836} -09/21/2021 01:14:22 - INFO - __main__ - Step 49639: {'lr': 0.0001988766447394025, 'samples': 1588448, 'steps': 3102, 'loss/train': 1.8840479850769043} -09/21/2021 01:14:23 - INFO - __main__ - Step 49640: {'lr': 0.0001988766447394025, 'samples': 1588480, 'steps': 3102, 'loss/train': 1.7408114671707153} -09/21/2021 01:14:23 - INFO - __main__ - Step 49641: {'lr': 0.0001988766447394025, 'samples': 1588512, 'steps': 3102, 'loss/train': 2.2787926197052} -09/21/2021 01:14:25 - INFO - __main__ - Step 49642: {'lr': 0.0001988766447394025, 'samples': 1588544, 'steps': 3102, 'loss/train': 2.153440475463867} -09/21/2021 01:14:25 - INFO - __main__ - Step 49643: {'lr': 0.0001988766447394025, 'samples': 1588576, 'steps': 3102, 'loss/train': 2.5738894939422607} -09/21/2021 01:14:26 - INFO - __main__ - Step 49644: {'lr': 0.0001988766447394025, 'samples': 1588608, 'steps': 3102, 'loss/train': 5.008352756500244} -09/21/2021 01:14:27 - INFO - __main__ - Step 49645: {'lr': 0.0001988766447394025, 'samples': 1588640, 'steps': 3102, 'loss/train': 2.649553060531616} -09/21/2021 01:14:28 - INFO - __main__ - Step 49646: {'lr': 0.0001988766447394025, 'samples': 1588672, 'steps': 3102, 'loss/train': 1.7992113828659058} -09/21/2021 01:14:28 - INFO - __main__ - Step 49647: {'lr': 0.0001988766447394025, 'samples': 1588704, 'steps': 3102, 'loss/train': 1.6932092905044556} -09/21/2021 01:14:29 - INFO - __main__ - Step 49648: {'lr': 0.0001988766447394025, 'samples': 1588736, 'steps': 3102, 'loss/train': 2.556729555130005} -09/21/2021 01:14:30 - INFO - __main__ - Step 49649: {'lr': 0.0001988756910966501, 'samples': 1588768, 'steps': 3103, 'loss/train': 1.6460630893707275} -09/21/2021 01:14:31 - INFO - __main__ - Step 49650: {'lr': 0.0001988756910966501, 'samples': 1588800, 'steps': 3103, 'loss/train': 1.075819969177246} -09/21/2021 01:14:31 - INFO - __main__ - Step 49651: {'lr': 0.0001988756910966501, 'samples': 1588832, 'steps': 3103, 'loss/train': 1.4542698860168457} -09/21/2021 01:14:32 - INFO - __main__ - Step 49652: {'lr': 0.0001988756910966501, 'samples': 1588864, 'steps': 3103, 'loss/train': 2.3616111278533936} -09/21/2021 01:14:33 - INFO - __main__ - Step 49653: {'lr': 0.0001988756910966501, 'samples': 1588896, 'steps': 3103, 'loss/train': 0.94580078125} -09/21/2021 01:14:34 - INFO - __main__ - Step 49654: {'lr': 0.0001988756910966501, 'samples': 1588928, 'steps': 3103, 'loss/train': 1.1804083585739136} -09/21/2021 01:14:34 - INFO - __main__ - Step 49655: {'lr': 0.0001988756910966501, 'samples': 1588960, 'steps': 3103, 'loss/train': 1.6976901292800903} -09/21/2021 01:14:35 - INFO - __main__ - Step 49656: {'lr': 0.0001988756910966501, 'samples': 1588992, 'steps': 3103, 'loss/train': 1.6325663328170776} -09/21/2021 01:14:36 - INFO - __main__ - Step 49657: {'lr': 0.0001988756910966501, 'samples': 1589024, 'steps': 3103, 'loss/train': 0.9009270668029785} -09/21/2021 01:14:37 - INFO - __main__ - Step 49658: {'lr': 0.0001988756910966501, 'samples': 1589056, 'steps': 3103, 'loss/train': 2.2464852333068848} -09/21/2021 01:14:37 - INFO - __main__ - Step 49659: {'lr': 0.0001988756910966501, 'samples': 1589088, 'steps': 3103, 'loss/train': 2.1237175464630127} -09/21/2021 01:14:38 - INFO - __main__ - Step 49660: {'lr': 0.0001988756910966501, 'samples': 1589120, 'steps': 3103, 'loss/train': 3.172452449798584} -09/21/2021 01:14:39 - INFO - __main__ - Step 49661: {'lr': 0.0001988756910966501, 'samples': 1589152, 'steps': 3103, 'loss/train': 1.845544695854187} -09/21/2021 01:14:40 - INFO - __main__ - Step 49662: {'lr': 0.0001988756910966501, 'samples': 1589184, 'steps': 3103, 'loss/train': 1.6173794269561768} -09/21/2021 01:14:40 - INFO - __main__ - Step 49663: {'lr': 0.0001988756910966501, 'samples': 1589216, 'steps': 3103, 'loss/train': 1.530135154724121} -09/21/2021 01:14:41 - INFO - __main__ - Step 49664: {'lr': 0.0001988756910966501, 'samples': 1589248, 'steps': 3103, 'loss/train': 1.1837620735168457} -09/21/2021 01:14:42 - INFO - __main__ - Step 49665: {'lr': 0.00019887473705157288, 'samples': 1589280, 'steps': 3104, 'loss/train': 0.7107484936714172} -09/21/2021 01:14:43 - INFO - __main__ - Step 49666: {'lr': 0.00019887473705157288, 'samples': 1589312, 'steps': 3104, 'loss/train': 1.570874810218811} -09/21/2021 01:14:44 - INFO - __main__ - Step 49667: {'lr': 0.00019887473705157288, 'samples': 1589344, 'steps': 3104, 'loss/train': 2.4941811561584473} -09/21/2021 01:14:44 - INFO - __main__ - Step 49668: {'lr': 0.00019887473705157288, 'samples': 1589376, 'steps': 3104, 'loss/train': 1.9457768201828003} -09/21/2021 01:14:45 - INFO - __main__ - Step 49669: {'lr': 0.00019887473705157288, 'samples': 1589408, 'steps': 3104, 'loss/train': 2.6349263191223145} -09/21/2021 01:14:46 - INFO - __main__ - Step 49670: {'lr': 0.00019887473705157288, 'samples': 1589440, 'steps': 3104, 'loss/train': 1.4939552545547485} -09/21/2021 01:14:47 - INFO - __main__ - Step 49671: {'lr': 0.00019887473705157288, 'samples': 1589472, 'steps': 3104, 'loss/train': 1.7916356325149536} -09/21/2021 01:14:48 - INFO - __main__ - Step 49672: {'lr': 0.00019887473705157288, 'samples': 1589504, 'steps': 3104, 'loss/train': 1.8430476188659668} -09/21/2021 01:14:49 - INFO - __main__ - Step 49673: {'lr': 0.00019887473705157288, 'samples': 1589536, 'steps': 3104, 'loss/train': 1.80158269405365} -09/21/2021 01:14:49 - INFO - __main__ - Step 49674: {'lr': 0.00019887473705157288, 'samples': 1589568, 'steps': 3104, 'loss/train': 1.8367091417312622} -09/21/2021 01:14:50 - INFO - __main__ - Step 49675: {'lr': 0.00019887473705157288, 'samples': 1589600, 'steps': 3104, 'loss/train': 2.068549871444702} -09/21/2021 01:14:51 - INFO - __main__ - Step 49676: {'lr': 0.00019887473705157288, 'samples': 1589632, 'steps': 3104, 'loss/train': 1.7124077081680298} -09/21/2021 01:14:52 - INFO - __main__ - Step 49677: {'lr': 0.00019887473705157288, 'samples': 1589664, 'steps': 3104, 'loss/train': 1.299878716468811} -09/21/2021 01:14:52 - INFO - __main__ - Step 49678: {'lr': 0.00019887473705157288, 'samples': 1589696, 'steps': 3104, 'loss/train': 0.7839471101760864} -09/21/2021 01:14:53 - INFO - __main__ - Step 49679: {'lr': 0.00019887473705157288, 'samples': 1589728, 'steps': 3104, 'loss/train': 1.4200737476348877} -09/21/2021 01:14:54 - INFO - __main__ - Step 49680: {'lr': 0.00019887473705157288, 'samples': 1589760, 'steps': 3104, 'loss/train': 1.626668095588684} -09/21/2021 01:14:55 - INFO - __main__ - Step 49681: {'lr': 0.00019887378260417476, 'samples': 1589792, 'steps': 3105, 'loss/train': 1.9066816568374634} -09/21/2021 01:14:56 - INFO - __main__ - Step 49682: {'lr': 0.00019887378260417476, 'samples': 1589824, 'steps': 3105, 'loss/train': 2.576364040374756} -09/21/2021 01:14:56 - INFO - __main__ - Step 49683: {'lr': 0.00019887378260417476, 'samples': 1589856, 'steps': 3105, 'loss/train': 1.4603056907653809} -09/21/2021 01:14:57 - INFO - __main__ - Step 49684: {'lr': 0.00019887378260417476, 'samples': 1589888, 'steps': 3105, 'loss/train': 2.232992172241211} -09/21/2021 01:14:58 - INFO - __main__ - Step 49685: {'lr': 0.00019887378260417476, 'samples': 1589920, 'steps': 3105, 'loss/train': 2.3763720989227295} -09/21/2021 01:14:59 - INFO - __main__ - Step 49686: {'lr': 0.00019887378260417476, 'samples': 1589952, 'steps': 3105, 'loss/train': 2.031963348388672} -09/21/2021 01:14:59 - INFO - __main__ - Step 49687: {'lr': 0.00019887378260417476, 'samples': 1589984, 'steps': 3105, 'loss/train': 1.8081061840057373} -09/21/2021 01:15:00 - INFO - __main__ - Step 49688: {'lr': 0.00019887378260417476, 'samples': 1590016, 'steps': 3105, 'loss/train': 1.1110161542892456} -09/21/2021 01:15:01 - INFO - __main__ - Step 49689: {'lr': 0.00019887378260417476, 'samples': 1590048, 'steps': 3105, 'loss/train': 2.0885045528411865} -09/21/2021 01:15:02 - INFO - __main__ - Step 49690: {'lr': 0.00019887378260417476, 'samples': 1590080, 'steps': 3105, 'loss/train': 1.619615912437439} -09/21/2021 01:15:02 - INFO - __main__ - Step 49691: {'lr': 0.00019887378260417476, 'samples': 1590112, 'steps': 3105, 'loss/train': 2.2636055946350098} -09/21/2021 01:15:03 - INFO - __main__ - Step 49692: {'lr': 0.00019887378260417476, 'samples': 1590144, 'steps': 3105, 'loss/train': 0.271660178899765} -09/21/2021 01:15:04 - INFO - __main__ - Step 49693: {'lr': 0.00019887378260417476, 'samples': 1590176, 'steps': 3105, 'loss/train': 2.5752146244049072} -09/21/2021 01:15:05 - INFO - __main__ - Step 49694: {'lr': 0.00019887378260417476, 'samples': 1590208, 'steps': 3105, 'loss/train': 3.5306951999664307} -09/21/2021 01:15:05 - INFO - __main__ - Step 49695: {'lr': 0.00019887378260417476, 'samples': 1590240, 'steps': 3105, 'loss/train': 2.122593402862549} -09/21/2021 01:15:06 - INFO - __main__ - Step 49696: {'lr': 0.00019887378260417476, 'samples': 1590272, 'steps': 3105, 'loss/train': 2.4205682277679443} -09/21/2021 01:15:07 - INFO - __main__ - Step 49697: {'lr': 0.0001988728277544596, 'samples': 1590304, 'steps': 3106, 'loss/train': 1.5085198879241943} -09/21/2021 01:15:08 - INFO - __main__ - Step 49698: {'lr': 0.0001988728277544596, 'samples': 1590336, 'steps': 3106, 'loss/train': 1.378337025642395} -09/21/2021 01:15:08 - INFO - __main__ - Step 49699: {'lr': 0.0001988728277544596, 'samples': 1590368, 'steps': 3106, 'loss/train': 1.7624938488006592} -09/21/2021 01:15:09 - INFO - __main__ - Step 49700: {'lr': 0.0001988728277544596, 'samples': 1590400, 'steps': 3106, 'loss/train': 2.930652141571045} -09/21/2021 01:15:10 - INFO - __main__ - Step 49701: {'lr': 0.0001988728277544596, 'samples': 1590432, 'steps': 3106, 'loss/train': 1.3009060621261597} -09/21/2021 01:15:11 - INFO - __main__ - Step 49702: {'lr': 0.0001988728277544596, 'samples': 1590464, 'steps': 3106, 'loss/train': 1.9022537469863892} -09/21/2021 01:15:12 - INFO - __main__ - Step 49703: {'lr': 0.0001988728277544596, 'samples': 1590496, 'steps': 3106, 'loss/train': 1.8864209651947021} -09/21/2021 01:15:13 - INFO - __main__ - Step 49704: {'lr': 0.0001988728277544596, 'samples': 1590528, 'steps': 3106, 'loss/train': 5.407497406005859} -09/21/2021 01:15:14 - INFO - __main__ - Step 49705: {'lr': 0.0001988728277544596, 'samples': 1590560, 'steps': 3106, 'loss/train': 2.0156188011169434} -09/21/2021 01:15:15 - INFO - __main__ - Step 49706: {'lr': 0.0001988728277544596, 'samples': 1590592, 'steps': 3106, 'loss/train': 1.2431772947311401} -09/21/2021 01:15:15 - INFO - __main__ - Step 49707: {'lr': 0.0001988728277544596, 'samples': 1590624, 'steps': 3106, 'loss/train': 1.8944064378738403} -09/21/2021 01:15:16 - INFO - __main__ - Step 49708: {'lr': 0.0001988728277544596, 'samples': 1590656, 'steps': 3106, 'loss/train': 2.698320150375366} -09/21/2021 01:15:17 - INFO - __main__ - Step 49709: {'lr': 0.0001988728277544596, 'samples': 1590688, 'steps': 3106, 'loss/train': 2.579474449157715} -09/21/2021 01:15:18 - INFO - __main__ - Step 49710: {'lr': 0.0001988728277544596, 'samples': 1590720, 'steps': 3106, 'loss/train': 2.468097686767578} -09/21/2021 01:15:18 - INFO - __main__ - Step 49711: {'lr': 0.0001988728277544596, 'samples': 1590752, 'steps': 3106, 'loss/train': 0.8300555944442749} -09/21/2021 01:15:19 - INFO - __main__ - Step 49712: {'lr': 0.0001988728277544596, 'samples': 1590784, 'steps': 3106, 'loss/train': 1.9441968202590942} -09/21/2021 01:15:20 - INFO - __main__ - Step 49713: {'lr': 0.00019887187250243127, 'samples': 1590816, 'steps': 3107, 'loss/train': 1.2953723669052124} -09/21/2021 01:15:21 - INFO - __main__ - Step 49714: {'lr': 0.00019887187250243127, 'samples': 1590848, 'steps': 3107, 'loss/train': 1.3542786836624146} -09/21/2021 01:15:22 - INFO - __main__ - Step 49715: {'lr': 0.00019887187250243127, 'samples': 1590880, 'steps': 3107, 'loss/train': 1.7596731185913086} -09/21/2021 01:15:22 - INFO - __main__ - Step 49716: {'lr': 0.00019887187250243127, 'samples': 1590912, 'steps': 3107, 'loss/train': 0.2966572344303131} -09/21/2021 01:15:23 - INFO - __main__ - Step 49717: {'lr': 0.00019887187250243127, 'samples': 1590944, 'steps': 3107, 'loss/train': 0.5433789491653442} -09/21/2021 01:15:24 - INFO - __main__ - Step 49718: {'lr': 0.00019887187250243127, 'samples': 1590976, 'steps': 3107, 'loss/train': 0.20859017968177795} -09/21/2021 01:15:25 - INFO - __main__ - Step 49719: {'lr': 0.00019887187250243127, 'samples': 1591008, 'steps': 3107, 'loss/train': 0.15004564821720123} -09/21/2021 01:15:25 - INFO - __main__ - Step 49720: {'lr': 0.00019887187250243127, 'samples': 1591040, 'steps': 3107, 'loss/train': 0.12876109778881073} -09/21/2021 01:15:26 - INFO - __main__ - Step 49721: {'lr': 0.00019887187250243127, 'samples': 1591072, 'steps': 3107, 'loss/train': 0.25782060623168945} -09/21/2021 01:15:27 - INFO - __main__ - Step 49722: {'lr': 0.00019887187250243127, 'samples': 1591104, 'steps': 3107, 'loss/train': 0.2662268579006195} -09/21/2021 01:15:28 - INFO - __main__ - Step 49723: {'lr': 0.00019887187250243127, 'samples': 1591136, 'steps': 3107, 'loss/train': 0.5113983750343323} -09/21/2021 01:15:28 - INFO - __main__ - Step 49724: {'lr': 0.00019887187250243127, 'samples': 1591168, 'steps': 3107, 'loss/train': 2.5942697525024414} -09/21/2021 01:15:29 - INFO - __main__ - Step 49725: {'lr': 0.00019887187250243127, 'samples': 1591200, 'steps': 3107, 'loss/train': 1.9319769144058228} -09/21/2021 01:15:30 - INFO - __main__ - Step 49726: {'lr': 0.00019887187250243127, 'samples': 1591232, 'steps': 3107, 'loss/train': 1.516049861907959} -09/21/2021 01:15:31 - INFO - __main__ - Step 49727: {'lr': 0.00019887187250243127, 'samples': 1591264, 'steps': 3107, 'loss/train': 1.8745676279067993} -09/21/2021 01:15:31 - INFO - __main__ - Step 49728: {'lr': 0.00019887187250243127, 'samples': 1591296, 'steps': 3107, 'loss/train': 1.8580210208892822} -09/21/2021 01:15:32 - INFO - __main__ - Step 49729: {'lr': 0.00019887091684809365, 'samples': 1591328, 'steps': 3108, 'loss/train': 1.984983205795288} -09/21/2021 01:15:33 - INFO - __main__ - Step 49730: {'lr': 0.00019887091684809365, 'samples': 1591360, 'steps': 3108, 'loss/train': 2.1487810611724854} -09/21/2021 01:15:34 - INFO - __main__ - Step 49731: {'lr': 0.00019887091684809365, 'samples': 1591392, 'steps': 3108, 'loss/train': 2.1549363136291504} -09/21/2021 01:15:34 - INFO - __main__ - Step 49732: {'lr': 0.00019887091684809365, 'samples': 1591424, 'steps': 3108, 'loss/train': 0.9645564556121826} -09/21/2021 01:15:35 - INFO - __main__ - Step 49733: {'lr': 0.00019887091684809365, 'samples': 1591456, 'steps': 3108, 'loss/train': 1.553181767463684} -09/21/2021 01:15:36 - INFO - __main__ - Step 49734: {'lr': 0.00019887091684809365, 'samples': 1591488, 'steps': 3108, 'loss/train': 2.3658952713012695} -09/21/2021 01:15:37 - INFO - __main__ - Step 49735: {'lr': 0.00019887091684809365, 'samples': 1591520, 'steps': 3108, 'loss/train': 2.4047365188598633} -09/21/2021 01:15:38 - INFO - __main__ - Step 49736: {'lr': 0.00019887091684809365, 'samples': 1591552, 'steps': 3108, 'loss/train': 2.1354777812957764} -09/21/2021 01:15:39 - INFO - __main__ - Step 49737: {'lr': 0.00019887091684809365, 'samples': 1591584, 'steps': 3108, 'loss/train': 1.1845905780792236} -09/21/2021 01:15:39 - INFO - __main__ - Step 49738: {'lr': 0.00019887091684809365, 'samples': 1591616, 'steps': 3108, 'loss/train': 1.7716021537780762} -09/21/2021 01:15:40 - INFO - __main__ - Step 49739: {'lr': 0.00019887091684809365, 'samples': 1591648, 'steps': 3108, 'loss/train': 2.716925859451294} -09/21/2021 01:15:41 - INFO - __main__ - Step 49740: {'lr': 0.00019887091684809365, 'samples': 1591680, 'steps': 3108, 'loss/train': 1.9846384525299072} -09/21/2021 01:15:42 - INFO - __main__ - Step 49741: {'lr': 0.00019887091684809365, 'samples': 1591712, 'steps': 3108, 'loss/train': 2.315413475036621} -09/21/2021 01:15:42 - INFO - __main__ - Step 49742: {'lr': 0.00019887091684809365, 'samples': 1591744, 'steps': 3108, 'loss/train': 2.029344081878662} -09/21/2021 01:15:43 - INFO - __main__ - Step 49743: {'lr': 0.00019887091684809365, 'samples': 1591776, 'steps': 3108, 'loss/train': 2.4373974800109863} -09/21/2021 01:15:44 - INFO - __main__ - Step 49744: {'lr': 0.00019887091684809365, 'samples': 1591808, 'steps': 3108, 'loss/train': 2.025980234146118} -09/21/2021 01:15:45 - INFO - __main__ - Step 49745: {'lr': 0.0001988699607914507, 'samples': 1591840, 'steps': 3109, 'loss/train': 1.0765280723571777} -09/21/2021 01:15:46 - INFO - __main__ - Step 49746: {'lr': 0.0001988699607914507, 'samples': 1591872, 'steps': 3109, 'loss/train': 1.9866245985031128} -09/21/2021 01:15:46 - INFO - __main__ - Step 49747: {'lr': 0.0001988699607914507, 'samples': 1591904, 'steps': 3109, 'loss/train': 2.280344247817993} -09/21/2021 01:15:47 - INFO - __main__ - Step 49748: {'lr': 0.0001988699607914507, 'samples': 1591936, 'steps': 3109, 'loss/train': 1.9011499881744385} -09/21/2021 01:15:48 - INFO - __main__ - Step 49749: {'lr': 0.0001988699607914507, 'samples': 1591968, 'steps': 3109, 'loss/train': 2.1988797187805176} -09/21/2021 01:15:49 - INFO - __main__ - Step 49750: {'lr': 0.0001988699607914507, 'samples': 1592000, 'steps': 3109, 'loss/train': 2.5097835063934326} -09/21/2021 01:15:49 - INFO - __main__ - Step 49751: {'lr': 0.0001988699607914507, 'samples': 1592032, 'steps': 3109, 'loss/train': 2.982948064804077} -09/21/2021 01:15:50 - INFO - __main__ - Step 49752: {'lr': 0.0001988699607914507, 'samples': 1592064, 'steps': 3109, 'loss/train': 0.7451680898666382} -09/21/2021 01:15:51 - INFO - __main__ - Step 49753: {'lr': 0.0001988699607914507, 'samples': 1592096, 'steps': 3109, 'loss/train': 1.5879360437393188} -09/21/2021 01:15:52 - INFO - __main__ - Step 49754: {'lr': 0.0001988699607914507, 'samples': 1592128, 'steps': 3109, 'loss/train': 2.419832706451416} -09/21/2021 01:15:52 - INFO - __main__ - Step 49755: {'lr': 0.0001988699607914507, 'samples': 1592160, 'steps': 3109, 'loss/train': 2.1307761669158936} -09/21/2021 01:15:53 - INFO - __main__ - Step 49756: {'lr': 0.0001988699607914507, 'samples': 1592192, 'steps': 3109, 'loss/train': 2.3000643253326416} -09/21/2021 01:15:54 - INFO - __main__ - Step 49757: {'lr': 0.0001988699607914507, 'samples': 1592224, 'steps': 3109, 'loss/train': 1.316919207572937} -09/21/2021 01:15:55 - INFO - __main__ - Step 49758: {'lr': 0.0001988699607914507, 'samples': 1592256, 'steps': 3109, 'loss/train': 2.123011589050293} -09/21/2021 01:15:55 - INFO - __main__ - Step 49759: {'lr': 0.0001988699607914507, 'samples': 1592288, 'steps': 3109, 'loss/train': 1.4786456823349} -09/21/2021 01:15:56 - INFO - __main__ - Step 49760: {'lr': 0.0001988699607914507, 'samples': 1592320, 'steps': 3109, 'loss/train': 2.4581458568573} -09/21/2021 01:15:57 - INFO - __main__ - Step 49761: {'lr': 0.00019886900433250623, 'samples': 1592352, 'steps': 3110, 'loss/train': 2.8657219409942627} -09/21/2021 01:15:58 - INFO - __main__ - Step 49762: {'lr': 0.00019886900433250623, 'samples': 1592384, 'steps': 3110, 'loss/train': 2.277592897415161} -09/21/2021 01:15:58 - INFO - __main__ - Step 49763: {'lr': 0.00019886900433250623, 'samples': 1592416, 'steps': 3110, 'loss/train': 1.4237301349639893} -09/21/2021 01:15:59 - INFO - __main__ - Step 49764: {'lr': 0.00019886900433250623, 'samples': 1592448, 'steps': 3110, 'loss/train': 1.9766204357147217} -09/21/2021 01:16:01 - INFO - __main__ - Step 49765: {'lr': 0.00019886900433250623, 'samples': 1592480, 'steps': 3110, 'loss/train': 2.9655213356018066} -09/21/2021 01:16:02 - INFO - __main__ - Step 49766: {'lr': 0.00019886900433250623, 'samples': 1592512, 'steps': 3110, 'loss/train': 2.224619150161743} -09/21/2021 01:16:03 - INFO - __main__ - Step 49767: {'lr': 0.00019886900433250623, 'samples': 1592544, 'steps': 3110, 'loss/train': 1.2384179830551147} -09/21/2021 01:16:03 - INFO - __main__ - Step 49768: {'lr': 0.00019886900433250623, 'samples': 1592576, 'steps': 3110, 'loss/train': 1.953711748123169} -09/21/2021 01:16:04 - INFO - __main__ - Step 49769: {'lr': 0.00019886900433250623, 'samples': 1592608, 'steps': 3110, 'loss/train': 2.0343871116638184} -09/21/2021 01:16:05 - INFO - __main__ - Step 49770: {'lr': 0.00019886900433250623, 'samples': 1592640, 'steps': 3110, 'loss/train': 1.959947109222412} -09/21/2021 01:16:06 - INFO - __main__ - Step 49771: {'lr': 0.00019886900433250623, 'samples': 1592672, 'steps': 3110, 'loss/train': 2.038329601287842} -09/21/2021 01:16:06 - INFO - __main__ - Step 49772: {'lr': 0.00019886900433250623, 'samples': 1592704, 'steps': 3110, 'loss/train': 2.0387468338012695} -09/21/2021 01:16:07 - INFO - __main__ - Step 49773: {'lr': 0.00019886900433250623, 'samples': 1592736, 'steps': 3110, 'loss/train': 1.8349285125732422} -09/21/2021 01:16:08 - INFO - __main__ - Step 49774: {'lr': 0.00019886900433250623, 'samples': 1592768, 'steps': 3110, 'loss/train': 0.5797871351242065} -09/21/2021 01:16:09 - INFO - __main__ - Step 49775: {'lr': 0.00019886900433250623, 'samples': 1592800, 'steps': 3110, 'loss/train': 1.5702029466629028} -09/21/2021 01:16:09 - INFO - __main__ - Step 49776: {'lr': 0.00019886900433250623, 'samples': 1592832, 'steps': 3110, 'loss/train': 1.3667545318603516} -09/21/2021 01:16:10 - INFO - __main__ - Step 49777: {'lr': 0.00019886804747126416, 'samples': 1592864, 'steps': 3111, 'loss/train': 1.9794265031814575} -09/21/2021 01:16:11 - INFO - __main__ - Step 49778: {'lr': 0.00019886804747126416, 'samples': 1592896, 'steps': 3111, 'loss/train': 1.3897180557250977} -09/21/2021 01:16:12 - INFO - __main__ - Step 49779: {'lr': 0.00019886804747126416, 'samples': 1592928, 'steps': 3111, 'loss/train': 1.9592678546905518} -09/21/2021 01:16:12 - INFO - __main__ - Step 49780: {'lr': 0.00019886804747126416, 'samples': 1592960, 'steps': 3111, 'loss/train': 2.334561586380005} -09/21/2021 01:16:13 - INFO - __main__ - Step 49781: {'lr': 0.00019886804747126416, 'samples': 1592992, 'steps': 3111, 'loss/train': 2.4572927951812744} -09/21/2021 01:16:14 - INFO - __main__ - Step 49782: {'lr': 0.00019886804747126416, 'samples': 1593024, 'steps': 3111, 'loss/train': 1.8831340074539185} -09/21/2021 01:16:15 - INFO - __main__ - Step 49783: {'lr': 0.00019886804747126416, 'samples': 1593056, 'steps': 3111, 'loss/train': 2.1885313987731934} -09/21/2021 01:16:15 - INFO - __main__ - Step 49784: {'lr': 0.00019886804747126416, 'samples': 1593088, 'steps': 3111, 'loss/train': 1.7485381364822388} -09/21/2021 01:16:16 - INFO - __main__ - Step 49785: {'lr': 0.00019886804747126416, 'samples': 1593120, 'steps': 3111, 'loss/train': 1.2357968091964722} -09/21/2021 01:16:17 - INFO - __main__ - Step 49786: {'lr': 0.00019886804747126416, 'samples': 1593152, 'steps': 3111, 'loss/train': 2.14328670501709} -09/21/2021 01:16:18 - INFO - __main__ - Step 49787: {'lr': 0.00019886804747126416, 'samples': 1593184, 'steps': 3111, 'loss/train': 1.6838648319244385} -09/21/2021 01:16:18 - INFO - __main__ - Step 49788: {'lr': 0.00019886804747126416, 'samples': 1593216, 'steps': 3111, 'loss/train': 1.2684626579284668} -09/21/2021 01:16:19 - INFO - __main__ - Step 49789: {'lr': 0.00019886804747126416, 'samples': 1593248, 'steps': 3111, 'loss/train': 0.32219162583351135} -09/21/2021 01:16:20 - INFO - __main__ - Step 49790: {'lr': 0.00019886804747126416, 'samples': 1593280, 'steps': 3111, 'loss/train': 2.2586169242858887} -09/21/2021 01:16:21 - INFO - __main__ - Step 49791: {'lr': 0.00019886804747126416, 'samples': 1593312, 'steps': 3111, 'loss/train': 1.6774777173995972} -09/21/2021 01:16:21 - INFO - __main__ - Step 49792: {'lr': 0.00019886804747126416, 'samples': 1593344, 'steps': 3111, 'loss/train': 1.9689706563949585} -09/21/2021 01:16:22 - INFO - __main__ - Step 49793: {'lr': 0.00019886709020772845, 'samples': 1593376, 'steps': 3112, 'loss/train': 1.4886311292648315} -09/21/2021 01:16:23 - INFO - __main__ - Step 49794: {'lr': 0.00019886709020772845, 'samples': 1593408, 'steps': 3112, 'loss/train': 2.429863691329956} -09/21/2021 01:16:24 - INFO - __main__ - Step 49795: {'lr': 0.00019886709020772845, 'samples': 1593440, 'steps': 3112, 'loss/train': 2.2577672004699707} -09/21/2021 01:16:25 - INFO - __main__ - Step 49796: {'lr': 0.00019886709020772845, 'samples': 1593472, 'steps': 3112, 'loss/train': 1.0304388999938965} -09/21/2021 01:16:26 - INFO - __main__ - Step 49797: {'lr': 0.00019886709020772845, 'samples': 1593504, 'steps': 3112, 'loss/train': 2.214468240737915} -09/21/2021 01:16:27 - INFO - __main__ - Step 49798: {'lr': 0.00019886709020772845, 'samples': 1593536, 'steps': 3112, 'loss/train': 2.4294371604919434} -09/21/2021 01:16:27 - INFO - __main__ - Step 49799: {'lr': 0.00019886709020772845, 'samples': 1593568, 'steps': 3112, 'loss/train': 3.5547494888305664} -09/21/2021 01:16:28 - INFO - __main__ - Step 49800: {'lr': 0.00019886709020772845, 'samples': 1593600, 'steps': 3112, 'loss/train': 1.5682166814804077} -09/21/2021 01:16:29 - INFO - __main__ - Step 49801: {'lr': 0.00019886709020772845, 'samples': 1593632, 'steps': 3112, 'loss/train': 1.9589314460754395} -09/21/2021 01:16:30 - INFO - __main__ - Step 49802: {'lr': 0.00019886709020772845, 'samples': 1593664, 'steps': 3112, 'loss/train': 0.40528762340545654} -09/21/2021 01:16:30 - INFO - __main__ - Step 49803: {'lr': 0.00019886709020772845, 'samples': 1593696, 'steps': 3112, 'loss/train': 1.3360234498977661} -09/21/2021 01:16:31 - INFO - __main__ - Step 49804: {'lr': 0.00019886709020772845, 'samples': 1593728, 'steps': 3112, 'loss/train': 2.4027650356292725} -09/21/2021 01:16:32 - INFO - __main__ - Step 49805: {'lr': 0.00019886709020772845, 'samples': 1593760, 'steps': 3112, 'loss/train': 2.6239893436431885} -09/21/2021 01:16:33 - INFO - __main__ - Step 49806: {'lr': 0.00019886709020772845, 'samples': 1593792, 'steps': 3112, 'loss/train': 2.1689863204956055} -09/21/2021 01:16:33 - INFO - __main__ - Step 49807: {'lr': 0.00019886709020772845, 'samples': 1593824, 'steps': 3112, 'loss/train': 1.173625111579895} -09/21/2021 01:16:34 - INFO - __main__ - Step 49808: {'lr': 0.00019886709020772845, 'samples': 1593856, 'steps': 3112, 'loss/train': 0.7335273623466492} -09/21/2021 01:16:35 - INFO - __main__ - Step 49809: {'lr': 0.00019886613254190287, 'samples': 1593888, 'steps': 3113, 'loss/train': 1.603639006614685} -09/21/2021 01:16:36 - INFO - __main__ - Step 49810: {'lr': 0.00019886613254190287, 'samples': 1593920, 'steps': 3113, 'loss/train': 1.945695161819458} -09/21/2021 01:16:37 - INFO - __main__ - Step 49811: {'lr': 0.00019886613254190287, 'samples': 1593952, 'steps': 3113, 'loss/train': 1.673090934753418} -09/21/2021 01:16:37 - INFO - __main__ - Step 49812: {'lr': 0.00019886613254190287, 'samples': 1593984, 'steps': 3113, 'loss/train': 2.2533347606658936} -09/21/2021 01:16:38 - INFO - __main__ - Step 49813: {'lr': 0.00019886613254190287, 'samples': 1594016, 'steps': 3113, 'loss/train': 2.361334800720215} -09/21/2021 01:16:39 - INFO - __main__ - Step 49814: {'lr': 0.00019886613254190287, 'samples': 1594048, 'steps': 3113, 'loss/train': 1.3301444053649902} -09/21/2021 01:16:40 - INFO - __main__ - Step 49815: {'lr': 0.00019886613254190287, 'samples': 1594080, 'steps': 3113, 'loss/train': 0.8437974452972412} -09/21/2021 01:16:40 - INFO - __main__ - Step 49816: {'lr': 0.00019886613254190287, 'samples': 1594112, 'steps': 3113, 'loss/train': 0.9477530121803284} -09/21/2021 01:16:41 - INFO - __main__ - Step 49817: {'lr': 0.00019886613254190287, 'samples': 1594144, 'steps': 3113, 'loss/train': 1.898355484008789} -09/21/2021 01:16:42 - INFO - __main__ - Step 49818: {'lr': 0.00019886613254190287, 'samples': 1594176, 'steps': 3113, 'loss/train': 1.8466085195541382} -09/21/2021 01:16:43 - INFO - __main__ - Step 49819: {'lr': 0.00019886613254190287, 'samples': 1594208, 'steps': 3113, 'loss/train': 2.0510566234588623} -09/21/2021 01:16:43 - INFO - __main__ - Step 49820: {'lr': 0.00019886613254190287, 'samples': 1594240, 'steps': 3113, 'loss/train': 2.270216464996338} -09/21/2021 01:16:44 - INFO - __main__ - Step 49821: {'lr': 0.00019886613254190287, 'samples': 1594272, 'steps': 3113, 'loss/train': 1.3859670162200928} -09/21/2021 01:16:45 - INFO - __main__ - Step 49822: {'lr': 0.00019886613254190287, 'samples': 1594304, 'steps': 3113, 'loss/train': 0.6751554608345032} -09/21/2021 01:16:46 - INFO - __main__ - Step 49823: {'lr': 0.00019886613254190287, 'samples': 1594336, 'steps': 3113, 'loss/train': 1.6444083452224731} -09/21/2021 01:16:46 - INFO - __main__ - Step 49824: {'lr': 0.00019886613254190287, 'samples': 1594368, 'steps': 3113, 'loss/train': 1.6052769422531128} -09/21/2021 01:16:47 - INFO - __main__ - Step 49825: {'lr': 0.0001988651744737914, 'samples': 1594400, 'steps': 3114, 'loss/train': 1.7338180541992188} -09/21/2021 01:16:48 - INFO - __main__ - Step 49826: {'lr': 0.0001988651744737914, 'samples': 1594432, 'steps': 3114, 'loss/train': 0.24954098463058472} -09/21/2021 01:16:49 - INFO - __main__ - Step 49827: {'lr': 0.0001988651744737914, 'samples': 1594464, 'steps': 3114, 'loss/train': 2.141688346862793} -09/21/2021 01:16:50 - INFO - __main__ - Step 49828: {'lr': 0.0001988651744737914, 'samples': 1594496, 'steps': 3114, 'loss/train': 1.9296822547912598} -09/21/2021 01:16:51 - INFO - __main__ - Step 49829: {'lr': 0.0001988651744737914, 'samples': 1594528, 'steps': 3114, 'loss/train': 1.6096059083938599} -09/21/2021 01:16:51 - INFO - __main__ - Step 49830: {'lr': 0.0001988651744737914, 'samples': 1594560, 'steps': 3114, 'loss/train': 1.5805516242980957} -09/21/2021 01:16:52 - INFO - __main__ - Step 49831: {'lr': 0.0001988651744737914, 'samples': 1594592, 'steps': 3114, 'loss/train': 2.1893839836120605} -09/21/2021 01:16:53 - INFO - __main__ - Step 49832: {'lr': 0.0001988651744737914, 'samples': 1594624, 'steps': 3114, 'loss/train': 1.8661935329437256} -09/21/2021 01:16:54 - INFO - __main__ - Step 49833: {'lr': 0.0001988651744737914, 'samples': 1594656, 'steps': 3114, 'loss/train': 1.7844634056091309} -09/21/2021 01:16:54 - INFO - __main__ - Step 49834: {'lr': 0.0001988651744737914, 'samples': 1594688, 'steps': 3114, 'loss/train': 1.6341054439544678} -09/21/2021 01:16:55 - INFO - __main__ - Step 49835: {'lr': 0.0001988651744737914, 'samples': 1594720, 'steps': 3114, 'loss/train': 3.9475209712982178} -09/21/2021 01:16:56 - INFO - __main__ - Step 49836: {'lr': 0.0001988651744737914, 'samples': 1594752, 'steps': 3114, 'loss/train': 2.288140058517456} -09/21/2021 01:16:57 - INFO - __main__ - Step 49837: {'lr': 0.0001988651744737914, 'samples': 1594784, 'steps': 3114, 'loss/train': 1.146798014640808} -09/21/2021 01:16:57 - INFO - __main__ - Step 49838: {'lr': 0.0001988651744737914, 'samples': 1594816, 'steps': 3114, 'loss/train': 1.874954104423523} -09/21/2021 01:16:58 - INFO - __main__ - Step 49839: {'lr': 0.0001988651744737914, 'samples': 1594848, 'steps': 3114, 'loss/train': 1.9958089590072632} -09/21/2021 01:16:59 - INFO - __main__ - Step 49840: {'lr': 0.0001988651744737914, 'samples': 1594880, 'steps': 3114, 'loss/train': 2.1305155754089355} -09/21/2021 01:17:00 - INFO - __main__ - Step 49841: {'lr': 0.00019886421600339793, 'samples': 1594912, 'steps': 3115, 'loss/train': 1.7270759344100952} -09/21/2021 01:17:01 - INFO - __main__ - Step 49842: {'lr': 0.00019886421600339793, 'samples': 1594944, 'steps': 3115, 'loss/train': 1.3498342037200928} -09/21/2021 01:17:01 - INFO - __main__ - Step 49843: {'lr': 0.00019886421600339793, 'samples': 1594976, 'steps': 3115, 'loss/train': 2.7347466945648193} -09/21/2021 01:17:02 - INFO - __main__ - Step 49844: {'lr': 0.00019886421600339793, 'samples': 1595008, 'steps': 3115, 'loss/train': 1.9468144178390503} -09/21/2021 01:17:03 - INFO - __main__ - Step 49845: {'lr': 0.00019886421600339793, 'samples': 1595040, 'steps': 3115, 'loss/train': 1.8526748418807983} -09/21/2021 01:17:04 - INFO - __main__ - Step 49846: {'lr': 0.00019886421600339793, 'samples': 1595072, 'steps': 3115, 'loss/train': 1.0894368886947632} -09/21/2021 01:17:04 - INFO - __main__ - Step 49847: {'lr': 0.00019886421600339793, 'samples': 1595104, 'steps': 3115, 'loss/train': 1.3458091020584106} -09/21/2021 01:17:05 - INFO - __main__ - Step 49848: {'lr': 0.00019886421600339793, 'samples': 1595136, 'steps': 3115, 'loss/train': 0.7094192504882812} -09/21/2021 01:17:06 - INFO - __main__ - Step 49849: {'lr': 0.00019886421600339793, 'samples': 1595168, 'steps': 3115, 'loss/train': 2.0004539489746094} -09/21/2021 01:17:07 - INFO - __main__ - Step 49850: {'lr': 0.00019886421600339793, 'samples': 1595200, 'steps': 3115, 'loss/train': 1.926753282546997} -09/21/2021 01:17:07 - INFO - __main__ - Step 49851: {'lr': 0.00019886421600339793, 'samples': 1595232, 'steps': 3115, 'loss/train': 2.2199370861053467} -09/21/2021 01:17:08 - INFO - __main__ - Step 49852: {'lr': 0.00019886421600339793, 'samples': 1595264, 'steps': 3115, 'loss/train': 1.7915924787521362} -09/21/2021 01:17:09 - INFO - __main__ - Step 49853: {'lr': 0.00019886421600339793, 'samples': 1595296, 'steps': 3115, 'loss/train': 1.507541537284851} -09/21/2021 01:17:10 - INFO - __main__ - Step 49854: {'lr': 0.00019886421600339793, 'samples': 1595328, 'steps': 3115, 'loss/train': 2.302417278289795} -09/21/2021 01:17:10 - INFO - __main__ - Step 49855: {'lr': 0.00019886421600339793, 'samples': 1595360, 'steps': 3115, 'loss/train': 2.5548315048217773} -09/21/2021 01:17:11 - INFO - __main__ - Step 49856: {'lr': 0.00019886421600339793, 'samples': 1595392, 'steps': 3115, 'loss/train': 1.7845124006271362} -09/21/2021 01:17:13 - INFO - __main__ - Step 49857: {'lr': 0.00019886325713072632, 'samples': 1595424, 'steps': 3116, 'loss/train': 2.071998357772827} -09/21/2021 01:17:13 - INFO - __main__ - Step 49858: {'lr': 0.00019886325713072632, 'samples': 1595456, 'steps': 3116, 'loss/train': 2.423482656478882} -09/21/2021 01:17:14 - INFO - __main__ - Step 49859: {'lr': 0.00019886325713072632, 'samples': 1595488, 'steps': 3116, 'loss/train': 1.4802451133728027} -09/21/2021 01:17:15 - INFO - __main__ - Step 49860: {'lr': 0.00019886325713072632, 'samples': 1595520, 'steps': 3116, 'loss/train': 2.5488579273223877} -09/21/2021 01:17:16 - INFO - __main__ - Step 49861: {'lr': 0.00019886325713072632, 'samples': 1595552, 'steps': 3116, 'loss/train': 0.10735548287630081} -09/21/2021 01:17:16 - INFO - __main__ - Step 49862: {'lr': 0.00019886325713072632, 'samples': 1595584, 'steps': 3116, 'loss/train': 1.1589330434799194} -09/21/2021 01:17:17 - INFO - __main__ - Step 49863: {'lr': 0.00019886325713072632, 'samples': 1595616, 'steps': 3116, 'loss/train': 1.663339376449585} -09/21/2021 01:17:18 - INFO - __main__ - Step 49864: {'lr': 0.00019886325713072632, 'samples': 1595648, 'steps': 3116, 'loss/train': 1.6187632083892822} -09/21/2021 01:17:19 - INFO - __main__ - Step 49865: {'lr': 0.00019886325713072632, 'samples': 1595680, 'steps': 3116, 'loss/train': 1.9829543828964233} -09/21/2021 01:17:19 - INFO - __main__ - Step 49866: {'lr': 0.00019886325713072632, 'samples': 1595712, 'steps': 3116, 'loss/train': 1.5526596307754517} -09/21/2021 01:17:20 - INFO - __main__ - Step 49867: {'lr': 0.00019886325713072632, 'samples': 1595744, 'steps': 3116, 'loss/train': 1.499834656715393} -09/21/2021 01:17:21 - INFO - __main__ - Step 49868: {'lr': 0.00019886325713072632, 'samples': 1595776, 'steps': 3116, 'loss/train': 2.9499285221099854} -09/21/2021 01:17:22 - INFO - __main__ - Step 49869: {'lr': 0.00019886325713072632, 'samples': 1595808, 'steps': 3116, 'loss/train': 1.8651708364486694} -09/21/2021 01:17:22 - INFO - __main__ - Step 49870: {'lr': 0.00019886325713072632, 'samples': 1595840, 'steps': 3116, 'loss/train': 2.381650686264038} -09/21/2021 01:17:23 - INFO - __main__ - Step 49871: {'lr': 0.00019886325713072632, 'samples': 1595872, 'steps': 3116, 'loss/train': 1.4515864849090576} -09/21/2021 01:17:24 - INFO - __main__ - Step 49872: {'lr': 0.00019886325713072632, 'samples': 1595904, 'steps': 3116, 'loss/train': 1.6952494382858276} -09/21/2021 01:17:25 - INFO - __main__ - Step 49873: {'lr': 0.00019886229785578055, 'samples': 1595936, 'steps': 3117, 'loss/train': 1.980844497680664} -09/21/2021 01:17:25 - INFO - __main__ - Step 49874: {'lr': 0.00019886229785578055, 'samples': 1595968, 'steps': 3117, 'loss/train': 2.243724822998047} -09/21/2021 01:17:26 - INFO - __main__ - Step 49875: {'lr': 0.00019886229785578055, 'samples': 1596000, 'steps': 3117, 'loss/train': 1.8760462999343872} -09/21/2021 01:17:27 - INFO - __main__ - Step 49876: {'lr': 0.00019886229785578055, 'samples': 1596032, 'steps': 3117, 'loss/train': 2.2769691944122314} -09/21/2021 01:17:28 - INFO - __main__ - Step 49877: {'lr': 0.00019886229785578055, 'samples': 1596064, 'steps': 3117, 'loss/train': 1.801269292831421} -09/21/2021 01:17:28 - INFO - __main__ - Step 49878: {'lr': 0.00019886229785578055, 'samples': 1596096, 'steps': 3117, 'loss/train': 2.492680311203003} -09/21/2021 01:17:29 - INFO - __main__ - Step 49879: {'lr': 0.00019886229785578055, 'samples': 1596128, 'steps': 3117, 'loss/train': 2.28994083404541} -09/21/2021 01:17:30 - INFO - __main__ - Step 49880: {'lr': 0.00019886229785578055, 'samples': 1596160, 'steps': 3117, 'loss/train': 1.7346713542938232} -09/21/2021 01:17:31 - INFO - __main__ - Step 49881: {'lr': 0.00019886229785578055, 'samples': 1596192, 'steps': 3117, 'loss/train': 2.065685987472534} -09/21/2021 01:17:31 - INFO - __main__ - Step 49882: {'lr': 0.00019886229785578055, 'samples': 1596224, 'steps': 3117, 'loss/train': 1.5633569955825806} -09/21/2021 01:17:32 - INFO - __main__ - Step 49883: {'lr': 0.00019886229785578055, 'samples': 1596256, 'steps': 3117, 'loss/train': 2.3736608028411865} -09/21/2021 01:17:33 - INFO - __main__ - Step 49884: {'lr': 0.00019886229785578055, 'samples': 1596288, 'steps': 3117, 'loss/train': 2.2879998683929443} -09/21/2021 01:17:34 - INFO - __main__ - Step 49885: {'lr': 0.00019886229785578055, 'samples': 1596320, 'steps': 3117, 'loss/train': 1.5667997598648071} -09/21/2021 01:17:34 - INFO - __main__ - Step 49886: {'lr': 0.00019886229785578055, 'samples': 1596352, 'steps': 3117, 'loss/train': 2.477867364883423} -09/21/2021 01:17:35 - INFO - __main__ - Step 49887: {'lr': 0.00019886229785578055, 'samples': 1596384, 'steps': 3117, 'loss/train': 0.7180259823799133} -09/21/2021 01:17:36 - INFO - __main__ - Step 49888: {'lr': 0.00019886229785578055, 'samples': 1596416, 'steps': 3117, 'loss/train': 2.538119316101074} -09/21/2021 01:17:37 - INFO - __main__ - Step 49889: {'lr': 0.00019886133817856446, 'samples': 1596448, 'steps': 3118, 'loss/train': 0.7520202398300171} -09/21/2021 01:17:38 - INFO - __main__ - Step 49890: {'lr': 0.00019886133817856446, 'samples': 1596480, 'steps': 3118, 'loss/train': 1.8322622776031494} -09/21/2021 01:17:39 - INFO - __main__ - Step 49891: {'lr': 0.00019886133817856446, 'samples': 1596512, 'steps': 3118, 'loss/train': 2.0245296955108643} -09/21/2021 01:17:40 - INFO - __main__ - Step 49892: {'lr': 0.00019886133817856446, 'samples': 1596544, 'steps': 3118, 'loss/train': 0.21268391609191895} -09/21/2021 01:17:40 - INFO - __main__ - Step 49893: {'lr': 0.00019886133817856446, 'samples': 1596576, 'steps': 3118, 'loss/train': 1.4806057214736938} -09/21/2021 01:17:41 - INFO - __main__ - Step 49894: {'lr': 0.00019886133817856446, 'samples': 1596608, 'steps': 3118, 'loss/train': 1.4514323472976685} -09/21/2021 01:17:42 - INFO - __main__ - Step 49895: {'lr': 0.00019886133817856446, 'samples': 1596640, 'steps': 3118, 'loss/train': 1.55668306350708} -09/21/2021 01:17:43 - INFO - __main__ - Step 49896: {'lr': 0.00019886133817856446, 'samples': 1596672, 'steps': 3118, 'loss/train': 0.9236699342727661} -09/21/2021 01:17:43 - INFO - __main__ - Step 49897: {'lr': 0.00019886133817856446, 'samples': 1596704, 'steps': 3118, 'loss/train': 2.912004232406616} -09/21/2021 01:17:44 - INFO - __main__ - Step 49898: {'lr': 0.00019886133817856446, 'samples': 1596736, 'steps': 3118, 'loss/train': 1.6574772596359253} -09/21/2021 01:17:45 - INFO - __main__ - Step 49899: {'lr': 0.00019886133817856446, 'samples': 1596768, 'steps': 3118, 'loss/train': 1.975961446762085} -09/21/2021 01:17:46 - INFO - __main__ - Step 49900: {'lr': 0.00019886133817856446, 'samples': 1596800, 'steps': 3118, 'loss/train': 2.0873851776123047} -09/21/2021 01:17:46 - INFO - __main__ - Step 49901: {'lr': 0.00019886133817856446, 'samples': 1596832, 'steps': 3118, 'loss/train': 2.1196234226226807} -09/21/2021 01:17:47 - INFO - __main__ - Step 49902: {'lr': 0.00019886133817856446, 'samples': 1596864, 'steps': 3118, 'loss/train': 1.3740030527114868} -09/21/2021 01:17:48 - INFO - __main__ - Step 49903: {'lr': 0.00019886133817856446, 'samples': 1596896, 'steps': 3118, 'loss/train': 2.5985639095306396} -09/21/2021 01:17:49 - INFO - __main__ - Step 49904: {'lr': 0.00019886133817856446, 'samples': 1596928, 'steps': 3118, 'loss/train': 2.067319631576538} -09/21/2021 01:17:50 - INFO - __main__ - Step 49905: {'lr': 0.00019886037809908194, 'samples': 1596960, 'steps': 3119, 'loss/train': 1.5908281803131104} -09/21/2021 01:17:50 - INFO - __main__ - Step 49906: {'lr': 0.00019886037809908194, 'samples': 1596992, 'steps': 3119, 'loss/train': 0.9988732933998108} -09/21/2021 01:17:51 - INFO - __main__ - Step 49907: {'lr': 0.00019886037809908194, 'samples': 1597024, 'steps': 3119, 'loss/train': 1.4494651556015015} -09/21/2021 01:17:52 - INFO - __main__ - Step 49908: {'lr': 0.00019886037809908194, 'samples': 1597056, 'steps': 3119, 'loss/train': 2.4185221195220947} -09/21/2021 01:17:53 - INFO - __main__ - Step 49909: {'lr': 0.00019886037809908194, 'samples': 1597088, 'steps': 3119, 'loss/train': 1.880761981010437} -09/21/2021 01:17:53 - INFO - __main__ - Step 49910: {'lr': 0.00019886037809908194, 'samples': 1597120, 'steps': 3119, 'loss/train': 2.4946019649505615} -09/21/2021 01:17:54 - INFO - __main__ - Step 49911: {'lr': 0.00019886037809908194, 'samples': 1597152, 'steps': 3119, 'loss/train': 1.408590316772461} -09/21/2021 01:17:55 - INFO - __main__ - Step 49912: {'lr': 0.00019886037809908194, 'samples': 1597184, 'steps': 3119, 'loss/train': 1.8147292137145996} -09/21/2021 01:17:56 - INFO - __main__ - Step 49913: {'lr': 0.00019886037809908194, 'samples': 1597216, 'steps': 3119, 'loss/train': 2.546295166015625} -09/21/2021 01:17:56 - INFO - __main__ - Step 49914: {'lr': 0.00019886037809908194, 'samples': 1597248, 'steps': 3119, 'loss/train': 1.0992356538772583} -09/21/2021 01:17:57 - INFO - __main__ - Step 49915: {'lr': 0.00019886037809908194, 'samples': 1597280, 'steps': 3119, 'loss/train': 1.7590174674987793} -09/21/2021 01:17:58 - INFO - __main__ - Step 49916: {'lr': 0.00019886037809908194, 'samples': 1597312, 'steps': 3119, 'loss/train': 1.426370620727539} -09/21/2021 01:17:59 - INFO - __main__ - Step 49917: {'lr': 0.00019886037809908194, 'samples': 1597344, 'steps': 3119, 'loss/train': 2.901883363723755} -09/21/2021 01:17:59 - INFO - __main__ - Step 49918: {'lr': 0.00019886037809908194, 'samples': 1597376, 'steps': 3119, 'loss/train': 1.5031459331512451} -09/21/2021 01:18:01 - INFO - __main__ - Step 49919: {'lr': 0.00019886037809908194, 'samples': 1597408, 'steps': 3119, 'loss/train': 1.7362120151519775} -09/21/2021 01:18:01 - INFO - __main__ - Step 49920: {'lr': 0.00019886037809908194, 'samples': 1597440, 'steps': 3119, 'loss/train': 0.8256494402885437} -09/21/2021 01:18:02 - INFO - __main__ - Step 49921: {'lr': 0.00019885941761733694, 'samples': 1597472, 'steps': 3120, 'loss/train': 0.812838077545166} -09/21/2021 01:18:03 - INFO - __main__ - Step 49922: {'lr': 0.00019885941761733694, 'samples': 1597504, 'steps': 3120, 'loss/train': 1.1025978326797485} -09/21/2021 01:18:04 - INFO - __main__ - Step 49923: {'lr': 0.00019885941761733694, 'samples': 1597536, 'steps': 3120, 'loss/train': 2.1286933422088623} -09/21/2021 01:18:04 - INFO - __main__ - Step 49924: {'lr': 0.00019885941761733694, 'samples': 1597568, 'steps': 3120, 'loss/train': 2.7352664470672607} -09/21/2021 01:18:05 - INFO - __main__ - Step 49925: {'lr': 0.00019885941761733694, 'samples': 1597600, 'steps': 3120, 'loss/train': 1.7142685651779175} -09/21/2021 01:18:06 - INFO - __main__ - Step 49926: {'lr': 0.00019885941761733694, 'samples': 1597632, 'steps': 3120, 'loss/train': 3.5831825733184814} -09/21/2021 01:18:07 - INFO - __main__ - Step 49927: {'lr': 0.00019885941761733694, 'samples': 1597664, 'steps': 3120, 'loss/train': 1.7854446172714233} -09/21/2021 01:18:07 - INFO - __main__ - Step 49928: {'lr': 0.00019885941761733694, 'samples': 1597696, 'steps': 3120, 'loss/train': 1.4744610786437988} -09/21/2021 01:18:08 - INFO - __main__ - Step 49929: {'lr': 0.00019885941761733694, 'samples': 1597728, 'steps': 3120, 'loss/train': 2.4814281463623047} -09/21/2021 01:18:09 - INFO - __main__ - Step 49930: {'lr': 0.00019885941761733694, 'samples': 1597760, 'steps': 3120, 'loss/train': 2.2978947162628174} -09/21/2021 01:18:10 - INFO - __main__ - Step 49931: {'lr': 0.00019885941761733694, 'samples': 1597792, 'steps': 3120, 'loss/train': 2.376577377319336} -09/21/2021 01:18:10 - INFO - __main__ - Step 49932: {'lr': 0.00019885941761733694, 'samples': 1597824, 'steps': 3120, 'loss/train': 0.3609131872653961} -09/21/2021 01:18:11 - INFO - __main__ - Step 49933: {'lr': 0.00019885941761733694, 'samples': 1597856, 'steps': 3120, 'loss/train': 1.8948427438735962} -09/21/2021 01:18:12 - INFO - __main__ - Step 49934: {'lr': 0.00019885941761733694, 'samples': 1597888, 'steps': 3120, 'loss/train': 0.7548096776008606} -09/21/2021 01:18:13 - INFO - __main__ - Step 49935: {'lr': 0.00019885941761733694, 'samples': 1597920, 'steps': 3120, 'loss/train': 1.7000583410263062} -09/21/2021 01:18:13 - INFO - __main__ - Step 49936: {'lr': 0.00019885941761733694, 'samples': 1597952, 'steps': 3120, 'loss/train': 0.10804755985736847} -09/21/2021 01:18:14 - INFO - __main__ - Step 49937: {'lr': 0.00019885845673333334, 'samples': 1597984, 'steps': 3121, 'loss/train': 2.212947130203247} -09/21/2021 01:18:15 - INFO - __main__ - Step 49938: {'lr': 0.00019885845673333334, 'samples': 1598016, 'steps': 3121, 'loss/train': 2.128509998321533} -09/21/2021 01:18:16 - INFO - __main__ - Step 49939: {'lr': 0.00019885845673333334, 'samples': 1598048, 'steps': 3121, 'loss/train': 2.0953612327575684} -09/21/2021 01:18:17 - INFO - __main__ - Step 49940: {'lr': 0.00019885845673333334, 'samples': 1598080, 'steps': 3121, 'loss/train': 2.3541691303253174} -09/21/2021 01:18:17 - INFO - __main__ - Step 49941: {'lr': 0.00019885845673333334, 'samples': 1598112, 'steps': 3121, 'loss/train': 2.395423650741577} -09/21/2021 01:18:18 - INFO - __main__ - Step 49942: {'lr': 0.00019885845673333334, 'samples': 1598144, 'steps': 3121, 'loss/train': 1.9988425970077515} -09/21/2021 01:18:19 - INFO - __main__ - Step 49943: {'lr': 0.00019885845673333334, 'samples': 1598176, 'steps': 3121, 'loss/train': 2.22068452835083} -09/21/2021 01:18:20 - INFO - __main__ - Step 49944: {'lr': 0.00019885845673333334, 'samples': 1598208, 'steps': 3121, 'loss/train': 2.479196071624756} -09/21/2021 01:18:20 - INFO - __main__ - Step 49945: {'lr': 0.00019885845673333334, 'samples': 1598240, 'steps': 3121, 'loss/train': 2.8953702449798584} -09/21/2021 01:18:21 - INFO - __main__ - Step 49946: {'lr': 0.00019885845673333334, 'samples': 1598272, 'steps': 3121, 'loss/train': 2.045304298400879} -09/21/2021 01:18:22 - INFO - __main__ - Step 49947: {'lr': 0.00019885845673333334, 'samples': 1598304, 'steps': 3121, 'loss/train': 1.5984182357788086} -09/21/2021 01:18:23 - INFO - __main__ - Step 49948: {'lr': 0.00019885845673333334, 'samples': 1598336, 'steps': 3121, 'loss/train': 2.0171027183532715} -09/21/2021 01:18:23 - INFO - __main__ - Step 49949: {'lr': 0.00019885845673333334, 'samples': 1598368, 'steps': 3121, 'loss/train': 1.7669646739959717} -09/21/2021 01:18:25 - INFO - __main__ - Step 49950: {'lr': 0.00019885845673333334, 'samples': 1598400, 'steps': 3121, 'loss/train': 2.047757387161255} -09/21/2021 01:18:26 - INFO - __main__ - Step 49951: {'lr': 0.00019885845673333334, 'samples': 1598432, 'steps': 3121, 'loss/train': 1.5964975357055664} -09/21/2021 01:18:27 - INFO - __main__ - Step 49952: {'lr': 0.00019885845673333334, 'samples': 1598464, 'steps': 3121, 'loss/train': 1.9673911333084106} -09/21/2021 01:18:28 - INFO - __main__ - Step 49953: {'lr': 0.0001988574954470751, 'samples': 1598496, 'steps': 3122, 'loss/train': 2.512906312942505} -09/21/2021 01:18:28 - INFO - __main__ - Step 49954: {'lr': 0.0001988574954470751, 'samples': 1598528, 'steps': 3122, 'loss/train': 1.1298009157180786} -09/21/2021 01:18:29 - INFO - __main__ - Step 49955: {'lr': 0.0001988574954470751, 'samples': 1598560, 'steps': 3122, 'loss/train': 1.959102988243103} -09/21/2021 01:18:30 - INFO - __main__ - Step 49956: {'lr': 0.0001988574954470751, 'samples': 1598592, 'steps': 3122, 'loss/train': 2.144219398498535} -09/21/2021 01:18:31 - INFO - __main__ - Step 49957: {'lr': 0.0001988574954470751, 'samples': 1598624, 'steps': 3122, 'loss/train': 2.19738507270813} -09/21/2021 01:18:31 - INFO - __main__ - Step 49958: {'lr': 0.0001988574954470751, 'samples': 1598656, 'steps': 3122, 'loss/train': 2.0759401321411133} -09/21/2021 01:18:32 - INFO - __main__ - Step 49959: {'lr': 0.0001988574954470751, 'samples': 1598688, 'steps': 3122, 'loss/train': 1.898132085800171} -09/21/2021 01:18:33 - INFO - __main__ - Step 49960: {'lr': 0.0001988574954470751, 'samples': 1598720, 'steps': 3122, 'loss/train': 1.9147608280181885} -09/21/2021 01:18:34 - INFO - __main__ - Step 49961: {'lr': 0.0001988574954470751, 'samples': 1598752, 'steps': 3122, 'loss/train': 2.861966371536255} -09/21/2021 01:18:34 - INFO - __main__ - Step 49962: {'lr': 0.0001988574954470751, 'samples': 1598784, 'steps': 3122, 'loss/train': 1.105767846107483} -09/21/2021 01:18:35 - INFO - __main__ - Step 49963: {'lr': 0.0001988574954470751, 'samples': 1598816, 'steps': 3122, 'loss/train': 1.5876598358154297} -09/21/2021 01:18:36 - INFO - __main__ - Step 49964: {'lr': 0.0001988574954470751, 'samples': 1598848, 'steps': 3122, 'loss/train': 2.102626085281372} -09/21/2021 01:18:37 - INFO - __main__ - Step 49965: {'lr': 0.0001988574954470751, 'samples': 1598880, 'steps': 3122, 'loss/train': 1.6815803050994873} -09/21/2021 01:18:37 - INFO - __main__ - Step 49966: {'lr': 0.0001988574954470751, 'samples': 1598912, 'steps': 3122, 'loss/train': 2.061082124710083} -09/21/2021 01:18:38 - INFO - __main__ - Step 49967: {'lr': 0.0001988574954470751, 'samples': 1598944, 'steps': 3122, 'loss/train': 1.4136208295822144} -09/21/2021 01:18:39 - INFO - __main__ - Step 49968: {'lr': 0.0001988574954470751, 'samples': 1598976, 'steps': 3122, 'loss/train': 2.1992835998535156} -09/21/2021 01:18:40 - INFO - __main__ - Step 49969: {'lr': 0.00019885653375856604, 'samples': 1599008, 'steps': 3123, 'loss/train': 1.8383349180221558} -09/21/2021 01:18:41 - INFO - __main__ - Step 49970: {'lr': 0.00019885653375856604, 'samples': 1599040, 'steps': 3123, 'loss/train': 1.3036683797836304} -09/21/2021 01:18:41 - INFO - __main__ - Step 49971: {'lr': 0.00019885653375856604, 'samples': 1599072, 'steps': 3123, 'loss/train': 2.297966718673706} -09/21/2021 01:18:42 - INFO - __main__ - Step 49972: {'lr': 0.00019885653375856604, 'samples': 1599104, 'steps': 3123, 'loss/train': 2.205970287322998} -09/21/2021 01:18:43 - INFO - __main__ - Step 49973: {'lr': 0.00019885653375856604, 'samples': 1599136, 'steps': 3123, 'loss/train': 1.4929182529449463} -09/21/2021 01:18:44 - INFO - __main__ - Step 49974: {'lr': 0.00019885653375856604, 'samples': 1599168, 'steps': 3123, 'loss/train': 2.5667171478271484} -09/21/2021 01:18:44 - INFO - __main__ - Step 49975: {'lr': 0.00019885653375856604, 'samples': 1599200, 'steps': 3123, 'loss/train': 2.5095999240875244} -09/21/2021 01:18:45 - INFO - __main__ - Step 49976: {'lr': 0.00019885653375856604, 'samples': 1599232, 'steps': 3123, 'loss/train': 2.887631893157959} -09/21/2021 01:18:46 - INFO - __main__ - Step 49977: {'lr': 0.00019885653375856604, 'samples': 1599264, 'steps': 3123, 'loss/train': 2.0541133880615234} -09/21/2021 01:18:47 - INFO - __main__ - Step 49978: {'lr': 0.00019885653375856604, 'samples': 1599296, 'steps': 3123, 'loss/train': 1.8626216650009155} -09/21/2021 01:18:47 - INFO - __main__ - Step 49979: {'lr': 0.00019885653375856604, 'samples': 1599328, 'steps': 3123, 'loss/train': 1.8836528062820435} -09/21/2021 01:18:48 - INFO - __main__ - Step 49980: {'lr': 0.00019885653375856604, 'samples': 1599360, 'steps': 3123, 'loss/train': 2.39350962638855} -09/21/2021 01:18:49 - INFO - __main__ - Step 49981: {'lr': 0.00019885653375856604, 'samples': 1599392, 'steps': 3123, 'loss/train': 1.848259687423706} -09/21/2021 01:18:50 - INFO - __main__ - Step 49982: {'lr': 0.00019885653375856604, 'samples': 1599424, 'steps': 3123, 'loss/train': 1.6789182424545288} -09/21/2021 01:18:50 - INFO - __main__ - Step 49983: {'lr': 0.00019885653375856604, 'samples': 1599456, 'steps': 3123, 'loss/train': 1.8803012371063232} -09/21/2021 01:18:51 - INFO - __main__ - Step 49984: {'lr': 0.00019885653375856604, 'samples': 1599488, 'steps': 3123, 'loss/train': 1.783506155014038} -09/21/2021 01:18:52 - INFO - __main__ - Step 49985: {'lr': 0.00019885557166781018, 'samples': 1599520, 'steps': 3124, 'loss/train': 1.4371873140335083} -09/21/2021 01:18:53 - INFO - __main__ - Step 49986: {'lr': 0.00019885557166781018, 'samples': 1599552, 'steps': 3124, 'loss/train': 1.8268319368362427} -09/21/2021 01:18:54 - INFO - __main__ - Step 49987: {'lr': 0.00019885557166781018, 'samples': 1599584, 'steps': 3124, 'loss/train': 2.0482170581817627} -09/21/2021 01:18:55 - INFO - __main__ - Step 49988: {'lr': 0.00019885557166781018, 'samples': 1599616, 'steps': 3124, 'loss/train': 1.637382984161377} -09/21/2021 01:18:56 - INFO - __main__ - Step 49989: {'lr': 0.00019885557166781018, 'samples': 1599648, 'steps': 3124, 'loss/train': 2.0305488109588623} -09/21/2021 01:18:56 - INFO - __main__ - Step 49990: {'lr': 0.00019885557166781018, 'samples': 1599680, 'steps': 3124, 'loss/train': 1.1916102170944214} -09/21/2021 01:18:57 - INFO - __main__ - Step 49991: {'lr': 0.00019885557166781018, 'samples': 1599712, 'steps': 3124, 'loss/train': 0.14500190317630768} -09/21/2021 01:18:58 - INFO - __main__ - Step 49992: {'lr': 0.00019885557166781018, 'samples': 1599744, 'steps': 3124, 'loss/train': 2.143167018890381} -09/21/2021 01:18:59 - INFO - __main__ - Step 49993: {'lr': 0.00019885557166781018, 'samples': 1599776, 'steps': 3124, 'loss/train': 1.5032087564468384} -09/21/2021 01:18:59 - INFO - __main__ - Step 49994: {'lr': 0.00019885557166781018, 'samples': 1599808, 'steps': 3124, 'loss/train': 2.4022293090820312} -09/21/2021 01:19:00 - INFO - __main__ - Step 49995: {'lr': 0.00019885557166781018, 'samples': 1599840, 'steps': 3124, 'loss/train': 2.5239107608795166} -09/21/2021 01:19:01 - INFO - __main__ - Step 49996: {'lr': 0.00019885557166781018, 'samples': 1599872, 'steps': 3124, 'loss/train': 1.548075795173645} -09/21/2021 01:19:02 - INFO - __main__ - Step 49997: {'lr': 0.00019885557166781018, 'samples': 1599904, 'steps': 3124, 'loss/train': 2.0182995796203613} -09/21/2021 01:19:02 - INFO - __main__ - Step 49998: {'lr': 0.00019885557166781018, 'samples': 1599936, 'steps': 3124, 'loss/train': 1.7439806461334229} -09/21/2021 01:19:03 - INFO - __main__ - Step 49999: {'lr': 0.00019885557166781018, 'samples': 1599968, 'steps': 3124, 'loss/train': 2.1178438663482666} -09/21/2021 01:19:04 - INFO - __main__ - Step 50000: {'lr': 0.00019885557166781018, 'samples': 1600000, 'steps': 3124, 'loss/train': 1.4012274742126465} -09/21/2021 01:19:04 - INFO - __main__ - Evaluating and saving model checkpoint -09/21/2021 01:45:34 - INFO - __main__ - Step 50000: {'loss/eval': 1.7745720148086548, 'perplexity': 5.897756576538086} -09/21/2021 01:47:49 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/debug-internal.log', 'wandb/run-20210920_142810-36cw69uv/logs/debug-internal.log', 'wandb/run-20210920_142810-36cw69uv/run-36cw69uv.wandb']. This may take a bit of time if the files are large. +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc1159fa45c332cf92ee1914741f15cc6fa1b9e651296ef084d401aa4c83d9d +size 15094384